Remove / comment-out unneeded code

This commit is contained in:
Changho Hwang
2023-02-06 06:46:54 +00:00
parent f3e6f7fe8b
commit 6679e85953
5 changed files with 490 additions and 1310 deletions

View File

@@ -79,19 +79,19 @@ mscclppResult_t mscclppSocketGetAddr(struct mscclppSocket* sock, union mscclppSo
// Connect to sock->addr. sock->fd is set after a successful call.
mscclppResult_t mscclppSocketConnect(struct mscclppSocket* sock);
// Return socket connection state.
mscclppResult_t mscclppSocketReady(struct mscclppSocket* sock, int *running);
// mscclppResult_t mscclppSocketReady(struct mscclppSocket* sock, int *running);
// Accept an incoming connection from listenSock->fd and keep the file descriptor in sock->fd, with the remote side IP/port in sock->addr.
mscclppResult_t mscclppSocketAccept(struct mscclppSocket* sock, struct mscclppSocket* ulistenSock);
mscclppResult_t mscclppSocketGetFd(struct mscclppSocket* sock, int* fd);
mscclppResult_t mscclppSocketSetFd(int fd, struct mscclppSocket* sock);
// mscclppResult_t mscclppSocketGetFd(struct mscclppSocket* sock, int* fd);
// mscclppResult_t mscclppSocketSetFd(int fd, struct mscclppSocket* sock);
#define MSCCLPP_SOCKET_SEND 0
#define MSCCLPP_SOCKET_RECV 1
mscclppResult_t mscclppSocketProgress(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset);
mscclppResult_t mscclppSocketWait(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset);
// mscclppResult_t mscclppSocketWait(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset);
mscclppResult_t mscclppSocketSend(struct mscclppSocket* sock, void* ptr, int size);
mscclppResult_t mscclppSocketRecv(struct mscclppSocket* sock, void* ptr, int size);
mscclppResult_t mscclppSocketTryRecv(struct mscclppSocket* sock, void* ptr, int size, int* closed);
// mscclppResult_t mscclppSocketTryRecv(struct mscclppSocket* sock, void* ptr, int size, int* closed);
mscclppResult_t mscclppSocketClose(struct mscclppSocket* sock);
#endif

View File

@@ -15,7 +15,7 @@
#include <sched.h>
#include <new>
int mscclppCudaCompCap();
// int mscclppCudaCompCap();
// PCI Bus ID <-> int64 conversion functions
mscclppResult_t int64ToBusId(int64_t id, char* busId);
@@ -64,15 +64,15 @@ inline mscclppResult_t getRandomData(void* buffer, size_t bytes) {
////////////////////////////////////////////////////////////////////////////////
template<typename Int>
inline void mscclppAtomicRefCountIncrement(Int* refs) {
__atomic_fetch_add(refs, 1, __ATOMIC_RELAXED);
}
// template<typename Int>
// inline void mscclppAtomicRefCountIncrement(Int* refs) {
// __atomic_fetch_add(refs, 1, __ATOMIC_RELAXED);
// }
template<typename Int>
inline Int mscclppAtomicRefCountDecrement(Int* refs) {
return __atomic_sub_fetch(refs, 1, __ATOMIC_ACQ_REL);
}
// template<typename Int>
// inline Int mscclppAtomicRefCountDecrement(Int* refs) {
// return __atomic_sub_fetch(refs, 1, __ATOMIC_ACQ_REL);
// }
////////////////////////////////////////////////////////////////////////////////
/* mscclppMemoryStack: Pools memory for fast LIFO ordered allocation. Note that
@@ -84,14 +84,14 @@ inline Int mscclppAtomicRefCountDecrement(Int* refs) {
* cannot be popped. Therefor objects allocated in the nil frame cannot be
* deallocated sooner than stack destruction.
*/
struct mscclppMemoryStack;
// struct mscclppMemoryStack;
void mscclppMemoryStackConstruct(struct mscclppMemoryStack* me);
void mscclppMemoryStackDestruct(struct mscclppMemoryStack* me);
void mscclppMemoryStackPush(struct mscclppMemoryStack* me);
void mscclppMemoryStackPop(struct mscclppMemoryStack* me);
template<typename T>
T* mscclppMemoryStackAlloc(struct mscclppMemoryStack* me, size_t n=1);
// void mscclppMemoryStackConstruct(struct mscclppMemoryStack* me);
// void mscclppMemoryStackDestruct(struct mscclppMemoryStack* me);
// void mscclppMemoryStackPush(struct mscclppMemoryStack* me);
// void mscclppMemoryStackPop(struct mscclppMemoryStack* me);
// template<typename T>
// T* mscclppMemoryStackAlloc(struct mscclppMemoryStack* me, size_t n=1);
////////////////////////////////////////////////////////////////////////////////
/* mscclppMemoryPool: A free-list of same-sized allocations. It is an invalid for
@@ -101,15 +101,15 @@ T* mscclppMemoryStackAlloc(struct mscclppMemoryStack* me, size_t n=1);
* backing any currently held object is deallocated then it is an error to do
* anything other than reconstruct it, after which it is a valid empty pool.
*/
struct mscclppMemoryPool;
// struct mscclppMemoryPool;
// Equivalent to zero-initialization
void mscclppMemoryPoolConstruct(struct mscclppMemoryPool* me);
template<typename T>
T* mscclppMemoryPoolAlloc(struct mscclppMemoryPool* me, struct mscclppMemoryStack* backing);
template<typename T>
void mscclppMemoryPoolFree(struct mscclppMemoryPool* me, T* obj);
void mscclppMemoryPoolTakeAll(struct mscclppMemoryPool* me, struct mscclppMemoryPool* from);
// void mscclppMemoryPoolConstruct(struct mscclppMemoryPool* me);
// template<typename T>
// T* mscclppMemoryPoolAlloc(struct mscclppMemoryPool* me, struct mscclppMemoryStack* backing);
// template<typename T>
// void mscclppMemoryPoolFree(struct mscclppMemoryPool* me, T* obj);
// void mscclppMemoryPoolTakeAll(struct mscclppMemoryPool* me, struct mscclppMemoryPool* from);
////////////////////////////////////////////////////////////////////////////////
/* mscclppIntruQueue: A singly-linked list queue where the per-object next pointer
@@ -122,380 +122,380 @@ void mscclppMemoryPoolTakeAll(struct mscclppMemoryPool* me, struct mscclppMemory
* mscclppIntruQueue<Foo, &Foo::next1> list1;
* mscclppIntruQueue<Foo, &Foo::next2> list2;
*/
template<typename T, T *T::*next>
struct mscclppIntruQueue;
// template<typename T, T *T::*next>
// struct mscclppIntruQueue;
template<typename T, T *T::*next>
void mscclppIntruQueueConstruct(mscclppIntruQueue<T,next> *me);
template<typename T, T *T::*next>
bool mscclppIntruQueueEmpty(mscclppIntruQueue<T,next> *me);
template<typename T, T *T::*next>
T* mscclppIntruQueueHead(mscclppIntruQueue<T,next> *me);
template<typename T, T *T::*next>
void mscclppIntruQueueEnqueue(mscclppIntruQueue<T,next> *me, T *x);
template<typename T, T *T::*next>
T* mscclppIntruQueueDequeue(mscclppIntruQueue<T,next> *me);
template<typename T, T *T::*next>
T* mscclppIntruQueueTryDequeue(mscclppIntruQueue<T,next> *me);
template<typename T, T *T::*next>
void mscclppIntruQueueFreeAll(mscclppIntruQueue<T,next> *me, mscclppMemoryPool *memPool);
// template<typename T, T *T::*next>
// void mscclppIntruQueueConstruct(mscclppIntruQueue<T,next> *me);
// template<typename T, T *T::*next>
// bool mscclppIntruQueueEmpty(mscclppIntruQueue<T,next> *me);
// template<typename T, T *T::*next>
// T* mscclppIntruQueueHead(mscclppIntruQueue<T,next> *me);
// template<typename T, T *T::*next>
// void mscclppIntruQueueEnqueue(mscclppIntruQueue<T,next> *me, T *x);
// template<typename T, T *T::*next>
// T* mscclppIntruQueueDequeue(mscclppIntruQueue<T,next> *me);
// template<typename T, T *T::*next>
// T* mscclppIntruQueueTryDequeue(mscclppIntruQueue<T,next> *me);
// template<typename T, T *T::*next>
// void mscclppIntruQueueFreeAll(mscclppIntruQueue<T,next> *me, mscclppMemoryPool *memPool);
////////////////////////////////////////////////////////////////////////////////
/* mscclppThreadSignal: Couples a pthread mutex and cond together. The "mutex"
* and "cond" fields are part of the public interface.
*/
struct mscclppThreadSignal {
pthread_mutex_t mutex;
pthread_cond_t cond;
};
// struct mscclppThreadSignal {
// pthread_mutex_t mutex;
// pthread_cond_t cond;
// };
// returns {PTHREAD_MUTEX_INITIALIZER, PTHREAD_COND_INITIALIZER}
constexpr mscclppThreadSignal mscclppThreadSignalStaticInitializer();
// constexpr mscclppThreadSignal mscclppThreadSignalStaticInitializer();
void mscclppThreadSignalConstruct(struct mscclppThreadSignal* me);
void mscclppThreadSignalDestruct(struct mscclppThreadSignal* me);
// void mscclppThreadSignalConstruct(struct mscclppThreadSignal* me);
// void mscclppThreadSignalDestruct(struct mscclppThreadSignal* me);
// A convenience instance per-thread.
extern __thread struct mscclppThreadSignal mscclppThreadSignalLocalInstance;
// extern __thread struct mscclppThreadSignal mscclppThreadSignalLocalInstance;
////////////////////////////////////////////////////////////////////////////////
template<typename T, T *T::*next>
struct mscclppIntruQueueMpsc;
// template<typename T, T *T::*next>
// struct mscclppIntruQueueMpsc;
template<typename T, T *T::*next>
void mscclppIntruQueueMpscConstruct(struct mscclppIntruQueueMpsc<T,next>* me);
template<typename T, T *T::*next>
bool mscclppIntruQueueMpscEmpty(struct mscclppIntruQueueMpsc<T,next>* me);
// template<typename T, T *T::*next>
// void mscclppIntruQueueMpscConstruct(struct mscclppIntruQueueMpsc<T,next>* me);
// template<typename T, T *T::*next>
// bool mscclppIntruQueueMpscEmpty(struct mscclppIntruQueueMpsc<T,next>* me);
// Enqueue element. Returns true if queue is not abandoned. Even if queue is
// abandoned the element enqueued, so the caller needs to make arrangements for
// the queue to be tended.
template<typename T, T *T::*next>
bool mscclppIntruQueueMpscEnqueue(struct mscclppIntruQueueMpsc<T,next>* me, T* x);
// template<typename T, T *T::*next>
// bool mscclppIntruQueueMpscEnqueue(struct mscclppIntruQueueMpsc<T,next>* me, T* x);
// Dequeue all elements at a glance. If there aren't any and `waitSome` is
// true then this call will wait until it can return a non empty list.
template<typename T, T *T::*next>
T* mscclppIntruQueueMpscDequeueAll(struct mscclppIntruQueueMpsc<T,next>* me, bool waitSome);
// template<typename T, T *T::*next>
// T* mscclppIntruQueueMpscDequeueAll(struct mscclppIntruQueueMpsc<T,next>* me, bool waitSome);
// Dequeue all elements and set queue to abandoned state.
template<typename T, T *T::*next>
T* mscclppIntruQueueMpscAbandon(struct mscclppIntruQueueMpsc<T,next>* me);
// template<typename T, T *T::*next>
// T* mscclppIntruQueueMpscAbandon(struct mscclppIntruQueueMpsc<T,next>* me);
////////////////////////////////////////////////////////////////////////////////
struct mscclppMemoryStack {
struct Hunk {
struct Hunk* above; // reverse stack pointer
size_t size; // size of this allocation (including this header struct)
};
struct Unhunk { // proxy header for objects allocated out-of-hunk
struct Unhunk* next;
void* obj;
};
struct Frame {
struct Hunk* hunk; // top of non-empty hunks
uintptr_t bumper, end; // points into top hunk
struct Unhunk* unhunks;
struct Frame* below;
};
// struct mscclppMemoryStack {
// struct Hunk {
// struct Hunk* above; // reverse stack pointer
// size_t size; // size of this allocation (including this header struct)
// };
// struct Unhunk { // proxy header for objects allocated out-of-hunk
// struct Unhunk* next;
// void* obj;
// };
// struct Frame {
// struct Hunk* hunk; // top of non-empty hunks
// uintptr_t bumper, end; // points into top hunk
// struct Unhunk* unhunks;
// struct Frame* below;
// };
static void* allocateSpilled(struct mscclppMemoryStack* me, size_t size, size_t align);
static void* allocate(struct mscclppMemoryStack* me, size_t size, size_t align);
// static void* allocateSpilled(struct mscclppMemoryStack* me, size_t size, size_t align);
// static void* allocate(struct mscclppMemoryStack* me, size_t size, size_t align);
struct Hunk stub;
struct Frame topFrame;
};
// struct Hunk stub;
// struct Frame topFrame;
// };
inline void mscclppMemoryStackConstruct(struct mscclppMemoryStack* me) {
me->stub.above = nullptr;
me->stub.size = 0;
me->topFrame.hunk = &me->stub;
me->topFrame.bumper = 0;
me->topFrame.end = 0;
me->topFrame.unhunks = nullptr;
me->topFrame.below = nullptr;
}
// inline void mscclppMemoryStackConstruct(struct mscclppMemoryStack* me) {
// me->stub.above = nullptr;
// me->stub.size = 0;
// me->topFrame.hunk = &me->stub;
// me->topFrame.bumper = 0;
// me->topFrame.end = 0;
// me->topFrame.unhunks = nullptr;
// me->topFrame.below = nullptr;
// }
inline void* mscclppMemoryStack::allocate(struct mscclppMemoryStack* me, size_t size, size_t align) {
uintptr_t o = (me->topFrame.bumper + align-1) & -uintptr_t(align);
void* obj;
if (__builtin_expect(o + size <= me->topFrame.end, true)) {
me->topFrame.bumper = o + size;
obj = reinterpret_cast<void*>(o);
} else {
obj = allocateSpilled(me, size, align);
}
return obj;
}
// inline void* mscclppMemoryStack::allocate(struct mscclppMemoryStack* me, size_t size, size_t align) {
// uintptr_t o = (me->topFrame.bumper + align-1) & -uintptr_t(align);
// void* obj;
// if (__builtin_expect(o + size <= me->topFrame.end, true)) {
// me->topFrame.bumper = o + size;
// obj = reinterpret_cast<void*>(o);
// } else {
// obj = allocateSpilled(me, size, align);
// }
// return obj;
// }
template<typename T>
inline T* mscclppMemoryStackAlloc(struct mscclppMemoryStack* me, size_t n) {
void *obj = mscclppMemoryStack::allocate(me, n*sizeof(T), alignof(T));
memset(obj, 0, n*sizeof(T));
return (T*)obj;
}
// template<typename T>
// inline T* mscclppMemoryStackAlloc(struct mscclppMemoryStack* me, size_t n) {
// void *obj = mscclppMemoryStack::allocate(me, n*sizeof(T), alignof(T));
// memset(obj, 0, n*sizeof(T));
// return (T*)obj;
// }
inline void mscclppMemoryStackPush(struct mscclppMemoryStack* me) {
using Frame = mscclppMemoryStack::Frame;
Frame tmp = me->topFrame;
Frame* snapshot = (Frame*)mscclppMemoryStack::allocate(me, sizeof(Frame), alignof(Frame));
*snapshot = tmp; // C++ struct assignment
me->topFrame.unhunks = nullptr;
me->topFrame.below = snapshot;
}
// inline void mscclppMemoryStackPush(struct mscclppMemoryStack* me) {
// using Frame = mscclppMemoryStack::Frame;
// Frame tmp = me->topFrame;
// Frame* snapshot = (Frame*)mscclppMemoryStack::allocate(me, sizeof(Frame), alignof(Frame));
// *snapshot = tmp; // C++ struct assignment
// me->topFrame.unhunks = nullptr;
// me->topFrame.below = snapshot;
// }
inline void mscclppMemoryStackPop(struct mscclppMemoryStack* me) {
mscclppMemoryStack::Unhunk* un = me->topFrame.unhunks;
while (un != nullptr) {
free(un->obj);
un = un->next;
}
me->topFrame = *me->topFrame.below; // C++ struct assignment
}
// inline void mscclppMemoryStackPop(struct mscclppMemoryStack* me) {
// mscclppMemoryStack::Unhunk* un = me->topFrame.unhunks;
// while (un != nullptr) {
// free(un->obj);
// un = un->next;
// }
// me->topFrame = *me->topFrame.below; // C++ struct assignment
// }
////////////////////////////////////////////////////////////////////////////////
struct mscclppMemoryPool {
struct Cell {
Cell *next;
};
template<int Size, int Align>
union CellSized {
Cell cell;
alignas(Align) char space[Size];
};
struct Cell* head;
struct Cell* tail; // meaningful only when head != nullptr
};
// struct mscclppMemoryPool {
// struct Cell {
// Cell *next;
// };
// template<int Size, int Align>
// union CellSized {
// Cell cell;
// alignas(Align) char space[Size];
// };
// struct Cell* head;
// struct Cell* tail; // meaningful only when head != nullptr
// };
inline void mscclppMemoryPoolConstruct(struct mscclppMemoryPool* me) {
me->head = nullptr;
}
// inline void mscclppMemoryPoolConstruct(struct mscclppMemoryPool* me) {
// me->head = nullptr;
// }
template<typename T>
inline T* mscclppMemoryPoolAlloc(struct mscclppMemoryPool* me, struct mscclppMemoryStack* backing) {
using Cell = mscclppMemoryPool::Cell;
using CellSized = mscclppMemoryPool::CellSized<sizeof(T), alignof(T)>;
Cell* cell;
if (__builtin_expect(me->head != nullptr, true)) {
cell = me->head;
me->head = cell->next;
} else {
// Use the internal allocate() since it doesn't memset to 0 yet.
cell = (Cell*)mscclppMemoryStack::allocate(backing, sizeof(CellSized), alignof(CellSized));
}
memset(cell, 0, sizeof(T));
return reinterpret_cast<T*>(cell);
}
// template<typename T>
// inline T* mscclppMemoryPoolAlloc(struct mscclppMemoryPool* me, struct mscclppMemoryStack* backing) {
// using Cell = mscclppMemoryPool::Cell;
// using CellSized = mscclppMemoryPool::CellSized<sizeof(T), alignof(T)>;
// Cell* cell;
// if (__builtin_expect(me->head != nullptr, true)) {
// cell = me->head;
// me->head = cell->next;
// } else {
// // Use the internal allocate() since it doesn't memset to 0 yet.
// cell = (Cell*)mscclppMemoryStack::allocate(backing, sizeof(CellSized), alignof(CellSized));
// }
// memset(cell, 0, sizeof(T));
// return reinterpret_cast<T*>(cell);
// }
template<typename T>
inline void mscclppMemoryPoolFree(struct mscclppMemoryPool* me, T* obj) {
using Cell = mscclppMemoryPool::Cell;
Cell* cell = reinterpret_cast<Cell*>(obj);
cell->next = me->head;
if (me->head == nullptr) me->tail = cell;
me->head = cell;
}
// template<typename T>
// inline void mscclppMemoryPoolFree(struct mscclppMemoryPool* me, T* obj) {
// using Cell = mscclppMemoryPool::Cell;
// Cell* cell = reinterpret_cast<Cell*>(obj);
// cell->next = me->head;
// if (me->head == nullptr) me->tail = cell;
// me->head = cell;
// }
inline void mscclppMemoryPoolTakeAll(struct mscclppMemoryPool* me, struct mscclppMemoryPool* from) {
if (from->head != nullptr) {
from->tail->next = me->head;
if (me->head == nullptr) me->tail = from->tail;
me->head = from->head;
from->head = nullptr;
}
}
// inline void mscclppMemoryPoolTakeAll(struct mscclppMemoryPool* me, struct mscclppMemoryPool* from) {
// if (from->head != nullptr) {
// from->tail->next = me->head;
// if (me->head == nullptr) me->tail = from->tail;
// me->head = from->head;
// from->head = nullptr;
// }
// }
////////////////////////////////////////////////////////////////////////////////
template<typename T, T *T::*next>
struct mscclppIntruQueue {
T *head, *tail;
};
// template<typename T, T *T::*next>
// struct mscclppIntruQueue {
// T *head, *tail;
// };
template<typename T, T *T::*next>
inline void mscclppIntruQueueConstruct(mscclppIntruQueue<T,next> *me) {
me->head = nullptr;
me->tail = nullptr;
}
// template<typename T, T *T::*next>
// inline void mscclppIntruQueueConstruct(mscclppIntruQueue<T,next> *me) {
// me->head = nullptr;
// me->tail = nullptr;
// }
template<typename T, T *T::*next>
inline bool mscclppIntruQueueEmpty(mscclppIntruQueue<T,next> *me) {
return me->head == nullptr;
}
// template<typename T, T *T::*next>
// inline bool mscclppIntruQueueEmpty(mscclppIntruQueue<T,next> *me) {
// return me->head == nullptr;
// }
template<typename T, T *T::*next>
inline T* mscclppIntruQueueHead(mscclppIntruQueue<T,next> *me) {
return me->head;
}
// template<typename T, T *T::*next>
// inline T* mscclppIntruQueueHead(mscclppIntruQueue<T,next> *me) {
// return me->head;
// }
template<typename T, T *T::*next>
inline T* mscclppIntruQueueTail(mscclppIntruQueue<T,next> *me) {
return me->tail;
}
// template<typename T, T *T::*next>
// inline T* mscclppIntruQueueTail(mscclppIntruQueue<T,next> *me) {
// return me->tail;
// }
template<typename T, T *T::*next>
inline void mscclppIntruQueueEnqueue(mscclppIntruQueue<T,next> *me, T *x) {
x->*next = nullptr;
(me->head ? me->tail->*next : me->head) = x;
me->tail = x;
}
// template<typename T, T *T::*next>
// inline void mscclppIntruQueueEnqueue(mscclppIntruQueue<T,next> *me, T *x) {
// x->*next = nullptr;
// (me->head ? me->tail->*next : me->head) = x;
// me->tail = x;
// }
template<typename T, T *T::*next>
inline T* mscclppIntruQueueDequeue(mscclppIntruQueue<T,next> *me) {
T *ans = me->head;
me->head = ans->*next;
if (me->head == nullptr) me->tail = nullptr;
return ans;
}
// template<typename T, T *T::*next>
// inline T* mscclppIntruQueueDequeue(mscclppIntruQueue<T,next> *me) {
// T *ans = me->head;
// me->head = ans->*next;
// if (me->head == nullptr) me->tail = nullptr;
// return ans;
// }
template<typename T, T *T::*next>
inline T* mscclppIntruQueueTryDequeue(mscclppIntruQueue<T,next> *me) {
T *ans = me->head;
if (ans != nullptr) {
me->head = ans->*next;
if (me->head == nullptr) me->tail = nullptr;
}
return ans;
}
// template<typename T, T *T::*next>
// inline T* mscclppIntruQueueTryDequeue(mscclppIntruQueue<T,next> *me) {
// T *ans = me->head;
// if (ans != nullptr) {
// me->head = ans->*next;
// if (me->head == nullptr) me->tail = nullptr;
// }
// return ans;
// }
template<typename T, T *T::*next>
void mscclppIntruQueueFreeAll(mscclppIntruQueue<T,next> *me, mscclppMemoryPool *pool) {
T *head = me->head;
me->head = nullptr;
me->tail = nullptr;
while (head != nullptr) {
T *tmp = head->*next;
mscclppMemoryPoolFree(pool, tmp);
head = tmp;
}
}
// template<typename T, T *T::*next>
// void mscclppIntruQueueFreeAll(mscclppIntruQueue<T,next> *me, mscclppMemoryPool *pool) {
// T *head = me->head;
// me->head = nullptr;
// me->tail = nullptr;
// while (head != nullptr) {
// T *tmp = head->*next;
// mscclppMemoryPoolFree(pool, tmp);
// head = tmp;
// }
// }
////////////////////////////////////////////////////////////////////////////////
constexpr mscclppThreadSignal mscclppThreadSignalStaticInitializer() {
return {PTHREAD_MUTEX_INITIALIZER, PTHREAD_COND_INITIALIZER};
}
// constexpr mscclppThreadSignal mscclppThreadSignalStaticInitializer() {
// return {PTHREAD_MUTEX_INITIALIZER, PTHREAD_COND_INITIALIZER};
// }
inline void mscclppThreadSignalConstruct(struct mscclppThreadSignal* me) {
pthread_mutex_init(&me->mutex, nullptr);
pthread_cond_init(&me->cond, nullptr);
}
// inline void mscclppThreadSignalConstruct(struct mscclppThreadSignal* me) {
// pthread_mutex_init(&me->mutex, nullptr);
// pthread_cond_init(&me->cond, nullptr);
// }
inline void mscclppThreadSignalDestruct(struct mscclppThreadSignal* me) {
pthread_mutex_destroy(&me->mutex);
pthread_cond_destroy(&me->cond);
}
// inline void mscclppThreadSignalDestruct(struct mscclppThreadSignal* me) {
// pthread_mutex_destroy(&me->mutex);
// pthread_cond_destroy(&me->cond);
// }
////////////////////////////////////////////////////////////////////////////////
template<typename T, T *T::*next>
struct mscclppIntruQueueMpsc {
T* head;
uintptr_t tail;
struct mscclppThreadSignal* waiting;
};
// template<typename T, T *T::*next>
// struct mscclppIntruQueueMpsc {
// T* head;
// uintptr_t tail;
// struct mscclppThreadSignal* waiting;
// };
template<typename T, T *T::*next>
void mscclppIntruQueueMpscConstruct(struct mscclppIntruQueueMpsc<T,next>* me) {
me->head = nullptr;
me->tail = 0x0;
me->waiting = nullptr;
}
// template<typename T, T *T::*next>
// void mscclppIntruQueueMpscConstruct(struct mscclppIntruQueueMpsc<T,next>* me) {
// me->head = nullptr;
// me->tail = 0x0;
// me->waiting = nullptr;
// }
template<typename T, T *T::*next>
bool mscclppIntruQueueMpscEmpty(struct mscclppIntruQueueMpsc<T,next>* me) {
return __atomic_load_n(&me->tail, __ATOMIC_RELAXED) <= 0x2;
}
// template<typename T, T *T::*next>
// bool mscclppIntruQueueMpscEmpty(struct mscclppIntruQueueMpsc<T,next>* me) {
// return __atomic_load_n(&me->tail, __ATOMIC_RELAXED) <= 0x2;
// }
template<typename T, T *T::*next>
bool mscclppIntruQueueMpscEnqueue(mscclppIntruQueueMpsc<T,next>* me, T* x) {
__atomic_store_n(&(x->*next), nullptr, __ATOMIC_RELAXED);
uintptr_t utail = __atomic_exchange_n(&me->tail, reinterpret_cast<uintptr_t>(x), __ATOMIC_ACQ_REL);
T* prev = reinterpret_cast<T*>(utail);
T** prevNext = utail <= 0x2 ? &me->head : &(prev->*next);
__atomic_store_n(prevNext, x, __ATOMIC_RELAXED);
if (utail == 0x1) { // waiting
__atomic_thread_fence(__ATOMIC_ACQUIRE); // to see me->waiting
// This lock/unlock is essential to ensure we don't race ahead of the consumer
// and signal the cond before they begin waiting on it.
struct mscclppThreadSignal* waiting = me->waiting;
pthread_mutex_lock(&waiting->mutex);
pthread_mutex_unlock(&waiting->mutex);
pthread_cond_broadcast(&waiting->cond);
}
return utail != 0x2; // not abandoned
}
// template<typename T, T *T::*next>
// bool mscclppIntruQueueMpscEnqueue(mscclppIntruQueueMpsc<T,next>* me, T* x) {
// __atomic_store_n(&(x->*next), nullptr, __ATOMIC_RELAXED);
// uintptr_t utail = __atomic_exchange_n(&me->tail, reinterpret_cast<uintptr_t>(x), __ATOMIC_ACQ_REL);
// T* prev = reinterpret_cast<T*>(utail);
// T** prevNext = utail <= 0x2 ? &me->head : &(prev->*next);
// __atomic_store_n(prevNext, x, __ATOMIC_RELAXED);
// if (utail == 0x1) { // waiting
// __atomic_thread_fence(__ATOMIC_ACQUIRE); // to see me->waiting
// // This lock/unlock is essential to ensure we don't race ahead of the consumer
// // and signal the cond before they begin waiting on it.
// struct mscclppThreadSignal* waiting = me->waiting;
// pthread_mutex_lock(&waiting->mutex);
// pthread_mutex_unlock(&waiting->mutex);
// pthread_cond_broadcast(&waiting->cond);
// }
// return utail != 0x2; // not abandoned
// }
template<typename T, T *T::*next>
T* mscclppIntruQueueMpscDequeueAll(mscclppIntruQueueMpsc<T,next>* me, bool waitSome) {
T* head = __atomic_load_n(&me->head, __ATOMIC_RELAXED);
if (head == nullptr) {
if (!waitSome) return nullptr;
uint64_t t0 = clockNano();
bool sleeping = false;
do {
if (clockNano()-t0 >= 10*1000) { // spin for first 10us
struct mscclppThreadSignal* waitSignal = &mscclppThreadSignalLocalInstance;
pthread_mutex_lock(&waitSignal->mutex);
uintptr_t expected = sleeping ? 0x1 : 0x0;
uintptr_t desired = 0x1;
me->waiting = waitSignal; // release done by successful compare exchange
if (__atomic_compare_exchange_n(&me->tail, &expected, desired, /*weak=*/true, __ATOMIC_RELEASE, __ATOMIC_RELAXED)) {
sleeping = true;
pthread_cond_wait(&waitSignal->cond, &waitSignal->mutex);
}
pthread_mutex_unlock(&waitSignal->mutex);
}
head = __atomic_load_n(&me->head, __ATOMIC_RELAXED);
} while (head == nullptr);
}
// template<typename T, T *T::*next>
// T* mscclppIntruQueueMpscDequeueAll(mscclppIntruQueueMpsc<T,next>* me, bool waitSome) {
// T* head = __atomic_load_n(&me->head, __ATOMIC_RELAXED);
// if (head == nullptr) {
// if (!waitSome) return nullptr;
// uint64_t t0 = clockNano();
// bool sleeping = false;
// do {
// if (clockNano()-t0 >= 10*1000) { // spin for first 10us
// struct mscclppThreadSignal* waitSignal = &mscclppThreadSignalLocalInstance;
// pthread_mutex_lock(&waitSignal->mutex);
// uintptr_t expected = sleeping ? 0x1 : 0x0;
// uintptr_t desired = 0x1;
// me->waiting = waitSignal; // release done by successful compare exchange
// if (__atomic_compare_exchange_n(&me->tail, &expected, desired, /*weak=*/true, __ATOMIC_RELEASE, __ATOMIC_RELAXED)) {
// sleeping = true;
// pthread_cond_wait(&waitSignal->cond, &waitSignal->mutex);
// }
// pthread_mutex_unlock(&waitSignal->mutex);
// }
// head = __atomic_load_n(&me->head, __ATOMIC_RELAXED);
// } while (head == nullptr);
// }
__atomic_store_n(&me->head, nullptr, __ATOMIC_RELAXED);
uintptr_t utail = __atomic_exchange_n(&me->tail, 0x0, __ATOMIC_ACQ_REL);
T* tail = utail <= 0x2 ? nullptr : reinterpret_cast<T*>(utail);
T *x = head;
while (x != tail) {
T *x1;
int spins = 0;
while (true) {
x1 = __atomic_load_n(&(x->*next), __ATOMIC_RELAXED);
if (x1 != nullptr) break;
if (++spins == 1024) { spins = 1024-1; sched_yield(); }
}
x = x1;
}
return head;
}
// __atomic_store_n(&me->head, nullptr, __ATOMIC_RELAXED);
// uintptr_t utail = __atomic_exchange_n(&me->tail, 0x0, __ATOMIC_ACQ_REL);
// T* tail = utail <= 0x2 ? nullptr : reinterpret_cast<T*>(utail);
// T *x = head;
// while (x != tail) {
// T *x1;
// int spins = 0;
// while (true) {
// x1 = __atomic_load_n(&(x->*next), __ATOMIC_RELAXED);
// if (x1 != nullptr) break;
// if (++spins == 1024) { spins = 1024-1; sched_yield(); }
// }
// x = x1;
// }
// return head;
// }
template<typename T, T *T::*next>
T* mscclppIntruQueueMpscAbandon(mscclppIntruQueueMpsc<T,next>* me) {
uintptr_t expected = 0x0;
if (__atomic_compare_exchange_n(&me->tail, &expected, /*desired=*/0x2, /*weak=*/true, __ATOMIC_RELAXED, __ATOMIC_RELAXED)) {
return nullptr;
} else {
int spins = 0;
T* head;
while (true) {
head = __atomic_load_n(&me->head, __ATOMIC_RELAXED);
if (head != nullptr) break;
if (++spins == 1024) { spins = 1024-1; sched_yield(); }
}
__atomic_store_n(&me->head, nullptr, __ATOMIC_RELAXED);
uintptr_t utail = __atomic_exchange_n(&me->tail, 0x2, __ATOMIC_ACQ_REL);
T* tail = utail <= 0x2 ? nullptr : reinterpret_cast<T*>(utail);
T *x = head;
while (x != tail) {
T *x1;
spins = 0;
while (true) {
x1 = __atomic_load_n(&(x->*next), __ATOMIC_RELAXED);
if (x1 != nullptr) break;
if (++spins == 1024) { spins = 1024-1; sched_yield(); }
}
x = x1;
}
return head;
}
}
// template<typename T, T *T::*next>
// T* mscclppIntruQueueMpscAbandon(mscclppIntruQueueMpsc<T,next>* me) {
// uintptr_t expected = 0x0;
// if (__atomic_compare_exchange_n(&me->tail, &expected, /*desired=*/0x2, /*weak=*/true, __ATOMIC_RELAXED, __ATOMIC_RELAXED)) {
// return nullptr;
// } else {
// int spins = 0;
// T* head;
// while (true) {
// head = __atomic_load_n(&me->head, __ATOMIC_RELAXED);
// if (head != nullptr) break;
// if (++spins == 1024) { spins = 1024-1; sched_yield(); }
// }
// __atomic_store_n(&me->head, nullptr, __ATOMIC_RELAXED);
// uintptr_t utail = __atomic_exchange_n(&me->tail, 0x2, __ATOMIC_ACQ_REL);
// T* tail = utail <= 0x2 ? nullptr : reinterpret_cast<T*>(utail);
// T *x = head;
// while (x != tail) {
// T *x1;
// spins = 0;
// while (true) {
// x1 = __atomic_load_n(&(x->*next), __ATOMIC_RELAXED);
// if (x1 != nullptr) break;
// if (++spins == 1024) { spins = 1024-1; sched_yield(); }
// }
// x = x1;
// }
// return head;
// }
// }
#endif

View File

@@ -1,820 +0,0 @@
/*************************************************************************
* Copyright (c) 2016-2022, NVIDIA CORPORATION. All rights reserved.
*
* See LICENSE.txt for license information
************************************************************************/
#include "socket.h"
// #include "utils.h"
#include <stdlib.h>
#include <unistd.h>
#include <ifaddrs.h>
#include <net/if.h>
static mscclppResult_t socketProgressOpt(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset, int block, int* closed) {
int bytes = 0;
*closed = 0;
char* data = (char*)ptr;
char line[SOCKET_NAME_MAXLEN+1];
do {
if (op == MSCCLPP_SOCKET_RECV) bytes = recv(sock->fd, data+(*offset), size-(*offset), block ? 0 : MSG_DONTWAIT);
if (op == MSCCLPP_SOCKET_SEND) bytes = send(sock->fd, data+(*offset), size-(*offset), block ? MSG_NOSIGNAL : MSG_DONTWAIT | MSG_NOSIGNAL);
if (op == MSCCLPP_SOCKET_RECV && bytes == 0) {
*closed = 1;
return mscclppSuccess;
}
if (bytes == -1) {
if (errno != EINTR && errno != EWOULDBLOCK && errno != EAGAIN) {
WARN("socketProgressOpt: Call to recv from %s failed : %s", mscclppSocketToString(&sock->addr, line), strerror(errno));
return mscclppRemoteError;
} else {
bytes = 0;
}
}
(*offset) += bytes;
if (sock->abortFlag && *sock->abortFlag != 0) {
INFO(MSCCLPP_NET, "socketProgressOpt: abort called");
return mscclppInternalError;
}
} while (bytes > 0 && (*offset) < size);
return mscclppSuccess;
}
static mscclppResult_t socketProgress(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset) {
int closed;
MSCCLPPCHECK(socketProgressOpt(op, sock, ptr, size, offset, 0, &closed));
if (closed) {
char line[SOCKET_NAME_MAXLEN+1];
WARN("socketProgress: Connection closed by remote peer %s", mscclppSocketToString(&sock->addr, line, 0));
return mscclppRemoteError;
}
return mscclppSuccess;
}
static mscclppResult_t socketWait(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset) {
while (*offset < size)
MSCCLPPCHECK(socketProgress(op, sock, ptr, size, offset));
return mscclppSuccess;
}
/* Format a string representation of a (union mscclppSocketAddress *) socket address using getnameinfo()
*
* Output: "IPv4/IPv6 address<port>"
*/
const char *mscclppSocketToString(union mscclppSocketAddress *addr, char *buf, const int numericHostForm /*= 1*/) {
if (buf == NULL || addr == NULL) return NULL;
struct sockaddr *saddr = &addr->sa;
if (saddr->sa_family != AF_INET && saddr->sa_family != AF_INET6) { buf[0]='\0'; return buf; }
char host[NI_MAXHOST], service[NI_MAXSERV];
/* NI_NUMERICHOST: If set, then the numeric form of the hostname is returned.
* (When not set, this will still happen in case the node's name cannot be determined.)
*/
int flag = NI_NUMERICSERV | (numericHostForm ? NI_NUMERICHOST : 0);
(void) getnameinfo(saddr, sizeof(union mscclppSocketAddress), host, NI_MAXHOST, service, NI_MAXSERV, flag);
sprintf(buf, "%s<%s>", host, service);
return buf;
}
static uint16_t socketToPort(union mscclppSocketAddress *addr) {
struct sockaddr *saddr = &addr->sa;
return ntohs(saddr->sa_family == AF_INET ? addr->sin.sin_port : addr->sin6.sin6_port);
}
/* Allow the user to force the IPv4/IPv6 interface selection */
static int envSocketFamily(void) {
int family = -1; // Family selection is not forced, will use first one found
char* env = getenv("MSCCLPP_SOCKET_FAMILY");
if (env == NULL)
return family;
INFO(MSCCLPP_ENV, "MSCCLPP_SOCKET_FAMILY set by environment to %s", env);
if (strcmp(env, "AF_INET") == 0)
family = AF_INET; // IPv4
else if (strcmp(env, "AF_INET6") == 0)
family = AF_INET6; // IPv6
return family;
}
static int findInterfaces(const char* prefixList, char* names, union mscclppSocketAddress *addrs, int sock_family, int maxIfNameSize, int maxIfs) {
#ifdef ENABLE_TRACE
char line[SOCKET_NAME_MAXLEN+1];
#endif
struct netIf userIfs[MAX_IFS];
bool searchNot = prefixList && prefixList[0] == '^';
if (searchNot) prefixList++;
bool searchExact = prefixList && prefixList[0] == '=';
if (searchExact) prefixList++;
int nUserIfs = parseStringList(prefixList, userIfs, MAX_IFS);
int found = 0;
struct ifaddrs *interfaces, *interface;
getifaddrs(&interfaces);
for (interface = interfaces; interface && found < maxIfs; interface = interface->ifa_next) {
if (interface->ifa_addr == NULL) continue;
/* We only support IPv4 & IPv6 */
int family = interface->ifa_addr->sa_family;
if (family != AF_INET && family != AF_INET6)
continue;
TRACE(MSCCLPP_INIT|MSCCLPP_NET,"Found interface %s:%s", interface->ifa_name, mscclppSocketToString((union mscclppSocketAddress *) interface->ifa_addr, line));
/* Allow the caller to force the socket family type */
if (sock_family != -1 && family != sock_family)
continue;
/* We also need to skip IPv6 loopback interfaces */
if (family == AF_INET6) {
struct sockaddr_in6* sa = (struct sockaddr_in6*)(interface->ifa_addr);
if (IN6_IS_ADDR_LOOPBACK(&sa->sin6_addr)) continue;
}
// check against user specified interfaces
if (!(matchIfList(interface->ifa_name, -1, userIfs, nUserIfs, searchExact) ^ searchNot)) {
continue;
}
// Check that this interface has not already been saved
// getifaddrs() normal order appears to be; IPv4, IPv6 Global, IPv6 Link
bool duplicate = false;
for (int i = 0; i < found; i++) {
if (strcmp(interface->ifa_name, names+i*maxIfNameSize) == 0) { duplicate = true; break; }
}
if (!duplicate) {
// Store the interface name
strncpy(names+found*maxIfNameSize, interface->ifa_name, maxIfNameSize);
// Store the IP address
int salen = (family == AF_INET) ? sizeof(struct sockaddr_in) : sizeof(struct sockaddr_in6);
memcpy(addrs+found, interface->ifa_addr, salen);
found++;
}
}
freeifaddrs(interfaces);
return found;
}
static bool matchSubnet(struct ifaddrs local_if, union mscclppSocketAddress* remote) {
/* Check family first */
int family = local_if.ifa_addr->sa_family;
if (family != remote->sa.sa_family) {
return false;
}
if (family == AF_INET) {
struct sockaddr_in* local_addr = (struct sockaddr_in*)(local_if.ifa_addr);
struct sockaddr_in* mask = (struct sockaddr_in*)(local_if.ifa_netmask);
struct sockaddr_in& remote_addr = remote->sin;
struct in_addr local_subnet, remote_subnet;
local_subnet.s_addr = local_addr->sin_addr.s_addr & mask->sin_addr.s_addr;
remote_subnet.s_addr = remote_addr.sin_addr.s_addr & mask->sin_addr.s_addr;
return (local_subnet.s_addr ^ remote_subnet.s_addr) ? false : true;
} else if (family == AF_INET6) {
struct sockaddr_in6* local_addr = (struct sockaddr_in6*)(local_if.ifa_addr);
struct sockaddr_in6* mask = (struct sockaddr_in6*)(local_if.ifa_netmask);
struct sockaddr_in6& remote_addr = remote->sin6;
struct in6_addr& local_in6 = local_addr->sin6_addr;
struct in6_addr& mask_in6 = mask->sin6_addr;
struct in6_addr& remote_in6 = remote_addr.sin6_addr;
bool same = true;
int len = 16; //IPv6 address is 16 unsigned char
for (int c = 0; c < len; c++) { //Network byte order is big-endian
char c1 = local_in6.s6_addr[c] & mask_in6.s6_addr[c];
char c2 = remote_in6.s6_addr[c] & mask_in6.s6_addr[c];
if (c1 ^ c2) {
same = false;
break;
}
}
// At last, we need to compare scope id
// Two Link-type addresses can have the same subnet address even though they are not in the same scope
// For Global type, this field is 0, so a comparison wouldn't matter
same &= (local_addr->sin6_scope_id == remote_addr.sin6_scope_id);
return same;
} else {
WARN("Net : Unsupported address family type");
return false;
}
}
int mscclppFindInterfaceMatchSubnet(char* ifNames, union mscclppSocketAddress* localAddrs, union mscclppSocketAddress* remoteAddr, int ifNameMaxSize, int maxIfs) {
#ifdef ENABLE_TRACE
char line[SOCKET_NAME_MAXLEN+1];
#endif
char line_a[SOCKET_NAME_MAXLEN+1];
int found = 0;
struct ifaddrs *interfaces, *interface;
getifaddrs(&interfaces);
for (interface = interfaces; interface && !found; interface = interface->ifa_next) {
if (interface->ifa_addr == NULL) continue;
/* We only support IPv4 & IPv6 */
int family = interface->ifa_addr->sa_family;
if (family != AF_INET && family != AF_INET6)
continue;
// check against user specified interfaces
if (!matchSubnet(*interface, remoteAddr)) {
continue;
}
// Store the local IP address
int salen = (family == AF_INET) ? sizeof(struct sockaddr_in) : sizeof(struct sockaddr_in6);
memcpy(localAddrs+found, interface->ifa_addr, salen);
// Store the interface name
strncpy(ifNames+found*ifNameMaxSize, interface->ifa_name, ifNameMaxSize);
TRACE(MSCCLPP_INIT|MSCCLPP_NET,"NET : Found interface %s:%s in the same subnet as remote address %s", interface->ifa_name, mscclppSocketToString(localAddrs+found, line), mscclppSocketToString(remoteAddr, line_a));
found++;
if (found == maxIfs) break;
}
if (found == 0) {
WARN("Net : No interface found in the same subnet as remote address %s", mscclppSocketToString(remoteAddr, line_a));
}
freeifaddrs(interfaces);
return found;
}
mscclppResult_t mscclppSocketGetAddrFromString(union mscclppSocketAddress* ua, const char* ip_port_pair) {
if (!(ip_port_pair && strlen(ip_port_pair) > 1)) {
WARN("Net : string is null");
return mscclppInvalidArgument;
}
bool ipv6 = ip_port_pair[0] == '[';
/* Construct the sockaddress structure */
if (!ipv6) {
struct netIf ni;
// parse <ip_or_hostname>:<port> string, expect one pair
if (parseStringList(ip_port_pair, &ni, 1) != 1) {
WARN("Net : No valid <IPv4_or_hostname>:<port> pair found");
return mscclppInvalidArgument;
}
struct addrinfo hints, *p;
int rv;
memset(&hints, 0, sizeof(hints));
hints.ai_family = AF_UNSPEC;
hints.ai_socktype = SOCK_STREAM;
if ( (rv = getaddrinfo(ni.prefix, NULL, &hints, &p)) != 0) {
WARN("Net : error encountered when getting address info : %s", gai_strerror(rv));
return mscclppInvalidArgument;
}
// use the first
if (p->ai_family == AF_INET) {
struct sockaddr_in& sin = ua->sin;
memcpy(&sin, p->ai_addr, sizeof(struct sockaddr_in));
sin.sin_family = AF_INET; // IPv4
//inet_pton(AF_INET, ni.prefix, &(sin.sin_addr)); // IP address
sin.sin_port = htons(ni.port); // port
} else if (p->ai_family == AF_INET6) {
struct sockaddr_in6& sin6 = ua->sin6;
memcpy(&sin6, p->ai_addr, sizeof(struct sockaddr_in6));
sin6.sin6_family = AF_INET6; // IPv6
sin6.sin6_port = htons(ni.port); // port
sin6.sin6_flowinfo = 0; // needed by IPv6, but possibly obsolete
sin6.sin6_scope_id = 0; // should be global scope, set to 0
} else {
WARN("Net : unsupported IP family");
return mscclppInvalidArgument;
}
freeaddrinfo(p); // all done with this structure
} else {
int i, j = -1, len = strlen(ip_port_pair);
for (i = 1; i < len; i++) {
if (ip_port_pair[i] == '%') j = i;
if (ip_port_pair[i] == ']') break;
}
if (i == len) {
WARN("Net : No valid [IPv6]:port pair found");
return mscclppInvalidArgument;
}
bool global_scope = (j == -1 ? true : false); // If no % found, global scope; otherwise, link scope
char ip_str[NI_MAXHOST], port_str[NI_MAXSERV], if_name[IFNAMSIZ];
memset(ip_str, '\0', sizeof(ip_str));
memset(port_str, '\0', sizeof(port_str));
memset(if_name, '\0', sizeof(if_name));
strncpy(ip_str, ip_port_pair+1, global_scope ? i-1 : j-1);
strncpy(port_str, ip_port_pair+i+2, len-i-1);
int port = atoi(port_str);
if (!global_scope) strncpy(if_name, ip_port_pair+j+1, i-j-1); // If not global scope, we need the intf name
struct sockaddr_in6& sin6 = ua->sin6;
sin6.sin6_family = AF_INET6; // IPv6
inet_pton(AF_INET6, ip_str, &(sin6.sin6_addr)); // IP address
sin6.sin6_port = htons(port); // port
sin6.sin6_flowinfo = 0; // needed by IPv6, but possibly obsolete
sin6.sin6_scope_id = global_scope ? 0 : if_nametoindex(if_name); // 0 if global scope; intf index if link scope
}
return mscclppSuccess;
}
int mscclppFindInterfaces(char* ifNames, union mscclppSocketAddress *ifAddrs, int ifNameMaxSize, int maxIfs) {
static int shownIfName = 0;
int nIfs = 0;
// Allow user to force the INET socket family selection
int sock_family = envSocketFamily();
// User specified interface
char* env = getenv("MSCCLPP_SOCKET_IFNAME");
if (env && strlen(env) > 1) {
INFO(MSCCLPP_ENV, "MSCCLPP_SOCKET_IFNAME set by environment to %s", env);
// Specified by user : find or fail
if (shownIfName++ == 0) INFO(MSCCLPP_NET, "MSCCLPP_SOCKET_IFNAME set to %s", env);
nIfs = findInterfaces(env, ifNames, ifAddrs, sock_family, ifNameMaxSize, maxIfs);
} else {
// Try to automatically pick the right one
// Start with IB
nIfs = findInterfaces("ib", ifNames, ifAddrs, sock_family, ifNameMaxSize, maxIfs);
// else see if we can get some hint from COMM ID
if (nIfs == 0) {
char* commId = getenv("MSCCLPP_COMM_ID");
if (commId && strlen(commId) > 1) {
INFO(MSCCLPP_ENV, "MSCCLPP_COMM_ID set by environment to %s", commId);
// Try to find interface that is in the same subnet as the IP in comm id
union mscclppSocketAddress idAddr;
mscclppSocketGetAddrFromString(&idAddr, commId);
nIfs = mscclppFindInterfaceMatchSubnet(ifNames, ifAddrs, &idAddr, ifNameMaxSize, maxIfs);
}
}
// Then look for anything else (but not docker or lo)
if (nIfs == 0) nIfs = findInterfaces("^docker,lo", ifNames, ifAddrs, sock_family, ifNameMaxSize, maxIfs);
// Finally look for docker, then lo.
if (nIfs == 0) nIfs = findInterfaces("docker", ifNames, ifAddrs, sock_family, ifNameMaxSize, maxIfs);
if (nIfs == 0) nIfs = findInterfaces("lo", ifNames, ifAddrs, sock_family, ifNameMaxSize, maxIfs);
}
return nIfs;
}
mscclppResult_t mscclppSocketListen(struct mscclppSocket* sock) {
if (sock == NULL) {
WARN("mscclppSocketListen: pass NULL socket");
return mscclppInvalidArgument;
}
if (sock->fd == -1) {
WARN("mscclppSocketListen: file descriptor is -1");
return mscclppInvalidArgument;
}
if (socketToPort(&sock->addr)) {
// Port is forced by env. Make sure we get the port.
int opt = 1;
#if defined(SO_REUSEPORT)
SYSCHECK(setsockopt(sock->fd, SOL_SOCKET, SO_REUSEADDR | SO_REUSEPORT, &opt, sizeof(opt)), "setsockopt");
#else
SYSCHECK(setsockopt(sock->fd, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt)), "setsockopt");
#endif
}
// addr port should be 0 (Any port)
SYSCHECK(bind(sock->fd, &sock->addr.sa, sock->salen), "bind");
/* Get the assigned Port */
socklen_t size = sock->salen;
SYSCHECK(getsockname(sock->fd, &sock->addr.sa, &size), "getsockname");
#ifdef ENABLE_TRACE
char line[SOCKET_NAME_MAXLEN+1];
TRACE(MSCCLPP_INIT|MSCCLPP_NET,"Listening on socket %s", mscclppSocketToString(&sock->addr, line));
#endif
/* Put the socket in listen mode
* NB: The backlog will be silently truncated to the value in /proc/sys/net/core/somaxconn
*/
SYSCHECK(listen(sock->fd, 16384), "listen");
sock->state = mscclppSocketStateReady;
return mscclppSuccess;
}
mscclppResult_t mscclppSocketGetAddr(struct mscclppSocket* sock, union mscclppSocketAddress* addr) {
if (sock == NULL) {
WARN("mscclppSocketGetAddr: pass NULL socket");
return mscclppInvalidArgument;
}
if (sock->state != mscclppSocketStateReady) return mscclppInternalError;
memcpy(addr, &sock->addr, sizeof(union mscclppSocketAddress));
return mscclppSuccess;
}
static mscclppResult_t socketTryAccept(struct mscclppSocket* sock) {
socklen_t socklen = sizeof(union mscclppSocketAddress);
sock->fd = accept(sock->acceptFd, &sock->addr.sa, &socklen);
if (sock->fd != -1) {
sock->state = mscclppSocketStateAccepted;
} else if (errno != EAGAIN && errno != EWOULDBLOCK) {
WARN("socketTryAccept: get errno %d that is not EAGAIN or EWOULDBLOCK", errno);
return mscclppSystemError;
}
return mscclppSuccess;
}
static mscclppResult_t socketFinalizeAccept(struct mscclppSocket* sock) {
uint64_t magic;
enum mscclppSocketType type;
int received = 0;
MSCCLPPCHECK(mscclppSocketProgress(MSCCLPP_SOCKET_RECV, sock, &magic, sizeof(magic), &received));
if (received == 0) return mscclppSuccess;
MSCCLPPCHECK(socketWait(MSCCLPP_SOCKET_RECV, sock, &magic, sizeof(magic), &received));
if (magic != sock->magic) {
WARN("socketFinalizeAccept: wrong magic %lx != %lx", magic, sock->magic);
close(sock->fd);
sock->fd = -1;
// Ignore spurious connection and accept again
sock->state = mscclppSocketStateAccepting;
return mscclppSuccess;
} else {
received = 0;
MSCCLPPCHECK(socketWait(MSCCLPP_SOCKET_RECV, sock, &type, sizeof(type), &received));
if (type != sock->type) {
WARN("socketFinalizeAccept: wrong type %d != %d", type, sock->type);
sock->state = mscclppSocketStateError;
close(sock->fd);
sock->fd = -1;
return mscclppInternalError;
} else {
sock->state = mscclppSocketStateReady;
}
}
return mscclppSuccess;
}
static mscclppResult_t socketStartConnect(struct mscclppSocket* sock) {
/* blocking/non-blocking connect() is determined by asyncFlag. */
int ret = connect(sock->fd, &sock->addr.sa, sock->salen);
if (ret == 0) {
sock->state = mscclppSocketStateConnected;
return mscclppSuccess;
} else if (errno == EINPROGRESS) {
sock->state = mscclppSocketStateConnectPolling;
return mscclppSuccess;
} else if (errno == ECONNREFUSED) {
if (++sock->refusedRetries == RETRY_REFUSED_TIMES) {
sock->state = mscclppSocketStateError;
WARN("socketStartConnect: exceeded retries (%d)", sock->refusedRetries);
return mscclppRemoteError;
}
usleep(SLEEP_INT);
if (sock->refusedRetries % 1000 == 0) INFO(MSCCLPP_ALL, "Call to connect returned %s, retrying", strerror(errno));
return mscclppSuccess;
} else if (errno == ETIMEDOUT) {
if (++sock->timedOutRetries == RETRY_TIMEDOUT_TIMES) {
sock->state = mscclppSocketStateError;
WARN("socketStartConnect: exceeded timeouts (%d)", sock->timedOutRetries);
return mscclppRemoteError;
}
usleep(SLEEP_INT);
return mscclppSuccess;
} else {
char line[SOCKET_NAME_MAXLEN+1];
sock->state = mscclppSocketStateError;
WARN("socketStartConnect: Connect to %s failed : %s", mscclppSocketToString(&sock->addr, line), strerror(errno));
return mscclppSystemError;
}
}
static mscclppResult_t socketPollConnect(struct mscclppSocket* sock) {
struct pollfd pfd;
int timeout = 1, ret;
socklen_t rlen = sizeof(int);
memset(&pfd, 0, sizeof(struct pollfd));
pfd.fd = sock->fd;
pfd.events = POLLOUT;
SYSCHECK(ret = poll(&pfd, 1, timeout), "poll");
if (ret == 0) return mscclppSuccess;
/* check socket status */
EQCHECK(ret == 1 && (pfd.revents & POLLOUT), 0);
SYSCHECK(getsockopt(sock->fd, SOL_SOCKET, SO_ERROR, (void*)&ret, &rlen), "getsockopt");
if (ret == 0) {
sock->state = mscclppSocketStateConnected;
} else if (ret == ECONNREFUSED) {
if (++sock->refusedRetries == RETRY_REFUSED_TIMES) {
sock->state = mscclppSocketStateError;
WARN("socketPollConnect: exceeded retries (%d)", sock->refusedRetries);
return mscclppRemoteError;
}
if (sock->refusedRetries % 1000 == 0) INFO(MSCCLPP_ALL, "Call to connect returned %s, retrying", strerror(errno));
usleep(SLEEP_INT);
sock->state = mscclppSocketStateConnecting;
} else if (ret == ETIMEDOUT) {
if (++sock->timedOutRetries == RETRY_TIMEDOUT_TIMES) {
sock->state = mscclppSocketStateError;
WARN("socketPollConnect: exceeded timeouts (%d)", sock->timedOutRetries);
return mscclppRemoteError;
}
usleep(SLEEP_INT);
sock->state = mscclppSocketStateConnecting;
} else if (ret != EINPROGRESS) {
sock->state = mscclppSocketStateError;
return mscclppSystemError;
}
return mscclppSuccess;
}
mscclppResult_t mscclppSocketPollConnect(struct mscclppSocket* sock) {
if (sock == NULL) {
WARN("mscclppSocketPollConnect: pass NULL socket");
return mscclppInvalidArgument;
}
MSCCLPPCHECK(socketPollConnect(sock));
return mscclppSuccess;
}
static mscclppResult_t socketFinalizeConnect(struct mscclppSocket* sock) {
int sent = 0;
MSCCLPPCHECK(socketProgress(MSCCLPP_SOCKET_SEND, sock, &sock->magic, sizeof(sock->magic), &sent));
if (sent == 0) return mscclppSuccess;
MSCCLPPCHECK(socketWait(MSCCLPP_SOCKET_SEND, sock, &sock->magic, sizeof(sock->magic), &sent));
sent = 0;
MSCCLPPCHECK(socketWait(MSCCLPP_SOCKET_SEND, sock, &sock->type, sizeof(sock->type), &sent));
sock->state = mscclppSocketStateReady;
return mscclppSuccess;
}
static mscclppResult_t socketProgressState(struct mscclppSocket* sock) {
if (sock->state == mscclppSocketStateAccepting) {
MSCCLPPCHECK(socketTryAccept(sock));
}
if (sock->state == mscclppSocketStateAccepted) {
MSCCLPPCHECK(socketFinalizeAccept(sock));
}
if (sock->state == mscclppSocketStateConnecting) {
MSCCLPPCHECK(socketStartConnect(sock));
}
if (sock->state == mscclppSocketStateConnectPolling) {
MSCCLPPCHECK(socketPollConnect(sock));
}
if (sock->state == mscclppSocketStateConnected) {
MSCCLPPCHECK(socketFinalizeConnect(sock));
}
return mscclppSuccess;
}
mscclppResult_t mscclppSocketReady(struct mscclppSocket* sock, int *running) {
if (sock == NULL) {
*running = 0;
return mscclppSuccess;
}
if (sock->state == mscclppSocketStateError || sock->state == mscclppSocketStateClosed) {
WARN("mscclppSocketReady: unexpected socket state %d", sock->state);
return mscclppRemoteError;
}
*running = (sock->state == mscclppSocketStateReady) ? 1 : 0;
if (*running == 0) {
MSCCLPPCHECK(socketProgressState(sock));
*running = (sock->state == mscclppSocketStateReady) ? 1 : 0;
}
return mscclppSuccess;
}
mscclppResult_t mscclppSocketConnect(struct mscclppSocket* sock) {
#ifdef ENABLE_TRACE
char line[SOCKET_NAME_MAXLEN+1];
#endif
const int one = 1;
if (sock == NULL) {
WARN("mscclppSocketConnect: pass NULL socket");
return mscclppInvalidArgument;
}
if (sock->fd == -1) {
WARN("mscclppSocketConnect: file descriptor is -1");
return mscclppInvalidArgument;
}
if (sock->state != mscclppSocketStateInitialized) {
WARN("mscclppSocketConnect: wrong socket state %d", sock->state);
if (sock->state == mscclppSocketStateError) return mscclppRemoteError;
return mscclppInternalError;
}
TRACE(MSCCLPP_INIT|MSCCLPP_NET,"Connecting to socket %s", mscclppSocketToString(&sock->addr, line));
SYSCHECK(setsockopt(sock->fd, IPPROTO_TCP, TCP_NODELAY, (char*)&one, sizeof(int)), "setsockopt");
sock->state = mscclppSocketStateConnecting;
do {
MSCCLPPCHECK(socketProgressState(sock));
} while (sock->asyncFlag == 0 &&
(sock->abortFlag == NULL || *sock->abortFlag == 0) &&
(sock->state == mscclppSocketStateConnecting ||
sock->state == mscclppSocketStateConnectPolling ||
sock->state == mscclppSocketStateConnected));
if (sock->abortFlag && *sock->abortFlag != 0) return mscclppInternalError;
switch (sock->state) {
case mscclppSocketStateConnecting:
case mscclppSocketStateConnectPolling:
case mscclppSocketStateConnected:
case mscclppSocketStateReady:
return mscclppSuccess;
case mscclppSocketStateError:
return mscclppSystemError;
default:
WARN("mscclppSocketConnect: wrong socket state %d", sock->state);
return mscclppInternalError;
}
}
mscclppResult_t mscclppSocketAccept(struct mscclppSocket* sock, struct mscclppSocket* listenSock) {
mscclppResult_t ret = mscclppSuccess;
if (listenSock == NULL || sock == NULL) {
WARN("mscclppSocketAccept: pass NULL socket");
ret = mscclppInvalidArgument;
goto exit;
}
if (listenSock->state != mscclppSocketStateReady) {
WARN("mscclppSocketAccept: wrong socket state %d", listenSock->state);
if (listenSock->state == mscclppSocketStateError)
ret = mscclppSystemError;
else
ret = mscclppInternalError;
goto exit;
}
if (sock->acceptFd == -1) {
memcpy(sock, listenSock, sizeof(struct mscclppSocket));
sock->acceptFd = listenSock->fd;
sock->state = mscclppSocketStateAccepting;
}
do {
MSCCLPPCHECKGOTO(socketProgressState(sock), ret, exit);
} while (sock->asyncFlag == 0 &&
(sock->abortFlag == NULL || *sock->abortFlag == 0) &&
(sock->state == mscclppSocketStateAccepting ||
sock->state == mscclppSocketStateAccepted));
if (sock->abortFlag && *sock->abortFlag != 0) return mscclppInternalError;
switch (sock->state) {
case mscclppSocketStateAccepting:
case mscclppSocketStateAccepted:
case mscclppSocketStateReady:
ret = mscclppSuccess;
break;
case mscclppSocketStateError:
ret = mscclppSystemError;
break;
default:
WARN("mscclppSocketAccept: wrong socket state %d", sock->state);
ret = mscclppInternalError;
break;
}
exit:
return ret;
}
mscclppResult_t mscclppSocketInit(struct mscclppSocket* sock, union mscclppSocketAddress* addr, uint64_t magic, enum mscclppSocketType type, volatile uint32_t* abortFlag, int asyncFlag) {
mscclppResult_t ret = mscclppSuccess;
if (sock == NULL) goto exit;
sock->timedOutRetries = 0;
sock->refusedRetries = 0;
sock->abortFlag = abortFlag;
sock->asyncFlag = asyncFlag;
sock->state = mscclppSocketStateInitialized;
sock->magic = magic;
sock->type = type;
sock->fd = -1;
sock->acceptFd = -1;
if (addr) {
/* IPv4/IPv6 support */
int family;
memcpy(&sock->addr, addr, sizeof(union mscclppSocketAddress));
family = sock->addr.sa.sa_family;
if (family != AF_INET && family != AF_INET6) {
char line[SOCKET_NAME_MAXLEN+1];
WARN("mscclppSocketInit: connecting to address %s with family %d is neither AF_INET(%d) nor AF_INET6(%d)",
mscclppSocketToString(&sock->addr, line), family, AF_INET, AF_INET6);
ret = mscclppInternalError;
goto fail;
}
sock->salen = (family == AF_INET) ? sizeof(struct sockaddr_in) : sizeof(struct sockaddr_in6);
/* Connect to a hostname / port */
sock->fd = socket(family, SOCK_STREAM, 0);
if (sock->fd == -1) {
WARN("mscclppSocketInit: Socket creation failed : %s", strerror(errno));
ret = mscclppSystemError;
goto fail;
}
} else {
memset(&sock->addr, 0, sizeof(union mscclppSocketAddress));
}
/* Set socket as non-blocking if async or if we need to be able to abort */
if ((sock->asyncFlag || sock->abortFlag) && sock->fd >= 0) {
int flags;
EQCHECKGOTO(flags = fcntl(sock->fd, F_GETFL), -1, ret, fail);
SYSCHECKGOTO(fcntl(sock->fd, F_SETFL, flags | O_NONBLOCK), ret, fail);
}
exit:
return ret;
fail:
goto exit;
}
mscclppResult_t mscclppSocketProgress(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset) {
if (sock == NULL) {
WARN("mscclppSocketProgress: pass NULL socket");
return mscclppInvalidArgument;
}
MSCCLPPCHECK(socketProgress(op, sock, ptr, size, offset));
return mscclppSuccess;
}
mscclppResult_t mscclppSocketWait(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset) {
if (sock == NULL) {
WARN("mscclppSocketWait: pass NULL socket");
return mscclppInvalidArgument;
}
MSCCLPPCHECK(socketWait(op, sock, ptr, size, offset));
return mscclppSuccess;
}
mscclppResult_t mscclppSocketSend(struct mscclppSocket* sock, void* ptr, int size) {
int offset = 0;
if (sock == NULL) {
WARN("mscclppSocketSend: pass NULL socket");
return mscclppInvalidArgument;
}
if (sock->state != mscclppSocketStateReady) {
WARN("mscclppSocketSend: socket state (%d) is not ready", sock->state);
return mscclppInternalError;
}
MSCCLPPCHECK(socketWait(MSCCLPP_SOCKET_SEND, sock, ptr, size, &offset));
return mscclppSuccess;
}
mscclppResult_t mscclppSocketRecv(struct mscclppSocket* sock, void* ptr, int size) {
int offset = 0;
if (sock == NULL) {
WARN("mscclppSocketRecv: pass NULL socket");
return mscclppInvalidArgument;
}
if (sock->state != mscclppSocketStateReady) {
WARN("mscclppSocketRecv: socket state (%d) is not ready", sock->state);
return mscclppInternalError;
}
MSCCLPPCHECK(socketWait(MSCCLPP_SOCKET_RECV, sock, ptr, size, &offset));
return mscclppSuccess;
}
// Receive or detect connection closed
mscclppResult_t mscclppSocketTryRecv(struct mscclppSocket* sock, void* ptr, int size, int* closed) {
int offset = 0;
if (sock == NULL) {
WARN("mscclppSocketTryRecv: pass NULL socket");
return mscclppInvalidArgument;
}
*closed = 0;
while (offset < size) {
MSCCLPPCHECK(socketProgressOpt(MSCCLPP_SOCKET_RECV, sock, ptr, size, &offset, 0, closed));
if (*closed) return mscclppSuccess;
}
return mscclppSuccess;
}
mscclppResult_t mscclppSocketClose(struct mscclppSocket* sock) {
if (sock != NULL) {
if (sock->fd >= 0) close(sock->fd);
sock->state = mscclppSocketStateClosed;
sock->fd = -1;
}
return mscclppSuccess;
}
mscclppResult_t mscclppSocketGetFd(struct mscclppSocket* sock, int* fd) {
if (sock == NULL) {
WARN("mscclppSocketGetFd: pass NULL socket");
return mscclppInvalidArgument;
}
if (fd) *fd = sock->fd;
return mscclppSuccess;
}
mscclppResult_t mscclppSocketSetFd(int fd, struct mscclppSocket* sock) {
if (sock == NULL) {
WARN("mscclppSocketGetFd: pass NULL socket");
return mscclppInvalidArgument;
}
sock->fd = fd;
return mscclppSuccess;
}

View File

@@ -562,22 +562,22 @@ static mscclppResult_t socketProgressState(struct mscclppSocket* sock) {
return mscclppSuccess;
}
mscclppResult_t mscclppSocketReady(struct mscclppSocket* sock, int *running) {
if (sock == NULL) {
*running = 0;
return mscclppSuccess;
}
if (sock->state == mscclppSocketStateError || sock->state == mscclppSocketStateClosed) {
WARN("mscclppSocketReady: unexpected socket state %d", sock->state);
return mscclppRemoteError;
}
*running = (sock->state == mscclppSocketStateReady) ? 1 : 0;
if (*running == 0) {
MSCCLPPCHECK(socketProgressState(sock));
*running = (sock->state == mscclppSocketStateReady) ? 1 : 0;
}
return mscclppSuccess;
}
// mscclppResult_t mscclppSocketReady(struct mscclppSocket* sock, int *running) {
// if (sock == NULL) {
// *running = 0;
// return mscclppSuccess;
// }
// if (sock->state == mscclppSocketStateError || sock->state == mscclppSocketStateClosed) {
// WARN("mscclppSocketReady: unexpected socket state %d", sock->state);
// return mscclppRemoteError;
// }
// *running = (sock->state == mscclppSocketStateReady) ? 1 : 0;
// if (*running == 0) {
// MSCCLPPCHECK(socketProgressState(sock));
// *running = (sock->state == mscclppSocketStateReady) ? 1 : 0;
// }
// return mscclppSuccess;
// }
mscclppResult_t mscclppSocketConnect(struct mscclppSocket* sock) {
#ifdef ENABLE_TRACE
@@ -740,14 +740,14 @@ mscclppResult_t mscclppSocketProgress(int op, struct mscclppSocket* sock, void*
return mscclppSuccess;
}
mscclppResult_t mscclppSocketWait(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset) {
if (sock == NULL) {
WARN("mscclppSocketWait: pass NULL socket");
return mscclppInvalidArgument;
}
MSCCLPPCHECK(socketWait(op, sock, ptr, size, offset));
return mscclppSuccess;
}
// mscclppResult_t mscclppSocketWait(int op, struct mscclppSocket* sock, void* ptr, int size, int* offset) {
// if (sock == NULL) {
// WARN("mscclppSocketWait: pass NULL socket");
// return mscclppInvalidArgument;
// }
// MSCCLPPCHECK(socketWait(op, sock, ptr, size, offset));
// return mscclppSuccess;
// }
mscclppResult_t mscclppSocketSend(struct mscclppSocket* sock, void* ptr, int size) {
int offset = 0;
@@ -778,19 +778,19 @@ mscclppResult_t mscclppSocketRecv(struct mscclppSocket* sock, void* ptr, int siz
}
// Receive or detect connection closed
mscclppResult_t mscclppSocketTryRecv(struct mscclppSocket* sock, void* ptr, int size, int* closed) {
int offset = 0;
if (sock == NULL) {
WARN("mscclppSocketTryRecv: pass NULL socket");
return mscclppInvalidArgument;
}
*closed = 0;
while (offset < size) {
MSCCLPPCHECK(socketProgressOpt(MSCCLPP_SOCKET_RECV, sock, ptr, size, &offset, 0, closed));
if (*closed) return mscclppSuccess;
}
return mscclppSuccess;
}
// mscclppResult_t mscclppSocketTryRecv(struct mscclppSocket* sock, void* ptr, int size, int* closed) {
// int offset = 0;
// if (sock == NULL) {
// WARN("mscclppSocketTryRecv: pass NULL socket");
// return mscclppInvalidArgument;
// }
// *closed = 0;
// while (offset < size) {
// MSCCLPPCHECK(socketProgressOpt(MSCCLPP_SOCKET_RECV, sock, ptr, size, &offset, 0, closed));
// if (*closed) return mscclppSuccess;
// }
// return mscclppSuccess;
// }
mscclppResult_t mscclppSocketClose(struct mscclppSocket* sock) {
if (sock != NULL) {
@@ -801,20 +801,20 @@ mscclppResult_t mscclppSocketClose(struct mscclppSocket* sock) {
return mscclppSuccess;
}
mscclppResult_t mscclppSocketGetFd(struct mscclppSocket* sock, int* fd) {
if (sock == NULL) {
WARN("mscclppSocketGetFd: pass NULL socket");
return mscclppInvalidArgument;
}
if (fd) *fd = sock->fd;
return mscclppSuccess;
}
// mscclppResult_t mscclppSocketGetFd(struct mscclppSocket* sock, int* fd) {
// if (sock == NULL) {
// WARN("mscclppSocketGetFd: pass NULL socket");
// return mscclppInvalidArgument;
// }
// if (fd) *fd = sock->fd;
// return mscclppSuccess;
// }
mscclppResult_t mscclppSocketSetFd(int fd, struct mscclppSocket* sock) {
if (sock == NULL) {
WARN("mscclppSocketGetFd: pass NULL socket");
return mscclppInvalidArgument;
}
sock->fd = fd;
return mscclppSuccess;
}
// mscclppResult_t mscclppSocketSetFd(int fd, struct mscclppSocket* sock) {
// if (sock == NULL) {
// WARN("mscclppSocketGetFd: pass NULL socket");
// return mscclppInvalidArgument;
// }
// sock->fd = fd;
// return mscclppSuccess;
// }

View File

@@ -12,14 +12,14 @@
#include <stdlib.h>
// Get current Compute Capability
int mscclppCudaCompCap() {
int cudaDev;
if (cudaGetDevice(&cudaDev) != cudaSuccess) return 0;
int ccMajor, ccMinor;
if (cudaDeviceGetAttribute(&ccMajor, cudaDevAttrComputeCapabilityMajor, cudaDev) != cudaSuccess) return 0;
if (cudaDeviceGetAttribute(&ccMinor, cudaDevAttrComputeCapabilityMinor, cudaDev) != cudaSuccess) return 0;
return ccMajor*10+ccMinor;
}
// int mscclppCudaCompCap() {
// int cudaDev;
// if (cudaGetDevice(&cudaDev) != cudaSuccess) return 0;
// int ccMajor, ccMinor;
// if (cudaDeviceGetAttribute(&ccMajor, cudaDevAttrComputeCapabilityMajor, cudaDev) != cudaSuccess) return 0;
// if (cudaDeviceGetAttribute(&ccMinor, cudaDevAttrComputeCapabilityMinor, cudaDev) != cudaSuccess) return 0;
// return ccMajor*10+ccMinor;
// }
mscclppResult_t int64ToBusId(int64_t id, char* busId) {
sprintf(busId, "%04lx:%02lx:%02lx.%01lx", (id) >> 20, (id & 0xff000) >> 12, (id & 0xff0) >> 4, (id & 0xf));
@@ -193,101 +193,101 @@ bool matchIfList(const char* string, int port, struct netIf* ifList, int listSiz
return false;
}
__thread struct mscclppThreadSignal mscclppThreadSignalLocalInstance = mscclppThreadSignalStaticInitializer();
// __thread struct mscclppThreadSignal mscclppThreadSignalLocalInstance = mscclppThreadSignalStaticInitializer();
void* mscclppMemoryStack::allocateSpilled(struct mscclppMemoryStack* me, size_t size, size_t align) {
// `me->hunks` points to the top of the stack non-empty hunks. Hunks above
// this (reachable via `->above`) are empty.
struct Hunk* top = me->topFrame.hunk;
size_t mallocSize = 0;
// void* mscclppMemoryStack::allocateSpilled(struct mscclppMemoryStack* me, size_t size, size_t align) {
// // `me->hunks` points to the top of the stack non-empty hunks. Hunks above
// // this (reachable via `->above`) are empty.
// struct Hunk* top = me->topFrame.hunk;
// size_t mallocSize = 0;
// If we have lots of space left in hunk but that wasn't enough then we'll
// allocate the object unhunked.
if (me->topFrame.end - me->topFrame.bumper >= 8<<10)
goto unhunked;
// // If we have lots of space left in hunk but that wasn't enough then we'll
// // allocate the object unhunked.
// if (me->topFrame.end - me->topFrame.bumper >= 8<<10)
// goto unhunked;
// If we have another hunk (which must be empty) waiting above this one and
// the object fits then use that.
if (top && top->above) {
struct Hunk* top1 = top->above;
uintptr_t uobj = (reinterpret_cast<uintptr_t>(top1) + sizeof(struct Hunk) + align-1) & -uintptr_t(align);
if (uobj + size <= reinterpret_cast<uintptr_t>(top1) + top1->size) {
me->topFrame.hunk = top1;
me->topFrame.bumper = uobj + size;
me->topFrame.end = reinterpret_cast<uintptr_t>(top1) + top1->size;
return reinterpret_cast<void*>(uobj);
}
}
// // If we have another hunk (which must be empty) waiting above this one and
// // the object fits then use that.
// if (top && top->above) {
// struct Hunk* top1 = top->above;
// uintptr_t uobj = (reinterpret_cast<uintptr_t>(top1) + sizeof(struct Hunk) + align-1) & -uintptr_t(align);
// if (uobj + size <= reinterpret_cast<uintptr_t>(top1) + top1->size) {
// me->topFrame.hunk = top1;
// me->topFrame.bumper = uobj + size;
// me->topFrame.end = reinterpret_cast<uintptr_t>(top1) + top1->size;
// return reinterpret_cast<void*>(uobj);
// }
// }
{ // If the next hunk we're going to allocate wouldn't be big enough but the
// Unhunk proxy fits in the current hunk then go allocate as unhunked.
size_t nextSize = (top ? top->size : 0) + (64<<10);
constexpr size_t maxAlign = 64;
if (nextSize < sizeof(struct Hunk) + maxAlign + size) {
uintptr_t uproxy = (me->topFrame.bumper + alignof(Unhunk)-1) & -uintptr_t(alignof(Unhunk));
if (uproxy + sizeof(struct Unhunk) <= me->topFrame.end)
goto unhunked;
}
// { // If the next hunk we're going to allocate wouldn't be big enough but the
// // Unhunk proxy fits in the current hunk then go allocate as unhunked.
// size_t nextSize = (top ? top->size : 0) + (64<<10);
// constexpr size_t maxAlign = 64;
// if (nextSize < sizeof(struct Hunk) + maxAlign + size) {
// uintptr_t uproxy = (me->topFrame.bumper + alignof(Unhunk)-1) & -uintptr_t(alignof(Unhunk));
// if (uproxy + sizeof(struct Unhunk) <= me->topFrame.end)
// goto unhunked;
// }
// At this point we must need another hunk, either to fit the object
// itself or its Unhunk proxy.
mallocSize = nextSize;
INFO(MSCCLPP_ALLOC, "%s:%d memory stack hunk malloc(%llu)", __FILE__, __LINE__, (unsigned long long)mallocSize);
struct Hunk *top1 = (struct Hunk*)malloc(mallocSize);
if (top1 == nullptr) goto malloc_exhausted;
top1->size = nextSize;
top1->above = nullptr;
if (top) top->above = top1;
top = top1;
me->topFrame.hunk = top;
me->topFrame.end = reinterpret_cast<uintptr_t>(top) + nextSize;
me->topFrame.bumper = reinterpret_cast<uintptr_t>(top) + sizeof(struct Hunk);
}
// // At this point we must need another hunk, either to fit the object
// // itself or its Unhunk proxy.
// mallocSize = nextSize;
// INFO(MSCCLPP_ALLOC, "%s:%d memory stack hunk malloc(%llu)", __FILE__, __LINE__, (unsigned long long)mallocSize);
// struct Hunk *top1 = (struct Hunk*)malloc(mallocSize);
// if (top1 == nullptr) goto malloc_exhausted;
// top1->size = nextSize;
// top1->above = nullptr;
// if (top) top->above = top1;
// top = top1;
// me->topFrame.hunk = top;
// me->topFrame.end = reinterpret_cast<uintptr_t>(top) + nextSize;
// me->topFrame.bumper = reinterpret_cast<uintptr_t>(top) + sizeof(struct Hunk);
// }
{ // Try to fit object in the new top hunk.
uintptr_t uobj = (me->topFrame.bumper + align-1) & -uintptr_t(align);
if (uobj + size <= me->topFrame.end) {
me->topFrame.bumper = uobj + size;
return reinterpret_cast<void*>(uobj);
}
}
// { // Try to fit object in the new top hunk.
// uintptr_t uobj = (me->topFrame.bumper + align-1) & -uintptr_t(align);
// if (uobj + size <= me->topFrame.end) {
// me->topFrame.bumper = uobj + size;
// return reinterpret_cast<void*>(uobj);
// }
// }
unhunked:
{ // We need to allocate the object out-of-band and put an Unhunk proxy in-band
// to keep track of it.
uintptr_t uproxy = (me->topFrame.bumper + alignof(Unhunk)-1) & -uintptr_t(alignof(Unhunk));
Unhunk* proxy = reinterpret_cast<Unhunk*>(uproxy);
me->topFrame.bumper = uproxy + sizeof(Unhunk);
proxy->next = me->topFrame.unhunks;
me->topFrame.unhunks = proxy;
mallocSize = size;
proxy->obj = malloc(mallocSize);
INFO(MSCCLPP_ALLOC, "%s:%d memory stack non-hunk malloc(%llu)", __FILE__, __LINE__, (unsigned long long)mallocSize);
if (proxy->obj == nullptr) goto malloc_exhausted;
return proxy->obj;
}
// unhunked:
// { // We need to allocate the object out-of-band and put an Unhunk proxy in-band
// // to keep track of it.
// uintptr_t uproxy = (me->topFrame.bumper + alignof(Unhunk)-1) & -uintptr_t(alignof(Unhunk));
// Unhunk* proxy = reinterpret_cast<Unhunk*>(uproxy);
// me->topFrame.bumper = uproxy + sizeof(Unhunk);
// proxy->next = me->topFrame.unhunks;
// me->topFrame.unhunks = proxy;
// mallocSize = size;
// proxy->obj = malloc(mallocSize);
// INFO(MSCCLPP_ALLOC, "%s:%d memory stack non-hunk malloc(%llu)", __FILE__, __LINE__, (unsigned long long)mallocSize);
// if (proxy->obj == nullptr) goto malloc_exhausted;
// return proxy->obj;
// }
malloc_exhausted:
WARN("%s:%d Unrecoverable error detected: malloc(size=%llu) returned null.", __FILE__, __LINE__, (unsigned long long)mallocSize);
abort();
}
// malloc_exhausted:
// WARN("%s:%d Unrecoverable error detected: malloc(size=%llu) returned null.", __FILE__, __LINE__, (unsigned long long)mallocSize);
// abort();
// }
void mscclppMemoryStackDestruct(struct mscclppMemoryStack* me) {
// Free unhunks first because both the frames and unhunk proxies lie within the hunks.
struct mscclppMemoryStack::Frame* f = &me->topFrame;
while (f != nullptr) {
struct mscclppMemoryStack::Unhunk* u = f->unhunks;
while (u != nullptr) {
free(u->obj);
u = u->next;
}
f = f->below;
}
// Free hunks
struct mscclppMemoryStack::Hunk* h = me->stub.above;
while (h != nullptr) {
struct mscclppMemoryStack::Hunk *h1 = h->above;
free(h);
h = h1;
}
}
// void mscclppMemoryStackDestruct(struct mscclppMemoryStack* me) {
// // Free unhunks first because both the frames and unhunk proxies lie within the hunks.
// struct mscclppMemoryStack::Frame* f = &me->topFrame;
// while (f != nullptr) {
// struct mscclppMemoryStack::Unhunk* u = f->unhunks;
// while (u != nullptr) {
// free(u->obj);
// u = u->next;
// }
// f = f->below;
// }
// // Free hunks
// struct mscclppMemoryStack::Hunk* h = me->stub.above;
// while (h != nullptr) {
// struct mscclppMemoryStack::Hunk *h1 = h->above;
// free(h);
// h = h1;
// }
// }