mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2026-05-21 04:49:03 +00:00
add kt-kernel
This commit is contained in:
81
kt-kernel/cpu_backend/shared_mem_buffer.cpp
Normal file
81
kt-kernel/cpu_backend/shared_mem_buffer.cpp
Normal file
@@ -0,0 +1,81 @@
|
||||
/**
|
||||
* @Description :
|
||||
* @Author : chenht2022
|
||||
* @Date : 2024-08-05 04:49:08
|
||||
* @Version : 1.0.0
|
||||
* @LastEditors : chenht2022
|
||||
* @LastEditTime : 2024-08-05 09:21:29
|
||||
* @Copyright (c) 2024 by KVCache.AI, All Rights Reserved.
|
||||
**/
|
||||
#include "shared_mem_buffer.h"
|
||||
|
||||
#include <numa.h>
|
||||
|
||||
#include <cstdio>
|
||||
|
||||
size_t MemoryRequest::total_size() {
|
||||
size_t total = 0;
|
||||
for (size_t i = 0; i < sizes.size(); ++i) {
|
||||
total += sizes[i];
|
||||
}
|
||||
return total;
|
||||
}
|
||||
|
||||
void MemoryRequest::update_base_ptr(void* base) {
|
||||
size_t total_offset = 0;
|
||||
for (size_t i = 0; i < funcs.size(); ++i) {
|
||||
funcs[i]((uint8_t*)base + total_offset);
|
||||
total_offset += sizes[i];
|
||||
}
|
||||
}
|
||||
|
||||
void MemoryRequest::append_function(std::function<void(void*)> func, size_t size) {
|
||||
funcs.push_back(func);
|
||||
sizes.push_back(size);
|
||||
}
|
||||
|
||||
SharedMemBuffer::SharedMemBuffer() {
|
||||
buffer = nullptr;
|
||||
size = 0;
|
||||
}
|
||||
|
||||
SharedMemBuffer::~SharedMemBuffer() {
|
||||
if (buffer) {
|
||||
free(buffer);
|
||||
}
|
||||
}
|
||||
|
||||
void SharedMemBuffer::alloc(void* object, MemoryRequest requests) {
|
||||
size_t total_size = requests.total_size();
|
||||
object_requests.push_back(requests);
|
||||
|
||||
if (total_size > size) {
|
||||
if (buffer) {
|
||||
free(buffer);
|
||||
}
|
||||
buffer = std::aligned_alloc(64, total_size);
|
||||
if (!buffer) {
|
||||
printf("cannot aligned alloc %ld bytes\n", total_size);
|
||||
perror("aligned_alloc"); // errno == ENOMEM/EINVAL
|
||||
exit(1);
|
||||
}
|
||||
size = total_size;
|
||||
for (auto& req : object_requests) {
|
||||
req.update_base_ptr(buffer);
|
||||
}
|
||||
} else {
|
||||
requests.update_base_ptr(buffer);
|
||||
}
|
||||
}
|
||||
|
||||
void SharedMemBufferNuma::alloc(int numa, void* object, MemoryRequest requests) {
|
||||
std::lock_guard<std::mutex> guard(lock);
|
||||
if (numa != numa_node_of_cpu(sched_getcpu())) {
|
||||
printf("alloc %d from other numa for %lx\n", numa, reinterpret_cast<intptr_t>(object));
|
||||
}
|
||||
if (numa_mem.count(numa) == 0) {
|
||||
numa_mem[numa] = std::unique_ptr<SharedMemBuffer>(new SharedMemBuffer());
|
||||
}
|
||||
// printf("numa %d alloc for %lx\n", numa,reinterpret_cast<intptr_t> (object));
|
||||
numa_mem.at(numa)->alloc(object, requests);
|
||||
}
|
||||
Reference in New Issue
Block a user