mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2026-05-11 00:10:07 +00:00
add balance-serve, support concurrence
This commit is contained in:
@@ -68,4 +68,4 @@ PYBIND11_MODULE(KTransformersOps, m) {
|
||||
py::arg("perm"), py::arg("workspace"), py::arg("num_bits"), py::arg("size_m"),
|
||||
py::arg("size_n"), py::arg("size_k"), py::arg("is_k_full"));
|
||||
#endif
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user