mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-27 06:39:25 +01:00
common : add support for cpu_get_num_physical_cores() on Windows (#8771)
* Add support for cpu_get_num_phsical_cores() on Windows * fix build bug on msys2-clang64 and ucrt64 * avoid adding new function * add new macros to avoid windows+mingw64 * Add error checking to return default value
This commit is contained in:
parent
2a24c8caa6
commit
fb487bb567
@ -110,8 +110,34 @@ int32_t cpu_get_num_physical_cores() {
|
|||||||
if (result == 0) {
|
if (result == 0) {
|
||||||
return num_physical_cores;
|
return num_physical_cores;
|
||||||
}
|
}
|
||||||
#elif defined(_WIN32)
|
#elif defined(_WIN32) && (_WIN32_WINNT >= 0x0601) && !defined(__MINGW64__) // windows 7 and later
|
||||||
//TODO: Implement
|
// TODO: windows + arm64 + mingw64
|
||||||
|
unsigned int n_threads_win = std::thread::hardware_concurrency();
|
||||||
|
unsigned int default_threads = n_threads_win > 0 ? (n_threads_win <= 4 ? n_threads_win : n_threads_win / 2) : 4;
|
||||||
|
|
||||||
|
DWORD buffer_size = 0;
|
||||||
|
if (!GetLogicalProcessorInformationEx(RelationProcessorCore, nullptr, &buffer_size)) {
|
||||||
|
if (GetLastError() != ERROR_INSUFFICIENT_BUFFER) {
|
||||||
|
return default_threads;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
std::vector<char> buffer(buffer_size);
|
||||||
|
if (!GetLogicalProcessorInformationEx(RelationProcessorCore, reinterpret_cast<PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX>(buffer.data()), &buffer_size)) {
|
||||||
|
return default_threads;
|
||||||
|
}
|
||||||
|
|
||||||
|
int32_t num_physical_cores = 0;
|
||||||
|
PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX info = reinterpret_cast<PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX>(buffer.data());
|
||||||
|
while (buffer_size > 0) {
|
||||||
|
if (info->Relationship == RelationProcessorCore) {
|
||||||
|
num_physical_cores += info->Processor.GroupCount;
|
||||||
|
}
|
||||||
|
buffer_size -= info->Size;
|
||||||
|
info = reinterpret_cast<PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX>(reinterpret_cast<char*>(info) + info->Size);
|
||||||
|
}
|
||||||
|
|
||||||
|
return num_physical_cores > 0 ? num_physical_cores : default_threads;
|
||||||
#endif
|
#endif
|
||||||
unsigned int n_threads = std::thread::hardware_concurrency();
|
unsigned int n_threads = std::thread::hardware_concurrency();
|
||||||
return n_threads > 0 ? (n_threads <= 4 ? n_threads : n_threads / 2) : 4;
|
return n_threads > 0 ? (n_threads <= 4 ? n_threads : n_threads / 2) : 4;
|
||||||
@ -1727,7 +1753,13 @@ std::string gpt_params_get_system_info(const gpt_params & params) {
|
|||||||
if (params.n_threads_batch != -1) {
|
if (params.n_threads_batch != -1) {
|
||||||
os << " (n_threads_batch = " << params.n_threads_batch << ")";
|
os << " (n_threads_batch = " << params.n_threads_batch << ")";
|
||||||
}
|
}
|
||||||
|
#if defined(_WIN32) && (_WIN32_WINNT >= 0x0601) && !defined(__MINGW64__) // windows 7 and later
|
||||||
|
// TODO: windows + arm64 + mingw64
|
||||||
|
DWORD logicalProcessorCount = GetActiveProcessorCount(ALL_PROCESSOR_GROUPS);
|
||||||
|
os << " / " << logicalProcessorCount << " | " << llama_print_system_info();
|
||||||
|
#else
|
||||||
os << " / " << std::thread::hardware_concurrency() << " | " << llama_print_system_info();
|
os << " / " << std::thread::hardware_concurrency() << " | " << llama_print_system_info();
|
||||||
|
#endif
|
||||||
|
|
||||||
return os.str();
|
return os.str();
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user