mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-31 22:04:35 +00:00
Updated preloader to use multithreading
Tested on Windows - a small performance hit during loading is not avoidable but this is the fastest method I found On Linux - madvise needs a test if it's working. otherwise readahead() needs to be implemented in the TODO region
This commit is contained in:
parent
f4c1c6b97a
commit
6e65b8a817
@ -225,13 +225,19 @@ struct llama_mmap {
|
|||||||
perror("sysconf");
|
perror("sysconf");
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
#ifdef _WIN32
|
||||||
HANDLE hProcess = GetCurrentProcess();
|
HANDLE hProcess = GetCurrentProcess();
|
||||||
WIN32_MEMORY_RANGE_ENTRY range;
|
WIN32_MEMORY_RANGE_ENTRY range;
|
||||||
range.VirtualAddress = addr;
|
range.VirtualAddress = addr;
|
||||||
range.NumberOfBytes = length;
|
range.NumberOfBytes = length;
|
||||||
|
|
||||||
// if (!VirtualLock(addr, length)) { }; // no benefit. for systems with too little RAM we should lock a part and restrict the preload to that new length
|
// if (!VirtualLock(addr, length)) { }; // no benefit. for systems with too little RAM we should lock a part and restrict the preload to that new length
|
||||||
if (!PrefetchVirtualMemory(hProcess, 1, &range, 0)) { }; // Prefetches part of the data and signals readahead to the file system
|
if (!PrefetchVirtualMemory(hProcess, 1, &range, 0)) { }; // Prefetches part of the data and signals readahead to the file system
|
||||||
|
#else
|
||||||
|
// todo
|
||||||
|
//if (posix_madvise(addr, length, POSIX_MADV_WILLNEED) == -1) { };
|
||||||
|
// readahead() should be the equivalent method for Linux. I don't think madvise will cause a full fetch
|
||||||
|
// the multi threaded read below is pseudo sequential, it also needs a test without OS level readahead in place (worst case set threads to 1 in linux or return)
|
||||||
|
#endif
|
||||||
|
|
||||||
if (n_threads > 32)
|
if (n_threads > 32)
|
||||||
n_threads = 32;
|
n_threads = 32;
|
||||||
|
Loading…
Reference in New Issue
Block a user