mirror of
https://github.com/vosen/ZLUDA.git
synced 2025-08-03 06:40:21 +00:00
Improve ZLUDA injection (#37)
Improve injector&redirector so it's no longer required to manually mess with files if the application links nvcuda.dll. Additionally inject into child processes
This commit is contained in:
parent
972f612562
commit
36514bd6eb
5 changed files with 664 additions and 79 deletions
|
@ -52,13 +52,16 @@ Overall, ZLUDA is slower in GeekBench by roughly 2%.
|
||||||
|
|
||||||
### Windows
|
### Windows
|
||||||
You should have the most recent Intel GPU drivers installed.\
|
You should have the most recent Intel GPU drivers installed.\
|
||||||
Copy `nvcuda.dll` to the application directory (the directory where .exe file is) and launch it normally
|
Run your application like this:
|
||||||
|
```
|
||||||
|
<ZLUDA_DIRECTORY>\zluda_with.exe -- <APPLICATION> <APPLICATIONS_ARGUMENTS>
|
||||||
|
```
|
||||||
|
|
||||||
### Linux
|
### Linux
|
||||||
A very recent version of [compute-runtime](https://github.com/intel/compute-runtime) and [Level Zero loader](https://github.com/oneapi-src/level-zero/releases) are required. At the time of writing, 20.45.18403 is the oldest recommended version.
|
A very recent version of [compute-runtime](https://github.com/intel/compute-runtime) and [Level Zero loader](https://github.com/oneapi-src/level-zero/releases) are required. At the time of writing, 20.45.18403 is the oldest recommended version.
|
||||||
Run your application like this:
|
Run your application like this:
|
||||||
```
|
```
|
||||||
LD_LIBRARY_PATH=<PATH_TO_THE_DIRECTORY_WITH_ZLUDA_PROVIDED_LIBCUDA> <YOUR_APPLICATION>
|
LD_LIBRARY_PATH=<ZLUDA_DIRECTORY> <APPLICATION> <APPLICATIONS_ARGUMENTS>
|
||||||
```
|
```
|
||||||
|
|
||||||
## Building
|
## Building
|
||||||
|
|
|
@ -14,7 +14,7 @@ lz4-sys = "1.9"
|
||||||
regex = "1.4"
|
regex = "1.4"
|
||||||
|
|
||||||
[target.'cfg(windows)'.dependencies]
|
[target.'cfg(windows)'.dependencies]
|
||||||
winapi = { version = "0.3", features = ["libloaderapi", "debugapi"] }
|
winapi = { version = "0.3", features = ["libloaderapi", "debugapi", "std"] }
|
||||||
wchar = "0.6"
|
wchar = "0.6"
|
||||||
detours-sys = { path = "../detours-sys" }
|
detours-sys = { path = "../detours-sys" }
|
||||||
|
|
||||||
|
|
|
@ -9,5 +9,5 @@ name = "zluda_with"
|
||||||
path = "src/main.rs"
|
path = "src/main.rs"
|
||||||
|
|
||||||
[target.'cfg(windows)'.dependencies]
|
[target.'cfg(windows)'.dependencies]
|
||||||
winapi = { version = "0.3", features = ["jobapi2", "processthreadsapi", "std", "synchapi", "winbase"] }
|
winapi = { version = "0.3", features = ["jobapi2", "processthreadsapi", "synchapi", "winbase", "std"] }
|
||||||
detours-sys = { path = "../detours-sys" }
|
detours-sys = { path = "../detours-sys" }
|
||||||
|
|
|
@ -10,4 +10,4 @@ crate-type = ["cdylib"]
|
||||||
[target.'cfg(windows)'.dependencies]
|
[target.'cfg(windows)'.dependencies]
|
||||||
detours-sys = { path = "../detours-sys" }
|
detours-sys = { path = "../detours-sys" }
|
||||||
wchar = "0.6"
|
wchar = "0.6"
|
||||||
winapi = { version = "0.3", features = ["processthreadsapi", "winbase", "winnt", "winerror", "libloaderapi", "std"] }
|
winapi = { version = "0.3", features = ["processthreadsapi", "winbase", "winnt", "winerror", "libloaderapi", "tlhelp32", "std"] }
|
|
@ -3,19 +3,49 @@
|
||||||
extern crate detours_sys;
|
extern crate detours_sys;
|
||||||
extern crate winapi;
|
extern crate winapi;
|
||||||
|
|
||||||
use std::{mem, ptr, slice};
|
use std::{
|
||||||
|
ffi::c_void,
|
||||||
|
mem,
|
||||||
|
os::raw::{c_int, c_uint, c_ulong},
|
||||||
|
ptr, slice, usize,
|
||||||
|
};
|
||||||
|
|
||||||
use detours_sys::{
|
use detours_sys::{
|
||||||
DetourAttach, DetourDetach, DetourRestoreAfterWith, DetourTransactionBegin,
|
DetourAttach, DetourDetach, DetourRestoreAfterWith, DetourTransactionAbort,
|
||||||
DetourTransactionCommit, DetourUpdateThread,
|
DetourTransactionBegin, DetourTransactionCommit, DetourUpdateProcessWithDll,
|
||||||
|
DetourUpdateThread,
|
||||||
};
|
};
|
||||||
use wchar::wch;
|
use wchar::wch;
|
||||||
use winapi::um::processthreadsapi::GetCurrentThread;
|
use winapi::{
|
||||||
use winapi::um::winnt::{DLL_PROCESS_ATTACH, DLL_PROCESS_DETACH, HANDLE, LPCWSTR};
|
shared::minwindef::{BOOL, LPVOID},
|
||||||
|
um::{
|
||||||
|
handleapi::{CloseHandle, INVALID_HANDLE_VALUE},
|
||||||
|
minwinbase::LPSECURITY_ATTRIBUTES,
|
||||||
|
processthreadsapi::{
|
||||||
|
CreateProcessA, GetCurrentProcessId, GetCurrentThread, GetCurrentThreadId, OpenThread,
|
||||||
|
ResumeThread, SuspendThread, TerminateProcess, LPPROCESS_INFORMATION, LPSTARTUPINFOA,
|
||||||
|
LPSTARTUPINFOW,
|
||||||
|
},
|
||||||
|
tlhelp32::{
|
||||||
|
CreateToolhelp32Snapshot, Thread32First, Thread32Next, TH32CS_SNAPTHREAD, THREADENTRY32,
|
||||||
|
},
|
||||||
|
winbase::CREATE_SUSPENDED,
|
||||||
|
winnt::{LPSTR, LPWSTR, THREAD_SUSPEND_RESUME},
|
||||||
|
},
|
||||||
|
};
|
||||||
use winapi::{
|
use winapi::{
|
||||||
shared::minwindef::{DWORD, FALSE, HMODULE, TRUE},
|
shared::minwindef::{DWORD, FALSE, HMODULE, TRUE},
|
||||||
um::{libloaderapi::LoadLibraryExA, winnt::LPCSTR},
|
um::{libloaderapi::LoadLibraryExA, winnt::LPCSTR},
|
||||||
};
|
};
|
||||||
|
use winapi::{
|
||||||
|
shared::minwindef::{FARPROC, HINSTANCE},
|
||||||
|
um::{
|
||||||
|
libloaderapi::{GetModuleFileNameA, GetProcAddress},
|
||||||
|
processthreadsapi::{CreateProcessAsUserW, CreateProcessW},
|
||||||
|
winbase::{CreateProcessWithLogonW, CreateProcessWithTokenW},
|
||||||
|
winnt::{DLL_PROCESS_ATTACH, DLL_PROCESS_DETACH, HANDLE, LPCWSTR},
|
||||||
|
},
|
||||||
|
};
|
||||||
use winapi::{
|
use winapi::{
|
||||||
shared::winerror::NO_ERROR,
|
shared::winerror::NO_ERROR,
|
||||||
um::libloaderapi::{LoadLibraryA, LoadLibraryExW, LoadLibraryW},
|
um::libloaderapi::{LoadLibraryA, LoadLibraryExW, LoadLibraryW},
|
||||||
|
@ -27,6 +57,12 @@ const NVCUDA_UTF8: &'static str = "NVCUDA.DLL";
|
||||||
const NVCUDA_UTF16: &[u16] = wch!("NVCUDA.DLL");
|
const NVCUDA_UTF16: &[u16] = wch!("NVCUDA.DLL");
|
||||||
static mut ZLUDA_PATH_UTF8: Vec<u8> = Vec::new();
|
static mut ZLUDA_PATH_UTF8: Vec<u8> = Vec::new();
|
||||||
static mut ZLUDA_PATH_UTF16: Option<&'static [u16]> = None;
|
static mut ZLUDA_PATH_UTF16: Option<&'static [u16]> = None;
|
||||||
|
static mut DETACH_LOAD_LIBRARY: bool = false;
|
||||||
|
static mut NVCUDA_ORIGINAL_MODULE: HMODULE = ptr::null_mut();
|
||||||
|
static mut CUINIT_ORIGINAL_FN: FARPROC = ptr::null_mut();
|
||||||
|
static mut CURRENT_MODULE_FILENAME: Vec<u8> = Vec::new();
|
||||||
|
const CUDA_ERROR_NOT_SUPPORTED: c_uint = 801;
|
||||||
|
const CUDA_ERROR_UNKNOWN: c_uint = 999;
|
||||||
|
|
||||||
static mut LOAD_LIBRARY_A: unsafe extern "system" fn(lpLibFileName: LPCSTR) -> HMODULE =
|
static mut LOAD_LIBRARY_A: unsafe extern "system" fn(lpLibFileName: LPCSTR) -> HMODULE =
|
||||||
LoadLibraryA;
|
LoadLibraryA;
|
||||||
|
@ -40,6 +76,72 @@ static mut LOAD_LIBRARY_EX_A: unsafe extern "system" fn(
|
||||||
dwFlags: DWORD,
|
dwFlags: DWORD,
|
||||||
) -> HMODULE = LoadLibraryExA;
|
) -> HMODULE = LoadLibraryExA;
|
||||||
|
|
||||||
|
static mut CREATE_PROCESS_A: unsafe extern "system" fn(
|
||||||
|
lpApplicationName: LPCSTR,
|
||||||
|
lpCommandLine: LPSTR,
|
||||||
|
lpProcessAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
lpThreadAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
bInheritHandles: BOOL,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOA,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL = CreateProcessA;
|
||||||
|
|
||||||
|
static mut CREATE_PROCESS_W: unsafe extern "system" fn(
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
lpProcessAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
lpThreadAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
bInheritHandles: BOOL,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL = CreateProcessW;
|
||||||
|
|
||||||
|
static mut CREATE_PROCESS_AS_USER_W: unsafe extern "system" fn(
|
||||||
|
hToken: HANDLE,
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
lpProcessAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
lpThreadAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
bInheritHandles: BOOL,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL = CreateProcessAsUserW;
|
||||||
|
|
||||||
|
static mut CREATE_PROCESS_WITH_TOKEN_W: unsafe extern "system" fn(
|
||||||
|
hToken: HANDLE,
|
||||||
|
dwLogonFlags: DWORD,
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL = CreateProcessWithTokenW;
|
||||||
|
|
||||||
|
static mut CREATE_PROCESS_WITH_LOGON_W: unsafe extern "system" fn(
|
||||||
|
lpUsername: LPCWSTR,
|
||||||
|
lpDomain: LPCWSTR,
|
||||||
|
lpPassword: LPCWSTR,
|
||||||
|
dwLogonFlags: DWORD,
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL = CreateProcessWithLogonW;
|
||||||
|
|
||||||
static mut LOAD_LIBRARY_EX_W: unsafe extern "system" fn(
|
static mut LOAD_LIBRARY_EX_W: unsafe extern "system" fn(
|
||||||
lpLibFileName: LPCWSTR,
|
lpLibFileName: LPCWSTR,
|
||||||
hFile: HANDLE,
|
hFile: HANDLE,
|
||||||
|
@ -100,6 +202,293 @@ unsafe extern "system" fn ZludaLoadLibraryExW(
|
||||||
(LOAD_LIBRARY_EX_W)(nvcuda_file_name, hFile, dwFlags)
|
(LOAD_LIBRARY_EX_W)(nvcuda_file_name, hFile, dwFlags)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[allow(non_snake_case)]
|
||||||
|
unsafe extern "system" fn ZludaCreateProcessA(
|
||||||
|
lpApplicationName: LPCSTR,
|
||||||
|
lpCommandLine: LPSTR,
|
||||||
|
lpProcessAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
lpThreadAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
bInheritHandles: BOOL,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOA,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL {
|
||||||
|
let create_proc_result = CREATE_PROCESS_A(
|
||||||
|
lpApplicationName,
|
||||||
|
lpCommandLine,
|
||||||
|
lpProcessAttributes,
|
||||||
|
lpThreadAttributes,
|
||||||
|
bInheritHandles,
|
||||||
|
dwCreationFlags | CREATE_SUSPENDED,
|
||||||
|
lpEnvironment,
|
||||||
|
lpCurrentDirectory,
|
||||||
|
lpStartupInfo,
|
||||||
|
lpProcessInformation,
|
||||||
|
);
|
||||||
|
continue_create_process_hook(create_proc_result, dwCreationFlags, lpProcessInformation)
|
||||||
|
}
|
||||||
|
|
||||||
|
#[allow(non_snake_case)]
|
||||||
|
unsafe extern "system" fn ZludaCreateProcessW(
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
lpProcessAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
lpThreadAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
bInheritHandles: BOOL,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL {
|
||||||
|
let create_proc_result = CREATE_PROCESS_W(
|
||||||
|
lpApplicationName,
|
||||||
|
lpCommandLine,
|
||||||
|
lpProcessAttributes,
|
||||||
|
lpThreadAttributes,
|
||||||
|
bInheritHandles,
|
||||||
|
dwCreationFlags | CREATE_SUSPENDED,
|
||||||
|
lpEnvironment,
|
||||||
|
lpCurrentDirectory,
|
||||||
|
lpStartupInfo,
|
||||||
|
lpProcessInformation,
|
||||||
|
);
|
||||||
|
continue_create_process_hook(create_proc_result, dwCreationFlags, lpProcessInformation)
|
||||||
|
}
|
||||||
|
|
||||||
|
#[allow(non_snake_case)]
|
||||||
|
unsafe extern "system" fn ZludaCreateProcessAsUserW(
|
||||||
|
hToken: HANDLE,
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
lpProcessAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
lpThreadAttributes: LPSECURITY_ATTRIBUTES,
|
||||||
|
bInheritHandles: BOOL,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL {
|
||||||
|
let create_proc_result = CREATE_PROCESS_AS_USER_W(
|
||||||
|
hToken,
|
||||||
|
lpApplicationName,
|
||||||
|
lpCommandLine,
|
||||||
|
lpProcessAttributes,
|
||||||
|
lpThreadAttributes,
|
||||||
|
bInheritHandles,
|
||||||
|
dwCreationFlags | CREATE_SUSPENDED,
|
||||||
|
lpEnvironment,
|
||||||
|
lpCurrentDirectory,
|
||||||
|
lpStartupInfo,
|
||||||
|
lpProcessInformation,
|
||||||
|
);
|
||||||
|
continue_create_process_hook(create_proc_result, dwCreationFlags, lpProcessInformation)
|
||||||
|
}
|
||||||
|
|
||||||
|
#[allow(non_snake_case)]
|
||||||
|
unsafe extern "system" fn ZludaCreateProcessWithLogonW(
|
||||||
|
lpUsername: LPCWSTR,
|
||||||
|
lpDomain: LPCWSTR,
|
||||||
|
lpPassword: LPCWSTR,
|
||||||
|
dwLogonFlags: DWORD,
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL {
|
||||||
|
let create_proc_result = CREATE_PROCESS_WITH_LOGON_W(
|
||||||
|
lpUsername,
|
||||||
|
lpDomain,
|
||||||
|
lpPassword,
|
||||||
|
dwLogonFlags,
|
||||||
|
lpApplicationName,
|
||||||
|
lpCommandLine,
|
||||||
|
dwCreationFlags | CREATE_SUSPENDED,
|
||||||
|
lpEnvironment,
|
||||||
|
lpCurrentDirectory,
|
||||||
|
lpStartupInfo,
|
||||||
|
lpProcessInformation,
|
||||||
|
);
|
||||||
|
continue_create_process_hook(create_proc_result, dwCreationFlags, lpProcessInformation)
|
||||||
|
}
|
||||||
|
|
||||||
|
#[allow(non_snake_case)]
|
||||||
|
unsafe extern "system" fn ZludaCreateProcessWithTokenW(
|
||||||
|
hToken: HANDLE,
|
||||||
|
dwLogonFlags: DWORD,
|
||||||
|
lpApplicationName: LPCWSTR,
|
||||||
|
lpCommandLine: LPWSTR,
|
||||||
|
dwCreationFlags: DWORD,
|
||||||
|
lpEnvironment: LPVOID,
|
||||||
|
lpCurrentDirectory: LPCWSTR,
|
||||||
|
lpStartupInfo: LPSTARTUPINFOW,
|
||||||
|
lpProcessInformation: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL {
|
||||||
|
let create_proc_result = CREATE_PROCESS_WITH_TOKEN_W(
|
||||||
|
hToken,
|
||||||
|
dwLogonFlags,
|
||||||
|
lpApplicationName,
|
||||||
|
lpCommandLine,
|
||||||
|
dwCreationFlags,
|
||||||
|
lpEnvironment,
|
||||||
|
lpCurrentDirectory,
|
||||||
|
lpStartupInfo,
|
||||||
|
lpProcessInformation,
|
||||||
|
);
|
||||||
|
continue_create_process_hook(create_proc_result, dwCreationFlags, lpProcessInformation)
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn continue_create_process_hook(
|
||||||
|
create_proc_result: BOOL,
|
||||||
|
creation_flags: DWORD,
|
||||||
|
process_information: LPPROCESS_INFORMATION,
|
||||||
|
) -> BOOL {
|
||||||
|
if create_proc_result == 0 {
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
if DetourUpdateProcessWithDll(
|
||||||
|
(*process_information).hProcess,
|
||||||
|
&mut CURRENT_MODULE_FILENAME.as_ptr() as *mut _ as *mut _,
|
||||||
|
1,
|
||||||
|
) == 0
|
||||||
|
{
|
||||||
|
TerminateProcess((*process_information).hProcess, 1);
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
if detours_sys::DetourCopyPayloadToProcess(
|
||||||
|
(*process_information).hProcess,
|
||||||
|
&PAYLOAD_GUID,
|
||||||
|
ZLUDA_PATH_UTF16.unwrap().as_ptr() as *mut _,
|
||||||
|
(ZLUDA_PATH_UTF16.unwrap().len() * mem::size_of::<u16>()) as u32,
|
||||||
|
) == FALSE
|
||||||
|
{
|
||||||
|
TerminateProcess((*process_information).hProcess, 1);
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
if creation_flags & CREATE_SUSPENDED == 0 {
|
||||||
|
if ResumeThread((*process_information).hThread) == -1i32 as u32 {
|
||||||
|
TerminateProcess((*process_information).hProcess, 1);
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
create_proc_result
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe extern "C" fn cuinit_detour(flags: c_uint) -> c_uint {
|
||||||
|
let zluda_module = LoadLibraryW(ZLUDA_PATH_UTF16.unwrap().as_ptr());
|
||||||
|
if zluda_module == ptr::null_mut() {
|
||||||
|
return CUDA_ERROR_UNKNOWN;
|
||||||
|
}
|
||||||
|
let suspended_threads = suspend_all_threads_except_current();
|
||||||
|
let suspended_threads = match suspended_threads {
|
||||||
|
Some(t) => t,
|
||||||
|
None => return CUDA_ERROR_UNKNOWN,
|
||||||
|
};
|
||||||
|
if DetourTransactionBegin() != NO_ERROR as i32 {
|
||||||
|
resume_threads(&suspended_threads);
|
||||||
|
return CUDA_ERROR_UNKNOWN;
|
||||||
|
}
|
||||||
|
for t in suspended_threads.iter() {
|
||||||
|
if DetourUpdateThread(*t) != NO_ERROR as i32 {
|
||||||
|
DetourTransactionAbort();
|
||||||
|
resume_threads(&suspended_threads);
|
||||||
|
return CUDA_ERROR_UNKNOWN;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if detours_sys::DetourEnumerateExports(
|
||||||
|
NVCUDA_ORIGINAL_MODULE as *mut _,
|
||||||
|
&zluda_module as *const _ as *mut _,
|
||||||
|
Some(override_nvcuda_export),
|
||||||
|
) == FALSE
|
||||||
|
{
|
||||||
|
DetourTransactionAbort();
|
||||||
|
resume_threads(&suspended_threads);
|
||||||
|
return CUDA_ERROR_UNKNOWN;
|
||||||
|
}
|
||||||
|
if DetourTransactionCommit() != NO_ERROR as i32 {
|
||||||
|
DetourTransactionAbort();
|
||||||
|
resume_threads(&suspended_threads);
|
||||||
|
return CUDA_ERROR_UNKNOWN;
|
||||||
|
}
|
||||||
|
resume_threads(&suspended_threads);
|
||||||
|
let zluda_cuinit = GetProcAddress(zluda_module, b"cuInit\0".as_ptr() as *const _);
|
||||||
|
(mem::transmute::<_, unsafe extern "C" fn(c_uint) -> c_uint>(zluda_cuinit))(flags)
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn suspend_all_threads_except_current() -> Option<Vec<*mut c_void>> {
|
||||||
|
let thread_snap = CreateToolhelp32Snapshot(TH32CS_SNAPTHREAD, 0);
|
||||||
|
if thread_snap == INVALID_HANDLE_VALUE {
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
let current_thread = GetCurrentThreadId();
|
||||||
|
let current_process = GetCurrentProcessId();
|
||||||
|
let mut threads = Vec::new();
|
||||||
|
let mut thread = mem::zeroed::<THREADENTRY32>();
|
||||||
|
thread.dwSize = mem::size_of::<THREADENTRY32>() as u32;
|
||||||
|
if Thread32First(thread_snap, &mut thread) == 0 {
|
||||||
|
CloseHandle(thread_snap);
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
loop {
|
||||||
|
if thread.th32OwnerProcessID == current_process && thread.th32ThreadID != current_thread {
|
||||||
|
let thread_handle = OpenThread(THREAD_SUSPEND_RESUME, 0, thread.th32ThreadID);
|
||||||
|
if thread_handle == ptr::null_mut() {
|
||||||
|
CloseHandle(thread_snap);
|
||||||
|
resume_threads(&threads);
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
if SuspendThread(thread_handle) == (-1i32 as u32) {
|
||||||
|
CloseHandle(thread_snap);
|
||||||
|
resume_threads(&threads);
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
threads.push(thread_handle);
|
||||||
|
}
|
||||||
|
if Thread32Next(thread_snap, &mut thread) == 0 {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
CloseHandle(thread_snap);
|
||||||
|
Some(threads)
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn resume_threads(threads: &[*mut c_void]) {
|
||||||
|
for t in threads {
|
||||||
|
ResumeThread(*t);
|
||||||
|
CloseHandle(*t);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe extern "C" fn override_nvcuda_export(
|
||||||
|
context_ptr: *mut c_void,
|
||||||
|
_: c_ulong,
|
||||||
|
name: LPCSTR,
|
||||||
|
mut address: *mut c_void,
|
||||||
|
) -> c_int {
|
||||||
|
let zluda_module: HMODULE = *(context_ptr as *mut HMODULE);
|
||||||
|
let mut zluda_fn = GetProcAddress(zluda_module, name);
|
||||||
|
if zluda_fn == ptr::null_mut() {
|
||||||
|
// We only support 64 bits and in all relevant calling conventions stack
|
||||||
|
// is caller-cleaned, so probably we will not crash
|
||||||
|
zluda_fn = unsupported_cuda_fn as *mut _;
|
||||||
|
}
|
||||||
|
if DetourAttach((&mut address) as *mut _, zluda_fn as *mut _) != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
TRUE
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe extern "C" fn unsupported_cuda_fn() -> c_uint {
|
||||||
|
CUDA_ERROR_NOT_SUPPORTED
|
||||||
|
}
|
||||||
|
|
||||||
fn is_nvcuda_dll_utf8(lib: *const u8) -> bool {
|
fn is_nvcuda_dll_utf8(lib: *const u8) -> bool {
|
||||||
is_nvcuda_dll(lib, 0, NVCUDA_UTF8.as_bytes(), |c| {
|
is_nvcuda_dll(lib, 0, NVCUDA_UTF8.as_bytes(), |c| {
|
||||||
if c >= 'a' as u8 && c <= 'z' as u8 {
|
if c >= 'a' as u8 && c <= 'z' as u8 {
|
||||||
|
@ -147,94 +536,207 @@ fn is_nvcuda_dll<T: Copy + PartialEq>(
|
||||||
|
|
||||||
#[allow(non_snake_case)]
|
#[allow(non_snake_case)]
|
||||||
#[no_mangle]
|
#[no_mangle]
|
||||||
unsafe extern "system" fn DllMain(_: *const u8, dwReason: u32, _: *const u8) -> i32 {
|
unsafe extern "system" fn DllMain(instDLL: HINSTANCE, dwReason: u32, _: *const u8) -> i32 {
|
||||||
if dwReason == DLL_PROCESS_ATTACH {
|
if dwReason == DLL_PROCESS_ATTACH {
|
||||||
if DetourRestoreAfterWith() == FALSE {
|
if DetourRestoreAfterWith() == FALSE {
|
||||||
return FALSE;
|
return FALSE;
|
||||||
}
|
}
|
||||||
|
if !initialize_current_module_name(instDLL) {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
match get_zluda_dll_path() {
|
match get_zluda_dll_path() {
|
||||||
Some(path) => {
|
Some(path) => {
|
||||||
ZLUDA_PATH_UTF16 = Some(path);
|
ZLUDA_PATH_UTF16 = Some(path);
|
||||||
|
// from_utf16_lossy(...) handles terminating NULL correctly
|
||||||
ZLUDA_PATH_UTF8 = String::from_utf16_lossy(path).into_bytes();
|
ZLUDA_PATH_UTF8 = String::from_utf16_lossy(path).into_bytes();
|
||||||
}
|
}
|
||||||
None => return FALSE,
|
None => return FALSE,
|
||||||
}
|
}
|
||||||
if DetourTransactionBegin() != NO_ERROR as i32 {
|
// If the application (directly or not) links to nvcuda.dll, nvcuda.dll
|
||||||
return FALSE;
|
// will get loaded before we can act. In this case, instead of
|
||||||
}
|
// redirecting LoadLibrary* to load ZLUDA, we redirect cuInit to
|
||||||
if DetourUpdateThread(GetCurrentThread()) != NO_ERROR as i32 {
|
// a cuInit implementation that will load ZLUDA and set up detours.
|
||||||
return FALSE;
|
// We can't do it here because LoadLibrary* inside DllMain is illegal.
|
||||||
}
|
// We greatly prefer wholesale redirecting inside LoadLibrary*.
|
||||||
if DetourAttach(
|
// Hooking inside cuInit is brittle in the face of multiple
|
||||||
mem::transmute(&mut LOAD_LIBRARY_A),
|
// threads (DetourUpdateThread)
|
||||||
ZludaLoadLibraryA as *mut _,
|
match get_cuinit() {
|
||||||
) != NO_ERROR as i32
|
Some((nvcuda_mod, cuinit_fn)) => attach_cuinit(nvcuda_mod, cuinit_fn),
|
||||||
{
|
None => attach_load_libary(),
|
||||||
return FALSE;
|
|
||||||
}
|
|
||||||
if DetourAttach(
|
|
||||||
mem::transmute(&mut LOAD_LIBRARY_W),
|
|
||||||
ZludaLoadLibraryW as *mut _,
|
|
||||||
) != NO_ERROR as i32
|
|
||||||
{
|
|
||||||
return FALSE;
|
|
||||||
}
|
|
||||||
if DetourAttach(
|
|
||||||
mem::transmute(&mut LOAD_LIBRARY_EX_A),
|
|
||||||
ZludaLoadLibraryExA as *mut _,
|
|
||||||
) != NO_ERROR as i32
|
|
||||||
{
|
|
||||||
return FALSE;
|
|
||||||
}
|
|
||||||
if DetourAttach(
|
|
||||||
mem::transmute(&mut LOAD_LIBRARY_EX_W),
|
|
||||||
ZludaLoadLibraryExW as *mut _,
|
|
||||||
) != NO_ERROR as i32
|
|
||||||
{
|
|
||||||
return FALSE;
|
|
||||||
}
|
|
||||||
if DetourTransactionCommit() != NO_ERROR as i32 {
|
|
||||||
return FALSE;
|
|
||||||
}
|
}
|
||||||
} else if dwReason == DLL_PROCESS_DETACH {
|
} else if dwReason == DLL_PROCESS_DETACH {
|
||||||
if DetourTransactionBegin() != NO_ERROR as i32 {
|
if DETACH_LOAD_LIBRARY {
|
||||||
return FALSE;
|
detach_load_library()
|
||||||
|
} else {
|
||||||
|
detach_cuinit()
|
||||||
}
|
}
|
||||||
if DetourUpdateThread(GetCurrentThread()) != NO_ERROR as i32 {
|
} else {
|
||||||
return FALSE;
|
TRUE
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
unsafe fn initialize_current_module_name(current_module: HINSTANCE) -> bool {
|
||||||
|
let mut name = vec![0; 128 as usize];
|
||||||
|
loop {
|
||||||
|
let size = GetModuleFileNameA(
|
||||||
|
current_module,
|
||||||
|
name.as_mut_ptr() as *mut _,
|
||||||
|
name.len() as u32,
|
||||||
|
);
|
||||||
|
if size == 0 {
|
||||||
|
return false;
|
||||||
}
|
}
|
||||||
if DetourDetach(
|
if size < name.len() as u32 {
|
||||||
mem::transmute(&mut LOAD_LIBRARY_A),
|
name.truncate(size as usize);
|
||||||
ZludaLoadLibraryA as *mut _,
|
CURRENT_MODULE_FILENAME = name;
|
||||||
) != NO_ERROR as i32
|
return true;
|
||||||
{
|
|
||||||
return FALSE;
|
|
||||||
}
|
}
|
||||||
if DetourDetach(
|
name.resize(name.len() * 2, 0);
|
||||||
mem::transmute(&mut LOAD_LIBRARY_W),
|
}
|
||||||
ZludaLoadLibraryW as *mut _,
|
}
|
||||||
) != NO_ERROR as i32
|
|
||||||
{
|
unsafe fn get_cuinit() -> Option<(HMODULE, FARPROC)> {
|
||||||
return FALSE;
|
let mut module = ptr::null_mut();
|
||||||
|
loop {
|
||||||
|
module = detours_sys::DetourEnumerateModules(module);
|
||||||
|
if module == ptr::null_mut() {
|
||||||
|
return None;
|
||||||
}
|
}
|
||||||
if DetourDetach(
|
let cuinit_addr = GetProcAddress(module as *mut _, b"cuInit\0".as_ptr() as *const _);
|
||||||
mem::transmute(&mut LOAD_LIBRARY_EX_A),
|
if cuinit_addr != ptr::null_mut() {
|
||||||
ZludaLoadLibraryExA as *mut _,
|
return Some((module as *mut _, cuinit_addr));
|
||||||
) != NO_ERROR as i32
|
|
||||||
{
|
|
||||||
return FALSE;
|
|
||||||
}
|
|
||||||
if DetourDetach(
|
|
||||||
mem::transmute(&mut LOAD_LIBRARY_EX_W),
|
|
||||||
ZludaLoadLibraryExW as *mut _,
|
|
||||||
) != NO_ERROR as i32
|
|
||||||
{
|
|
||||||
return FALSE;
|
|
||||||
}
|
|
||||||
if DetourTransactionCommit() != NO_ERROR as i32 {
|
|
||||||
return FALSE;
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
unsafe fn attach_cuinit(nvcuda_mod: HMODULE, mut cuinit: FARPROC) -> i32 {
|
||||||
|
if DetourTransactionBegin() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if !attach_create_process() {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
NVCUDA_ORIGINAL_MODULE = nvcuda_mod;
|
||||||
|
CUINIT_ORIGINAL_FN = cuinit;
|
||||||
|
if DetourAttach(mem::transmute(&mut cuinit), cuinit_detour as *mut _) != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourTransactionCommit() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
TRUE
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
unsafe fn detach_cuinit() -> i32 {
|
||||||
|
if DetourTransactionBegin() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if !detach_create_process() {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourUpdateThread(GetCurrentThread()) != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut CUINIT_ORIGINAL_FN),
|
||||||
|
cuinit_detour as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourTransactionCommit() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
TRUE
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
unsafe fn attach_load_libary() -> i32 {
|
||||||
|
if DetourTransactionBegin() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if !attach_create_process() {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_A),
|
||||||
|
ZludaLoadLibraryA as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_W),
|
||||||
|
ZludaLoadLibraryW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_EX_A),
|
||||||
|
ZludaLoadLibraryExA as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_EX_W),
|
||||||
|
ZludaLoadLibraryExW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourTransactionCommit() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
TRUE
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
unsafe fn detach_load_library() -> i32 {
|
||||||
|
if DetourTransactionBegin() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if !detach_create_process() {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourUpdateThread(GetCurrentThread()) != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_A),
|
||||||
|
ZludaLoadLibraryA as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_W),
|
||||||
|
ZludaLoadLibraryW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_EX_A),
|
||||||
|
ZludaLoadLibraryExA as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut LOAD_LIBRARY_EX_W),
|
||||||
|
ZludaLoadLibraryExW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
|
if DetourTransactionCommit() != NO_ERROR as i32 {
|
||||||
|
return FALSE;
|
||||||
|
}
|
||||||
TRUE
|
TRUE
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -258,3 +760,83 @@ fn get_zluda_dll_path() -> Option<&'static [u16]> {
|
||||||
}
|
}
|
||||||
None
|
None
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
unsafe fn attach_create_process() -> bool {
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_A),
|
||||||
|
ZludaCreateProcessA as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_W),
|
||||||
|
ZludaCreateProcessW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_AS_USER_W),
|
||||||
|
ZludaCreateProcessAsUserW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_WITH_LOGON_W),
|
||||||
|
ZludaCreateProcessWithLogonW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourAttach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_WITH_TOKEN_W),
|
||||||
|
ZludaCreateProcessWithTokenW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
true
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
unsafe fn detach_create_process() -> bool {
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_A),
|
||||||
|
ZludaCreateProcessA as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_W),
|
||||||
|
ZludaCreateProcessW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_AS_USER_W),
|
||||||
|
ZludaCreateProcessAsUserW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_WITH_LOGON_W),
|
||||||
|
ZludaCreateProcessWithLogonW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if DetourDetach(
|
||||||
|
mem::transmute(&mut CREATE_PROCESS_WITH_TOKEN_W),
|
||||||
|
ZludaCreateProcessWithTokenW as *mut _,
|
||||||
|
) != NO_ERROR as i32
|
||||||
|
{
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
true
|
||||||
|
}
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue