From a98e37ca12fc59bccb782ae3866d68d21407a15b Mon Sep 17 00:00:00 2001 From: Pedro Valente Date: Tue, 20 Feb 2024 18:02:47 +0000 Subject: [PATCH] Cap n_gpu_layers at i32::MAX to avoid integer overflow --- crates/edgen_rt_llama_cpp/src/lib.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crates/edgen_rt_llama_cpp/src/lib.rs b/crates/edgen_rt_llama_cpp/src/lib.rs index 0a56edd..c09edd3 100644 --- a/crates/edgen_rt_llama_cpp/src/lib.rs +++ b/crates/edgen_rt_llama_cpp/src/lib.rs @@ -301,7 +301,7 @@ async fn get_or_init_model( args.n_gpu_layers = 0; } DevicePolicy::AlwaysDevice { .. } => { - args.n_gpu_layers = u32::MAX; + args.n_gpu_layers = i32::MAX as u32; } _ => { unimplemented!()