diff --git a/LLama.Benchmark/LLamaExecutorBenchmark/Prefill.cs b/LLama.Benchmark/LLamaExecutorBenchmark/Prefill.cs index 7f3c251bb..0abe80775 100644 --- a/LLama.Benchmark/LLamaExecutorBenchmark/Prefill.cs +++ b/LLama.Benchmark/LLamaExecutorBenchmark/Prefill.cs @@ -38,9 +38,9 @@ public class PrefillBenchmark public IEnumerable<(string, int)> ModelAndGpuLayerCounts => new (string, int)[] // TODO: specify the native library to load here to test cpu case better. { - (Path.Combine(Constants.ModelDir, Constants.Generative7BModelPath), 0), - (Path.Combine(Constants.ModelDir, Constants.Generative7BModelPath), 10), - (Path.Combine(Constants.ModelDir, Constants.Generative7BModelPath), 20) + ("/llamasharp_ci/models_benchmark/llama-2-7b-chat.Q3_K_S.gguf", 0), + ("/llamasharp_ci/models_benchmark/llama-2-7b-chat.Q3_K_S.gguf", 10), + ("/llamasharp_ci/models_benchmark/llama-2-7b-chat.Q3_K_S.gguf", 20) }; public IEnumerable ExecutorTypes => new ExecutorType[]