From 932faab35b01aa2fa9319244dd212b3bc238f88b Mon Sep 17 00:00:00 2001 From: Tristan Druyen Date: Wed, 27 Nov 2024 10:18:54 +0100 Subject: [PATCH] Make nemotron run with desktop env --- llama_proxy_man/config.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/llama_proxy_man/config.yaml b/llama_proxy_man/config.yaml index eb637cc..25fb678 100644 --- a/llama_proxy_man/config.yaml +++ b/llama_proxy_man/config.yaml @@ -60,7 +60,7 @@ models: CUDA_VISIBLE_DEVICES: 0 HSA_OVERRIDE_GFX_VERSION: '11.0.0' args: - ctx-size: 16384 + ctx-size: 8192 flash-attn: true cache-type-k: q8_0 cache-type-v: q8_0