Spaces:

John6666
/

text2tag-llm

Running on Zero

John6666 committed on Aug 22

Commit

3c9dc34

•

1 Parent(s): 8b1b5ef

Upload llmdolphin.py

Files changed (1) hide show

llmdolphin.py CHANGED Viewed

@@ -692,7 +692,7 @@ def dolphin_respond(
     llm = Llama(
         model_path=str(Path(f"{llm_models_dir}/{model}")),
         flash_attn=True,
-        n_gpu_layers=35, # 81
         n_batch=1024,
         n_ctx=4096, #8192
         n_threads=8,
@@ -787,7 +787,7 @@ def dolphin_respond_auto(
     llm = Llama(
         model_path=str(Path(f"{llm_models_dir}/{model}")),
         flash_attn=True,
-        n_gpu_layers=35, # 81
         n_batch=1024,
         n_ctx=4096, #8192
         n_threads=8,

     llm = Llama(
         model_path=str(Path(f"{llm_models_dir}/{model}")),
         flash_attn=True,
+        n_gpu_layers=40, # 81
         n_batch=1024,
         n_ctx=4096, #8192
         n_threads=8,
     llm = Llama(
         model_path=str(Path(f"{llm_models_dir}/{model}")),
         flash_attn=True,
+        n_gpu_layers=40, # 81
         n_batch=1024,
         n_ctx=4096, #8192
         n_threads=8,