Update app.py
app.py CHANGED

@@ -8,7 +8,7 @@ from llama_cpp import Llama
 
 # Set the model repo + filename (change filename if needed)
 MODEL_REPO = "mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated-GGUF"
-MODEL_FILE = "
+MODEL_FILE = "meta-llama-3.1-8b-instruct-abliterated.Q4_K_M.gguf"
 
 print("Downloading model from HF Hub...")
 model_path = hf_hub_download(
@@ -23,7 +23,7 @@ print(f"Model downloaded to: {model_path}")
 
 llm = Llama(
     model_path=model_path,
-    n_gpu_layers
+    n_gpu_layers=0,  # 0 = CPU only; set -1 to offload all layers when a GPU is available
     n_ctx=4096,
     chat_format="llama-3",
 )
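For context, here is a minimal runnable sketch of the flow this diff configures: download the GGUF file from the Hub, then load it with llama-cpp-python. The constants and the Llama(...) arguments are taken from the diff; the hf_hub_download keyword arguments and the closing chat-completion call are assumptions added for illustration, not part of the commit.

# Sketch of app.py's model setup, assuming the pieces shown in the diff.
from huggingface_hub import hf_hub_download
from llama_cpp import Llama

MODEL_REPO = "mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated-GGUF"
MODEL_FILE = "meta-llama-3.1-8b-instruct-abliterated.Q4_K_M.gguf"

print("Downloading model from HF Hub...")
# Fetches the single GGUF file from the repo and returns its local cache path.
model_path = hf_hub_download(repo_id=MODEL_REPO, filename=MODEL_FILE)
print(f"Model downloaded to: {model_path}")

llm = Llama(
    model_path=model_path,
    n_gpu_layers=0,        # 0 keeps inference on the CPU; -1 offloads every layer
    n_ctx=4096,            # context window in tokens
    chat_format="llama-3", # applies the Llama 3 chat template to messages
)

# Assumed usage: llama-cpp-python exposes an OpenAI-style chat API.
response = llm.create_chat_completion(
    messages=[{"role": "user", "content": "Hello!"}],
    max_tokens=128,
)
print(response["choices"][0]["message"]["content"])

Pinning n_gpu_layers=0 makes sense for a CPU-only Space; raising it (or using -1) only helps when llama-cpp-python was built with GPU support, in which case offloaded layers run on the accelerator instead of the CPU.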