Update app.py
Browse files
app.py
CHANGED
|
@@ -6,10 +6,10 @@ from llama_cpp import Llama
|
|
| 6 |
HF_TOKEN = os.environ.get("scalable")
|
| 7 |
|
| 8 |
# 🧠 Your GGUF repo on Hugging Face
|
| 9 |
-
MODEL_ID = "FatimaZh/llama-3.2-1b-merged-code-gguf"
|
| 10 |
|
| 11 |
# ❗ Replace this with the EXACT gguf filename in that repo
|
| 12 |
-
GGUF_FILENAME = "
|
| 13 |
|
| 14 |
# 🧠 Load the GGUF model via llama-cpp
|
| 15 |
llm = Llama.from_pretrained(
|
|
|
|
| 6 |
HF_TOKEN = os.environ.get("scalable")
|
| 7 |
|
| 8 |
# 🧠 Your GGUF repo on Hugging Face
|
| 9 |
+
MODEL_ID = "FatimaZh/llama-3.2-1b-merged-code-gguf-v2"
|
| 10 |
|
| 11 |
# ❗ Replace this with the EXACT gguf filename in that repo
|
| 12 |
+
GGUF_FILENAME = "merged_fp16_code_v2.gguf" # <-- CHANGE ME
|
| 13 |
|
| 14 |
# 🧠 Load the GGUF model via llama-cpp
|
| 15 |
llm = Llama.from_pretrained(
|