arjunanand13 committed on
Commit
f805e1b
1 Parent(s): 36aa4cf

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -19,8 +19,8 @@ data = dataset["train"]
19
  data = data.add_faiss_index("embeddings") # column name that has the embeddings of the dataset
20
 
21
 
22
- model_id = "meta-llama/Meta-Llama-3-8B-Instruct"
23
-
24
  # use quantization to lower GPU usage
25
  bnb_config = BitsAndBytesConfig(
26
  load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.bfloat16
 
19
  data = data.add_faiss_index("embeddings") # column name that has the embeddings of the dataset
20
 
21
 
22
+ # model_id = "meta-llama/Meta-Llama-3-8B-Instruct"
23
+ model_id="unsloth/llama-3-8b-bnb-4bit"
24
  # use quantization to lower GPU usage
25
  bnb_config = BitsAndBytesConfig(
26
  load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.bfloat16