ehristoforu committed on
Commit
70b5193
‒
1 Parent(s): c528c03

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -33,7 +33,7 @@ tokenizer = GemmaTokenizerFast.from_pretrained(model_id)
33
  model = AutoModelForCausalLM.from_pretrained(
34
  model_id,
35
  device_map="auto",
36
- #quantization_config=BitsAndBytesConfig(load_in_8bit=True),
37
  )
38
  model.config.sliding_window = 4096
39
  model.eval()
 
33
  model = AutoModelForCausalLM.from_pretrained(
34
  model_id,
35
  device_map="auto",
36
+ quantization_config=BitsAndBytesConfig(load_in_4bit=True),
37
  )
38
  model.config.sliding_window = 4096
39
  model.eval()