AnishHF committed on
Commit
db46f1f
1 Parent(s): 4eef962

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -2,11 +2,13 @@ import os
2
  import bitsandbytes as bnb
3
  import torch
4
  import gradio as gr
5
- from transformers import AutoTokenizer, AutoModelForCausalLM, HqqConfig
6
 
7
  access_token = os.environ["GATED_ACCESS_TOKEN"]
8
 
9
- quantization_config = HqqConfig()
 
 
10
 
11
  model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-7B-v0.1", quantization_config=quantization_config, device_map="auto", token=access_token)
12
  tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-v0.1")
 
2
  import bitsandbytes as bnb
3
  import torch
4
  import gradio as gr
5
+ from transformers import AutoTokenizer, AutoModelForCausalLM, QuantoConfig
6
 
7
  access_token = os.environ["GATED_ACCESS_TOKEN"]
8
 
9
+ quantization_config = QuantoConfig(
10
+ weights = "int4"
11
+ )
12
 
13
  model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-7B-v0.1", quantization_config=quantization_config, device_map="auto", token=access_token)
14
  tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-v0.1")