Spaces:

jordigonzm
/

Phi-3-mini-128k-instruct

Runtime error

jordigonzm committed on Apr 25

Commit

896b82a

•

1 Parent(s): f455b1e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -12,14 +12,14 @@ def get_device():
 model_name = "microsoft/Phi-3-mini-128k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
-model = AutoModelForCausalLM.from_pretrained(model_name, trust_remote_code=True)
 # Obtener el dispositivo adecuado según la disponibilidad de GPU
 device = get_device()
 model.to(device)
-model = torch.quantization.quantize_dynamic(
-    model, {torch.nn.Linear}, dtype=torch.qint8
-)
 pipeline = transformers.pipeline(
     "text-generation",

 model_name = "microsoft/Phi-3-mini-128k-instruct"
 tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
+model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.bfloat16, trust_remote_code=True)
 # Obtener el dispositivo adecuado según la disponibilidad de GPU
 device = get_device()
 model.to(device)
+#model = torch.quantization.quantize_dynamic(
+#    model, {torch.nn.Linear}, dtype=torch.qint8
+#)
 pipeline = transformers.pipeline(
     "text-generation",