Detsutut committed on
Commit
7a4dff7
1 Parent(s): 82aa38e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -5
app.py CHANGED
@@ -8,8 +8,7 @@ model_id = "Detsutut/Igea-350M-v0.0.1"
8
  pipeline = transformers.pipeline(
9
  "text-generation",
10
  model=model_id,
11
- model_kwargs={"torch_dtype": torch.bfloat16},
12
- device_map="auto",
13
  )
14
 
15
  # Define the function to generate text
@@ -55,8 +54,8 @@ top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.95, step=0.01, label="Top-p"
55
  split_output = gr.Checkbox(label="Quick single-sentence output", value=True)
56
 
57
  with gr.Blocks() as iface:
58
- gr.Markdown("# Igea Text Generation Interface")
59
- gr.Markdown("Enter a prompt to generate text using the **Igea-350M** model and adjust the hyperparameters.")
60
  input_text.render()
61
  with gr.Accordion("Advanced Options", open=False):
62
  max_new_tokens.render()
@@ -73,4 +72,4 @@ with gr.Blocks() as iface:
73
 
74
  # Launch the interface
75
  if __name__ == "__main__":
76
- iface.launch()
 
8
  pipeline = transformers.pipeline(
9
  "text-generation",
10
  model=model_id,
11
+ model_kwargs={"torch_dtype": torch.bfloat16}
 
12
  )
13
 
14
  # Define the function to generate text
 
54
  split_output = gr.Checkbox(label="Quick single-sentence output", value=True)
55
 
56
  with gr.Blocks() as iface:
57
+ gr.Markdown("# Igea 350M Text Generation Interface")
58
+ gr.Markdown("⚠️ 🐢💬 This model runs on a hardware-limited, free-tier HuggingFace space, resulting in a low output token throughput (approx. 1 token/s)")
59
  input_text.render()
60
  with gr.Accordion("Advanced Options", open=False):
61
  max_new_tokens.render()
 
72
 
73
  # Launch the interface
74
  if __name__ == "__main__":
75
+ iface.launch()