KingNish committed on
Commit: f3cfba4
1 Parent(s): faa634d

Update chatbot.py

Files changed (1):
  chatbot.py (+13, -12)
chatbot.py CHANGED
@@ -315,7 +315,7 @@ def model_inference(
     temperature,
     max_new_tokens,
     repetition_penalty,
-    top_p,
+    min_p,
     web_search,
 ):
     # Define generation_args at the beginning of the function
@@ -332,6 +332,7 @@ def model_inference(
         generate_kwargs = dict(
             max_new_tokens=4000,
             do_sample=True,
+            min_p=0.08,
         )
         # Format the prompt for the language model
         formatted_prompt = format_prompt(
@@ -351,6 +352,7 @@ def model_inference(
         generate_kwargs = dict(
             max_new_tokens=5000,
             do_sample=True,
+            min_p=0.08,
        )
         # Format the prompt for the language model
         formatted_prompt = format_prompt(
@@ -389,16 +391,15 @@ def model_inference(
     }
     assert decoding_strategy in [
         "Greedy",
-        "Top P Sampling",
+        "Min P Sampling",
     ]
 
     if decoding_strategy == "Greedy":
         generation_args["do_sample"] = False
-    elif decoding_strategy == "Top P Sampling":
+    elif decoding_strategy == "Min P Sampling":
         generation_args["temperature"] = temperature
         generation_args["do_sample"] = True
-        generation_args["top_p"] = top_p
-    # Creating model inputs
+        generation_args["min_p"] = min_p
     (
         resulting_text,
         resulting_images,
@@ -440,7 +441,7 @@ FEATURES = datasets.Features(
         "temperature": datasets.Value("float32"),
         "max_new_tokens": datasets.Value("int32"),
         "repetition_penalty": datasets.Value("float32"),
-        "top_p": datasets.Value("int32"),
+        "min_p": datasets.Value("int32"),
     }
 )
 
@@ -465,9 +466,9 @@ repetition_penalty = gr.Slider(
 decoding_strategy = gr.Radio(
     [
         "Greedy",
-        "Top P Sampling",
+        "Min P Sampling",
     ],
-    value="Top P Sampling",
+    value="Min P Sampling",
     label="Decoding strategy",
     interactive=True,
     info="Higher values are equivalent to sampling more low-probability tokens.",
@@ -482,14 +483,14 @@ temperature = gr.Slider(
     label="Sampling temperature",
     info="Higher values will produce more diverse outputs.",
 )
-top_p = gr.Slider(
+min_p = gr.Slider(
     minimum=0.01,
-    maximum=0.99,
-    value=0.9,
+    maximum=0.49,
+    value=0.08,
     step=0.01,
     visible=True,
     interactive=True,
-    label="Top P",
+    label="Min P",
     info="Higher values are equivalent to sampling more low-probability tokens.",
 )
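
For context on the change (an editorial sketch, not part of the commit): min-p sampling keeps only those tokens whose probability is at least min_p times the probability of the most likely token, so the cutoff tightens when the model is confident and loosens when it is not. The snippet below is a minimal PyTorch illustration of that filtering step over a hypothetical 32k-token vocabulary; chatbot.py does not contain this code, it simply passes min_p=0.08 through generate_kwargs and generation_args to the text-generation backend.

    import torch

    def min_p_filter(logits: torch.Tensor, min_p: float = 0.08) -> torch.Tensor:
        # Keep tokens whose probability is >= min_p * p(top token); mask the rest.
        probs = torch.softmax(logits, dim=-1)
        top_prob = probs.max(dim=-1, keepdim=True).values
        mask = probs < (min_p * top_prob)
        return logits.masked_fill(mask, float("-inf"))

    # Example: draw one token from the filtered distribution.
    logits = torch.randn(1, 32000)  # hypothetical vocabulary size
    probs = torch.softmax(min_p_filter(logits), dim=-1)
    next_token = torch.multinomial(probs, num_samples=1)

Whether the new generate_kwargs entries actually take effect still depends on the serving backend accepting a min_p parameter; recent transformers releases expose an equivalent min_p argument on generate().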