Spaces:

neuralspace
/

wer_calculator

Sleeping

App Files Files Community

dalmeow commited on Sep 25, 2023

Commit

b5ddedb

•

1 Parent(s): d9bd25a

added file upload feature

Browse files

Files changed (2) hide show

app.py +43 -12
trial.csv +2 -0

app.py CHANGED Viewed

@@ -8,42 +8,73 @@ REGEX_YAML_BLOCK = re.compile(r"---[\n\r]+([\S\s]*?)[\n\r]+---[\n\r]")
 def parse_readme(filepath):
-    """Parses a repositories README and removes"""
     if not os.path.exists(filepath):
         return "No README.md found."
     with open(filepath, "r") as f:
         text = f.read()
         match = REGEX_YAML_BLOCK.search(text)
         if match:
-            text = text[match.end() :]
     return text
-def compute(input):
-    preds = input['prediction'].tolist()
-    truths = input['truth'].tolist()
     print(truths, preds, type(truths))
     err = wer(truths, preds)
-    print(err)
     return err
 description = """
 To calculate WER:
 * Type the `prediction` and the `truth` in the respective columns in the below calculator.
 * You can insert multiple predictions and truths by clicking on the `New row` button.
 * To calculate the WER after inserting all the texts, click on `Submit`.
 """
 demo = gr.Interface(
         fn=compute,
-        inputs=gr.components.Dataframe(
-            headers=["prediction", "truth"],
-            col_count=2,
-            row_count=1,
-            label="Input"
-        ),
         outputs=gr.components.Textbox(label="WER"),
         description=description,
         title="WER Calculator",

 def parse_readme(filepath):
     if not os.path.exists(filepath):
         return "No README.md found."
     with open(filepath, "r") as f:
         text = f.read()
         match = REGEX_YAML_BLOCK.search(text)
         if match:
+            text = text[match.end():]
     return text
+def get_wer(df: pd.DataFrame):
+    print(df.keys())
+    preds = df.iloc[:, 0].tolist()
+    truths = df.iloc[:, 1].tolist()
     print(truths, preds, type(truths))
     err = wer(truths, preds)
     return err
+def compute(input_df: pd.DataFrame = None, input_file: str = None):
+    if input_df is not None and not input_df.empty and input_file is None:
+        print("in df")
+        if not (input_df.values == "").any():
+            print("in df but empty string")
+            return get_wer(input_df)
+    elif input_file and (input_df.values == "").any():
+        print("in file")
+        file_df = pd.read_csv(input_file.name)
+        print(file_df)
+        return get_wer(file_df)
+    else:
+        print("in error")
+        raise ValueError("Please don't provide both DataFrame and file.")
 description = """
 To calculate WER:
 * Type the `prediction` and the `truth` in the respective columns in the below calculator.
 * You can insert multiple predictions and truths by clicking on the `New row` button.
 * To calculate the WER after inserting all the texts, click on `Submit`.
+OR
+* Upload a CSV file with the columns being `prediction` and `truth`.
+* The first row of the file is supposed to have the column names.
+* The sentences should be enclosed within `""` and the prediction and truth need to be separated by `,`.
+* Find an example file [here](trial.csv).
+NOTE: Pleasd don't use both the methods at once.
 """
 demo = gr.Interface(
         fn=compute,
+        inputs=[
+            gr.components.Dataframe(
+                headers=["prediction", "truth"],
+                col_count=2,
+                row_count=1,
+                label="Input"
+            ),
+            gr.File(
+                file_count='single',
+                file_types=['.csv'],
+                label="CSV File"
+            )
+        ],
         outputs=gr.components.Textbox(label="WER"),
         description=description,
         title="WER Calculator",

trial.csv ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ prediction,truth
2	+ "hi this is a trial","hi thissss is a, trial"