HylandDocumentVisualQA

Runtime error

File size: 1,997 Bytes

c4ea48a
0489f49
 
 
 
 
c4ea48a
 
cc74800
 
0489f49
 
 
 
c4ea48a
0489f49
 
 
 
 
 
 
c4ea48a
0489f49
 
c4ea48a
0489f49
05ef389
725eef9
53e95b0
c4ea48a
0489f49
 
 
c4ea48a
 
 
06b0d16
bd78f47
7273548
c4ea48a
 
 
 
 
06b0d16

import gradio as gr
import base64
import io
import requests
import json
from PIL import Image


def analyze_image(image, question):

    #img64 = base64.b64decode(image)
    im = Image.fromarray(image)
    in_mem_file = io.BytesIO()
    im.save(in_mem_file, format="png")

    payload = {
        "model":"Baseline",
        "tasktype":"Extraction",
        "questions":[{"Pages":[1],"Text":question}],
        "image": base64.b64encode(in_mem_file.getvalue()).decode()
    } 
    url = "https://ky8mfb27dj.execute-api.us-east-1.amazonaws.com/dev/analyzedocument/submit"

    payload = json.dumps(payload)
    headers = {'Content-Type': 'application/json'}

    response = requests.request("POST", url, headers=headers, data=payload)

    jsonresponse = json.loads(response.text)
    return "Answer: {0} \nConfidence: {1}".format(jsonresponse['body'][0]['result'][0]['answer'][0], jsonresponse['body'][0]['result'][0]['score'])
    
description = "Hyland Demo for Document Question & Answering , fine-tuned on DocVQA (document visual question answering). To use it, simply upload your image and type a question and click 'submit', or click one of the examples to load them. Read more at the links below."
title = "DocVQA"
article = "<p style='text-align: center'><a href='https://www.docvqa.org/datasets/docvqa' target='_blank'>DocVQA: Challenge | <a href='https://rrc.cvc.uab.es/?ch=17' target='_blank'>Overview - Document Visual Question Answering</a></p>"
examples =[['publaynet_example.jpeg']]
css = ".output-image, .input-image, .image-preview {height: 600px !important}"

demo = gr.Interface(fn=analyze_image, 
                     inputs=[gr.inputs.Image(type="pil", label="Document image"),"text"], 
                     outputs=gr.outputs.Textbox(type="auto", label="Answer"),
                     title=title,
                     description=description,
                     article=article,
                     css=css,
                     enable_queue=True)
demo.launch(debug=True)