Spaces:

rishabh062
/

donutCordImgToCsv

Runtime error

App Files Files Community

rishabh062 committed on Apr 1, 2023

Commit

97f9f1f

•

1 Parent(s): 6fc74ef

Removed image name error

Browse files

Files changed (1) hide show

app.py +18 -16

app.py CHANGED Viewed

@@ -1,6 +1,5 @@
 import gradio as gr
 import csv
-import json
 import re
 import torch
@@ -38,35 +37,38 @@ def process_document(image):
     sequence = processor.batch_decode(outputs.sequences)[0]
     sequence = sequence.replace(processor.tokenizer.eos_token, "").replace(processor.tokenizer.pad_token, "")
     sequence = re.sub(r"<.*?>", "", sequence, count=1).strip()  # remove first task start token
     with open('output.csv', 'a', newline='') as file:
         writer = csv.writer(file)
-        writer.writerow([image_filename, sequence])
-    return {"json": processor.token2json(sequence)}
-def download_csv(output_csv):
-    with open(output_csv) as f:
-        response = f.read()
-    return response, {"Content-Type": "text/csv"}
 description = "To use it, simply upload your image and click 'submit', or click one of the examples to load them. Read more at the links below."
 article = "<p style='text-align: center'><a href='https://arxiv.org/abs/2111.15664' target='_blank'>Donut: OCR-free Document Understanding Transformer</a> | <a href='https://github.com/clovaai/donut' target='_blank'>Github Repo</a></p>"
-output_csv = "output.csv"
-demo = gr.Interface(
-    fn=process_document,
-    inputs="image",
-    outputs="json",
     title="Donut 🍩 for Document Parsing and Converting the Image to Database",
     description=description,
     article=article,
     enable_queue=True,
-    examples=[["example.png"], ["example_2.png"], ["example_3.png"]],
     cache_examples=False,
     allow_download=True,
-    download_name="output.csv",
-    download=download_csv
 )
-demo.launch()

 import gradio as gr
 import csv
 import re
 import torch
     sequence = processor.batch_decode(outputs.sequences)[0]
     sequence = sequence.replace(processor.tokenizer.eos_token, "").replace(processor.tokenizer.pad_token, "")
     sequence = re.sub(r"<.*?>", "", sequence, count=1).strip()  # remove first task start token
     with open('output.csv', 'a', newline='') as file:
         writer = csv.writer(file)
+        writer.writerow(["image", sequence])
+    return processor.token2json(sequence)
+def download_csv():
+    return "output.csv"
 description = "To use it, simply upload your image and click 'submit', or click one of the examples to load them. Read more at the links below."
 article = "<p style='text-align: center'><a href='https://arxiv.org/abs/2111.15664' target='_blank'>Donut: OCR-free Document Understanding Transformer</a> | <a href='https://github.com/clovaai/donut' target='_blank'>Github Repo</a></p>"
+inputs = gr.inputs.Image()
+outputs = gr.outputs.Json()
+examples = [["example.png"], ["example_2.png"], ["example_3.png"]]
+download_button = gr.outputs.Button("Download CSV")
+interface = gr.Interface(
+    process_document,
+    inputs=inputs,
+    outputs=outputs,
     title="Donut 🍩 for Document Parsing and Converting the Image to Database",
     description=description,
     article=article,
+    examples=examples,
     enable_queue=True,
     cache_examples=False,
     allow_download=True,
+    download_button=download_button
 )
+interface.launch()