Spaces:

raahinaez
/

doc

Runtime error

App Files Files Community

raahinaez committed 8 days ago

Commit

ced4216

verified ·

1 Parent(s): 3d7667b

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -3

app.py CHANGED Viewed

@@ -2,30 +2,54 @@ import os
 import gradio as gr
 from docling.document_converter import DocumentConverter, PdfFormatOption
 from docling.datamodel.base_models import InputFormat
 import tempfile
 def pdf_to_markdown(file):
     """Convert an uploaded PDF to Markdown using Docling.

     Args:
         file: The value received from the ``gr.File`` input. Either a path
             string or an object whose ``.name`` attribute holds the path of
             the uploaded file. ``None`` means no file was provided.

     Returns:
         The converted document as a Markdown string, or an empty string
         when no file was provided.
     """
     # Submitting without a file passes None; return an empty result instead
     # of failing with AttributeError on ``file.name``.
     if file is None:
         return ""
     # Nothing is written to disk here: only the upload's path is read.
     # Accept a plain path string as well as an object exposing ``.name``.
     pdf_path = getattr(file, "name", file)
     # PdfFormatOption() is built with no arguments, so no pipeline or model
     # is selected explicitly in this function.
     converter = DocumentConverter(
         format_options={InputFormat.PDF: PdfFormatOption()},
     )
     document = converter.convert(pdf_path).document
     # Only the Markdown export is returned to the caller.
     return document.export_to_markdown()
 # Build the UI: one PDF upload input routed to pdf_to_markdown, shown as plain text.
 interface = gr.Interface(
     fn=pdf_to_markdown,
     inputs=gr.File(file_types=[".pdf"]),
-    outputs="text",
-    title="PDF → Markdown/JSON with Granite Docling",
-    description="Upload a PDF and get parsed Markdown (or JSON) using Granite Docling via Docling."
 )
 # Launch only when this file is executed as a script, not when it is imported.
 if __name__ == "__main__":
     interface.launch()

 import gradio as gr
 from docling.document_converter import DocumentConverter, PdfFormatOption
 from docling.datamodel.base_models import InputFormat
+from transformers import AutoModelForSequenceClassification, AutoTokenizer
 import tempfile
+# Model identifier handed to from_pretrained below (looks like a Hub repo id rather than a filesystem path)
+model_name = "ibm-granite/granite-docling-258M"
+# Load the model and tokenizer once at import time, before the UI is built.
+# NOTE(review): neither object is referenced by pdf_to_markdown, and a sequence-classification head looks wrong for a document-conversion checkpoint — confirm this load is needed and uses the right Auto class.
+ocr_model = AutoModelForSequenceClassification.from_pretrained(model_name)
+ocr_tokenizer = AutoTokenizer.from_pretrained(model_name)
 def pdf_to_markdown(file):
     """Convert an uploaded PDF to Markdown using Docling.

     The conversion is performed entirely by ``DocumentConverter.convert``;
     this function does not invoke the module-level ``ocr_model`` or
     ``ocr_tokenizer`` objects.

     Args:
         file: The value received from the ``gr.File`` input. Either a path
             string or an object whose ``.name`` attribute holds the path of
             the uploaded file. ``None`` means no file was provided.

     Returns:
         The converted document as a Markdown string, or an empty string
         when no file was provided.
     """
     # Guard the "submit with no upload" case, which would otherwise raise
     # AttributeError when reading ``file.name``.
     if file is None:
         return ""
     # The upload is not copied or re-saved here; only its path is used.
     # A plain path string has no ``.name``, so fall back to the value itself.
     source_path = getattr(file, "name", file)
     # PdfFormatOption() takes no arguments here, so no specific pipeline or
     # model is selected by this function.
     converter = DocumentConverter(
         format_options={InputFormat.PDF: PdfFormatOption()},
     )
     conversion = converter.convert(source_path)
     # Only the Markdown export is returned to the caller.
     return conversion.document.export_to_markdown()
+# Output component: a labelled multi-line textbox that receives the returned Markdown
+output_box = gr.Textbox(
+    label="Markdown Output",
+    lines=20,       # initial visible lines
+    max_lines=50,   # maximum scrollable lines
+    placeholder="Converted Markdown will appear here..."
+)
+# Wire a single PDF upload input to pdf_to_markdown and display the result in output_box
 interface = gr.Interface(
     fn=pdf_to_markdown,
     inputs=gr.File(file_types=[".pdf"]),
+    outputs=output_box,
+    title="PDF → Markdown/JSON with Granite Docling (OCR)",
+    description="Upload a PDF (including scanned PDFs) and get parsed Markdown (or JSON) using Granite Docling via Docling, with OCR support."
 )
+# Start the app only when this file is run as a script, not when it is imported
 if __name__ == "__main__":
     interface.launch()