Spaces:

deepsh2207
/

TextExtractor

Sleeping

App Files Community

deepsh2207 committed on Mar 4, 2024

Commit

d812fea

1 Parent(s): cdd9cb4

Updates in readme, parameters

Browse files

Files changed (3) hide show

README.md +1 -1
app.py +23 -15
backend/pytorch.py +16 -16

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-title: docTR
 emoji: 📑
 colorFrom: purple
 colorTo: pink

 ---
+title: Text Extractor
 emoji: 📑
 colorFrom: purple
 colorTo: pink

app.py CHANGED Viewed

@@ -1,5 +1,5 @@
-import cv2
-import matplotlib.pyplot as plt
 import numpy as np
 import streamlit as st
 import torch
@@ -7,7 +7,7 @@ import torch
 from doctr.io import DocumentFile
 from doctr.utils.visualization import visualize_page
-from backend.pytorch import DET_ARCHS, RECO_ARCHS, forward_image, load_predictor
 forward_device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
@@ -50,18 +50,18 @@ def main(det_archs, reco_archs):
     det_arch = st.sidebar.selectbox("Text detection model", det_archs)
     reco_arch = st.sidebar.selectbox("Text recognition model", reco_archs)
-    # For newline
-    st.sidebar.write("\n")
-    # Only straight pages or possible rotation
-    st.sidebar.title("Parameters")
-    assume_straight_pages = st.sidebar.checkbox("Assume straight pages", value=True)
-    st.sidebar.write("\n")
-    # Straighten pages
-    straighten_pages = st.sidebar.checkbox("Straighten pages", value=False)
-    st.sidebar.write("\n")
-    # Binarization threshold
-    bin_thresh = st.sidebar.slider("Binarization threshold", min_value=0.1, max_value=0.9, value=0.3, step=0.1)
-    st.sidebar.write("\n")
     if st.sidebar.button("Analyze page"):
         if uploaded_file is None:
@@ -69,6 +69,9 @@ def main(det_archs, reco_archs):
         else:
             with st.spinner("Loading model..."):
                 predictor = load_predictor(
                     det_arch, reco_arch, assume_straight_pages, straighten_pages, bin_thresh, forward_device
                 )
@@ -96,6 +99,11 @@ def main(det_archs, reco_archs):
                     img = out.pages[0].synthesize()
                     cols[2].image(img, clamp=True)
                 # Display JSON
                 st.markdown("\nHere are your analysis results in JSON format:")
                 st.json(page_export, expanded=False)

+# import cv2
+# import matplotlib.pyplot as plt
 import numpy as np
 import streamlit as st
 import torch
 from doctr.io import DocumentFile
 from doctr.utils.visualization import visualize_page
+from backend.pytorch import DET_ARCHS, RECO_ARCHS, load_predictor #forward_image
 forward_device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
     det_arch = st.sidebar.selectbox("Text detection model", det_archs)
     reco_arch = st.sidebar.selectbox("Text recognition model", reco_archs)
+    # # For newline
+    # st.sidebar.write("\n")
+    # # Only straight pages or possible rotation
+    # st.sidebar.title("Parameters")
+    # assume_straight_pages = st.sidebar.checkbox("Assume straight pages", value=True)
+    # st.sidebar.write("\n")
+    # # Straighten pages
+    # straighten_pages = st.sidebar.checkbox("Straighten pages", value=False)
+    # st.sidebar.write("\n")
+    # # Binarization threshold
+    # bin_thresh = st.sidebar.slider("Binarization threshold", min_value=0.1, max_value=0.9, value=0.3, step=0.1)
+    # st.sidebar.write("\n")
     if st.sidebar.button("Analyze page"):
         if uploaded_file is None:
         else:
             with st.spinner("Loading model..."):
+                # Default Values
+                assume_straight_pages, straighten_pages, bin_thresh = True, False, 0.3
                 predictor = load_predictor(
                     det_arch, reco_arch, assume_straight_pages, straighten_pages, bin_thresh, forward_device
                 )
                     img = out.pages[0].synthesize()
                     cols[2].image(img, clamp=True)
+                print('out',out)
+                print('\n')
+                print('page_export',page_export)
+                print('\n')
                 # Display JSON
                 st.markdown("\nHere are your analysis results in JSON format:")
                 st.json(page_export, expanded=False)

backend/pytorch.py CHANGED Viewed

@@ -60,22 +60,22 @@ def load_predictor(
     return predictor
-def forward_image(predictor: OCRPredictor, image: np.ndarray, device: torch.device) -> np.ndarray:
-    """Forward an image through the predictor
-    Args:
-    ----
-        predictor: instance of OCRPredictor
-        image: image to process
-        device: torch.device, the device to process the image on
-    Returns:
-    -------
-        segmentation map
-    """
-    with torch.no_grad():
-        processed_batches = predictor.det_predictor.pre_processor([image])
-        out = predictor.det_predictor.model(processed_batches[0].to(device), return_model_output=True)
-        seg_map = out["out_map"].to("cpu").numpy()
-    return seg_map

     return predictor
+# def forward_image(predictor: OCRPredictor, image: np.ndarray, device: torch.device) -> np.ndarray:
+#     """Forward an image through the predictor
+#     Args:
+#     ----
+#         predictor: instance of OCRPredictor
+#         image: image to process
+#         device: torch.device, the device to process the image on
+#     Returns:
+#     -------
+#         segmentation map
+#     """
+#     with torch.no_grad():
+#         processed_batches = predictor.det_predictor.pre_processor([image])
+#         out = predictor.det_predictor.model(processed_batches[0].to(device), return_model_output=True)
+#         seg_map = out["out_map"].to("cpu").numpy()
+#     return seg_map