Spaces:

Ahmud
/

MobicaFind

Build error

App Files Files Community

Ahmud commited on Mar 5

Commit

3c92b7e

verified ·

1 Parent(s): 1ca2d7f

Upload 4 files

Browse files

Files changed (4) hide show

app.py +565 -0
embeddings_metadata.pkl +3 -0
packages.txt +2 -0
requirements.txt +9 -0

app.py ADDED Viewed

	@@ -0,0 +1,565 @@

+import streamlit as st
+import pickle
+import numpy as np
+import torch
+import torch.nn.functional as F
+from PIL import Image, UnidentifiedImageError
+from sklearn.metrics.pairwise import cosine_similarity
+import os
+from pdf2image import convert_from_path
+from streamlit_cropper import st_cropper
+import easyocr
+from reportlab.lib.pagesizes import letter
+from reportlab.pdfgen import canvas
+from reportlab.lib.utils import ImageReader
+import io
+import base64
+# -------------------
+# Set page config (must be done before other elements)
+# -------------------
+st.set_page_config(
+    page_title="Mobica Find",
+)
+# Inject custom CSS to force a black background
+st.markdown(
+    """
+    <style>
+    .stApp {
+        background-color: black;
+        color: white; /* Ensures your text is visible on black background */
+    }
+    </style>
+    """,
+    unsafe_allow_html=True
+)
+# ---------------
+# Inject top-left logo
+# ---------------
+logo_path = r"E:\Mobica\pdf_parser\logo_mobica.png"
+with open(logo_path, "rb") as f:
+    logo_bytes = f.read()
+encoded_logo = base64.b64encode(logo_bytes).decode()
+st.markdown(
+    f"""
+    <style>
+    .top-left-logo {{
+        position: fixed;
+        top: 1rem;
+        left: 1rem;
+        z-index: 9999;
+    }}
+    </style>
+    <div class="top-left-logo">
+        <img src="data:image/png;base64,{encoded_logo}" width="240">
+    </div>
+    """,
+    unsafe_allow_html=True
+)
+# --------------------
+# Load Processor, Model, and Metadata
+# --------------------
+@st.cache_resource()
+def load_resources():
+    model_name = "kakaobrain/align-base"
+    # Load processor and model directly from Hugging Face
+    processor = AutoProcessor.from_pretrained(model_name)
+    model = AlignModel.from_pretrained(model_name)
+    # Move model to GPU if available
+    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+    model.to(device)
+    return processor, model
+processor, model = load_resources()
+def extract_text_with_easyocr(image, language="en"):
+    """ Extracts text from an image using EasyOCR. """
+    try:
+        results = reader.readtext(np.array(image), detail=0)  # Get only text results
+        return " ".join(results) if results else ""
+    except Exception as e:
+        st.error(f"Error during OCR: {e}")
+        return ""
+# --------------------
+# Embedding Functions
+# --------------------
+def get_image_embedding(image):
+    """Return normalized image embedding."""
+    image_inputs = processor(images=image, return_tensors="pt")
+    image_outputs = model.get_image_features(**image_inputs)
+    return F.normalize(image_outputs, dim=1).detach().cpu().numpy()
+def get_text_embedding(text):
+    """Return normalized text embedding."""
+    text_inputs = processor(text=[text], return_tensors="pt", padding=True, truncation=True)
+    text_outputs = model.get_text_features(**text_inputs)
+    return F.normalize(text_outputs, dim=1).detach().cpu().numpy()
+# --------------------
+# Search Function
+# --------------------
+def find_most_similar_products(
+    image=None,
+    description=None,
+    n=3,
+    combine_method="none"  # "none" (image-only), "text-only", or "average" for combining
+):
+    """
+    Returns the top-n most similar products based on the specified method:
+      - image-only
+      - description-only
+      - both (average of embeddings)
+    """
+    # Prepare the query embedding
+    if combine_method == "none" and image is not None:
+        query_embed = get_image_embedding(image)  # image-only
+    elif combine_method == "text-only" and description is not None:
+        query_embed = get_text_embedding(description)  # text-only
+    else:
+        # "average" => must have both image & description
+        img_emb = get_image_embedding(image)
+        txt_emb = get_text_embedding(description)
+        query_embed = (img_emb + txt_emb) / 2.0  # simple average
+    similarities = []
+    # Loop through each product in metadata and compute similarity
+    for entry in embeddings_metadata.values():
+        image_similarities = []
+        for emb_path in entry.get("image_embedding_paths", []):
+            emb_path = os.path.normpath(emb_path)
+            if os.path.exists(emb_path):
+                stored_embedding = np.load(emb_path)
+                # Cosine similarity
+                image_similarities.append(cosine_similarity(query_embed, stored_embedding).mean())
+        # Average all image sims in the product
+        overall_score = np.mean(image_similarities) if image_similarities else 0
+        if overall_score > 0:
+            similarities.append((overall_score, entry))
+    # Sort descending by similarity
+    return sorted(similarities, key=lambda x: x[0], reverse=True)[:n]
+# --------------------
+# Session State Setup
+# --------------------
+if "pdf_crops" not in st.session_state:
+    # We'll store pairs (snippet_image, product_image) for each page
+    st.session_state["pdf_crops"] = []
+if "results" not in st.session_state:
+    st.session_state["results"] = []
+# --------------------
+# APP UI
+# --------------------
+st.title("Mobica Find")
+search_method = st.selectbox(
+    "Choose Search Method",
+    ["Upload PDF", "Image Only", "Description Only", "Both (Image + Description)"]
+)
+# -----------------------------------------------------------------------------
+# 1) PDF METHOD
+# -----------------------------------------------------------------------------
+# -----------------------------------------------------------------------------
+# 1) PDF METHOD
+# -----------------------------------------------------------------------------
+# Initialize EasyOCR reader (Supports multiple languages)
+reader = easyocr.Reader(["en", "ar"])  # Add languages as needed
+# -------------------
+# Set page config (must be done before other elements)
+# -------------------
+st.set_page_config(
+    page_title="Mobica Find",
+)
+# Inject custom CSS to force a black background
+st.markdown(
+    """
+    <style>
+    .stApp {
+        background-color: black;
+        color: white; /* Ensures your text is visible on black background */
+    }
+    </style>
+    """,
+    unsafe_allow_html=True
+)
+# ---------------
+# Inject top-left logo
+# ---------------
+logo_path = r"E:\Mobica\pdf_parser\logo_mobica.png"
+with open(logo_path, "rb") as f:
+    logo_bytes = f.read()
+encoded_logo = base64.b64encode(logo_bytes).decode()
+st.markdown(
+    f"""
+    <style>
+    .top-left-logo {{
+        position: fixed;
+        top: 1rem;
+        left: 1rem;
+        z-index: 9999;
+    }}
+    </style>
+    <div class="top-left-logo">
+        <img src="data:image/png;base64,{encoded_logo}" width="240">
+    </div>
+    """,
+    unsafe_allow_html=True
+)
+# --------------------
+# Load Processor, Model, and Metadata
+# --------------------
+@st.cache_resource()
+def load_resources():
+    with open(r"E:\Mobica\pdf_parser\Data Sheet\align_processor.pkl", "rb") as f:
+        processor = pickle.load(f)
+    with open(r"E:\Mobica\pdf_parser\Data Sheet\align_model.pkl", "rb") as f:
+        model = pickle.load(f)
+    with open(r"E:\Mobica\pdf_parser\Data Sheet\embeddings_metadata.pkl", "rb") as f:
+        embeddings_metadata = pickle.load(f)
+    return processor, model, embeddings_metadata
+processor, model, embeddings_metadata = load_resources()
+# --------------------
+# OCR Function using EasyOCR
+# --------------------
+def extract_text_with_easyocr(image, language="en"):
+    """ Extracts text from an image using EasyOCR. """
+    try:
+        results = reader.readtext(np.array(image), detail=0)  # Get only text results
+        return " ".join(results) if results else ""
+    except Exception as e:
+        st.error(f"Error during OCR: {e}")
+        return ""
+# --------------------
+# APP UI
+# --------------------
+st.title("Mobica Find")
+search_method = st.selectbox(
+    "Choose Search Method",
+    ["Upload PDF", "Image Only", "Description Only", "Both (Image + Description)"]
+)
+# -----------------------------------------------------------------------------
+# PDF Processing Section
+# -----------------------------------------------------------------------------
+if search_method == "Upload PDF":
+    st.subheader("Upload a PDF")
+    uploaded_pdf = st.file_uploader("Upload a PDF", type=["pdf"])
+    if uploaded_pdf:
+        pdf_path = f"temp_{uploaded_pdf.name}"
+        with open(pdf_path, "wb") as f:
+            f.write(uploaded_pdf.getbuffer())
+        st.write("Extracting pages from PDF...")
+        pages = convert_from_path(pdf_path, 300)
+        if pages:
+            page_num = st.number_input("Select Page Number", min_value=1, max_value=len(pages), value=1) - 1
+            page_image = pages[page_num]
+            # -------------------- Crop Snippet for OCR (description) --------------------
+            st.subheader("Crop Snippet from PDF for OCR")
+            cropped_img_pdf_snippet = st_cropper(page_image, realtime_update=True, box_color='#FF0000')
+            description_ocr = ""
+            if cropped_img_pdf_snippet:
+                cropped_img_pdf_snippet = cropped_img_pdf_snippet.convert("RGB")
+                st.image(cropped_img_pdf_snippet, caption="Cropped PDF Snippet (For OCR)")
+                # Use EasyOCR instead of Tesseract
+                selected_lang = st.selectbox("Select OCR Language", ["en", "ar", "en+ar"], index=0)
+                description_ocr = extract_text_with_easyocr(cropped_img_pdf_snippet, language=selected_lang)
+                if description_ocr:
+                    st.success("OCR text extracted successfully!")
+                    st.write("**Detected Text**:", description_ocr)
+                else:
+                    st.warning("No text detected.")
+            # -------------------- Crop for product image --------------------
+            st.subheader("Crop the Product Image")
+            furniture_cropped_img = st_cropper(page_image, realtime_update=True, box_color='#00FF00')
+            if furniture_cropped_img:
+                furniture_cropped_img = furniture_cropped_img.convert("RGB")
+                st.image(furniture_cropped_img, caption="Cropped Product Image")
+            # -------------------- "Done" Button to save both crops --------------------
+            if st.button("Done"):
+                st.session_state.setdefault("pdf_crops", []).append(
+                    (cropped_img_pdf_snippet, furniture_cropped_img)
+                )
+                st.success(f"Crop #{len(st.session_state['pdf_crops'])} saved!")
+    # -------------------- Show saved crops if any --------------------
+    if "pdf_crops" in st.session_state and len(st.session_state["pdf_crops"]) > 0:
+        st.subheader("📊 View Saved Crops")
+        crop_index = st.slider("Select Crop", 1, len(st.session_state["pdf_crops"]), 1) - 1
+        snippet_img, product_img = st.session_state["pdf_crops"][crop_index]
+        col1, col2 = st.columns(2)
+        with col1:
+            if snippet_img:
+                st.image(snippet_img, caption=f"Snippet Crop {crop_index+1}", use_column_width=True)
+        with col2:
+            if product_img:
+                st.image(product_img, caption=f"Product Crop {crop_index+1}", use_column_width=True)
+        if st.button(f"Delete Crop {crop_index+1}"):
+            st.session_state["pdf_crops"].pop(crop_index)
+            st.success(f"Crop {crop_index+1} deleted!")
+            st.experimental_rerun()
+    # -------------------- Let user choose how many similar products --------------------
+    n_similar = st.slider("How many similar products do you want?", 1, 10, 3)
+    # -------------------- "Find Similar Products" button --------------------
+    if st.button("Find Similar Products"):
+        st.session_state["results"] = []
+        # We'll do an image-based search using the product crop only
+        for snippet_img, product_img in st.session_state["pdf_crops"]:
+            if product_img is not None:
+                results_for_img = find_most_similar_products(
+                    image=product_img,
+                    n=n_similar,
+                    combine_method="none"  # image-only
+                )
+                st.session_state["results"].append(results_for_img)
+        st.success("Results generated!")
+        # -------------- Display results in the Streamlit GUI --------------
+        for i, results_for_img in enumerate(st.session_state["results"]):
+            st.write(f"**Results for Crop {i+1}**:")
+            if results_for_img:
+                for sim_score, matched_entry in results_for_img:
+                    # Extract product code from the original image path
+                    if "original_image_paths" in matched_entry and matched_entry["original_image_paths"]:
+                        matched_img_path = os.path.normpath(matched_entry["original_image_paths"][0])
+                        product_code = os.path.basename(matched_img_path).split('_')[0]  # Extract product code
+                    st.subheader(f"🔹 Match (Similarity: {sim_score:.4f})")
+                    st.write(f"**Product Code:** {product_code}")  # Display product code
+                    st.write(f"**Description:** {matched_entry.get('description', 'No description')}")
+                    # Show the first matched image (if available)
+                    if os.path.exists(matched_img_path):
+                        try:
+                            img_matched = Image.open(matched_img_path).convert("RGB")
+                            st.image(
+                                img_matched,
+                                caption=f"Matched Image (Sim: {sim_score:.4f})",
+                                use_column_width=True
+                            )
+                        except UnidentifiedImageError:
+                            st.warning(f"⚠️ Cannot open image: {matched_img_path}. It might be corrupted.")
+                    else:
+                        st.warning(f"⚠️ Image file not found: {matched_img_path}")
+            else:
+                st.warning(f"No similar products found for Crop {i+1}.")
+    # -------------------- Generate PDF if results are available --------------------
+    if len(st.session_state["results"]) > 0:
+        pdf_buffer = io.BytesIO()
+        pdf = canvas.Canvas(pdf_buffer, pagesize=letter)
+        # st.session_state["results"] is a list of lists
+        # st.session_state["pdf_crops"] is a list of (snippet_img, product_img)
+        for i, (snippet_img, product_img) in enumerate(st.session_state["pdf_crops"]):
+            pdf.drawString(100, 750, f"Crop {i+1}")
+            # Add cropped product image to PDF
+            if product_img:
+                img_byte_arr = io.BytesIO()
+                product_img.save(img_byte_arr, format='JPEG')
+                img_byte_arr.seek(0)
+                pdf.drawImage(ImageReader(img_byte_arr), 100, 550, width=200, height=150)
+            y_pos = 530
+            # Go through the matched results for this product
+            if i < len(st.session_state["results"]):
+                for sim_score, matched_entry in st.session_state["results"][i]:
+                    if "original_image_paths" in matched_entry and len(matched_entry["original_image_paths"]) > 0:
+                        matched_img_path = os.path.normpath(matched_entry["original_image_paths"][0])
+                        product_code = os.path.basename(matched_img_path).split('_')[0]  # Extract product code
+                        pdf.drawString(100, y_pos, f"Product Code: {product_code}")  # Add product code to PDF
+                        #pdf.drawString(100, y_pos - 20, f"Similarity: {sim_score:.4f}")
+                        y_pos -= 40
+                        if os.path.exists(matched_img_path):
+                            pdf.drawImage(matched_img_path, 350, y_pos - 50, width=150, height=100)
+                            y_pos -= 120
+            pdf.showPage()
+        pdf.save()
+        pdf_buffer.seek(0)
+        st.download_button(
+            "📥 Download Results PDF",
+            pdf_buffer,
+            f"{uploaded_pdf.name}_results.pdf",
+            "application/pdf"
+        )
+# -----------------------------------------------------------------------------
+# 2) IMAGE ONLY
+# -----------------------------------------------------------------------------
+elif search_method == "Image Only":
+    st.subheader("Upload an Image")
+    uploaded_image = st.file_uploader("Select an Image", type=["png", "jpg", "jpeg"])
+    if uploaded_image is not None:
+        image_obj = Image.open(uploaded_image).convert("RGB")
+        st.image(image_obj, use_column_width=True)
+        # Let user choose how many similar products
+        n_similar = st.slider("How many similar products do you want?", 1, 10, 3)
+        # Button to trigger the search
+        if st.button("Find Similar Products"):
+            results = find_most_similar_products(
+                image=image_obj,
+                n=n_similar,
+                combine_method="none"  # image-only
+            )
+            if results:
+                for sim_score, matched_entry in results:
+                    st.subheader(f"🔹 Match (Similarity: {sim_score:.4f})")
+                    st.write(f"**Description:** {matched_entry.get('description','No description')}")
+                    # Display the first image of the matched entry
+                    if "original_image_paths" in matched_entry and matched_entry["original_image_paths"]:
+                        img_path = os.path.normpath(matched_entry["original_image_paths"][0])  # Normalize path
+                        if os.path.exists(img_path):
+                            try:
+                                img_matched = Image.open(img_path).convert("RGB")
+                                st.image(
+                                    img_matched,
+                                    caption=f"Matched Image (Sim: {sim_score:.4f})",
+                                    use_column_width=True
+                                )
+                            except UnidentifiedImageError:
+                                st.warning(f"⚠️ Cannot open image: {img_path}. It might be corrupted.")
+                        else:
+                            st.warning(f"⚠️ Image file not found: {img_path}")
+            else:
+                st.warning("No similar products found.")
+# -----------------------------------------------------------------------------
+# 3) DESCRIPTION ONLY
+# -----------------------------------------------------------------------------
+elif search_method == "Description Only":
+    st.subheader("Enter a Description")
+    user_description = st.text_area("Type or paste your description here")
+    if user_description.strip():
+        # Let user choose how many similar products
+        n_similar = st.slider("How many similar products do you want?", 1, 10, 3)
+        # Button to trigger the search
+        if st.button("Find Similar Products"):
+            results = find_most_similar_products(
+                description=user_description,
+                n=n_similar,
+                combine_method="text-only"
+            )
+            if results:
+                for sim_score, matched_entry in results:
+                    st.subheader(f"🔹 Match (Similarity: {sim_score:.4f})")
+                    st.write(f"**Description:** {matched_entry.get('description','No description')}")
+                    # Display the first image of the matched entry
+                    if "original_image_paths" in matched_entry and matched_entry["original_image_paths"]:
+                        img_path = os.path.normpath(matched_entry["original_image_paths"][0])
+                        if os.path.exists(img_path):
+                            try:
+                                img_matched = Image.open(img_path).convert("RGB")
+                                st.image(
+                                    img_matched,
+                                    caption=f"Matched Image (Sim: {sim_score:.4f})",
+                                    use_column_width=True
+                                )
+                            except UnidentifiedImageError:
+                                st.warning(f"⚠️ Cannot open image: {img_path}. It might be corrupted.")
+                        else:
+                            st.warning(f"⚠️ Image file not found: {img_path}")
+            else:
+                st.warning("No similar products found.")
+# -----------------------------------------------------------------------------
+# 4) BOTH (IMAGE + DESCRIPTION)
+# -----------------------------------------------------------------------------
+elif search_method == "Both (Image + Description)":
+    st.subheader("Upload an Image and Enter a Description")
+    uploaded_image = st.file_uploader("Select an Image", type=["png", "jpg", "jpeg"])
+    user_description = st.text_area("Type or paste your description here")
+    if uploaded_image is not None:
+        image_obj = Image.open(uploaded_image).convert("RGB")
+        st.image(image_obj, use_column_width=True)
+        if user_description.strip():
+            # Let user choose how many similar products
+            n_similar = st.slider("How many similar products do you want?", 1, 10, 3)
+            # Button to trigger the search
+            if st.button("Find Similar Products"):
+                results = find_most_similar_products(
+                    image=image_obj,
+                    description=user_description,
+                    n=n_similar,
+                    combine_method="average"
+                )
+                if results:
+                    for sim_score, matched_entry in results:
+                        st.subheader(f"🔹 Match (Similarity: {sim_score:.4f})")
+                        st.write(f"**Description:** {matched_entry.get('description','No description')}")
+                        # Display the first image of the matched entry
+                        if "original_image_paths" in matched_entry and matched_entry["original_image_paths"]:
+                            img_path = os.path.normpath(matched_entry["original_image_paths"][0])
+                            if os.path.exists(img_path):
+                                try:
+                                    img_matched = Image.open(img_path).convert("RGB")
+                                    st.image(
+                                        img_matched,
+                                        caption=f"Matched Image (Sim: {sim_score:.4f})",
+                                        use_column_width=True
+                                    )
+                                except UnidentifiedImageError:
+                                    st.warning(f"⚠️ Cannot open image: {img_path}. It might be corrupted.")
+                            else:
+                                st.warning(f"⚠️ Image file not found: {img_path}")
+                else:
+                    st.warning("No similar products found.")

embeddings_metadata.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:25f96cefa7b214660cef0e4ee06c3685141b17dd920944d7f8d724e65761d54a
+size 209465

packages.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ poppler-utils
2	+ tesseract-ocr

requirements.txt ADDED Viewed

	@@ -0,0 +1,9 @@

+streamlit==1.31.1
+numpy==1.26.4
+torch==2.6.0+cpu
+PIL==10.2.0
+sklearn==1.4.0
+pdf2image==1.17.0
+streamlit_cropper==0.2.1
+pytesseract==0.3.10
+reportlab==4.3.1