Dua Rajper committed on
Commit
c185222
·
verified ·
1 Parent(s): 4038998

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +26 -0
app.py ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Streamlit app: run OCR and CLIP label scoring on an uploaded image.

The user uploads a PNG/JPEG image. The app displays it, extracts any text
with EasyOCR, and reports CLIP image-text similarity logits for a fixed
list of candidate descriptions.
"""

import streamlit as st
from PIL import Image
import easyocr
from transformers import CLIPProcessor, CLIPModel

# Load OCR & CLIP
# NOTE(review): these loads run at module level with no caching, so they are
# repeated whenever the script is re-executed; consider wrapping them in an
# `st.cache_resource` function if the installed Streamlit version supports it.
reader = easyocr.Reader(['en'])
model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32")

st.title("Multimodal AI Assistant")
uploaded_file = st.file_uploader("Upload an Image", type=["png", "jpg", "jpeg"])

if uploaded_file is not None:
    image = Image.open(uploaded_file)
    st.image(image, caption="Uploaded Image", use_column_width=True)

    # Extract text from image.
    # EasyOCR accepts a file path/URL, raw bytes, or a NumPy array -- not a
    # file-like object -- so hand it the upload's raw bytes. getvalue() returns
    # the whole buffer regardless of how far Image.open() advanced the stream.
    extracted_text = reader.readtext(uploaded_file.getvalue(), detail=0)
    st.write("Extracted Text:", extracted_text)

    # CLIP Analysis
    text_descriptions = ["A car", "A dog", "A person", "A building"]
    # padding=True lets prompts of different token lengths be batched into a
    # single tensor; without it the call only works when all prompts happen
    # to tokenize to the same length.
    inputs = processor(
        text=text_descriptions,
        images=image,
        return_tensors="pt",
        padding=True,
    )
    outputs = model(**inputs)
    # logits_per_image holds one row per image with one raw similarity score
    # per description, in the same order as text_descriptions.
    st.write("CLIP Model Scores:", outputs.logits_per_image.tolist())