vignesh-fynd commited on
Commit
ff87042
·
1 Parent(s): 53fb893

updated layout

Browse files
Files changed (1) hide show
  1. pages/1_📊_About.py +55 -57
pages/1_📊_About.py CHANGED
@@ -7,63 +7,61 @@ st.sidebar.header("About Semantic Search with LLMs")
7
 
8
  tab1, tab2 = st.tabs(["Product Discovery", "Question And Answering"])
9
  with tab1:
10
- st.header("Product Discovery")
11
- with st.expander("Details"):
12
- st.markdown("**Application:** Gofynd.com")
13
- st.markdown("**Total Products:** 14,000")
14
- st.markdown("**Data Used:**")
15
- st.markdown("- Text fields - Name, Brand, Category, Gender")
16
- st.markdown("- Images - Single Images (First image of the product)")
17
- st.markdown("Embedding Model: Used CLIP model for Generating the Embeddings for Text and Image")
18
- st.markdown("Weightage [Text, Image]: [0.1, 0.9]")
19
- st.markdown("Vector Database: Milvus")
20
- st.markdown("ML Pipeline Orchestration: Vertex AI Pipeline")
21
- st.markdown("Supported Input data format:")
22
- st.markdown("Similarity Metric: Inner Product")
23
- st.markdown("Type of Index: FLAT_L2")
24
-
25
- st.subheader("Input Sample Data:")
26
- st.markdown("Sample data can be displayed here.")
27
-
28
- st.subheader("STEPS")
29
- st.markdown("**TRAINING:**")
30
- st.markdown("1. Pull the Catalog data from Fynd Platform")
31
- st.markdown("2. Parse Textual and Image data from Catalog data")
32
- st.markdown("3. Generate Embeddings for Textual fields")
33
- st.markdown("4. Generate Embeddings for Image")
34
- st.markdown("5. Aggregate Embeddings with help of defined weightage")
35
- st.markdown("6. Store it to Vector DB - Milvus")
36
-
37
- st.markdown("**SERVING:**")
38
- st.markdown("1. Convert the Users’s query as Input text string to Embeddings with CLIP model")
39
- st.markdown("2. Pass the user’s search query to LLM - OpenAI’S GPT3 to detect the search entities - Query, Brand, Category, Price, Sorting type")
40
- st.markdown("3. Prepare and Apply Search Query on Collection of Milvus DB on which the data is indexed")
41
- st.markdown("4. Fetch top N results")
42
- st.markdown("5. Apply filters and return the results")
43
 
44
  with tab2:
45
  st.header("Question And Answering")
46
- with st.expander("Details"):
47
- st.markdown("**Application:** Gofynd.com")
48
- st.markdown("**Total Documents:** FAQ, Return, Shipping, T&C")
49
- st.markdown("**Framework:** Langchain")
50
- st.markdown("Embedding Model: Used OpenAI’s GPT3.5 model for Generating the Embeddings for Text docus")
51
- st.markdown("Vector Database: Milvus")
52
- st.markdown("ML Pipeline Orchestration: Vertex AI Pipeline")
53
- st.markdown("Supported Input data format: Strict JSON format (Other formats to be added shortly)")
54
- st.markdown("Support file type: JSON")
55
- st.markdown("Similarity Metric: Inner Product")
56
- st.markdown("Type of Index: FLAT_L2")
57
-
58
- st.subheader("STEPS")
59
- st.markdown("**TRAINING:**")
60
- st.markdown("1. Pull Textual policy documents from FDK")
61
- st.markdown("2. Parse the file data and make all documents at flat level")
62
- st.markdown("3. Apply splitters to convert the documents to chunks")
63
- st.markdown("4. Generate the Embeddings for those chunks")
64
- st.markdown("5. Store Embeddings to Milvus DB and create Index")
65
-
66
- st.markdown("**SERVING:**")
67
- st.markdown("1. Convert users’ question to embeddings with help of OpenAI’s GPT3.5 model")
68
- st.markdown("2. Apply Embedding Search Query on Collection of Milvus DB on which the data is indexed and Fetch top 10 Docs")
69
- st.markdown("3. Use PROMPT template to prepare PROMPT = TEMPLATE + CONTEXT and use OpenAI’s to generate the response")
 
7
 
8
  tab1, tab2 = st.tabs(["Product Discovery", "Question And Answering"])
9
  with tab1:
10
+ st.header("Product Discovery")
11
+ st.markdown("**Application:** Gofynd.com")
12
+ st.markdown("**Total Products:** 14,000")
13
+ st.markdown("**Data Used:**")
14
+ st.markdown("- Text fields - Name, Brand, Category, Gender")
15
+ st.markdown("- Images - Single Images (First image of the product)")
16
+ st.markdown("Embedding Model: Used CLIP model for Generating the Embeddings for Text and Image")
17
+ st.markdown("Weightage [Text, Image]: [0.1, 0.9]")
18
+ st.markdown("Vector Database: Milvus")
19
+ st.markdown("ML Pipeline Orchestration: Vertex AI Pipeline")
20
+ st.markdown("Supported Input data format:")
21
+ st.markdown("Similarity Metric: Inner Product")
22
+ st.markdown("Type of Index: FLAT_L2")
23
+
24
+ st.subheader("Input Sample Data:")
25
+ st.markdown("Sample data can be displayed here.")
26
+
27
+ st.subheader("STEPS")
28
+ st.markdown("**TRAINING:**")
29
+ st.markdown("1. Pull the Catalog data from Fynd Platform")
30
+ st.markdown("2. Parse Textual and Image data from Catalog data")
31
+ st.markdown("3. Generate Embeddings for Textual fields")
32
+ st.markdown("4. Generate Embeddings for Image")
33
+ st.markdown("5. Aggregate Embeddings with help of defined weightage")
34
+ st.markdown("6. Store it to Vector DB - Milvus")
35
+
36
+ st.markdown("**SERVING:**")
37
+ st.markdown("1. Convert the Users’s query as Input text string to Embeddings with CLIP model")
38
+ st.markdown("2. Pass the user’s search query to LLM - OpenAI’S GPT3 to detect the search entities - Query, Brand, Category, Price, Sorting type")
39
+ st.markdown("3. Prepare and Apply Search Query on Collection of Milvus DB on which the data is indexed")
40
+ st.markdown("4. Fetch top N results")
41
+ st.markdown("5. Apply filters and return the results")
 
42
 
43
  with tab2:
44
  st.header("Question And Answering")
45
+ st.markdown("**Application:** Gofynd.com")
46
+ st.markdown("**Total Documents:** FAQ, Return, Shipping, T&C")
47
+ st.markdown("**Framework:** Langchain")
48
+ st.markdown("Embedding Model: Used OpenAI’s GPT3.5 model for Generating the Embeddings for Text docus")
49
+ st.markdown("Vector Database: Milvus")
50
+ st.markdown("ML Pipeline Orchestration: Vertex AI Pipeline")
51
+ st.markdown("Supported Input data format: Strict JSON format (Other formats to be added shortly)")
52
+ st.markdown("Support file type: JSON")
53
+ st.markdown("Similarity Metric: Inner Product")
54
+ st.markdown("Type of Index: FLAT_L2")
55
+
56
+ st.subheader("STEPS")
57
+ st.markdown("**TRAINING:**")
58
+ st.markdown("1. Pull Textual policy documents from FDK")
59
+ st.markdown("2. Parse the file data and make all documents at flat level")
60
+ st.markdown("3. Apply splitters to convert the documents to chunks")
61
+ st.markdown("4. Generate the Embeddings for those chunks")
62
+ st.markdown("5. Store Embeddings to Milvus DB and create Index")
63
+
64
+ st.markdown("**SERVING:**")
65
+ st.markdown("1. Convert users’ question to embeddings with help of OpenAI’s GPT3.5 model")
66
+ st.markdown("2. Apply Embedding Search Query on Collection of Milvus DB on which the data is indexed and Fetch top 10 Docs")
67
+ st.markdown("3. Use PROMPT template to prepare PROMPT = TEMPLATE + CONTEXT and use OpenAI’s to generate the response")