Spaces:

GIZ
/

Development-Project-Synergy-Finder

Sleeping

Jan Mühlnikel

added semantic search function

71de22d about 2 years ago

933 Bytes

	import pickle
	import faiss
	import streamlit as st
	from sentence_transformers import SentenceTransformer
	import pandas as pd

	def search(query, model, embeddings, filtered_df, top_x=30):

	filtered_df_indecies_list = filtered_df.index
	filtered_embeddings = embeddings[filtered_df_indecies_list]

	# Load or create FAISS index
	dimension = filtered_embeddings.shape[1]
	faiss_index = faiss.IndexFlatL2(dimension)
	faiss_index.add(filtered_embeddings)

	# Convert query to embedding
	query_embedding = model.encode([query])[0].reshape(1, -1)

	# Perform search
	D, I = faiss_index.search(query_embedding, k=top_x) # Search for top x similar items

	# Extract the sentences corresponding to the top indices
	#print(filtered_df.columns())
	top_indecies = [i for i in I[0]]

	return filtered_df.iloc[top_indecies]