coachable-course-agent / scripts /test_courses_chroma.py
rdisipio's picture
recommend courses
855e546
raw
history blame contribute delete
869 Bytes
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
from langchain.vectorstores import Chroma
from langchain.embeddings import HuggingFaceEmbeddings
embedding_model = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
courses_collection = Chroma(
persist_directory="data/courses_chroma",
embedding_function=embedding_model
)
# Print number of stored courses
try:
n_courses = courses_collection._collection.count()
print(f"Number of stored courses in Chroma: {n_courses}")
except Exception as e:
print(f"Could not count courses: {e}")
# Print a few sample documents (if any)
try:
docs = courses_collection._collection.get(limit=3)
print("Sample documents:")
for i, doc in enumerate(docs["documents"]):
print(f"--- Document {i+1} ---")
print(doc)
except Exception as e:
print(f"Could not fetch sample documents: {e}")