notebooklm-fast / check_chroma_data.py
jashdoshi77
Update UI styling and message formatting improvements
abc646e
"""Quick script to check what's stored in ChromaDB metadata collection."""
from services.chroma_service import ChromaService
def check_metadata():
    """Print a diagnostic summary of the ChromaDB metadata collection.

    Fetches every entry from ``ChromaService().metadata_collection`` and
    prints, in order:

    * the total number of entries,
    * every field of the first entry, sorted by key,
    * each entry whose ``renewal_year`` equals 2026 and whose
      ``renewal_date`` (as text) contains ``-02-``, followed by their count,
    * the distinct ``renewal_year`` values (entries lacking the key count
      as ``0``).

    Returns:
        None. All output is written to stdout.
    """
    print("Connecting to ChromaDB...")
    service = ChromaService()
    data = service.metadata_collection.get()
    total = len(data['ids'])
    print(f"Total entries in document_metadata: {total}")

    # Guard clause: nothing to inspect in an empty collection.
    if not total:
        print("No data found!")
        return

    # An entry stored without metadata may come back as None; treat it as an
    # empty mapping so the report keeps going instead of raising
    # AttributeError on .items() / .get().
    metadatas = [entry or {} for entry in data['metadatas']]

    print("\n--- Sample entry (first) ---")
    for key, value in sorted(metadatas[0].items()):
        print(f" {key}: {value}")

    # Find Feb 2026 renewals
    print("\n--- Entries with Feb 2026 renewal ---")
    feb_count = 0
    for meta in metadatas:
        rd = str(meta.get('renewal_date', ''))
        ry = meta.get('renewal_year', 0)
        # Feb 2026 == year field is 2026 and the date text has a "-02-" month part.
        if ry == 2026 and '-02-' in rd:
            feb_count += 1
            print(f" {meta.get('document_title')}: renewal_date={rd}, renewal_year={ry}")

    print(f"\nTotal Feb 2026 renewals found: {feb_count}")

    # Show all unique renewal years
    years = {meta.get('renewal_year', 0) for meta in metadatas}
    try:
        ordered_years = sorted(years)
    except TypeError:
        # Mixed value types (e.g. int and str) cannot be ordered against each
        # other; fall back to ordering by text so the diagnostic still prints.
        ordered_years = sorted(years, key=str)
    print(f"\nAll renewal years in data: {ordered_years}")
# Run the report only when this file is executed directly as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    check_metadata()