Spaces:
Runtime error
Runtime error
| import asyncio | |
| from chroma import ChromaClient, TransformersEmbeddingFunction | |
| async def main(): | |
| # Chroma client | |
| client = ChromaClient() | |
| # Connect to backend | |
| # BERT embedding | |
| embedder = TransformersEmbeddingFunction('bert-base-uncased') | |
| # Create collection | |
| collection = await client.createCollection({'name':'my_collection', | |
| 'embeddingFunction': embedder}) | |
| # Load document | |
| with open('Caribbean-Artificial-Intelligence-Policy-Roadmap.txt') as f: | |
| doc = f.read() | |
| # Tokenize | |
| sentences = sent_tokenize(doc) | |
| # Generate embeddings | |
| embeddings = [] | |
| for sentence in sentences: | |
| embeddings.append(embedder.encode(sentence)) | |
| # Add to Chroma | |
| await collection.add({'ids': list(range(len(sentences))), | |
| 'embeddings': embeddings, | |
| 'documents': sentences}) | |
| print("Documents indexed successfully!") | |
| asyncio.run(main()) |