File size: 601 Bytes
c1e438c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
from memory.long_term import LongTermMemory
from memory.embedder import Embedder

class DatasetIngestor:
    """Embed dataset samples and store them in long-term memory.

    Each ingested sample's text is encoded with ``self.embedder`` and the
    text, its embedding, and its metadata are handed to ``self.memory``.
    """

    def __init__(self):
        self.memory = LongTermMemory()
        self.embedder = Embedder()

    def ingest(self, samples, limit=None):
        """Add samples to long-term memory and print how many were added.

        Args:
            samples: Iterable of mappings. Each must provide a ``"text"``
                entry and may provide a ``"meta"`` entry (defaults to an
                empty dict when absent).
            limit: Maximum number of samples to ingest. A falsy value
                (``None`` or ``0``) means no limit.

        Raises:
            KeyError: If a sample has no ``"text"`` entry (assuming the
                samples are dict-like).
        """
        # Count successful additions explicitly instead of reusing the loop
        # index: the index is unbound when ``samples`` is empty and is one
        # too high when the loop stops because ``limit`` was reached.
        added = 0
        for sample in samples:
            if limit and added >= limit:
                break

            text = sample["text"]
            meta = sample.get("meta", {})

            embedding = self.embedder.encode(text)
            self.memory.add(text, embedding, meta)
            added += 1

        print(f"[INGEST] {added} samples added to long-term memory")