Spaces:
Sleeping
Sleeping
| import os, json, numpy as np | |
| from core.vector import embed | |
def load_docs(base="data/demo"):
    """Load every document listed in ``<base>/metadata.json``.

    The metadata file is read as a JSON object whose keys are file names
    located under ``<base>/documents`` and whose values are per-document
    metadata objects.

    Args:
        base: Directory containing ``metadata.json`` and a ``documents``
            sub-directory.

    Returns:
        A list with one dict per metadata entry, in the metadata's iteration
        order, with keys ``"id"`` (the file name), ``"text"`` (the file
        contents), ``"vec"`` (the result of ``embed(text)``), ``"agency"``,
        ``"year"`` and ``"program"`` (``"Unknown"`` when absent).

    Raises:
        OSError: If the metadata file or a listed document cannot be opened.
        json.JSONDecodeError: If ``metadata.json`` is not valid JSON.
        KeyError: If an entry lacks ``"agency"`` or ``"year"``.
    """
    # Read the metadata as UTF-8, matching how the documents are read below,
    # instead of relying on the platform default encoding.
    with open(os.path.join(base, "metadata.json"), encoding="utf-8") as meta_file:
        meta = json.load(meta_file)

    docs = []
    for fname, m in meta.items():
        # A context manager closes each document handle promptly rather than
        # leaving it to garbage collection.
        with open(os.path.join(base, "documents", fname), encoding="utf-8") as doc_file:
            text = doc_file.read()
        docs.append({
            "id": fname,
            "text": text,
            # NOTE(review): embed comes from core.vector; presumably it returns
            # an embedding vector for the text -- confirm against that module.
            "vec": embed(text),
            "agency": m["agency"],
            "year": m["year"],
            "program": m.get("program", "Unknown"),
        })
    return docs