Spaces:
Sleeping
Sleeping
| set -euo pipefail | |
| ROOT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)" | |
| CORPUS_DIR="${CORPUS_DIR:-${ROOT_DIR}/training_corpus}" | |
| CORPUS_DB_DIR="${CORPUS_DB_DIR:-${ROOT_DIR}/outputs/corpus_dbs}" | |
| PYTHON_BIN="${PYTHON_BIN:-${ROOT_DIR}/.venv/bin/python}" | |
| mkdir -p "${CORPUS_DB_DIR}" | |
| cd "${ROOT_DIR}" | |
| seed_one() { | |
| local name="$1" | |
| local rel_path="$2" | |
| local source_path="${CORPUS_DIR}/${rel_path}" | |
| local db_path="${CORPUS_DB_DIR}/${name}.db" | |
| if [[ ! -d "${source_path}" ]]; then | |
| echo "[WARN] Missing source for ${name}: ${source_path}" | |
| return | |
| fi | |
| echo "[SEED] ${name} from ${source_path}" | |
| GRAPHREVIEW_DB_PATH="${db_path}" "${PYTHON_BIN}" -m db.seed "${source_path}" --force | |
| } | |
| # Tier 1 | |
| seed_one requests requests/src/requests | |
| seed_one flask flask/src/flask | |
| seed_one fastapi fastapi/fastapi | |
| seed_one pydantic pydantic/pydantic | |
| # Tier 2 | |
| seed_one celery celery/celery | |
| seed_one scrapy_core scrapy/scrapy/core | |
| seed_one scrapy_pipelines scrapy/scrapy/pipelines | |
| seed_one django_db django/django/db | |
| seed_one django_http django/django/http | |
| seed_one django_auth django/django/contrib/auth | |
| seed_one airflow airflow/airflow | |
| # Tier 3 | |
| seed_one erpnext erpnext/erpnext | |
| seed_one fastapi_tdd fastapi-tdd-docker/project | |
| seed_one rest_api_smorest rest-api-smorest-docker/app | |
| echo "[DONE] Corpus seeding complete -> ${CORPUS_DB_DIR}" | |