File size: 2,115 Bytes
2cc32a5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
#!/usr/bin/env bash
# Strict mode: abort on command failure, on use of an unset variable, and on
# failure of any stage of a pipeline.
set -o errexit -o nounset -o pipefail

# ------------------------------------------------------------
# InsureOS Models: environment bootstrap
# Intended host: 16GB GPU VM (Bytical Audio)
# ------------------------------------------------------------

printf '%s\n' "=== InsureOS Models Setup ===" "GPU check:"
# Best-effort probe: nvidia-smi's own error output is discarded, and a missing
# or failing nvidia-smi only produces a warning instead of stopping the script.
if ! nvidia-smi --query-gpu=name,memory.total --format=csv,noheader 2>/dev/null; then
  printf '%s\n' "WARNING: No GPU detected"
fi

# OS-level prerequisites, installed through apt (invoked via sudo).
echo "=== Installing system dependencies ==="
apt_packages=(python3-pip python3-venv git curl wget)
sudo apt-get update -qq
sudo apt-get install -y -qq "${apt_packages[@]}"

# Build a virtual environment in ./.venv and activate it in this shell, so the
# pip commands that follow run against that environment.
echo "=== Creating Python virtual environment ==="
venv_dir=.venv
python3 -m venv "${venv_dir}"
. "${venv_dir}/bin/activate"

# Core ML: refresh the packaging tools first, then fetch the PyTorch family
# from the PyTorch wheel index for cu121 builds.
echo "=== Installing PyTorch + CUDA ==="
torch_index_url=https://download.pytorch.org/whl/cu121
pip install --upgrade pip wheel setuptools
pip install --index-url "${torch_index_url}" torch torchvision torchaudio

# Training stack
#
# Every requirement specifier is quoted. Unquoted, the shell parses the `>` in
# e.g. `transformers>=4.50.0` as an output redirection: pip is handed only the
# bare package name (so no minimum version is enforced) and pip's stdout ends
# up in a stray file such as `=4.50.0` in the working directory.
echo "=== Installing training dependencies ==="
training_requirements=(
  'transformers>=4.50.0'
  'datasets>=3.0.0'
  'accelerate>=1.2.0'
  'peft>=0.14.0'
  'trl>=0.15.0'
  'bitsandbytes>=0.45.0'
  flash-attn
  sentencepiece
  protobuf
  wandb
)
# --no-build-isolation is a command-wide pip option, so it affects every
# package in this install, not only flash-attn.
# NOTE(review): presumably it is here so flash-attn builds against the torch
# already installed in the environment; confirm.
pip install --no-build-isolation "${training_requirements[@]}"

# Specialized ML
#
# Requirement specifiers are quoted so the shell does not interpret `>=...` as
# a stdout redirection (which would drop the version constraint and create
# stray files like `=1.5.0`).
echo "=== Installing specialized ML packages ==="
specialized_requirements=(
  'scikit-learn>=1.5.0'
  'xgboost>=2.1.0'
  'lightgbm>=4.5.0'
  'interpret>=0.6.0'
  'statsmodels>=0.14.0'
  'scipy>=1.14.0'
  'networkx>=3.4'
  'torch-geometric>=2.6.0'
  pyg-lib
)
# Extra wheel location passed to pip via -f (find-links).
# NOTE(review): the URL names torch 2.5.0 + cu121, while the torch install in
# this script is not version-pinned; confirm the two stay compatible.
pyg_wheel_url='https://data.pyg.org/whl/torch-2.5.0+cu121.html'
pip install -f "${pyg_wheel_url}" "${specialized_requirements[@]}"

# Serving
#
# Requirement specifiers are quoted so the shell does not interpret `>=...` as
# a stdout redirection (which would drop the version constraint and create
# stray files like `=0.115.0`).
echo "=== Installing serving dependencies ==="
serving_requirements=(
  'fastapi>=0.115.0'
  'uvicorn>=0.32.0'
  'pydantic>=2.10.0'
)
pip install "${serving_requirements[@]}"

# Evaluation: packages installed without version constraints.
echo "=== Installing evaluation packages ==="
eval_packages=(rouge-score nltk bert-score seqeval)
pip install "${eval_packages[@]}"

# Data generation
#
# Requirement specifiers are quoted so the shell does not interpret `>=...` as
# a stdout redirection (which would drop the version constraint and create
# stray files like `=33.0.0`).
echo "=== Installing data generation packages ==="
datagen_requirements=(
  'faker>=33.0.0'
  'numpy>=1.26.0'
  'pandas>=2.2.0'
  'tqdm>=4.67.0'
)
pip install "${datagen_requirements[@]}"

# Closing banner: a blank line, then the follow-up commands for the operator.
printf '%s\n' \
  "" \
  "=== Setup complete! ===" \
  "Activate with: source .venv/bin/activate" \
  "Generate data: python -m data.generate_all" \
  "Train all:     bash scripts/train_all.sh"