supanthadey1's picture
Add BERTose and AFFINose training code release
1d6f391 verified
Raw
History Blame Contribute Delete
1.72 kB
#!/bin/bash
#SBATCH --job-name=emb_deep_dive
#SBATCH --partition=nova
#SBATCH --nodes=1
#SBATCH --ntasks=1
#SBATCH --cpus-per-task=8
#SBATCH --gres=gpu:1
#SBATCH --mem=64G
#SBATCH --time=02:00:00
#SBATCH --output=bert_v6_contrastive/scripts/emb_analysis_%j.out
#SBATCH --error=bert_v6_contrastive/scripts/emb_analysis_%j.err
#SBATCH --mail-type=END,FAIL
echo "=== Embedding Deep Dive ==="
echo "Job: $SLURM_JOB_ID | Node: $(hostname) | $(date)"
nvidia-smi --query-gpu=name --format=csv,noheader
source activate glycan_bert 2>/dev/null || conda activate glycan_bert 2>/dev/null || true
cd /work/ratul1/supantha/glycan-SD-VS/bert_training_v3/v3.1_cluster_training
pip install umap-learn scikit-learn 2>/dev/null || true
mkdir -p bert_v6_contrastive/analysis
echo -e "\n=== Step 1: Extract V6 ==="
python3 bert_v6_contrastive/scripts/extract_embeddings.py \
--checkpoint checkpoints_v6/phase_3_hard_checkpoint.pt --name v6
echo -e "\n=== Step 2: Extract V5 ==="
python3 bert_v6_contrastive/scripts/extract_embeddings.py \
--checkpoint checkpoints_v5_bpe_topo/best_v5_bpe_topo_model.pt --name v5
echo -e "\n=== Step 3: Analyze V6 ==="
python3 bert_v6_contrastive/scripts/analyze_embeddings.py \
--input bert_v6_contrastive/analysis/embeddings_v6.npz --name v6
echo -e "\n=== Step 4: Analyze V5 ==="
python3 bert_v6_contrastive/scripts/analyze_embeddings.py \
--input bert_v6_contrastive/analysis/embeddings_v5.npz --name v5
echo -e "\n=== Step 5: V5 vs V6 Comparison ==="
python3 bert_v6_contrastive/scripts/analyze_embeddings.py \
--input bert_v6_contrastive/analysis/embeddings_v6.npz --name v6 --compare
echo -e "\n=== Results ==="
ls -la bert_v6_contrastive/analysis/
echo "Done! $(date)"