_wandb: value: cli_version: 0.24.2 e: pxth32swik88a7oyr9u8qwmlfzkbrv44: args: - --critic_model=value_kc_critic - --use_wandb - --wandb_project_name=task1_all_kc - --kc_to_que_path=data/XES3G5M/metadata/kc_questions_map.json - --kc_emb_path=data/XES3G5M_embeddings/kc_emb.json - --cluster_to_kc_path=data/XES3G5M/metadata/kc_clusters.json - --cluster_to_que_path=data/XES3G5M/metadata/cluster_to_que_ids_map.json - --pretrained_model_path=data/pretrained_kt_model.ckpt - --dataloader_num_workers=8 - --seed=2 cpu_count: 252 cpu_count_logical: 252 cudaVersion: "12.8" disk: /: total: "1247017926656" used: "1016719900672" email: maxonorris@gmail.com executable: /mnt/pvc/Baselines/ExRec/.venv_task1/bin/python gpu: NVIDIA A100-SXM4-40GB gpu_count: 1 gpu_nvidia: - architecture: Ampere cudaCores: 6912 memoryTotal: "42949672960" name: NVIDIA A100-SXM4-40GB uuid: GPU-f1a4021e-f23e-b122-cea9-c1f45d48e2c0 host: alphamcts-run-models-ppo-default-rkq45-8g8ll memory: total: "962415210496" os: Linux-6.8.0-55-generic-x86_64-with-glibc2.31 program: -m train_test.all_kc_train_ppo python: CPython 3.10.13 root: /mnt/pvc/Baselines/ExRec startedAt: "2026-02-10T16:16:12.977346Z" writerId: pxth32swik88a7oyr9u8qwmlfzkbrv44 m: [] python_version: 3.10.13 t: "1": - 1 - 5 - 53 "2": - 1 - 5 - 53 "3": - 2 - 13 - 15 - 16 "4": 3.10.13 "5": 0.24.2 "12": 0.24.2 "13": linux-x86_64 action_size: value: 768 actor_lr: value: 5e-05 actor_up_projection_size: value: 1200 advantage_normalization: value: false batch_size: value: 512 checkpoint_path: value: ./ppo_saved_models/ab6dc5e4-15f4-4d4c-80ce-7a3122cdd6e1 cluster_to_kc_path: value: data/XES3G5M/metadata/kc_clusters.json cluster_to_que_path: value: data/XES3G5M/metadata/cluster_to_que_ids_map.json critic_hidden_size: value: 300 critic_model: value: value_kc_critic critic_up_projection_size: value: 1200 dataloader_num_workers: value: 8 deterministic_eval: value: false discount_factor: value: 0.99 dual_clip: value: null ent_coef: value: 0.01 eps_clip: value: 0.2 gae_lambda: value: 0.95 hidden_size: value: 300 kc_emb_path: value: data/XES3G5M_embeddings/kc_emb.json kc_emb_size: value: 768 kc_to_que_path: value: data/XES3G5M/metadata/kc_questions_map.json log_dir: value: ./train_ppo_logs log_path: value: ./train_ppo_logs/ab6dc5e4-15f4-4d4c-80ce-7a3122cdd6e1 max_batchsize: value: 512 max_grad_norm: value: null n_epoch: value: 100 pretrained_model_path: value: data/pretrained_kt_model.ckpt recompute_advantage: value: false repeat_per_update: value: 1 reward_normalization: value: false save_dir: value: ./ppo_saved_models seed: value: 2 student_state_size: value: 300 test_batch_size: value: 2048 test_init_seq_size: value: 100 test_last_n_steps: value: 10 test_log_wandb: value: false test_max_steps: value: 10 test_n_episode: value: 2048 test_reward_func: value: step_by_step test_reward_scale: value: 1000 train_batch_size: value: 512 train_folds: value: 2-3-4 train_init_seq_size: value: 100 train_last_n_steps: value: 10 train_max_steps: value: 10 train_max_steps_until_student_change: value: 10 train_n_episode: value: 512 train_replay_buffer_size: value: 12 train_reward_func: value: step_by_step train_reward_scale: value: 1000 use_wandb: value: true value_clip: value: false vf_coef: value: 0.5 wandb_project_name: value: task1_all_kc wandb_run_name: value: ppo