Respair's picture
Upload folder using huggingface_hub
b386992 verified
task,model,size,system,dtype,num_gpus,seq_len,tp_size,pp_size,cp_size,ep_size,vp_size,mbs,gbs,etp_size,cuda_graphs,use_mcore_fsdp,recompute_layers,activation_offload_layers,recompute_modules,keep_fsdp_fp8_transpose_cache,use_user_buffer_registration,use_sharp
lora,llama3,70b,b200,fp8,8,4096,1,4,1,1,20,1,32,,0,0,0,0,,,,
lora,llama3,70b,b200,bf16,8,4096,1,4,1,1,20,1,32,,0,0,0,0,,,,
lora,llama3,8b,b200,bf16,8,16384,1,1,1,1,1,1,8,,1,0,0,0,,,,
lora,llama3,8b,b200,fp8,8,16384,1,1,1,1,1,1,8,,0,0,0,0,,,,
lora,llama31,405b,b200,fp8,32,2048,4,4,1,1,4,1,32,,0,0,0,0,,,,
lora,llama31,405b,b200,bf16,32,4096,4,4,1,1,4,1,32,,0,0,0,0,,,,
pre_train,gpt3,175b,b200,bf16,128,2048,4,4,1,1,12,2,256,,0,0,0,0,,,,
pre_train,gpt3,175b,b200,fp8,128,2048,4,4,1,1,12,2,256,,0,0,0,0,,,,
pre_train,gpt3,175b,b200,fp8,512,2048,4,4,1,1,6,2,2048,,0,0,0,0,,,,
pre_train,llama3,8b,b200,bf16,8,8192,1,1,1,1,1,2,128,,1,0,0,0,,,,
pre_train,llama3,8b,b200,fp8,8,8192,1,1,1,1,1,2,128,,1,0,0,0,,,,
pre_train,llama3,70b,b200,fp8,64,8192,1,1,1,1,1,1,128,,0,1,10,0,,,1,1
pre_train,llama3,70b,b200,bf16,64,8192,2,4,2,1,5,1,128,,1,0,0,0,,,,
pre_train,llama31,405b,b200,bf16,128,8192,4,8,2,1,8,1,64,,0,0,0,0,,,,
pre_train,llama31,405b,b200,fp8,128,8192,4,8,2,1,8,1,64,,0,0,0,0,,,,
pre_train,mixtral,8x7b,b200,bf16,64,4096,1,1,1,8,1,2,256,,1,0,0,0,,,,
pre_train,mixtral,8x7b,b200,fp8,64,4096,1,1,1,8,1,2,256,,1,0,0,0,,,,
pre_train,mixtral,8x22b,b200,bf16,256,65536,2,4,8,8,14,1,64,1,0,0,0,0,,,,
pre_train,mixtral,8x22b,b200,fp8,256,65536,2,4,8,8,14,1,64,1,0,0,0,0,,,,
pre_train,nemotron4,15b,b200,bf16,64,4096,1,1,1,1,1,2,256,,1,0,0,0,,,,
pre_train,nemotron4,340b,b200,bf16,128,4096,8,4,1,1,12,1,32,,1,0,0,0,,,,
pre_train,nemotron4,340b,b200,fp8,128,4096,8,4,1,1,12,1,32,,1,0,0,0,,,,
pre_train,nemotron4,15b,b200,fp8,64,4096,1,1,1,1,1,2,256,,1,0,0,0,,,,
pre_train,deepseek,v3,b200,bf16,1024,4096,2,16,1,8,1,1,8192,1,0,0,0,0,,,,
pre_train,deepseek,v3,b200,bf16,256,4096,2,16,1,8,1,1,2048,1,0,0,0,0,,,,
pre_train,deepseek,v3,b200,bf16,128,4096,2,16,1,8,1,1,1024,1,0,0,0,0,,,,
pre_train,nemotronh,8b,gb200,fp8,8,8192,1,1,1,1,1,2,128,,1,0,0,0,,,,
pre_train,nemotronh,47b,gb200,fp8,64,8192,2,1,1,1,1,1,192,,1,0,0,0,,,,
pre_train,nemotronh,56b,gb200,fp8,64,8192,4,1,1,1,1,2,192,,1,0,0,0,,,,
pre_train,nemotronh,56b,gb200,fp8,256,8192,4,1,1,1,1,2,768,,1,0,0,0,,,,
sft,llama3,8b,b200,fp8,8,16384,1,1,1,1,1,1,8,,1,0,0,0,,,,
sft,llama3,70b,b200,bf16,32,4096,2,4,1,1,5,1,32,,1,0,0,0,,,,
sft,llama3,70b,b200,fp8,32,4096,2,4,1,1,5,1,32,,1,0,0,0,,,,
sft,llama3,8b,b200,bf16,8,16384,1,1,1,1,1,1,8,,1,0,0,0,,,,
sft,llama4,e128,b200,bf16,256.0,4096.0,8.0,1.0,1.0,32.0,1.0,1.0,32.0,8.0,0,0,0,0,,,,
pre_train,llama4,e16,b200,bf16,64.0,8192.0,1.0,2.0,1.0,8.0,24.0,1.0,1024.0,1.0,0,0,0,0,,,,
pre_train,llama4,e128,b200,bf16,128.0,8192.0,1.0,2.0,1.0,64.0,12.0,1.0,1024.0,1.0,0,0,0,0,,,,
pre_train,vlm_llama4,e16,b200,bf16,64.0,8192.0,1.0,1.0,1.0,16.0,1.0,1.0,1024.0,1.0,0,0,0,0,,,,
pre_train,vlm_llama4,e128,b200,bf16,128.0,8192.0,1.0,2.0,1.0,64.0,12.0,1.0,1024.0,1.0,0,0,0,0,,,,
pre_train,qwen3,30b_a3b,b200,bf16,8.0,4096.0,1.0,1.0,1.0,8.0,1.0,1.0,512.0,1.0,1,0,0,0,,,,
pre_train,qwen3,235b_a22b,b200,bf16,64.0,4096.0,1.0,8.0,1.0,8.0,12.0,1.0,1024.0,1.0,0,0,0,0,,,,