appleeji committed on
Commit
1b8d732
·
verified ·
1 Parent(s): dee8162

Upload main.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. main.py +3 -1
main.py CHANGED
@@ -253,9 +253,11 @@ criterion = nn.SmoothL1Loss(reduction="none")
253
 
254
  num_epochs = train_config["num_epochs"]
255
 
 
 
256
  model_engine, optimizer, _, _ = deepspeed.initialize(args=args,
257
  model=model,
258
- model_parameters=model.parameters(),
259
  )
260
 
261
  global_rank = deepspeed.comm.get_rank()
 
253
 
254
  num_epochs = train_config["num_epochs"]
255
 
256
+ # Only pass trainable parameters to DeepSpeed (frozen params cause grad tracking errors)
257
+ trainable_params = [p for p in model.parameters() if p.requires_grad]
258
  model_engine, optimizer, _, _ = deepspeed.initialize(args=args,
259
  model=model,
260
+ model_parameters=trainable_params,
261
  )
262
 
263
  global_rank = deepspeed.comm.get_rank()