Upload main.py with huggingface_hub
Browse files
main.py
CHANGED
|
@@ -253,9 +253,11 @@ criterion = nn.SmoothL1Loss(reduction="none")
|
|
| 253 |
|
| 254 |
num_epochs = train_config["num_epochs"]
|
| 255 |
|
|
|
|
|
|
|
| 256 |
model_engine, optimizer, _, _ = deepspeed.initialize(args=args,
|
| 257 |
model=model,
|
| 258 |
-
model_parameters=model.parameters(),
|
| 259 |
)
|
| 260 |
|
| 261 |
global_rank = deepspeed.comm.get_rank()
|
|
|
|
| 253 |
|
| 254 |
num_epochs = train_config["num_epochs"]
|
| 255 |
|
| 256 |
+
# Only pass trainable parameters to DeepSpeed (frozen params cause grad tracking errors)
|
| 257 |
+
trainable_params = [p for p in model.parameters() if p.requires_grad]
|
| 258 |
model_engine, optimizer, _, _ = deepspeed.initialize(args=args,
|
| 259 |
model=model,
|
| 260 |
+
model_parameters=trainable_params,
|
| 261 |
)
|
| 262 |
|
| 263 |
global_rank = deepspeed.comm.get_rank()
|