Ctrl+K
- huggingface Upload full checkpoint: global_step_96
- extra_state_world_size_8_rank_0.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - extra_state_world_size_8_rank_1.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - extra_state_world_size_8_rank_2.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - extra_state_world_size_8_rank_3.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - extra_state_world_size_8_rank_4.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - extra_state_world_size_8_rank_5.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - extra_state_world_size_8_rank_6.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - extra_state_world_size_8_rank_7.pt14.6 kB
Detected Pickle imports (7)
- "numpy.ndarray",
- "torch._utils._rebuild_tensor_v2",
- "numpy.dtype",
- "collections.OrderedDict",
- "numpy.core.multiarray._reconstruct",
- "_codecs.encode",
- "torch.ByteStorage"
xetUpload full checkpoint: global_step_96 - 46 Bytes Upload full checkpoint: global_step_96
- 3.69 GB xetUpload full checkpoint: global_step_96
- model_world_size_8_rank_1.pt3.69 GB
Detected Pickle imports (15)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch.distributed.tensor.DTensor",
- "torch._tensor._rebuild_from_type_v2",
- "torch.bfloat16",
- "torch.device",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - model_world_size_8_rank_2.pt3.69 GB
Detected Pickle imports (15)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch.distributed.tensor.DTensor",
- "torch._tensor._rebuild_from_type_v2",
- "torch.bfloat16",
- "torch.device",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - model_world_size_8_rank_3.pt3.69 GB
Detected Pickle imports (15)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch.distributed.tensor.DTensor",
- "torch._tensor._rebuild_from_type_v2",
- "torch.bfloat16",
- "torch.device",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - model_world_size_8_rank_4.pt3.69 GB
Detected Pickle imports (15)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch.distributed.tensor.DTensor",
- "torch._tensor._rebuild_from_type_v2",
- "torch.bfloat16",
- "torch.device",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - model_world_size_8_rank_5.pt3.69 GB
Detected Pickle imports (15)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch.distributed.tensor.DTensor",
- "torch._tensor._rebuild_from_type_v2",
- "torch.bfloat16",
- "torch.device",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - model_world_size_8_rank_6.pt3.69 GB
Detected Pickle imports (15)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch.distributed.tensor.DTensor",
- "torch._tensor._rebuild_from_type_v2",
- "torch.bfloat16",
- "torch.device",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - model_world_size_8_rank_7.pt3.69 GB
Detected Pickle imports (15)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch.distributed.tensor.DTensor",
- "torch._tensor._rebuild_from_type_v2",
- "torch.bfloat16",
- "torch.device",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_0.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_1.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_2.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_3.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_4.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_5.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_6.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96 - optim_world_size_8_rank_7.pt7.39 GB
Detected Pickle imports (16)
- "torch._utils._rebuild_wrapper_subclass",
- "torch.IntStorage",
- "torch.serialization._get_layout",
- "collections.OrderedDict",
- "torch._tensor._rebuild_from_type_v2",
- "torch.distributed.tensor.DTensor",
- "torch.bfloat16",
- "torch.device",
- "torch.FloatStorage",
- "torch.distributed.device_mesh.DeviceMesh",
- "torch.distributed.tensor._dtensor_spec.TensorMeta",
- "torch.Size",
- "torch.BFloat16Storage",
- "torch.distributed.tensor._dtensor_spec.DTensorSpec",
- "torch._utils._rebuild_tensor_v2",
- "torch.distributed.tensor.placement_types.Shard"
xetUpload full checkpoint: global_step_96