| # Start an interactive, auto-removed (--rm) container from llava_megatron:2601dist | |
| # with all GPUs, host IPC and host networking, privileged mode, unlimited locked | |
| # memory and a 64 MiB stack limit. | |
| # Mounts: the current directory at /workspace/LLaVA-OneVision-2 (also the working | |
| # directory), /vlm, /ov2 and /video_vit at the same paths, and the host's | |
| # /root/.ssh at /ov2/xiangan/ssh_configs/.ssh. | |
| # The -e flags pass NCCL / CUDA settings into the container; the values look | |
| # cluster-specific (eth0, mlx5_* HCAs) - NOTE(review): confirm they match the host. | |
| # The bind-mount source is quoted so a working directory containing spaces or | |
| # glob characters is passed to docker as a single -v argument. | |
| # On start the container restarts the ssh service and then drops into bash. | |
| docker run -it --gpus all \ | |
| --ipc host --net host --privileged --cap-add IPC_LOCK \ | |
| --ulimit memlock=-1 --ulimit stack=67108864 \ | |
| --rm \ | |
| -v "$(pwd):/workspace/LLaVA-OneVision-2" \ | |
| -v /vlm:/vlm \ | |
| -v /ov2:/ov2 \ | |
| -v /video_vit:/video_vit \ | |
| -v /root/.ssh:/ov2/xiangan/ssh_configs/.ssh \ | |
| -e NCCL_TIMEOUT=1800 \ | |
| -e CUDA_DEVICE_MAX_CONNECTIONS=1 \ | |
| -e NCCL_SOCKET_IFNAME=eth0 \ | |
| -e NCCL_IB_GID_INDEX=3 \ | |
| -e NCCL_IB_DISABLE=0 \ | |
| -e NCCL_IB_HCA="mlx5_2,mlx5_3,mlx5_4,mlx5_5,mlx5_6,mlx5_7,mlx5_8,mlx5_1" \ | |
| -e NCCL_NET_GDR_LEVEL=2 \ | |
| -e NCCL_IB_QPS_PER_CONNECTION=4 \ | |
| -e NCCL_IB_TC=160 \ | |
| -e NCCL_IB_TIMEOUT=22 \ | |
| -e NCCL_CROSS_NIC=1 \ | |
| -e NCCL_MIN_NCHANNELS=8 \ | |
| -e NCCL_MAX_NCHANNELS=16 \ | |
| -w /workspace/LLaVA-OneVision-2 \ | |
| --name "llava_megatron_container_feilong1" \ | |
| llava_megatron:2601dist bash -c "service ssh restart; bash; " | |
| # docker run -it --gpus all \ | |