File size: 939 Bytes
d51113f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
# Start an interactive, GPU-enabled container from the llava_megatron:2601dist
# image, named "llava_megatron_container_feilong1".
#
# - The current directory is bind-mounted at /workspace/LLaVA-OneVision-2, which
#   is also the container's working directory, so run this from the directory
#   you want to appear there. The mount source is quoted so a path containing
#   spaces or glob characters is passed to docker as a single argument.
# - /vlm, /ov2 and /video_vit are mounted at the same paths inside the
#   container; the host's /root/.ssh is mounted at /ov2/xiangan/ssh_configs/.ssh.
# - The container shares the host IPC and network namespaces, runs privileged
#   with IPC_LOCK, has no memlock limit and a 67108864-byte (64 MiB) stack
#   limit, and is removed on exit (--rm).
# - The NCCL_* / CUDA_* variables are exported into the container environment.
#   NOTE(review): the interface name (eth0) and HCA list (mlx5_*) are presumably
#   specific to the target cluster -- verify before reusing elsewhere.
# - On start the container restarts the ssh service, then drops into an
#   interactive bash shell.
docker run -it --gpus all \
    --ipc host --net host --privileged --cap-add IPC_LOCK \
    --ulimit memlock=-1 --ulimit stack=67108864 \
    --rm \
    -v "$(pwd):/workspace/LLaVA-OneVision-2" \
    -v /vlm:/vlm \
    -v /ov2:/ov2 \
    -v /video_vit:/video_vit \
    -v /root/.ssh:/ov2/xiangan/ssh_configs/.ssh \
    -e NCCL_TIMEOUT=1800 \
    -e CUDA_DEVICE_MAX_CONNECTIONS=1 \
    -e NCCL_SOCKET_IFNAME=eth0 \
    -e NCCL_IB_GID_INDEX=3 \
    -e NCCL_IB_DISABLE=0 \
    -e NCCL_IB_HCA="mlx5_2,mlx5_3,mlx5_4,mlx5_5,mlx5_6,mlx5_7,mlx5_8,mlx5_1" \
    -e NCCL_NET_GDR_LEVEL=2 \
    -e NCCL_IB_QPS_PER_CONNECTION=4 \
    -e NCCL_IB_TC=160 \
    -e NCCL_IB_TIMEOUT=22 \
    -e NCCL_CROSS_NIC=1 \
    -e NCCL_MIN_NCHANNELS=8 \
    -e NCCL_MAX_NCHANNELS=16 \
    -w /workspace/LLaVA-OneVision-2 \
    --name "llava_megatron_container_feilong1" \
    llava_megatron:2601dist bash -c "service ssh restart; bash; "


# docker run -it --gpus all \