# Commands for running ccl_test.py under different devices and launchers.
# NOTE(review): these look like per-platform alternatives (xpu vs. cuda,
# accelerate vs. mpirun) rather than steps that must all succeed on one
# machine -- confirm before adding `set -e` or similar.

# Run accelerate's configuration command before any `accelerate launch`.
accelerate config

# XPU run via `accelerate launch`; ccl_test.py is told `--launch torch`.
# CCL_ZE_IPC_EXCHANGE=sockets is applied to this single command only.
# NOTE(review): presumably selects the socket-based IPC exchange mechanism in
# oneCCL -- confirm against the oneCCL environment variable documentation.
CCL_ZE_IPC_EXCHANGE=sockets \
  accelerate launch --main_process_port=29502 \
  ccl_test.py --device xpu --launch torch

# CUDA run on the same main process port. stderr is merged into stdout and the
# combined stream is both shown and written to nvidia.log by tee.
# No `pipefail` is set in the visible lines, so this pipeline's exit status is
# tee's, not the launcher's.
accelerate launch --main_process_port=29502 \
  ccl_test.py --device cuda 2>&1 \
  | tee nvidia.log

# XPU run started directly by mpirun with 2 processes (`-n 2`); ccl_test.py is
# told `--launch mpi`. The CCL variable again applies to this command only.
# NOTE(review): `-l` presumably labels each output line with its rank (as in
# Hydra-based mpirun) -- confirm for the MPI implementation in use.
CCL_ZE_IPC_EXCHANGE=sockets \
  mpirun -n 2 -l \
  python ccl_test.py --device xpu --launch mpi