环境变量说明
==================

.. code-block:: shell

    # 服务化多机配套变量
    export MIES_CONTAINER_IP=127.0.0.1
    export RANK_TABLE_FILE=rank_table_file.json

    # 虚拟内存
    export PYTORCH_NPU_ALLOC_CONF=expandable_segments:True

    # ATB WorkSpace 使能
    export ATB_WORKSPACE_MEM_ALLOC_ALG_TYPE=3
    export ATB_WORKSPACE_MEM_ALLOC_GLOBAL=1

    # 单线程加速权重加载
    export OMP_NUM_THREADS=10

    # 设置显存占比
    export NPU_MEMORY_FRACTION=0.97

    # 设置精度饱和模式,防止fp16引起的上下溢出
    export INF_NAN_MODE_ENABLE=0

    # 关闭确定性计算
    export HCCL_DETERMINISTIC=false
    export HCCL_OP_EXPANSION_MODE="AIV"
    export HCCL_CONNECT_TIMEOUT=7200
    export HCCL_EXEC_TIMEOUT=0

    # G8600 A+X机型单机配置混合并行,需要额外配置HCCL环境变量:
    # export ATB_LLM_HCCL_ENABLE=1
    # export ATB_LLM_COMM_BACKEND="hccl"

    # 使能内存复用
    export ATB_LAYER_INTERNAL_TENSOR_REUSE=1
    export ATB_OPERATION_EXECUTE_ASYNC=1
    export ATB_CONVERT_NCHW_TO_ND=1
    export ATB_WORKSPACE_MEM_ALLOC_GLOBAL=1
    export ATB_WORKSPACE_MEM_ALLOC_ALG_TYPE=3
    export ATB_CONTEXT_WORKSPACE_SIZE=0
    export ATB_LAUNCH_KERNEL_WITH_TILING=1
    export ATB_LLM_ENABLE_AUTO_TRANSPOSE=0
    export MINDIE_ASYNC_SCHEDULING_ENABLE=1

    # CPU亲和性调度
    export CPU_AFFINITY_CONF=1
    export TASK_QUEUE_ENABLE=2
    unset ASCEND_LAUNCH_BLOCKING

    # 日志打屏
    export MINDIE_LLM_LOG_TO_STDOUT=1
    export MINDIE_LOG_TO_STDOUT=1
    export ASCEND_SLOG_PRINT_TO_STDOUT=1