AI开发平台MODELARTS-附录:rank_table_file.json文件

时间:2025-02-22 17:22:00

附录:rank_table_file.json文件

rank_table_file.json文件样例如下,需要根据实际情况修改server_count、device_ip、server_id、container_ip参数,每台机器上的rank_table_file.json文件内容需保持一致。该文件会在“步骤三:创建rank_table_file.json”中用到。

  • server_count:节点个数。4机部署为4,2机部署为2。当前样例为4机32卡;2机部署时,server_list中只需保留2机16卡的相关信息,请删除多余的节点信息。
  • device_ip:当前卡的IP地址,每台机器共8张卡。可在每台机器上执行以下命令查询device_ip:
    for i in {0..7};do hccn_tool -i $i -ip -g; done
  • server_id:当前Server节点的IP地址。样例中涉及4台机器,每台机器对应一个server_id。
  • container_ip:容器IP地址,无特殊配置时与server_id保持一致。
{
    "server_count": "4",
    "server_list": [
        {
            "device": [
                {
                    "device_id": "0",
                    "device_ip": "29.82.85.12",
                    "rank_id": "0"
                },
                {
                    "device_id": "1",
                    "device_ip": "29.82.98.67",
                    "rank_id": "1"
                },
                {
                    "device_id": "2",
                    "device_ip": "29.82.133.21",
                    "rank_id": "2"
                },
                {
                    "device_id": "3",
                    "device_ip": "29.82.175.69",
                    "rank_id": "3"
                },
                {
                    "device_id": "4",
                    "device_ip": "29.82.13.154",
                    "rank_id": "4"
                },
                {
                    "device_id": "5",
                    "device_ip": "29.82.140.51",
                    "rank_id": "5"
                },
                {
                    "device_id": "6",
                    "device_ip": "29.82.157.87",
                    "rank_id": "6"
                },
                {
                    "device_id": "7",
                    "device_ip": "29.82.15.225",
                    "rank_id": "7"
                }
            ],
            "server_id": "7.242.110.112",
            "container_ip": "7.242.110.112"
        },
        {
            "device": [
                {
                    "device_id": "0",
                    "device_ip": "29.82.177.28",
                    "rank_id": "8"
                },
                {
                    "device_id": "1",
                    "device_ip": "29.82.41.231",
                    "rank_id": "9"
                },
                {
                    "device_id": "2",
                    "device_ip": "29.82.16.3",
                    "rank_id": "10"
                },
                {
                    "device_id": "3",
                    "device_ip": "29.82.154.20",
                    "rank_id": "11"
                },
                {
                    "device_id": "4",
                    "device_ip": "29.82.56.73",
                    "rank_id": "12"
                },
                {
                    "device_id": "5",
                    "device_ip": "29.82.177.138",
                    "rank_id": "13"
                },
                {
                    "device_id": "6",
                    "device_ip": "29.82.29.230",
                    "rank_id": "14"
                },
                {
                    "device_id": "7",
                    "device_ip": "29.82.1.176",
                    "rank_id": "15"
                }
            ],
            "server_id": "7.242.104.54",
            "container_ip": "7.242.104.54"
        },
        {
            "device": [
                {
                    "device_id": "0",
                    "device_ip": "29.82.107.58",
                    "rank_id": "16"
                },
                {
                    "device_id": "1",
                    "device_ip": "29.82.179.159",
                    "rank_id": "17"
                },
                {
                    "device_id": "2",
                    "device_ip": "29.82.140.144",
                    "rank_id": "18"
                },
                {
                    "device_id": "3",
                    "device_ip": "29.82.6.71",
                    "rank_id": "19"
                },
                {
                    "device_id": "4",
                    "device_ip": "29.82.145.96",
                    "rank_id": "20"
                },
                {
                    "device_id": "5",
                    "device_ip": "29.82.0.173",
                    "rank_id": "21"
                },
                {
                    "device_id": "6",
                    "device_ip": "29.82.122.160",
                    "rank_id": "22"
                },
                {
                    "device_id": "7",
                    "device_ip": "29.82.155.63",
                    "rank_id": "23"
                }
            ],
            "server_id": "7.242.111.217",
            "container_ip": "7.242.111.217"
        },
        {
            "device": [
                {
                    "device_id": "0",
                    "device_ip": "29.82.106.127",
                    "rank_id": "24"
                },
                {
                    "device_id": "1",
                    "device_ip": "29.82.102.14",
                    "rank_id": "25"
                },
                {
                    "device_id": "2",
                    "device_ip": "29.82.145.46",
                    "rank_id": "26"
                },
                {
                    "device_id": "3",
                    "device_ip": "29.82.119.165",
                    "rank_id": "27"
                },
                {
                    "device_id": "4",
                    "device_ip": "29.82.58.169",
                    "rank_id": "28"
                },
                {
                    "device_id": "5",
                    "device_ip": "29.82.9.114",
                    "rank_id": "29"
                },
                {
                    "device_id": "6",
                    "device_ip": "29.82.117.18",
                    "rank_id": "30"
                },
                {
                    "device_id": "7",
                    "device_ip": "29.82.17.169",
                    "rank_id": "31"
                }
            ],
            "server_id": "7.242.108.165",
            "container_ip": "7.242.108.165"
        }
    ],
    "status": "completed",
    "version": "1.0"
}
support.huaweicloud.com/bestpractice-modelarts/modelarts_ds_infer_0004.html