Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
The table of contents is too big for display.
Diff view
Diff view
  •  
  •  
  •  
Empty file modified .jenkins/rules/pylint/pylintrc
100755 → 100644
Empty file.
1 change: 0 additions & 1 deletion akg
Submodule akg deleted from e53ad9
Empty file modified build.sh
100755 → 100644
Empty file.
Empty file modified cmake/gencode.cmake
100755 → 100644
Empty file.
348 changes: 174 additions & 174 deletions config/hccl_multi_machine_multi_rank.json
Original file line number Diff line number Diff line change
@@ -1,175 +1,175 @@
{
"board_id": "0x0000",
"chip_info": "910",
"deploy_mode": "lab",
"group_count": "1",
"group_list": [{
"device_num": "16",
"server_num": "2",
"group_name": "",
"instance_count": "16",
"instance_list": [{
"devices": [{
"device_id": "0",
"device_ip": "[A_device_ip_0]"
}],
"rank_id": "0",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "1",
"device_ip": "[A_device_ip_1]"
}],
"rank_id": "1",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "2",
"device_ip": "[A_device_ip_2]"
}],
"rank_id": "2",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "3",
"device_ip": "[A_device_ip_3]"
}],
"rank_id": "3",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "4",
"device_ip": "[A_device_ip_4]"
}],
"rank_id": "4",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "5",
"device_ip": "[A_device_ip_5]"
}],
"rank_id": "5",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "6",
"device_ip": "[A_device_ip_6]"
}],
"rank_id": "6",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "7",
"device_ip": "[A_device_ip_7]"
}],
"rank_id": "7",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "0",
"device_ip": "[B_device_ip_0]"
}],
"rank_id": "8",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "1",
"device_ip": "[B_device_ip_1]"
}],
"rank_id": "9",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "2",
"device_ip": "[B_device_ip_2]"
}],
"rank_id": "10",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "3",
"device_ip": "[B_device_ip_3]"
}],
"rank_id": "11",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "4",
"device_ip": "[B_device_ip_4]"
}],
"rank_id": "12",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "5",
"device_ip": "[B_device_ip_5]"
}],
"rank_id": "13",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "6",
"device_ip": "[B_device_ip_6]"
}],
"rank_id": "14",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "7",
"device_ip": "[B_device_ip_7]"
}],
"rank_id": "15",
"server_id": "[server_id_B]"
}
]
}],
"para_plane_nic_location": "device",
"para_plane_nic_name": [
"eth0",
"eth1",
"eth2",
"eth3",
"eth4",
"eth5",
"eth6",
"eth7"
],
"para_plane_nic_num": "8",
"status": "completed",
"hccl_config_json_spec": {
"board_id": "board id, current support x0000 or 0x3000",
"chip_info": "chip info, current is 910",
"deploy_mode": "current use lab",
"group_count": "number of groups used",
"group_list": "detailed group information",
"device_num": "number of devices used, the value is the nth power of 2",
"server_num": "number of multiple machines, single machine is 1",
"group_name": "default is hccl_world_group or specified",
"instance_count": "number of instance used, generally equal to device_num",
"instance_list": "detailed instance information",
"device_id": "designated davinic device id to use, values start from 0, but no more than single machine total device num.if server_num greater than 1, the id can be restart from 0",
"device_ip": "ip corresponding to device_id",
"rank_id": "the first device must be 0 and then increase in order",
"server_id": "can be specified as the machine's ip address",
"para_plane_nic_location": "current use device",
"para_plane_nic_name": "network card corresponding to device ip",
"para_plane_nic_num": "number of network cards used",
"status": "current use completed"
}
{
"board_id": "0x0000",
"chip_info": "910",
"deploy_mode": "lab",
"group_count": "1",
"group_list": [{
"device_num": "16",
"server_num": "2",
"group_name": "",
"instance_count": "16",
"instance_list": [{
"devices": [{
"device_id": "0",
"device_ip": "[A_device_ip_0]"
}],
"rank_id": "0",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "1",
"device_ip": "[A_device_ip_1]"
}],
"rank_id": "1",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "2",
"device_ip": "[A_device_ip_2]"
}],
"rank_id": "2",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "3",
"device_ip": "[A_device_ip_3]"
}],
"rank_id": "3",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "4",
"device_ip": "[A_device_ip_4]"
}],
"rank_id": "4",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "5",
"device_ip": "[A_device_ip_5]"
}],
"rank_id": "5",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "6",
"device_ip": "[A_device_ip_6]"
}],
"rank_id": "6",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "7",
"device_ip": "[A_device_ip_7]"
}],
"rank_id": "7",
"server_id": "[server_id_A]"
},
{
"devices": [{
"device_id": "0",
"device_ip": "[B_device_ip_0]"
}],
"rank_id": "8",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "1",
"device_ip": "[B_device_ip_1]"
}],
"rank_id": "9",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "2",
"device_ip": "[B_device_ip_2]"
}],
"rank_id": "10",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "3",
"device_ip": "[B_device_ip_3]"
}],
"rank_id": "11",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "4",
"device_ip": "[B_device_ip_4]"
}],
"rank_id": "12",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "5",
"device_ip": "[B_device_ip_5]"
}],
"rank_id": "13",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "6",
"device_ip": "[B_device_ip_6]"
}],
"rank_id": "14",
"server_id": "[server_id_B]"
},
{
"devices": [{
"device_id": "7",
"device_ip": "[B_device_ip_7]"
}],
"rank_id": "15",
"server_id": "[server_id_B]"
}
]
}],
"para_plane_nic_location": "device",
"para_plane_nic_name": [
"eth0",
"eth1",
"eth2",
"eth3",
"eth4",
"eth5",
"eth6",
"eth7"
],
"para_plane_nic_num": "8",
"status": "completed",

"hccl_config_json_spec": {
"board_id": "board id, current support x0000 or 0x3000",
"chip_info": "chip info, current is 910",
"deploy_mode": "current use lab",
"group_count": "number of groups used",
"group_list": "detailed group information",
"device_num": "number of devices used, the value is the nth power of 2",
"server_num": "number of multiple machines, single machine is 1",
"group_name": "default is hccl_world_group or specified",
"instance_count": "number of instance used, generally equal to device_num",
"instance_list": "detailed instance information",
"device_id": "designated davinic device id to use, values start from 0, but no more than single machine total device num.if server_num greater than 1, the id can be restart from 0",
"device_ip": "ip corresponding to device_id",
"rank_id": "the first device must be 0 and then increase in order",
"server_id": "can be specified as the machine's ip address",
"para_plane_nic_location": "current use device",
"para_plane_nic_name": "network card corresponding to device ip",
"para_plane_nic_num": "number of network cards used",
"status": "current use completed"
}
}
Loading