Skip to content

Commit

Permalink
[iluvatar] fix bugs
Browse files Browse the repository at this point in the history
  • Loading branch information
yu.song committed Feb 5, 2025
1 parent 2e754ed commit aac6741
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 4 deletions.
2 changes: 1 addition & 1 deletion training/run_benchmarks/config/cluster_conf.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
'''Cluster configs'''

# Hosts to run the benchmark. Each item is an IP address or a hostname.
HOSTS = ["localhost"]
HOSTS = ["10.1.2.2", "10.1.2.3", "10.1.2.4"]

# Hosts port to run the tensorflow distribution_strategy = 'multi_worker_mirrored'
HOSTS_PORTS = ["2222"]
Expand Down
6 changes: 3 additions & 3 deletions training/run_benchmarks/config/test_conf.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@

# Set accelerator's vendor name, e.g. iluvatar, cambricon, kunlunxin, ascend, mthreads, metax and dcu.
# We will run benchmarks in training/<vendor>
VENDOR = "iluvatar"
VENDOR = "nvidia"

# Accelerator options for docker. TODO FIXME support more accelerators.
# possible value of ACCE_CONTAINER_OPT are:
Expand All @@ -25,7 +25,7 @@
# " --device=/dev/infiniband --device=/dev/dri --device=/dev/mxcd --group-add video"
# dcu:
# "-v /opt/hyhal/:/opt/hyhal/ --device=/dev/kfd --device=/dev/dri/ --group-add video"
ACCE_CONTAINER_OPT = " --privileged --pid=host --ipc=host --cap-add=ALL -v /dev:/dev -v /lib/modules:/lib/modules -v /mnt:/mnt -v /usr/src:/usr/src -v /home:/home "
ACCE_CONTAINER_OPT = " --gpus all"

# XXX_VISIBLE_DEVICE item name in env
# possible value of ACCE_VISIBLE_DEVICE_ENV_NAME are:
Expand All @@ -43,7 +43,7 @@
# The path that flagperf deploy in the cluster.
# Users must set FLAGPERF_PATH to where flagperf deploy
# You can assume the preset "/home/FlagPerf/training" points to Null
FLAGPERF_PATH = "/home/zhiyuan/FlagPerf/training"
FLAGPERF_PATH = "/home/FlagPerf/training"

# Set log path on the host here.
FLAGPERF_LOG_PATH = FLAGPERF_PATH + "/result/"
Expand Down

0 comments on commit aac6741

Please sign in to comment.