From 792f9c468d3e1b8d8eb0ea5069968ad8a4525057 Mon Sep 17 00:00:00 2001 From: cTuning Date: Sun, 18 Feb 2024 19:57:05 +0000 Subject: [PATCH] Updated docs --- .../README.md | 16 +++---- .../app-stable-diffusion-onnx-py/README.md | 16 +++---- .../script/get-generic-python-lib/README.md | 6 +++ .../README.md | 27 ++++++++++- .../script/run-mlperf-inference-app/README.md | 47 ++++++++++--------- 5 files changed, 71 insertions(+), 41 deletions(-) diff --git a/cm-mlops/script/app-image-classification-onnx-py/README.md b/cm-mlops/script/app-image-classification-onnx-py/README.md index 461ca5ca8d..fd04daf86c 100644 --- a/cm-mlops/script/app-image-classification-onnx-py/README.md +++ b/cm-mlops/script/app-image-classification-onnx-py/README.md @@ -36,7 +36,7 @@ See extra [notes](README-extra.md) from the authors and contributors. * CM GitHub repository: *[mlcommons@ck](https://github.com/mlcommons/ck/tree/master/cm-mlops)* * GitHub directory for this script: *[GitHub](https://github.com/mlcommons/ck/tree/master/cm-mlops/script/app-image-classification-onnx-py)* * CM meta description for this script: *[_cm.yaml](_cm.yaml)* -* CM "database" tags to find this script: *app,image-classification,onnx,python* +* CM "database" tags to find this script: *modular,python,app,image-classification,onnx* * Output cached? *False* ___ ### Reuse this script in your project @@ -53,9 +53,9 @@ ___ #### Run this script from command line -1. `cm run script --tags=app,image-classification,onnx,python[,variations] [--input_flags]` +1. `cm run script --tags=modular,python,app,image-classification,onnx[,variations] [--input_flags]` -2. `cmr "app image-classification onnx python[ variations]" [--input_flags]` +2. `cmr "modular python app image-classification onnx[ variations]" [--input_flags]` * `variations` can be seen [here](#variations) @@ -72,7 +72,7 @@ import cmind r = cmind.access({'action':'run' 'automation':'script', - 'tags':'app,image-classification,onnx,python' + 'tags':'modular,python,app,image-classification,onnx' 'out':'con', ... (other input keys for this script) @@ -89,13 +89,13 @@ if r['return']>0: #### Run this script via GUI -```cmr "cm gui" --script="app,image-classification,onnx,python"``` +```cmr "cm gui" --script="modular,python,app,image-classification,onnx"``` -Use this [online GUI](https://cKnowledge.org/cm-gui/?tags=app,image-classification,onnx,python) to generate CM CMD. +Use this [online GUI](https://cKnowledge.org/cm-gui/?tags=modular,python,app,image-classification,onnx) to generate CM CMD. #### Run this script via Docker (beta) -`cm docker script "app image-classification onnx python[ variations]" [--input_flags]` +`cm docker script "modular python app image-classification onnx[ variations]" [--input_flags]` ___ ### Customization @@ -217,7 +217,7 @@ ___ ___ ### Script output -`cmr "app image-classification onnx python[,variations]" [--input_flags] -j` +`cmr "modular python app image-classification onnx[,variations]" [--input_flags] -j` #### New environment keys (filter) * `CM_APP_IMAGE_CLASSIFICATION_ONNX_PY*` diff --git a/cm-mlops/script/app-stable-diffusion-onnx-py/README.md b/cm-mlops/script/app-stable-diffusion-onnx-py/README.md index 8615047b1f..5f820009bb 100644 --- a/cm-mlops/script/app-stable-diffusion-onnx-py/README.md +++ b/cm-mlops/script/app-stable-diffusion-onnx-py/README.md @@ -36,7 +36,7 @@ See extra [notes](README-extra.md) from the authors and contributors. 
* CM GitHub repository: *[mlcommons@ck](https://github.com/mlcommons/ck/tree/master/cm-mlops)* * GitHub directory for this script: *[GitHub](https://github.com/mlcommons/ck/tree/master/cm-mlops/script/app-stable-diffusion-onnx-py)* * CM meta description for this script: *[_cm.yaml](_cm.yaml)* -* CM "database" tags to find this script: *app,stable,diffusion,stable-diffusion,onnx,python* +* CM "database" tags to find this script: *modular,python,app,stable-diffusion,onnx* * Output cached? *False* ___ ### Reuse this script in your project @@ -53,9 +53,9 @@ ___ #### Run this script from command line -1. `cm run script --tags=app,stable,diffusion,stable-diffusion,onnx,python[,variations] [--input_flags]` +1. `cm run script --tags=modular,python,app,stable-diffusion,onnx[,variations] [--input_flags]` -2. `cmr "app stable diffusion stable-diffusion onnx python[ variations]" [--input_flags]` +2. `cmr "modular python app stable-diffusion onnx[ variations]" [--input_flags]` * `variations` can be seen [here](#variations) @@ -72,7 +72,7 @@ import cmind r = cmind.access({'action':'run' 'automation':'script', - 'tags':'app,stable,diffusion,stable-diffusion,onnx,python' + 'tags':'modular,python,app,stable-diffusion,onnx' 'out':'con', ... (other input keys for this script) @@ -89,13 +89,13 @@ if r['return']>0: #### Run this script via GUI -```cmr "cm gui" --script="app,stable,diffusion,stable-diffusion,onnx,python"``` +```cmr "cm gui" --script="modular,python,app,stable-diffusion,onnx"``` -Use this [online GUI](https://cKnowledge.org/cm-gui/?tags=app,stable,diffusion,stable-diffusion,onnx,python) to generate CM CMD. +Use this [online GUI](https://cKnowledge.org/cm-gui/?tags=modular,python,app,stable-diffusion,onnx) to generate CM CMD. #### Run this script via Docker (beta) -`cm docker script "app stable diffusion stable-diffusion onnx python[ variations]" [--input_flags]` +`cm docker script "modular python app stable-diffusion onnx[ variations]" [--input_flags]` ___ ### Customization @@ -208,7 +208,7 @@ ___ ___ ### Script output -`cmr "app stable diffusion stable-diffusion onnx python[,variations]" [--input_flags] -j` +`cmr "modular python app stable-diffusion onnx[,variations]" [--input_flags] -j` #### New environment keys (filter) #### New environment keys auto-detected from customize diff --git a/cm-mlops/script/get-generic-python-lib/README.md b/cm-mlops/script/get-generic-python-lib/README.md index 68a0a0b386..6bca9abd3d 100644 --- a/cm-mlops/script/get-generic-python-lib/README.md +++ b/cm-mlops/script/get-generic-python-lib/README.md @@ -244,6 +244,12 @@ ___ - *CM_GENERIC_PYTHON_PACKAGE_NAME*: `numpy` - Workflow: * `_nvidia-apex` + - Environment variables: + - *CM_GENERIC_PYTHON_PACKAGE_NAME*: `apex` + - *CM_GENERIC_PYTHON_PACKAGE_VARIANT*: `nvidia-apex` + - *CM_GENERIC_PYTHON_PIP_URL*: `git+https://github.com/nvidia/apex@0da3ffb92ee6fbe5336602f0e3989db1cd16f880` + - Workflow: + * `_nvidia-apex-from-src` - Environment variables: - *CM_GENERIC_PYTHON_PACKAGE_NAME*: `apex` - *CM_GENERIC_PYTHON_PACKAGE_VARIANT*: `nvidia-apex` diff --git a/cm-mlops/script/reproduce-mlperf-inference-nvidia/README.md b/cm-mlops/script/reproduce-mlperf-inference-nvidia/README.md index 14a6a79490..e0227b4a37 100644 --- a/cm-mlops/script/reproduce-mlperf-inference-nvidia/README.md +++ b/cm-mlops/script/reproduce-mlperf-inference-nvidia/README.md @@ -480,7 +480,9 @@ ___ - Environment variables: - *CM_MLPERF_NVIDIA_HARNESS_NUM_WARMUPS*: `1` - Workflow: - * `_resnet50,multistream,run_harness` + * 
`_resnet50,multistream,run_harness,num-gpus.1` + - Workflow: + * `_resnet50,multistream,run_harness,num-gpus.2` - Workflow: * `_resnet50,server,run_harness` - Workflow: @@ -503,6 +505,10 @@ ___ - Environment variables: - *CM_MLPERF_NVIDIA_HARNESS_EMBEDDING_WEIGHTS_ON_GPU_PART*: `0.30` - Workflow: + * `_rtx_4090,gptj_,offline,run_harness` + - Workflow: + * `_rtx_4090,gptj_,server,run_harness` + - Workflow: * `_rtx_4090,resnet50,offline,run_harness` - Workflow: * `_rtx_4090,resnet50,server,run_harness` @@ -806,6 +812,7 @@ ___ * `_singlestream` - Environment variables: - *CM_MLPERF_LOADGEN_SCENARIO*: `SingleStream` + - *CUDA_VISIBLE_DEVICES_NOT_USED*: `0` - Workflow: @@ -912,6 +919,22 @@ ___ + * Group "**num-gpus**" +
+ Click here to expand this section. + + * `_num-gpus.#` + - Environment variables: + - *CM_NVIDIA_NUM_GPUS*: `#` + - Workflow: + * **`_num-gpus.1`** (default) + - Environment variables: + - *CM_NVIDIA_NUM_GPUS*: `1` + - Workflow: + +
+ + * Group "**power-mode**"
Click here to expand this section. @@ -1060,7 +1083,7 @@ ___ #### Default variations -`_cuda,_resnet50,_run_harness,_tensorrt` +`_cuda,_num-gpus.1,_resnet50,_run_harness,_tensorrt` #### Script flags mapped to environment
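
The `_num-gpus.#` group added above maps its numeric suffix to `CM_NVIDIA_NUM_GPUS` (with `_num-gpus.1` as the default, now also listed among the default variations). A minimal sketch of selecting it through the CM Python API follows; the base tag list is an assumption inferred from the script directory name and should be checked against the script's `_cm.yaml`.

```python
import cmind

# Hedged sketch: run the NVIDIA harness with two GPUs via the new
# `_num-gpus.2` variation (documented above to set CM_NVIDIA_NUM_GPUS=2).
# NOTE: the base tags below are an assumption, not taken from this README;
# check the script's _cm.yaml for the authoritative tag list.
r = cmind.access({'action': 'run',
                  'automation': 'script',
                  'tags': 'reproduce,mlperf,inference,nvidia,_resnet50,_multistream,_run_harness,_num-gpus.2',
                  'out': 'con'})
if r['return'] > 0:
    print(r['error'])
    exit(1)
```
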
diff --git a/cm-mlops/script/run-mlperf-inference-app/README.md b/cm-mlops/script/run-mlperf-inference-app/README.md index 574bb9a54a..a9b0b27150 100644 --- a/cm-mlops/script/run-mlperf-inference-app/README.md +++ b/cm-mlops/script/run-mlperf-inference-app/README.md @@ -28,13 +28,6 @@ ### About -This is a ready-to-use CM automation recipe that provides a unified and portable interface to the MLPerf inference benchmark -assembled from other [portable CM scripts](https://github.com/mlcommons/ck/blob/master/docs/list_of_scripts.md) -being developed by the open [MLCommons taskforce on automation and reproducibility](https://github.com/mlcommons/ck/blob/master/docs/taskforce.md). - -This automation recipe automatically generates the command line for the [universal MLPerf inference script](../app-mlperf-inference) -to run MLPerf scenarios for a given ML task, model, runtime and device, and prepare and validate submissions. - See extra [notes](README-extra.md) from the authors and contributors. @@ -44,7 +37,7 @@ See extra [notes](README-extra.md) from the authors and contributors. * CM GitHub repository: *[mlcommons@ck](https://github.com/mlcommons/ck/tree/master/cm-mlops)* * GitHub directory for this script: *[GitHub](https://github.com/mlcommons/ck/tree/master/cm-mlops/script/run-mlperf-inference-app)* * CM meta description for this script: *[_cm.yaml](_cm.yaml)* -* CM "database" tags to find this script: *run,mlperf,inference,common* +* CM "database" tags to find this script: *run-mlperf-inference* * Output cached? *False* ___ ### Reuse this script in your project @@ -61,9 +54,9 @@ ___ #### Run this script from command line -1. `cm run script --tags=run,mlperf,inference,common[,variations] [--input_flags]` +1. `cm run script --tags=run-mlperf-inference[,variations] [--input_flags]` -2. `cmr "run mlperf inference common[ variations]" [--input_flags]` +2. `cmr "run-mlperf-inference[ variations]" [--input_flags]` * `variations` can be seen [here](#variations) @@ -80,7 +73,7 @@ import cmind r = cmind.access({'action':'run' 'automation':'script', - 'tags':'run,mlperf,inference,common' + 'tags':'run-mlperf-inference' 'out':'con', ... (other input keys for this script) @@ -97,13 +90,13 @@ if r['return']>0: #### Run this script via GUI -```cmr "cm gui" --script="run,mlperf,inference,common"``` +```cmr "cm gui" --script="run-mlperf-inference"``` -Use this [online GUI](https://cKnowledge.org/cm-gui/?tags=run,mlperf,inference,common) to generate CM CMD. +Use this [online GUI](https://cKnowledge.org/cm-gui/?tags=run-mlperf-inference) to generate CM CMD. 
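
For convenience, here is a minimal self-contained version of the CM Python API snippet for this script shown above (as rendered, that snippet omits the commas after `'action':'run'` and after the `tags` value, and elides the remaining input keys). Input flags documented below can be added as plain dictionary keys.

```python
import cmind

# Minimal, runnable form of the CM Python API call for run-mlperf-inference;
# the input flags documented below can be passed as extra dictionary keys.
r = cmind.access({'action': 'run',
                  'automation': 'script',
                  'tags': 'run-mlperf-inference',
                  'out': 'con'})
if r['return'] > 0:
    print(r['error'])
    exit(1)
```
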
#### Run this script via Docker (beta) -`cm docker script "run mlperf inference common[ variations]" [--input_flags]` +`cm docker script "run-mlperf-inference[ variations]" [--input_flags]` ___ ### Customization @@ -240,8 +233,10 @@ ___ #### Input description +* --**division** MLPerf division {open,closed} (*open*) +* --**category** MLPerf category {edge,datacenter,network} (*edge*) * --**device** MLPerf device {cpu,cuda,rocm,qaic} (*cpu*) -* --**model** MLPerf model {resnet50,retinanet,bert-99,bert-99.9,3d-unet-99,3d-unet-99.9,rnnt,dlrm-v2-99,dlrm-v2-99.9,gptj-99,gptj-99.9,sdxl,llama2-70b-99,llama2-70b-99.9,mobilenet,efficientnet} (*resnet50*) +* --**model** MLPerf model {resnet50,retinanet,bert-99,bert-99.9,3d-unet-99,3d-unet-99.9,rnnt,dlrm-v2-99,dlrm-v2-99.9,gptj-99,gptj-99.9,sdxl,llama2-70b-99,llama2-70b-99.9,mobilenet,efficientnet} (*retinanet*) * --**precision** MLPerf model precision {float32,float16,bfloat16,int8,uint8} * --**implementation** MLPerf implementation {reference,mil,nvidia-original,intel-original,qualcomm,tflite-cpp} (*reference*) * --**backend** MLPerf framework (backend) {onnxruntime,tf,pytorch,deepsparse,tensorrt,glow,tvm-onnx} (*onnxruntime*) @@ -251,31 +246,37 @@ ___ * --**submitter** Submitter name (without space) (*CTuning*) * --**results_dir** Folder path to store results (defaults to the current working directory) * --**submission_dir** Folder path to store MLPerf submission tree -* --**adr.compiler.tags** Compiler for loadgen and any C/C++ part of implementation (*gcc*) +* --**adr.compiler.tags** Compiler for loadgen and any C/C++ part of implementation * --**adr.inference-src-loadgen.env.CM_GIT_URL** Git URL for MLPerf inference sources to build LoadGen (to enable non-reference implementations) * --**adr.inference-src.env.CM_GIT_URL** Git URL for MLPerf inference sources to run benchmarks (to enable non-reference implementations) * --**adr.mlperf-inference-implementation.max_batchsize** Maximum batchsize to be used -* --**adr.mlperf-inference-implementation.num_threads** Number of threads (reference&C++ implementation only) -* --**adr.python.name** Python virtual environment name (optional) (*mlperf*) +* --**adr.mlperf-inference-implementation.num_threads** Number of threads (reference & C++ implementation only) +* --**adr.python.name** Python virtual environment name (optional) * --**adr.python.version** Force Python version (must have all system deps) * --**adr.python.version_min** Minimal Python version (*3.8*) +* --**power** Measure power {yes,no} (*no*) +* --**adr.mlperf-power-client.power_server** MLPerf Power server IP address (*192.168.0.15*) +* --**adr.mlperf-power-client.port** MLPerf Power client port (*4950*) * --**clean** Clean run (*True*) -* --**compliance** Whether to run compliance tests (applicable only for closed division) {yes,no} (*yes*) +* --**compliance** Whether to run compliance tests (applicable only for closed division) {yes,no} (*no*) * --**dashboard_wb_project** W&B dashboard project (*cm-mlperf-dse-testing*) * --**dashboard_wb_user** W&B dashboard user (*cmind*) -* --**hw_name** MLPerf hardware name (from [here](https://github.com/mlcommons/ck/tree/master/cm-mlops/script/get-mlperf-inference-sut-description/hardware)) (*default*) +* --**hw_name** MLPerf hardware name (from [here](https://github.com/mlcommons/ck/tree/master/cm-mlops/script/get-mlperf-inference-sut-description/hardware)) * --**multistream_target_latency** Set MultiStream target latency * --**offline_target_qps** Set LoadGen Offline target QPS -* --**quiet** Quiet 
run (select default values for all questions) (*False*) +* --**quiet** Quiet run (select default values for all questions) (*True*) * --**server_target_qps** Set Server target QPS * --**singlestream_target_latency** Set SingleStream target latency * --**target_latency** Set Target latency * --**target_qps** Set LoadGen target QPS +* --**j** Print results dictionary to console at the end of the run (*True*) +* --**jf** Record results dictionary to file at the end of the run (*mlperf-inference-results*) +* --**time** Print script execution time at the end of the run (*True*) **Above CLI flags can be used in the Python CM API as follows:** ```python -r=cm.access({... , "device":...} +r=cm.access({... , "division":...} ``` #### Script flags mapped to environment @@ -400,7 +401,7 @@ ___ ___ ### Script output -`cmr "run mlperf inference common[,variations]" [--input_flags] -j` +`cmr "run-mlperf-inference[,variations]" [--input_flags] -j` #### New environment keys (filter) #### New environment keys auto-detected from customize
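
To close, a hedged sketch that combines several of the input flags documented above into a single Python API call; every value is taken from the documented choices or defaults and is illustrative only, not a recommended configuration.

```python
import cmind

# Illustrative sketch combining documented input flags for run-mlperf-inference.
# Values are picked from the documented choices (division, category, device,
# model, backend, precision) and the documented defaults (quiet, clean).
r = cmind.access({'action': 'run',
                  'automation': 'script',
                  'tags': 'run-mlperf-inference',
                  'out': 'con',
                  'division': 'open',
                  'category': 'edge',
                  'device': 'cpu',
                  'model': 'resnet50',
                  'backend': 'onnxruntime',
                  'precision': 'float32',
                  'quiet': True,
                  'clean': True})
if r['return'] > 0:
    print(r['error'])
    exit(1)
```
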