# mlcube.yaml
# Descriptive metadata for this configuration.
name: MLCommons DataPerf
description: MLCommons DataPerf integration
authors:
  - name: "MLCommons Best Practices Working Group"

# Platform settings; the accelerator count is set to 0.
platform:
  accelerator_count: 0
# Docker settings: which image to use and how to build it.
docker:
  # Image name.
  image: mlcommons/dataperf:0.0.1
  # Docker build context relative to $MLCUBE_ROOT. Default is `build`.
  build_context: "."
  # Docker file name within docker build context, default is `Dockerfile`.
  build_file: "Dockerfile_mlcube"
# Tasks defined by this configuration. Each task lists its parameters as
# `inputs` and `outputs`; an entry is either a bare path or a mapping with
# an explicit `type` and `default`.
tasks:
  download:
    # Download dataset
    parameters:
      inputs:
        parameters_file:
          type: file
          default: parameters.yaml
      outputs:
        output_path: data/

  select:
    # Run selection algorithm
    parameters:
      inputs:
        config_file:
          type: file
          default: dataperf_speech_config.yaml
        allowed_training_set:
          type: file
          default: data/dataperf_en_data/allowed_training_set.yaml
        train_embeddings_dir: data/dataperf_en_data/train_embeddings/
      outputs:
        outdir: select_output/

  evaluate:
    # Perform evaluation
    parameters:
      inputs:
        eval_embeddings_dir: data/dataperf_en_data/eval_embeddings/
        train_embeddings_dir: data/dataperf_en_data/train_embeddings/
        allowed_training_set:
          type: file
          default: data/dataperf_en_data/allowed_training_set.yaml
        eval_file:
          type: file
          default: data/dataperf_en_data/eval.yaml
        # Default path lies inside `select_output/`, the `outdir` of the
        # `select` task (presumably written by that task; confirm).
        train_file:
          type: file
          default: select_output/en_train.json
        config_file:
          type: file
          default: dataperf_speech_config.yaml
      outputs:
        log_path:
          type: file
          default: log.txt