Prepare MLPerf submission (#4270)

* Prepare MLPerf submission

* 28min compile and 3h53m

* red: 30-minute compile and 56 TFLOPS
This commit is contained in:
chenyu 2024-04-24 13:19:31 -04:00 committed by GitHub
parent c606a0ba6f
commit c11bad766d
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
8 changed files with 118 additions and 0 deletions

View File

@ -0,0 +1,11 @@
# Export the run configuration into the environment, then launch
# examples/mlperf/model_train.py relative to the current directory.

# Python module search path and the model to train.
export PYTHONPATH=.
export MODEL=resnet

# Numeric settings (names suggest float type, GPU count and batch sizes;
# confirm against model_train.py).
export \
  DEFAULT_FLOAT=HALF \
  GPUS=6 \
  BS=1536 \
  EVAL_BS=48

# Features explicitly switched off (all set to 0).
export \
  SPLIT_REDUCEOP=0 \
  LAZYCACHE=0 \
  RESET_STEP=0

# BEAM-related knobs (presumably kernel search limits; verify against the
# framework's environment-variable documentation).
export \
  TRAIN_BEAM=3 \
  IGNORE_JIT_FIRST_BEAM=1 \
  BEAM_UOPS_MAX=1500 \
  BEAM_UPCAST_MAX=128 \
  BEAM_LOCAL_MAX=1024 \
  BEAM_MIN_PROGRESS=50

# Run-mode flags for this variant.
export \
  WANDB=1 \
  PARALLEL=0

python3 examples/mlperf/model_train.py

View File

@ -0,0 +1,11 @@
# Export the benchmark configuration into the environment, then launch
# examples/mlperf/model_train.py relative to the current directory.

# Python module search path and the model to train.
export PYTHONPATH=.
export MODEL=resnet

# Numeric settings (names suggest float type, GPU count and batch sizes;
# confirm against model_train.py).
export \
  DEFAULT_FLOAT=HALF \
  GPUS=6 \
  BS=1536 \
  EVAL_BS=48

# Features explicitly switched off (all set to 0).
export \
  SPLIT_REDUCEOP=0 \
  LAZYCACHE=0 \
  RESET_STEP=0

# BEAM-related knobs (presumably kernel search limits; verify against the
# framework's environment-variable documentation).
export \
  TRAIN_BEAM=3 \
  IGNORE_JIT_FIRST_BEAM=1 \
  BEAM_UOPS_MAX=1500 \
  BEAM_UPCAST_MAX=128 \
  BEAM_LOCAL_MAX=1024 \
  BEAM_MIN_PROGRESS=50

# Run-mode flags for this variant (presumably a short benchmark with verbose
# output; confirm how model_train.py interprets BENCHMARK and DEBUG).
export \
  BENCHMARK=10 \
  DEBUG=2

python3 examples/mlperf/model_train.py

View File

@ -0,0 +1,11 @@
# Export the run configuration into the environment, then launch
# examples/mlperf/model_train.py relative to the current directory.

# Python module search path and the model to train.
export PYTHONPATH=.
export MODEL=resnet

# Numeric settings (names suggest float type, GPU count and batch sizes;
# confirm against model_train.py).
export \
  DEFAULT_FLOAT=HALF \
  GPUS=6 \
  BS=1536 \
  EVAL_BS=48

# Features explicitly switched off (all set to 0).
export \
  SPLIT_REDUCEOP=0 \
  LAZYCACHE=0 \
  RESET_STEP=0

# BEAM-related knobs (presumably kernel search limits; verify against the
# framework's environment-variable documentation).
# NOTE(review): another script in this commit that shares TRAIN_BEAM=2 and
# BEAM_UOPS_MAX=1200 sets BEAM_UPCAST_MAX=64 instead of 128; confirm the
# mismatch is intended.
export \
  TRAIN_BEAM=2 \
  IGNORE_JIT_FIRST_BEAM=1 \
  BEAM_UOPS_MAX=1200 \
  BEAM_UPCAST_MAX=128 \
  BEAM_LOCAL_MAX=256 \
  BEAM_MIN_PROGRESS=50

# Run-mode flags for this variant.
export \
  WANDB=1 \
  PARALLEL=0

python3 examples/mlperf/model_train.py

View File

@ -0,0 +1,11 @@
# Export the benchmark configuration into the environment, then launch
# examples/mlperf/model_train.py relative to the current directory.

# Python module search path and the model to train.
export PYTHONPATH=.
export MODEL=resnet

# Numeric settings (names suggest float type, GPU count and batch sizes;
# confirm against model_train.py).
export \
  DEFAULT_FLOAT=HALF \
  GPUS=6 \
  BS=1536 \
  EVAL_BS=48

# Features explicitly switched off (all set to 0).
export \
  SPLIT_REDUCEOP=0 \
  LAZYCACHE=0 \
  RESET_STEP=0

# BEAM-related knobs (presumably kernel search limits; verify against the
# framework's environment-variable documentation).
# NOTE(review): another script in this commit that shares TRAIN_BEAM=2 and
# BEAM_UOPS_MAX=1200 sets BEAM_UPCAST_MAX=128 instead of 64; confirm the
# mismatch is intended.
export \
  TRAIN_BEAM=2 \
  IGNORE_JIT_FIRST_BEAM=1 \
  BEAM_UOPS_MAX=1200 \
  BEAM_UPCAST_MAX=64 \
  BEAM_LOCAL_MAX=256 \
  BEAM_MIN_PROGRESS=50

# Run-mode flags for this variant (presumably a short benchmark with verbose
# output; confirm how model_train.py interprets BENCHMARK and DEBUG).
export \
  BENCHMARK=10 \
  DEBUG=2

python3 examples/mlperf/model_train.py

View File

@ -0,0 +1,37 @@
{
"submitter": "tinycorp",
"division": "closed",
"status": "available",
"system_name": "tinybox green",
"number_of_nodes": "",
"host_processors_per_node": "",
"host_processor_model_name": "",
"host_processor_core_count": "",
"host_processor_vcpu_count": "",
"host_processor_frequency": "",
"host_processor_caches": "",
"host_processor_interconnect": "",
"host_memory_capacity": "",
"host_storage_type": "",
"host_storage_capacity": "",
"host_networking": "",
"host_networking_topology": "",
"host_memory_configuration": "",
"accelerators_per_node": "",
"accelerator_model_name": "",
"accelerator_host_interconnect": "",
"accelerator_frequency": "",
"accelerator_on-chip_memories": "",
"accelerator_memory_configuration": "",
"accelerator_memory_capacity": "",
"accelerator_interconnect": "",
"accelerator_interconnect_topology": "",
"cooling": "air",
"hw_notes": "",
"framework": "tinygrad commit",
"other_software_stack": {
"tqdm": ""
},
"operating_system": "Ubuntu 22.04",
"sw_notes": ""
}

View File

@ -0,0 +1,37 @@
{
"submitter": "tinycorp",
"division": "closed",
"status": "available",
"system_name": "tinybox red",
"number_of_nodes": "",
"host_processors_per_node": "",
"host_processor_model_name": "",
"host_processor_core_count": "",
"host_processor_vcpu_count": "",
"host_processor_frequency": "",
"host_processor_caches": "",
"host_processor_interconnect": "",
"host_memory_capacity": "",
"host_storage_type": "",
"host_storage_capacity": "",
"host_networking": "",
"host_networking_topology": "",
"host_memory_configuration": "",
"accelerators_per_node": "",
"accelerator_model_name": "",
"accelerator_host_interconnect": "",
"accelerator_frequency": "",
"accelerator_on-chip_memories": "",
"accelerator_memory_configuration": "",
"accelerator_memory_capacity": "",
"accelerator_interconnect": "",
"accelerator_interconnect_topology": "",
"cooling": "air",
"hw_notes": "",
"framework": "tinygrad commit",
"other_software_stack": {
"tqdm": ""
},
"operating_system": "Ubuntu 22.04",
"sw_notes": ""
}