-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy path: gehc_resnet50_1_p3_16xlarge_tensorflow111.json
29 lines (29 loc) · 1.6 KB
/
gehc_resnet50_1_p3_16xlarge_tensorflow111.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
{
"version": "v1.0",
"author": "GE Healthcare (Min Zhang)",
"authorEmail": "[email protected]",
"framework": "tensorflow 1.11 + horovod",
"codeURL": "https://github.com/mzhangatge/imagenet104/blob/89f15c2970552127aef427a8cce02c402681c859/imagenet_train.py",
"model": "Resnet 50 v1",
"hardware": "8*V100 (single p3.16xlarge)",
"costPerHour": 24.48,
"timestamp": "2019-02-25",
"usedBlacklist": true,
"misc": {
"Environment": "NCCL2.3.5+PY3.6.7+TF1.11.0+OPENMPI-3.1.2",
"optimizer": "SGD with Momentum",
"save_checkpoints_steps": 625,
"save_summary_steps": 625,
"sagemaker_submit_directory": "s3://sagemaker-us-east-1-752686809366/imagenet-ml-p3-16xlarge-2019-01-04-22-50-34-217/source/sourcedir.tar.gz",
"mom": 0.9,
"wdecay":0.0002,
"loss_scale":256,
"training_strategy": [
{"epoch": [0, 6], "lr": [1.0, 2.0], "lr_method": "linear", "batch_size": 740, "image_size": [128, 128], "data_dir": "160", "prefix": "train"},
{"epoch": [6, 21], "lr": [2.0, 0.45], "lr_method": "linear", "batch_size": 740, "image_size": [128, 128], "data_dir": "160", "prefix": "train"},
{"epoch": [21, 32], "lr": [0.45, 0.02], "lr_method": "exp", "batch_size": 256, "image_size": [224, 224], "data_dir": "320", "prefix": "train"},
{"epoch": [32, 36], "lr": [0.02, 0.004], "lr_method": "exp", "batch_size": 196, "image_size": [224, 224], "data_dir": "320", "prefix": "train"},
{"epoch": [36, 40], "lr": [0.004, 0.002], "lr_method": "exp", "batch_size": 128, "image_size": [288, 288], "data_dir": "320", "prefix": "train"}
]
}
}