Skip to content
This repository has been archived by the owner on Aug 5, 2022. It is now read-only.

Commit

Permalink
ported FB resnet50 to default_resnet50
Browse files Browse the repository at this point in the history
  • Loading branch information
daisyden committed Mar 9, 2018
1 parent 318da3d commit 5fbc80f
Show file tree
Hide file tree
Showing 10 changed files with 44 additions and 6,719 deletions.
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
net: "models/intel_optimized_models/multinode/default_resnet50_16nodes/train_val.prototxt"
test_iter: 1000
test_interval: 625
test_interval: 563
test_initialization: false
display: 40
base_lr: 0.8
Expand All @@ -9,11 +9,11 @@ stepvalue:18750
stepvalue:37500
stepvalue:50000
gamma: 0.1
max_iter: 62556 # 56300
max_iter: 56300
warmup_iter: 3125 # 1281167 / 2048 * 5 epochs
warmup_start_lr: 0.1
momentum: 0.9
weight_decay: 0.0001
snapshot: 6250
snapshot: 5630
snapshot_prefix: "default_resnet_50_16_nodes"
solver_mode: CPU
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
net: "models/intel_optimized_models/multinode/resnet_50_64_nodes_8k_batch/train_val.prototxt"
net: "models/intel_optimized_models/multinode/default_resnet50_64nodes/train_val.prototxt"
test_iter: 1000
test_interval: 156
test_interval: 140
test_initialization: false
display: 40
base_lr: 3.2
Expand All @@ -14,6 +14,6 @@ warmup_iter: 780 # 1281167 / 8192 * 5 epochs
warmup_start_lr: 0.1
momentum: 0.9
weight_decay: 0.0001
snapshot: 1560
snapshot_prefix: "models/intel_optimized_models/multinode/resnet_50_64_nodes_8k_batch/resnet_50_64_nodes_8k"
snapshot: 1408
snapshot_prefix: "default_resnet_50_64_nodes"
solver_mode: CPU
Original file line number Diff line number Diff line change
Expand Up @@ -783,7 +783,7 @@ layer {
num_output: 128
kernel_size: 1
pad: 0
stride: 1
stride: 2
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -841,7 +841,7 @@ layer {
num_output: 128
kernel_size: 3
pad: 1
stride: 2
stride: 1
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -1569,7 +1569,7 @@ layer {
num_output: 256
kernel_size: 1
pad: 0
stride: 1
stride: 2
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -1627,7 +1627,7 @@ layer {
num_output: 256
kernel_size: 3
pad: 1
stride: 2
stride: 1
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -2727,7 +2727,7 @@ layer {
num_output: 512
kernel_size: 1
pad: 0
stride: 1
stride: 2
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -2785,7 +2785,7 @@ layer {
num_output: 512
kernel_size: 3
pad: 1
stride: 2
stride: 1
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -3302,6 +3302,9 @@ layer {
top: "loss"
name: "prob"
type: "SoftmaxWithLoss"
include {
phase: TRAIN
}
}
layer {
name: "loss3/top-1"
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
# Caffe solver settings for the network defined in
# default_resnet50_8nodes/train_val.prototxt (multinode, CPU).
net: "models/intel_optimized_models/multinode/default_resnet50_8nodes/train_val.prototxt"
# Each test pass runs 1000 test iterations, triggered every 1126 training
# iterations (= max_iter / 100); no test pass is run before training starts.
test_iter: 1000
test_interval: 1126
test_initialization: false
# Log training status every 40 iterations.
display: 40
# "multistep" policy: the learning rate starts at base_lr and is multiplied
# by gamma at each stepvalue (0.4 -> 0.04 -> 0.004 -> 0.0004).
# The stepvalues are 30x, 60x and 80x 1248 iterations.
# NOTE(review): presumably these mark epochs 30/60/80 — confirm against the
# effective global batch size used with this solver.
# NOTE(review): unlike the 16- and 64-node solvers, no warmup_iter /
# warmup_start_lr is set here — confirm this is intentional.
base_lr: 0.4
lr_policy: "multistep"
stepvalue:37440
stepvalue:74880
stepvalue:99840
gamma: 0.1
# Training stops after 112600 iterations.
max_iter: 112600
momentum: 0.9
weight_decay: 0.0001
# Write a snapshot every 11260 iterations (= max_iter / 10). The prefix is a
# bare file name with no directory component.
snapshot: 11260
snapshot_prefix: "default_resnet_50_8_nodes"
solver_mode: CPU
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
name: "ResNet-50"
bn_stats_batch_size: 32
layer {
name: "data"
type: "Data"
Expand All @@ -25,7 +26,7 @@ layer {
}
data_param {
source: "examples/imagenet/ilsvrc12_train_lmdb"
batch_size: 32
batch_size: 128
backend: LMDB
prefetch: 2
shuffle: true
Expand Down Expand Up @@ -782,7 +783,7 @@ layer {
num_output: 128
kernel_size: 1
pad: 0
stride: 1
stride: 2
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -840,7 +841,7 @@ layer {
num_output: 128
kernel_size: 3
pad: 1
stride: 2
stride: 1
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -1568,7 +1569,7 @@ layer {
num_output: 256
kernel_size: 1
pad: 0
stride: 1
stride: 2
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -1626,7 +1627,7 @@ layer {
num_output: 256
kernel_size: 3
pad: 1
stride: 2
stride: 1
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -2726,7 +2727,7 @@ layer {
num_output: 512
kernel_size: 1
pad: 0
stride: 1
stride: 2
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -2784,7 +2785,7 @@ layer {
num_output: 512
kernel_size: 3
pad: 1
stride: 2
stride: 1
bias_term: false
weight_filler {
type: "msra"
Expand Down Expand Up @@ -3301,6 +3302,9 @@ layer {
top: "loss"
name: "prob"
type: "SoftmaxWithLoss"
include {
phase: TRAIN
}
}
layer {
name: "loss3/top-1"
Expand Down

This file was deleted.

Loading

0 comments on commit 5fbc80f

Please sign in to comment.