summary | refs | log | tree | commit | diff
path: root/src
diff options
context:
space:
mode:
author: Yangqing Jia <jiayq84@gmail.com> 2013-10-10 21:48:40 -0700
committer: Yangqing Jia <jiayq84@gmail.com> 2013-10-10 21:48:40 -0700
commit: 0b9b73214b174e34d8f81df22832bd857fee167b (patch)
tree: 73013f8b521261bc78399c11fd762e0a2176e737 /src
parent: 6ecaa904e5ffcbf64f50eafd13326af6faf2a1b1 (diff)
download: caffeonacl-0b9b73214b174e34d8f81df22832bd857fee167b.tar.gz
caffeonacl-0b9b73214b174e34d8f81df22832bd857fee167b.tar.bz2
caffeonacl-0b9b73214b174e34d8f81df22832bd857fee167b.zip
snapshot. prepare to debug
Diffstat (limited to 'src')
-rw-r--r-- src/caffe/optimization/solver.cpp 3
-rw-r--r-- src/programs/imagenet.prototxt 2
-rw-r--r-- src/programs/imagenet_solver.prototxt 6
3 files changed, 7 insertions, 4 deletions
diff --git a/src/caffe/optimization/solver.cpp b/src/caffe/optimization/solver.cpp
index d9ab2c1b..fb382374 100644
--- a/src/caffe/optimization/solver.cpp
+++ b/src/caffe/optimization/solver.cpp
@@ -114,6 +114,9 @@ void SGDSolver<Dtype>::ComputeUpdateValue() {
vector<shared_ptr<Blob<Dtype> > >& net_params = this->net_->params();
// get the learning rate
Dtype rate = GetLearningRate();
+ if (this->param_.display() && this->iter_ % this->param_.display() == 0) {
+ LOG(ERROR) << "Iteration " << this->iter_ << ", lr = " << rate;
+ }
Dtype momentum = this->param_.momentum();
Dtype weight_decay = this->param_.weight_decay();
// LOG(ERROR) << "rate:" << rate << " momentum:" << momentum
diff --git a/src/programs/imagenet.prototxt b/src/programs/imagenet.prototxt
index 65b7432c..d5e9b921 100644
--- a/src/programs/imagenet.prototxt
+++ b/src/programs/imagenet.prototxt
@@ -7,7 +7,7 @@ layers {
batchsize: 96
subtraction: 114
cropsize: 227
- mirror: true
+ mirror: false
}
top: "data"
top: "label"
diff --git a/src/programs/imagenet_solver.prototxt b/src/programs/imagenet_solver.prototxt
index 58b0dfef..6e583638 100644
--- a/src/programs/imagenet_solver.prototxt
+++ b/src/programs/imagenet_solver.prototxt
@@ -1,10 +1,10 @@
-base_lr: 0.02
+base_lr: 0.01
lr_policy: "step"
gamma: 0.1
stepsize: 340000
-display: 100
+display: 20
max_iter: 1200000
momentum: 0.9
weight_decay: 0.0005
-snapshot: 15000
+snapshot: 5000
snapshot_prefix: "alexnet_train"
\ No newline at end of file