Update descriptions and training scripts to the latest version

kevinlin311tw · kevinlin311tw · commit 636ee6e6f78a · 2016-11-10T19:15:28.000+08:00
diff --git a/README.md b/README.md
@@ -61,7 +61,7 @@ Launch MATLAB and run `run_cifar10.m` to perform the evaluation of `precision at
 
 Then, you will get the `mAP` result as follows. 
 
-    >> MAP = 0.899731
+    >> MAP = 0.897165
 
 Moreover, simply run the following commands to generate the `precision at k` curves:
 
@@ -75,20 +75,20 @@ used in the evaluation.
 
 Simply run the following command to train SSDH:
 
+    $ cd ./examples/SSDH
+    $ ./train.sh
 
-    $ ./examples/SSDH/train.sh
 
-
-After 50,000 iterations, the top-1 error is 9.7% on the test set of CIFAR10 dataset:
+After 50,000 iterations, the top-1 error is around 10% on the test set of CIFAR10 dataset:
 ```
-I0107 19:24:32.258903 23945 solver.cpp:326] Iteration 50000, loss = 0.0274982
-I0107 19:24:32.259012 23945 solver.cpp:346] Iteration 50000, Testing net (#0)
-I0107 19:24:36.696506 23945 solver.cpp:414]     Test net output #0: accuracy = 0.903125
-I0107 19:24:36.696543 23945 solver.cpp:414]     Test net output #1: loss: 50%-fire-rate = 1.47562e-06 (* 1 = 1.47562e-06 loss)
-I0107 19:24:36.696552 23945 solver.cpp:414]     Test net output #2: loss: classfication-error = 0.332657 (* 1 = 0.332657 loss)
-I0107 19:24:36.696559 23945 solver.cpp:414]     Test net output #3: loss: forcing-binary = -0.00317774 (* 1 = -0.00317774 loss)
-I0107 19:24:36.696565 23945 solver.cpp:331] Optimization Done.
-I0107 19:24:36.696570 23945 caffe.cpp:214] Optimization Done.
+I1109 20:36:30.962478 25398 solver.cpp:326] Iteration 50000, loss = -0.114461
+I1109 20:36:30.962507 25398 solver.cpp:346] Iteration 50000, Testing net (#0)
+I1109 20:36:45.218626 25398 solver.cpp:414]     Test net output #0: accuracy = 0.8979
+I1109 20:36:45.218660 25398 solver.cpp:414]     Test net output #1: loss: 50%-fire-rate = 0.0005225 (* 1 = 0.0005225 loss)
+I1109 20:36:45.218668 25398 solver.cpp:414]     Test net output #2: loss: classfication-error = 0.368178 (* 1 = 0.368178 loss)
+I1109 20:36:45.218675 25398 solver.cpp:414]     Test net output #3: loss: forcing-binary = -0.114508 (* 1 = -0.114508 loss)
+I1109 20:36:45.218682 25398 solver.cpp:331] Optimization Done.
+I1109 20:36:45.218686 25398 caffe.cpp:214] Optimization Done.
 ```
 
 The training process takes roughly 2~3 hours on a desktop with a Titan X GPU. When it finishes, you will find your model, named `SSDH48_iter_xxxxxx.caffemodel`, under the folder `./examples/SSDH/`
@@ -118,7 +118,7 @@ It should be easy to train the model using another dataset as long as that datas
 
 If `./prepare.sh` fails to download data, you may manually download the resources from:
 
-0. 48-bit SSDH model: [MEGA](https://mega.nz/#!kJ1jwDpJ!X4dVUeWJ7Eqg9L8bhJaGbr9l5-HS3ccudbjIjIbYNpk), [DropBox](https://www.dropbox.com/s/6iqyz1mdhadhzbu/SSDH48_iter_50000.caffemodel?dl=0), [BaiduYun](http://pan.baidu.com/s/1nurCaJR)
+0. 48-bit SSDH model: [MEGA](https://mega.nz/#!9JMBlCaS!zsTl7eZRMdi25gkLWpj_Uv8LfN_2gQ-UF8OBMhio_3s), [DropBox](https://www.dropbox.com/s/6iqyz1mdhadhzbu/SSDH48_iter_50000.caffemodel?dl=0), BaiduYun (coming soon)
 
 0. CIFAR10 dataset (jpg format): [MEGA](https://mega.nz/#!RENV1bhZ!x0uFnAkqUSTJzKr6HzeeNV9mtDjlgQ0x6ZaXfpxbJkw), [DropBox](https://www.dropbox.com/s/f7q3bbgvat2q1u2/cifar10-dataset.zip?dl=0), [BaiduYun](http://pan.baidu.com/s/1pKsSK7h)
 
diff --git a/examples/SSDH/deploy.prototxt b/examples/SSDH/deploy.prototxt
@@ -1,4 +1,4 @@
-name: "CaffeNet"
+name: "SSDH"
 input: "data"
 input_shape {
   dim: 10
@@ -11,10 +11,26 @@ layer {
   type: "Convolution"
   bottom: "data"
   top: "conv1"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   convolution_param {
     num_output: 96
     kernel_size: 11
     stride: 4
+    weight_filler {
+      type: "gaussian"
+      std: 0.01
+    }
+    bias_filler {
+      type: "constant"
+      value: 0
+    }
   }
 }
 layer {
@@ -50,11 +66,27 @@ layer {
   type: "Convolution"
   bottom: "norm1"
   top: "conv2"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   convolution_param {
     num_output: 256
     pad: 2
     kernel_size: 5
     group: 2
+    weight_filler {
+      type: "gaussian"
+      std: 0.01
+    }
+    bias_filler {
+      type: "constant"
+      value: 1
+    }
   }
 }
 layer {
@@ -90,10 +122,26 @@ layer {
   type: "Convolution"
   bottom: "norm2"
   top: "conv3"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   convolution_param {
     num_output: 384
     pad: 1
     kernel_size: 3
+    weight_filler {
+      type: "gaussian"
+      std: 0.01
+    }
+    bias_filler {
+      type: "constant"
+      value: 0
+    }
   }
 }
 layer {
@@ -107,11 +155,27 @@ layer {
   type: "Convolution"
   bottom: "conv3"
   top: "conv4"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   convolution_param {
     num_output: 384
     pad: 1
     kernel_size: 3
     group: 2
+    weight_filler {
+      type: "gaussian"
+      std: 0.01
+    }
+    bias_filler {
+      type: "constant"
+      value: 1
+    }
   }
 }
 layer {
@@ -125,11 +189,27 @@ layer {
   type: "Convolution"
   bottom: "conv4"
   top: "conv5"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   convolution_param {
     num_output: 256
     pad: 1
     kernel_size: 3
     group: 2
+    weight_filler {
+      type: "gaussian"
+      std: 0.01
+    }
+    bias_filler {
+      type: "constant"
+      value: 1
+    }
   }
 }
 layer {
@@ -154,8 +234,24 @@ layer {
   type: "InnerProduct"
   bottom: "pool5"
   top: "fc6"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   inner_product_param {
     num_output: 4096
+    weight_filler {
+      type: "gaussian"
+      std: 0.005
+    }
+    bias_filler {
+      type: "constant"
+      value: 1
+    }
   }
 }
 layer {
@@ -178,8 +274,24 @@ layer {
   type: "InnerProduct"
   bottom: "fc6"
   top: "fc7"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   inner_product_param {
     num_output: 4096
+    weight_filler {
+      type: "gaussian"
+      std: 0.005
+    }
+    bias_filler {
+      type: "constant"
+      value: 1
+    }
   }
 }
 layer {
@@ -189,18 +301,42 @@ layer {
   top: "fc7"
 }
 layer {
-  name: "latent_layer"
+  name: "drop7"
+  type: "Dropout"
+  bottom: "fc7"
+  top: "fc7"
+  dropout_param {
+    dropout_ratio: 0.5
+  }
+}
+layer {
+  name: "latent"
   type: "InnerProduct"
   bottom: "fc7"
-  top: "latent_layer"
+  top: "latent"
+  param {
+    lr_mult: 1
+    decay_mult: 1
+  }
+  param {
+    lr_mult: 2
+    decay_mult: 0
+  }
   inner_product_param {
     num_output: 48
+    weight_filler {
+      type: "gaussian"
+      std: 0.01
+    }
+    bias_filler {
+      type: "constant"
+      value: 0
+    }
   }
 }
 layer {
-  name: "encode_neuron"
+  bottom: "latent"
+  top: "latent_sigmoid"
+  name: "latent_sigmoid"
   type: "Sigmoid"
-  bottom: "latent_layer"
-  top: "encode_neuron"
 }
-
diff --git a/examples/SSDH/solver.prototxt b/examples/SSDH/solver.prototxt
@@ -1,4 +1,4 @@
-net: "./examples/SSDH/train_val.prototxt"
+net: "train_val.prototxt"
 test_iter: 200
 test_interval: 1000
 base_lr: 0.001
@@ -10,6 +10,6 @@ max_iter: 50000
 momentum: 0.9
 weight_decay: 0.0005
 snapshot: 50000
-snapshot_prefix: "./examples/SSDH/SSDH48"
+snapshot_prefix: "SSDH48"
 random_seed: 42
 solver_mode: GPU
diff --git a/examples/SSDH/train.sh b/examples/SSDH/train.sh
@@ -1 +1 @@
-./build/tools/caffe train -solver  ./examples/SSDH/solver.prototxt -weights ./models/bvlc_reference_caffenet/bvlc_reference_caffenet.caffemodel -gpu 0 2>&1 | tee ./examples/SSDH/log.txt
+../../build/tools/caffe train -solver  solver.prototxt -weights ../../models/bvlc_reference_caffenet/bvlc_reference_caffenet.caffemodel -gpu 0 2>&1 | tee log.txt
diff --git a/examples/SSDH/train_val.prototxt b/examples/SSDH/train_val.prototxt
@@ -10,10 +10,10 @@ layer {
   transform_param {
     mirror: true
     crop_size: 227
-    mean_file: "data/ilsvrc12/imagenet_mean.binaryproto"
+    mean_file: "../../data/ilsvrc12/imagenet_mean.binaryproto"
   }
   data_param {
-    source: "data/cifar10/cifar10_train_leveldb"
+    source: "../../data/cifar10/cifar10_train_leveldb"
     batch_size: 32
   }
 }
@@ -28,10 +28,10 @@ layer {
   transform_param {
     mirror: false
     crop_size: 227
-    mean_file: "data/ilsvrc12/imagenet_mean.binaryproto"
+    mean_file: "../../data/ilsvrc12/imagenet_mean.binaryproto"
   }
   data_param {
-    source: "data/cifar10/cifar10_val_leveldb"
+    source: "../../data/cifar10/cifar10_val_leveldb"
     batch_size: 50
   }
 }
diff --git a/models/SSDH/deploy.prototxt b/models/SSDH/deploy.prototxt

Original file line number	Diff line number	Diff line change
`@@ -1 +1 @@`
`1`		`-./build/tools/caffe train -solver ./examples/SSDH/solver.prototxt -weights ./models/bvlc_reference_caffenet/bvlc_reference_caffenet.caffemodel -gpu 0 2>&1 \| tee ./examples/SSDH/log.txt`
	`1`	`+../../build/tools/caffe train -solver solver.prototxt -weights ../../models/bvlc_reference_caffenet/bvlc_reference_caffenet.caffemodel -gpu 0 2>&1 \| tee log.txt`
Original file line number	Diff line number	Diff line change
`@@ -10,10 +10,10 @@ layer {`
`10`	`10`	`transform_param {`
`11`	`11`	`mirror: true`
`12`	`12`	`crop_size: 227`
`13`		`- mean_file: "data/ilsvrc12/imagenet_mean.binaryproto"`
	`13`	`+ mean_file: "../../data/ilsvrc12/imagenet_mean.binaryproto"`
`14`	`14`	`}`
`15`	`15`	`data_param {`
`16`		`- source: "data/cifar10/cifar10_train_leveldb"`
	`16`	`+ source: "../../data/cifar10/cifar10_train_leveldb"`
`17`	`17`	`batch_size: 32`
`18`	`18`	`}`
`19`	`19`	`}`
`@@ -28,10 +28,10 @@ layer {`
`28`	`28`	`transform_param {`
`29`	`29`	`mirror: false`
`30`	`30`	`crop_size: 227`
`31`		`- mean_file: "data/ilsvrc12/imagenet_mean.binaryproto"`
	`31`	`+ mean_file: "../../data/ilsvrc12/imagenet_mean.binaryproto"`
`32`	`32`	`}`
`33`	`33`	`data_param {`
`34`		`- source: "data/cifar10/cifar10_val_leveldb"`
	`34`	`+ source: "../../data/cifar10/cifar10_val_leveldb"`
`35`	`35`	`batch_size: 50`
`36`	`36`	`}`
`37`	`37`	`}`