Skip to content

Commit 6e8eb5e

Browse files
committed
Get cifar10 tests up and running
1 parent 2f39f75 commit 6e8eb5e

File tree

8 files changed

+337
-4
lines changed

8 files changed

+337
-4
lines changed

build.sbt

+7
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,7 @@
1+
import AssemblyKeys._

// sbt-assembly settings for building the fat jar.
assemblySettings

// JNA for calling into the native libccaffe, ScalaTest for the test suite.
libraryDependencies ++= Seq(
  "net.java.dev.jna" % "jna" % "4.2.1",
  "org.scalatest" % "scalatest_2.10" % "2.0" % "test"
)
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
# reduce learning rate after 120 epochs (60000 iters) by a factor of 10
2+
# then another factor of 10 after 10 more epochs (5000 iters)
3+
4+
# The train/test net protocol buffer definition
5+
net: "examples/cifar10/cifar10_full_java_train_test.prototxt"
6+
# test_iter specifies how many forward passes the test should carry out.
7+
# In the case of CIFAR10, we have test batch size 100 and 100 test iterations,
8+
# covering the full 10,000 testing images.
9+
test_iter: 100
10+
# Carry out testing every 1000 training iterations.
11+
test_interval: 1000
12+
# The base learning rate, momentum and the weight decay of the network.
13+
base_lr: 0.001
14+
momentum: 0.9
15+
weight_decay: 0.004
16+
# The learning rate policy
17+
lr_policy: "fixed"
18+
# Display every 200 iterations
19+
display: 200
20+
# The maximum number of iterations
21+
max_iter: 60000
22+
# solver mode: CPU or GPU
23+
solver_mode: GPU
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,210 @@
1+
name: "CIFAR10_full"
2+
layer {
3+
name: "cifardata"
4+
type: "JavaData"
5+
top: "data"
6+
java_data_param {
7+
shape {
8+
dim: 100
9+
dim: 3
10+
dim: 32
11+
dim: 32
12+
}
13+
}
14+
}
15+
layer {
16+
name: "cifarlabel"
17+
type: "JavaData"
18+
top: "label"
19+
java_data_param {
20+
shape {
21+
dim: 100
22+
dim: 1
23+
}
24+
}
25+
}
26+
layer {
27+
name: "conv1"
28+
type: "Convolution"
29+
bottom: "data"
30+
top: "conv1"
31+
param {
32+
lr_mult: 1
33+
}
34+
param {
35+
lr_mult: 2
36+
}
37+
convolution_param {
38+
num_output: 32
39+
pad: 2
40+
kernel_size: 5
41+
stride: 1
42+
weight_filler {
43+
type: "gaussian"
44+
std: 0.0001
45+
}
46+
bias_filler {
47+
type: "constant"
48+
}
49+
}
50+
}
51+
layer {
52+
name: "pool1"
53+
type: "Pooling"
54+
bottom: "conv1"
55+
top: "pool1"
56+
pooling_param {
57+
pool: MAX
58+
kernel_size: 3
59+
stride: 2
60+
}
61+
}
62+
layer {
63+
name: "relu1"
64+
type: "ReLU"
65+
bottom: "pool1"
66+
top: "pool1"
67+
}
68+
layer {
69+
name: "norm1"
70+
type: "LRN"
71+
bottom: "pool1"
72+
top: "norm1"
73+
lrn_param {
74+
local_size: 3
75+
alpha: 5e-05
76+
beta: 0.75
77+
norm_region: WITHIN_CHANNEL
78+
}
79+
}
80+
layer {
81+
name: "conv2"
82+
type: "Convolution"
83+
bottom: "norm1"
84+
top: "conv2"
85+
param {
86+
lr_mult: 1
87+
}
88+
param {
89+
lr_mult: 2
90+
}
91+
convolution_param {
92+
num_output: 32
93+
pad: 2
94+
kernel_size: 5
95+
stride: 1
96+
weight_filler {
97+
type: "gaussian"
98+
std: 0.01
99+
}
100+
bias_filler {
101+
type: "constant"
102+
}
103+
}
104+
}
105+
layer {
106+
name: "relu2"
107+
type: "ReLU"
108+
bottom: "conv2"
109+
top: "conv2"
110+
}
111+
layer {
112+
name: "pool2"
113+
type: "Pooling"
114+
bottom: "conv2"
115+
top: "pool2"
116+
pooling_param {
117+
pool: AVE
118+
kernel_size: 3
119+
stride: 2
120+
}
121+
}
122+
layer {
123+
name: "norm2"
124+
type: "LRN"
125+
bottom: "pool2"
126+
top: "norm2"
127+
lrn_param {
128+
local_size: 3
129+
alpha: 5e-05
130+
beta: 0.75
131+
norm_region: WITHIN_CHANNEL
132+
}
133+
}
134+
layer {
135+
name: "conv3"
136+
type: "Convolution"
137+
bottom: "norm2"
138+
top: "conv3"
139+
convolution_param {
140+
num_output: 64
141+
pad: 2
142+
kernel_size: 5
143+
stride: 1
144+
weight_filler {
145+
type: "gaussian"
146+
std: 0.01
147+
}
148+
bias_filler {
149+
type: "constant"
150+
}
151+
}
152+
}
153+
layer {
154+
name: "relu3"
155+
type: "ReLU"
156+
bottom: "conv3"
157+
top: "conv3"
158+
}
159+
layer {
160+
name: "pool3"
161+
type: "Pooling"
162+
bottom: "conv3"
163+
top: "pool3"
164+
pooling_param {
165+
pool: AVE
166+
kernel_size: 3
167+
stride: 2
168+
}
169+
}
170+
layer {
171+
name: "ip1"
172+
type: "InnerProduct"
173+
bottom: "pool3"
174+
top: "ip1"
175+
param {
176+
lr_mult: 1
177+
decay_mult: 250
178+
}
179+
param {
180+
lr_mult: 2
181+
decay_mult: 0
182+
}
183+
inner_product_param {
184+
num_output: 10
185+
weight_filler {
186+
type: "gaussian"
187+
std: 0.01
188+
}
189+
bias_filler {
190+
type: "constant"
191+
}
192+
}
193+
}
194+
layer {
195+
name: "accuracy"
196+
type: "Accuracy"
197+
bottom: "ip1"
198+
bottom: "label"
199+
top: "accuracy"
200+
include {
201+
phase: TEST
202+
}
203+
}
204+
layer {
205+
name: "loss"
206+
type: "SoftmaxWithLoss"
207+
bottom: "ip1"
208+
bottom: "label"
209+
top: "loss"
210+
}

libccaffe/CMakeLists.txt

+4-3
Original file line numberDiff line numberDiff line change
@@ -56,6 +56,7 @@ include_directories(${CMAKE_CURRENT_SOURCE_DIR}/../caffe/src/)
5656
## The files
5757

5858
file(GLOB Source GLOB "${CMAKE_CURRENT_SOURCE_DIR}/../caffe/src/caffe/*.cpp")
59+
file(GLOB SourceSolvers GLOB "${CMAKE_CURRENT_SOURCE_DIR}/../caffe/src/caffe/solvers/*.cpp")
5960
file(GLOB SourceUtil GLOB "${CMAKE_CURRENT_SOURCE_DIR}/../caffe/src/caffe/util/*.cpp")
6061
file(GLOB SourceGPUUtil GLOB "${CMAKE_CURRENT_SOURCE_DIR}/../caffe/src/caffe/util/*.cu")
6162
file(GLOB SourceLayers GLOB "${CMAKE_CURRENT_SOURCE_DIR}/../caffe/src/caffe/layers/*.cpp")
@@ -65,16 +66,16 @@ set(CUDA_NVCC_FLAGS "-gencode=arch=compute_20,code=\"sm_20,compute_20\" -gencode
6566

6667
# force generation of proto header
6768
add_library(proto STATIC ${CMAKE_CURRENT_SOURCE_DIR}/../caffe/include/caffe/proto/caffe.pb.h ${ProtoSources})
68-
set(Caffe_LINKER_LIBS ${OpenCV_LIBS} proto ${Caffe_LINKER_LIBS})
69+
set(Caffe_LINKER_LIBS proto ${Caffe_LINKER_LIBS})
6970

7071
if(CUDA_FOUND)
71-
cuda_add_library(ccaffe SHARED ${ProtoSources} ${ProtoHeaders} ${Source} ${SourceLayers} ${SourceGPULayers} ${SourceUtil} ${SourceGPUUtil} scalacaffe.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../caffe/include/caffe/proto/caffe.pb.h)
72+
cuda_add_library(ccaffe SHARED ${ProtoSources} ${ProtoHeaders} ${Source} ${SourceSolvers} ${SourceLayers} ${SourceGPULayers} ${SourceUtil} ${SourceGPUUtil} ccaffe.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../caffe/include/caffe/proto/caffe.pb.h)
7273

7374
cuda_add_cublas_to_target(ccaffe)
7475

7576
target_link_libraries(ccaffe ${PROTOBUF_LIBRARY} ${Caffe_LINKER_LIBS} ${CUDA_LIBRARIES} ${CUDA_curand_LIBRARY})
7677
else(CUDA_FOUND)
77-
add_library(ccaffe SHARED ${ProtoSources} ${ProtoHeaders} ${Source} ${SourceLayers} ${SourceUtil} ccaffe.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../caffe/include/caffe/proto/caffe.pb.h)
78+
add_library(ccaffe SHARED ${ProtoSources} ${ProtoHeaders} ${Source} ${SourceSolvers} ${SourceLayers} ${SourceUtil} ccaffe.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../caffe/include/caffe/proto/caffe.pb.h)
7879

7980
target_link_libraries(ccaffe ${PROTOBUF_LIBRARY} ${Caffe_LINKER_LIBS})
8081
endif(CUDA_FOUND)

libccaffe/ccaffe.cpp

+6-1
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,7 @@
66
#include "caffe/common.hpp"
77
#include <string>
88
#include <boost/shared_ptr.hpp>
9+
#include <unistd.h>
910

1011
#include <glog/logging.h>
1112

@@ -26,6 +27,10 @@ void init_logging(const char* log_filename, int log_verbosity) {
2627
google::SetStderrLogging(log_verbosity);
2728
}
2829

30+
// Change the process working directory so that relative paths in prototxt
// files (e.g. net and data definitions referenced by the solver) resolve
// against the given base directory (typically the Caffe root).
void set_basepath(const char* path) {
  // chdir can fail (missing directory, permissions); don't ignore it
  // silently, or later prototxt loads fail with confusing path errors.
  if (chdir(path) != 0) {
    perror("set_basepath: chdir failed");
  }
}
33+
2934
int get_int_size() {
3035
return sizeof(int);
3136
}
@@ -162,7 +167,7 @@ void solver_test(caffenet_state* state, int num_steps) {
162167
state->solver->TestAndStoreResult(0, num_steps, state->test_score);
163168
}
164169

165-
DTYPE solver_get_test_score(caffenet_state* state, int accuracy_idx) {
170+
DTYPE get_test_score(caffenet_state* state, int accuracy_idx) {
166171
assert(0 <= accuracy_idx && accuracy_idx < state->test_score->size());
167172
return (*(state->test_score))[accuracy_idx];
168173
}

libccaffe/ccaffe.h

+2
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,8 @@ extern "C" {
1212
// initialize glog
1313
void init_logging(const char* log_filename, int log_verbosity);
1414

15+
void set_basepath(const char* path);
16+
1517
int get_int_size(); // get number of bytes for native int
1618
int get_dtype_size(); // get number of bytes for DTYPE
1719

project/plugins.sbt

+1
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
addSbtPlugin("com.eed3si9n" % "sbt-assembly" % "0.11.2")
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,84 @@
1+
import org.scalatest._
2+
import org.apache.spark.sparknet.loaders.CifarLoader
3+
import org.apache.spark.sparknet.CaffeLibrary
4+
import com.sun.jna.Pointer
5+
6+
// for this test to work, $SPARKNET_HOME/caffe should be the caffe root directory
7+
// and you need to run $SPARKNET_HOME/caffe/data/cifar10/get_cifar10.sh
8+
class CifarSpec extends FlatSpec {
  "A Cifar net" should "get chance digits right on randomly initialized net" in {
    val sparkNetHome = sys.env("SPARKNET_HOME")
    val loader = new CifarLoader(sparkNetHome + "/caffe/data/cifar10/")

    // The native library must be loaded before touching CaffeLibrary.INSTANCE.
    System.load(sparkNetHome + "/build/libccaffe.so")
    val caffeLib = CaffeLibrary.INSTANCE

    // Make relative paths inside the solver prototxt resolve against the caffe root.
    caffeLib.set_basepath(sparkNetHome + "/caffe/")
    val net = caffeLib.make_solver_from_prototxt(sparkNetHome + "/caffe/examples/cifar10/cifar10_full_java_solver.prototxt")

    val dtypeSize = caffeLib.get_dtype_size()
    val intSize = caffeLib.get_int_size()

    // Builds a callback that fills Caffe's data blob with one batch of images,
    // cycling through `images` across successive invocations.
    def makeImageCallback(images: Array[Array[Float]]): CaffeLibrary.java_callback_t = {
      new CaffeLibrary.java_callback_t() {
        var cursor = 0
        def invoke(data: Pointer, batch_size: Int, num_dims: Int, shape: Pointer) {
          // Total number of floats per image = product of the blob dimensions.
          var imageSize = 1
          for (d <- 0 until num_dims) {
            imageSize *= shape.getInt(d * intSize)
          }
          for (b <- 0 until batch_size) {
            assert(imageSize == images(cursor).length)
            for (k <- 0 until imageSize) {
              data.setFloat((b * imageSize + k) * dtypeSize, images(cursor)(k))
            }
            cursor = (cursor + 1) % images.length
          }
        }
      }
    }

    // Builds a callback that fills Caffe's label blob with one batch of
    // scalar labels, cycling through `labels` across successive invocations.
    def makeLabelCallback(labels: Array[Float]): CaffeLibrary.java_callback_t = {
      new CaffeLibrary.java_callback_t() {
        var cursor = 0
        def invoke(data: Pointer, batch_size: Int, num_dims: Int, shape: Pointer) {
          for (b <- 0 until batch_size) {
            assert(shape.getInt(0) == 1)
            data.setFloat(b * dtypeSize, labels(cursor))
            cursor = (cursor + 1) % labels.length
          }
        }
      }
    }

    // NOTE(review): keep the callbacks referenced in vals for the lifetime of
    // the native calls — presumably required so they are not garbage
    // collected out from under JNA; confirm against JNA callback semantics.
    val loadTrainImageFn = makeImageCallback(loader.trainImages)
    val loadTrainLabelFn = makeLabelCallback(loader.trainLabels)
    caffeLib.set_train_data_callback(net, 0, loadTrainImageFn)
    caffeLib.set_train_data_callback(net, 1, loadTrainLabelFn)

    val loadTestImageFn = makeImageCallback(loader.testImages)
    val loadTestLabelFn = makeLabelCallback(loader.testLabels)
    caffeLib.set_test_data_callback(net, 0, loadTestImageFn)
    caffeLib.set_test_data_callback(net, 1, loadTestLabelFn)

    caffeLib.solver_test(net, 10) // TODO: shouldn't be hard coded

    val numTestScores = caffeLib.num_test_scores(net)
    val testScores = new Array[Float](numTestScores)

    // perform test on random net
    for (i <- 0 until numTestScores) {
      testScores(i) = caffeLib.get_test_score(net, i) * 100 // TODO: this batch size shouldn't be hard coded
    }

    // A randomly initialized 10-class net should score roughly at chance.
    assert(70.0 <= testScores(0) && testScores(0) <= 130.0)
  }
}

0 commit comments

Comments
 (0)