-
Notifications
You must be signed in to change notification settings - Fork 18.7k
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Improve python wrapper #311
Changes from 12 commits
51f276e
47ec9ac
8da2a32
872ddf3
56ca978
96cd02d
0e5a5cf
9d4324e
ac5e6fa
af0b857
8af33e8
1b23680
a3b307a
a7f6750
459c8c1
025c64e
5d584c2
5102413
37123a5
738c875
50d0b6d
6b85fd0
bf4d726
2fc32d5
111df0e
02ecf1d
8830dc5
42bf2d2
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,6 @@ | ||
// Copyright 2014 BVLC and contributors. | ||
// pycaffe provides a wrapper of the caffe::Net class as well as some | ||
// caffe::Caffe functions so that one could easily call it from Python. | ||
// caffe::Caffe functions so that one could easily call it from python. | ||
// Note that for python, we will simply use float as the data type. | ||
|
||
#define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION | ||
|
@@ -33,7 +33,7 @@ using boost::python::handle; | |
using boost::python::vector_indexing_suite; | ||
|
||
// for convenience, check that input files can be opened, and raise an | ||
// exception that boost will send to Python if not (caffe could still crash | ||
// exception that boost will send to python if not (caffe could still crash | ||
// later if the input files are disturbed before they are actually used, but | ||
// this saves frustration in most cases) | ||
static void CheckFile(const string& filename) { | ||
|
@@ -46,7 +46,7 @@ static void CheckFile(const string& filename) { | |
} | ||
|
||
// wrap shared_ptr<Blob<float> > in a class that we construct in C++ and pass | ||
// to Python | ||
// to python | ||
class CaffeBlob { | ||
public: | ||
CaffeBlob(const shared_ptr<Blob<float> > &blob, const string& name) | ||
|
@@ -70,9 +70,9 @@ class CaffeBlob { | |
}; | ||
|
||
|
||
// we need another wrapper (used as boost::python's HeldType) that receives a | ||
// self PyObject * which we can use as ndarray.base, so that data/diff memory | ||
// is not freed while still being used in Python | ||
// We need another wrapper (used as boost::python's HeldType) that receives a | ||
// self PyObject * which we can use as ndarray.base, so that data/diff memory | ||
// is not freed while still being used in python. | ||
class CaffeBlobWrap : public CaffeBlob { | ||
public: | ||
CaffeBlobWrap(PyObject *p, const CaffeBlob &blob) | ||
|
@@ -142,8 +142,9 @@ struct CaffeNet { | |
} | ||
|
||
CaffeNet(string param_file, string pretrained_param_file) { | ||
Init(param_file); | ||
CheckFile(param_file); | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Is this right? This looks like part of a previous commit being accidentally reverted. There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Thanks for catching that — fixed in a3b307a. |
||
CheckFile(pretrained_param_file); | ||
net_.reset(new Net<float>(param_file)); | ||
net_->CopyTrainedLayersFrom(pretrained_param_file); | ||
} | ||
|
||
|
@@ -158,18 +159,15 @@ struct CaffeNet { | |
|
||
virtual ~CaffeNet() {} | ||
|
||
// this function is mostly redundant with the one below, but should go away | ||
// with new pycaffe | ||
// Check that an array is acceptable for blob assignment | ||
// as described in the preface to Forward(). | ||
inline void check_array_against_blob( | ||
PyArrayObject* arr, Blob<float>* blob) { | ||
CHECK(PyArray_FLAGS(arr) & NPY_ARRAY_C_CONTIGUOUS); | ||
CHECK_EQ(PyArray_NDIM(arr), 4); | ||
CHECK_EQ(PyArray_ITEMSIZE(arr), 4); | ||
npy_intp* dims = PyArray_DIMS(arr); | ||
CHECK_EQ(dims[0], blob->num()); | ||
CHECK_EQ(dims[1], blob->channels()); | ||
CHECK_EQ(dims[2], blob->height()); | ||
CHECK_EQ(dims[3], blob->width()); | ||
PyArrayObject* arr, Blob<float>* blob, string name) { | ||
check_contiguous_array(arr, name, blob->channels(), blob->height(), | ||
blob->width()); | ||
if (PyArray_DIMS(arr)[0] != blob->num()) { | ||
throw std::runtime_error(name + " has wrong batch size"); | ||
} | ||
} | ||
|
||
// generate Python exceptions for badly shaped or discontiguous arrays | ||
|
@@ -197,8 +195,7 @@ struct CaffeNet { | |
|
||
// The actual forward function. It takes in a python list of numpy arrays as | ||
// input and a python list of numpy arrays as output. The input and output | ||
// should all have correct shapes, are single-precision, and | ||
// c contiguous. | ||
// should all have correct shapes, be single-precision, and be C-contiguous. | ||
void Forward(list bottom, list top) { | ||
vector<Blob<float>*>& input_blobs = net_->input_blobs(); | ||
CHECK_EQ(len(bottom), input_blobs.size()); | ||
|
@@ -207,7 +204,8 @@ struct CaffeNet { | |
for (int i = 0; i < input_blobs.size(); ++i) { | ||
object elem = bottom[i]; | ||
PyArrayObject* arr = reinterpret_cast<PyArrayObject*>(elem.ptr()); | ||
check_array_against_blob(arr, input_blobs[i]); | ||
check_array_against_blob(arr, input_blobs[i], | ||
net_->blob_names()[net_->input_blob_indices()[i]]); | ||
switch (Caffe::mode()) { | ||
case Caffe::CPU: | ||
memcpy(input_blobs[i]->mutable_cpu_data(), PyArray_DATA(arr), | ||
|
@@ -227,7 +225,8 @@ struct CaffeNet { | |
for (int i = 0; i < output_blobs.size(); ++i) { | ||
object elem = top[i]; | ||
PyArrayObject* arr = reinterpret_cast<PyArrayObject*>(elem.ptr()); | ||
check_array_against_blob(arr, output_blobs[i]); | ||
check_array_against_blob(arr, output_blobs[i], | ||
net_->blob_names()[net_->input_blob_indices()[i]]); | ||
switch (Caffe::mode()) { | ||
case Caffe::CPU: | ||
memcpy(PyArray_DATA(arr), output_blobs[i]->cpu_data(), | ||
|
@@ -252,7 +251,8 @@ struct CaffeNet { | |
for (int i = 0; i < output_blobs.size(); ++i) { | ||
object elem = top_diff[i]; | ||
PyArrayObject* arr = reinterpret_cast<PyArrayObject*>(elem.ptr()); | ||
check_array_against_blob(arr, output_blobs[i]); | ||
check_array_against_blob(arr, output_blobs[i], | ||
net_->blob_names()[net_->input_blob_indices()[i]]); | ||
switch (Caffe::mode()) { | ||
case Caffe::CPU: | ||
memcpy(output_blobs[i]->mutable_cpu_diff(), PyArray_DATA(arr), | ||
|
@@ -272,7 +272,8 @@ struct CaffeNet { | |
for (int i = 0; i < input_blobs.size(); ++i) { | ||
object elem = bottom_diff[i]; | ||
PyArrayObject* arr = reinterpret_cast<PyArrayObject*>(elem.ptr()); | ||
check_array_against_blob(arr, input_blobs[i]); | ||
check_array_against_blob(arr, input_blobs[i], | ||
net_->blob_names()[net_->input_blob_indices()[i]]); | ||
switch (Caffe::mode()) { | ||
case Caffe::CPU: | ||
memcpy(PyArray_DATA(arr), input_blobs[i]->cpu_diff(), | ||
|
@@ -292,6 +293,10 @@ struct CaffeNet { | |
net_->ForwardPrefilled(); | ||
} | ||
|
||
void BackwardPrefilled() { | ||
net_->Backward(); | ||
} | ||
|
||
void set_input_arrays(object data_obj, object labels_obj) { | ||
// check that this network has an input MemoryDataLayer | ||
shared_ptr<MemoryDataLayer<float> > md_layer = | ||
|
@@ -350,6 +355,24 @@ struct CaffeNet { | |
return result; | ||
} | ||
|
||
list inputs() { | ||
list input_blob_names; | ||
for (vector<int>::iterator it = net_->input_blob_indices().begin(); | ||
it != net_->input_blob_indices().end(); ++it) { | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. I've been wondering why we don't use iterators since #112 (comment). Every other caffe loop over a vector uses an index. Does anyone know a good reason for this? In either case, it would be nice to be consistent throughout. There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more.
|
||
input_blob_names.append(net_->blob_names()[*it]); | ||
} | ||
return input_blob_names; | ||
} | ||
|
||
list outputs() { | ||
list output_blob_names; | ||
for (vector<int>::iterator it = net_->output_blob_indices().begin(); | ||
it != net_->output_blob_indices().end(); ++it) { | ||
output_blob_names.append(net_->blob_names()[*it]); | ||
} | ||
return output_blob_names; | ||
} | ||
|
||
// The pointer to the internal caffe::Net instant. | ||
shared_ptr<Net<float> > net_; | ||
// if taking input from an ndarray, we need to hold references | ||
|
@@ -392,13 +415,16 @@ BOOST_PYTHON_MODULE(_caffe) { | |
.def("Forward", &CaffeNet::Forward) | ||
.def("ForwardPrefilled", &CaffeNet::ForwardPrefilled) | ||
.def("Backward", &CaffeNet::Backward) | ||
.def("BackwardPrefilled", &CaffeNet::BackwardPrefilled) | ||
.def("set_mode_cpu", &CaffeNet::set_mode_cpu) | ||
.def("set_mode_gpu", &CaffeNet::set_mode_gpu) | ||
.def("set_phase_train", &CaffeNet::set_phase_train) | ||
.def("set_phase_test", &CaffeNet::set_phase_test) | ||
.def("set_device", &CaffeNet::set_device) | ||
.add_property("_blobs", &CaffeNet::blobs) | ||
.add_property("layers", &CaffeNet::layers) | ||
.add_property("inputs", &CaffeNet::inputs) | ||
.add_property("outputs", &CaffeNet::outputs) | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Extra spaces here? |
||
.def("_set_input_arrays", &CaffeNet::set_input_arrays); | ||
|
||
boost::python::class_<CaffeBlob, CaffeBlobWrap>( | ||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Really? See python.org, Python wiki page, etc. Just sayin'.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Ok, fair enough. Capital is fine and used throughout now.