Commit 38d5f48

Auto merge of #53 - autumnai:fix/input_reshape, r=hobofan

Fix/input reshape

2 parents d081891 + 3456877
6 files changed: +36 -19 lines

src/layer.rs  (+2 -2)

@@ -133,7 +133,7 @@ impl<B: IBackend + LayerOps<f32> + 'static> Layer<B> {
             LayerType::Softmax => Box::new(Softmax::default()),
             LayerType::ReLU => Box::new(ReLU),
             LayerType::Sigmoid => Box::new(Sigmoid),
-            LayerType::NegativeLogLikelihood => Box::new(NegativeLogLikelihood::default()),
+            LayerType::NegativeLogLikelihood(layer_config) => Box::new(NegativeLogLikelihood::from_config(&layer_config)),
             LayerType::Reshape(layer_config) => Box::new(Reshape::from_config(&layer_config)),
         }
     }
@@ -953,7 +953,7 @@ pub enum LayerType {
     Sigmoid,
     // Loss layers
     /// NegativeLogLikelihood Layer
-    NegativeLogLikelihood,
+    NegativeLogLikelihood(NegativeLogLikelihoodConfig),
     // Utility layers
     /// Reshape Layer
     Reshape(ReshapeConfig),
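
With this change, NegativeLogLikelihood is specified like the other parameterized layers (Reshape, etc.). A minimal sketch of how the new enum variant would be written when describing a network, assuming the module paths and re-exports visible in this commit; the surrounding setup is illustrative, not part of the diff:

// Minimal sketch, assuming the paths re-exported in this commit; the helper
// function is illustrative only.
use leaf::layer::LayerType;
use leaf::layers::NegativeLogLikelihoodConfig;

fn nll_layer_type() -> LayerType {
    // num_classes must now be stated explicitly instead of being inferred
    // from the input shape during the gradient computation.
    LayerType::NegativeLogLikelihood(NegativeLogLikelihoodConfig { num_classes: 10 })
}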

src/layers/common/convolution.rs  (+8 -1)

@@ -3,10 +3,11 @@
 //! Does this convolution with a set of learnable filters, each producing one
 //! feature map in the output tensor.
 use std::rc::Rc;
-use co::{IBackend, DeviceType, SharedTensor};
+use co::prelude::*;
 use conn;
 use layer::*;
 use util::{ArcLock, native_backend, cast_vec_usize_to_i32};
+use weight::FillerType;
 use super::FilterLayer;

 #[derive(Debug, Clone)]
@@ -126,7 +127,13 @@ impl<B: IBackend + conn::Convolution<f32>> ILayer<B> for Convolution<B> {
         let config = backend.new_convolution_config(&inp, &output_data, &mut filter,
             conn::ConvForwardAlgo::Auto, conn::ConvBackwardFilterAlgo::Auto, conn::ConvBackwardDataAlgo::Auto,
             &stride, &padding).unwrap();
+        // resize and fill weights
         weights_data[0].write().unwrap().resize(filter.desc()).unwrap();
+        let filler = FillerType::Glorot {
+            input_size: inp.desc().size(),
+            output_size: output_shape.size(),
+        };
+        filler.fill(&mut weights_data[0].write().unwrap());
         weights_gradient[0].write().unwrap().resize(filter.desc()).unwrap();
         self.convolution_configs = Some(Rc::new(config));
     }
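
The new filler initializes the convolution weights with Glorot (Xavier) scaling instead of leaving the resized tensor uninitialized. The scheme commonly behind such a filler draws each weight from a zero-centered range whose width shrinks as fan-in plus fan-out grows; a standalone sketch of the uniform variant, stated as an assumption about the scheme in general, not as Leaf's actual FillerType::Glorot code:

// Standalone sketch of Glorot (Xavier) uniform initialization; the helper name
// and the deterministic stand-in for a real RNG are illustrative only.
fn glorot_uniform(input_size: usize, output_size: usize, n: usize) -> Vec<f32> {
    // Weights are drawn from [-limit, limit] with limit = sqrt(6 / (fan_in + fan_out)).
    let limit = (6.0 / (input_size + output_size) as f32).sqrt();
    (0..n)
        .map(|i| {
            // cheap deterministic pseudo-random value in [0, 1)
            let t = ((i as f32 * 12.9898).sin() * 43758.5453).rem_euclid(1.0);
            (t * 2.0 - 1.0) * limit
        })
        .collect()
}

fn main() {
    // e.g. a filter feeding 25 input values into 20 * 24 * 24 output values
    let weights = glorot_uniform(25, 20 * 24 * 24, 20 * 25);
    let limit = (6.0f32 / (25 + 20 * 24 * 24) as f32).sqrt();
    assert!(weights.iter().all(|w| w.abs() <= limit));
}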

src/layers/loss/mod.rs  (+1 -1)

@@ -18,6 +18,6 @@ macro_rules! impl_ilayer_loss {
     )
 }

-pub use self::negative_log_likelihood::NegativeLogLikelihood;
+pub use self::negative_log_likelihood::{NegativeLogLikelihood, NegativeLogLikelihoodConfig};

 pub mod negative_log_likelihood;

src/layers/loss/negative_log_likelihood.rs  (+17 -14)

@@ -7,9 +7,18 @@ use util::{ArcLock, native_backend};
 #[derive(Debug, Clone)]
 #[allow(missing_copy_implementations)]
 /// NegativeLogLikelihood Loss Layer
-pub struct NegativeLogLikelihood;
+pub struct NegativeLogLikelihood {
+    num_classes: usize,
+}

 impl NegativeLogLikelihood {
+    /// Create a NegativeLogLikelihood layer from a NegativeLogLikelihoodConfig.
+    pub fn from_config(config: &NegativeLogLikelihoodConfig) -> NegativeLogLikelihood {
+        NegativeLogLikelihood {
+            num_classes: config.num_classes,
+        }
+    }
+
     fn calculate_outer_num(softmax_axis: usize, input_shape: &[usize]) -> usize {
         input_shape.iter().take(softmax_axis + 1).fold(1, |prod, i| prod * i)
     }
@@ -25,14 +34,6 @@ impl NegativeLogLikelihood {
             _ => panic!("NegativeLogLikelihood layer only supports 1D/2D inputs")
         }
     }
-
-    fn num_classes(input_shape: &[usize]) -> usize {
-        match input_shape.len() {
-            1 => input_shape[0],
-            2 => input_shape[1],
-            _ => panic!("NegativeLogLikelihood layer only supports 1D/2D inputs"),
-        }
-    }
 }

 impl<B: IBackend> ILayer<B> for NegativeLogLikelihood {
@@ -97,7 +98,7 @@ impl<B: IBackend> ComputeInputGradient<f32, B> for NegativeLogLikelihood {
                               input_gradients: &mut [&mut SharedTensor<f32>])
         let labels = input_data[1];
         let batch_size = Self::batch_size(input_data[0].desc());
-        let num_classes = Self::num_classes(input_data[0].desc());
+        let num_classes = self.num_classes;

         let native = native_backend();
         let native_labels = labels.get(native.device()).unwrap().as_native().unwrap().as_slice::<f32>();
@@ -114,8 +115,10 @@ impl<B: IBackend> ComputeInputGradient<f32, B> for NegativeLogLikelihood {

 impl<B: IBackend> ComputeParametersGradient<f32, B> for NegativeLogLikelihood { }

-impl ::std::default::Default for NegativeLogLikelihood {
-    fn default() -> NegativeLogLikelihood {
-        NegativeLogLikelihood
-    }
+#[derive(Debug, Clone)]
+#[allow(missing_copy_implementations)]
+/// Specifies configuration parameters for a NegativeLogLikelihood Layer.
+pub struct NegativeLogLikelihoodConfig {
+    /// How many different classes can be classified.
+    pub num_classes: usize,
 }
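
The number of classes was previously inferred from the input shape inside the gradient computation; it now has to be stated up front when the layer is built, and the Default impl is gone. A minimal sketch of the new construction path, assuming the types re-exported by this commit:

// Minimal sketch, assuming the re-exports added in src/layers/loss/mod.rs;
// the helper function is illustrative, not taken from the Leaf sources.
use leaf::layers::{NegativeLogLikelihood, NegativeLogLikelihoodConfig};

fn build_loss_layer() -> NegativeLogLikelihood {
    let config = NegativeLogLikelihoodConfig { num_classes: 10 };
    NegativeLogLikelihood::from_config(&config)
}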

src/layers/mod.rs  (+1 -1)

@@ -64,7 +64,7 @@ pub use self::common::{

 #[allow(unused_import_braces)]
 pub use self::loss::{
-    NegativeLogLikelihood,
+    NegativeLogLikelihood, NegativeLogLikelihoodConfig,
 };

 #[allow(unused_import_braces)]

src/network.rs  (+7 -0)

@@ -337,7 +337,14 @@ impl<B: IBackend + LayerOps<f32> + 'static> Network<B> {
         for layer in &mut self.layers {
             for (blob_index, blob_name) in layer.input_blob_names().to_owned().iter().enumerate() {
                 if blob_name == &self.input_blob_names[i] {
+                    let reshaped_shape = layer.input_blobs_data[blob_index].read().unwrap().desc().clone();
                     layer.input_blobs_data[blob_index] = inp.clone();
+                    // reshape input tensor to the reshaped shape
+                    let old_shape = layer.input_blobs_data[blob_index].read().unwrap().desc().clone();
+                    if old_shape.size() != reshaped_shape.size() {
+                        panic!("The provided input does not have the expected shape");
+                    }
+                    layer.input_blobs_data[blob_index].write().unwrap().reshape(&reshaped_shape).unwrap();
                 }
             }
         }
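
The fix remembers the shape the layer was configured with, swaps in the caller's input blob, checks that the element counts agree, and then views the provided data with the expected shape. A standalone sketch of that size check, using an illustrative helper rather than Leaf's SharedTensor API:

// Standalone sketch of the check this commit enforces: a provided input may use
// a different shape than the layer expects, as long as the element counts match,
// in which case it is reinterpreted with the expected shape.
fn check_and_reshape(expected: &[usize], provided: &[usize]) -> Vec<usize> {
    let expected_size: usize = expected.iter().product();
    let provided_size: usize = provided.iter().product();
    if provided_size != expected_size {
        panic!("The provided input does not have the expected shape");
    }
    expected.to_vec()
}

fn main() {
    // A [1, 28, 28] input can stand in for an expected [1, 784] (both hold 784 values) ...
    assert_eq!(check_and_reshape(&[1, 784], &[1, 28, 28]), vec![1, 784]);
    // ... while something like [1, 100] would panic with the message above.
}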
