diff --git a/CHANGELIST.md b/CHANGELIST.md
index 0940d3a75..47ff0df0c 100644
--- a/CHANGELIST.md
+++ b/CHANGELIST.md
@@ -19,6 +19,8 @@ v0.4.0
 
 ### Unstable changes
 
+- Added `matrix.op.repmat` function.
+- Added `matrix.ext.iterate` iterator.
 - Added statistical distributions in `stats.dist`.
 - Added `matrix.ext.convolution` and `matrix.ext.real_fftwh`.
 - Added `Matrix<T>::convolution` method. It is in experimental stage, please,
@@ -28,6 +30,9 @@ v0.4.0
 
 ### API Changes
 
+- Removed major order differentiation in `matrix`.
+- `tokens.matrix` **automatically** wraps `matrix` instances, from Lua to C++.
+- `matrix` **automatically** unwraps `tokens.matrix` instances, from C++ to Lua.
 - Added new methods to `AprilMath::Limits` class.
 - Added `metrics.roc` for ROC computation.
 - Added new `class` behavior taken from
@@ -62,6 +67,7 @@ v0.4.0
 
 ### C/C++
 
+- Added `LuaTable` class to allow access of Lua tables from C++ code.
 - Added TAR support in C/C++, allowing to use streams as the standard I/O
   objects in APRIL-ANN.
 - Added `basics` namespace which stores almost all C/C++ code in `basics`
diff --git a/EXAMPLES/xor.lua b/EXAMPLES/xor.lua
index 57788280d..3cefe8dd1 100644
--- a/EXAMPLES/xor.lua
+++ b/EXAMPLES/xor.lua
@@ -11,9 +11,7 @@ trainer:randomize_weights{
   sup        =  0.1 }
 
 trainer:set_option("learning_rate", 8.0)
-trainer:set_option("momentum",      0.5)
-trainer:set_option("weight_decay",  1e-05)
-trainer:set_layerwise_option("b.*", "weight_decay", 0.0)
+trainer:set_option("momentum",      0.8)
 
 local m_xor = matrix.fromString[[
     4 3
diff --git a/packages/ann/ann/binding/bind_ann_base.lua.cc b/packages/ann/ann/binding/bind_ann_base.lua.cc
index 660b0437a..8236e999b 100644
--- a/packages/ann/ann/binding/bind_ann_base.lua.cc
+++ b/packages/ann/ann/binding/bind_ann_base.lua.cc
@@ -20,54 +20,80 @@
  *
  */
 //BIND_HEADER_C
+#include <typeinfo>
+
 #include "bind_function_interface.h"
 #include "bind_matrix.h"
 #include "bind_sparse_matrix.h"
 #include "bind_mtrand.h"
 #include "bind_tokens.h"
+#include "bind_util.h"
 #include "table_of_token_codes.h"
 
 using namespace AprilUtils;
 using namespace Basics;
 
 namespace ANN {
-  static bool rewrapToAtLeastDim2(Token *&tk) {
+  static bool rewrapToAtLeastDim2(AprilUtils::SharedPtr<Token> &tk) {
     if (tk->getTokenCode() == table_of_token_codes::token_matrix) {
       Basics::TokenMatrixFloat *tk_mat = tk->convertTo<Basics::TokenMatrixFloat*>();
       Basics::MatrixFloat *m = tk_mat->getMatrix();
       if (m->getNumDim() == 1) {
         int dims[2] = { 1, m->getDimSize(0) };
-        Basics::Token *new_tk = new Basics::TokenMatrixFloat(m->rewrap(dims, 2));
-        IncRef(new_tk);
-        DecRef(tk);
-        tk = new_tk;
+        tk.reset( new Basics::TokenMatrixFloat(m->rewrap(dims, 2)) );
         return true;
       }
     }
     return false;
   }
 
-  static void unwrapToDim1(Token *&tk) {
+  static void unwrapToDim1(AprilUtils::SharedPtr<Token> &tk) {
     if (tk->getTokenCode() == table_of_token_codes::token_matrix) {
       Basics::TokenMatrixFloat *tk_mat = tk->convertTo<Basics::TokenMatrixFloat*>();
       Basics::MatrixFloat *m = tk_mat->getMatrix();
       int dim = m->getDimSize(1);
       Basics::MatrixFloat *new_m = m->rewrap(&dim, 1);
-      Basics::Token *tk = new Basics::TokenMatrixFloat(new_m);
+      tk.reset( new Basics::TokenMatrixFloat(new_m) );
     }
   }
 
-  template<typename Value, typename PushFunction>
-  void pushHashTableInLuaStack(lua_State *L,
-                               AprilUtils::hash<AprilUtils::string,Value> &hashobject,
-                               PushFunction push_function) {
-    lua_createtable(L, 0, hashobject.size());
-    for (typename AprilUtils::hash<AprilUtils::string,Value>::iterator it = hashobject.begin();
-         it != hashobject.end(); ++it) {
-      push_function(L, it->second);
-      lua_setfield(L, -2, it->first.c_str());
-    }
+}
+
+void lua_pushAuxANNComponent(lua_State *L, ANNComponent *value) { // dispatches value to the most specific lua_push* binding
+  if (typeid(*value) == typeid(StackANNComponent)) { // exact dynamic type match. NOTE(review): typeid(*value) throws std::bad_typeid when value is NULL -- confirm callers never pass NULL
+    lua_pushStackANNComponent(L, (StackANNComponent*)value);
+  }
+  else if (typeid(*value) == typeid(JoinANNComponent)) { // exact dynamic type match as well
+    lua_pushJoinANNComponent(L, (JoinANNComponent*)value);
+  }
+  else if (dynamic_cast<ActivationFunctionANNComponent*>(value)) { // dynamic_cast: also accepts classes derived from it
+    lua_pushActivationFunctionANNComponent(L, (ActivationFunctionANNComponent*)value);
+  }
+  else if (dynamic_cast<StochasticANNComponent*>(value)) { // dynamic_cast: also accepts classes derived from it
+    lua_pushStochasticANNComponent(L, (StochasticANNComponent*)value);
+  }
+  else { // none of the above: use the generic ANNComponent binding
+    lua_pushANNComponent(L, value);
+  }
+}
+
+namespace AprilUtils {
+
+  template<> ANN::ANNComponent *LuaTable::
+  convertTo<ANN::ANNComponent *>(lua_State *L, int idx) {
+    return lua_toANNComponent(L, idx);
+  }
+  
+  template<> void LuaTable::
+  pushInto<ANN::ANNComponent *>(lua_State *L, ANN::ANNComponent *value) {
+    lua_pushAuxANNComponent(L, value);
   }
+
+  template<> bool LuaTable::
+  checkType<ANN::ANNComponent *>(lua_State *L, int idx) {
+    return lua_isANNComponent(L, idx);
+  }
+  
 }
 
 //BIND_END
@@ -101,6 +127,7 @@ namespace ANN {
 #include "relu_actf_component.h"
 #include "hardtanh_actf_component.h"
 #include "sin_actf_component.h"
+#include "log_actf_component.h"
 #include "linear_actf_component.h"
 #include "gaussian_noise_component.h"
 #include "salt_and_pepper_component.h"
@@ -113,6 +140,8 @@ namespace ANN {
 using namespace Functions;
 using namespace ANN;
 
+void lua_pushAuxANNComponent(lua_State *L, ANNComponent *value);
+
 //BIND_END
 
 /////////////////////////////////////////////////////
@@ -138,10 +167,11 @@ using namespace ANN;
 				       input_size);
   //
   Basics::MatrixFloat *obj;
-  if (w && w->getMajorOrder() == CblasColMajor) obj = w->clone();
+  if (w) {
+    obj = w->clone();
+  }
   else {
     obj = Connections::build(input_size, output_size);
-    if (w) Connections::loadWeights(obj, w, first_pos, column_size);
   }
   LUABIND_RETURN(MatrixFloat, obj);
 }
@@ -351,48 +381,48 @@ using namespace ANN;
 
 //BIND_METHOD ANNComponent get_input
 {
-  Basics::Token *aux = obj->getInput();
-  if (aux == 0) {
+  AprilUtils::SharedPtr<Basics::Token> aux( obj->getInput() );
+  if (aux.empty()) {
     LUABIND_RETURN(Token, new TokenNull());
   }
   else {
-    LUABIND_RETURN(Token, aux);
+    LUABIND_RETURN(AuxToken, aux);
   }
 }
 //BIND_END
 
 //BIND_METHOD ANNComponent get_output
 {
-  Basics::Token *aux = obj->getOutput();
-  if (aux == 0) {
+  AprilUtils::SharedPtr<Basics::Token> aux( obj->getOutput() );
+  if (aux.empty()) {
     LUABIND_RETURN(Token, new TokenNull());
   }
   else {
-    LUABIND_RETURN(Token, aux);
+    LUABIND_RETURN(AuxToken, aux);
   }
 }
 //BIND_END
 
 //BIND_METHOD ANNComponent get_error_input
 {
-  Basics::Token *aux = obj->getErrorInput();
+  AprilUtils::SharedPtr<Basics::Token> aux( obj->getErrorInput() );
   if (aux == 0) {
     LUABIND_RETURN(Token, new TokenNull());
   }
   else {
-    LUABIND_RETURN(Token, aux);
+    LUABIND_RETURN(AuxToken, aux);
   }
 }
 //BIND_END
 
 //BIND_METHOD ANNComponent get_error_output
 {
-  Basics::Token *aux = obj->getErrorOutput();
+  AprilUtils::SharedPtr<Basics::Token> aux( obj->getErrorOutput() );
   if (aux == 0) {
     LUABIND_RETURN(Token, new TokenNull());
   }
   else {
-    LUABIND_RETURN(Token, aux);
+    LUABIND_RETURN(AuxToken, aux);
   }
 }
 //BIND_END
@@ -418,35 +448,32 @@ using namespace ANN;
 
 //BIND_METHOD ANNComponent forward
 {
-  Basics::Token *input;
+  AprilUtils::SharedPtr<Basics::Token> input;
   bool during_training;
   LUABIND_CHECK_ARGN(>=, 1);
   LUABIND_CHECK_ARGN(<=, 2);
   LUABIND_GET_PARAMETER(1, AuxToken, input);
   LUABIND_GET_OPTIONAL_PARAMETER(2, bool, during_training, false);
-  IncRef(input);
   bool rewrapped = rewrapToAtLeastDim2(input);
-  Basics::Token *output = obj->doForward(input, during_training);
+  AprilUtils::SharedPtr<Basics::Token> output( obj->doForward(input.get(),
+                                                              during_training) );
   if (rewrapped) unwrapToDim1(output);
-  LUABIND_RETURN(Token, output);
-  DecRef(input);
+  LUABIND_RETURN(AuxToken, output);
 }
 //BIND_END
 
 //BIND_METHOD ANNComponent backprop
 {
-  Basics::Token *input;
+  AprilUtils::SharedPtr<Basics::Token> input;
   LUABIND_CHECK_ARGN(==, 1);
   LUABIND_GET_PARAMETER(1, AuxToken, input);
-  IncRef(input);
   bool rewrapped = rewrapToAtLeastDim2(input);
-  Basics::Token *gradient = obj->doBackprop(input);
-  if (gradient != 0) {
+  AprilUtils::SharedPtr<Basics::Token> gradient( obj->doBackprop(input.get()) );
+  if (!gradient.empty()) {
     if (rewrapped) unwrapToDim1(gradient);
-    LUABIND_RETURN(Token, gradient);
+    LUABIND_RETURN(AuxToken, gradient);
   }
   else LUABIND_RETURN_NIL();
-  DecRef(input);
 }
 //BIND_END
 
@@ -462,14 +489,13 @@ using namespace ANN;
 {
   LUABIND_CHECK_ARGN(<=, 1);
   int argn = lua_gettop(L);
-  Basics::MatrixFloatSet *weight_grads_dict;
-  if (argn == 1)
-    LUABIND_GET_PARAMETER(1, MatrixFloatSet, weight_grads_dict);
-  else
-    weight_grads_dict = new Basics::MatrixFloatSet();
+  AprilUtils::LuaTable weight_grads_dict;
+  if (argn == 1) {
+    weight_grads_dict = AprilUtils::LuaTable(L,1);
+  }
   //
   obj->computeAllGradients(weight_grads_dict);
-  LUABIND_RETURN(MatrixFloatSet, weight_grads_dict);
+  LUABIND_RETURN(LuaTable, weight_grads_dict);
 }
 //BIND_END
 
@@ -500,41 +526,38 @@ using namespace ANN;
   LUABIND_CHECK_ARGN(<=, 1);
   int argn = lua_gettop(L);
   unsigned int input_size=0, output_size=0;
-  Basics::MatrixFloatSet *weights_dict = 0;
-  AprilUtils::hash<AprilUtils::string,ANNComponent*> components_dict;
+  AprilUtils::LuaTable weights_dict(L), components_dict(L);
   if (argn == 1) {
     LUABIND_CHECK_PARAMETER(1, table);
     check_table_fields(L, 1, "input", "output", "weights", (const char *)0);
     LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, input, uint, input_size, 0);
     LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, output, uint, output_size, 0);
-    LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, weights,
-					 MatrixFloatSet, weights_dict, 0);
+    lua_getfield(L, 1, "weights");
+    if (!lua_isnil(L, -1)) weights_dict = lua_toLuaTable(L,-1);
+    lua_pop(L, 1);
   }
-  if (weights_dict == 0) weights_dict = new Basics::MatrixFloatSet();
   //
   obj->build(input_size, output_size, weights_dict, components_dict);
   //
-  LUABIND_RETURN(ANNComponent, obj);
-  LUABIND_RETURN(MatrixFloatSet, weights_dict);
-  pushHashTableInLuaStack(L, components_dict, lua_pushANNComponent);
-  LUABIND_INCREASE_NUM_RETURNS(1);
+  LUABIND_RETURN(AuxANNComponent, obj);
+  LUABIND_RETURN(LuaTable, weights_dict);
+  LUABIND_RETURN(LuaTable, components_dict);
 }
 //BIND_END
 
 //BIND_METHOD ANNComponent copy_weights
 {
-  Basics::MatrixFloatSet *weights_dict = new Basics::MatrixFloatSet();
+  AprilUtils::LuaTable weights_dict(L);
   obj->copyWeights(weights_dict);
-  LUABIND_RETURN(MatrixFloatSet, weights_dict);
+  LUABIND_RETURN(LuaTable, weights_dict);
 }
 //BIND_END
 
 //BIND_METHOD ANNComponent copy_components
 {
-  AprilUtils::hash<AprilUtils::string,ANNComponent*> components_dict;
+  AprilUtils::LuaTable components_dict(L);
   obj->copyComponents(components_dict);
-  pushHashTableInLuaStack(L, components_dict, lua_pushANNComponent);
-  LUABIND_RETURN_FROM_STACK(-1);
+  LUABIND_RETURN(LuaTable, components_dict);
 }
 //BIND_END
 
@@ -546,7 +569,7 @@ using namespace ANN;
   LUABIND_GET_PARAMETER(1, string, name);
   string name_string(name);
   ANNComponent *component = obj->getComponent(name_string);
-  LUABIND_RETURN(ANNComponent, component);
+  LUABIND_RETURN(AuxANNComponent, component);
 }
 //BIND_END
 
@@ -717,8 +740,9 @@ using namespace ANN;
 //BIND_METHOD StackANNComponent unroll
 {
   lua_checkstack(L, obj->size());
-  for (unsigned int i=0; i<obj->size(); ++i)
-    LUABIND_RETURN(ANNComponent, obj->getComponentAt(i));
+  for (unsigned int i=0; i<obj->size(); ++i) {
+    LUABIND_RETURN(AuxANNComponent, obj->getComponentAt(i));
+  }
 }
 //BIND_END
 
@@ -728,26 +752,24 @@ using namespace ANN;
   int argn = lua_gettop(L);
   lua_checkstack(L, argn);
   for (int i=1; i<=argn; ++i) {
-    unsigned int idx;
-    LUABIND_GET_PARAMETER(i, uint, idx);
-    --idx;
-    if (idx >= obj->size())
+    unsigned int idx = lua_tointeger(L, i); // 1-based position; lua_tointeger yields 0 for non-numeric arguments
+    if (idx == 0 || idx > obj->size()) // reject 0 explicitly: idx - 1 below would wrap around to UINT_MAX
       LUABIND_FERROR2("Incorrect index, expected <= %d, found %d\n",
-		      obj->size(), idx+1);
-    LUABIND_RETURN(ANNComponent, obj->getComponentAt(idx));
+		      obj->size(), idx);
+    LUABIND_RETURN(AuxANNComponent, obj->getComponentAt(idx - 1));
   }
 }
 //BIND_END
 
 //BIND_METHOD StackANNComponent top
 {
-  LUABIND_RETURN(ANNComponent, obj->topComponent());
+  if (obj->size() > 0) LUABIND_RETURN(AuxANNComponent, obj->topComponent());
 }
 //BIND_END
 
 //BIND_METHOD StackANNComponent pop
 {
-  obj->popComponent();
+  if (obj->size() > 0) obj->popComponent();
   LUABIND_RETURN(StackANNComponent, obj);
 }
 //BIND_END
@@ -1011,10 +1033,16 @@ using namespace ANN;
   int *kernel, *step, n, input_planes_dim;
   check_table_fields(L, 1, "name", "weights", "kernel", "input_planes_dim",
 		     "step", "n", (const char *)0);
+  LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, input_planes_dim, int,
+				       input_planes_dim, -1);
+  if (input_planes_dim > 1) { // the default -1 (field not given) skips both branches
+    LUABIND_ERROR("Deprecated property, new version only allowed for input_planes_dim==1\n");
+  }
+  else if (input_planes_dim == 1) { // tolerated value: only a warning is printed
+    ERROR_PRINT("Deprecated property, not needed in the new version\n");
+  }
   LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, name, string, name, 0);
   LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, weights, string, weights, 0);
-  LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, input_planes_dim, int,
-				       input_planes_dim, 1);
   LUABIND_GET_TABLE_PARAMETER(1, n, int, n);
   //
   lua_getfield(L, 1, "kernel");
@@ -1041,8 +1069,7 @@ using namespace ANN;
     LUABIND_TABLE_TO_VECTOR(-1, int, step, size);
   }
   lua_pop(L, 1);
-  obj = new ConvolutionANNComponent(size, kernel, step,
-				    input_planes_dim, n,
+  obj = new ConvolutionANNComponent(size, kernel, step, n,
 				    name, weights);
   LUABIND_RETURN(ConvolutionANNComponent, obj);
   delete[] kernel;
@@ -1548,6 +1575,29 @@ using namespace ANN;
 }
 //BIND_END
 
+/////////////////////////////////////////////////////
+//               LogActfANNComponent               //
+/////////////////////////////////////////////////////
+
+//BIND_LUACLASSNAME LogActfANNComponent ann.components.actf.log
+//BIND_CPP_CLASS    LogActfANNComponent
+//BIND_SUBCLASS_OF  LogActfANNComponent ActivationFunctionANNComponent
+
+//BIND_CONSTRUCTOR LogActfANNComponent
+{
+  LUABIND_CHECK_ARGN(<=, 1);
+  int argn = lua_gettop(L);
+  const char *name=0;
+  if (argn == 1) {
+    LUABIND_CHECK_PARAMETER(1, table);
+    check_table_fields(L, 1, "name", (const char *)0);
+    LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, name, string, name, 0);
+  }
+  obj = new LogActfANNComponent(name);
+  LUABIND_RETURN(LogActfANNComponent, obj);  
+}
+//BIND_END
+
 /////////////////////////////////////////////////////
 //              LinearActfANNComponent             //
 /////////////////////////////////////////////////////
diff --git a/packages/ann/ann/c_src/activation_function_component.cc b/packages/ann/ann/c_src/activation_function_component.cc
index 5355ccbad..051ce462a 100644
--- a/packages/ann/ann/c_src/activation_function_component.cc
+++ b/packages/ann/ann/c_src/activation_function_component.cc
@@ -56,7 +56,6 @@ namespace ANN {
     // change current input by new input
     AssignRef(input,_input->convertTo<TokenMatrixFloat*>());
     MatrixFloat *input_mat = input->getMatrix();
-    april_assert(input_mat->getMajorOrder() == CblasColMajor);
     april_assert(input_mat->getNumDim() >= 2);
     if (!input_mat->getIsContiguous()) {
       input_mat = input_mat->clone();
@@ -91,7 +90,6 @@ namespace ANN {
     // change current input by new input
     AssignRef(error_input,_error_input->convertTo<TokenMatrixFloat*>());
     MatrixFloat *error_input_mat = error_input->getMatrix();
-    april_assert(error_input_mat->getMajorOrder() == CblasColMajor);
     april_assert(error_input_mat->getNumDim() >= 2);
     if (!error_input_mat->getIsContiguous()) {
       error_input_mat = error_input_mat->clone();
@@ -139,8 +137,8 @@ namespace ANN {
   
   void ActivationFunctionANNComponent::build(unsigned int _input_size,
 					     unsigned int _output_size,
-					     MatrixFloatSet *weights_dict,
-					     hash<string,ANNComponent*> &components_dict) {
+					     AprilUtils::LuaTable &weights_dict,
+					     AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size, weights_dict, components_dict);
     if (input_size == 0) input_size = output_size;
     if (output_size == 0) output_size = input_size;
diff --git a/packages/ann/ann/c_src/activation_function_component.h b/packages/ann/ann/c_src/activation_function_component.h
index 9f7697978..336445073 100644
--- a/packages/ann/ann/c_src/activation_function_component.h
+++ b/packages/ann/ann/c_src/activation_function_component.h
@@ -63,8 +63,8 @@ namespace ANN {
     
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
   };
 }
diff --git a/packages/ann/ann/c_src/activation_function_kernels.cu b/packages/ann/ann/c_src/activation_function_kernels.cu
index 89e0d3c1e..7e984234c 100644
--- a/packages/ann/ann/c_src/activation_function_kernels.cu
+++ b/packages/ann/ann/c_src/activation_function_kernels.cu
@@ -144,22 +144,16 @@ namespace ANN {
       }
       else {
 #endif
-        AprilMath::FloatGPUMirroredMemoryBlock *input_units =
-          input->getRawDataAccess();
-        AprilMath::FloatGPUMirroredMemoryBlock *output_units =
-          output->getRawDataAccess();
-        const float *input_units_ptr = input_units->getPPALForRead();
-        float *output_units_ptr      = output_units->getPPALForWrite();
-
         for (unsigned int b = 0; b < bunch_size; ++b) {
-          float minimum = input_units_ptr[0];
-          float maximum = input_units_ptr[0];
-          unsigned int cur_pos = bunch_size;
+          Basics::MatrixFloat::const_iterator input_it(input->iteratorAt(b,0));
+          float minimum = *input_it;
+          float maximum = *input_it;
+          ++input_it;
           for (unsigned int i = 2; i < size; i += 2) {
-            float prev_unit = input_units_ptr[cur_pos];
-            cur_pos += bunch_size;
-            float cur_unit = input_units_ptr[cur_pos];
-            cur_pos += bunch_size;
+            float prev_unit = *input_it;
+            ++input_it;
+            float cur_unit = *input_it;
+            ++input_it;
             if (prev_unit < cur_unit) {
               if (prev_unit < minimum) minimum = prev_unit;
               if (cur_unit > maximum) maximum = cur_unit;
@@ -169,25 +163,26 @@ namespace ANN {
             }
           }
           if ((size & 1) == 0) { // si es impar
-            unsigned int last_pos = (size - 1) * bunch_size;
-            if (input_units_ptr[last_pos] < minimum)
-              minimum = input_units_ptr[last_pos];
-            if (input_units_ptr[last_pos] > maximum)
-              maximum = input_units_ptr[last_pos];
+            if (*input_it < minimum) minimum = *input_it;
+            if (*input_it > maximum) maximum = *input_it;
           }
           if ((maximum - minimum) > 30.0f) minimum = maximum - 30.0f;
           double addition = 0;
-          cur_pos = 0;
+          input_it = input->iteratorAt(b,0);
+          Basics::MatrixFloat::iterator output_it(output->iteratorAt(b,0));
           for (unsigned int i = 0; i < size; i++) {
-            double e = exp(input_units_ptr[cur_pos] - minimum);
-            output_units_ptr[cur_pos] = e;
+            double e = exp(*input_it - minimum);
+            *output_it = e;
             addition += e;
-            cur_pos  += bunch_size;
+            ++input_it;
+            ++output_it;
           }
           float ratio = 1.0f/addition;
-          cblas_sscal(size, ratio, output_units_ptr, bunch_size);
-          output_units_ptr++;
-          input_units_ptr++;
+          output_it = output->iteratorAt(b,0);
+          for (unsigned int i = 0; i < size; i++) {
+            *output_it *= ratio;
+            ++output_it;
+          }
         }
 #ifdef USE_CUDA
       }
@@ -229,50 +224,42 @@ namespace ANN {
       }
       else {
 #endif
-        AprilMath::FloatGPUMirroredMemoryBlock *input_units =
-          input->getRawDataAccess();
-        AprilMath::FloatGPUMirroredMemoryBlock *output_units =
-          output->getRawDataAccess();
-        const float *input_units_ptr = input_units->getPPALForRead();
-        float *output_units_ptr      = output_units->getPPALForWrite();
-
         for (unsigned int b = 0; b < bunch_size; ++b) {
-          float maximum = input_units_ptr[0];
-          unsigned int cur_pos = bunch_size;
+          Basics::MatrixFloat::const_iterator input_it(input->iteratorAt(b,0));
+          float maximum = *input_it;
+          ++input_it;
           for (unsigned int i = 2; i < size; i += 2) {
-            float prev_unit = input_units_ptr[cur_pos];
-            cur_pos += bunch_size;
-            float cur_unit = input_units_ptr[cur_pos];
+            float prev_unit = *input_it;
+            ++input_it;
+            float cur_unit = *input_it;
+            ++input_it;
             if (prev_unit < cur_unit) {
               if (cur_unit > maximum) maximum = cur_unit;
             } else {
               if (prev_unit > maximum) maximum = prev_unit;
             }
-            cur_pos += bunch_size;
           }
           if ((size & 1) == 0) { // si es par
-            unsigned int last_pos = (size - 1) * bunch_size;
-            if (input_units_ptr[last_pos] > maximum)
-              maximum = input_units_ptr[last_pos];
+            if (*input_it > maximum) maximum = *input_it;
           }
+          input_it = input->iteratorAt(b,0);
+          Basics::MatrixFloat::iterator output_it(output->iteratorAt(b,0));
           double addition = 0.0f;
-          cur_pos = 0;
           for (unsigned int i = 0; i < size; i++) {
-            output_units_ptr[cur_pos] = input_units_ptr[cur_pos] - maximum;
-            double exp_output = AprilMath::m_exp(static_cast<double>(output_units_ptr[cur_pos]));
+            *output_it = *input_it - maximum;
+            double exp_output = AprilMath::m_exp(static_cast<double>(*output_it));
             addition += exp_output;
-            cur_pos  += bunch_size;
+            ++input_it;
+            ++output_it;
           }
+          output_it = output->iteratorAt(b,0);
           float ratio = static_cast<float>(log(addition));
-          cur_pos = 0;
           for (unsigned int i = 0; i < size; i++) {
-            output_units_ptr[cur_pos] -= ratio;
-            april_assert(!(output_units_ptr[cur_pos] > 0.0f) &&
+            *output_it -= ratio;
+            april_assert(!(*output_it > 0.0f) &&
                          "Numerical inestability at log-softmax activation function");
-            cur_pos += bunch_size;
+            ++output_it;
           }
-          output_units_ptr++;
-          input_units_ptr++;
         }
 #ifdef USE_CUDA
       }
diff --git a/packages/ann/ann/c_src/ann_component.h b/packages/ann/ann/c_src/ann_component.h
index 4201e9d09..80d8a816f 100644
--- a/packages/ann/ann/c_src/ann_component.h
+++ b/packages/ann/ann/c_src/ann_component.h
@@ -22,31 +22,18 @@
 #define ANNCOMPONENT_H
 
 #include <cstring>
-#include "aux_hash_table.h" // required for build
 #include "connection.h"
 #include "disallow_class_methods.h"
 #include "error_print.h"
 #include "function_interface.h"
-#include "hash_table.h"     // required for build
 #include "mystring.h"
+#include "lua_table.h"
 #include "token_base.h"
 #include "matrixFloat.h"
-#include "matrixFloatSet.h"
 #include "unused_variable.h"
 #include "vector.h"
 
-using AprilUtils::hash;    // required for build
-using AprilUtils::string;
-using AprilUtils::vector;
-
-#ifndef NDEBUG
-#define ASSERT_MATRIX(m) do {						\
-    april_assert( (m)->getMajorOrder() == CblasColMajor );		\
-  } while(0)
-// april_assert( (m)->getNumDim() == 2 );
-#else
 #define ASSERT_MATRIX(m)
-#endif
 
 /**
  * @brief Maximum size of automatically generated names.
@@ -56,10 +43,30 @@ using AprilUtils::vector;
  */
 #define MAX_NAME_STR 256
 
+namespace ANN {
+  // forward declaration
+  class ANNComponent;
+}
+
+namespace AprilUtils {
+
+  template<> ANN::ANNComponent *LuaTable::
+  convertTo<ANN::ANNComponent *>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<ANN::ANNComponent *>(lua_State *L, ANN::ANNComponent *value);
+
+  template<> bool LuaTable::
+  checkType<ANN::ANNComponent *>(lua_State *L, int idx);
+}
+
+
 /**
  * @brief All ANN components and other stuff is implemented here.
  */
 namespace ANN {
+
+
   
   unsigned int mult(const int *v, int n);
 
@@ -284,22 +291,20 @@ namespace ANN {
     /**
      * @brief Computation of gradient of all ANNComponent's is done here.
      *
-     * @param[in,out] weight_grads_dict - A Basics::MatrixFloatSet reference where
+     * @param[in,out] weight_grads_dict - An AprilUtils::LuaTable reference where
      * gradient matrices will be stored.
      *
      * This method traverses all the ANNComponent's using the given
-     * Basics::MatrixFloatSet. If hasWeightsName() is true, the method
-     * computeGradients() will be executed with the shared Basics::MatrixFloat
-     * reference (i.e. AprilUtils::SharedPtr) related to the @c weights_name
-     * property.
+     * AprilUtils::LuaTable. If hasWeightsName() is true, the method
+     * computeGradients() will be executed.
      *
      * @note The @c weight_grads_dict[weights_name] can be an empty reference,
      * in this case, the called method has the responsability of its proper
      * initialization.
      */
-    virtual void computeAllGradients(Basics::MatrixFloatSet *weight_grads_dict){
-      if (!weights_name.empty()) {
-        computeGradients( (*weight_grads_dict)[weights_name].getDense() );
+    virtual void computeAllGradients(AprilUtils::LuaTable &weight_grads_dict){
+      if (hasWeightsName()) {
+        computeGradients( weights_name.c_str(), weight_grads_dict );
       }
     }
     
@@ -354,35 +359,37 @@ namespace ANN {
      * @param _output_size - The output size given to the method. It can be @c
      * _input_size=0 to indicate that it is unknown or don't care.
      *
-     * @param[in,out] weights_dict - A pointer to Basics::MatrixFloatSet where
+     * @param[in,out] weights_dict - A reference to AprilUtils::LuaTable where
      * weight matrices are stored.
      *
-     * @param[out] components_dict - A dictionary of ANNComponent's which are
-     * part of the ANN.
+     * @param[out] components_dict - An AprilUtils::LuaTable of ANNComponent's which
+     * are part of the ANN.
      *
      * @note Derived classes must re-implement this method throwing errors if
      * necessary when input/output sizes have unexpected values, and calling to
      * the parent method before doing anything.
      *
-     * @note The @c weights_dict param contains weight Basics::MatrixFloat
-     * references (i.e. AprilUtils::SharedPtr) indexed by @c weights_name
-     * property. The reference can be empty and the derived class is responsible
-     * to initialize it properly. If it is not empty, the derived class is
-     * responsible to check its size correctness.
+     * @note The @c weights_dict param can contain any Lua or APRIL-ANN type
+     * indexed by @c weights_name property. It can be empty and the derived
+     * class is responsible to initialize it properly. If it is not empty, the
+     * derived class is responsible to check its size and type correctness.
      */
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict) {
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict) {
       UNUSED_VARIABLE(weights_dict);
       // if (is_built) ERROR_EXIT(128, "Rebuild is forbidden!!!!\n");
       is_built = true;
       ////////////////////////////////////////////////////////////////////
-      ANNComponent *&component = components_dict[name];
-      if (component != 0 &&
-          component != this) ERROR_EXIT1(102, "Non unique component name found: %s\n",
-                                         name.c_str());
-      else component = this;
+      ANNComponent *component = components_dict.opt<ANNComponent *>(name.c_str(), 0);
+      if (component != 0 && component != this) {
+        ERROR_EXIT1(102, "Non unique component name found: %s\n", name.c_str());
+      }
+      else {
+        component = this;
+        components_dict.put(name.c_str(), component);
+      }
       ////////////////////////////////////////////////////////////////////
       if (input_size   == 0)  input_size   = _input_size;
       if (output_size  == 0)  output_size  = _output_size;
@@ -399,7 +406,7 @@ namespace ANN {
     }
     
     /// Retrieve matrix weights from ANNComponent's.
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict) {
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict) {
       UNUSED_VARIABLE(weights_dict);
     }
 
@@ -409,8 +416,8 @@ namespace ANN {
      * @note All derived classes which rewrite this method must call parent
      * method before doing anything.
      */
-    virtual void copyComponents(AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict) {
-      components_dict[name] = this;
+    virtual void copyComponents(AprilUtils::LuaTable &components_dict) {
+      components_dict.put(name.c_str(), this);
     }
     
     /// For debug purposes.
@@ -502,8 +509,9 @@ namespace ANN {
      * This method is rewritten only by ANNComponent's which contain trainable
      * weight matrices, and therefore it is needed to compute its gradients.
      *
-     * @param weight_grads - A shared reference (i.e. AprilUtils::SharedPtr) to
-     * a Basics::MatrixFloat pointer.
+     * @param weights_name - A string with the corresponding weights name.
+     *
+     * @param weight_grads - A dictionary where the gradients will be stored.
      *
      * @note The default implementation in ANNComponent does nothing.
      *
@@ -511,7 +519,9 @@ namespace ANN {
      * class is responsible to initialize it properly, or to check the
      * correctness of sizes and dimensions.
      */
-    virtual void computeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> &weight_grads) {
+    virtual void computeGradients(const char *weights_name,
+                                  AprilUtils::LuaTable &weight_grads) {
+      UNUSED_VARIABLE(weights_name);
       UNUSED_VARIABLE(weight_grads);
     }
     
diff --git a/packages/ann/ann/c_src/bias_component.cc b/packages/ann/ann/c_src/bias_component.cc
index cb33d996e..167e40c32 100644
--- a/packages/ann/ann/c_src/bias_component.cc
+++ b/packages/ann/ann/c_src/bias_component.cc
@@ -83,15 +83,19 @@ namespace ANN {
     bias_vector->resetSharedCount();
   }
 
-  void BiasANNComponent::computeGradients(AprilUtils::SharedPtr<MatrixFloat> & grads_mat) {
+  void BiasANNComponent::computeGradients(const char *name,
+                                          AprilUtils::LuaTable &weight_grads_dict) {
     // count one use of the vector
     bias_vector->addToSharedCount();
-    if (grads_mat.empty()) {
+    MatrixFloat *grads_mat = weight_grads_dict.opt<MatrixFloat*>(name, 0);
+    if (grads_mat == 0) {
       grads_mat = bias_vector->cloneOnlyDims();
-      matZeros(grads_mat.get());
+      matZeros(grads_mat);
+      weight_grads_dict.put(name, grads_mat);
     }
-    else if (!grads_mat->sameDim(bias_vector))
+    else if (!grads_mat->sameDim(bias_vector)) {
       ERROR_EXIT(128, "Incorrect weights matrix dimensions\n");
+    }
 #ifdef USE_CUDA
     grads_mat->setUseCuda(use_cuda);
 #endif
@@ -99,7 +103,7 @@ namespace ANN {
     unsigned int bunch_size = error_input_mat->getDimSize(0);
     // bias update: prev_bias[j] = prev_bias[j] + \sum_b norm_learn_rate * ERROR_INPUT[b,j]
     if (bunch_size == 1) {
-      matAxpy(grads_mat.get(), 1.0f, error_input_mat);
+      matAxpy(grads_mat, 1.0f, error_input_mat);
     }
     else {
       doAxpyLoop(output_size,
@@ -125,8 +129,8 @@ namespace ANN {
 
   void BiasANNComponent::build(unsigned int _input_size,
 			       unsigned int _output_size,
-			       MatrixFloatSet *weights_dict,
-			       hash<string,ANNComponent*> &components_dict) {
+			       AprilUtils::LuaTable &weights_dict,
+			       AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     //
@@ -140,10 +144,10 @@ namespace ANN {
     unsigned int weights_input_size  = 1;
     unsigned int weights_output_size = output_size;
     ////////////////////////////////////////////////////////////////////
-    AprilUtils::SharedPtr<MatrixFloat> &w = (*weights_dict)[weights_name].getDense();
+    MatrixFloat *w = weights_dict.opt<MatrixFloat*>(weights_name, 0);
     // printf("%s :: %p %p\n", weights_name.c_str(), w, bias_vector);
-    if (!w.empty()) {
-      AssignRef(bias_vector, w.get());
+    if (w != 0) {
+      AssignRef(bias_vector, w);
       // printf("COPY OF BIAS FROM HASH %s\n", weights_name.c_str());
       if (!Connections::checkInputOutputSizes(bias_vector,
 					      weights_input_size,
@@ -161,22 +165,22 @@ namespace ANN {
 	IncRef(bias_vector);
       }
       // else printf("USING PREVIOUS BIAS %s\n", weights_name.c_str());
-      w = bias_vector;
+      weights_dict.put(weights_name, bias_vector);
     }
   }
 
-  void BiasANNComponent::copyWeights(MatrixFloatSet *weights_dict) {
+  void BiasANNComponent::copyWeights(AprilUtils::LuaTable &weights_dict) {
     if (bias_vector == 0)
       ERROR_EXIT1(100, "Component not built, impossible execute copyWeights [%s]\n",
 		  name.c_str());
-    AprilUtils::SharedPtr<MatrixFloat> &w = (*weights_dict)[weights_name].getDense();
-    if (!w.empty() && w.get() != bias_vector)
+    MatrixFloat *w = weights_dict.opt<MatrixFloat*>(weights_name, 0);
+    if (w != 0 && w != bias_vector)
       ERROR_EXIT2(101, "Weights dictionary contains %s weights name which is "
 		  "not shared with bias_vector attribute [%s]\n",
 		  weights_name.c_str(),
 		  name.c_str());
-    else if (w.empty()) {
-      w = bias_vector;
+    else if (w == 0) {
+      weights_dict.put(weights_name, bias_vector);
     }
   }
 
diff --git a/packages/ann/ann/c_src/bias_component.h b/packages/ann/ann/c_src/bias_component.h
index 9b7f1695c..10e8b7f5a 100644
--- a/packages/ann/ann/c_src/bias_component.h
+++ b/packages/ann/ann/c_src/bias_component.h
@@ -40,7 +40,7 @@ namespace ANN {
                                                   bool during_training);
     virtual Basics::MatrixFloat *privateDoBackprop(Basics::MatrixFloat *input_error);
     virtual void privateReset(unsigned int it=0);
-    virtual void computeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grad_mat);
+    virtual void computeGradients(const char *name, AprilUtils::LuaTable &weight_grads_dict);
     
   public:
     BiasANNComponent(unsigned int size=0,
@@ -49,9 +49,9 @@ namespace ANN {
     virtual ANNComponent *clone();
     virtual void build(unsigned int input_size,
 		       unsigned int output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict);
     
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/connection.cc b/packages/ann/ann/c_src/connection.cc
index b5b7bfe37..0a3945477 100644
--- a/packages/ann/ann/c_src/connection.cc
+++ b/packages/ann/ann/c_src/connection.cc
@@ -52,7 +52,7 @@ namespace ANN {
 				  unsigned int num_outputs) {
     int dims[2] = { static_cast<int>(num_outputs),
 		    static_cast<int>(num_inputs) };
-    MatrixFloat *weights = new MatrixFloat(2, dims, CblasColMajor);
+    MatrixFloat *weights = new MatrixFloat(2, dims);
     if (weights == 0)
       ERROR_EXIT(130, "Impossible to allocate memory\n");
     return weights;
@@ -123,9 +123,9 @@ namespace ANN {
     if (min_size > static_cast<unsigned int>(data->size()))
       ERROR_EXIT2(24, "Incorrect matrix size, was %d, expected >= %d\n",
 		  data->size(), min_size);
-    if (!data->isSimple())
-      ERROR_EXIT(128, "Matrices need to be simple (contiguous "
-		 "and in row-major)\n");
+    if (!data->getIsContiguous()) {
+      ERROR_EXIT(128, "Matrices need to be contiguous\n");
+    }
     unsigned int current_w_pos = first_weight_pos;
     MatrixFloat::iterator w_it(weights->begin());
     for (unsigned int j=0; j<num_outputs; ++j) {
@@ -152,9 +152,8 @@ namespace ANN {
     if (min_size > static_cast<unsigned int>(data->size()))
       ERROR_EXIT2(24, "Incorrect matrix size, was %d, expected >= %d\n",
 		  data->size(), min_size);
-    if (!data->isSimple())
-      ERROR_EXIT(128, "Matrices need to be simple (contiguous "
-		 "and in row-major)\n");    
+    if (!data->getIsContiguous())
+      ERROR_EXIT(128, "Matrices need to be contiguous\n");
     unsigned int current_w_pos = first_weight_pos;
     MatrixFloat::const_iterator w_it(weights->begin());
     for (unsigned int j=0; j<num_outputs; ++j) {
@@ -170,8 +169,8 @@ namespace ANN {
   char *Connections::toLuaString(MatrixFloat *weights) {
     SharedPtr<CStringStream> stream(new CStringStream());
     stream->put("matrix.fromString[[");
-    AprilUtils::HashTableOptions options;
-    weights->write( stream.get(), options.putBoolean("ascii", false) );
+    AprilUtils::LuaTable options;
+    weights->write( stream.get(), options.put("ascii", false) );
     stream->put("]]\0", 3); // forces a \0 at the end of the buffer
     return stream->releaseString();
   }
diff --git a/packages/ann/ann/c_src/const_component.cc b/packages/ann/ann/c_src/const_component.cc
index cd851f53b..4e330b932 100644
--- a/packages/ann/ann/c_src/const_component.cc
+++ b/packages/ann/ann/c_src/const_component.cc
@@ -29,12 +29,11 @@ namespace ANN {
     ANNComponent(name, 0,
 		 component->getInputSize(),
 		 component->getOutputSize()),
-    component(component),
-    component_weights(new Basics::MatrixFloatSet()) {
+    component(component) {
     if (!component->getIsBuilt()) {
       ERROR_EXIT(128, "Needs a built component!\n");
     }
-    component->copyWeights(component_weights.get());
+    component->copyWeights(component_weights);
   }
   
   ConstANNComponent::~ConstANNComponent() { }
@@ -57,8 +56,8 @@ namespace ANN {
   
   void ConstANNComponent::build(unsigned int _input_size,
                                 unsigned int _output_size,
-                                Basics::MatrixFloatSet *weights_dict,
-                                AprilUtils::hash<string,ANNComponent*> &components_dict) {
+                                AprilUtils::LuaTable &weights_dict,
+                                AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size, weights_dict, components_dict);
   }
   
@@ -66,11 +65,11 @@ namespace ANN {
     AprilUtils::SharedPtr<AprilIO::CStringStream>
       stream(new AprilIO::CStringStream());
     char *component_str = component->toLuaString();
-    char *component_weights_str = component_weights->toLuaString();
+    AprilUtils::string component_weights_str( component_weights.toLuaString() );
     stream->printf("ann.components.const{ name='%s', component=%s:build{ weights=%s } }",
                    name.c_str(),
 		   component_str,
-                   component_weights_str);
+                   component_weights_str.c_str());
     stream->put("\0",1); // forces a \0 at the end of the buffer
     delete[] component_str;
     delete[] component_weights_str;
diff --git a/packages/ann/ann/c_src/const_component.h b/packages/ann/ann/c_src/const_component.h
index d3f73933f..05be3961c 100644
--- a/packages/ann/ann/c_src/const_component.h
+++ b/packages/ann/ann/c_src/const_component.h
@@ -32,7 +32,7 @@ namespace ANN {
     
   protected:
     AprilUtils::SharedPtr<ANNComponent> component;
-    AprilUtils::SharedPtr<Basics::MatrixFloatSet> component_weights;
+    AprilUtils::LuaTable component_weights;
     
   public:
     ConstANNComponent(ANNComponent *component, const char *name);
@@ -53,8 +53,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/convolution_bias_component.cc b/packages/ann/ann/c_src/convolution_bias_component.cc
index 2d4f07aaf..8add1a708 100644
--- a/packages/ann/ann/c_src/convolution_bias_component.cc
+++ b/packages/ann/ann/c_src/convolution_bias_component.cc
@@ -54,8 +54,7 @@ namespace ANN {
     MatrixFloat *bias_vec = bias_vector->select(1,0);
     IncRef(bias_vec);
     // the output bias as a 2d matrix of BUNCHxN
-    MatrixFloat *bias_matrix_2d = new MatrixFloat(2, window_size,
-						  CblasColMajor);
+    MatrixFloat *bias_matrix_2d = new MatrixFloat(2, window_size);
     IncRef(bias_matrix_2d);
     // first pattern is done out of the loop
     MatrixFloat *dest = bias_matrix_2d->select(0, 0);
@@ -176,12 +175,15 @@ namespace ANN {
     return error_mat;
   }
      
-  void ConvolutionBiasANNComponent::computeGradients(AprilUtils::SharedPtr<MatrixFloat> &grads_mat) {
+  void ConvolutionBiasANNComponent::computeGradients(const char *name,
+                                                     AprilUtils::LuaTable &grads_mat_dict) {
     // reset shared counter
     bias_vector->addToSharedCount(number_input_windows);
-    if (grads_mat.empty()) {
+    MatrixFloat *grads_mat = grads_mat_dict.opt<MatrixFloat*>(name, 0);
+    if (grads_mat == 0) {
       grads_mat = bias_vector->cloneOnlyDims();
-      matZeros(grads_mat.get());
+      matZeros(grads_mat);
+      grads_mat_dict.put(name, grads_mat);
     }
 #ifdef USE_CUDA
     grads_mat->setUseCuda(use_cuda);
@@ -234,14 +236,14 @@ namespace ANN {
 
   void ConvolutionBiasANNComponent::build(unsigned int _input_size,
 					  unsigned int _output_size,
-					  MatrixFloatSet *weights_dict,
-					  hash<string,ANNComponent*> &components_dict) {
+					  AprilUtils::LuaTable &weights_dict,
+					  AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     ////////////////////////////////////////////////////////////////////
-    AprilUtils::SharedPtr<MatrixFloat> &b = (*weights_dict)[weights_name].getDense();
-    if (!b.empty()) {
-      AssignRef(bias_vector, b.get());
+    MatrixFloat *b = weights_dict.opt<MatrixFloat*>(weights_name, 0);
+    if (b != 0) {
+      AssignRef(bias_vector, b);
       if (!Connections::checkInputOutputSizes(bias_vector,1,hidden_size))
 	ERROR_EXIT2(256,"The bias vector input/output sizes are not correct, "
 		    "expected 1x%d [%s]\n", hidden_size, name.c_str());
@@ -251,22 +253,22 @@ namespace ANN {
 	bias_vector = Connections::build(1, hidden_size);
 	IncRef(bias_vector);
       }
-      b = bias_vector;
+      weights_dict.put(weights_name, bias_vector);
     }
   }
 
-  void ConvolutionBiasANNComponent::copyWeights(MatrixFloatSet *weights_dict) {
+  void ConvolutionBiasANNComponent::copyWeights(AprilUtils::LuaTable &weights_dict) {
     if (bias_vector == 0)
       ERROR_EXIT1(100, "Component not built, impossible execute copyWeights [%s]\n",
 		  name.c_str());
-    AprilUtils::SharedPtr<MatrixFloat> &b = (*weights_dict)[weights_name].getDense();
-    if (!b.empty() && b.get() != bias_vector)
+    MatrixFloat *b = weights_dict.opt<MatrixFloat*>(weights_name, 0);
+    if (b != 0 && b != bias_vector)
       ERROR_EXIT2(101, "Weights dictionary contains %s bias name which is "
 		  "not shared with bias_vector attribute [%s]\n",
 		  weights_name.c_str(),
 		  name.c_str());
-    else if (b.empty()) {
-      b = bias_vector;
+    else if (b == 0) {
+      weights_dict.put(weights_name, bias_vector);
     }
   }  
 
diff --git a/packages/ann/ann/c_src/convolution_bias_component.h b/packages/ann/ann/c_src/convolution_bias_component.h
index 93d8ca520..2a94a5342 100644
--- a/packages/ann/ann/c_src/convolution_bias_component.h
+++ b/packages/ann/ann/c_src/convolution_bias_component.h
@@ -52,7 +52,7 @@ namespace ANN {
 
   protected:
 
-    virtual void computeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grad_mat);
+    virtual void computeGradients(const char *name, AprilUtils::LuaTable &weight_grads_dict);
     virtual Basics::MatrixFloat *privateDoForward(Basics::MatrixFloat *input,
                                           bool during_training);
     virtual Basics::MatrixFloat *privateDoBackprop(Basics::MatrixFloat *input_error);
@@ -71,9 +71,9 @@ namespace ANN {
     virtual ANNComponent *clone();
     virtual void build(unsigned int input_size,
 		       unsigned int output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict);
     virtual char *toLuaString();
 
   };
diff --git a/packages/ann/ann/c_src/convolution_component.cc b/packages/ann/ann/c_src/convolution_component.cc
index 20b6b5f49..bf97d0895 100644
--- a/packages/ann/ann/c_src/convolution_component.cc
+++ b/packages/ann/ann/c_src/convolution_component.cc
@@ -30,17 +30,12 @@ using namespace Basics;
 
 namespace ANN {
 
-  ///////////////////////////////////////////
+  ////////////////////////////////////////////
   // ConvolutionANNComponent implementation //
-  ///////////////////////////////////////////
+  ////////////////////////////////////////////
 
   void ConvolutionANNComponent::initializeArrays(const int *input_dims) {
-    for (int i=1; i<input_planes_dim; ++i) {
-      output_dims[i+1] = (input_dims[i] - kernel_dims[i])/kernel_step[i] + 1;
-      input_window_num_steps[i]    = output_dims[i+1];
-      output_window_num_steps[i+1] = output_dims[i+1];
-    }
-    for (int i=input_planes_dim+1; i<=input_num_dims; ++i) {
+    for (int i=2; i<=input_num_dims; ++i) {
       output_dims[i] = (input_dims[i] - kernel_dims[i])/kernel_step[i] + 1;
       input_window_num_steps[i]  = output_dims[i];
       output_window_num_steps[i] = output_dims[i];
@@ -58,7 +53,7 @@ namespace ANN {
     output_dims[1]	       = hidden_size;
     input_window_size[0]       = input_dims[0];
     input_window_num_steps[0]  = 1;
-    input_window_num_steps[input_planes_dim] = 1;
+    input_window_num_steps[1]  = 1;
     output_window_size[0]      = input_dims[0];
     // AT CONSTRUCTOR: output_window_size[1] = hidden_size;
     output_window_num_steps[0] = 1;
@@ -67,25 +62,20 @@ namespace ANN {
     // AT CONSTRUCTOR: input_window_rewrap[1] = kernel_size;
     output_window_rewrap[0]    = input_dims[0];
     // AT CONSTRUCTOR: output_window_rewrap[1] = hidden_size;
-    if (input_dims[input_planes_dim] != kernel_dims[input_planes_dim])
-      ERROR_EXIT7(128, "Input matrix dim %d must be equals to kernel dim %d, "
-		  "input_dims[%d]=%d, kernel_dims[%d]=%d [%s]\n",
-		  input_planes_dim, input_planes_dim,
-		  input_planes_dim, input_dims[input_planes_dim],
-		  input_planes_dim, kernel_dims[input_planes_dim],
-		  name.c_str());
+    if (input_dims[1] != kernel_dims[1])
+      ERROR_EXIT3(128, "Input matrix dim 1 must be equal to kernel dim 1, "
+		  "input_dims[1]=%d != kernel_dims[1]=%d [%s]\n",
+		  input_dims[1], kernel_dims[1], name.c_str());
   }
   
   ConvolutionANNComponent::ConvolutionANNComponent(int input_num_dims,
 						   const int *_kernel_dims,
 						   const int *_kernel_step,
-						   const int input_planes_dim,
 						   int num_output_planes,
 						   const char *name,
 						   const char *weights_name) :
     VirtualMatrixANNComponent(name, weights_name, 0, 0),
     weights_matrix(0),
-    input_planes_dim(input_planes_dim),
     number_input_windows(0),
     kernel_size(1),
     hidden_size(num_output_planes),
@@ -95,29 +85,23 @@ namespace ANN {
     output_dims(new int[input_num_dims+1]),
     input_window_size(new int[input_num_dims+1]),
     input_window_num_steps(new int[input_num_dims+1]),
-    input_window_order_step(new int[input_num_dims+1]),
     input_window_rewrap(new int[2]),
     output_window_size(new int[input_num_dims+1]),
     output_window_step(new int[input_num_dims+1]),
     output_window_num_steps(new int[input_num_dims+1]),
-    output_window_order_step(new int[input_num_dims+1]),
     output_window_rewrap(new int[2]) {
     setInputContiguousProperty(true);
     if (weights_name == 0) generateDefaultWeightsName("w");
     kernel_dims[0] = static_cast<int>(hidden_size);
     kernel_step[0] = 1;
-    input_window_order_step[0] = 0;
     output_window_size[0] = 0;
     output_window_size[1] = static_cast<int>(hidden_size);
-    output_window_order_step[0] = 0;
     output_window_step[0] = 1;
     output_window_step[1] = 1;
     for(int i=0; i<input_num_dims; ++i) {
       kernel_size *= _kernel_dims[i];
       kernel_dims[i+1] = _kernel_dims[i];
       kernel_step[i+1] = _kernel_step[i];
-      input_window_order_step[i+1] = i+1;
-      output_window_order_step[i+1] = i+1;
       input_window_size[i+1] = kernel_dims[i+1];
     }
     for(int i=2; i<=input_num_dims; ++i) {
@@ -137,11 +121,9 @@ namespace ANN {
     delete[] output_dims;
     delete[] input_window_size;
     delete[] input_window_num_steps;
-    delete[] input_window_order_step;
     delete[] output_window_size;
     delete[] output_window_step;
     delete[] output_window_num_steps;
-    delete[] output_window_order_step;
     delete[] input_window_rewrap;
     delete[] output_window_rewrap;
   }
@@ -160,7 +142,7 @@ namespace ANN {
     const int *input_dims = input_mat->getDimPtr();
     initializeArrays(input_dims);
     MatrixFloat *output_mat;
-    output_mat = new MatrixFloat(input_num_dims+1, output_dims, CblasColMajor);
+    output_mat = new MatrixFloat(input_num_dims+1, output_dims);
     IncRef(output_mat);
 #ifdef USE_CUDA
     output_mat->setUseCuda(use_cuda);
@@ -173,14 +155,12 @@ namespace ANN {
       new MatrixFloat::sliding_window(input_mat, input_window_size,
                                       0,  // OFFSET
                                       kernel_step,
-                                      input_window_num_steps,
-                                      input_window_order_step);
+                                      input_window_num_steps);
     MatrixFloat::sliding_window *output_sw =
       new MatrixFloat::sliding_window(output_mat, output_window_size,
                                       0,  // OFFSET
                                       output_window_step,
-                                      output_window_num_steps,
-                                      output_window_order_step);
+                                      output_window_num_steps);
     number_input_windows = input_sw->numWindows();
     // CONVOLUTION OVER number_input_windows
     MatrixFloat *input_w  = input_sw->getMatrix();
@@ -253,14 +233,12 @@ namespace ANN {
       new MatrixFloat::sliding_window(error_output_mat, input_window_size,
                                       0,  // OFFSET
                                       kernel_step,
-                                      input_window_num_steps,
-                                      input_window_order_step);
+                                      input_window_num_steps);
     MatrixFloat::sliding_window *error_input_sw =
       new MatrixFloat::sliding_window(error_input_mat, output_window_size,
                                       0,  // OFFSET
                                       output_window_step,
-                                      output_window_num_steps,
-                                      output_window_order_step);
+                                      output_window_num_steps);
     april_assert(error_input_sw->numWindows() == number_input_windows);
     // CONVOLUTION GRADIENT
     MatrixFloat *error_input_w  = error_input_sw->getMatrix();
@@ -316,11 +294,14 @@ namespace ANN {
     return error_output_mat;
   }
   
-  void ConvolutionANNComponent::computeGradients(AprilUtils::SharedPtr<MatrixFloat> &grads_mat) {
+  void ConvolutionANNComponent::computeGradients(const char *name,
+                                                 AprilUtils::LuaTable &grads_mat_dict) {
     weights_matrix->addToSharedCount(number_input_windows);
-    if (grads_mat.empty()) {
+    MatrixFloat *grads_mat = grads_mat_dict.opt<MatrixFloat*>(name, 0);
+    if (grads_mat == 0) {
       grads_mat = weights_matrix->cloneOnlyDims();
-      matZeros(grads_mat.get());
+      matZeros(grads_mat);
+      grads_mat_dict.put(name, grads_mat);
     }
 #ifdef USE_CUDA
     grads_mat->setUseCuda(use_cuda);
@@ -331,13 +312,11 @@ namespace ANN {
     MatrixFloat::sliding_window input_sw(input_mat, input_window_size,
 					 0,  // OFFSET
 					 kernel_step,
-					 input_window_num_steps,
-					 input_window_order_step);
+					 input_window_num_steps);
     MatrixFloat::sliding_window error_input_sw(error_input_mat, output_window_size,
 					       0,  // OFFSET
 					       output_window_step,
-					       output_window_num_steps,
-					       output_window_order_step);
+					       output_window_num_steps);
     MatrixFloat *input_w       = input_sw.getMatrix();
     MatrixFloat *error_input_w = error_input_sw.getMatrix();
     IncRef(input_w);
@@ -355,7 +334,7 @@ namespace ANN {
       IncRef(error_input_flattened);
       
       // WEIGHTS UPDATE
-      matGemm(grads_mat.get(),
+      matGemm(grads_mat,
               CblasTrans, CblasNoTrans,
               1.0f,
               error_input_flattened, // A
@@ -382,8 +361,7 @@ namespace ANN {
   ANNComponent *ConvolutionANNComponent::clone() {
     ConvolutionANNComponent *component = new
       ConvolutionANNComponent(input_num_dims, kernel_dims+1, kernel_step+1,
-			      input_planes_dim, hidden_size,
-			      name.c_str(), weights_name.c_str());
+                              hidden_size, name.c_str(), weights_name.c_str());
     component->input_size     = input_size;
     component->output_size    = output_size;
     return component;
@@ -391,19 +369,19 @@ namespace ANN {
 
   void ConvolutionANNComponent::build(unsigned int _input_size,
 				     unsigned int _output_size,
-				     MatrixFloatSet *weights_dict,
-				     hash<string,ANNComponent*> &components_dict) {
+				     AprilUtils::LuaTable &weights_dict,
+				     AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     //
     unsigned int weights_input_size  = kernel_size;
     unsigned int weights_output_size = hidden_size;
     ////////////////////////////////////////////////////////////////////
-    AprilUtils::SharedPtr<MatrixFloat> &w = (*weights_dict)[weights_name].getDense();
+    MatrixFloat *w = weights_dict.opt<MatrixFloat*>(weights_name.c_str(), 0);
     // printf("%s :: %p %p\n", weights_name.c_str(), w, weights_matrix);
-    if (!w.empty()) {
+    if (w != 0) {
       // printf("COPY OF WEIGHTS FROM HASH %s\n", weights_name.c_str());
-      AssignRef(weights_matrix, w.get());
+      AssignRef(weights_matrix, w);
       if (!Connections::checkInputOutputSizes(weights_matrix,
 					      weights_input_size,
 					      weights_output_size))
@@ -420,30 +398,30 @@ namespace ANN {
 	IncRef(weights_matrix);
       }
       // else printf("USING PREVIOUS WEIGHTS %s\n", weights_name.c_str());
-      w = weights_matrix;
+      weights_dict.put(weights_name.c_str(), weights_matrix);
     }
   }
 
-  void ConvolutionANNComponent::copyWeights(MatrixFloatSet *weights_dict) {
+  void ConvolutionANNComponent::copyWeights(AprilUtils::LuaTable &weights_dict) {
     if (weights_matrix == 0)
       ERROR_EXIT1(100, "Component not built, impossible execute copyWeights [%s]\n",
 		  name.c_str());
-    AprilUtils::SharedPtr<MatrixFloat> &w = (*weights_dict)[weights_name].getDense();
-    if (!w.empty() && w.get() != weights_matrix)
+    MatrixFloat *w = weights_dict.opt<MatrixFloat*>(weights_name.c_str(), 0);
+    if (w != 0 && w != weights_matrix)
       ERROR_EXIT2(101, "Weights dictionary contains %s weights name which is "
 		  "not shared with weights_matrix attribute [%s]\n",
 		  weights_name.c_str(),
 		  name.c_str());
-    else if (w.empty()) {
-      w = weights_matrix;
+    else if (w == 0) {
+      weights_dict.put(weights_name.c_str(), weights_matrix);
     }
   }  
 
   char *ConvolutionANNComponent::toLuaString() {
     buffer_list buffer;
     buffer.printf("ann.components.convolution{ name='%s',weights='%s',"
-		  "n=%d, input_planes_dim=%d, kernel={", name.c_str(), weights_name.c_str(),
-		  hidden_size, input_planes_dim);
+		  "n=%d, kernel={", name.c_str(), weights_name.c_str(),
+		  hidden_size);
     for (int i=0; i<input_num_dims; ++i)
       buffer.printf("%d,", kernel_dims[i+1]);
     buffer.printf("}, step={");
diff --git a/packages/ann/ann/c_src/convolution_component.h b/packages/ann/ann/c_src/convolution_component.h
index f63c2ec1e..c0af2e6eb 100644
--- a/packages/ann/ann/c_src/convolution_component.h
+++ b/packages/ann/ann/c_src/convolution_component.h
@@ -37,8 +37,6 @@ namespace ANN {
     
     // parameters of the convolution
     
-    /// Dimension where input planes are located
-    const int input_planes_dim;
     /// The number of convolutions computed during last forward
     int number_input_windows;
     /// The size of one kernel (number of inputs of one hidden neuron)
@@ -58,8 +56,6 @@ namespace ANN {
     int *input_window_size;
     /// Number of steps of the convolution window, input_num_dims + 1
     int *input_window_num_steps;
-    /// Order for traversing the input data, prepared for col-major order
-    int *input_window_order_step;
     /// Translates the input window into a bi-dimensional matrix
     int *input_window_rewrap;
     // OUTPUT SLIDING WINDOW SECTION
@@ -69,8 +65,6 @@ namespace ANN {
     int *output_window_step;
     /// Number of steps of the convolution window, input_num_dims + 1
     int *output_window_num_steps;
-    /// Order for traversing the input data, prepared for col-major order
-    int *output_window_order_step;
     /// Translates the output window into a bi-dimensional matrix
     int *output_window_rewrap;
     
@@ -95,7 +89,7 @@ namespace ANN {
     
   protected:
 
-    virtual void computeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grad_mat);
+    virtual void computeGradients(const char *name, AprilUtils::LuaTable &weight_grads_dict);
 
     virtual Basics::MatrixFloat *privateDoForward(Basics::MatrixFloat* input,
                                                   bool during_training);
@@ -106,8 +100,6 @@ namespace ANN {
     ConvolutionANNComponent(int input_num_dims,
 			    const int *_kernel_dims,  // input_num_dims
 			    const int *_kernel_step,  // step
-			    const int input_planes_dim, // dimension where input
-						        // planes are located
 			    int num_output_planes,      // hidden layer size
 			    const char *name=0, const char *weights_name=0);
     virtual ~ConvolutionANNComponent();
@@ -115,19 +107,16 @@ namespace ANN {
 				      AprilUtils::vector<unsigned int> &output_size) {
       output_size.clear();
       output_size.push_back(hidden_size);
-      for (int i=1; i<input_planes_dim; ++i) {
-	output_size.push_back((input_size[i-1]-kernel_dims[i])/kernel_step[i]+1);
-      }
-      for (int i=input_planes_dim+1; i<=input_num_dims; ++i) {
+      for (int i=2; i<=input_num_dims; ++i) {
 	output_size.push_back((input_size[i-1]-kernel_dims[i])/kernel_step[i]+1);
       }
     }
     virtual ANNComponent *clone();
     virtual void build(unsigned int input_size,
 		       unsigned int output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-                       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict);
+		       AprilUtils::LuaTable &weights_dict,
+                       AprilUtils::LuaTable &components_dict);
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict);
 
     virtual char *toLuaString();
 
diff --git a/packages/ann/ann/c_src/copy_component.cc b/packages/ann/ann/c_src/copy_component.cc
index 1d95706b5..32885e187 100644
--- a/packages/ann/ann/c_src/copy_component.cc
+++ b/packages/ann/ann/c_src/copy_component.cc
@@ -132,15 +132,14 @@ namespace ANN {
           ERROR_EXIT(128, "Different bunch size between forward and backprop\n");
         }
         error_output_mat = new MatrixFloat(input_mat->getNumDim(),
-                                           input_mat->getDimPtr(),
-                                           CblasColMajor);
+                                           input_mat->getDimPtr());
         break;
       }
     case table_of_token_codes::vector_Tokens:
       {
         int dims[2] = { static_cast<int>(bunch_size),
                         static_cast<int>(input_size) };
-        error_output_mat = new MatrixFloat(2, dims, CblasColMajor);
+        error_output_mat = new MatrixFloat(2, dims);
         break;
       }
     default:
@@ -194,8 +193,8 @@ namespace ANN {
 
   void CopyANNComponent::build(unsigned int _input_size,
 			       unsigned int _output_size,
-			       MatrixFloatSet *weights_dict,
-			       hash<string,ANNComponent*> &components_dict) {
+			       AprilUtils::LuaTable &weights_dict,
+			       AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     if (output_size == 0) output_size = input_size * times;
diff --git a/packages/ann/ann/c_src/copy_component.h b/packages/ann/ann/c_src/copy_component.h
index 239ae14d0..2b948c71b 100644
--- a/packages/ann/ann/c_src/copy_component.h
+++ b/packages/ann/ann/c_src/copy_component.h
@@ -61,8 +61,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/dot_product_component.cc b/packages/ann/ann/c_src/dot_product_component.cc
index 87ef01083..15fdbf026 100644
--- a/packages/ann/ann/c_src/dot_product_component.cc
+++ b/packages/ann/ann/c_src/dot_product_component.cc
@@ -70,7 +70,7 @@ namespace ANN {
     MatrixFloat *output_mat;
     int dims[2] = { static_cast<int>(bunch_size),
                     static_cast<int>(getOutputSize()) };
-    output_mat = new MatrixFloat(2, dims, CblasColMajor);
+    output_mat = new MatrixFloat(2, dims);
 #ifdef USE_CUDA
     output_mat->setUseCuda(use_cuda);
 #endif
@@ -104,16 +104,15 @@ namespace ANN {
     MatrixFloat *output_mat;
     int dims[2] = {static_cast<int>(bunch_size),
                    static_cast<int>(getOutputSize())};
-    output_mat = new MatrixFloat(2, dims, CblasColMajor);
+    output_mat = new MatrixFloat(2, dims);
 #ifdef USE_CUDA
     output_mat->setUseCuda(use_cuda);
 #endif
     matSparseMM(output_mat,
-                  CblasNoTrans,
-                  NEGATE_CBLAS_TRANSPOSE(transpose_weights),
-                  CblasNoTrans,
-                  1.0f, input_mat, weights_mat,
-                  0.0f);
+                CblasNoTrans,
+                NEGATE_CBLAS_TRANSPOSE(transpose_weights),
+                1.0f, input_mat, weights_mat,
+                0.0f);
     return output_mat;
   }
   
@@ -125,7 +124,7 @@ namespace ANN {
     MatrixFloat *error_output_mat;
     int dims[2] = { static_cast<int>(bunch_size),
 		    static_cast<int>(getInputSize()) };
-    error_output_mat = new MatrixFloat(2, dims, CblasColMajor);
+    error_output_mat = new MatrixFloat(2, dims);
 #ifdef USE_CUDA
     error_output_mat->setUseCuda(use_cuda);
 #endif      
@@ -169,12 +168,15 @@ namespace ANN {
     weights_matrix->resetSharedCount();
   }
 
-  void DotProductANNComponent::
-  initializeComputeGradients(AprilUtils::SharedPtr<MatrixFloat> & grads_mat) {
+  MatrixFloat *DotProductANNComponent::
+  initializeComputeGradients(const char *name,
+                             AprilUtils::LuaTable &grads_mat_dict) {
     weights_matrix->addToSharedCount();
-    if (grads_mat.empty()) {
+    MatrixFloat *grads_mat = grads_mat_dict.opt<MatrixFloat*>(name, 0);
+    if (grads_mat == 0) {
       grads_mat = weights_matrix->cloneOnlyDims();
-      matZeros(grads_mat.get());
+      matZeros(grads_mat);
+      grads_mat_dict.put<MatrixFloat*>(name, grads_mat);
     }
     else if (!grads_mat->sameDim(weights_matrix)) {
       ERROR_EXIT(128, "Incorrect weights matrix dimensions\n");
@@ -182,17 +184,19 @@ namespace ANN {
 #ifdef USE_CUDA
     grads_mat->setUseCuda(use_cuda);
 #endif
+    return grads_mat;
   }
   
   void DotProductANNComponent::
-  privateDenseComputeGradients(AprilUtils::SharedPtr<MatrixFloat> & grads_mat) {
-    initializeComputeGradients(grads_mat);
+  privateDenseComputeGradients(const char *name,
+                               AprilUtils::LuaTable & grads_mat_dict) {
+    MatrixFloat *grads_mat = initializeComputeGradients(name, grads_mat_dict);
     MatrixFloat *error_input_mat;
     error_input_mat = getErrorInputMatrix();
     unsigned int bunch_size = error_input_mat->getDimSize(0);
     MatrixFloat *input_mat = getInputMatrix();
     if (bunch_size > 1) {
-      matGemm(grads_mat.get(),
+      matGemm(grads_mat,
               CblasTrans, CblasNoTrans,
               1.0f,
               (transpose_weights == CblasNoTrans)?error_input_mat:input_mat, // A
@@ -200,7 +204,7 @@ namespace ANN {
               1.0f);
     } // if bunch_size > 1 ... else
     else {
-      matGer(grads_mat.get(),
+      matGer(grads_mat,
              1.0f,
              (transpose_weights == CblasNoTrans)?error_input_mat:input_mat,
              (transpose_weights == CblasNoTrans)?input_mat:error_input_mat);
@@ -208,27 +212,27 @@ namespace ANN {
   }
   
   void DotProductANNComponent::
-  privateSparseComputeGradients(AprilUtils::SharedPtr<MatrixFloat> & grads_mat) {
-    initializeComputeGradients(grads_mat);
+  privateSparseComputeGradients(const char *name,
+                                AprilUtils::LuaTable & grads_mat_dict) {
+    MatrixFloat *grads_mat = initializeComputeGradients(name, grads_mat_dict);
     MatrixFloat *error_input_mat;
     error_input_mat = getErrorInputMatrix();
     SparseMatrixFloat *input_mat;
     input_mat = getSparseInputMatrix();
     if (transpose_weights == CblasNoTrans) {
-      matSparseMM(grads_mat.get(),
+      AprilUtils::SharedPtr< MatrixFloat > gT(grads_mat->transpose());
+      matSparseMM(gT.get(),
                   CblasTrans,
                   CblasNoTrans,
-                  CblasTrans,
                   1.0f,
                   input_mat,
                   error_input_mat,
                   1.0f);
     }
     else {
-      matSparseMM(grads_mat.get(),
+      matSparseMM(grads_mat,
                   CblasTrans,
                   CblasNoTrans,
-                  CblasNoTrans,
                   1.0f,
                   input_mat,
                   error_input_mat,
@@ -246,8 +250,8 @@ namespace ANN {
   
   void DotProductANNComponent::build(unsigned int _input_size,
 				     unsigned int _output_size,
-				     MatrixFloatSet *weights_dict,
-				     hash<string,ANNComponent*> &components_dict) {
+				     AprilUtils::LuaTable &weights_dict,
+				     AprilUtils::LuaTable &components_dict) {
     MatrixInputSwitchANNComponent::build(_input_size, _output_size,
                                          weights_dict, components_dict);
     //
@@ -258,13 +262,14 @@ namespace ANN {
     unsigned int weights_input_size  = getInputSize();
     unsigned int weights_output_size = getOutputSize();
     ////////////////////////////////////////////////////////////////////
-    if (transpose_weights == CblasTrans)
+    if (transpose_weights == CblasTrans) {
       swap(weights_input_size, weights_output_size);
-    AprilUtils::SharedPtr<MatrixFloat> &w = (*weights_dict)[getWeightsName()].getDense();
+    }
+    MatrixFloat *w = weights_dict.opt<MatrixFloat*>(getWeightsName(), 0);
     // printf("%s :: %p %p\n", weights_name.c_str(), w, weights_matrix);
-    if (!w.empty()) {
+    if (w != 0) {
       // printf("COPY OF WEIGHTS FROM HASH %s\n", weights_name.c_str());
-      AssignRef(weights_matrix, w.get());
+      AssignRef(weights_matrix, w);
       if (!Connections::checkInputOutputSizes(weights_matrix,
 					      weights_input_size,
 					      weights_output_size))
@@ -283,22 +288,23 @@ namespace ANN {
 	IncRef(weights_matrix);
       }
       // else printf("USING PREVIOUS WEIGHTS %s\n", weights_name.c_str());
-      w = weights_matrix;
+      weights_dict.put<MatrixFloat*>(getWeightsName(), weights_matrix);
     }
   }
 
-  void DotProductANNComponent::copyWeights(MatrixFloatSet *weights_dict) {
-    if (weights_matrix == 0)
+  void DotProductANNComponent::copyWeights(AprilUtils::LuaTable &weights_dict) {
+    if (weights_matrix == 0) {
       ERROR_EXIT1(100, "Component not built, impossible execute copyWeights [%s]\n",
 		  getName().c_str());
-    AprilUtils::SharedPtr<MatrixFloat> &w = (*weights_dict)[getWeightsName()].getDense();
-    if (!w.empty() && w.get() != weights_matrix)
+    }
+    MatrixFloat *w = weights_dict.opt<MatrixFloat*>(getWeightsName(), 0);
+    if (w != 0 && w != weights_matrix)
       ERROR_EXIT2(101, "Weights dictionary contains %s weights name which is "
 		  "not shared with weights_matrix attribute [%s]\n",
 		  getWeightsName().c_str(),
 		  getName().c_str());
-    else if (w.empty()) {
-      w = weights_matrix;
+    else if (w == 0) {
+      weights_dict.put<MatrixFloat*>(getWeightsName(), weights_matrix);
     }
   }  
 
diff --git a/packages/ann/ann/c_src/dot_product_component.h b/packages/ann/ann/c_src/dot_product_component.h
index a7e1848fe..1eb5bc7a7 100644
--- a/packages/ann/ann/c_src/dot_product_component.h
+++ b/packages/ann/ann/c_src/dot_product_component.h
@@ -46,17 +46,20 @@ namespace ANN {
                                                        bool during_training);
     virtual Basics::MatrixFloat *privateDoDenseBackprop(Basics::MatrixFloat *error_input);
     virtual void privateDenseReset(unsigned int it=0);
-    virtual void privateDenseComputeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grads_mat);
+    virtual void privateDenseComputeGradients(const char *name,
+                                              AprilUtils::LuaTable &grads_mat_dict);
 
     // from SparseMatrixANNComponentHelper
     virtual Basics::MatrixFloat *privateDoSparseForward(Basics::SparseMatrixFloat *input,
                                                         bool during_training);
     virtual Basics::SparseMatrixFloat *privateDoSparseBackprop(Basics::MatrixFloat *error_input);
     virtual void privateSparseReset(unsigned int it=0);
-    virtual void privateSparseComputeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grads_mat);
+    virtual void privateSparseComputeGradients(const char *name,
+                                              AprilUtils::LuaTable &grads_mat_dict);
     
     //
-    void initializeComputeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grads_mat);
+    Basics::MatrixFloat *initializeComputeGradients(const char *name,
+                                                    AprilUtils::LuaTable &grads_mat_dict);
         
   public:
     DotProductANNComponent(const char *name=0, const char *weights_name=0,
@@ -67,9 +70,9 @@ namespace ANN {
     virtual ANNComponent *clone();
     virtual void build(unsigned int input_size,
 		       unsigned int output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict);
     
     virtual char *toLuaString();
     
diff --git a/packages/ann/ann/c_src/dropout_component.cc b/packages/ann/ann/c_src/dropout_component.cc
index ab6ff2675..6cd0bad1c 100644
--- a/packages/ann/ann/c_src/dropout_component.cc
+++ b/packages/ann/ann/c_src/dropout_component.cc
@@ -72,16 +72,14 @@ namespace ANN {
       // new  output to fit the bunch
       AssignRef(output,new TokenMatrixFloat(input_mat->clone()));
       MatrixFloat *output_mat = output->getMatrix();
-      april_assert(output_mat->getMajorOrder() == CblasColMajor);
       // apply dropout
       if (during_training) {
 	if (dropout_mask == 0 || dropout_mask->size() != input_mat->size()) {
 	  if (dropout_mask) DecRef(dropout_mask);
-	  int dims = { input_mat->size() };
-	  dropout_mask = new MatrixFloat(1, dims, CblasColMajor);
+	  dropout_mask = new MatrixFloat(1, input_mat->size());
 	  IncRef(dropout_mask);
 	}
-	for (MatrixFloat::col_major_iterator it(dropout_mask->begin());
+	for (MatrixFloat::iterator it(dropout_mask->begin());
 	     it != dropout_mask->end(); ++it) {
 	  if (random->rand() < prob) *it = 0.0f;
 	  else *it = 1.0f;
@@ -108,7 +106,6 @@ namespace ANN {
       AssignRef(error_input,_error_input);
       TokenMatrixFloat *error_input_token_matrix = _error_input->convertTo<TokenMatrixFloat*>();
       MatrixFloat *error_input_mat = error_input_token_matrix->getMatrix();
-      april_assert(error_input_mat->getMajorOrder() == CblasColMajor);
       april_assert(error_input_mat->getNumDim() >= 2);
       if (!error_input_mat->getIsContiguous()) {
 	error_input_mat = error_input_mat->clone();
@@ -155,8 +152,8 @@ namespace ANN {
 
   void DropoutANNComponent::build(unsigned int _input_size,
 				  unsigned int _output_size,
-				  MatrixFloatSet *weights_dict,
-				  hash<string,ANNComponent*> &components_dict) {
+				  AprilUtils::LuaTable &weights_dict,
+				  AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     if (input_size == 0) input_size = output_size;
diff --git a/packages/ann/ann/c_src/dropout_component.h b/packages/ann/ann/c_src/dropout_component.h
index 4a347155a..c392e9090 100644
--- a/packages/ann/ann/c_src/dropout_component.h
+++ b/packages/ann/ann/c_src/dropout_component.h
@@ -61,8 +61,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/flatten_component.cc b/packages/ann/ann/c_src/flatten_component.cc
index 01c92a04b..72d1a12ad 100644
--- a/packages/ann/ann/c_src/flatten_component.cc
+++ b/packages/ann/ann/c_src/flatten_component.cc
@@ -76,8 +76,8 @@ namespace ANN {
   
   void FlattenANNComponent::build(unsigned int _input_size,
 				 unsigned int _output_size,
-				 MatrixFloatSet *weights_dict,
-				 hash<string,ANNComponent*> &components_dict) {
+				 AprilUtils::LuaTable &weights_dict,
+				 AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
   }
diff --git a/packages/ann/ann/c_src/flatten_component.h b/packages/ann/ann/c_src/flatten_component.h
index 9f6d45405..68d9befac 100644
--- a/packages/ann/ann/c_src/flatten_component.h
+++ b/packages/ann/ann/c_src/flatten_component.h
@@ -61,8 +61,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/gaussian_noise_component.cc b/packages/ann/ann/c_src/gaussian_noise_component.cc
index 4d10b104f..74c2c5bc9 100644
--- a/packages/ann/ann/c_src/gaussian_noise_component.cc
+++ b/packages/ann/ann/c_src/gaussian_noise_component.cc
@@ -68,8 +68,7 @@ namespace ANN {
     // get memory blocks for tokens
     MatrixFloat *output_mat = output->getMatrix();
     MatrixFloat *noise_mat  = output_mat->cloneOnlyDims();
-    april_assert(output_mat->getMajorOrder() == CblasColMajor);
-    for (MatrixFloat::col_major_iterator it=noise_mat->begin();
+    for (MatrixFloat::iterator it=noise_mat->begin();
 	 it!=noise_mat->end(); ++it) {
       *it = random->randNorm(mean, variance);
     }
@@ -107,8 +106,8 @@ namespace ANN {
 
   void GaussianNoiseANNComponent::build(unsigned int _input_size,
 					unsigned int _output_size,
-					MatrixFloatSet *weights_dict,
-					hash<string,ANNComponent*> &components_dict) {
+					AprilUtils::LuaTable &weights_dict,
+					AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     if (output_size == 0) output_size = input_size;
diff --git a/packages/ann/ann/c_src/gaussian_noise_component.h b/packages/ann/ann/c_src/gaussian_noise_component.h
index 2d21a5f71..3a1481a92 100644
--- a/packages/ann/ann/c_src/gaussian_noise_component.h
+++ b/packages/ann/ann/c_src/gaussian_noise_component.h
@@ -58,8 +58,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/hyperplane_component.cc b/packages/ann/ann/c_src/hyperplane_component.cc
index f799be570..bcad92c00 100644
--- a/packages/ann/ann/c_src/hyperplane_component.cc
+++ b/packages/ann/ann/c_src/hyperplane_component.cc
@@ -87,8 +87,7 @@ namespace ANN {
     bias->reset(it);
   }
 
-  void HyperplaneANNComponent::computeAllGradients(MatrixFloatSet
-						   *weight_grads_dict) {
+  void HyperplaneANNComponent::computeAllGradients(AprilUtils::LuaTable &weight_grads_dict) {
     dot_product->computeAllGradients(weight_grads_dict);
     bias->computeAllGradients(weight_grads_dict);
   }
@@ -113,8 +112,8 @@ namespace ANN {
   
   void HyperplaneANNComponent::build(unsigned int _input_size,
 				     unsigned int _output_size,
-				     MatrixFloatSet *weights_dict,
-				     hash<string,ANNComponent*> &components_dict) {
+				     AprilUtils::LuaTable &weights_dict,
+				     AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size, weights_dict, components_dict);
     //////////////////////////////////////////////////////////////
     if (input_size == 0 || output_size == 0)
@@ -126,12 +125,12 @@ namespace ANN {
     bias->build(output_size, output_size, weights_dict, components_dict);
   }
   
-  void HyperplaneANNComponent::copyWeights(MatrixFloatSet *weights_dict) {
+  void HyperplaneANNComponent::copyWeights(AprilUtils::LuaTable &weights_dict) {
     dot_product->copyWeights(weights_dict);
     bias->copyWeights(weights_dict);
   }
 
-  void HyperplaneANNComponent::copyComponents(hash<string,ANNComponent*> &components_dict) {
+  void HyperplaneANNComponent::copyComponents(AprilUtils::LuaTable &components_dict) {
     ANNComponent::copyComponents(components_dict);
     dot_product->copyComponents(components_dict);
     bias->copyComponents(components_dict);
diff --git a/packages/ann/ann/c_src/hyperplane_component.h b/packages/ann/ann/c_src/hyperplane_component.h
index 3cba062ae..4cb1d9d5d 100644
--- a/packages/ann/ann/c_src/hyperplane_component.h
+++ b/packages/ann/ann/c_src/hyperplane_component.h
@@ -66,15 +66,15 @@ namespace ANN {
     
     virtual void build(unsigned int input_size,
 		       unsigned int output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
     
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict);
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict);
 
-    virtual void copyComponents(AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+    virtual void copyComponents(AprilUtils::LuaTable &components_dict);
     
     virtual ANNComponent *getComponent(AprilUtils::string &name);
-    virtual void computeAllGradients(Basics::MatrixFloatSet *weight_grads_dict);
+    virtual void computeAllGradients(AprilUtils::LuaTable &weight_grads_dict);
     virtual void debugInfo() {
       ANNComponent::debugInfo();
       dot_product->debugInfo();
diff --git a/packages/ann/ann/c_src/join_component.cc b/packages/ann/ann/c_src/join_component.cc
index de7ff9ca6..2c6c81d4b 100644
--- a/packages/ann/ann/c_src/join_component.cc
+++ b/packages/ann/ann/c_src/join_component.cc
@@ -181,7 +181,7 @@ namespace ANN {
 		      static_cast<int>(output_size) :
 		      static_cast<int>(input_size) };
     int coords[2] = { 0, 0 };
-    full_mat = new MatrixFloat(2, sizes, CblasColMajor);
+    full_mat = new MatrixFloat(2, sizes);
 #ifdef USE_CUDA
     full_mat->setUseCuda(use_cuda);
 #endif
@@ -268,10 +268,10 @@ namespace ANN {
       components[i]->reset(it);
   }
   
-  void JoinANNComponent::computeAllGradients(MatrixFloatSet
-					     *weight_grads_dict) {
-    for (unsigned int c=0; c<components.size(); ++c)
+  void JoinANNComponent::computeAllGradients(AprilUtils::LuaTable &weight_grads_dict) {
+    for (unsigned int c=0; c<components.size(); ++c) {
       components[c]->computeAllGradients(weight_grads_dict);
+    }
   }
   
   ANNComponent *JoinANNComponent::clone() {
@@ -285,8 +285,8 @@ namespace ANN {
 
   void JoinANNComponent::build(unsigned int _input_size,
 			       unsigned int _output_size,
-			       MatrixFloatSet *weights_dict,
-			       hash<string,ANNComponent*> &components_dict) {
+			       AprilUtils::LuaTable &weights_dict,
+			       AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     //
@@ -325,12 +325,12 @@ namespace ANN {
       components[c]->setUseCuda(v);
   }
   
-  void JoinANNComponent::copyWeights(MatrixFloatSet *weights_dict) {
+  void JoinANNComponent::copyWeights(AprilUtils::LuaTable &weights_dict) {
     for (unsigned int i=0; i<components.size(); ++i)
       components[i]->copyWeights(weights_dict);
   }
 
-  void JoinANNComponent::copyComponents(hash<string,ANNComponent*> &components_dict) {
+  void JoinANNComponent::copyComponents(AprilUtils::LuaTable &components_dict) {
     ANNComponent::copyComponents(components_dict);
     for (unsigned int i=0; i<components.size(); ++i)
       components[i]->copyComponents(components_dict);
diff --git a/packages/ann/ann/c_src/join_component.h b/packages/ann/ann/c_src/join_component.h
index 52c5f390e..6b4b69a7b 100644
--- a/packages/ann/ann/c_src/join_component.h
+++ b/packages/ann/ann/c_src/join_component.h
@@ -91,15 +91,15 @@ namespace ANN {
     
     virtual void build(unsigned int input_size,
 		       unsigned int output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
     
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict);
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict);
 
-    virtual void copyComponents(AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+    virtual void copyComponents(AprilUtils::LuaTable &components_dict);
     
     virtual ANNComponent *getComponent(AprilUtils::string &name);
-    virtual void computeAllGradients(Basics::MatrixFloatSet *weight_grads_dict);
+    virtual void computeAllGradients(AprilUtils::LuaTable &weight_grads_dict);
     virtual void debugInfo() {
       ANNComponent::debugInfo();
       for (unsigned int i=0; i<components.size(); ++i)
diff --git a/packages/ann/ann/c_src/log_actf_component.cc b/packages/ann/ann/c_src/log_actf_component.cc
new file mode 100644
index 000000000..36c4a23be
--- /dev/null
+++ b/packages/ann/ann/c_src/log_actf_component.cc
@@ -0,0 +1,61 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2013, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#include "unused_variable.h"
+#include "cblas_headers.h"
+#include "log_actf_component.h"
+
+using namespace AprilMath;
+using namespace AprilMath::MatrixExt::Operations;
+using namespace AprilUtils;
+using namespace Basics;
+
+namespace ANN {
+
+  LogActfANNComponent::LogActfANNComponent(const char *name) :
+    ActivationFunctionANNComponent(name) { }
+  LogActfANNComponent::~LogActfANNComponent() { }
+
+  void LogActfANNComponent::applyActivation(MatrixFloat *input_units,
+					    MatrixFloat *output_units) {
+    matLog(input_units, output_units);
+  }
+
+  void LogActfANNComponent::multiplyDerivatives(MatrixFloat *input_units,
+                                                MatrixFloat *output_units,
+                                                MatrixFloat *input_errors,
+                                                MatrixFloat *output_errors) {
+    UNUSED_VARIABLE(output_units);
+    matDiv(input_units, 1.0f, output_errors);
+    matCmul(output_errors, input_errors);
+  }
+
+  ANNComponent *LogActfANNComponent::clone() {
+    LogActfANNComponent *obj = new LogActfANNComponent(name.c_str());
+    return obj;
+  }
+
+  char *LogActfANNComponent::toLuaString() {
+    buffer_list buffer;
+    buffer.printf("ann.components.actf.log{ name='%s' }", name.c_str());
+    return buffer.to_string(buffer_list::NULL_TERMINATED);
+  }
+
+}
diff --git a/packages/ann/ann/c_src/log_actf_component.h b/packages/ann/ann/c_src/log_actf_component.h
new file mode 100644
index 000000000..c98e045dd
--- /dev/null
+++ b/packages/ann/ann/c_src/log_actf_component.h
@@ -0,0 +1,50 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2013, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#ifndef LOGACTFCOMPONENT_H
+#define LOGACTFCOMPONENT_H
+
+#include "activation_function_component.h"
+#include "ann_component.h"
+#include "gpu_mirrored_memory_block.h"
+
+namespace ANN {
+
+  /// A component which computes the Log activation function.
+  class LogActfANNComponent : public ActivationFunctionANNComponent {
+    APRIL_DISALLOW_COPY_AND_ASSIGN(LogActfANNComponent);
+    
+  protected:
+    virtual void applyActivation(Basics::MatrixFloat *input_units,
+				 Basics::MatrixFloat *output_units);
+    virtual void multiplyDerivatives(Basics::MatrixFloat *input_units,
+				     Basics::MatrixFloat *output_units,
+				     Basics::MatrixFloat *input_errors,
+				     Basics::MatrixFloat *output_errors);
+  public:
+    LogActfANNComponent(const char *name);
+    virtual ~LogActfANNComponent();
+    virtual ANNComponent *clone();
+
+    virtual char *toLuaString();
+  };
+}
+
+#endif // LOGACTFCOMPONENT_H
diff --git a/packages/ann/ann/c_src/matrix_component.h b/packages/ann/ann/c_src/matrix_component.h
index 1c8d56503..d8f177dc1 100644
--- a/packages/ann/ann/c_src/matrix_component.h
+++ b/packages/ann/ann/c_src/matrix_component.h
@@ -106,10 +106,10 @@ namespace ANN {
     /*
       virtual void build(unsigned int input_size,
       unsigned int output_size,
-      MatrixFloatSet *weights_dict,
-      hash<string,ANNComponent*> &components_dict) = 0;
+      AprilUtils::LuaTable &weights_dict,
+      AprilUtils::LuaTable &components_dict) = 0;
     */
-    // virtual void copyWeights(MatrixFloatSet *weights_dict) = 0;
+    // virtual void copyWeights(AprilUtils::LuaTable &weights_dict) = 0;
     // virtual char *toLuaString() = 0;
   };
   
diff --git a/packages/ann/ann/c_src/matrix_input_switch_component.cc b/packages/ann/ann/c_src/matrix_input_switch_component.cc
index 1c4a95c61..921dceb21 100644
--- a/packages/ann/ann/c_src/matrix_input_switch_component.cc
+++ b/packages/ann/ann/c_src/matrix_input_switch_component.cc
@@ -250,8 +250,9 @@ namespace ANN {
     else privateSparseReset(it);
   }
 
-  void MatrixInputSwitchANNComponent::computeGradients(AprilUtils::SharedPtr<MatrixFloat> & grads_mat) {
-    if (!is_sparse_input) privateDenseComputeGradients(grads_mat);
-    else privateSparseComputeGradients(grads_mat);
+  void MatrixInputSwitchANNComponent::computeGradients(const char *name,
+                                                       AprilUtils::LuaTable &weight_grads_dict) {
+    if (!is_sparse_input) privateDenseComputeGradients(name, weight_grads_dict);
+    else privateSparseComputeGradients(name, weight_grads_dict);
   }
 }
diff --git a/packages/ann/ann/c_src/matrix_input_switch_component.h b/packages/ann/ann/c_src/matrix_input_switch_component.h
index b6abc326a..52d332650 100644
--- a/packages/ann/ann/c_src/matrix_input_switch_component.h
+++ b/packages/ann/ann/c_src/matrix_input_switch_component.h
@@ -76,19 +76,21 @@ namespace ANN {
       return sparse_error_output->getMatrix();
     }
     
-    virtual void computeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grads_mat);
+    virtual void computeGradients(const char *name, AprilUtils::LuaTable &weight_grads_dict);
 
     // Abstract methods
 
     virtual Basics::MatrixFloat *privateDoDenseForward(Basics::MatrixFloat *input, bool during_training) = 0;
     virtual Basics::MatrixFloat *privateDoDenseBackprop(Basics::MatrixFloat *input_error) = 0;
     virtual void privateDenseReset(unsigned int it=0) = 0;
-    virtual void privateDenseComputeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grads_mat) = 0;
+    virtual void privateDenseComputeGradients(const char *name,
+                                              AprilUtils::LuaTable &weight_grads_dict) = 0;
 
     virtual Basics::MatrixFloat *privateDoSparseForward(Basics::SparseMatrixFloat *input, bool during_training) = 0;
     virtual Basics::SparseMatrixFloat *privateDoSparseBackprop(Basics::MatrixFloat *input_error) = 0;
     virtual void privateSparseReset(unsigned int it=0) = 0;
-    virtual void privateSparseComputeGradients(AprilUtils::SharedPtr<Basics::MatrixFloat> & grads_mat) = 0;
+    virtual void privateSparseComputeGradients(const char *name,
+                                               AprilUtils::LuaTable &weight_grads_dict) = 0;
 
   public:
     MatrixInputSwitchANNComponent(const char *name, const char *weights_name,
@@ -121,10 +123,10 @@ namespace ANN {
     /*
       virtual void build(unsigned int input_size,
       unsigned int output_size,
-      MatrixFloatSet *weights_dict,
-      hash<string,ANNComponent*> &components_dict) = 0;
+      AprilUtils::LuaTable &weights_dict,
+      AprilUtils::LuaTable &components_dict) = 0;
     */
-    // virtual void copyWeights(MatrixFloatSet *weights_dict) = 0;
+    // virtual void copyWeights(AprilUtils::LuaTable &weights_dict) = 0;
     // virtual char *toLuaString() = 0;
     
   };
diff --git a/packages/ann/ann/c_src/maxpooling_component.cc b/packages/ann/ann/c_src/maxpooling_component.cc
index f4e0ef86c..ce9bcecef 100644
--- a/packages/ann/ann/c_src/maxpooling_component.cc
+++ b/packages/ann/ann/c_src/maxpooling_component.cc
@@ -136,7 +136,7 @@ namespace ANN {
     const int *input_dims = input_mat->getDimPtr();
     initializeArrays(input_dims);
     MatrixFloat *output_mat;
-    output_mat = new MatrixFloat(input_num_dims+1, output_dims, CblasColMajor);
+    output_mat = new MatrixFloat(input_num_dims+1, output_dims);
     IncRef(output_mat);
 #ifdef USE_CUDA
     output_mat->setUseCuda(use_cuda);
diff --git a/packages/ann/ann/c_src/maxpooling_component.h b/packages/ann/ann/c_src/maxpooling_component.h
index 40ad86431..24109c830 100644
--- a/packages/ann/ann/c_src/maxpooling_component.h
+++ b/packages/ann/ann/c_src/maxpooling_component.h
@@ -57,7 +57,7 @@ namespace ANN {
     int *input_window_size;
     /// Number of steps of the convolution window, input_num_dims + 1
     int *input_window_num_steps;
-    /// Order for traversing the input data, prepared for col-major order
+    /// Order for traversing the input data
     int *input_window_order_step;
     /// Translates the input window into a bi-dimensional matrix
     int *input_window_rewrap;
@@ -68,7 +68,7 @@ namespace ANN {
     int *output_window_step;
     /// Number of steps of the convolution window, input_num_dims + 1
     int *output_window_num_steps;
-    /// Order for traversing the input data, prepared for col-major order
+    /// Order for traversing the input data
     int *output_window_order_step;
     /// Translates the output window into a bi-dimensional matrix
     int *output_window_rewrap;
diff --git a/packages/ann/ann/c_src/pca_whitening_component.cc b/packages/ann/ann/c_src/pca_whitening_component.cc
index d2d496267..fe9a1f21b 100644
--- a/packages/ann/ann/c_src/pca_whitening_component.cc
+++ b/packages/ann/ann/c_src/pca_whitening_component.cc
@@ -49,8 +49,6 @@ namespace ANN {
 			getInputSize(), getOutputSize(),
 			true),
     takeN(takeN) {
-    if (U->getMajorOrder() != CblasColMajor)
-      ERROR_EXIT(128, "Incorrect U matrix major order, needed col_major\n");
     if (U->getNumDim() != 2)
       ERROR_EXIT(128, "Needs a bi-dimensional matrix as U argument\n");
     if ( !S->isDiagonal() )
@@ -76,9 +74,11 @@ namespace ANN {
     }
     delete aux_mat;
     //
-    matrix_set.insert(WEIGHTS_NAME, U_S_epsilon);
-    hash<string,ANNComponent*> components_dict;
-    dot_product_encoder.build(0, 0, &matrix_set, components_dict);
+    matrix_set.put(WEIGHTS_NAME, U_S_epsilon);
+    AprilUtils::LuaTable components_dict;
+    dot_product_encoder.build(0, 0, matrix_set, components_dict);
+    // dot_product_encoder is a by-value member: keep an extra reference so a DecRef done via LuaTable presumably never frees it
+    IncRef(&dot_product_encoder);
   }
   
   PCAWhiteningANNComponent::~PCAWhiteningANNComponent() {
@@ -109,8 +109,8 @@ namespace ANN {
   
   void PCAWhiteningANNComponent::build(unsigned int _input_size,
 				       unsigned int _output_size,
-				       MatrixFloatSet *weights_dict,
-				       hash<string,ANNComponent*> &components_dict) {
+				       AprilUtils::LuaTable &weights_dict,
+				       AprilUtils::LuaTable &components_dict) {
     // TODO: CHECK INPUT OUTPUT SIZES
     UNUSED_VARIABLE(_input_size);
     UNUSED_VARIABLE(_output_size);
@@ -120,13 +120,13 @@ namespace ANN {
   
   char *PCAWhiteningANNComponent::toLuaString() {
     SharedPtr<CStringStream> stream(new CStringStream());
-    AprilUtils::HashTableOptions options;
-    options.putBoolean("ascii", false);
+    AprilUtils::LuaTable options;
+    options.put("ascii", false);
     stream->printf("ann.components.pca_whitening{ name='%s', U=matrix.fromString[[",
                    name.c_str());
-    U->write(stream.get(), &options);
+    U->write(stream.get(), options);
     stream->put("]], S=matrix.sparse.fromString[[");
-    S->write(stream.get(), &options);
+    S->write(stream.get(), options);
     stream->printf("]], epsilon=%g, takeN=%u, }", epsilon, takeN);
     stream->put("\0",1); // forces a \0 at the end of the buffer
     return stream->releaseString();
diff --git a/packages/ann/ann/c_src/pca_whitening_component.h b/packages/ann/ann/c_src/pca_whitening_component.h
index 87dece4d9..845cc45c3 100644
--- a/packages/ann/ann/c_src/pca_whitening_component.h
+++ b/packages/ann/ann/c_src/pca_whitening_component.h
@@ -28,7 +28,6 @@
 #include "token_vector.h"
 #include "token_matrix.h"
 #include "dot_product_component.h"
-#include "matrixFloatSet.h"
 
 namespace ANN {
 
@@ -41,7 +40,7 @@ namespace ANN {
     Basics::MatrixFloat *U_S_epsilon; //< matrix for dot_product_component
     float epsilon;  //< regularization
     DotProductANNComponent dot_product_encoder; //< Applies the transformation
-    Basics::MatrixFloatSet matrix_set; //< Auxiliary for dot_product_encoder build
+    AprilUtils::LuaTable matrix_set; //< Auxiliary for dot_product_encoder build
     unsigned int takeN;
     
   public:
@@ -67,8 +66,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
     unsigned int getTakeN() const { return takeN; }
diff --git a/packages/ann/ann/c_src/rewrap_component.cc b/packages/ann/ann/c_src/rewrap_component.cc
index 631b9aec5..0fabb4476 100644
--- a/packages/ann/ann/c_src/rewrap_component.cc
+++ b/packages/ann/ann/c_src/rewrap_component.cc
@@ -78,8 +78,8 @@ namespace ANN {
   
   void RewrapANNComponent::build(unsigned int _input_size,
 				 unsigned int _output_size,
-				 MatrixFloatSet *weights_dict,
-				 hash<string,ANNComponent*> &components_dict) {
+				 AprilUtils::LuaTable &weights_dict,
+				 AprilUtils::LuaTable &components_dict) {
     unsigned int sz = 1;
     for (int i=1; i<this->n; ++i) sz *= rewrap_dims[i];
     //
diff --git a/packages/ann/ann/c_src/rewrap_component.h b/packages/ann/ann/c_src/rewrap_component.h
index 8c4de0005..359c74f9e 100644
--- a/packages/ann/ann/c_src/rewrap_component.h
+++ b/packages/ann/ann/c_src/rewrap_component.h
@@ -61,8 +61,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/salt_and_pepper_component.cc b/packages/ann/ann/c_src/salt_and_pepper_component.cc
index 66c268eeb..86f134910 100644
--- a/packages/ann/ann/c_src/salt_and_pepper_component.cc
+++ b/packages/ann/ann/c_src/salt_and_pepper_component.cc
@@ -68,8 +68,7 @@ namespace ANN {
     // new  output to fit the bunch
     AssignRef(output,new TokenMatrixFloat(input->getMatrix()->clone()));
     MatrixFloat *output_mat = output->getMatrix();
-    april_assert(output_mat->getMajorOrder() == CblasColMajor);
-    for (MatrixFloat::col_major_iterator it(output_mat->begin());
+    for (MatrixFloat::iterator it(output_mat->begin());
 	 it != output_mat->end();
 	 ++it) {
       float p = random->rand();
@@ -113,8 +112,8 @@ namespace ANN {
 
   void SaltAndPepperANNComponent::build(unsigned int _input_size,
 					unsigned int _output_size,
-					MatrixFloatSet *weights_dict,
-					hash<string,ANNComponent*> &components_dict) {
+					AprilUtils::LuaTable &weights_dict,
+					AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
     if (output_size == 0) output_size = input_size;
diff --git a/packages/ann/ann/c_src/salt_and_pepper_component.h b/packages/ann/ann/c_src/salt_and_pepper_component.h
index c4c6724a8..b0cc22541 100644
--- a/packages/ann/ann/c_src/salt_and_pepper_component.h
+++ b/packages/ann/ann/c_src/salt_and_pepper_component.h
@@ -61,8 +61,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/select_component.cc b/packages/ann/ann/c_src/select_component.cc
index 299b23c98..ce4146d28 100644
--- a/packages/ann/ann/c_src/select_component.cc
+++ b/packages/ann/ann/c_src/select_component.cc
@@ -87,8 +87,8 @@ namespace ANN {
   
   void SelectANNComponent::build(unsigned int _input_size,
 				 unsigned int _output_size,
-				 MatrixFloatSet *weights_dict,
-				 hash<string,ANNComponent*> &components_dict) {
+				 AprilUtils::LuaTable &weights_dict,
+				 AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size,
 			weights_dict, components_dict);
   }
diff --git a/packages/ann/ann/c_src/select_component.h b/packages/ann/ann/c_src/select_component.h
index 8d378a6e6..77c37e943 100644
--- a/packages/ann/ann/c_src/select_component.h
+++ b/packages/ann/ann/c_src/select_component.h
@@ -51,8 +51,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/slice_component.cc b/packages/ann/ann/c_src/slice_component.cc
index 325fdc4d9..edd015eef 100644
--- a/packages/ann/ann/c_src/slice_component.cc
+++ b/packages/ann/ann/c_src/slice_component.cc
@@ -96,8 +96,8 @@ namespace ANN {
   
   void SliceANNComponent::build(unsigned int _input_size,
 				unsigned int _output_size,
-				MatrixFloatSet *weights_dict,
-				hash<string,ANNComponent*> &components_dict) {
+				AprilUtils::LuaTable &weights_dict,
+				AprilUtils::LuaTable &components_dict) {
     unsigned int sz = mult(slice_size+1, n-1);
     //
     if (_output_size != 0 && _output_size != sz)
diff --git a/packages/ann/ann/c_src/slice_component.h b/packages/ann/ann/c_src/slice_component.h
index 8a7c5ef56..48affcd00 100644
--- a/packages/ann/ann/c_src/slice_component.h
+++ b/packages/ann/ann/c_src/slice_component.h
@@ -55,8 +55,8 @@ namespace ANN {
 
     virtual void build(unsigned int _input_size,
 		       unsigned int _output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
 
     virtual char *toLuaString();
   };
diff --git a/packages/ann/ann/c_src/sparse_matrix_component.h b/packages/ann/ann/c_src/sparse_matrix_component.h
index 810309a13..f130a729a 100644
--- a/packages/ann/ann/c_src/sparse_matrix_component.h
+++ b/packages/ann/ann/c_src/sparse_matrix_component.h
@@ -85,7 +85,7 @@ namespace ANN {
      */
     virtual void privateReset(unsigned int it=0) = 0;
     
-    // virtual void computeGradients(AprilUtils::SharedPtr<MatrixFloat> & grads_mat) = 0;
+    // virtual void computeGradients(const char *name, AprilUtils::LuaTable &weight_grads_dict) = 0;
     
   public:
     VirtualSparseMatrixANNComponent(const char *name, const char *weights_name,
@@ -106,10 +106,10 @@ namespace ANN {
     /*
       virtual void build(unsigned int input_size,
       unsigned int output_size,
-      MatrixFloatSet *weights_dict,
-      hash<string,ANNComponent*> &components_dict) = 0;
+      AprilUtils::LuaTable &weights_dict,
+      AprilUtils::LuaTable &components_dict) = 0;
     */
-    // virtual void copyWeights(MatrixFloatSet *weights_dict) = 0;
+    // virtual void copyWeights(AprilUtils::LuaTable &weights_dict) = 0;
     // virtual char *toLuaString() = 0;
   };
   
diff --git a/packages/ann/ann/c_src/stack_component.cc b/packages/ann/ann/c_src/stack_component.cc
index 2987806a2..ef5ea78ee 100644
--- a/packages/ann/ann/c_src/stack_component.cc
+++ b/packages/ann/ann/c_src/stack_component.cc
@@ -90,10 +90,10 @@ namespace ANN {
       components[c]->reset(it);
   }
   
-  void StackANNComponent::computeAllGradients(MatrixFloatSet
-					      *weight_grads_dict) {
-    for (unsigned int c=0; c<components.size(); ++c)
+  void StackANNComponent::computeAllGradients(AprilUtils::LuaTable &weight_grads_dict) {
+    for (unsigned int c=0; c<components.size(); ++c) {
       components[c]->computeAllGradients(weight_grads_dict);
+    }
   }
 
   ANNComponent *StackANNComponent::clone() {
@@ -113,8 +113,8 @@ namespace ANN {
   
   void StackANNComponent::build(unsigned int _input_size,
 				unsigned int _output_size,
-				MatrixFloatSet *weights_dict,
-				hash<string,ANNComponent*> &components_dict) {
+				AprilUtils::LuaTable &weights_dict,
+				AprilUtils::LuaTable &components_dict) {
     ANNComponent::build(_input_size, _output_size, weights_dict, components_dict);
     //////////////////////////////////////////////////////////////
     if (components.size() == 0)
@@ -145,12 +145,12 @@ namespace ANN {
     */
   }
   
-  void StackANNComponent::copyWeights(MatrixFloatSet *weights_dict) {
+  void StackANNComponent::copyWeights(AprilUtils::LuaTable &weights_dict) {
     for (unsigned int c=0; c<components.size(); ++c)
       components[c]->copyWeights(weights_dict);
   }
 
-  void StackANNComponent::copyComponents(hash<string,ANNComponent*> &components_dict) {
+  void StackANNComponent::copyComponents(AprilUtils::LuaTable &components_dict) {
     ANNComponent::copyComponents(components_dict);
     for (unsigned int c=0; c<components.size(); ++c)
       components[c]->copyComponents(components_dict);
diff --git a/packages/ann/ann/c_src/stack_component.h b/packages/ann/ann/c_src/stack_component.h
index a5e26c298..eae7bee66 100644
--- a/packages/ann/ann/c_src/stack_component.h
+++ b/packages/ann/ann/c_src/stack_component.h
@@ -82,15 +82,15 @@ namespace ANN {
     
     virtual void build(unsigned int input_size,
 		       unsigned int output_size,
-		       Basics::MatrixFloatSet *weights_dict,
-		       AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+		       AprilUtils::LuaTable &weights_dict,
+		       AprilUtils::LuaTable &components_dict);
     
-    virtual void copyWeights(Basics::MatrixFloatSet *weights_dict);
+    virtual void copyWeights(AprilUtils::LuaTable &weights_dict);
 
-    virtual void copyComponents(AprilUtils::hash<AprilUtils::string,ANNComponent*> &components_dict);
+    virtual void copyComponents(AprilUtils::LuaTable &components_dict);
     
     virtual ANNComponent *getComponent(AprilUtils::string &name);
-    virtual void computeAllGradients(Basics::MatrixFloatSet *weight_grads_dict);
+    virtual void computeAllGradients(AprilUtils::LuaTable &weight_grads_dict);
     virtual void debugInfo() {
       ANNComponent::debugInfo();
       for (unsigned int i=0; i<components.size(); ++i) {
diff --git a/packages/ann/ann/c_src/zca_whitening_component.cc b/packages/ann/ann/c_src/zca_whitening_component.cc
index 6af8bd541..fa468fda0 100644
--- a/packages/ann/ann/c_src/zca_whitening_component.cc
+++ b/packages/ann/ann/c_src/zca_whitening_component.cc
@@ -53,9 +53,11 @@ namespace ANN {
       int sizes[2] = { U->getDimSize(0), static_cast<int>(takeN) };
       aux_U = new MatrixFloat(this->U, coords, sizes, true);
     }
-    matrix_set.insert(WEIGHTS_NAME, aux_U);
-    hash<string,ANNComponent*> components_dict;
-    dot_product_decoder.build(0, 0, &matrix_set, components_dict);
+    matrix_set.put(WEIGHTS_NAME, aux_U);
+    AprilUtils::LuaTable components_dict;
+    dot_product_decoder.build(0, 0, matrix_set, components_dict);
+    // avoid problems with DecRef in LuaTable
+    IncRef(&dot_product_decoder);
   }
   
   ZCAWhiteningANNComponent::~ZCAWhiteningANNComponent() {
@@ -82,13 +84,13 @@ namespace ANN {
   
   char *ZCAWhiteningANNComponent::toLuaString() {
     SharedPtr<CStringStream> stream(new CStringStream());
-    AprilUtils::HashTableOptions options;
-    options.putBoolean("ascii", false);
+    AprilUtils::LuaTable options;
+    options.put("ascii", false);
     stream->printf("ann.components.zca_whitening{ name='%s', U=matrix.fromString[[",
                    name.c_str());
-    U->write(stream.get(), &options);
+    U->write(stream.get(), options);
     stream->put("]], S=matrix.sparse.fromString[[");
-    S->write(stream.get(), &options);
+    S->write(stream.get(), options);
     stream->printf("]], epsilon=%g, takeN=%u, }", epsilon, getTakeN());
     stream->put("\0",1); // forces a \0 at the end of the buffer
     return stream->releaseString();
diff --git a/packages/ann/ann/lua_src/annbase.lua b/packages/ann/ann/lua_src/annbase.lua
index 1351456e9..392328ba5 100644
--- a/packages/ann/ann/lua_src/annbase.lua
+++ b/packages/ann/ann/lua_src/annbase.lua
@@ -66,6 +66,7 @@ function ann_wrapper_methods:get_error_output()
 end
 
 function ann_wrapper_methods:forward(input, during_training)
+  self:reset()
   self.input  = input
   self.output = self:forward_function(input, during_training)
   return self.output
@@ -86,14 +87,16 @@ function ann_wrapper_methods:reset(n)
 end
 
 function ann_wrapper_methods:compute_gradients(dict)
-  local dict = wrap_matrices(dict or {})
+  local dict = dict or {}
   self:compute_gradients_function(dict)
   return dict
 end
 
-function ann_wrapper_methods:build()
-  -- already built
-  return self,self.weights,matrix.dict()
+function ann_wrapper_methods:build(params)
+  local params = params or {} -- the previous build() took no arguments; keep that call form working
+  -- TODO: check params.input/params.output sizes (only params.weights is used for now)
+  if params.weights then matrix.dict.replace( self.weights, params.weights ) end
+  return self,self.weights,{}
+end
 
 function ann_wrapper_methods:copy_weights()
@@ -101,7 +104,7 @@ function ann_wrapper_methods:copy_weights()
 end
 
 function ann_wrapper_methods:copy_components()
-  return matrix.dict()
+  return {}
 end
 
 function ann_wrapper_methods:to_lua_string()
@@ -455,6 +458,7 @@ april_set_doc(ann.components.base,
 		    "Components has options (as learning_rate, momentum, ...)",
 		    "which modify they behaviour.",
 		    "Tokens are the basic data which components interchange.",
+                    "Matrix types are a kind of Token, so it is transparent.",
 		    "The ANNs are trained following gradient descent algorithm,",
 		    "so each component has four main properties: input, output,",
 		    "error_input and error_output.",
@@ -543,7 +547,7 @@ april_set_doc(ann.components.base.."get_input",
 		class="method",
 		summary="Returns the token at component input",
 		outputs = {
-		  "A token or nil",
+		  "A token or nil (usually a matrix)",
 		}
 	      })
 
@@ -554,7 +558,7 @@ april_set_doc(ann.components.base.."get_output",
 		class="method",
 		summary="Returns the token at component output",
 		outputs = {
-		  "A token or nil",
+		  "A token or nil (usually a matrix)",
 		}
 	      })
 
@@ -570,7 +574,7 @@ april_set_doc(ann.components.base.."get_error_input",
 		  "in reverse order (from the output)."
 		},
 		outputs = {
-		  "A token or nil",
+		  "A token or nil (usually a matrix)",
 		}
 	      })
 
@@ -586,7 +590,7 @@ april_set_doc(ann.components.base.."get_error_output",
 		  "in reverse order (to the input).",
 		},
 		outputs = {
-		  "A token or nil",
+		  "A token or nil (usually a matrix)",
 		}
 	      })
 
@@ -597,7 +601,7 @@ april_set_doc(ann.components.base.."forward",
 		class="method",
 		summary="Computes forward step with the given token",
 		params={
-		  "An input token",
+		  "An input token (usually a matrix)",
 		  { "A boolean indicating if the forward is during_training or not.",
 		    "This information is used by ann.components.actf objects to",
 		    "apply dropout during training, and to halve the activation",
@@ -605,7 +609,7 @@ april_set_doc(ann.components.base.."forward",
 		    "is false.", }
 		},
 		outputs = {
-		  "An output token",
+		  "An output token (usually a matrix)",
 		}
 	      })
 
@@ -620,10 +624,10 @@ april_set_doc(ann.components.base.."backprop",
 		  "This method is only valid after forward."
 		},
 		params={
-		  "An error input token"
+		  "An error input token (usually a matrix)"
 		},
 		outputs = {
-		  "An error output token",
+		  "An error output token (usually a matrix)",
 		}
 	      })
 
@@ -728,7 +732,7 @@ april_set_doc(ann.components.base.."copy_weights",
 		class="method",
 		summary="Returns the dictionary weights_name=>ann.connections",
 		outputs= {
-		  { "A matrix.dict objecti all the weights_name=>matrix found",
+		  { "A matrix table weights_name=>matrix with matrices found",
 		    "at the components hierarchy."},
 		}
 	      })
diff --git a/packages/ann/ann/test/test-components.lua b/packages/ann/ann/test/test-components.lua
index 68db851e7..5adbba6eb 100644
--- a/packages/ann/ann/test/test-components.lua
+++ b/packages/ann/ann/test/test-components.lua
@@ -7,6 +7,8 @@ local T       = utest.test
 local verbose = false
 local rnd     = random(1234)
 
+utest.select_tests(arg)
+
 function check_component(component_builder_func,loss_name,i,o,b,desc,norm)
   if verbose then
     fprintf(io.stderr, "\nGradients %s (%d,%d,%d,%s)\n",
@@ -17,13 +19,13 @@ function check_component(component_builder_func,loss_name,i,o,b,desc,norm)
   trainer = trainable.supervised_trainer(c, ann.loss[loss_name](), b)
   trainer:build()
   trainer:randomize_weights{ inf = -1, sup = 1, random = rnd }
-  input  = matrix.col_major(b, i):uniformf(-1,1,rnd)
+  input  = matrix(b, i):uniformf(-1,1,rnd)
   if loss_name == "mse" then
-    target = matrix.col_major(b, o):uniformf(-1,1,rnd)
+    target = matrix(b, o):uniformf(-1,1,rnd)
   elseif not norm and (loss_name == "batch_fmeasure_micro_avg" or loss_name == "batch_fmeasure_macro_avg") then
-    target = matrix.col_major(b, o):uniform(0,1,rnd)
+    target = matrix(b, o):uniform(0,1,rnd)
   else
-    target = matrix.col_major(b, o):uniformf(0,1,rnd)
+    target = matrix(b, o):uniformf(0,1,rnd)
   end
   if norm then
     apply(function(m) m:exp() m:scal(1/m:sum()) end,
@@ -43,13 +45,13 @@ function check_component(component_builder_func,loss_name,i,o,b,desc,norm)
     for name,c in trainer:iterate_components() do
       print("---- " .. name .. " ----")
       print("Input matrix")
-      print(c:get_input():get_matrix())
+      print(c:get_input())
       print("Output matrix")
-      print(c:get_output():get_matrix())
+      print(c:get_output())
       print("Error input matrix")
-      print(c:get_error_input():get_matrix())
+      print(c:get_error_input())
       print("Error output matrix")
-      print(c:get_error_output():get_matrix())
+      print(c:get_error_output())
     end
     error(string.format("Error at %s (%d,%d,%d,%s) !!!",desc,i,o,b,loss_name))
   end
@@ -373,7 +375,7 @@ T("DOTPRODUCT + HARDTANH TEST",
   function()
     check(function()
         for i=1,4 do
-          for o=1,4 do
+          for o=1,3 do
             for b=1,4 do
               check_component(function()
                   return ann.components.stack():
diff --git a/packages/ann/ann/test/test-convolution-digits-output.log b/packages/ann/ann/test/test-convolution-digits-output.log
index f96f837a1..afad85ba2 100644
--- a/packages/ann/ann/test/test-convolution-digits-output.log
+++ b/packages/ann/ann/test/test-convolution-digits-output.log
@@ -1,103 +1,103 @@
-# Initial validation error:	2.3027782440186
-   1  2.3091731 2.3016419      0.3421556 0.0214589
-   2  2.3075607 2.3011065      0.3442202 0.0423757
-   3  2.3070073 2.3003175      0.3478714 0.0484170
-   4  2.3039093 2.3004913      0.3545533 0.0605133
-   5  2.3038447 2.2976985      0.3701778 0.0318623
-   6  2.2998519 2.2921381      0.4184297 0.0485013
-   7  2.2937472 2.2827849      0.4860259 0.0329425
-   8  2.2787824 2.2604604      0.6039371 0.0652767
-   9  2.2354033 2.1766105      0.8277379 0.1225157
-  10  2.0284715 1.8138458      1.3124944 0.2083271
-  11  1.5871761 1.4797781      1.5869501 0.3219261
-  12  1.4393833 1.1906155      1.6487943 0.3903195
-  13  1.1372550 1.0119259      1.7389475 0.4257115
-  14  1.0740784 0.9117533      1.8541732 0.4480246
-  15  0.8299662 0.7872189      1.9390054 0.5003507
-  16  0.6222334 0.5738375      1.9802171 0.4926192
-  17  0.5268123 0.4727378      2.0301979 0.5234563
-  18  0.4643472 0.4698027      2.0518024 0.5252032
-  19  0.3715360 0.3621606      2.0763621 0.5243848
-  20  0.3242205 0.3108734      2.1228282 0.5251353
-  21  0.2730467 0.2684864      2.1432869 0.5249929
-  22  0.2867180 0.2299688      2.1643140 0.5248441
-  23  0.2375728 0.2575147      2.2009647 0.5298973
-  24  0.2329835 0.2167354      2.2314546 0.5275757
-  25  0.2081724 0.1923387      2.2511492 0.5248268
-  26  0.1844451 0.1659556      2.2897284 0.5304404
-  27  0.1692892 0.1684320      2.3112116 0.5234334
-  28  0.1758983 0.1467148      2.3175840 0.5255201
-  29  0.1543282 0.1559882      2.3393207 0.5295891
-  30  0.1519023 0.1316371      2.3546882 0.5283211
-  31  0.1408704 0.1359839      2.3752663 0.5267687
-  32  0.1349234 0.1164398      2.3865254 0.5285925
-  33  0.1301739 0.1214613      2.4028389 0.5272004
-  34  0.1266124 0.1318505      2.4107161 0.5275714
-  35  0.1130186 0.1032424      2.4224837 0.5271062
-  36  0.1128689 0.1134973      2.4321771 0.5277860
-  37  0.1168288 0.1148375      2.4392927 0.5297869
-  38  0.1083871 0.1094492      2.4454532 0.5258458
-  39  0.1002430 0.1014217      2.4538875 0.5296689
-  40  0.0991368 0.1062543      2.4592726 0.5275159
-  41  0.0929686 0.1024247      2.4692130 0.5288980
-  42  0.0955258 0.0880626      2.4752336 0.5285102
-  43  0.0958653 0.0988648      2.4851060 0.5289943
-  44  0.0891843 0.0936094      2.4909050 0.5281674
-  45  0.0844175 0.0988650      2.5032592 0.5293697
-  46  0.0837642 0.0938246      2.5074754 0.5286942
-  47  0.0823673 0.0858169      2.5146317 0.5289074
-  48  0.0801467 0.0881427      2.5200601 0.5280017
-  49  0.0780059 0.0859741      2.5285339 0.5280526
-  50  0.0786663 0.0865687      2.5341034 0.5283197
-  51  0.0750520 0.0918086      2.5378325 0.5292972
-  52  0.0742237 0.0878863      2.5405757 0.5291492
-  53  0.0748312 0.0845108      2.5515242 0.5288186
-  54  0.0740691 0.0868368      2.5512390 0.5284169
-  55  0.0786659 0.0880422      2.5557604 0.5288873
-  56  0.0715123 0.0816200      2.5601623 0.5287928
-  57  0.0695872 0.0832472      2.5633242 0.5286641
-  58  0.0666201 0.0812546      2.5656910 0.5288029
-  59  0.0658695 0.0809537      2.5690939 0.5290528
-  60  0.0657818 0.0809261      2.5731125 0.5286253
-  61  0.0664504 0.0802357      2.5772765 0.5286083
-  62  0.0654580 0.0785752      2.5788629 0.5287585
-  63  0.0691944 0.0819406      2.5812109 0.5289132
-  64  0.0641737 0.0810147      2.5834150 0.5289176
-  65  0.0670473 0.0800867      2.5858290 0.5287631
-  66  0.0632108 0.0792683      2.5879066 0.5288982
-  67  0.0625084 0.0782366      2.5900888 0.5288855
-  68  0.0626488 0.0782983      2.5926373 0.5288792
-  69  0.0626763 0.0777918      2.5937855 0.5288222
-  70  0.0610384 0.0770871      2.5959792 0.5287567
-  71  0.0606044 0.0777491      2.5975037 0.5288118
-  72  0.0610456 0.0774639      2.5992379 0.5287875
-  73  0.0607158 0.0777595      2.6003478 0.5288098
-  74  0.0589991 0.0770674      2.6016772 0.5288237
-  75  0.0600297 0.0767250      2.6029975 0.5287988
-  76  0.0593429 0.0770889      2.6041057 0.5287685
-  77  0.0599257 0.0763923      2.6053979 0.5287822
-  78  0.0597628 0.0773198      2.6065853 0.5287585
-  79  0.0582187 0.0776077      2.6072805 0.5287615
-  80  0.0587276 0.0774656      2.6083548 0.5287727
-  81  0.0624181 0.0771174      2.6094499 0.5287409
-  82  0.0583664 0.0773100      2.6102703 0.5287513
-  83  0.0573773 0.0768071      2.6112690 0.5287381
-  84  0.0575434 0.0763570      2.6122327 0.5287266
-  85  0.0571263 0.0762837      2.6129329 0.5287198
-  86  0.0575778 0.0766848      2.6135473 0.5287221
-  87  0.0575646 0.0765896      2.6142757 0.5287187
-  88  0.0565141 0.0764634      2.6149628 0.5287086
-  89  0.0570548 0.0762230      2.6155591 0.5287185
-  90  0.0572100 0.0762230      2.6161551 0.5287156
-  91  0.0561035 0.0762225      2.6166928 0.5287170
-  92  0.0564179 0.0761893      2.6172478 0.5287096
-  93  0.0557620 0.0759611      2.6177032 0.5287079
-  94  0.0601566 0.0758319      2.6180956 0.5287123
-  95  0.0575501 0.0758450      2.6185331 0.5287192
-  96  0.0567835 0.0759369      2.6189599 0.5287102
-  97  0.0568418 0.0758483      2.6194034 0.5287074
-  98  0.0561061 0.0757637      2.6198282 0.5286959
-  99  0.0555633 0.0757410      2.6201890 0.5286919
- 100  0.0550171 0.0757597      2.6205595 0.5286817
-Wall total time: 18.638    per epoch: 0.186
-CPU  total time: 53.624    per epoch: 0.536
+# Initial validation error:	2.3320939540863
+   1  2.3817289 2.0631769      2.9018321 0.4991634
+   2  2.0127337 1.7107930      2.8795006 0.5035625
+   3  1.6115520 1.2513438      2.9442017 0.8443742
+   4  0.9685481 1.1566203      2.9584067 0.8236541
+   5  0.7168815 0.5299435      3.0023289 0.9598033
+   6  0.3206992 0.7767369      3.0112588 1.0033485
+   7  1.0860476 0.4775722      3.0619886 0.9080099
+   8  0.3197918 0.2902382      3.0819499 0.9946644
+   9  0.1958016 0.2106158      3.1147943 1.0441060
+  10  0.1773363 0.2479766      3.1161106 1.0615921
+  11  0.1147678 0.1558276      3.1060569 1.1271385
+  12  0.1075184 0.1278534      3.1359482 1.1556129
+  13  0.0687593 0.1177373      3.1228211 1.1888367
+  14  0.0376837 0.1056202      3.0987959 1.2120602
+  15  0.0332661 0.0668796      3.0852282 1.2166640
+  16  0.0222894 0.0600685      3.0713453 1.2311292
+  17  0.0157525 0.0686342      3.0506024 1.2374449
+  18  0.0115253 0.0606519      3.0346155 1.2406585
+  19  0.0095431 0.0564426      3.0178421 1.2517389
+  20  0.0096749 0.0647243      3.0025630 1.2564744
+  21  0.0081563 0.0492783      2.9901593 1.2620521
+  22  0.0072236 0.0471871      2.9765923 1.2649729
+  23  0.0068440 0.0492596      2.9636908 1.2690161
+  24  0.0062113 0.0444233      2.9502380 1.2735662
+  25  0.0062164 0.0469762      2.9385459 1.2773722
+  26  0.0057972 0.0447712      2.9270246 1.2785951
+  27  0.0054850 0.0431423      2.9172888 1.2828881
+  28  0.0056857 0.0437554      2.9067614 1.2851691
+  29  0.0051850 0.0457627      2.8978255 1.2873341
+  30  0.0050405 0.0443222      2.8893933 1.2886667
+  31  0.0048728 0.0411952      2.8804867 1.2912111
+  32  0.0047736 0.0451460      2.8724542 1.2925699
+  33  0.0047343 0.0427618      2.8648181 1.2946720
+  34  0.0046832 0.0429964      2.8577437 1.2963077
+  35  0.0045158 0.0417560      2.8512356 1.2978028
+  36  0.0045283 0.0416388      2.8447189 1.2991315
+  37  0.0044603 0.0439450      2.8389351 1.2999839
+  38  0.0045015 0.0439863      2.8335478 1.3015293
+  39  0.0045135 0.0419642      2.8276291 1.3028358
+  40  0.0043495 0.0410866      2.8225942 1.3037244
+  41  0.0042960 0.0420940      2.8179231 1.3047636
+  42  0.0043008 0.0415209      2.8133419 1.3054963
+  43  0.0042705 0.0438083      2.8091493 1.3059328
+  44  0.0042271 0.0416972      2.8049216 1.3069941
+  45  0.0041871 0.0415377      2.8009622 1.3079228
+  46  0.0041955 0.0417533      2.7973149 1.3085480
+  47  0.0041712 0.0407047      2.7937105 1.3090197
+  48  0.0041678 0.0410178      2.7903664 1.3095641
+  49  0.0041742 0.0410902      2.7871890 1.3102257
+  50  0.0041256 0.0412507      2.7841580 1.3107642
+  51  0.0041131 0.0415628      2.7813494 1.3110608
+  52  0.0040998 0.0409712      2.7787488 1.3116640
+  53  0.0040972 0.0415965      2.7762249 1.3118533
+  54  0.0041087 0.0409901      2.7738302 1.3124843
+  55  0.0040811 0.0414503      2.7715557 1.3126273
+  56  0.0040664 0.0411232      2.7693908 1.3130567
+  57  0.0040488 0.0415184      2.7673590 1.3133541
+  58  0.0040435 0.0412881      2.7654259 1.3136539
+  59  0.0040367 0.0411067      2.7635655 1.3140180
+  60  0.0040238 0.0412186      2.7617991 1.3143548
+  61  0.0040496 0.0414952      2.7601244 1.3145624
+  62  0.0040242 0.0412628      2.7585847 1.3148264
+  63  0.0040189 0.0414077      2.7571292 1.3150668
+  64  0.0040116 0.0413463      2.7557185 1.3153048
+  65  0.0040060 0.0411429      2.7543688 1.3155513
+  66  0.0040013 0.0409604      2.7530866 1.3158039
+  67  0.0040007 0.0409645      2.7518589 1.3160617
+  68  0.0039978 0.0410308      2.7506838 1.3162131
+  69  0.0039955 0.0410343      2.7495813 1.3163511
+  70  0.0039866 0.0411291      2.7485473 1.3164933
+  71  0.0039847 0.0412160      2.7475665 1.3166759
+  72  0.0039819 0.0412029      2.7466314 1.3168297
+  73  0.0039863 0.0411614      2.7457452 1.3169810
+  74  0.0039765 0.0410840      2.7448990 1.3171121
+  75  0.0039781 0.0410102      2.7440867 1.3172795
+  76  0.0039763 0.0410615      2.7433248 1.3174052
+  77  0.0039698 0.0410833      2.7426071 1.3175198
+  78  0.0039725 0.0411574      2.7419302 1.3176137
+  79  0.0039680 0.0411577      2.7412798 1.3177041
+  80  0.0039635 0.0411501      2.7406545 1.3178079
+  81  0.0039680 0.0411945      2.7400663 1.3178977
+  82  0.0039640 0.0412194      2.7395048 1.3179847
+  83  0.0039599 0.0411666      2.7389762 1.3180798
+  84  0.0039582 0.0411525      2.7384689 1.3181612
+  85  0.0039611 0.0411331      2.7379887 1.3182341
+  86  0.0039573 0.0411306      2.7375333 1.3183086
+  87  0.0039562 0.0411279      2.7371025 1.3183682
+  88  0.0039558 0.0411387      2.7366951 1.3184292
+  89  0.0039548 0.0411185      2.7363050 1.3185025
+  90  0.0039528 0.0411069      2.7359352 1.3185678
+  91  0.0039525 0.0411113      2.7355845 1.3186166
+  92  0.0039486 0.0411286      2.7352538 1.3186692
+  93  0.0039518 0.0411102      2.7349374 1.3187244
+  94  0.0039506 0.0410847      2.7346380 1.3187743
+  95  0.0039497 0.0410745      2.7343528 1.3188190
+  96  0.0039496 0.0410628      2.7340820 1.3188623
+  97  0.0039479 0.0410628      2.7338243 1.3189024
+  98  0.0039464 0.0410597      2.7335773 1.3189430
+  99  0.0039477 0.0410499      2.7333443 1.3189846
+ 100  0.0039471 0.0410509      2.7331240 1.3190198
+Wall total time: 23.492    per epoch: 0.235
+CPU  total time: 89.945    per epoch: 0.899
diff --git a/packages/ann/ann/test/test-convolution-digits.lua b/packages/ann/ann/test/test-convolution-digits.lua
index 0f9d9b348..58e468611 100644
--- a/packages/ann/ann/test/test-convolution-digits.lua
+++ b/packages/ann/ann/test/test-convolution-digits.lua
@@ -3,13 +3,13 @@ mathcore.set_use_cuda_default(util.is_cuda_available())
 local bunch_size       = tonumber(arg[1]) or 64
 local semilla          = 1234
 local weights_random   = random(semilla)
-local inf              = -0.6
-local sup              =  0.6
+local inf              = -2.4
+local sup              =  2.4
 local shuffle_random   = random(5678)
 local learning_rate    = 0.1
 local momentum         = 0.2
-local weight_decay     = 1e-04
-local L1_norm          = 0.00001
+local weight_decay     = 0.01
+local L1_norm          = 0.0
 local max_norm_penalty = 4
 local max_epochs       = 100
 local check_grandients = false
@@ -158,7 +158,7 @@ if check_grandients then
   trainer:grad_check_dataset({
 			       input_dataset  = dataset.slice(val_input, 1, 10),
 			       output_dataset = dataset.slice(val_output, 1, 10),
-			       bunch_size = 1,
+			       bunch_size = 10,
 			       verbose = false,
 			     })
 end
@@ -168,12 +168,12 @@ for input,idxs in trainable.dataset_multiple_iterator{
   bunch_size = 1, } do
   trainer:calculate(input)
   local c = trainer:component("pool-1")
-  local o = c:get_output():get_matrix()
+  local o = c:get_output()
   local d = o:dim()
   local k = 0
   for w in o:sliding_window{ size={1,1,d[3],d[4]}, step={1,1,1,1},
 			     numSteps={d[1], d[2], 1, 1} }:iterate() do
-    local img = w:clone():rewrap(d[3]*d[4]):clone("row_major"):rewrap(d[3],d[4])
+    local img = w:clone():rewrap(d[3],d[4])
     matrix.saveImage(img:adjust_range(0,1), "/tmp/WW-".. idxs[1] .. "-"..k..".pnm")
     k=k+1
   end
@@ -193,13 +193,13 @@ if check_tokens then
     for name,c in self:iterate_components() do -- ("w[34]") do
       print("\n================== "..name.." ==================")
       print("\n++++++++++ input ++++++++++")
-      print(c:get_input():get_matrix())
+      print(c:get_input())
       print("\n++++++++++ output ++++++++++")
-      print(c:get_output():get_matrix())
+      print(c:get_output())
       print("\n++++++++++ error input ++++++++++")
-      print(c:get_error_input():get_matrix())
+      print(c:get_error_input())
       print("\n++++++++++ error output ++++++++++")
-      print(c:get_error_output():get_matrix())
+      print(c:get_error_output())
       print("\n======================================")
     end
   end
@@ -216,9 +216,9 @@ for epoch = 1,max_epochs do
   local norm2_b = trainer:norm2(".*b.*")
   --
   if false then
-    local inp  = trainer:component("conv"):get_input():get_matrix()
-    local outp = trainer:component("conv"):get_output():get_matrix()
-    local err = trainer:component("conv"):get_error_input():get_matrix()
+    local inp  = trainer:component("conv"):get_input()
+    local outp = trainer:component("conv"):get_output()
+    local err = trainer:component("conv"):get_error_input()
     print("DIM", table.concat(err:dim(), " "))
     for i=1,err:dim()[2] do
     --   for j=1,err:dim()[1] do
@@ -253,12 +253,12 @@ end
 --   bunch_size    = 1,
 --   func = function(idxs, trainer)
 --     local c = trainer:component("pool-1")
---     local o = c:get_output():get_matrix()
+--     local o = c:get_output()
 --     local d = o:dim()
 --     local k = 0
 --     for w in o:sliding_window{ size={1,1,d[3],d[4]}, step={1,1,1,1},
 -- 			       numSteps={d[1], d[2], 1, 1} }:iterate() do
---       local img = w:clone():rewrap(d[3]*d[4]):clone("row_major"):rewrap(d[3],d[4])
+--       local img = w:clone():rewrap(d[3],d[4])
 --       matrix.saveImage(img:adjust_range(0,1), "/tmp/jajaja-".. idxs[1] .. "-"..k..".pnm")
 --       k=k+1
 --     end
diff --git a/packages/ann/ann/test/test-convolution.lua b/packages/ann/ann/test/test-convolution.lua
index e836642be..ae2dc1219 100644
--- a/packages/ann/ann/test/test-convolution.lua
+++ b/packages/ann/ann/test/test-convolution.lua
@@ -2,14 +2,14 @@ kx=17
 ky=17
 h=10
 -- a matrix of ROWSxCOLUMNSx3
-m = ImageIO.read(string.get_path(arg[0]) .. "photo.png"):matrix()
-m2 = m:rewrap(m:size()):clone("col_major")
+m = ImageIO.read(string.get_path(arg[0]) .. "photo.png"):matrix():transpose(1,3)
+m2 = m:contiguous():rewrap(m:size())
 
-input = matrix.col_major(2, m2:size())
+input = matrix(2, m2:size())
 input:select(1,1):copy(m2)
 input:select(1,2):copy(m2)
-w,_,thenet = ann.components.stack():
--- converts a flatten image to a matrix in col-major of only 3 planes (RGB)
+thenet,w,_ = ann.components.stack():
+-- converts a flattened image to a matrix of only 3 planes (RGB)
 push(ann.components.rewrap{ size={ 3, m:dim()[2], m:dim()[1] } }):
 -- a kernel over 3 planes and kx,ky sizes, h output neurons
 push(ann.components.convolution{ kernel={3, kx, ky}, n=h }):
@@ -23,10 +23,10 @@ push(ann.components.max_pooling{ kernel={1,3,3} }):
 push(ann.components.actf.hardtanh()):
 build()
 rnd=random(1234)
-for name,cnn in pairs(w) do cnn:randomize_weights{inf=-0.1,sup=0.1,random=rnd} end
+for name,cnn in pairs(w) do ann.connections.randomize_weights(cnn,{inf=-0.1,sup=0.1,random=rnd}) end
 clock = util.stopwatch()
 clock:go()
-output = thenet:forward(input):get_matrix()
+output = thenet:forward(input)
 
 clock:stop()
 print(m:size(), clock:read())
@@ -35,7 +35,7 @@ y = output:dim()[4]
 for b=1,output:dim()[1] do
   for i=1,output:dim()[2] do
     aux = output:select(1,b):select(1,i):clone()
-    aux = aux:rewrap(x*y):clone("row_major"):rewrap(y,x):adjust_range(0,1)
+    aux = aux:rewrap(x,y):adjust_range(0,1)
     ImageIO.write(Image(aux), "output-" .. b .. "-" .. i .. ".png")
   end
 end
diff --git a/packages/ann/ann/test/test-sparse.lua b/packages/ann/ann/test/test-sparse.lua
index 3ab3fbfc4..9217dce4c 100644
--- a/packages/ann/ann/test/test-sparse.lua
+++ b/packages/ann/ann/test/test-sparse.lua
@@ -4,14 +4,14 @@ mathcore.set_use_cuda_default(util.is_cuda_available())
 
 local check = utest.check
 local T = utest.test
-local w = matrix.col_major(4,3):uniformf(0,1,random(1234))
-local input = matrix.col_major(5,3,{ 0, 1, 0,
-                                     1, 1, 1,
-                                     1, 0, 1,
-                                     1, 0, 0,
-                                     0, 0, 1 })
+local w = matrix(4,3):uniformf(0,1,random(1234))
+local input = matrix(5,3,{ 0, 1, 0,
+                           1, 1, 1,
+                           1, 0, 1,
+                           1, 0, 0,
+                           0, 0, 1 })
 local sparse_input = matrix.sparse.csr(input)
-local e = matrix.col_major(5,4):uniformf(0,1,random(2384))
+local e = matrix(5,4):uniformf(0,1,random(2384))
 --
 T("SparseDotProductTest",
   function()
@@ -25,18 +25,18 @@ T("SparseDotProductTest",
           output = 4,
           weights = "w",
           transpose = transpose,
-        }:build{ weights=matrix.dict{ w=w } }
+        }:build{ weights={ w=w } }
         --
-        local output = c:forward(input):get_matrix()
+        local output = c:forward(input)
         c:backprop(e)
         local grads1 = c:compute_gradients()
         --
-        local sparse_output = c:forward(sparse_input):get_matrix()
+        local sparse_output = c:forward(sparse_input)
         c:backprop(e)
         local grads2 = c:compute_gradients()
         --
         check.eq(output,sparse_output)
-        check.eq(grads1("w"),grads2("w"))
+        check.eq(grads1.w, grads2.w)
       end
     end
 end)
diff --git a/packages/ann/ann/test/test.lua b/packages/ann/ann/test/test.lua
index ac8dfad38..0b411715d 100644
--- a/packages/ann/ann/test/test.lua
+++ b/packages/ann/ann/test/test.lua
@@ -37,7 +37,7 @@ function check_result(trainer, filter, t, testname)
     k=k+1
   end
   for name,cnn in trainer:iterate_weights() do
-    local w = cnn:matrix():toTable()
+    local w = cnn:toTable()
     for _,v in ipairs(w) do
       assert(v-t[k]<epsilon,
 	     string.format("[%s] Incorrect weight, expected %f, found %f",
diff --git a/packages/ann/autoencoders/lua_src/stacked_denoising_autoencoder.lua b/packages/ann/autoencoders/lua_src/stacked_denoising_autoencoder.lua
index eacb13c1f..550a21fc4 100644
--- a/packages/ann/autoencoders/lua_src/stacked_denoising_autoencoder.lua
+++ b/packages/ann/autoencoders/lua_src/stacked_denoising_autoencoder.lua
@@ -2,6 +2,8 @@ get_table_from_dotted_string("ann.autoencoders", true)
 
 ----------------------------------------------------------------------
 
+local md = matrix.dict
+
 -- The auto-encoder class (AE) will be a denoising auto-encoder (DAE) when
 -- trained with corrupted input, and clean output
 
@@ -216,12 +218,12 @@ local function build_two_layered_autoencoder_from_sizes_and_actf(names_prefix,
 			  names_prefix.."b1",
 			  names_prefix.."b2" }) do
     ann.connections.
-    randomize_weights(weights_table(wname),
-		      {
-			random = weights_random,
-			inf    = -math.sqrt(6 / (input_size + cod_size)),
-			sup    =  math.sqrt(6 / (input_size + cod_size))
-		      })
+      randomize_weights(weights_table[wname],
+                        {
+                          random = weights_random,
+                          inf    = -math.sqrt(6 / (input_size + cod_size)),
+                          sup    =  math.sqrt(6 / (input_size + cod_size))
+      })
   end
   return autoencoder_component
 end
@@ -260,7 +262,7 @@ function fake_indexed_methods:getPattern(idx)
     for i=1,#self.dict do
       local current_pat_size = self.dict[i]:patternSize()
       local current_token = self.dict[i]:getPattern(index[i])
-      m:slice({1,col_pos},{1,current_pat_size}):copy(current_token:get_matrix())
+      m:slice({1,col_pos},{1,current_pat_size}):copy(current_token)
       col_pos = col_pos + current_pat_size
     end
     return tokens.matrix(m)
@@ -420,7 +422,7 @@ ann.autoencoders.build_full_autoencoder =
     local bias_mat      = sdae_table.bias
     local sdae          = ann.components.stack{ name=names_prefix.."stack" }
     local prev_size     = layers[1].size
-    local weights_table = matrix.dict()
+    local weights_table = {}
     local k = 1
     for i=2,#layers do
       local size , actf   = layers[i].size,layers[i].actf
@@ -705,7 +707,7 @@ ann.autoencoders.greedy_layerwise_pretraining =
     local weights = {}
     local bias    = {}
     -- incremental mlp
-    local mlp_final_weights = matrix.dict()
+    local mlp_final_weights = {}
     local mlp_final = ann.components.stack{ name=params.names_prefix.."stack" }
     -- loop for each pair of layers
     for i=2,#params.layers do
@@ -736,7 +738,7 @@ ann.autoencoders.greedy_layerwise_pretraining =
                                                                params.bunch_size,
                                                                params.optimizer())
 
-        local aux_weights = mlp_final_weights:clone()
+        local aux_weights = md.clone( mlp_final_weights )
         mlp_final_trainer:build{ weights=aux_weights }
         data = generate_training_table_configuration_on_the_fly(current_dataset_params,
                                                                 params.replacement,
@@ -895,7 +897,7 @@ ann.autoencoders.greedy_layerwise_pretraining =
                                                                nil,
                                                                params.bunch_size,
                                                                params.optimizer())
-        local aux_weights = mlp_final_weights:clone()
+        local aux_weights = md.clone( mlp_final_weights )
         mlp_final_trainer:build{ weights = aux_weights }
         data = generate_training_table_configuration_on_the_fly(current_dataset_params,
                                                                 params.replacement,
@@ -987,7 +989,7 @@ function ann.autoencoders.build_codifier_from_sdae_table(sdae_table,
   local weights_mat   = sdae_table.weights
   local bias_mat      = sdae_table.bias
   local codifier_net  = ann.components.stack{ name="stack" }
-  local weights_table = matrix.dict()
+  local weights_table = {}
   for i=2,#layers do
     local bname = "b"..(i-1)
     local wname = "w"..(i-1)
@@ -1069,7 +1071,7 @@ ann.autoencoders.iterative_sampling =
       ["noise"] = {"An ANN component for noise generation (not a trainer"},
       ["mask"]   = {"An array with the input positions which",
                     "will be keep untouched [optional]",},
-      ["input"] = {"A col-major matrix with the input values."},
+      ["input"] = {"A matrix with the input values."},
       ["max"] = "Max number of iterations",
       ["stop"] = "Stop when loss difference between iterations is lower than given value",
       ["verbose"] = "Verbosity true or false [optional].",
@@ -1111,13 +1113,13 @@ ann.autoencoders.iterative_sampling =
       -- compute the loss of current iteration
       params.loss:reset()
       L = params.loss:loss(output, params.model:get_input())
-      if params.log then output:get_matrix():exp() end
+      if params.log then output:exp() end
       -- restore masked positions
       for _,pos in ipairs(params.mask) do
-        output:get_matrix():set(1,pos,input_rewrapped:get(1,pos))
+        output:set(1,pos,input_rewrapped:get(1,pos))
       end
       -- insert current output to the chain
-      table.insert(chain, output:get_matrix():rewrap(table.unpack(params.input:dim())))
+      table.insert(chain, output:rewrap(table.unpack(params.input:dim())))
       -- improvement measure
       local imp = math.abs(math.abs(last_L - L)/last_L)
       if params.verbose then printf("%6d %6g :: %6g\n", i, L, imp) end
@@ -1127,13 +1129,13 @@ ann.autoencoders.iterative_sampling =
       -- sample from noise distribution
       params.noise:reset()
       local input_token = params.noise:forward(output)
-      input = input_token:get_matrix()
+      input = input_token
       -- restore masked positions
       for _,pos in ipairs(params.mask) do
         input:set(1,pos,input_rewrapped:get(1,pos))
       end
     end
-    return output:get_matrix():rewrap(table.unpack(params.input:dim())),L,chain
+    return output:rewrap(table.unpack(params.input:dim())),L,chain
   end
 
 ----------------------------------------------------------------------------
@@ -1153,7 +1155,7 @@ ann.autoencoders.sgd_sampling =
       ["noise"] = {"An ANN component for noise generation (not a trainer"},
       ["mask"]   = {"An array with the input positions which",
                     "will be keep untouched [optional]",},
-      ["input"] = {"A col-major matrix with the input values."},
+      ["input"] = {"A matrix with the input values."},
       ["max"] = "Max number of iterations",
       ["stop"] = "Stop when loss difference between iterations is lower than given value",
       ["verbose"] = "Verbosity true or false [optional].",
@@ -1203,22 +1205,22 @@ ann.autoencoders.sgd_sampling =
       -- compute the loss of current iteration
       params.loss:reset()
       L = params.loss:loss(output, params.model:get_input())
-      if params.log then output:get_matrix():exp() end
+      if params.log then output:exp() end
       -- restore masked positions
       for _,pos in ipairs(params.mask) do
-        output:get_matrix():set(1,pos,input_rewrapped:get(1,pos))
+        output:set(1,pos,input_rewrapped:get(1,pos))
       end
-      table.insert(chain, output:get_matrix():rewrap(table.unpack(params.input:dim())))
+      table.insert(chain, output:rewrap(table.unpack(params.input:dim())))
       local imp = math.abs(math.abs(last_L - L)/last_L)
       if params.verbose then printf("%6d %6g :: %6g", i, L, imp) end
       if i==1 or L <= min then
-        min,result = L,output:get_matrix()
+        min,result = L,output
         if params.verbose then printf(" *") end
       end
       if params.verbose then printf("\n") end
       if last_L == 0 or imp < params.stop then break end
       -- GRADIENT DESCENT UPDATE OF INPUT VECTOR
-      --aux = params.noise:forward(input):get_matrix()
+      --aux = params.noise:forward(input)
       ---- restore masked positions
       --for _,pos in ipairs(params.mask) do
       --aux:set(1,pos,input_rewrapped:get(1,pos))
@@ -1226,10 +1228,10 @@ ann.autoencoders.sgd_sampling =
       
       local gradient = params.model:backprop(params.loss:gradient(params.model:get_output(),
                                                                   params.model:get_input()))
-      -- local g = gradient:get_matrix():clone("row_major"):rewrap(16,16):pow(2):sqrt():clamp(0,1)
+      -- local g = gradient:clone():rewrap(16,16):pow(2):sqrt():clamp(0,1)
       -- matrix.saveImage(g, string.format("gradient-%04d.pnm", i))
-      gradient = gradient:get_matrix()
-      output   = output:get_matrix()
+      gradient = gradient
+      output   = output
       -- input = (1 - beta)*input + beta*output - alpha*gradient
       input = ( input:clone():
                   scal(1.0 - params.beta):
@@ -1240,7 +1242,7 @@ ann.autoencoders.sgd_sampling =
       last_L = L
       -- sample from noise distribution
       params.noise:reset()
-      input = params.noise:forward(input):get_matrix()
+      input = params.noise:forward(input)
       -- restore masked positions
       for _,pos in ipairs(params.mask) do
         input:set(1,pos,input_rewrapped:get(1,pos))
diff --git a/packages/ann/autoencoders/test/test-sampling-one.lua b/packages/ann/autoencoders/test/test-sampling-one.lua
index d53192c2b..7e30018e2 100644
--- a/packages/ann/autoencoders/test/test-sampling-one.lua
+++ b/packages/ann/autoencoders/test/test-sampling-one.lua
@@ -59,7 +59,7 @@ noise:build{ input=256, output=256 }
 output,L,chain = ann.autoencoders.iterative_sampling{
   model   = full_sdae,
   noise   = noise,
-  input   = input:rewrap(1,256):clone("col_major"),
+  input   = input:rewrap(1,256):clone(),
   max     = max_iterations,
   mask    = mask,
   stop    = stop_criterion,
@@ -68,18 +68,18 @@ output,L,chain = ann.autoencoders.iterative_sampling{
   loss    = loss,
 }
 for i,output in ipairs(chain) do
-  matrix.saveImage(output:clone("row_major"):rewrap(16,16),
+  matrix.saveImage(output:clone():rewrap(16,16),
 		   "wop1-"..string.format("%04d",i)..".pnm")
 end
 if log then output:log() end
 ite_L = loss:loss(tokens.matrix(output:rewrap(1,256)),
-		  tokens.matrix(matrix.col_major(1,256,val_input:getPattern(ipat))))
+		  tokens.matrix(matrix(1,256,val_input:getPattern(ipat))))
 print(ite_L)
 
 output,L,chain = ann.autoencoders.sgd_sampling{
   model   = full_sdae,
   noise   = noise,
-  input   = input:rewrap(1,256):clone("col_major"),
+  input   = input:rewrap(1,256):clone(),
   max     = max_iterations,
   mask    = mask,
   stop    = stop_criterion,
@@ -91,10 +91,10 @@ output,L,chain = ann.autoencoders.sgd_sampling{
   loss    = loss,
 }
 for i,output in ipairs(chain) do
-  matrix.saveImage(output:clone("row_major"):rewrap(16,16),
+  matrix.saveImage(output:clone():rewrap(16,16),
 		   "wop2-"..string.format("%04d",i)..".pnm")
 end
 if log then output:log() end
 sgd_L = loss:loss(tokens.matrix(output:rewrap(1,256)),
-		  tokens.matrix(matrix.col_major(1,256,val_input:getPattern(ipat))))
+		  tokens.matrix(matrix(1,256,val_input:getPattern(ipat))))
 print(sgd_L)
diff --git a/packages/ann/autoencoders/test/test-sampling.lua b/packages/ann/autoencoders/test/test-sampling.lua
index 17c24cd61..1b9ae6ca6 100644
--- a/packages/ann/autoencoders/test/test-sampling.lua
+++ b/packages/ann/autoencoders/test/test-sampling.lua
@@ -44,8 +44,8 @@ else
   trainer:build()
 end
 
-local ite_loss_stat = stats.mean_var()
-local sgd_loss_stat = stats.mean_var()
+local ite_loss_stat = stats.running.mean_var()
+local sgd_loss_stat = stats.running.mean_var()
 
 local ite_quartiles = {}
 local sgd_quartiles = {}
@@ -69,7 +69,7 @@ for ipat=1,val_input:numPatterns() do
     end
     output,L = ann.autoencoders.iterative_sampling{
       model   = full_sdae,
-      input   = input:rewrap(1,256):clone("col_major"),
+      input   = input:rewrap(1,256):clone(),
       max     = max_iterations,
       mask    = mask,
       stop    = stop_criterion,
@@ -84,13 +84,13 @@ for ipat=1,val_input:numPatterns() do
     -- tokens.memblock(val_input:getPattern(n))), L)
     loss:reset()
     ite_L = loss:loss(tokens.matrix(output),
-		      tokens.matrix(matrix.col_major(1,256,val_input:getPattern(ipat))))
+		      tokens.matrix(matrix(1,256,val_input:getPattern(ipat))))
     ite_loss_stat:add(ite_L)
     table.insert(ite_quartiles, ite_L)
     
     output,L = ann.autoencoders.sgd_sampling{
       model   = full_sdae,
-      input   = input:rewrap(1,256):clone("col_major"),
+      input   = input:rewrap(1,256):clone(),
       max     = max_iterations,
       mask    = mask,
       stop    = stop_criterion,
@@ -108,7 +108,7 @@ for ipat=1,val_input:numPatterns() do
     -- tokens.memblock(val_input:getPattern(n))), L)
     loss:reset()
     sgd_L = loss:loss(tokens.matrix(output),
-		      tokens.matrix(matrix.col_major(1,256,val_input:getPattern(ipat))))
+		      tokens.matrix(matrix(1,256,val_input:getPattern(ipat))))
     sgd_loss_stat:add(sgd_L)
     table.insert(sgd_quartiles, sgd_L)
   end
diff --git a/packages/ann/autoencoders/test/test_on_the_fly.lua b/packages/ann/autoencoders/test/test_on_the_fly.lua
index 22ce5fcab..b94b84280 100644
--- a/packages/ann/autoencoders/test/test_on_the_fly.lua
+++ b/packages/ann/autoencoders/test/test_on_the_fly.lua
@@ -210,6 +210,7 @@ trainer_deep_wo_pretraining:set_layerwise_option("b.*", "weight_decay",0.0)
 trainer_shallow_classifier:set_layerwise_option("b.*", "weight_decay",0.0)
 
 for i=1,2 do
+  fprintf(io.stderr, "# epoch %d\n", i)
   local mse_tr_deep = trainer_deep_classifier:train_dataset(datosentrenar_deep)
   local mse_tr_deep_wo = trainer_deep_wo_pretraining:train_dataset(datosentrenar_deep_wo)
   local mse_tr_shallow = trainer_shallow_classifier:train_dataset(datosentrenar_shallow)
diff --git a/packages/ann/fnnlm/test/test.lua b/packages/ann/fnnlm/test/test.lua
index 07f886ac3..0a0575fc9 100644
--- a/packages/ann/fnnlm/test/test.lua
+++ b/packages/ann/fnnlm/test/test.lua
@@ -29,5 +29,5 @@ output = nnlm:forward{
   }
 }
 
-print(trainer:component("factors_join"):get_output():get_matrix())
-print(output:get_matrix())
+print(trainer:component("factors_join"):get_output())
+print(output)
diff --git a/packages/ann/loss/binding/bind_loss_functions.lua.cc b/packages/ann/loss/binding/bind_loss_functions.lua.cc
index 7867ae128..6b61351d8 100644
--- a/packages/ann/loss/binding/bind_loss_functions.lua.cc
+++ b/packages/ann/loss/binding/bind_loss_functions.lua.cc
@@ -59,20 +59,17 @@ using namespace ANN;
   LUABIND_CHECK_ARGN(==,2);
   LUABIND_CHECK_PARAMETER(1, AuxToken);
   LUABIND_CHECK_PARAMETER(2, AuxToken);
-  Token *input, *target;
+  AprilUtils::SharedPtr<Token> input, target;
   LUABIND_GET_PARAMETER(1, AuxToken, input);
   LUABIND_GET_PARAMETER(2, AuxToken, target);
-  IncRef(input);
-  IncRef(target);
-  MatrixFloat *loss = obj->computeLoss(input, target);
+  MatrixFloat *loss = obj->computeLoss(input.get(), target.get());
   if (loss) {
     LUABIND_RETURN(float, matSum(loss)/loss->getDimSize(0));
     LUABIND_RETURN(MatrixFloat, loss);
   }
-  else
+  else {
     LUABIND_RETURN_NIL();
-  DecRef(input);
-  DecRef(target);
+  }
 }
 //BIND_END
 
@@ -109,15 +106,12 @@ using namespace ANN;
   LUABIND_CHECK_ARGN(==,2);
   LUABIND_CHECK_PARAMETER(1, AuxToken);
   LUABIND_CHECK_PARAMETER(2, AuxToken);
-  Token *input, *target;
+  AprilUtils::SharedPtr<Token> input, target;
   LUABIND_GET_PARAMETER(1, AuxToken, input);
   LUABIND_GET_PARAMETER(2, AuxToken, target);
-  IncRef(input);
-  IncRef(target);
-  Token *error = obj->computeGradient(input, target);
-  LUABIND_RETURN(Token, error);
-  DecRef(input);
-  DecRef(target);
+  AprilUtils::SharedPtr<Token> error( obj->computeGradient(input.get(),
+                                                           target.get()) );
+  LUABIND_RETURN(AuxToken, error);
 }
 //BIND_END
 
@@ -144,7 +138,9 @@ using namespace ANN;
 
 //BIND_METHOD LossFunction to_lua_string
 {
-  LUABIND_RETURN(string, obj->toLuaString());
+  char *str = obj->toLuaString();
+  LUABIND_RETURN(string, str);
+  delete[] str; // NOTE(review): presumably toLuaString() returns a caller-owned new[] buffer and LUABIND_RETURN copies it -- confirm
 }
 //BIND_END
 
diff --git a/packages/ann/loss/c_src/batch_fmeasure_macro_avg_loss_function.cc b/packages/ann/loss/c_src/batch_fmeasure_macro_avg_loss_function.cc
index dc9ddb2d8..fd2673aa3 100644
--- a/packages/ann/loss/c_src/batch_fmeasure_macro_avg_loss_function.cc
+++ b/packages/ann/loss/c_src/batch_fmeasure_macro_avg_loss_function.cc
@@ -58,7 +58,7 @@ namespace ANN {
     // FMb = ---------------------
     //        sum(o) + b^2 sum(t)
     int num_classes = input_mat->getDimSize(1);
-    Gs = new MatrixFloat(1,&num_classes,CblasColMajor);
+    Gs = new MatrixFloat(1,&num_classes);
     Hs = Gs->clone();
     AprilUtils::SharedPtr<MatrixFloat> class_input_mat;
     AprilUtils::SharedPtr<MatrixFloat> class_target_mat;
@@ -89,7 +89,7 @@ namespace ANN {
     }
     MatrixFloat *loss_output;
     int aux = 1;
-    loss_output = new MatrixFloat(1, &aux, CblasColMajor);
+    loss_output = new MatrixFloat(1, &aux);
 #ifdef USE_CUDA
     loss_output->setUseCuda(input_mat_->getCudaFlag());
 #endif
diff --git a/packages/ann/loss/c_src/batch_fmeasure_micro_avg_loss_function.cc b/packages/ann/loss/c_src/batch_fmeasure_micro_avg_loss_function.cc
index 4267c9d3f..672abb202 100644
--- a/packages/ann/loss/c_src/batch_fmeasure_micro_avg_loss_function.cc
+++ b/packages/ann/loss/c_src/batch_fmeasure_micro_avg_loss_function.cc
@@ -81,7 +81,7 @@ namespace ANN {
     MatrixFloat *loss_output;
     if ( H>0.0f || H<0.0f ) {
       int dim = 1;
-      loss_output = new MatrixFloat(1, &dim, CblasColMajor);
+      loss_output = new MatrixFloat(1, &dim);
 #ifdef USE_CUDA
       loss_output->setUseCuda(input_mat->getCudaFlag());
 #endif
diff --git a/packages/ann/loss/c_src/cross_entropy_loss_function.cc b/packages/ann/loss/c_src/cross_entropy_loss_function.cc
index a01feb4bf..663db5d26 100644
--- a/packages/ann/loss/c_src/cross_entropy_loss_function.cc
+++ b/packages/ann/loss/c_src/cross_entropy_loss_function.cc
@@ -41,7 +41,7 @@ namespace ANN {
     MatrixFloat *input_mat, *target_mat;
     throwErrorAndGetMatrixFromTokens(input, target, input_mat, target_mat);
     int dim = input_mat->getDimSize(0);
-    MatrixFloat *loss_output = new MatrixFloat(1, &dim, CblasColMajor);
+    MatrixFloat *loss_output = new MatrixFloat(1, &dim);
 #ifdef USE_CUDA
     loss_output->setUseCuda(input_mat->getCudaFlag());
 #endif
diff --git a/packages/ann/loss/c_src/loss_function.h b/packages/ann/loss/c_src/loss_function.h
index 9961440d5..db9fa22c8 100644
--- a/packages/ann/loss/c_src/loss_function.h
+++ b/packages/ann/loss/c_src/loss_function.h
@@ -62,8 +62,6 @@ namespace ANN {
 	april_assert(target_mat->getNumDim() == 2);
 	april_assert(input_mat->sameDim(target_mat));
       }
-      april_assert(input_mat->getMajorOrder() == CblasColMajor);
-      april_assert(target_mat->getMajorOrder() == CblasColMajor);
       april_assert(size==0 || input_mat->getDimSize(1)==static_cast<int>(size));
       //
 #ifdef USE_CUDA
diff --git a/packages/ann/loss/c_src/mae_loss_function.cc b/packages/ann/loss/c_src/mae_loss_function.cc
index 271f4a1a9..c22fd6359 100644
--- a/packages/ann/loss/c_src/mae_loss_function.cc
+++ b/packages/ann/loss/c_src/mae_loss_function.cc
@@ -42,7 +42,7 @@ namespace ANN {
     MatrixFloat *input_mat, *target_mat;
     throwErrorAndGetMatrixFromTokens(input, target, input_mat, target_mat);
     int dim = input_mat->getDimSize(0);
-    MatrixFloat *loss_output = new MatrixFloat(1, &dim, CblasColMajor);
+    MatrixFloat *loss_output = new MatrixFloat(1, &dim);
 #ifdef USE_CUDA
     loss_output->setUseCuda(input_mat->getCudaFlag());
 #endif
diff --git a/packages/ann/loss/c_src/mse_loss_function.cc b/packages/ann/loss/c_src/mse_loss_function.cc
index fd264e5d3..4989130a0 100644
--- a/packages/ann/loss/c_src/mse_loss_function.cc
+++ b/packages/ann/loss/c_src/mse_loss_function.cc
@@ -40,7 +40,7 @@ namespace ANN {
     MatrixFloat *input_mat, *target_mat;
     throwErrorAndGetMatrixFromTokens(input, target, input_mat, target_mat);
     int dim = input_mat->getDimSize(0);
-    MatrixFloat *loss_output = new MatrixFloat(1, &dim, CblasColMajor);
+    MatrixFloat *loss_output = new MatrixFloat(1, &dim);
 #ifdef USE_CUDA
     loss_output->setUseCuda(input_mat->getCudaFlag());
 #endif
diff --git a/packages/ann/loss/c_src/multiclass_cross_entropy_loss_function.cc b/packages/ann/loss/c_src/multiclass_cross_entropy_loss_function.cc
index f14db986d..b6171322d 100644
--- a/packages/ann/loss/c_src/multiclass_cross_entropy_loss_function.cc
+++ b/packages/ann/loss/c_src/multiclass_cross_entropy_loss_function.cc
@@ -48,7 +48,7 @@ namespace ANN {
     MatrixFloat *input_mat, *target_mat;
     throwErrorAndGetMatrixFromTokens(input, target, input_mat, target_mat);
     int dim = input_mat->getDimSize(0);
-    MatrixFloat *loss_output = new MatrixFloat(1, &dim, CblasColMajor);
+    MatrixFloat *loss_output = new MatrixFloat(1, &dim);
 #ifdef USE_CUDA
     loss_output->setUseCuda(input_mat->getCudaFlag());
 #endif
diff --git a/packages/ann/loss/c_src/zero_one_loss_function.cc b/packages/ann/loss/c_src/zero_one_loss_function.cc
index 6e0b06a4b..589908f90 100644
--- a/packages/ann/loss/c_src/zero_one_loss_function.cc
+++ b/packages/ann/loss/c_src/zero_one_loss_function.cc
@@ -42,7 +42,7 @@ namespace ANN {
 				     false);
     int N = input_mat->getDimSize(1);
     int dim = input_mat->getDimSize(0);
-    MatrixFloat *loss_output = new MatrixFloat(1, &dim, CblasColMajor);
+    MatrixFloat *loss_output = new MatrixFloat(1, &dim);
 #ifdef USE_CUDA
     loss_output->setUseCuda(input_mat->getCudaFlag());
     const float *aux = input_mat->getRawDataAccess()->getPPALForRead();
diff --git a/packages/ann/loss/lua_src/loss_functions.lua b/packages/ann/loss/lua_src/loss_functions.lua
index 5b212525a..11524fbff 100644
--- a/packages/ann/loss/lua_src/loss_functions.lua
+++ b/packages/ann/loss/lua_src/loss_functions.lua
@@ -66,8 +66,8 @@ april_set_doc(ann.loss.."compute_loss",
 		  "but it is not accumulated. Call to accum_loss to accumulate it to the internal state.",
 		},
 		params={
-		  "Input token",
-		  "Target token",
+		  "Input token (usually a matrix)",
+		  "Target token (usually a matrix)",
 		},
 		outputs = {
 		  "The loss function mean at the given batch.",
@@ -89,11 +89,11 @@ april_set_doc(ann.loss.."gradient",
 		  "tokens).",
 		},
 		params={
-		  "Input token",
-		  "Target token",
+		  "Input token (usually a matrix)",
+		  "Target token (usually a matrix)",
 		},
 		outputs = {
-		  "The gradient computed for this pair of tokens",
+		  "The gradient computed for this pair of tokens (usually a matrix)",
 		},
 	      })
 
diff --git a/packages/ann/loss/test/test.lua b/packages/ann/loss/test/test.lua
index 4e6e997f5..0e0d301a5 100644
--- a/packages/ann/loss/test/test.lua
+++ b/packages/ann/loss/test/test.lua
@@ -1,88 +1,91 @@
+local check=utest.check
+local T=utest.test
 -- compute_loss(INPUT, TARGET)
 
-EPSILON=1e-03
+T("LossTest", function()
 
-class.extend(matrix,
-             "normalize",
-             function(self)
-               for sw in self:sliding_window():iterate() do
-                 sw:scal(1/sw:sum())
-               end
-               return self
-end)
+    class.extend(matrix,
+                 "normalize",
+                 function(self)
+                   for sw in self:sliding_window():iterate() do
+                     sw:scal(1/sw:sum())
+                   end
+                   return self
+    end)
 
-function check_loss(i,t,l,f,g)
-  if f then
-    local e,m = l:compute_loss(i,t)
-    assert(math.abs(e - f(i,t)) < EPSILON)
-  end
-  if g then
-    local ep = l:gradient(i,t)
-    assert(ep:get_matrix():equals(g(i,t),EPSILON))
-  end
-end
+    local function check_loss(i,t,l,f,g)
+      if f then
+        local e,m = l:compute_loss(i,t)
+        check.number_eq(e, f(i,t))
+      end
+      if g then
+        local ep = l:gradient(i,t)
+        check.eq(ep, g(i,t))
+      end
+    end
 
--- CROSS ENTROPY
-check_loss(matrix.col_major(20,1):uniformf(0,1,random(1234)):log(),
-	   matrix.col_major(20,1):uniform(0,1,random(525)),
-	   ann.loss.cross_entropy(1),
-	   function(i,t)
-	     local a = i:clone():map(t,
-				     function(x,y)
-				       return y*x
-				     end):sum()
-	     local b = i:clone():exp():map(t,
-					   function(x,y)
-					     return (1-y)*(math.log(1-x))
-					   end):sum()
-	     return (-a-b)/20
-	   end,
-	   function(i,t)
-	     return i:clone():exp():axpy(-1, t)
-	   end)
+    -- CROSS ENTROPY
+    check_loss(matrix(20,1):uniformf(0,1,random(1234)):log(),
+               matrix(20,1):uniform(0,1,random(525)),
+               ann.loss.cross_entropy(1),
+               function(i,t)
+                 local a = i:clone():map(t,
+                                         function(x,y)
+                                           return y*x
+                                        end):sum()
+                 local b = i:clone():exp():map(t,
+                                               function(x,y)
+                                                 return (1-y)*(math.log(1-x))
+                                              end):sum()
+                 return (-a-b)/20
+               end,
+               function(i,t)
+                 return i:clone():exp():axpy(-1, t)
+    end)
 
--- MULTICLASS CROSS ENTROPY
-check_loss(matrix.col_major(20,4):uniformf(0,1,random(1234)):normalize():log(),
-	   dataset.indexed(dataset.matrix(matrix(20,1):uniform(1,4,random(525))),
-			   { dataset.identity(4) }):toMatrix():clone("col_major"),
-	   ann.loss.multi_class_cross_entropy(4),
-	   function(i,t)
-	     return -i:clone():cmul(t):sum()/20
-	   end,
-	   function(i,t)
-	     return i:clone():exp():axpy(-1, t)
-	   end)
+    -- MULTICLASS CROSS ENTROPY
+    check_loss(matrix(20,4):uniformf(0,1,random(1234)):normalize():log(),
+               dataset.indexed(dataset.matrix(matrix(20,1):uniform(1,4,random(525))),
+                               { dataset.identity(4) }):toMatrix():clone(),
+               ann.loss.multi_class_cross_entropy(4),
+               function(i,t)
+                 return -i:clone():cmul(t):sum()/20
+               end,
+               function(i,t)
+                 return i:clone():exp():axpy(-1, t)
+    end)
 
--- MSE
-check_loss(matrix.col_major(20,4):uniformf(0,1,random(1234)),
-	   matrix.col_major(20,4):uniform(0,1,random(525)),
-	   ann.loss.mse(4),
-	   function(i,t)
-	     return i:clone():axpy(-1,t):pow(2):sum()*0.5/20
-	   end,
-	   function(i,t)
-	     return i:clone():axpy(-1, t)
-	   end)
+    -- MSE
+    check_loss(matrix(20,4):uniformf(0,1,random(1234)),
+               matrix(20,4):uniform(0,1,random(525)),
+               ann.loss.mse(4),
+               function(i,t)
+                 return i:clone():axpy(-1,t):pow(2):sum()*0.5/20
+               end,
+               function(i,t)
+                 return i:clone():axpy(-1, t)
+    end)
 
--- MAE
-check_loss(matrix.col_major(20,4):uniformf(0,1,random(1234)),
-	   matrix.col_major(20,4):uniform(0,1,random(525)),
-	   ann.loss.mae(4),
-	   function(i,t)
-	     return i:clone():axpy(-1,t):abs():sum()/20/4
-	   end)
+    -- MAE
+    check_loss(matrix(20,4):uniformf(0,1,random(1234)),
+               matrix(20,4):uniform(0,1,random(525)),
+               ann.loss.mae(4),
+               function(i,t)
+                 return i:clone():axpy(-1,t):abs():sum()/20/4
+    end)
 
--- ZERO-ONE
-check_loss(matrix.col_major(20,4):uniformf(0,1,random(1234)),
-	   matrix.col_major(20,1):uniform(1,4,random(525)),
-	   ann.loss.zero_one(4),
-	   function(i,t)
-	     local idx=1
-	     local errors=0
-	     for sw in i:sliding_window():iterate() do
-	       local _,j = sw:max()
-	       if j ~= t:get(idx,1) then errors = errors + 1 end
-	       idx = idx + 1
-	     end
-	     return errors/20
-	   end)
+    -- ZERO-ONE
+    check_loss(matrix(20,4):uniformf(0,1,random(1234)),
+               matrix(20,1):uniform(1,4,random(525)),
+               ann.loss.zero_one(4),
+               function(i,t)
+                 local idx=1
+                 local errors=0
+                 for sw in i:sliding_window():iterate() do
+                   local _,j = sw:max()
+                   if j ~= t:get(idx,1) then errors = errors + 1 end
+                   idx = idx + 1
+                 end
+                 return errors/20
+    end)
+end)
diff --git a/packages/ann/optimizer/c_src/util_regularization.cu b/packages/ann/optimizer/c_src/util_regularization.cu
index 957e971d4..fdfeffb56 100644
--- a/packages/ann/optimizer/c_src/util_regularization.cu
+++ b/packages/ann/optimizer/c_src/util_regularization.cu
@@ -46,7 +46,6 @@ namespace ANN {
     void UtilRegularization::L1NormMap(MatrixFloat *w,
 				       float value) {
       april_assert(w->getNumDim() == 2);
-      april_assert(w->getMajorOrder() == CblasColMajor);
       //
       AprilMath::MatrixExt::MatrixScalarMap1(w,Kernels::L1NormKernel(value),w);
     }
diff --git a/packages/ann/optimizer/c_src/util_rprop.cu b/packages/ann/optimizer/c_src/util_rprop.cu
index 5500c6972..11f812cca 100644
--- a/packages/ann/optimizer/c_src/util_rprop.cu
+++ b/packages/ann/optimizer/c_src/util_rprop.cu
@@ -49,7 +49,6 @@ namespace ANN {
 			 float eta_plus) {
       april_assert(steps->sameDim(old_sign) && steps->sameDim(sign));
       april_assert(steps->getNumDim() == 2);
-      april_assert(steps->getMajorOrder() == CblasColMajor);
       AprilUtils::SharedPtr<MatrixFloat> eta_values( steps->cloneOnlyDims() );
       //
       AprilMath::MatrixExt::
diff --git a/packages/ann/optimizer/lua_src/base_optimizer.lua b/packages/ann/optimizer/lua_src/base_optimizer.lua
new file mode 100644
index 000000000..4c848c839
--- /dev/null
+++ b/packages/ann/optimizer/lua_src/base_optimizer.lua
@@ -0,0 +1,150 @@
+local math = math
+local table = table
+local string = string
+--
+local ipairs = ipairs
+local pairs = pairs
+local assert = assert
+--
+local type = type
+local mop = matrix.op
+local iterator = iterator
+local get_table_fields = get_table_fields
+local april_assert = april_assert
+
+local FLT_MIN = mathcore.limits.float.min()
+
+ann.optimizer = ann.optimizer or {}
+ann.optimizer.MAX_UPDATES_WITHOUT_PRUNE = 100
+
+------------------------------------------------------------------------------
+------------------------------------------------------------------------------
+------------------------------------------------------------------------------
+local ann_optimizer_utils = ann.optimizer.utils
+
+-- this function receives a weights matrix, a L1 regularization parameter (can
+-- be a number or a matrix with L1 for every weight), and an optional update
+-- matrix (for momentum purposes, it can be nil)
+function ann_optimizer_utils.l1_truncate_gradient(w, l1, update)
+  local z = mop.abs(w):gt(l1):to_float() -- which weights won't cross zero
+  -- compute L1 update
+  local u = mop.sign(w)
+  if type(l1) == "number" then u:scal(l1) else u:cmul(l1) end
+  -- apply L1 update to weights
+  w:axpy(-1.0, u)
+  if update then
+    -- apply L1 update to update matrix (for momentum)
+    update:axpy(-1.0, u)
+  end
+  -- remove weights which cross zero
+  w:cmul(z)
+end
+
+-- receives a weights matrix and a max norm penalty value
+function ann_optimizer_utils.max_norm_penalty(w, mnp)
+  for _,row in matrix.ext.iterate(w,1) do
+    local n2 = row:norm2()
+    if n2 > mnp then row:scal(mnp / n2) end
+  end
+end
+------------------------------------------------------------------------------
+------------------------------------------------------------------------------
+------------------------------------------------------------------------------
+
+-- global environment ann.optimizer
+local optimizer,optimizer_methods = class("ann.optimizer", nil, ann.optimizer)
+
+-- Base constructor: valid_options is a list of {name, description} pairs;
+-- g_options maps option names to values; l_options maps layer names to
+-- {option = value} tables; count is the initial update counter (default 0).
+function optimizer:constructor(valid_options, g_options, l_options, count)
+  local g_options, l_options = g_options or {}, l_options or {}
+  self.valid_options     = iterator(ipairs(valid_options or {})):map(function(i,t)return t[1],t[2] end):table()
+  self.global_options    = {}
+  self.layerwise_options = {}
+  self.count             = count or 0
+  for name,value in pairs(g_options) do
+    self.global_options[name] = value
+  end
+  for layer_name,options in pairs(l_options) do
+    for name,value in pairs(options) do
+      self.layerwise_options[layer_name] = self.layerwise_options[layer_name] or {}
+      self.layerwise_options[layer_name][name] = value
+    end
+  end
+  -- nothing is returned: the fields above are stored directly on self
+end
+
+function optimizer_methods:show_options()
+  local t = iterator(pairs(self.valid_options)):enumerate():table()
+  table.sort(t, function(a,b) return a[1]<b[1] end)
+  print(iterator(ipairs(t)):select(2):map(table.unpack):concat("\t","\n"))
+end
+
+function optimizer_methods:has_option(name)
+  return self.valid_options[name]
+end
+
+function optimizer_methods:set_option(name,value)
+  april_assert(self.valid_options[name], "Not recognized option %s", name)
+  self.global_options[name] = value
+  return self
+end
+
+function optimizer_methods:get_option(name)
+  april_assert(self.valid_options[name], "Not recognized option %s", name)
+  return self.global_options[name]
+end
+
+function optimizer_methods:set_layerwise_option(layer_name,name,value)
+  april_assert(self.valid_options[name], "Not recognized option %s", name)
+  self.layerwise_options[layer_name] = self.layerwise_options[layer_name] or {}
+  self.layerwise_options[layer_name][name] = value
+  return self
+end
+
+function optimizer_methods:get_layerwise_option(layer_name,name)
+  april_assert(self.valid_options[name], "Not recognized option %s", name)
+  return (self.layerwise_options[layer_name] or {})[name]
+end
+
+function optimizer_methods:get_option_of(layer_name,name)
+  april_assert(self.valid_options[name], "Not recognized option %s", name)
+  return ( (self.layerwise_options[layer_name] or {})[name] or
+	     self.global_options[name] )
+end
+
+-- eval is a function which returns the data needed by the optimizer (at least
+-- the loss and the gradients; the rest of the values will be ignored)
+--
+-- weights is a dictionary of weight matrix objects, indexed by their names, or
+-- a matrix
+function optimizer_methods:execute(eval, weights)
+  error("NOT IMPLEMENTED METHOD!, use a derived class instance")
+end
+
+function optimizer_methods:count_one()
+  self.count = self.count + 1
+end
+
+function optimizer_methods:get_count()
+  return self.count
+end
+
+function optimizer_methods:clone()
+  local obj = ann.optimizer()
+  obj.count = self.count
+  return obj
+end
+
+function optimizer_methods:needs_property(name)
+  return false
+end
+
+function optimizer_methods:has_property(name)
+  return false
+end
+
+------------------------------------------------
+------------------------------------------------
+------------------------------------------------
diff --git a/packages/ann/optimizer/lua_src/optimizer.lua b/packages/ann/optimizer/lua_src/optimizer.lua
deleted file mode 100644
index 841d5bfa6..000000000
--- a/packages/ann/optimizer/lua_src/optimizer.lua
+++ /dev/null
@@ -1,1041 +0,0 @@
-local math = math
-local table = table
-local string = string
---
-local ipairs = ipairs
-local pairs = pairs
-local assert = assert
---
-local type = type
-local iterator = iterator
-local get_table_fields = get_table_fields
-local april_assert = april_assert
-
-------------------------------------------------------------------------------
-
-local MAX_UPDATES_WITHOUT_PRUNE=100
-
-------------------------------------------------------------------------------
-------------------------------------------------------------------------------
-------------------------------------------------------------------------------
--- REMOVE UTILS FROM GLOBALS TABLE
-local ann_optimizer_utils = ann.optimizer.utils
-ann.optimizer.utils = nil
-
-------------------------------------------------------------------------------
-------------------------------------------------------------------------------
-------------------------------------------------------------------------------
-
-get_table_from_dotted_string("ann.optimizer.regularizations", true)
-
-function ann.optimizer.regularizations.weight_decay(update, wd, w)
-  if wd > 0.0 then
-    assert(wd < 1.0, "Incorrect weight decay value")
-    if rawequal(update, w) then w:scal(1-wd)
-    else update:axpy(-wd, w)
-    end
-  end
-end
-
-------------------------------------------------------------------------------
-
-get_table_from_dotted_string("ann.optimizer.constraints", true)
-
--- This regularization term must be applied the last
-function ann.optimizer.constraints.L1_norm(value, w)
-  if value > 0.0 then
-    ann_optimizer_utils.regularization.L1_norm_map(w, value)
-  end
-end
-
--- The penalty is computed and applied on w
-function ann.optimizer.constraints.max_norm_penalty(mp, w)
-  if mp > 0.0 then
-    local sw         = w:sliding_window()
-    local window     = nil
-    while not sw:is_end() do
-      window  = sw:get_matrix(window)
-      local norm2 = window:norm2()
-      if norm2 > mp then
-	local scal_factor = mp / norm2
-	window:scal(scal_factor)
-      end
-      sw:next()
-    end
-  end
-end
-
-------------------------------------------------------------------------------
-------------------------------------------------------------------------------
-------------------------------------------------------------------------------
-
--- global environment ann.optimizer
-local optimizer,optimizer_methods = class("ann.optimizer", nil, ann.optimizer)
-
-function optimizer:constructor(valid_options,
-                               g_options,
-                               l_options,
-                               count)
-  local g_options, l_options = g_options or {}, l_options or {}
-  self.valid_options     = iterator(ipairs(valid_options or {})):map(function(i,t)return t[1],t[2] end):table()
-  self.global_options    = {}
-  self.layerwise_options = {}
-  self.count             = count or 0
-  self.regularizations   = {}
-  self.constraints       = {}
-  self.regularizations_order = {}
-  self.constraints_order     = {}
-  for name,value in pairs(g_options) do
-    self.global_options[name] = value
-  end
-  for layer_name,options in pairs(l_options) do
-    for name,value in pairs(options) do
-      self.layerwise_options[layer_name] = self.layerwise_options[layer_name] or {}
-      self.layerwise_options[layer_name][name] = value
-    end
-  end
-  return obj
-end
-
-
--- regularization functions has the API: func(dest, value, w) where dest is the
--- destination matrix, and w the current weights matrix
-function optimizer_methods:add_regularization(hyperparameter_name, func, desc)
-  local func = april_assert(func or ann.optimizer.regularizations[hyperparameter_name],
-			    "Problem with hyperparemter function of %s",
-			    hyperparameter_name)
-  april_assert(not self.valid_options[hyperparameter_name],
-	       "Redefinition of hyperparameter %s",
-	       hyperparameter_name)
-  self.valid_options[hyperparameter_name] = desc
-  self.regularizations[hyperparameter_name] = func
-  table.insert(self.regularizations_order, hyperparameter_name)
-end
-
--- constraint functions has the API: func(value, w)
-function optimizer_methods:add_constraint(hyperparameter_name, func, desc)
-  local func = april_assert(func or ann.optimizer.constraints[hyperparameter_name],
-			    "Problem with hyperparemter function of %s",
-			    hyperparameter_name)
-  april_assert(not self.valid_options[hyperparameter_name],
-	       "Redefinition of hyperparameter %s",
-	       hyperparameter_name)
-  self.valid_options[hyperparameter_name] = desc
-  self.constraints[hyperparameter_name] = func
-  table.insert(self.constraints_order, hyperparameter_name)
-end
-
-local function ann_optimizer_apply_regularizations(opt, wname, update, w)
-  for _,hypname in ipairs(opt.regularizations_order) do
-    local func = opt.regularizations[hypname]
-    local v = opt:get_option_of(wname, hypname)
-    if v then
-      -- sanity check
-      if v > 0.0 and #w:dim() == 2 and w:dim(2) == 1 then
-	fprintf(io.stderr,
-		"# WARNING!!! Possible %s > 0 in bias connection: %s\n",
-		hypname, wname)
-      end
-      func(update, v, w)
-    end
-  end
-end
-
-local function ann_optimizer_apply_constraints(opt, wname, w)
-  for _,hypname in pairs(opt.constraints_order) do
-    local func = opt.constraints[hypname]
-    local v = opt:get_option_of(wname, hypname)
-    if v then
-      -- sanity check
-      if v > 0.0 and #w:dim() == 2 and w:dim(2) == 1 then
-	fprintf(io.stderr,
-		"# WARNING!!! Possible %s > 0 in bias connection: %s\n",
-		hypname, wname)
-      end
-      func(v, w)
-    end
-  end
-end
-
-function optimizer_methods:show_options()
-  local t = iterator(pairs(self.valid_options)):enumerate():table()
-  table.sort(t, function(a,b) return a[1]<b[1] end)
-  print(iterator(ipairs(t)):select(2):map(table.unpack):concat("\t","\n"))
-end
-
-function optimizer_methods:has_option(name)
-  return self.valid_options[name]
-end
-
-function optimizer_methods:set_option(name,value)
-  april_assert(self.valid_options[name], "Not recognized option %s", name)
-  self.global_options[name] = value
-  return self
-end
-
-function optimizer_methods:get_option(name)
-  april_assert(self.valid_options[name], "Not recognized option %s", name)
-  return self.global_options[name]
-end
-
-function optimizer_methods:set_layerwise_option(layer_name,name,value)
-  april_assert(self.valid_options[name], "Not recognized option %s", name)
-  self.layerwise_options[layer_name] = self.layerwise_options[layer_name] or {}
-  self.layerwise_options[layer_name][name] = value
-  return self
-end
-
-function optimizer_methods:get_layerwise_option(layer_name,name)
-  april_assert(self.valid_options[name], "Not recognized option %s", name)
-  return (self.layerwise_options[layer_name] or {})[name]
-end
-
-function optimizer_methods:get_option_of(layer_name,name)
-  april_assert(self.valid_options[name], "Not recognized option %s", name)
-  return ( (self.layerwise_options[layer_name] or {})[name] or
-	     self.global_options[name] )
-end
-
--- eval is a function which returns the data needed by the optimizer (at least,
--- the loss, and the gradients. The rest of values will be ignored)
---
--- weights is a dictionary of weight matrix objects, indexed by its names, or a
--- matrix
-function optimizer_methods:execute(eval, weights)
-  error("NOT IMPLEMENTED METHOD!, use a derived class instance")
-end
-
-function optimizer_methods:count_one()
-  self.count = self.count + 1
-end
-
-function optimizer_methods:get_count()
-  return self.count
-end
-
-function optimizer_methods:clone()
-  local obj = ann.optimizer()
-  obj.count = self.count
-  return obj
-end
-
-function optimizer_methods:needs_property(name)
-  return false
-end
-
-------------------------------------------------
-------------------------------------------------
-------------------------------------------------
-
-local function ann_optimizer_apply_momentum(mt, update)
-  if mt > 0.0 then
-    -- intertia is computed as a portion of previous update
-    update:scal(mt)
-  else
-    -- sets to ZERO
-    update:zeros()
-  end
-end
-
-------------------------------------------------
-------------------------------------------------
-------------------------------------------------
-
-local wrap_matrices = matrix.dict.wrap_matrices
-
-------------------------------------------------
---------- STOCHASTIC GRADIENT DESCENT ----------
-------------------------------------------------
-
-local sgd, sgd_methods = class("ann.optimizer.sgd", ann.optimizer)
-ann.optimizer.sgd = sgd -- global environment
-
-function sgd:constructor(g_options, l_options, count, update)
-  -- the base optimizer, with the supported learning parameters
-  ann.optimizer.constructor(self,
-                            {
-			      {"learning_rate", "Learning speed factor (0.1)"},
-			      {"momentum", "Learning inertia factor (0.1)"},
-                              {"decay", "Decay of hyper-parameters (0.0), global option"},
-			    },
-			    g_options,
-			    l_options,
-			    count)
-  self.update = wrap_matrices(update or matrix.dict())
-  -- standard regularization and constraints
-  self:add_regularization("weight_decay", nil, "Weight L2 regularization (1e-04)")
-  self:add_constraint("L1_norm", nil, "Weight L1 regularization (1e-05)")
-  self:add_constraint("max_norm_penalty", nil, "Weight max norm upper bound (4)")
-  self:set_option("decay", 0.0)
-end
-
-function sgd_methods:execute(eval, weights)
-  local wrap_matrices = wrap_matrices
-  local table = table
-  local assert = assert
-  --
-  local origw = weights
-  local weights = wrap_matrices(weights)
-  local arg = table.pack( eval(origw) )
-  local tr_loss,gradients = table.unpack(arg)
-  -- the gradient computation could fail returning nil, it is important to take
-  -- this into account
-  if not gradients then return nil end
-  gradients = wrap_matrices(gradients)
-  --
-  local gamma = self:get_option("decay")
-  local decay = 1.0 / (1.0 + gamma * self:get_count())
-  for name,w in pairs(weights) do
-    local update      = self.update(name) or w:clone():zeros()
-    local grad        = gradients(name)
-    local lr          = assert(self:get_option_of(name, "learning_rate"),
-			       "The learning_rate parameter needs to be set")
-    local mt          = self:get_option_of(name, "momentum") or 0.0
-    assert(self:get_option_of(name, "decay") == gamma,
-           "decay option cannot be defined layerwise, only globally")
-    --
-    ann_optimizer_apply_momentum(mt, update)
-    -- apply back-propagation learning rule
-    update:axpy(-lr, grad)
-    -- regularizations
-    ann_optimizer_apply_regularizations(self, name, update, w)
-    -- apply update matrix to the weights
-    w:axpy(decay, update)
-    -- constraints
-    ann_optimizer_apply_constraints(self, name, w)
-    --
-    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
-      w:prune_subnormal_and_check_normal()
-    end
-    --
-    self.update[name] = update
-  end
-  -- count one more update iteration
-  self:count_one()
-  -- returns the same as returned by eval()
-  return table.unpack(arg)
-end
-
-function sgd_methods:clone()
-  local obj = ann.optimizer.sgd()
-  obj.count             = self.count
-  obj.layerwise_options = table.deep_copy(self.layerwise_options)
-  obj.global_options    = table.deep_copy(self.global_options)
-  obj.update            = self.update:clone()
-  return obj
-end
-
-function sgd_methods:to_lua_string(format)
-  local format = format or "binary"
-  local str_t = { "ann.optimizer.sgd(",
-		  table.tostring(self.global_options),
-		  ",",
-		  table.tostring(self.layerwise_options),
-		  ",",
-		  tostring(self.count),
-		  ",",
-		  self.update:to_lua_string(format),
-		  ")" }
-  return table.concat(str_t, "")
-end
-
-local sgd_properties = {
-  gradient = true
-}
-function sgd_methods:needs_property(name)
-  return sgd_properties[name]
-end
-
------------------------------------
---------- RESILIENT PROP ----------
------------------------------------
-
-local rprop, rprop_methods = class("ann.optimizer.rprop", ann.optimizer)
-ann.optimizer.rprop = rprop
-
-function rprop:constructor(g_options, l_options, count,
-                           steps, old_sign)
-  -- the base optimizer, with the supported learning parameters
-  ann.optimizer.constructor(self,
-                            {
-			      {"initial_step", "Initial weight update value (0.1)"},
-			      {"eta_plus", "Update value up by this factor (1.2)"},
-			      {"eta_minus", "Update value down by this factor (0.5)"},
-			      {"max_step", "Maximum value of update step (50)"},
-			      {"min_step", "Minimum value of update step (1e-05)"},
-			      {"niter", "Number of iterations (1)"},
-			    },
-			    g_options,
-			    l_options,
-			    count)
-  self.steps    = wrap_matrices(steps or matrix.dict())
-  self.old_sign = wrap_matrices(old_sign or matrix.dict())
-  self:add_regularization("weight_decay", nil, "Weight L2 regularization (1e-04)")
-  self:add_constraint("L1_norm", nil, "Weight L1 regularization (1e-05)")
-  self:add_constraint("max_norm_penalty", nil, "Weight max norm upper bound (4)")
-  self:set_option("initial_step",  0.1)
-  self:set_option("eta_plus",      1.2)
-  self:set_option("eta_minus",     0.5)
-  self:set_option("max_step",      50)
-  self:set_option("min_step",      1e-05)
-  self:set_option("niter",         1)
-end
-
-function rprop_methods:execute(eval, weights)
-  local wrap_matrices = wrap_matrices
-  local table = table
-  local assert = assert
-  --
-  local origw = weights
-  local weights = wrap_matrices(weights)
-  local initial_step  = self:get_option("initial_step")
-  local eta_plus      = self:get_option("eta_plus")
-  local eta_minus     = self:get_option("eta_minus")
-  local max_step      = self:get_option("max_step")
-  local min_step      = self:get_option("min_step")
-  local niter         = self:get_option("niter")
-  local steps         = self.steps
-  local old_sign      = self.old_sign
-  local arg
-  for i=1,niter do
-    arg = table.pack( eval(origw, i-1) )
-    local tr_loss,gradients = table.unpack(arg)
-    -- the gradient computation could fail returning nil, it is important to
-    -- take this into account
-    if not gradients then return nil end
-    gradients = wrap_matrices(gradients)
-    --
-    for name,w in pairs(weights) do
-      steps[name] = steps(name) or w:clone():fill(initial_step)
-      local sign  = gradients(name):clone():sign()
-      -- apply reprop learning rule
-      if old_sign(name) then
-	ann_optimizer_utils.rprop.step(steps(name),
-				       old_sign(name),
-				       sign,
-				       eta_minus,
-				       eta_plus)
-      end
-      steps(name):clamp(min_step, max_step)
-      w:axpy(-1.0, sign:clone():cmul(steps(name)))
-      -- regularizations
-      ann_optimizer_apply_regularizations(self, name, w, w)
-      -- constraints
-      ann_optimizer_apply_constraints(self, name, w)
-      -- keep the sign for the next iteration
-      old_sign[name] = sign
-      --
-      if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
-	w:prune_subnormal_and_check_normal()
-      end
-    end
-    -- count one more update iteration
-    self:count_one()
-  end
-  -- returns the same as returned by eval()
-  return table.unpack(arg)
-end
-
-function rprop_methods:clone()
-  local obj = ann.optimizer.rprop()
-  obj.count             = self.count
-  obj.layerwise_options = table.deep_copy(self.layerwise_options)
-  obj.global_options    = table.deep_copy(self.global_options)
-  if self.steps then
-    obj.steps = self.steps:clone()
-  end
-  if self.old_sign then
-    obj.old_sign = self.old_sign:clone()
-  end
-  return obj
-end
-
-function rprop_methods:to_lua_string(format)
-  local str_t = { "ann.optimizer.rprop(",
-		  table.tostring(self.global_options),
-		  ",",
-		  table.tostring(self.layerwise_options),
-		  ",",
-		  tostring(self.count),
-		  ",",
-		  self.steps:to_lua_string(format),
-		  ",",
-		  self.old_sign:to_lua_string(format),
-		  ")" }
-  return table.concat(str_t, "")
-end
-
-local rprop_properties = {
-  gradient = true
-}
-function rprop_methods:needs_property(name)
-  return rprop_properties[name]
-end
-
----------------------------------------
---------- CONJUGATE GRADIENT ----------
----------------------------------------
-
--- Conjugate Gradient implementation, copied/modified from optim package of
--- Torch 7, which is a rewrite of minimize.m written by Carl E. Rasmussen.
-local cg, cg_methods = class("ann.optimizer.cg", ann.optimizer)
-ann.optimizer.cg = cg
-
-function cg:constructor(g_options, l_options, count,
-                        df0, df1, df2, df3, x0, s)
-  -- the base optimizer, with the supported learning parameters
-  ann.optimizer.constructor(self,
-                            {
-                              --			      {"momentum", "Learning inertia factor (0.1)"},
-                              {"rho", "Constant for Wolf-Powell conditions (0.01)"},
-                              {"sig", "Constant for Wolf-Powell conditions (0.5)"},
-                              {"int", "Reevaluation limit (0.1)"},
-                              {"ext", "Maximum number of extrapolations (3)"},
-                              {"max_iter", "Maximum number of iterations (20)"},
-                              {"ratio", "Maximum slope ratio (100)"},
-                              {"max_eval", "Maximum number of evaluations (max_iter*1.25)"},
-                            },
-                            g_options,
-                            l_options,
-                            count)
-  self.state    = {
-    df0 = df0,
-    df1 = df1,
-    df2 = df2, 
-    df3 = df3,
-    x0  = x0,
-    s   = s,
-  }
-  self:set_option("rho",           0.01) -- rho is a constant in Wolfe-Powell conditions
-  self:set_option("sig",           0.5)  -- sig is another constant of Wolf-Powell
-  self:set_option("int",           0.1)  -- reevaluation limit
-  self:set_option("ext",           3.0)  -- maximum number of extrapolations
-  self:set_option("max_iter",      20)
-  self:set_option("ratio",         100)  -- maximum slope ratio
-  -- standard regularization and constraints
-  self:add_regularization("weight_decay", nil, "Weight L2 regularization (1e-04)")
-  self:add_constraint("L1_norm", nil, "Weight L1 regularization (1e-05)")
-  self:add_constraint("max_norm_penalty", nil, "Weight max norm upper bound (4)")
-end
-
-function cg_methods:execute(eval, weights)
-  local wrap_matrices = wrap_matrices
-  local table = table
-  local assert = assert
-  local math = math
-  --
-  local origw = weights
-  local weights = wrap_matrices(weights)
-  -- UPDATE_WEIGHTS function
-  local update_weights = function(x, dir, s)
-    x:axpy(dir, s)
-  end
-  -- APPLY REGULARIZATION AND PENALTIES
-  local apply_regularization_and_penalties = function(x)
-    for name,w in pairs(x) do
-      -- regularizations
-      ann_optimizer_apply_regularizations(self, name, w, w)
-      -- constraints
-      ann_optimizer_apply_constraints(self, name, w)
-    end
-    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
-      x:prune_subnormal_and_check_normal()
-    end
-  end
-  ----------------------------------------------------------------------------
-  
-  -- count one more update iteration
-  self:count_one()
-  
-  local x             = weights
-  local rho           = self:get_option("rho")
-  local sig           = self:get_option("sig")
-  local int           = self:get_option("int")
-  local ext           = self:get_option("ext")
-  local max_iter      = self:get_option("max_iter")
-  local ratio         = self:get_option("ratio")
-  local max_eval      = self:get_option("max_eval") or max_iter*1.25
-  local red           = 1
-  
-  local i             = 0 -- counts the number of evaluations
-  local ls_failed     = 0
-  local fx            = {}
-
-  -- we need three points for the interpolation/extrapolation stuff
-  local z1,z2,z3 = 0,0,0
-  local d1,d2,d3 = 0,0,0
-  local f1,f2,f3 = 0,0,0
-
-  local df1 = self.state.df1 or x:clone_only_dims()
-  local df2 = self.state.df2 or x:clone_only_dims()
-  local df3 = self.state.df3 or x:clone_only_dims()
-  
-  -- search direction
-  local s = self.state.s or x:clone_only_dims()
-  
-  -- we need a temp storage for X
-  local x0  = self.state.x0 or x:clone()
-  local f0  = 0
-  local df0 = self.state.df0 or x:clone_only_dims()
-  
-  -- evaluate at initial point
-  local arg = table.pack( eval(origw, i) )
-  local tr_loss,gradients = table.unpack(arg)
-  if not gradients then return nil end
-  gradients = wrap_matrices(gradients)
-  f1 = tr_loss
-  table.insert(fx, f1)
-  df1:copy(gradients)
-  i=i+1
-  
-  -- initial search direction
-  s:copy(df1)
-  s:scal(-1)
-  
-  -- slope
-  d1 = -s:dot(s)
-  -- initial step
-  z1 = red/(1-d1)
-  
-  while i < math.abs(max_eval) do
-    
-    x0:copy(x)
-    
-    f0 = f1
-    df0:copy(df1)
-    
-    update_weights(x, z1, s)
-
-    arg = table.pack( eval(origw, i) )
-    tr_loss,gradients = table.unpack(arg)
-    gradients = wrap_matrices(gradients)
-    f2 = tr_loss
-    
-    df2:copy(gradients)
-    i=i+1
-    d2 = df2:dot(s)
-    -- init point 3 equal to point 1
-    f3,d3,z3 = f1,d1,-z1
-    local m       = math.min(max_iter,max_eval-i)
-    local success = false
-    local limit   = -1
-    
-    while true do
-      while (f2 > f1+z1*rho*d1 or d2 > -sig*d1) and m > 0 do
-	limit = z1
-	if f2 > f1 then
-	  z2 = z3 - (0.5*d3*z3*z3)/(d3*z3+f2-f3)
-	else
-	  local A = 6*(f2-f3)/z3+3*(d2+d3)
-	  local B = 3*(f3-f2)-z3*(d3+2*d2)
-	  z2 = (math.sqrt(B*B-A*d2*z3*z3)-B)/A
-	end
-	if z2 ~= z2 or z2 == math.huge or z2 == -math.huge then
-	  z2 = z3/2
-	end
-	z2 = math.max(math.min(z2, int*z3),(1-int)*z3)
-	z1 = z1 + z2
-	
-	update_weights(x, z2, s)
-	arg = table.pack( eval(origw, i) )
-	tr_loss,gradients = table.unpack(arg)
-	gradients = wrap_matrices(gradients)
-	f2 = tr_loss
-	df2:copy(gradients)
-	i=i+1
-	m = m - 1
-	d2 = df2:dot(s)
-	z3 = z3-z2
-      end
-      if f2 > f1+z1*rho*d1 or d2 > -sig*d1 then
-	break
-      elseif d2 > sig*d1 then
-	success = true
-	break
-      elseif m == 0 then
-	break
-      end
-      local A = 6*(f2-f3)/z3+3*(d2+d3);
-      local B = 3*(f3-f2)-z3*(d3+2*d2);
-      z2 = -d2*z3*z3/(B+math.sqrt(B*B-A*d2*z3*z3))
-      
-      if z2 ~= z2 or z2 == math.huge or z2 == -math.huge or z2 < 0 then
-	if limit < -0.5 then
-	  z2 = z1 * (ext -1)
-	else
-	  z2 = (limit-z1)/2
-	end
-      elseif (limit > -0.5) and (z2+z1) > limit then
-	z2 = (limit-z1)/2
-      elseif limit < -0.5 and (z2+z1) > z1*ext then
-	z2 = z1*(ext-1)
-      elseif z2 < -z3*int then
-	z2 = -z3*int
-      elseif limit > -0.5 and z2 < (limit-z1)*(1-int) then
-	z2 = (limit-z1)*(1-int)
-      end
-      f3=f2
-      d3=d2
-      z3=-z2
-      z1=z1+z2;
-      update_weights(x, z2, s)
-      
-      arg = table.pack( eval(origw, i) )
-      tr_loss,gradients = table.unpack(arg)
-      gradients = wrap_matrices(gradients)
-      f2 = tr_loss
-      df2:copy(gradients)
-      i=i+1
-      m = m - 1
-      d2 = df2:dot(s)
-    end
-    if success then
-      f1 = f2
-      table.insert(fx, f1)
-      local ss = (df2:dot(df2) - df2:dot(df1))/df1:dot(df1)
-      s:scal(ss)
-      s:axpy(-1,df2)
-      df1,df2 = df2,df1
-      -- local tmp = clone(df1)
-      -- copy(df1,df2)
-      -- copy(df2,tmp)
-      d2 = df1:dot(s)
-      if d2> 0 then
-	s:copy(df1)
-	s:scal(-1)
-	d2 = -s:dot(s)
-      end
-      z1 = z1 * math.min(ratio, d1/(d2-1e-320))
-      d1 = d2
-      ls_failed = 0
-    else
-      x:copy(x0)
-      f1 = f0
-      df1:copy(df0)
-      if ls_failed or i>max_eval then
-	break
-      end
-      df1,df2 = df2,df1
-      -- local tmp = clone(df1)
-      -- copy(df1,df2)
-      -- copy(df2,tmp)
-      s:copy(df1)
-      s:scal(-1)
-      d1 = -s:dot(s)
-      z1 = 1/(1-d1)
-      ls_failed = 1
-    end
-  end
-  self.state.df0 = df0
-  self.state.df1 = df1
-  self.state.df2 = df2
-  self.state.df3 = df3
-  self.state.x0 = x0
-  self.state.s = s
-  
-  apply_regularization_and_penalties(x)
-  
-  -- evaluate the function at the end
-  local arg = table.pack( eval(origw, i) )
-  -- returns the same as returned by eval(), plus the sequence of iteration
-  -- losses and the number of iterations
-  table.insert(arg, fx)
-  table.insert(arg, i)
-  return table.unpack(arg)
-end
-
-function cg_methods:clone()
-  local obj = ann.optimizer.cg()
-  obj.count             = self.count
-  obj.layerwise_options = table.deep_copy(self.layerwise_options)
-  obj.global_options    = table.deep_copy(self.global_options)
-  if self.state.df0 then
-    obj.state.df0 = self.state.df0:clone()
-  end
-  if self.state.df1 then
-    obj.state.df1 = self.state.df1:clone()
-  end
-  if self.state.df2 then
-    obj.state.df2 = self.state.df2:clone()
-  end
-  if self.state.df3 then
-    obj.state.df3 = self.state.df3:clone()
-  end
-  if self.state.x0 then
-    obj.state.x0 = self.state.x0:clone()
-  end
-  if self.state.s then
-    obj.state.s = self.state.s:clone()
-  end
-  return obj
-end
-
-function cg_methods:to_lua_string(format)
-  local str_t = { "ann.optimizer.cg(",
-		  table.tostring(self.global_options),
-		  ",",
-		  table.tostring(self.layerwise_options),
-		  ",",
-		  tostring(self.count),
-		  ")" }
-  return table.concat(str_t, "")
-end
-
-local cg_properties = {
-  gradient = true
-}
-function cg_methods:needs_property(name)
-  return cg_properties[name]
-end
-
-------------------------------
---------- QUICKPROP ----------
-------------------------------
-
-local quickprop, quickprop_methods = class("ann.optimizer.quickprop",
-                                           ann.optimizer)
-ann.optimizer.quickprop = quickprop
-
-function quickprop:constructor(g_options, l_options, count,
-                               update, lastg)
-  -- the base optimizer, with the supported learning parameters
-  ann.optimizer.constructor(self,
-                            {
-                              {"learning_rate", "Learning speed factor (0.1)"},
-                              {"mu", "Maximum growth factor (1.75)"},
-                              {"epsilon", "Bootstrap factor (1e-04)"},
-			      {"max_step", "Maximum step value (1000)"},
-			    },
-			    g_options,
-			    l_options,
-			    count)
-  self:set_option("mu", 1.75)
-  self:set_option("epsilon", 1e-04)
-  self:set_option("max_step", 1000)
-  self.update = wrap_matrices(update or matrix.dict())
-  self.lastg  = wrap_matrices(lastg  or matrix.dict())
-  -- standard regularization and constraints
-  self:add_regularization("weight_decay", nil, "Weight L2 regularization (1e-04)")
-  self:add_constraint("L1_norm", nil, "Weight L1 regularization (1e-05)")
-  self:add_constraint("max_norm_penalty", nil, "Weight max norm upper bound (4)")
-end
-
-function quickprop_methods:execute(eval, weights)
-  local wrap_matrices = wrap_matrices
-  local table = table
-  local assert = assert
-  local math = math
-  --
-  local origw = weights
-  local weights = wrap_matrices(weights)
-  local arg = table.pack( eval(origw) )
-  local tr_loss,gradients = table.unpack(arg)
-  -- the gradient computation could fail returning nil, it is important to take
-  -- this into account
-  if not gradients then return nil end
-  gradients = wrap_matrices(gradients)
-  for name,w in pairs(weights) do
-    local update      = self.update(name)
-    local lastg       = self.lastg(name)
-    local grad        = gradients(name)
-    local lr          = assert(self:get_option_of(name, "learning_rate"),
-			       "The learning_rate parameter needs to be set")
-    local mu          = self:get_option_of(name, "mu")
-    local epsilon     = self:get_option_of(name, "epsilon")
-    local max_step    = self:get_option_of(name, "max_step")
-    if not update then
-      -- compute standard back-propagation learning rule
-      update = w:clone()
-      lastg  = grad:clone()
-      update:copy(grad)
-    else
-      local shrink = mu / (1.0 + mu)
-      -- compute quickprop update
-      update:map(lastg, grad,
-		 function(prev_step, prev_slope, slope)
-		   local step=0
-		   if math.abs(prev_step) > 1e-03 then
-		     if math.sign(slope) == math.sign(prev_step) then
-		       step = step + epsilon * slope
-		     end
-		     if ( (prev_step > 0 and slope > shrink*prev_slope) or
-		     	  (prev_step < 0 and slope < shrink*prev_slope) ) then
-		       step = step + mu * prev_step
-		     else
-		       step = step + (prev_step*slope) / (prev_slope - slope)
-		     end
-		   else
-		     step = step + epsilon * slope
-		   end
-		   if step > max_step then step = max_step
-		   elseif step < -max_step then
-		     step = -max_step
-		   end
-		   return step
-		 end)
-      lastg:copy(grad)
-    end
-    --
-    self.update[name] = update
-    self.lastg[name]  = lastg
-    -- regularizations
-    ann_optimizer_apply_regularizations(self, name, update, w)
-    -- apply update matrix to the weights
-    w:axpy(-lr, update)
-    -- constraints
-    ann_optimizer_apply_constraints(self, name, w)
-    --
-    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
-      w:prune_subnormal_and_check_normal()
-    end
-  end
-  -- count one more update iteration
-  self:count_one()
-  -- returns the same as returned by eval()
-  return table.unpack(arg)
-end
-
-function quickprop_methods:clone()
-  local obj = ann.optimizer.quickprop()
-  obj.count             = self.count
-  obj.layerwise_options = table.deep_copy(self.layerwise_options)
-  obj.global_options    = table.deep_copy(self.global_options)
-  obj.update            = self.update:clone()
-  obj.lastg             = self.lastg:clone()
-  return obj
-end
-
-function quickprop_methods:to_lua_string(format)
-  local format = format or "binary"
-  local str_t = { "ann.optimizer.quickprop(",
-		  table.tostring(self.global_options),
-		  ",",
-		  table.tostring(self.layerwise_options),
-		  ",",
-		  tostring(self.count),
-		  ",",
-		  self.update:to_lua_string(format),
-		  ",",
-		  self.lastg:to_lua_string(format),
-		  ")" }
-  return table.concat(str_t, "")
-end
-
-local quickprop_properties = {
-  gradient = true
-}
-function quickprop_methods:needs_property(name)
-  return quickprop_properties[name]
-end
-
-
----------------------------------------------------------
---------- AVERAGED STOCHASTIC GRADIENT DESCENT ----------
----------------------------------------------------------
-
--- extracted from: http://research.microsoft.com/pubs/192769/tricks-2012.pdf
--- Leon Bottou, Stochastic Gradient Descent Tricks, Microsoft Research, 2012
-
-local asgd, asgd_methods = class("ann.optimizer.asgd", ann.optimizer)
-ann.optimizer.asgd = asgd
-
-function asgd:constructor(g_options, l_options, count, update)
-  -- the base optimizer, with the supported learning parameters
-  ann.optimizer.constructor(self,
-                            {
-			      {"learning_rate", "Learning speed factor (0.1)"},
-			      {"lr_decay", "Learning decay factor (0.75)"},
-			      {"t0", "Average starts at bunch t0, good values are data size or data dimension (0)"},
-			    },
-			    g_options,
-			    l_options,
-			    count)
-  self.update = wrap_matrices(update or matrix.dict())
-  -- standard regularization and constraints
-  self:add_regularization("weight_decay", nil, "Weight L2 regularization (1e-04)")
-  self:add_constraint("L1_norm", nil, "Weight L1 regularization (1e-05)")
-  self:add_constraint("max_norm_penalty", nil, "Weight max norm upper bound (4)")
-  -- default values
-  self:set_option("lr_decay", 0.75)
-  self:set_option("t0", 0)
-end
-
-function asgd_methods:execute(eval, weights)
-  local wrap_matrices = wrap_matrices
-  local table = table
-  local assert = assert
-  --
-  local origw = weights
-  local weights = wrap_matrices(weights)
-  local arg = table.pack( eval(origw) )
-  local tr_loss,gradients = table.unpack(arg)
-  -- the gradient computation could fail returning nil, it is important to take
-  -- this into account
-  if not gradients then return nil end
-  gradients = wrap_matrices(gradients)
-  local t = self:get_count()
-  for name,w in pairs(weights) do
-    local update      = (self.update(name) or w:clone()):zeros()
-    local grad        = gradients(name)
-    local lr          = assert(self:get_option_of(name, "learning_rate"),
-			       "The learning_rate parameter needs to be set")
-    local lr_decay    = self:get_option_of(name, "lr_decay")
-    local t0          = self:get_option_of(name, "t0")
-    -- effective values at time t
-    local lr_t        = lr / ((1.0 + lr * t)^(lr_decay)) -- learning rate factor
-    local mu_t        = 1.0 / math.max(1, t - t0)        -- average factor
-    -- apply back-propagation learning rule
-    update:axpy(-lr, grad)
-    -- regularizations
-    ann_optimizer_apply_regularizations(self, name, update, w)
-    -- compute averaged weights
-    if mu_t > 1 or mu_t < 1 then
-      update:axpy(1.0,w)
-      w:scal(1.0 - mu_t):axpy(mu_t, update)
-    else
-      w:axpy(1.0, update)
-    end
-    -- constraints
-    ann_optimizer_apply_constraints(self, name, w)
-    --
-    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
-      w:prune_subnormal_and_check_normal()
-    end
-    --
-    self.update[name] = update
-  end
-  -- count one more update iteration
-  self:count_one()
-  -- returns the same as returned by eval()
-  return table.unpack(arg)
-end
-
-function asgd_methods:clone()
-  local obj = ann.optimizer.asgd()
-  obj.count             = self.count
-  obj.layerwise_options = table.deep_copy(self.layerwise_options)
-  obj.global_options    = table.deep_copy(self.global_options)
-  obj.update            = self.update:clone()
-  return obj
-end
-
-function asgd_methods:to_lua_string(format)
-  local format = format or "binary"
-  local str_t = { "ann.optimizer.asgd(",
-		  table.tostring(self.global_options),
-		  ",",
-		  table.tostring(self.layerwise_options),
-		  ",",
-		  tostring(self.count),
-		  ",",
-		  self.update:to_lua_string(format),
-		  ")" }
-  return table.concat(str_t, "")
-end
-
-local asgd_properties = {
-  gradient = true
-}
-function asgd_methods:needs_property(name)
-  return asgd_properties[name]
-end
diff --git a/packages/ann/optimizer/lua_src/optimizer_asgd.lua b/packages/ann/optimizer/lua_src/optimizer_asgd.lua
new file mode 100644
index 000000000..0755e4b42
--- /dev/null
+++ b/packages/ann/optimizer/lua_src/optimizer_asgd.lua
@@ -0,0 +1,134 @@
+local assert = assert
+local ipairs = ipairs
+local math = math
+local pairs = pairs
+local string = string
+local table = table
+local type = type
+--
+local april_assert = april_assert
+local get_table_fields = get_table_fields
+local iterator = iterator
+local md = matrix.dict
+local mop = matrix.op
+
+local MAX_UPDATES_WITHOUT_PRUNE = ann.optimizer.MAX_UPDATES_WITHOUT_PRUNE
+
+---------------------------------------------------------
+--------- AVERAGED STOCHASTIC GRADIENT DESCENT ----------
+---------------------------------------------------------
+
+-- extracted from: http://research.microsoft.com/pubs/192769/tricks-2012.pdf
+-- Leon Bottou, Stochastic Gradient Descent Tricks, Microsoft Research, 2012
+local asgd, asgd_methods = class("ann.optimizer.asgd", ann.optimizer)
+ann.optimizer.asgd = asgd
+
+function asgd:constructor(g_options, l_options, count, aw)
+  -- learning parameters accepted by this optimizer, as {name, description}
+  local supported_options = {
+    {"learning_rate", "Learning speed factor (0.01)"},
+    {"lr_decay", "Learning decay factor (0.75)"},
+    {"t0", "Average starts at bunch t0, good values are data size or data dimension (0)"},
+    {"weight_decay", "Weight L2 regularization (0.0)"},
+  }
+  -- delegate the options and counter handling to the base optimizer
+  ann.optimizer.constructor(self, supported_options,
+                            g_options, l_options, count)
+  -- averaged weights indexed by weight name, filled in by execute()
+  self.aw = aw or {}
+  -- defaults are only installed when no global options table was given
+  if not g_options then
+    self:set_option("learning_rate", 0.01)
+    self:set_option("lr_decay", 0.75)
+    self:set_option("t0", 0)
+    self:set_option("weight_decay", 0.0)
+  end
+end
+
+function asgd_methods:execute(eval, weights)
+  -- One ASGD step: eval(weights) must return the loss and a gradients table
+  -- indexed by weight name. Weights are updated in place, gradients receive
+  -- the L2 term in place, and self.aw keeps the averaged weights.
+  local results = table.pack( eval(weights) )
+  local _,grads = table.unpack(results)
+  -- when eval() returns no gradients nothing is updated and nil is
+  -- returned to the caller
+  if not grads then return nil end
+  local step = self:get_count()
+  for wname,w in pairs(weights) do
+    -- options looked up for this particular weight name
+    local lr       = self:get_option_of(wname, "learning_rate")
+    local lr_decay = self:get_option_of(wname, "lr_decay")
+    local t0       = self:get_option_of(wname, "t0")
+    local l2       = self:get_option_of(wname, "weight_decay")
+    -- decayed learning rate and averaging factor for the current step
+    local lr_now   = lr / ((1.0 + l2 * lr * step)^(lr_decay))
+    local avg_rate = 1.0 / math.max(1, step - t0)
+    -- a missing average starts as a zeroed clone of the weights
+    local avg      = self.aw[wname]
+    if not avg then avg = w:clone():zeros() end
+    local g        = grads[wname]
+    -- the L2 term is added to the gradient before the descent step
+    if l2 > 0.0 then g:axpy(l2, w) end
+    w:axpy(-lr_now, g)
+    if avg_rate == 1 then
+      -- averaging factor is 1: the average is just the current weights
+      avg:copy(w)
+    else
+      -- move the average towards w by a fraction avg_rate
+      avg:axpy(avg_rate, w - avg)
+    end
+    -- weights normality check
+    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
+      w:prune_subnormal_and_check_normal()
+    end
+    self.aw[wname] = avg
+  end
+  -- count one more update iteration
+  self:count_one()
+  -- the averaged weights are appended to the values returned by eval()
+  results[#results + 1] = self.aw
+  return table.unpack(results)
+end
+
+function asgd_methods:clone()
+  -- new optimizer whose counter, options and averaged weights are copies
+  local copy = ann.optimizer.asgd()
+  copy.count, copy.aw    = self.count, md.clone( self.aw )
+  copy.global_options    = table.deep_copy(self.global_options)
+  copy.layerwise_options = table.deep_copy(self.layerwise_options)
+  return copy
+end
+
+function asgd_methods:to_lua_string(format)
+  -- Serializes the optimizer as a Lua constructor call: global options,
+  -- layerwise options, update counter and averaged weights, in the order
+  -- taken by asgd:constructor. The format argument ("binary" when none
+  -- is given) is forwarded to util.to_lua_string.
+  local fmt          = format or "binary"
+  local g_opts_str   = table.tostring(self.global_options)
+  local l_opts_str   = table.tostring(self.layerwise_options)
+  local count_str    = tostring(self.count)
+  local aw_str       = util.to_lua_string(self.aw, fmt)
+  return ( "ann.optimizer.asgd(" .. g_opts_str .. "," .. l_opts_str .. "," ..
+             count_str .. "," .. aw_str .. ")" )
+end
+
+-- properties reported as needed by this optimizer
+local asgd_needs_properties = { gradient = true }
+function asgd_methods:needs_property(property)
+  -- true for a listed property, nil otherwise
+  return asgd_needs_properties[property]
+end
+
+-- properties reported as provided by this optimizer
+local asgd_has_properties = { average = true }
+function asgd_methods:has_property(property)
+  -- true for a listed property, nil otherwise
+  return asgd_has_properties[property]
+end
+
+function asgd_methods:get_averaged_weights()
+  return self.aw -- the table kept by the optimizer itself, not a copy
+end
+
diff --git a/packages/ann/optimizer/lua_src/optimizer_cg.lua b/packages/ann/optimizer/lua_src/optimizer_cg.lua
new file mode 100644
index 000000000..a8ebf0746
--- /dev/null
+++ b/packages/ann/optimizer/lua_src/optimizer_cg.lua
@@ -0,0 +1,346 @@
+local assert = assert
+local ipairs = ipairs
+local math = math
+local pairs = pairs
+local string = string
+local table = table
+local type = type
+--
+local april_assert = april_assert
+local get_table_fields = get_table_fields
+local iterator = iterator
+local mop = matrix.op
+local md = matrix.dict
+
+local MAX_UPDATES_WITHOUT_PRUNE = ann.optimizer.MAX_UPDATES_WITHOUT_PRUNE
+
+---------------------------------------
+--------- CONJUGATE GRADIENT ----------
+---------------------------------------
+
+-- Conjugate Gradient implementation, rewritten from the optim package of
+-- Torch 7, which is itself a rewrite of minimize.m by Carl E. Rasmussen.
+local cg, cg_methods = class("ann.optimizer.cg", ann.optimizer)
+ann.optimizer.cg = cg
+
+function cg:constructor(g_options, l_options, count,
+                        df0, df1, df2, df3, x0, s)
+  -- learning parameters accepted by this optimizer, as {name, description}
+  local supported_options = {
+    {"rho", "Constant for Wolf-Powell conditions (0.01)"},
+    {"sig", "Constant for Wolf-Powell conditions (0.5)"},
+    {"int", "Reevaluation limit (0.1)"},
+    {"ext", "Maximum number of extrapolations (3)"},
+    {"max_iter", "Maximum number of iterations (20)"},
+    {"ratio", "Maximum slope ratio (100)"},
+    {"max_eval", "Maximum number of evaluations (max_iter*1.25)"},
+    {"weight_decay", "Weight L2 regularization (0.0)"},
+    {"L1_norm", "Weight L1 regularization (0.0)"},
+    {"max_norm_penalty", "Weight max norm upper bound (0)"},
+  }
+  -- delegate the options and counter handling to the base optimizer
+  ann.optimizer.constructor(self, supported_options,
+                            g_options, l_options, count)
+  -- work buffers reused between execute() calls; every one is optional and
+  -- execute() allocates the missing ones from the weights
+  self.state = {
+    df0 = df0, df1 = df1,
+    df2 = df2, df3 = df3,
+    x0  = x0,
+    s   = s,
+  }
+  -- defaults are only installed when no global options table was given;
+  -- max_eval gets no default here, execute() falls back to max_iter*1.25
+  if not g_options then
+    self:set_option("rho",              0.01) -- Wolfe-Powell conditions constant
+    self:set_option("sig",              0.5)  -- Wolfe-Powell conditions constant
+    self:set_option("int",              0.1)  -- reevaluation limit
+    self:set_option("ext",              3.0)  -- maximum number of extrapolations
+    self:set_option("max_iter",         20)
+    self:set_option("ratio",            100)  -- maximum slope ratio
+    self:set_option("weight_decay",     0.0)
+    self:set_option("L1_norm",          0.0)
+    self:set_option("max_norm_penalty", 0.0)
+  end
+end
+
+function cg_methods:execute(eval, weights)
+  -- Runs one conjugate gradient optimization over weights (updated in place).
+  -- eval(weights, i) must return the loss followed by a gradients table
+  -- indexed by weight name. Returns the results of a final evaluation, plus
+  -- the sequence of accepted losses and the number of evaluations done, or
+  -- nil when the initial eval() yields no gradients.
+  local origw = weights
+  -- DO EVAL: calls eval() and adds the L1/L2 regularization terms to the
+  -- loss, and the L2 term to the gradients
+  local do_eval = function(x,i)
+    local arg = table.pack( eval(x, i) )
+    local tr_loss,gradients = table.unpack(arg)
+    -- failed evaluation: give the results back untouched, the caller checks
+    if not gradients then return arg end
+    local reg = 0.0
+    for wname,w in pairs(x) do
+      local l1 = self:get_option_of(wname, "L1_norm")
+      local l2 = self:get_option_of(wname, "weight_decay")
+      if l1 > 0.0 then reg = reg + l1*mop.abs(w):sum() end
+      if l2 > 0.0 then reg = reg + 0.5*l2*w:dot(w) gradients[wname]:axpy(l2, w) end
+    end
+    arg[1] = arg[1] + reg
+    return arg
+  end
+  -- UPDATE_WEIGHTS function
+  local update_weights = function(x, dir, s)
+    md.axpy(x, dir, s)
+    for wname,w in md.iterator(x) do
+      local l1 = self:get_option_of(wname, "L1_norm")
+      -- L1 regularization, truncated gradient implementation
+      if l1 > 0.0 then ann.optimizer.utils.l1_truncate_gradient(w, math.abs(dir)*l1) end
+    end
+  end
+  -- APPLY PENALTIES
+  local apply_penalties = function(x)
+    for wname,w in md.iterator(x) do
+      local mnp = self:get_option_of(wname, "max_norm_penalty")
+      -- constraints
+      if mnp > 0.0 then ann.optimizer.utils.max_norm_penalty(w, mnp) end
+    end
+    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
+      md.prune_subnormal_and_check_normal( x )
+    end
+  end
+  ----------------------------------------------------------------------------
+
+  -- count one more update iteration
+  self:count_one()
+
+  local x             = weights
+  local rho           = self:get_option("rho")
+  local sig           = self:get_option("sig")
+  local int           = self:get_option("int")
+  local ext           = self:get_option("ext")
+  local max_iter      = self:get_option("max_iter")
+  local ratio         = self:get_option("ratio")
+  local max_eval      = self:get_option("max_eval") or max_iter*1.25
+  local red           = 1
+
+  local i             = 0 -- counts the number of evaluations
+  local ls_failed     = false -- true when the previous line search failed
+  local fx            = {}
+
+  -- we need three points for the interpolation/extrapolation stuff
+  local z1,z2,z3 = 0,0,0
+  local d1,d2,d3 = 0,0,0
+  local f1,f2,f3 = 0,0,0
+
+  local df1 = self.state.df1 or md.clone_only_dims( x )
+  local df2 = self.state.df2 or md.clone_only_dims( x )
+  local df3 = self.state.df3 or md.clone_only_dims( x )
+
+  -- search direction
+  local s = self.state.s or md.clone_only_dims( x )
+
+  -- we need a temp storage for X
+  local x0  = self.state.x0 or md.clone( x )
+  local f0  = 0
+  local df0 = self.state.df0 or md.clone_only_dims( x )
+
+  -- evaluate at initial point
+  local arg = do_eval(origw, i)
+  local tr_loss,gradients = table.unpack(arg)
+  if not gradients then return nil end
+  f1 = tr_loss
+  table.insert(fx, f1)
+  md.copy(df1, gradients)
+  i=i+1
+
+  -- initial search direction
+  md.scal( md.copy(s, df1), -1 )
+
+  -- slope
+  d1 = -md.dot(s, s)
+  -- initial step
+  z1 = red/(1-d1)
+
+  while i < math.abs(max_eval) do
+    md.copy( x0, x )
+    f0 = f1
+    md.copy( df0, df1 )
+
+    update_weights(x, z1, s)
+
+    arg = do_eval(origw, i)
+    tr_loss,gradients = table.unpack(arg)
+    f2 = tr_loss
+
+    md.copy( df2, gradients )
+    i=i+1
+    d2 = md.dot( df2, s )
+    -- init point 3 equal to point 1
+    f3,d3,z3 = f1,d1,-z1
+    local m       = math.min(max_iter,max_eval-i)
+    local success = false
+    local limit   = -1
+
+    while true do
+      while (f2 > f1+z1*rho*d1 or d2 > -sig*d1) and m > 0 do
+        limit = z1
+        if f2 > f1 then
+          z2 = z3 - (0.5*d3*z3*z3)/(d3*z3+f2-f3)
+        else
+          local A = 6*(f2-f3)/z3+3*(d2+d3)
+          local B = 3*(f3-f2)-z3*(d3+2*d2)
+          z2 = (math.sqrt(B*B-A*d2*z3*z3)-B)/A
+        end
+        if z2 ~= z2 or z2 == math.huge or z2 == -math.huge then
+          z2 = z3/2
+        end
+        z2 = math.max(math.min(z2, int*z3),(1-int)*z3)
+        z1 = z1 + z2
+
+        update_weights(x, z2, s)
+        arg = do_eval(origw, i)
+        tr_loss,gradients = table.unpack(arg)
+        f2 = tr_loss
+        md.copy( df2, gradients )
+        i=i+1
+        m = m - 1
+        d2 = md.dot( df2, s )
+        z3 = z3-z2
+      end
+      if f2 > f1+z1*rho*d1 or d2 > -sig*d1 then
+        break
+      elseif d2 > sig*d1 then
+        success = true
+        break
+      elseif m == 0 then
+        break
+      end
+      local A = 6*(f2-f3)/z3+3*(d2+d3)
+      local B = 3*(f3-f2)-z3*(d3+2*d2)
+      z2 = -d2*z3*z3/(B+math.sqrt(B*B-A*d2*z3*z3))
+
+      if z2 ~= z2 or z2 == math.huge or z2 == -math.huge or z2 < 0 then
+        if limit < -0.5 then
+          z2 = z1 * (ext -1)
+        else
+          z2 = (limit-z1)/2
+        end
+      elseif (limit > -0.5) and (z2+z1) > limit then
+        z2 = (limit-z1)/2
+      elseif limit < -0.5 and (z2+z1) > z1*ext then
+        z2 = z1*(ext-1)
+      elseif z2 < -z3*int then
+        z2 = -z3*int
+      elseif limit > -0.5 and z2 < (limit-z1)*(1-int) then
+        z2 = (limit-z1)*(1-int)
+      end
+      f3=f2
+      d3=d2
+      z3=-z2
+      z1=z1+z2
+      update_weights(x, z2, s)
+
+      arg = do_eval(origw, i)
+      tr_loss,gradients = table.unpack(arg)
+      f2 = tr_loss
+      md.copy( df2, gradients )
+      i=i+1
+      m = m - 1
+      d2 = md.dot( df2, s )
+    end
+    if success then
+      f1 = f2
+      table.insert(fx, f1)
+      local ss = ( md.dot( df2, df2 ) - md.dot( df2, df1 ))/md.dot( df1, df1 )
+      md.scal( s, ss )
+      md.axpy( s, -1, df2 )
+      df1,df2 = df2,df1 -- swap derivatives
+      d2 = md.dot( df1, s )
+      if d2 > 0 then
+        md.copy( s, df1 )
+        md.scal( s, -1 )
+        d2 = -md.dot( s, s )
+      end
+      -- FLT_MIN is not defined in this file: it is used when the environment
+      -- provides it, otherwise a tiny constant keeps the divisor non-zero
+      z1 = z1 * math.min(ratio, d1/(d2 - (FLT_MIN or 1e-320)))
+      d1 = d2
+      ls_failed = false
+    else
+      md.copy( x, x0 )
+      f1 = f0
+      md.copy( df1, df0 )
+      -- give up when the previous line search failed too (two in a row) or
+      -- when the evaluation budget is exhausted
+      if ls_failed or i>max_eval then
+        break
+      end
+      df1,df2 = df2,df1 -- swap derivatives
+      md.copy( s, df1 )
+      md.scal( s, -1 )
+      d1 = -md.dot( s, s )
+      z1 = 1/(1-d1)
+      ls_failed = true
+    end
+  end
+  self.state.df0 = df0
+  self.state.df1 = df1
+  self.state.df2 = df2
+  self.state.df3 = df3
+  self.state.x0 = x0
+  self.state.s = s
+
+  apply_penalties(x)
+
+  -- evaluate the function at the end
+  arg = do_eval(origw, i)
+  -- returns the same as returned by eval(), plus the sequence of iteration
+  -- losses and the number of iterations
+  table.insert(arg, fx)
+  table.insert(arg, i)
+  return table.unpack(arg)
+end
+
+function cg_methods:clone()
+  -- Returns a new cg optimizer carrying copies of the update counter, the
+  -- options and every state buffer that has been allocated so far.
+  local copy = ann.optimizer.cg()
+  copy.count             = self.count
+  copy.layerwise_options = table.deep_copy(self.layerwise_options)
+  copy.global_options    = table.deep_copy(self.global_options)
+  -- names of the work buffers kept in self.state by execute()
+  local buffer_names = {
+    "df0", -- gradients saved before each line search
+    "df1", -- gradients at the current point
+    "df2", -- gradients at the trial point
+    "df3", -- allocated by execute() but not used by it
+    "x0",  -- weights saved before each line search
+    "s",   -- search direction
+  }
+  -- buffers are optional: only the ones already present are cloned
+  for _,name in ipairs(buffer_names) do
+    local buffer = self.state[name]
+    if buffer then
+      copy.state[name] = md.clone( buffer )
+    end
+  end
+  return copy
+end
+
+function cg_methods:to_lua_string(format)
+  -- Serializes the optimizer as a Lua constructor call with the global
+  -- options, the layerwise options and the update counter. The state
+  -- buffers are not written and the format argument is not used.
+  local g_opts_str = table.tostring(self.global_options)
+  local l_opts_str = table.tostring(self.layerwise_options)
+  local count_str  = tostring(self.count)
+  return ( "ann.optimizer.cg(" .. g_opts_str .. "," .. l_opts_str .. "," ..
+             count_str .. ")" )
+end
+
+-- properties reported as needed by this optimizer
+local cg_properties = { gradient = true }
+function cg_methods:needs_property(name)
+  -- true for a listed property, nil otherwise
+  return cg_properties[name]
+end
diff --git a/packages/ann/optimizer/lua_src/optimizer_quickprop.lua b/packages/ann/optimizer/lua_src/optimizer_quickprop.lua
new file mode 100644
index 000000000..7f19923e6
--- /dev/null
+++ b/packages/ann/optimizer/lua_src/optimizer_quickprop.lua
@@ -0,0 +1,170 @@
+local assert = assert
+local ipairs = ipairs
+local math = math
+local pairs = pairs
+local string = string
+local table = table
+local type = type
+--
+local april_assert = april_assert
+local get_table_fields = get_table_fields
+local iterator = iterator
+local mop = matrix.op
+local md = matrix.dict
+
+local MAX_UPDATES_WITHOUT_PRUNE = ann.optimizer.MAX_UPDATES_WITHOUT_PRUNE
+
+------------------------------
+--------- QUICKPROP ----------
+------------------------------
+
+local quickprop, quickprop_methods = class("ann.optimizer.quickprop",
+                                           ann.optimizer)
+ann.optimizer.quickprop = quickprop
+
+function quickprop:constructor(g_options, l_options, count, update, lastg)
+  -- the base optimizer, with the supported learning parameters
+  ann.optimizer.constructor(self,
+                            {
+                              {"learning_rate", "Learning speed factor (0.01)"},
+                              {"mu", "Maximum growth factor (1.75)"},
+                              {"epsilon", "Bootstrap factor (1e-04)"},
+			      {"max_step", "Maximum step value (1000)"},
+                              {"decay", "Decay of hyper-parameters (1e-05), global option"},
+                              {"weight_decay", "Weight L2 regularization (0.0)"},
+                              {"L1_norm", "Weight L1 regularization (0.0)"},
+                              {"max_norm_penalty", "Weight max norm upper bound (0)"},
+                            },
+			    g_options,
+			    l_options,
+			    count)
+  -- default values
+  if not g_options then
+    self:set_option("learning_rate", 0.01)
+    self:set_option("mu", 1.75)
+    self:set_option("epsilon", 1e-04)
+    self:set_option("max_step", 1000)
+    self:set_option("decay", 1e-05)
+    self:set_option("weight_decay", 0.0)
+    self:set_option("L1_norm", 0.0)
+    self:set_option("max_norm_penalty", 0.0)
+  end
+  self.update = update or {}
+  self.lastg  = lastg  or {}
+end
+
+function quickprop_methods:execute(eval, weights)
+  local table = table
+  local assert = assert
+  local math = math
+  --
+  local origw = weights
+  local arg = table.pack( eval(origw) )
+  local tr_loss,gradients = table.unpack(arg)
+  -- the gradient computation could fail returning nil, it is important to take
+  -- this into account
+  if not gradients then return nil end
+  local d0 = self:get_option("decay")
+  local decay = 1.0 / (1.0 + d0 * self:get_count())
+  for wname,w in pairs(weights) do
+    local update      = self.update[wname]
+    local lastg       = self.lastg[wname]
+    local grad        = gradients[wname]
+    -- learning options
+    local lr          = self:get_option_of(wname, "learning_rate")
+    local lrd         = lr * decay
+    local mu          = self:get_option_of(wname, "mu")
+    local epsilon     = self:get_option_of(wname, "epsilon")
+    local max_step    = self:get_option_of(wname, "max_step")
+    local l1          = self:get_option_of(wname, "L1_norm")
+    local l2          = self:get_option_of(wname, "weight_decay")
+    local mnp         = self:get_option_of(wname, "max_norm_penalty")
+    assert(self:get_option_of(wname, "decay") == d0,
+           "decay option cannot be defined layerwise, only globally")
+    if not update then
+      -- compute standard back-propagation learning rule
+      update = w:clone()
+      lastg  = grad:clone()
+      update:copy(grad)
+    else
+      local shrink = mu / (1.0 + mu)
+      -- compute quickprop update
+      update:map(lastg, grad,
+		 function(prev_step, prev_slope, slope)
+		   local step=0
+		   if math.abs(prev_step) > 1e-03 then
+		     if math.sign(slope) == math.sign(prev_step) then
+		       step = step + epsilon * slope
+		     end
+		     if ( (prev_step > 0 and slope > shrink*prev_slope) or
+                       (prev_step < 0 and slope < shrink*prev_slope) ) then
+		       step = step + mu * prev_step
+		     else
+		       step = step + (prev_step*slope) / (prev_slope - slope)
+		     end
+		   else
+		     step = step + epsilon * slope
+		   end
+		   if step > max_step then step = max_step
+		   elseif step < -max_step then
+		     step = -max_step
+		   end
+		   return step
+      end)
+      lastg:copy(grad)
+    end
+    --
+    self.update[wname] = update
+    self.lastg[wname]  = lastg
+    -- L2 regularization
+    if l2 > 0.0 then update:axpy(l2, w) end
+    -- apply update matrix to the weights
+    w:axpy(-lrd, update)
+    -- L1 regularization, truncated gradient implementation
+    if l1 > 0.0 then ann.optimizer.utils.l1_truncate_gradient(w, lrd*l1) end
+    -- constraints
+    if mnp > 0.0 then ann.optimizer.utils.max_norm_penalty(w, mnp) end
+    -- weights normality check
+    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
+      w:prune_subnormal_and_check_normal()
+    end
+  end
+  -- count one more update iteration
+  self:count_one()
+  -- returns the same as returned by eval()
+  return table.unpack(arg)
+end
+
+function quickprop_methods:clone()
+  local obj = ann.optimizer.quickprop()
+  obj.count             = self.count
+  obj.layerwise_options = table.deep_copy(self.layerwise_options)
+  obj.global_options    = table.deep_copy(self.global_options)
+  obj.update            = md.clone( self.update )
+  obj.lastg             = md.clone( self.lastg )
+  return obj
+end
+
+function quickprop_methods:to_lua_string(format)
+  local format = format or "binary"
+  local str_t = { "ann.optimizer.quickprop(",
+		  table.tostring(self.global_options),
+		  ",",
+		  table.tostring(self.layerwise_options),
+		  ",",
+		  tostring(self.count),
+		  ",",
+		  util.to_lua_string(self.update, format),
+		  ",",
+		  util.to_lua_string(self.lastg, format),
+		  ")" }
+  return table.concat(str_t, "")
+end
+
+local quickprop_properties = {
+  gradient = true
+}
+function quickprop_methods:needs_property(property)
+  return quickprop_properties[property]
+end
+
diff --git a/packages/ann/optimizer/lua_src/optimizer_rprop.lua b/packages/ann/optimizer/lua_src/optimizer_rprop.lua
new file mode 100644
index 000000000..c5e8d63da
--- /dev/null
+++ b/packages/ann/optimizer/lua_src/optimizer_rprop.lua
@@ -0,0 +1,155 @@
+local assert = assert
+local ipairs = ipairs
+local math = math
+local pairs = pairs
+local string = string
+local table = table
+local type = type
+--
+local april_assert = april_assert
+local get_table_fields = get_table_fields
+local iterator = iterator
+local mop = matrix.op
+local md = matrix.dict
+
+local MAX_UPDATES_WITHOUT_PRUNE = ann.optimizer.MAX_UPDATES_WITHOUT_PRUNE
+
+-----------------------------------
+--------- RESILIENT PROP ----------
+-----------------------------------
+
+local rprop, rprop_methods = class("ann.optimizer.rprop", ann.optimizer)
+ann.optimizer.rprop = rprop
+
+function rprop:constructor(g_options, l_options, count, steps, old_signs)
+  -- the base optimizer, with the supported learning parameters
+  ann.optimizer.constructor(self,
+                            {
+			      {"initial_step", "Initial weight update value (0.1)"},
+			      {"eta_plus", "Update value up by this factor (1.2)"},
+			      {"eta_minus", "Update value down by this factor (0.5)"},
+			      {"max_step", "Maximum value of update step (50)"},
+			      {"min_step", "Minimum value of update step (1e-05)"},
+			      {"niter", "Number of iterations (1)"},
+                              {"weight_decay", "Weight L2 regularization (0.0)"},
+                              {"L1_norm", "Weight L1 regularization (0.0)"},
+                              {"max_norm_penalty", "Weight max norm upper bound (0)"},
+			    },
+			    g_options,
+			    l_options,
+			    count)
+  self.steps     = steps or {}
+  self.old_signs = old_signs or {}
+  if not g_options then
+    -- default values
+    self:set_option("initial_step",  0.1)
+    self:set_option("eta_plus",      1.2)
+    self:set_option("eta_minus",     0.5)
+    self:set_option("max_step",      50)
+    self:set_option("min_step",      1e-05)
+    self:set_option("niter",         1)
+    self:set_option("weight_decay",  0.0)
+    self:set_option("L1_norm",       0.0)
+    self:set_option("max_norm_penalty", 0.0)
+  end
+end
+
+function rprop_methods:execute(eval, weights)
+  -- Runs "niter" rprop iterations. Each one calls eval(weights, i-1) and moves
+  -- every weight matrix by its per-weight step against the gradient sign.
+  -- Returns the values of the last eval() call, or nil if it gave no gradients.
+  local origw         = weights
+  local initial_step  = self:get_option("initial_step")
+  local eta_plus      = self:get_option("eta_plus")
+  local eta_minus     = self:get_option("eta_minus")
+  local max_step      = self:get_option("max_step")
+  local min_step      = self:get_option("min_step")
+  local niter         = self:get_option("niter")
+  local steps         = self.steps
+  local old_signs     = self.old_signs
+  local arg
+  for i=1,niter do
+    arg = table.pack( eval(origw, i-1) )
+    local tr_loss,gradients = table.unpack(arg)
+    -- the gradient computation could fail returning nil, it is important to
+    -- take this into account
+    if not gradients then return nil end
+    -- update every weight matrix in place
+    for wname,w in pairs(weights) do
+      local grad        = gradients[wname]
+      local old_sign    = old_signs[wname]
+      local step        = steps[wname] or w:clone():fill(initial_step)
+      -- learning options
+      local l1          = self:get_option_of(wname, "L1_norm")
+      local l2          = self:get_option_of(wname, "weight_decay")
+      local mnp         = self:get_option_of(wname, "max_norm_penalty")
+      -- sign matrix of the current gradient
+      local sign  = mop.sign(grad)
+      -- compute rprop learning step (needs the signs of a previous iteration)
+      if old_sign then
+        ann_optimizer_utils.rprop.step(step, old_sign, sign,
+                                       eta_minus, eta_plus)
+      end
+      step:clamp(min_step, max_step)
+      -- apply sign to rprop learning step
+      local update = mop.cmul(sign, step)
+      -- L2 regularization; compare with 0.0 because a number is always truthy
+      if l2 > 0.0 then update:axpy(l2, mop.cmul(step, w)) end
+      -- apply update to weights
+      w:axpy(-1.0, update)
+      -- L1 regularization, truncated gradient implementation
+      if l1 > 0.0 then
+        ann.optimizer.utils.l1_truncate_gradient(w, mop.scal(step, l1))
+      end
+      -- constraints
+      if mnp > 0.0 then ann.optimizer.utils.max_norm_penalty(w, mnp) end
+      -- keep matrices for the next iteration
+      old_signs[wname] = sign
+      steps[wname]     = step
+      -- weights normality check
+      if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
+        w:prune_subnormal_and_check_normal()
+      end
+    end
+    -- count one more update iteration
+    self:count_one()
+  end
+  -- returns the same as returned by eval()
+  return table.unpack(arg)
+end
+
+function rprop_methods:clone()
+  local obj = ann.optimizer.rprop()
+  obj.count             = self.count
+  obj.layerwise_options = table.deep_copy(self.layerwise_options)
+  obj.global_options    = table.deep_copy(self.global_options)
+  if self.steps then
+    obj.steps = md.clone( self.steps )
+  end
+  if self.old_signs then
+    obj.old_signs = md.clone( self.old_signs )
+  end
+  return obj
+end
+
+function rprop_methods:to_lua_string(format)
+  -- Serializes the optimizer as a constructor call. `format` is handed to
+  -- util.to_lua_string for the steps and old_signs tables, and falls back to
+  -- "binary" as the sgd and quickprop optimizers do.
+  local format = format or "binary"
+  local str_t = { "ann.optimizer.rprop(",
+                  table.tostring(self.global_options), ",",
+                  table.tostring(self.layerwise_options), ",",
+                  tostring(self.count), ",",
+                  util.to_lua_string(self.steps, format), ",",
+                  util.to_lua_string(self.old_signs, format),
+                  ")" }
+  return table.concat(str_t, "")
+end
+
+local rprop_properties = {
+  gradient = true
+}
+function rprop_methods:needs_property(property)
+  return rprop_properties[property]
+end
diff --git a/packages/ann/optimizer/lua_src/optimizer_sgd.lua b/packages/ann/optimizer/lua_src/optimizer_sgd.lua
new file mode 100644
index 000000000..3d6821e93
--- /dev/null
+++ b/packages/ann/optimizer/lua_src/optimizer_sgd.lua
@@ -0,0 +1,130 @@
+local assert = assert
+local ipairs = ipairs
+local math = math
+local pairs = pairs
+local string = string
+local table = table
+local type = type
+--
+local april_assert = april_assert
+local get_table_fields = get_table_fields
+local iterator = iterator
+local mop = matrix.op
+local md = matrix.dict
+
+local MAX_UPDATES_WITHOUT_PRUNE = ann.optimizer.MAX_UPDATES_WITHOUT_PRUNE
+
+------------------------------------------------
+--------- STOCHASTIC GRADIENT DESCENT ----------
+------------------------------------------------
+
+local sgd, sgd_methods = class("ann.optimizer.sgd", ann.optimizer)
+ann.optimizer.sgd = sgd -- global environment
+
+function sgd:constructor(g_options, l_options, count, update)
+  -- the base optimizer, with the supported learning parameters
+  ann.optimizer.constructor(self,
+                            {
+			      {"learning_rate", "Learning speed factor (0.01)"},
+			      {"momentum", "Learning inertia factor (0.0)"},
+                              {"decay", "Decay of hyper-parameters (1e-05), global option"},
+                              {"weight_decay", "Weight L2 regularization (0.0)"},
+                              {"L1_norm", "Weight L1 regularization (0.0)"},
+                              {"max_norm_penalty", "Weight max norm upper bound (0)"},
+			    },
+			    g_options,
+			    l_options,
+			    count)
+  self.update = update or {}
+  if not g_options then
+    -- default values
+    self:set_option("learning_rate", 0.01)
+    self:set_option("momentum", 0.0)
+    self:set_option("decay", 1e-05)
+    self:set_option("weight_decay", 0.0)
+    self:set_option("L1_norm", 0.0)
+    self:set_option("max_norm_penalty", 0.0)
+  end
+end
+
+function sgd_methods:execute(eval, weights)
+  local table = table
+  local assert = assert
+  --
+  local origw = weights
+  local arg = table.pack( eval(origw) )
+  local tr_loss,gradients = table.unpack(arg)
+  -- the gradient computation could fail returning nil, it is important to take
+  -- this into account
+  if not gradients then return nil end
+  --
+  local d0 = self:get_option("decay")
+  local decay = 1.0 / (1.0 + d0 * self:get_count())
+  --
+  for wname,w in pairs(weights) do
+    local update      = self.update[wname] or matrix.as(w):zeros()
+    local grad        = gradients[wname]
+    -- learning options
+    local lr          = self:get_option_of(wname, "learning_rate")
+    local lrd         = lr * decay
+    local mt          = self:get_option_of(wname, "momentum")
+    local l1          = self:get_option_of(wname, "L1_norm")
+    local l2          = self:get_option_of(wname, "weight_decay")
+    local mnp         = self:get_option_of(wname, "max_norm_penalty")
+    assert(self:get_option_of(wname, "decay") == d0,
+           "decay option cannot be defined layerwise, only globally")
+    -- L2 regularization
+    if l2 > 0.0 then grad:axpy(l2, w) end
+    -- momentum
+    if mt > 0.0 then update:scal(mt) else update:zeros() end
+    -- apply back-propagation learning rule to update matrix
+    update:axpy(lrd, grad)
+    -- apply update matrix to the weights
+    w:axpy(-1.0, update)
+    -- L1 regularization, truncated gradient implementation
+    if l1 > 0.0 then ann.optimizer.utils.l1_truncate_gradient(w, lrd*l1,
+                                                              update) end
+    -- constraints
+    if mnp > 0.0 then ann.optimizer.utils.max_norm_penalty(w, mnp) end
+    -- weights normality check
+    if self:get_count() % MAX_UPDATES_WITHOUT_PRUNE == 0 then
+      w:prune_subnormal_and_check_normal()
+    end
+    --
+    self.update[wname] = update
+  end
+  -- count one more update iteration
+  self:count_one()
+  -- returns the same as returned by eval()
+  return table.unpack(arg)
+end
+
+function sgd_methods:clone()
+  local obj = ann.optimizer.sgd()
+  obj.count             = self.count
+  obj.layerwise_options = table.deep_copy(self.layerwise_options)
+  obj.global_options    = table.deep_copy(self.global_options)
+  obj.update            = md.clone( self.update )
+  return obj
+end
+
+function sgd_methods:to_lua_string(format)
+  local format = format or "binary"
+  local str_t = { "ann.optimizer.sgd(",
+		  table.tostring(self.global_options),
+		  ",",
+		  table.tostring(self.layerwise_options),
+		  ",",
+		  tostring(self.count),
+		  ",",
+		  util.to_lua_string(self.update, format),
+		  ")" }
+  return table.concat(str_t, "")
+end
+
+local sgd_properties = {
+  gradient = true
+}
+function sgd_methods:needs_property(property)
+  return sgd_properties[property]
+end
diff --git a/packages/ann/optimizer/test/test-digits-asgd.lua b/packages/ann/optimizer/test/test-digits-asgd.lua
index 29d8551ad..eb4c0c931 100644
--- a/packages/ann/optimizer/test/test-digits-asgd.lua
+++ b/packages/ann/optimizer/test/test-digits-asgd.lua
@@ -12,24 +12,23 @@ T("ASGDTest", function()
     inf            = -1
     sup            =  1
     shuffle_random = random(5678)
-    learning_rate  = 0.08
-    lr_decay       = 0.75
-    weight_decay   = 1e-04
-    t0             = 5*math.ceil(800/bunch_size) -- five epochs
+    learning_rate  = 0.1
+    weight_decay   = 0.001
+    t0             = 5*800/bunch_size -- five epochs
     max_epochs     = 10
 
     -- training and validation
     errors = {
-      {2.2776384, 2.0342729},
-      {1.6926836, 1.2635630},
-      {0.9429189, 0.6279044},
-      {0.5317102, 0.3881207},
-      {0.3188521, 0.3284208},
-      {0.2210947, 0.2336490},
-      {0.1844755, 0.2313963},
-      {0.1819354, 0.2304380},
-      {0.1808625, 0.2299282},
-      {0.1803160, 0.2298454},
+      {2.2425103, 1.8482420},
+      {1.5127832, 1.2634643},
+      {0.7906535, 0.4813936},
+      {0.4786904, 0.3513147},
+      {0.2625008, 0.2448429},
+      {0.2053493, 0.1754262},
+      {0.1336887, 0.1607038},
+      {0.1040219, 0.1502100},
+      {0.0896987, 0.1430567},
+      {0.0798418, 0.1375536},
     }
     epsilon = 0.01
 
@@ -87,7 +86,6 @@ T("ASGDTest", function()
     trainer:build()
 
     trainer:set_option("learning_rate", learning_rate)
-    trainer:set_option("lr_decay", lr_decay)
     trainer:set_option("t0", t0)
     trainer:set_option("weight_decay",  weight_decay)
     -- bias has weight_decay of ZERO
@@ -121,11 +119,18 @@ T("ASGDTest", function()
     clock:go()
 
     -- print("Epoch Training  Validation")
+    local val_trainer = trainer:clone()
+    local tmp = os.tmpname()
     for epoch = 1,max_epochs do
       collectgarbage("collect")
       totalepocas = totalepocas+1
       errortrain,vartrain  = trainer:train_dataset(datosentrenar)
-      errorval,varval      = trainer:validate_dataset(datosvalidar)
+      val_trainer:build{
+        weights = trainer:get_optimizer():get_averaged_weights()
+      }
+      errorval,varval = val_trainer:validate_dataset(datosvalidar)
+      trainer:save(tmp)
+      trainer = trainable.supervised_trainer.load(tmp)
       printf("%4d  %.7f %.7f :: %.7f %.7f\n",
              totalepocas,errortrain,errorval,vartrain,varval)
       check.number_eq(errortrain, errors[epoch][1], epsilon,
@@ -137,11 +142,10 @@ T("ASGDTest", function()
                                       "reference error %g",
                                     errorval, errors[epoch][2]))
     end
-
+    os.remove(tmp)
     clock:stop()
     cpu,wall = clock:read()
-    --printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
-    --printf("CPU  total time: %.3f    per epoch: %.3f\n", cpu, cpu/max_epochs)
+    -- printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
+    -- printf("CPU  total time: %.3f    per epoch: %.3f\n", cpu, cpu/max_epochs)
     -- print("Test passed! OK!")
 end)
-
diff --git a/packages/ann/optimizer/test/test-digits-cg.lua b/packages/ann/optimizer/test/test-digits-cg.lua
index 8dd24e3c8..13096532c 100644
--- a/packages/ann/optimizer/test/test-digits-cg.lua
+++ b/packages/ann/optimizer/test/test-digits-cg.lua
@@ -12,9 +12,7 @@ T("ConjugateGradientTest", function()
     inf            = -1
     sup            =  1
     shuffle_random = random(5678)
-    rho            = 0.01
-    sig            = 0.8
-    weight_decay   = 1e-05
+    weight_decay   = 0.001
     max_epochs     = 10
 
     -- training and validation
@@ -86,8 +84,6 @@ ascii
                                            ann.optimizer.cg())
     trainer:build()
 
-    trainer:set_option("rho", rho)
-    trainer:set_option("sig", sig)
     trainer:set_option("weight_decay",  weight_decay)
     -- bias has weight_decay of ZERO
     trainer:set_layerwise_option("b.", "weight_decay", 0)
@@ -120,11 +116,14 @@ ascii
     clock:go()
 
     -- print("Epoch Training  Validation")
+    local tmp = os.tmpname()
     for epoch = 1,max_epochs do
       collectgarbage("collect")
       totalepocas = totalepocas+1
       errortrain,vartrain  = trainer:train_dataset(datosentrenar)
       errorval,varval      = trainer:validate_dataset(datosvalidar)
+      trainer:save(tmp)
+      trainer = trainable.supervised_trainer.load(tmp)
       printf("%4d  %.7f %.7f :: %.7f %.7f :: %f\n",
              totalepocas,errortrain,errorval,vartrain,varval,trainer:norm2("w.*"))
       --check.number_eq(errortrain, errors:get(epoch,1), epsilon,
@@ -136,7 +135,7 @@ ascii
                                       "reference error %g",
                                     errorval, errors:get(epoch,2)))
     end
-
+    os.remove(tmp)
     clock:stop()
     cpu,wall = clock:read()
     --printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
diff --git a/packages/ann/optimizer/test/test-digits-l1.lua b/packages/ann/optimizer/test/test-digits-l1.lua
index 26f75cf7b..c303881bd 100644
--- a/packages/ann/optimizer/test/test-digits-l1.lua
+++ b/packages/ann/optimizer/test/test-digits-l1.lua
@@ -1,146 +1,150 @@
 mathcore.set_use_cuda_default(util.is_cuda_available())
 --
--- un generador de valores aleatorios... y otros parametros
-bunch_size     = tonumber(arg[1]) or 64
-semilla        = 1234
-weights_random = random(semilla)
-description    = "256 inputs 256 tanh 128 tanh 10 log_softmax"
-inf            = -1
-sup            =  1
-shuffle_random = random(5678)
-learning_rate  = 0.08
-momentum       = 0.01
-L1_norm        = 0.001
-max_epochs     = 10
-
--- training and validation
-errors = {
-  {2.3165729, 2.2201636},
-  {2.1821389, 2.0622385},
-  {1.9339662, 1.8144050},
-  {1.8861914, 1.7708337},
-  {1.8548096, 1.9131246},
-  {1.7150941, 1.7762133},
-  {1.7553701, 1.7308848},
-  {1.6740500, 1.4985144},
-  {1.3345400, 1.2828860},
-  {1.4751233, 1.1786772},
-}
-epsilon = 1e-04
-
---------------------------------------------------------------
-
-m1 = ImageIO.read(string.get_path(arg[0]) .. "../../ann/test/digits.png"):to_grayscale():invert_colors():matrix()
-train_input = dataset.matrix(m1,
-			     {
-			       patternSize = {16,16},
-			       offset      = {0,0},
-			       numSteps    = {80,10},
-			       stepSize    = {16,16},
-			       orderStep   = {1,0}
-			     })
-
-val_input  = dataset.matrix(m1,
-			    {
-			      patternSize = {16,16},
-			      offset      = {1280,0},
-			      numSteps    = {20,10},
-			      stepSize    = {16,16},
-			      orderStep   = {1,0}
-			    })
--- una matriz pequenya la podemos cargar directamente
-m2 = matrix(10,{1,0,0,0,0,0,0,0,0,0})
-
--- ojito con este dataset, fijaros que usa una matriz de dim 1 y talla
--- 10 PERO avanza con valor -1 y la considera CIRCULAR en su unica
--- dimension
-
-train_output = dataset.matrix(m2,
-			      {
-				patternSize = {10},
-				offset      = {0},
-				numSteps    = {800},
-				stepSize    = {-1},
-				circular    = {true}
-			      })
-
-val_output   = dataset.matrix(m2,
-			      {
-				patternSize = {10},
-				offset      = {0},
-				numSteps    = {200},
-				stepSize    = {-1},
-				circular    = {true}
-			      })
-
-
-thenet = ann.mlp.all_all.generate(description)
-trainer = trainable.supervised_trainer(thenet,
-				       ann.loss.multi_class_cross_entropy(10),
-				       bunch_size)
-trainer:build()
-
-trainer:set_option("learning_rate", learning_rate)
-trainer:set_option("momentum",      momentum)
-trainer:set_option("L1_norm",       L1_norm)
--- bias has weight_decay of ZERO
-trainer:set_layerwise_option("b.", "L1_norm", 0)
-
-trainer:randomize_weights{
-  random      = weights_random,
-  inf         = inf,
-  sup         = sup,
-  use_fanin   = true,
-}
-
--- datos para entrenar
-datosentrenar = {
-  input_dataset  = train_input,
-  output_dataset = train_output,
-  shuffle        = shuffle_random,
-}
-
-datosvalidar = {
-  input_dataset  = val_input,
-  output_dataset = val_output,
-}
-
-totalepocas = 0
-
-errorval = trainer:validate_dataset(datosvalidar)
--- print("# Initial validation error:", errorval)
-
-clock = util.stopwatch()
-clock:go()
-
--- print("Epoch Training  Validation")
-for epoch = 1,max_epochs do
-  collectgarbage("collect")
-  totalepocas = totalepocas+1
-  errortrain,vartrain  = trainer:train_dataset(datosentrenar)
-  errorval,varval      = trainer:validate_dataset(datosvalidar)
-  printf("%4d  %.7f %.7f :: %.7f %.7f\n",
-  	 totalepocas,errortrain,errorval,vartrain,varval)
- if math.abs(errortrain - errors[epoch][1]) > epsilon then
-   error(string.format("Training error %g is not equal enough to "..
-                         "reference error %g",
-                       errortrain, errors[epoch][1]))
- end
- if math.abs(errorval - errors[epoch][2]) > epsilon then
-   error(string.format("Validation error %g is not equal enough to "..
-                         "reference error %g",
-                       errorval, errors[epoch][2]))
- end
-end
-
-clock:stop()
-cpu,wall = clock:read()
---printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
---printf("CPU  total time: %.3f    per epoch: %.3f\n", cpu, cpu/max_epochs)
--- print("Test passed! OK!")
-
-for wname,w in trainer:iterate_weights("w.*") do
-  local v = w:clone():abs():min()
-  assert(v == 0 or v > L1_norm)
-  -- print(w:clone():eq(0.0):sum(), w:size())
-end
+local check = utest.check
+local T = utest.test
+--
+T("L1TestDigits", function()
+    -- a random number generator... and other parameters
+    bunch_size     = tonumber(arg[1]) or 64
+    semilla        = 1234
+    weights_random = random(semilla)
+    description    = "256 inputs 256 tanh 128 tanh 10 log_softmax"
+    inf            = -1
+    sup            =  1
+    shuffle_random = random(5678)
+    learning_rate  = 0.08
+    momentum       = 0.0
+    L1_norm        = 0.001
+    max_epochs     = 10
+
+    -- training and validation
+    errors = {
+      {2.2798486, 2.0456107},
+      {1.7129538, 1.2954185},
+      {0.9751059, 0.6590891},
+      {0.5633602, 0.4138165},
+      {0.3464335, 0.3450162},
+      {0.2428290, 0.2518864},
+      {0.1867137, 0.1979152},
+      {0.1466725, 0.1708217},
+      {0.1282059, 0.1904573},
+      {0.1170338, 0.1766910},
+    }
+    epsilon = 0.05 -- 5%
+
+    --------------------------------------------------------------
+
+    m1 = ImageIO.read(string.get_path(arg[0]) .. "../../ann/test/digits.png"):to_grayscale():invert_colors():matrix()
+    train_input = dataset.matrix(m1,
+                                 {
+                                   patternSize = {16,16},
+                                   offset      = {0,0},
+                                   numSteps    = {80,10},
+                                   stepSize    = {16,16},
+                                   orderStep   = {1,0}
+    })
+
+    val_input  = dataset.matrix(m1,
+                                {
+                                  patternSize = {16,16},
+                                  offset      = {1280,0},
+                                  numSteps    = {20,10},
+                                  stepSize    = {16,16},
+                                  orderStep   = {1,0}
+    })
+    -- a small matrix can be loaded directly
+    m2 = matrix(10,{1,0,0,0,0,0,0,0,0,0})
+
+    -- be careful with this dataset: it uses a one-dimensional matrix of size
+    -- 10, BUT it advances with step -1 and treats it as CIRCULAR in its only
+    -- dimension
+
+    train_output = dataset.matrix(m2,
+                                  {
+                                    patternSize = {10},
+                                    offset      = {0},
+                                    numSteps    = {800},
+                                    stepSize    = {-1},
+                                    circular    = {true}
+    })
+
+    val_output   = dataset.matrix(m2,
+                                  {
+                                    patternSize = {10},
+                                    offset      = {0},
+                                    numSteps    = {200},
+                                    stepSize    = {-1},
+                                    circular    = {true}
+    })
+
+
+    thenet = ann.mlp.all_all.generate(description)
+    trainer = trainable.supervised_trainer(thenet,
+                                           ann.loss.multi_class_cross_entropy(10),
+                                           bunch_size)
+    trainer:build()
+
+    trainer:set_option("learning_rate", learning_rate)
+    trainer:set_option("momentum",      momentum)
+    trainer:set_option("L1_norm",       L1_norm)
+    -- bias has L1_norm of ZERO
+    trainer:set_layerwise_option("b.", "L1_norm", 0)
+
+    trainer:randomize_weights{
+      random      = weights_random,
+      inf         = inf,
+      sup         = sup,
+      use_fanin   = true,
+    }
+
+    -- training data
+    datosentrenar = {
+      input_dataset  = train_input,
+      output_dataset = train_output,
+      shuffle        = shuffle_random,
+    }
+
+    datosvalidar = {
+      input_dataset  = val_input,
+      output_dataset = val_output,
+    }
+
+    totalepocas = 0
+
+    errorval = trainer:validate_dataset(datosvalidar)
+    -- print("# Initial validation error:", errorval)
+
+    clock = util.stopwatch()
+    clock:go()
+
+    -- print("Epoch Training  Validation")
+    for epoch = 1,max_epochs do
+      collectgarbage("collect")
+      totalepocas = totalepocas+1
+      errortrain,vartrain  = trainer:train_dataset(datosentrenar)
+      errorval,varval      = trainer:validate_dataset(datosvalidar)
+      printf("%4d  %.7f %.7f :: %.7f %.7f\n",
+             totalepocas,errortrain,errorval,vartrain,varval)
+      check.number_eq(errortrain, errors[epoch][1], epsilon,
+                      string.format("Training error %g is not equal enough to "..
+                                      "reference error %g",
+                                    errortrain, errors[epoch][1]))
+      check.number_eq(errorval, errors[epoch][2], epsilon,
+                      string.format("Validation error %g is not equal enough to "..
+                                      "reference error %g",
+                                    errorval, errors[epoch][2]))
+    end
+
+    clock:stop()
+    cpu,wall = clock:read()
+    --printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
+    --printf("CPU  total time: %.3f    per epoch: %.3f\n", cpu, cpu/max_epochs)
+    -- print("Test passed! OK!")
+
+    for wname,w in trainer:iterate_weights("w.*") do
+      local v = w:clone():abs():min()
+      check.TRUE(v == 0 or v > L1_norm)
+      check.gt(w:eq(0.0):to_float():sum(), 0)
+      -- print(w:eq(0.0):to_float():sum())
+    end
+end)
diff --git a/packages/ann/optimizer/test/test-digits-qprop.lua b/packages/ann/optimizer/test/test-digits-qprop.lua
index b1a0c47da..9eedb89a6 100644
--- a/packages/ann/optimizer/test/test-digits-qprop.lua
+++ b/packages/ann/optimizer/test/test-digits-qprop.lua
@@ -116,11 +116,14 @@ T("QuickPropTest", function()
     clock:go()
 
     -- print("Epoch Training  Validation")
+    local tmp = os.tmpname()
     for epoch = 1,max_epochs do
       collectgarbage("collect")
       totalepocas = totalepocas+1
       errortrain,vartrain  = trainer:train_dataset(datosentrenar)
       errorval,varval      = trainer:validate_dataset(datosvalidar)
+      trainer:save(tmp)
+      trainer = trainable.supervised_trainer.load(tmp)
       printf("%4d  %.7f %.7f :: %.7f %.7f\n",
              totalepocas,errortrain,errorval,vartrain,varval)
       check.number_eq(errortrain, errors:get(epoch,1), epsilon,
@@ -132,7 +135,7 @@ T("QuickPropTest", function()
                                       "reference error %g",
                                     errorval, errors:get(epoch,2)))
     end
-
+    os.remove(tmp)
     clock:stop()
     cpu,wall = clock:read()
     --printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
diff --git a/packages/ann/optimizer/test/test-digits-rprop.lua b/packages/ann/optimizer/test/test-digits-rprop.lua
index 70f3332a5..b19a6ff03 100644
--- a/packages/ann/optimizer/test/test-digits-rprop.lua
+++ b/packages/ann/optimizer/test/test-digits-rprop.lua
@@ -115,11 +115,14 @@ ascii
     clock:go()
 
     -- print("Epoch Training  Validation")
+    local tmp = os.tmpname()
     for epoch = 1,max_epochs do
       collectgarbage("collect")
       totalepocas = totalepocas+1
       errortrain,vartrain  = trainer:train_dataset(datosentrenar)
       errorval,varval      = trainer:validate_dataset(datosvalidar)
+      trainer:save(tmp)
+      trainer = trainable.supervised_trainer.load(tmp)
       printf("%4d  %.7f %.7f :: %.7f %.7f :: %f\n",
              totalepocas,errortrain,errorval,vartrain,varval,trainer:norm2("w.*"))
       check.number_eq(errortrain, errors:get(epoch,1), epsilon,
@@ -131,6 +134,7 @@ ascii
                                       "reference error %g",
                                     errorval, errors:get(epoch,2)))
     end
+    os.remove(tmp)
     clock:stop()
     cpu,wall = clock:read()
     --printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
diff --git a/packages/ann/optimizer/test/test-digits-sgd.lua b/packages/ann/optimizer/test/test-digits-sgd.lua
index 5a062008a..38bf9f928 100644
--- a/packages/ann/optimizer/test/test-digits-sgd.lua
+++ b/packages/ann/optimizer/test/test-digits-sgd.lua
@@ -3,7 +3,23 @@ mathcore.set_use_cuda_default(util.is_cuda_available())
 local check = utest.check
 local T = utest.test
 --
-T("SGDTest", function()
+T("SGDConvexTest", function()
+    local opt = ann.optimizer.sgd()
+    opt:set_option("learning_rate", 0.01)
+    opt:set_option("momentum", 0.02)
+    -- optimize quadratic function: f(x) = 3*x^2 - 2*x + 10
+    local function f(x) return (3*x^2 - 2*x + 10):sum() end
+    local function df_dx(x) return 6*x - 2 end
+    -- df(x)/dx = 6*x - 2
+    -- the minimum is in x=0.333
+    local x = matrix(1,1,{-100})
+    for i=1,200 do
+      opt:execute(function() return f(x),{df_dx(x)} end, {x})
+    end
+    check.eq(x, matrix(1,1,{0.333}))
+end)
+
+T("SGDTestDigits", function()
     -- un generador de valores aleatorios... y otros parametros
     bunch_size     = tonumber(arg[1]) or 64
     semilla        = 1234
@@ -30,7 +46,7 @@ T("SGDTest", function()
       {0.1077118, 0.1718368},
       {0.0960633, 0.1591717},
     }
-    epsilon = 0.01
+    epsilon = 0.01 -- 1% relative difference
 
     --------------------------------------------------------------
 
@@ -116,13 +132,16 @@ T("SGDTest", function()
 
     clock = util.stopwatch()
     clock:go()
-
+    local weights = trainer.weights_table
     -- print("Epoch Training  Validation")
+    local tmp = os.tmpname()
     for epoch = 1,max_epochs do
       collectgarbage("collect")
       totalepocas = totalepocas+1
       errortrain,vartrain  = trainer:train_dataset(datosentrenar)
       errorval,varval      = trainer:validate_dataset(datosvalidar)
+      trainer:save(tmp)
+      trainer = trainable.supervised_trainer.load(tmp)
       printf("%4d  %.7f %.7f :: %.7f %.7f\n",
              totalepocas,errortrain,errorval,vartrain,varval)
       check.number_eq(errortrain, errors[epoch][1], epsilon,
@@ -134,7 +153,7 @@ T("SGDTest", function()
                                       "reference error %g",
                                     errorval, errors[epoch][2]))
     end
-
+    os.remove(tmp)
     clock:stop()
     cpu,wall = clock:read()
     --printf("Wall total time: %.3f    per epoch: %.3f\n", wall, wall/max_epochs)
diff --git a/packages/autodiff/ann/lua_src/autodiff-ann.lua b/packages/autodiff/ann/lua_src/autodiff-ann.lua
index 685cb8141..3372c9d8f 100644
--- a/packages/autodiff/ann/lua_src/autodiff-ann.lua
+++ b/packages/autodiff/ann/lua_src/autodiff-ann.lua
@@ -4,6 +4,43 @@
 local AD = autodiff
 AD.ann   = AD.ann or {}
 
+-- Builds an ann.components.wrapper model from: the operation symbol f, the input
+-- symbol i, the weight symbols, the shared table of matrices, and input/output sizes.
+function AD.ann.model(f, i, symbols, shared, isize, osize)
+  assert(type(f) == "table", "Needs a symbol as first argument")
+  assert(type(i) == "table", "Needs a symbol as second argument")
+  assert(type(symbols) == "table",
+         "Needs a symbols or a table of symbols as third argument")
+  local diff,func,M = AD.diff,AD.func,AD.matrix
+  local seed = M("seed")
+  local df_dw_tbl = table.pack( diff(f, symbols, seed) )
+  local compiled_f = func(f, { i }, shared)
+  local compiled_df_dw = func(df_dw_tbl, { i, f, seed }, shared)
+  local model = ann.components.wrapper{
+    input = isize,
+    output = osize,
+    weights = shared,
+    state = { f = f, df_dw_tbl = df_dw_tbl, symbols = symbols, cache = {} },
+    forward = function(self, input, during_training)
+      return compiled_f(input, self.state.cache)
+    end,
+    backprop = function(self, seed)
+    end,
+    compute_gradients = function(self,dict)
+      local dw = table.pack( compiled_df_dw(self:get_input(),
+                                            self:get_output(),
+                                            self:get_error_input(),
+                                            self.state.cache) )
+      for i,s in ipairs(symbols) do dict[s.name] = dw[i] end
+      return dict
+    end,
+    reset = function(self)
+      self.state.cache  = {}
+    end,
+  }
+  return model
+end
+
 -- RECTIFIED LINER
 function AD.ann.relu(a)
   return AD.op.cmul(a, AD.op.gt(a,0))
diff --git a/packages/autodiff/ann/test/test-digits.lua b/packages/autodiff/ann/test/test-digits.lua
index d4d67c212..c0122cd88 100644
--- a/packages/autodiff/ann/test/test-digits.lua
+++ b/packages/autodiff/ann/test/test-digits.lua
@@ -1,12 +1,15 @@
-local learning_rate  = 0.01
+local learning_rate  = 0.1
 local momentum       = 0.1
-local weight_decay   = 1e-01
+local weight_decay   = 0.001
 local semilla        = 1234
 local rnd            = random(semilla)
 local H1             = 256
 local H2             = 128
-local M              = matrix.col_major
-local bunch_size     = 32
+local M              = matrix
+local bunch_size     = 64
+
+-- smooth learning rate depending on bunch size
+local learning_rate = learning_rate * bunch_size / math.sqrt(bunch_size)
 --
 --------------------------------------------------------------
 
@@ -123,27 +126,25 @@ opt:set_option("momentum", momentum)
 --
 
 -- WEIGHTS DICTIONARY
-local weights_dict = matrix.dict(weights)
-
 local ds_pair_it = trainable.dataset_pair_iterator
 -- traindataset
 local function train_dataset(in_ds,out_ds)
-  local mv = stats.mean_var()
+  local mv = stats.running.mean_var()
   for input_bunch,output_bunch in ds_pair_it{ input_dataset=in_ds,
 					      output_dataset=out_ds,
 					      bunch_size=bunch_size,
 					      shuffle = rnd, } do
     local loss
-    loss = opt:execute(function(params)
-                         if params ~= weights then
-                           dw_func:set_shared(params)
-                         end
-			 local loss,b1,w1,b2,w2,
-			 b3,w3 = dw_func(input_bunch:get_matrix():transpose(),
-					 output_bunch:get_matrix():transpose())
-			 return loss, { b1=b1, w1=w1, b2=b2, w2=w2, b3=b3, w3=w3 }
-		       end,
-		       weights_dict)
+    loss = opt:execute(function(params,it)
+        if params ~= dw_func:get_shared() then
+          dw_func:set_shared(params)
+        end
+        local loss,b1,w1,b2,w2,
+        b3,w3 = dw_func(input_bunch:transpose(),
+                        output_bunch:transpose())
+        local grads = { b1=b1, w1=w1, b2=b2, w2=w2, b3=b3, w3=w3 }
+        return loss, grads end,
+      dw_func:get_shared())
     mv:add(loss)
   end
   return mv:compute()
@@ -151,12 +152,12 @@ end
 
 -- validatedataset
 local function validate_dataset(in_ds,out_ds)
-  local mv = stats.mean_var()
+  local mv = stats.running.mean_var()
   for input_bunch,output_bunch in ds_pair_it{ input_dataset=in_ds,
 					      output_dataset=out_ds,
 					      bunch_size=bunch_size } do
-    local loss = L_func(input_bunch:get_matrix():transpose(),
-			output_bunch:get_matrix():transpose())
+    local loss = L_func(input_bunch:transpose(),
+			output_bunch:transpose())
     mv:add(loss)
   end
   return mv:compute()
@@ -170,7 +171,7 @@ while train_func:execute(function()
 							 train_output)
 			   local va_loss = validate_dataset(val_input,
 							    val_output)
-			   return weights_dict,tr_loss,va_loss
+			   return dw_func:get_shared(),tr_loss,va_loss
 			 end) do
   print(train_func:get_state_string())
 end
diff --git a/packages/autodiff/autodiff/lua_src/autodiff.lua b/packages/autodiff/autodiff/lua_src/autodiff.lua
index 33a3c2e5c..0cfd276a2 100644
--- a/packages/autodiff/autodiff/lua_src/autodiff.lua
+++ b/packages/autodiff/autodiff/lua_src/autodiff.lua
@@ -608,6 +608,7 @@ function autodiff.func(s, args, shared_values, optimize)
     outputs       = s,
     shared_values = shared_values,
     funcs         = funcs,
+    get_shared    = function(self) return self.shared_values end,
     set_shared    = function(self,new_shared_values)
       for name,w in pairs(new_shared_values) do
         self.shared_values[name] = w
diff --git a/packages/autodiff/autodiff/lua_src/matrix.lua b/packages/autodiff/autodiff/lua_src/matrix.lua
index 77ceac42a..dbaf40bde 100644
--- a/packages/autodiff/autodiff/lua_src/matrix.lua
+++ b/packages/autodiff/autodiff/lua_src/matrix.lua
@@ -550,7 +550,7 @@ autodiff.op[MATRIX] = {
 		     function(self, ...)
 		       local a = self.args[1]:eval(...)
 		       local b = self.args[2]:eval(...)
-		       return a:clone():lt(b)
+		       return a:clone():lt(b):to_float()
 		     end,
 		     function(self, seed, result)
 		       return result
@@ -558,7 +558,7 @@ autodiff.op[MATRIX] = {
 		     function(self, dest)
 		       local a,b = self.args[1],self.args[2]
 		       local str_tbl = { a.var_name,
-					 ':clone():lt(', b.var_name, ')' }
+					 ':clone():lt(', b.var_name, '):to_float()' }
 		       dest:write_expr_assign(self.var_name,
 					      table.concat(str_tbl, ""))
 		     end)
@@ -577,7 +577,7 @@ autodiff.op[MATRIX] = {
 		     function(self, ...)
 		       local a = self.args[1]:eval(...)
 		       local b = self.args[2]:eval(...)
-		       return a:clone():gt(b)
+		       return a:clone():gt(b):to_float()
 		     end,
 		     function(self, seed, result)
 		       return result
@@ -585,7 +585,7 @@ autodiff.op[MATRIX] = {
 		     function(self, dest)
 		       local a,b = self.args[1],self.args[2]
 		       local str_tbl = { a.var_name,
-					 ':clone():gt(', b.var_name, ')' }
+					 ':clone():gt(', b.var_name, '):to_float()' }
 		       dest:write_expr_assign(self.var_name,
 					      table.concat(str_tbl, ""))
 		     end)
@@ -965,7 +965,36 @@ end
     if a.dims then s:set_dims(a.dims) end
     return s
   end,
-  
+
+  -- Element-wise clamp of a into [lower,upper]; the gradient only flows through
+  -- the elements of a lying strictly inside the range (clipped ones get zero).
+  clamp = function(a,lower,upper)
+    local a,lower,upper = coercion(a),coercion(lower),coercion(upper)
+    local s = gen_op('clamp', MATRIX, {a,lower,upper},
+		     function(self, ...)
+		       local a = self.args[1]:eval(...)
+		       local lower = self.args[2]:eval(...)
+		       local upper = self.args[3]:eval(...)
+		       -- TODO: check types
+		       return a:clone():clamp(lower, upper)
+		     end,
+		     function(self, seed, result)
+		       local a,lower,upper = self.args[1],self.args[2],self.args[3]
+		       local op = autodiff.op
+		       local inside = op.cmul(op.gt(a,lower), op.lt(a,upper))
+		       a:diff(op.cmul(seed, inside), result)
+		       return result
+		     end,
+		     function(self, dest)
+		       local a,lower,upper = self.args[1],self.args[2],self.args[3]
+		       local str_tbl = { a.var_name, ':clone():clamp(',
+					 lower.var_name, ',', upper.var_name, ')' }
+		       dest:write_expr_assign(self.var_name,
+					      table.concat(str_tbl, ""))
+		     end)
+    if a.dims then s:set_dims(a.dims) end
+    return s
+  end,
 }
 
 ------------------------------------------------------------------------------
diff --git a/packages/autodiff/autodiff/lua_src/scalar.lua b/packages/autodiff/autodiff/lua_src/scalar.lua
index 0708f18b5..a85cdb97b 100644
--- a/packages/autodiff/autodiff/lua_src/scalar.lua
+++ b/packages/autodiff/autodiff/lua_src/scalar.lua
@@ -291,6 +291,34 @@ autodiff.op[SCALAR] = {
 		     end)
     return s
   end,
+  
+  clamp = function(a,lower,upper)
+    local a,lower,upper = coercion(a),coercion(lower),coercion(upper)    
+    local s = gen_op('clamp', SCALAR, {a,lower,upper},
+		     function(self, ...)
+		       local a = self.args[1]:eval(...)
+                       local lower = self.args[2]:eval(...)
+                       local upper = self.args[3]:eval(...)
+		       return math.clamp(a,lower,upper)
+		     end,
+		     function(self, seed, result)
+		       local a = self.args[1]
+		       a:diff(seed, result)
+		       return result
+		     end,
+		     function(self, dest)
+		       local a = self.args[1]
+                       local lower = self.args[2]
+                       local upper = self.args[3]
+		       local str_tbl = { "math.clamp(",
+                                         a.var_name, ",",
+                                         lower.var_name, ",",
+                                         upper.var_name, ")" }
+		       dest:write_expr_assign(self.var_name,
+					      table.concat(str_tbl, " "))
+    end)
+    return s
+  end,
 
   -- matrix operations
   fill = function(a,b) return b end,
diff --git a/packages/autodiff/autodiff/test/test-xor.lua b/packages/autodiff/autodiff/test/test-xor.lua
index f130b7886..f12bb91a3 100644
--- a/packages/autodiff/autodiff/test/test-xor.lua
+++ b/packages/autodiff/autodiff/test/test-xor.lua
@@ -4,7 +4,7 @@ local weight_decay   = 1e-05
 local semilla        = 1234
 local rnd            = random(semilla)
 --
-local M = matrix.col_major
+local M = matrix
 
 m_xor = matrix.fromString[[
     4 3
@@ -20,7 +20,7 @@ ds_output = dataset.matrix(m_xor,{offset={0,2},patternSize={1,1}})
 
 m = matrix.fromString[[
     3 3
-    ascii col_major
+    ascii
       -0.5 -1.2 1.0
       -2.0 4.0 -4.0
       -1.0 2.0 2.0
diff --git a/packages/autodiff/autodiff/test/test.lua b/packages/autodiff/autodiff/test/test.lua
index 213d21422..ec77ca9fd 100644
--- a/packages/autodiff/autodiff/test/test.lua
+++ b/packages/autodiff/autodiff/test/test.lua
@@ -5,7 +5,7 @@ local a,w,w2 = AD.matrix('a w w2')
 local b,c = AD.matrix('b c')
 
 local rnd = random(1234)
-local M   = matrix.col_major
+local M   = matrix
 
 weights = {
   w  = M(3,4):uniformf(0,1,rnd),
@@ -69,7 +69,7 @@ L = autodiff.op.sum( (f - target)^2 )
 
 -- INSTANTIATION
 local rnd = random(1234)
-local M   = matrix.col_major
+local M   = matrix
 
 weights = {
   wx  = M(12,3):uniformf(-0.1, 0.1, rnd),
diff --git a/packages/basics/aprilio/binding/bind_april_io.lua.cc b/packages/basics/aprilio/binding/bind_april_io.lua.cc
index c172cea15..fe70c3df1 100644
--- a/packages/basics/aprilio/binding/bind_april_io.lua.cc
+++ b/packages/basics/aprilio/binding/bind_april_io.lua.cc
@@ -396,25 +396,6 @@ namespace AprilIO {
 
 /////////////////////////////////////////////////////////////////////////////
 
-//BIND_LUACLASSNAME OutputLuaStringStream aprilio.stream.output_lua_string
-//BIND_CPP_CLASS OutputLuaStringStream
-//BIND_SUBCLASS_OF OutputLuaStringStream StreamInterface
-
-//BIND_CONSTRUCTOR OutputLuaStringStream
-{
-  obj = new OutputLuaStringStream(L, 1);
-  LUABIND_RETURN(OutputLuaStringStream, obj);
-}
-//BIND_END
-
-//BIND_METHOD OutputLuaStringStream value
-{
-  LUABIND_INCREASE_NUM_RETURNS(obj->push(L));
-}
-//BIND_END
-
-/////////////////////////////////////////////////////////////////////////////
-
 //BIND_LUACLASSNAME CStringStream aprilio.stream.c_string
 //BIND_CPP_CLASS CStringStream
 //BIND_SUBCLASS_OF CStringStream StreamInterface
@@ -543,13 +524,13 @@ namespace AprilIO {
   if (!lua_istable(L,1)) {
     LUABIND_GET_OPTIONAL_PARAMETER(1, AuxStreamInterface<StreamInterface>, ptr, 0);
     options_pos = 2;
-    AprilUtils::LuaTableOptions options(L,2);
+    AprilUtils::LuaTable options(L,2);
   }
   else {
     options_pos = 1;
     ptr = 0;
   }
-  AprilUtils::LuaTableOptions options(L,options_pos);
+  AprilUtils::LuaTable options(L,options_pos);
   if (ptr == 0) {
     aux_lua_string = new OutputLuaStringStream(L);
     dest = aux_lua_string;
@@ -557,7 +538,7 @@ namespace AprilIO {
   else {
     dest.reset(ptr);
   }
-  obj->write(dest.get(), &options);
+  obj->write(dest.get(), options);
   if (ptr == 0) LUABIND_INCREASE_NUM_RETURNS(aux_lua_string->push(L));
 }
 //BIND_END
diff --git a/packages/basics/aprilio/c_src/buffered_stream.cc b/packages/basics/aprilio/c_src/buffered_stream.cc
index cde177be6..74e0a1b16 100644
--- a/packages/basics/aprilio/c_src/buffered_stream.cc
+++ b/packages/basics/aprilio/c_src/buffered_stream.cc
@@ -18,6 +18,8 @@
  * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  *
  */
+#include <cstdarg>
+#include <cstddef>
 #include <cstdlib>
 extern "C" {
 #include <stdint.h>
diff --git a/packages/basics/aprilio/c_src/lua_string.cc b/packages/basics/aprilio/c_src/lua_string.cc
index b562e3143..40803403e 100644
--- a/packages/basics/aprilio/c_src/lua_string.cc
+++ b/packages/basics/aprilio/c_src/lua_string.cc
@@ -143,10 +143,10 @@ namespace AprilIO {
       }
     */
     lua_pushvalue(L, pos);
+    // put string into registry to avoid garbage collection
     ref = luaL_ref(L, LUA_REGISTRYINDEX);
-    lua_rawgeti(L, LUA_REGISTRYINDEX, ref);
-    data = lua_tostring(L, -1);
-    lua_pop(L, -1);
+    // get the string pointer from the value still at stack position pos
+    data = lua_tostring(L, pos);
   }
   
   InputLuaStringStream::~InputLuaStringStream() {
diff --git a/packages/basics/aprilio/c_src/lua_string.h b/packages/basics/aprilio/c_src/lua_string.h
index c71fe1b4f..8b4469cdf 100644
--- a/packages/basics/aprilio/c_src/lua_string.h
+++ b/packages/basics/aprilio/c_src/lua_string.h
@@ -35,6 +35,9 @@ namespace AprilIO {
    * intermediate C strings.
    *
    * @note The string is generated by adding data to a @c luaL_Buffer.
+   *
+   * @note Never instantiate this in Lua, it needs a Lua stack in C to work and
+   * it is not safe to reuse the same object between different C calls from Lua.
    */
   class OutputLuaStringStream : public StreamMemory {
     lua_State *L;            ///< @c lua_State where the string is allocated.
@@ -88,7 +91,7 @@ namespace AprilIO {
     const char *data;   ///< The string pointer in C.
     size_t total_size,  ///< Length of the string.
       data_pos;         ///< Current position for read.
-  
+    
   public:
     /// Constructor from @c lua_State and the stack @c pos of the string.
     InputLuaStringStream(lua_State *L, int pos);
diff --git a/packages/basics/aprilio/c_src/serializable.h b/packages/basics/aprilio/c_src/serializable.h
index 7df0bd4a6..e2b0617ed 100644
--- a/packages/basics/aprilio/c_src/serializable.h
+++ b/packages/basics/aprilio/c_src/serializable.h
@@ -21,8 +21,8 @@
 #ifndef SERIALIZABLE_H
 #define SERIALIZABLE_H
 
-#include "generic_options.h"
 #include "error_print.h"
+#include "lua_table.h"
 #include "referenced.h"
 #include "stream.h"
 #include "unused_variable.h"
@@ -39,11 +39,11 @@ namespace AprilIO {
     
     // The read method needs to be implemented in derived classes.
     // Whatever *read(StreamInterface *dest,
-    //                const AprilUtils::GenericOptions *options);
+    //                const AprilUtils::LuaTable &options);
 
     /// Writes the object data into dest, and it could be retrieved by read.
     virtual void write(StreamInterface *dest,
-                       const AprilUtils::GenericOptions *options) = 0;
+                       const AprilUtils::LuaTable &options) = 0;
     
     /**
      * @brief Writes a Lua string which can be instantiated to get the object.
@@ -54,7 +54,7 @@ namespace AprilIO {
      * @note THIS METHOD IS A FUTURE FEATURE, IT IS NOT BEEN USED ANYWHERE.
      */
     virtual void toLuaString(StreamInterface *dest,
-                             const AprilUtils::GenericOptions *options) {
+                             const AprilUtils::LuaTable &options) {
       UNUSED_VARIABLE(dest);
       UNUSED_VARIABLE(options);
       ERROR_EXIT(128, "Unable to instantiate into a Lua string\n");
diff --git a/packages/basics/matrix/c_src/matrixFloatSet.cc b/packages/basics/base/binding/bind_base.lua.cc
similarity index 80%
rename from packages/basics/matrix/c_src/matrixFloatSet.cc
rename to packages/basics/base/binding/bind_base.lua.cc
index 3fb2e3602..0122dcba5 100644
--- a/packages/basics/matrix/c_src/matrixFloatSet.cc
+++ b/packages/basics/base/binding/bind_base.lua.cc
@@ -2,7 +2,7 @@
  * This file is part of APRIL-ANN toolkit (A
  * Pattern Recognizer In Lua with Artificial Neural Networks).
  *
- * Copyright 2013, Francisco Zamora-Martinez
+ * Copyright 2014, Francisco Zamora-Martinez
  *
  * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
  * under the terms of the GNU General Public License version 3 as
@@ -18,10 +18,12 @@
  * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  *
  */
+//BIND_HEADER_H
+#include "base.h"
+//BIND_END
 
-#include "matrixSet.h"
-
-namespace Basics {
-  template class MatrixSet<float>;
+//BIND_STATIC_CONSTRUCTOR base_static_constructor
+{
+  Base::registerGlobalLuaState(L);
 }
-
+//BIND_END
diff --git a/packages/basics/base/c_src/base.cc b/packages/basics/base/c_src/base.cc
new file mode 100644
index 000000000..13ccd13be
--- /dev/null
+++ b/packages/basics/base/c_src/base.cc
@@ -0,0 +1,42 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2014, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#include <cstdlib>
+#include <cstdio>
+#include "base.h"
+
+namespace Base {
+  static lua_State *globalL = 0;
+  
+  void registerGlobalLuaState(lua_State *L) {
+    if (globalL != 0 && globalL != L) {
+      fprintf(stderr, "FATAL ERROR: Global Lua State set twice!!!\n");
+      exit(128);
+    }
+    globalL = L;
+  }
+  lua_State *getGlobalLuaState() {
+    if (globalL == 0) {
+      fprintf(stderr, "FATAL ERROR: Global Lua State not initialized!!!\n");
+      exit(128);
+    }
+    return globalL;
+  }
+}
diff --git a/packages/basics/matrix/c_src/matrixFloatSet.h b/packages/basics/base/c_src/base.h
similarity index 81%
rename from packages/basics/matrix/c_src/matrixFloatSet.h
rename to packages/basics/base/c_src/base.h
index 0aa456b81..030a253a4 100644
--- a/packages/basics/matrix/c_src/matrixFloatSet.h
+++ b/packages/basics/base/c_src/base.h
@@ -18,15 +18,16 @@
  * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  *
  */
+#ifndef BASE_H
+#define BASE_H
 
-#ifndef MATRIXFLOATSET_H
-#define MATRIXFLOATSET_H
-
-#include "matrixFloat.h"
-#include "matrixSet.h"
+extern "C" {
+#include "lua.h"
+}
 
-namespace Basics {
-  typedef MatrixSet<float> MatrixFloatSet;
+namespace Base {
+  void registerGlobalLuaState(lua_State *L);
+  lua_State *getGlobalLuaState();
 }
 
-#endif // MATRIXFLOATSET_H
+#endif // BASE_H
diff --git a/packages/basics/base/lua_src/base.lua b/packages/basics/base/lua_src/base.lua
index 6194a1b56..d2698e374 100644
--- a/packages/basics/base/lua_src/base.lua
+++ b/packages/basics/base/lua_src/base.lua
@@ -2,13 +2,19 @@ aprilann = { _NAME = "APRIL-ANN" }
 
 make_deprecated_function = function(name, new_name, new_func)
   return function(...)
-    if new_name and new_func then
-      io.stderr:write(debug.traceback(string.format("Warning: %s is in deprecated state, use %s instead",
-                                                    name, new_name)))
+    if new_func then
+      if new_name then
+        io.stderr:write(debug.traceback(string.format("Warning: %s is in deprecated state, use %s instead",
+                                                      name, new_name)))
+      else
+        io.stderr:write(debug.traceback(string.format("Warning: %s is in deprecated state",
+                                                      name)))
+      end
       io.stderr:write("\n")
       return new_func(...)
     else
-      error(string.format("%s is in deprecated state", name))
+      error(string.format("%s is in deprecated state%s", name,
+                          new_name and (", currently it is %s"%{new_name}) or ""))
     end
   end
 end
diff --git a/packages/basics/base/package.lua b/packages/basics/base/package.lua
index 693dbecd8..c4c5d108c 100644
--- a/packages/basics/base/package.lua
+++ b/packages/basics/base/package.lua
@@ -17,8 +17,8 @@ package{ name = "base",
    target{
      name = "provide",
      depends = "init",
-     --copy{ file= "c_src/*.h", dest_dir = "include" },
-     --provide_bind{ file = "binding/bind_util.lua.cc" , dest_dir = "include" },
+     copy{ file= "c_src/*.h", dest_dir = "include" },
+     provide_bind{ file = "binding/bind_base.lua.cc" , dest_dir = "include" },
    },
    target{
      name = "test",
@@ -32,16 +32,16 @@ package{ name = "base",
      name = "build",
      depends = "provide",
      use_timestamp = true,
-     -- object{ 
-     --   file = "c_src/*.cc",
-     --   dest_dir = "build",
-     --   --       flags = "-std=c99",
-     -- },
+     object{ 
+       file = "c_src/*.cc",
+       dest_dir = "build",
+       --       flags = "-std=c99",
+     },
      luac{
        orig_dir = "lua_src",
        dest_dir = "build",
      },
-     --build_bind{ file = "binding/bind_util.lua.cc", dest_dir = "build" },
+     build_bind{ file = "binding/bind_base.lua.cc", dest_dir = "build" },
    },
    target{
      name = "document",
diff --git a/packages/basics/complex/binding/bind_complex.lua.cc b/packages/basics/complex/binding/bind_complex.lua.cc
index e0ffa4429..feb9d3311 100644
--- a/packages/basics/complex/binding/bind_complex.lua.cc
+++ b/packages/basics/complex/binding/bind_complex.lua.cc
@@ -19,6 +19,7 @@
  *
  */
 //BIND_HEADER_C
+#include "lua_table.h"
 #include "luabindutil.h"
 #include "luabindmacros.h"
 
@@ -56,6 +57,25 @@ void lua_pushComplexF(lua_State *L, const ComplexF &number) {
   LuaComplexFNumber *obj = new LuaComplexFNumber(number);
   lua_pushLuaComplexFNumber(L, obj);
 }
+
+namespace AprilUtils {
+  template<> AprilMath::ComplexF LuaTable::
+  convertTo<AprilMath::ComplexF>(lua_State *L, int idx) {
+    return lua_toComplexF(L, idx);
+  }
+  
+  template<> void LuaTable::
+  pushInto<const AprilMath::ComplexF &>(lua_State *L,
+                                        const AprilMath::ComplexF &value) {
+    lua_pushComplexF(L, value);
+  }
+
+  template<> bool LuaTable::
+  checkType<AprilMath::ComplexF>(lua_State *L, int idx) {
+    return lua_isComplexF(L, idx);
+  }
+}
+
 //BIND_END
 
 //BIND_HEADER_H
diff --git a/packages/basics/complex/c_src/complex_number.h b/packages/basics/complex/c_src/complex_number.h
index ee52e26e8..c58134452 100644
--- a/packages/basics/complex/c_src/complex_number.h
+++ b/packages/basics/complex/c_src/complex_number.h
@@ -28,7 +28,12 @@
 
 #include <cmath>
 
+#ifndef NAN
+#define NAN sqrtf(-1.0f)
+#endif
+
 #include "constString.h"
+#include "lua_table.h"
 #include "error_print.h"
 #include "referenced.h"
 
@@ -37,10 +42,6 @@
 #undef UNDEF_MATH_DEFINES
 #endif
 
-#ifndef NAN
-#define NAN sqrtf(-1.0f)
-#endif
-
 #define REAL_IDX 0
 #define IMG_IDX  1
 
@@ -198,7 +199,6 @@ namespace AprilMath {
   typedef Complex<float> ComplexF;
   typedef Complex<double> ComplexD;
 
-
   class LuaComplexFNumber : public Referenced {
   public:
     
@@ -291,6 +291,18 @@ namespace AprilMath {
 namespace AprilUtils {
   void aprilPrint(const AprilMath::ComplexF &v);
   void aprilPrint(const AprilMath::ComplexD &v);
+
+  ////////////////////////////////////////////////////////////////////////////
+  
+  template<> AprilMath::ComplexF LuaTable::
+  convertTo<AprilMath::ComplexF>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<const AprilMath::ComplexF &>(lua_State *L,
+                                        const AprilMath::ComplexF &value);
+
+  template<> bool LuaTable::
+  checkType<AprilMath::ComplexF>(lua_State *L, int idx);
 }
 
 #endif // COMPLEX_NUMBER_H
diff --git a/packages/basics/dataset/binding/bind_dataset.lua.cc b/packages/basics/dataset/binding/bind_dataset.lua.cc
index 7aca53bdb..c0cec8eac 100644
--- a/packages/basics/dataset/binding/bind_dataset.lua.cc
+++ b/packages/basics/dataset/binding/bind_dataset.lua.cc
@@ -67,8 +67,8 @@ namespace Basics {
     }
     lua_pushnumber(L,index);
     int ps = obj->patternSize();
-    Token *tk = obj->getPattern(index-1); // ojito que le RESTAMOS uno
-    lua_pushToken(L,tk);
+    AprilUtils::SharedPtr<Token> tk( obj->getPattern(index-1) ); // ojito que le RESTAMOS uno
+    lua_pushAuxToken(L,tk);
     return 2;
   }
 
@@ -1181,8 +1181,8 @@ LUABIND_ERROR("use constructor methods: matrix, etc.");
   LUABIND_GET_PARAMETER(1,int,index);
   if (index < 1 || index > obj->numPatterns())
     LUABIND_ERROR("index out of range");
-  Token *token = obj->getPattern(index-1); // ojito que le RESTAMOS uno
-  LUABIND_RETURN(Token, token);
+  AprilUtils::SharedPtr<Token> token( obj->getPattern(index-1) ); // ojito que le RESTAMOS uno
+  LUABIND_RETURN(AuxToken, token);
 }
 //BIND_END
 
@@ -1195,24 +1195,24 @@ LUABIND_ERROR("use constructor methods: matrix, etc.");
   LUABIND_TABLE_GETN(1,bunch_size);
   indexes = new int[bunch_size];
   LUABIND_TABLE_TO_VECTOR_SUB1(1,uint,indexes,bunch_size);
-  Token *token = obj->getPatternBunch(indexes,bunch_size);
+  AprilUtils::SharedPtr<Token> token( obj->getPatternBunch(indexes,bunch_size) );
   delete[] indexes;
-  LUABIND_RETURN(Token, token);
+  LUABIND_RETURN(AuxToken, token);
 }
 //BIND_END
 
 //BIND_METHOD DataSetToken putPattern
 {
   int index;
-  Token *pattern;
+  AprilUtils::SharedPtr<Token> pattern;
   LUABIND_CHECK_ARGN(==,2);
   LUABIND_CHECK_PARAMETER(1, int);
-  LUABIND_CHECK_PARAMETER(2, Token);
+  LUABIND_CHECK_PARAMETER(2, AuxToken);
   LUABIND_GET_PARAMETER(1,int,index);
-  LUABIND_GET_PARAMETER(2,Token,pattern);
+  LUABIND_GET_PARAMETER(2,AuxToken,pattern);
   if (index < 1 || index > obj->numPatterns())
     LUABIND_ERROR("index out of range");
-  obj->putPattern(index-1, pattern); // ojito que le RESTAMOS uno
+  obj->putPattern(index-1, pattern.get()); // ojito que le RESTAMOS uno
 }
 //BIND_END
 
@@ -1220,15 +1220,15 @@ LUABIND_ERROR("use constructor methods: matrix, etc.");
 {
   unsigned int bunch_size;
   int *indexes;
-  Token *pattern;
+  AprilUtils::SharedPtr<Token> pattern;
   LUABIND_CHECK_ARGN(==,2);
   LUABIND_CHECK_PARAMETER(1, table);
-  LUABIND_CHECK_PARAMETER(2, Token);
-  LUABIND_GET_PARAMETER(2,Token,pattern);
+  LUABIND_CHECK_PARAMETER(2, AuxToken);
+  LUABIND_GET_PARAMETER(2,AuxToken,pattern);
   LUABIND_TABLE_GETN(1,bunch_size);
   indexes = new int[bunch_size];
   LUABIND_TABLE_TO_VECTOR_SUB1(1,uint,indexes,bunch_size);
-  obj->putPatternBunch(indexes,bunch_size,pattern);
+  obj->putPatternBunch(indexes,bunch_size,pattern.get());
   delete[] indexes;
 }
 //BIND_END
@@ -1300,10 +1300,10 @@ LUABIND_ERROR("use constructor methods: matrix, etc.");
 //BIND_METHOD DataSetTokenVector push_back
 {
   LUABIND_CHECK_ARGN(==, 1);
-  LUABIND_CHECK_PARAMETER(1, Token);
-  Token *token;
-  LUABIND_GET_PARAMETER(1, Token, token);
-  obj->push_back(token);
+  LUABIND_CHECK_PARAMETER(1, AuxToken);
+  AprilUtils::SharedPtr<Token> token;
+  LUABIND_GET_PARAMETER(1, AuxToken, token);
+  obj->push_back(token.get());
 }
 //BIND_END
 
diff --git a/packages/basics/dataset/c_src/datasetToken.h b/packages/basics/dataset/c_src/datasetToken.h
index c7d31e0b1..5e9724c32 100644
--- a/packages/basics/dataset/c_src/datasetToken.h
+++ b/packages/basics/dataset/c_src/datasetToken.h
@@ -56,7 +56,7 @@ namespace Basics {
         // FIXME: Check this shape to be consistent when getPattern() returns a multi-dimensional matrix.
         int dims[2]   = { static_cast<int>(bunch_size),
                           patternSize() };
-        MatrixFloat *output_mat = new MatrixFloat(2, dims, CblasColMajor);
+        MatrixFloat *output_mat = new MatrixFloat(2, dims);
         IncRef(output_mat);
         TokenMatrixFloat *output_mat_token  = new TokenMatrixFloat(output_mat);
         output           = output_mat_token;
@@ -214,7 +214,7 @@ namespace Basics {
     DataSetFloat2TokenWrapper(DataSetFloat *ds) :
       ds(ds) {
       int dims[2] = { 1, ds->patternSize() };
-      aux_mat = new MatrixFloat(2, dims, CblasColMajor);
+      aux_mat = new MatrixFloat(2, dims);
 #ifdef USE_CUDA
       aux_mat->setUseCuda(false);
 #endif
@@ -224,7 +224,7 @@ namespace Basics {
     int patternSize() { return ds->patternSize(); }
     Token *getPattern(int index) {
       int dims[2] = { 1, patternSize() };
-      MatrixFloat *mat = new MatrixFloat(2, dims, CblasColMajor);
+      MatrixFloat *mat = new MatrixFloat(2, dims);
       TokenMatrixFloat *token = new TokenMatrixFloat(mat);
       AprilMath::FloatGPUMirroredMemoryBlock *mem_block = mat->getRawDataAccess();
       float *mem_ptr = mem_block->getPPALForWrite();
@@ -234,7 +234,7 @@ namespace Basics {
     Token *getPatternBunch(const int *indexes, unsigned int bunch_size) {
       int dims[2], major_dim=0;
       dims[0] = static_cast<int>(bunch_size); dims[1] = patternSize();
-      MatrixFloat *mat = new MatrixFloat(2, dims, CblasColMajor);
+      MatrixFloat *mat = new MatrixFloat(2, dims);
 #ifdef USE_CUDA
       bool old_use_cuda = mat->getCudaFlag();
       mat->setUseCuda(false);
diff --git a/packages/basics/iterator/lua_src/iterator.lua b/packages/basics/iterator/lua_src/iterator.lua
new file mode 100644
index 000000000..ce353cb81
--- /dev/null
+++ b/packages/basics/iterator/lua_src/iterator.lua
@@ -0,0 +1,545 @@
+--[[
+  
+  Copyright (c) 2014 Francisco Zamora-Martinez (pakozm@gmail.com)
+  
+  Permission is hereby granted, free of charge, to any person obtaining a copy
+  of this software and associated documentation files (the "Software"), to deal
+  in the Software without restriction, including without limitation the rights
+  to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+  copies of the Software, and to permit persons to whom the Software is
+  furnished to do so, subject to the following conditions:
+  
+  The above copyright notice and this permission notice shall be included in all
+  copies or substantial portions of the Software.
+  
+  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+  IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+  FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+  AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+  LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+  OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+  IN THE SOFTWARE.
+
+]]
+
+-- Detect if APRIL-ANN is available.
+local type = type
+local aprilann_available = (aprilann ~= nil)
+if aprilann_available then type = luatype or type end
+--
+local class = class or require "oop-iter.class"
+
+--------------------------------
+-- iterator module definition --
+--------------------------------
+local iterator,iterator_methods = class("iterator")
+iterator._NAME = "iterator"
+iterator._VERSION = "0.1"
+
+local concat = table.concat
+local insert = table.insert
+local pack = table.pack
+local remove = table.remove
+local unpack = table.unpack
+local wrap = coroutine.wrap
+local yield = coroutine.yield
+
+-- Clones the function and its upvalues. `seen` (internal) maps originals to clones.
+local function clone_function(func, seen)
+  seen = seen or {}
+  if seen[func] then return seen[func] end
+  -- clone by using a string dump; loadstring was replaced by load in Lua 5.2+
+  local ok,func_dump = pcall(string.dump, func)
+  local func_clone = (ok and (loadstring or load)(func_dump)) or func
+  seen[func] = func_clone
+  if func_clone ~= func then
+    for i=1,math.huge do -- copy upvalues until debug.getupvalue runs out
+      local name,value = debug.getupvalue(func,i)
+      if not name then break end
+      -- TODO: implement clone (deep copy) of tables
+      if type(value) == "function" then value = clone_function(value, seen) end
+      debug.setupvalue(func_clone, i, value)
+    end
+  end
+  return func_clone
+end
+
+-- Wraps the Lua iterator (f, s, v) so that only the iteration steps accepted
+-- by predicate_func are produced. The predicate is called as
+-- predicate_func(...), where ... are the values returned by one step of f; the
+-- step is kept when the result is true and skipped otherwise.
+local function filter(predicate_func, f, s, v)
+  local function next_accepted(state, control)
+    while true do
+      local step = pack(f(state, control))
+      control = step[1]
+      if control == nil or predicate_func(unpack(step)) then return unpack(step) end
+    end
+  end
+  return next_accepted, s, v
+end
+
+-- Iterable map function, receives a map function and a Lua iterator and returns
+-- another Lua iterator function. The map function is called as f(...) where
+-- ... are the values returned by the iterator function. Multiple results are
+-- possible from one map call using coroutine.yield function.
+--
+-- @note FROM: http://www.corsix.org/content/mapping-and-lua-iterators
+local function map(map_func, f, s, v)
+  local done
+  local function maybeyield(...)
+    if ... ~= nil then
+      yield(...)
+    end
+  end
+  local function domap(...)
+    v = ...
+    if v ~= nil then
+      return maybeyield(map_func(...))
+    else
+      done = true
+    end
+  end
+  return wrap(function()
+      repeat
+        local tmp = pack(f(s,v))
+        v = tmp[1]
+        domap(unpack(tmp))
+      until done
+  end), s, v
+end
+
+-- Folds a Lua iterator (f, s, v) into a single value. Starting from
+-- initial_value (which must not be nil), every iteration step replaces the
+-- accumulator by reduce_func(acc, ...), where ... are the values produced by
+-- that step. Returns the final accumulator.
+local function reduce(reduce_func, initial_value, f, s, v)
+  assert(initial_value ~= nil,
+         "reduce: needs an initial_value as second argument")
+  local acc = initial_value
+  while true do
+    local step = pack(f(s, v))
+    if step[1] == nil then return acc end
+    acc = reduce_func(acc, unpack(step))
+    v = step[1]
+  end
+end
+
+-- Consumes the Lua iterator (f, s, v), calling apply_func(...) with the values
+-- of every iteration step. Without apply_func the iterator is just exhausted.
+local function apply(apply_func, f, s, v)
+  apply_func = apply_func or function() end
+  while true do
+    local step = pack(f(s, v))
+    if step[1] == nil then return end
+    apply_func(unpack(step))
+    v = step[1]
+  end
+end
+
+--------------------------------------------------------------------
+--------------------------------------------------------------------
+--------------------------------------------------------------------
+
+-- Function generators
+
+-- Range iterator, receives start,stop,step. A negative step counts downwards.
+function iterator.range(...)
+  local arg = pack(...)
+  local start,stop,step = arg[1],arg[2],arg[3] or 1
+  if not stop then start,stop=1,start end
+  local i = start - step
+  return iterator(function(step, i)
+      if step and i then
+        i = i + step
+        if (step >= 0 and i <= stop) or (step < 0 and i >= stop) then return i end
+      end
+  end, step, i)
+end
+
+-- Duplicates its arguments in an infinite iterator.
+function iterator.duplicate(...)
+  return iterator(function(arg) return unpack(arg) end, pack(...))
+end
+
+-- Returns an infinite iterator which calls the given function with: f(0), f(1),
+-- ..., f(i), ...
+function iterator.tabulate(func)
+  local x=-1
+  return iterator(function() x=x+1 return func(x) end)
+end
+
+-- Returns a zero indefinitely.
+function iterator.zeros()
+  return iterator(function() return 0 end)
+end
+
+-- Returns a one indefinitely.
+function iterator.ones()
+  return iterator(function() return 1 end)
+end
+
+-- Returns an iterator over multiple iterators at the same time. The iteration
+-- ends if any of the given iterators end.
+function iterator.zip(...)
+  local arg = { ... }
+  for i=1,#arg do assert(class.is_a(arg[i], iterator),
+                         "Needs instances of iterator class") end
+  local finished = false
+  return iterator(function()
+      if finished then return nil end
+      local result = {}
+      for i=1,#arg do
+        local partial = table.pack( arg[i]() )
+        if not partial[1] then finished=true return nil end
+        for k,v in ipairs(partial) do table.insert(result,v) end
+      end
+      return table.unpack(result)
+  end)
+end
+
+--------------------------------------------------------------------
+--------------------------------------------------------------------
+--------------------------------------------------------------------
+
+-- Constructor of class iterator. It is a wrapper around a Lua iterator
+-- function, which allow to keep the iterator state, allowing to write easy
+-- functional operations (map, reduce, filter, ...).
+function iterator:constructor(f, s, v)
+  if class.is_a(f, iterator) then
+    assert(not s and not v, "Given s and v parameters with an iterator object")
+    f,s,v = f:get()
+  elseif type(f) == "table" then
+    if #f == 0 then f,s,v = iterator(pairs(f)):select(2):get()
+    else f,s,v = iterator(ipairs(f)):select(2):get()
+    end    
+  end
+  self.f,self.s,self.v = f,s,v
+end
+
+-- Returns the underlying Lua iterator.
+function iterator_methods:get() return self.f,self.s,self.v end
+
+-- Performs one iterator step, and returns its result.
+function iterator_methods:step()
+  local tmp = pack( self.f(self.s, self.v) )
+  self.v = tmp[1]
+  return unpack(tmp)
+end
+
+-- Equivalent to step() method, allowing to use iterator objects as Lua
+-- iterators in generic for loops.
+function iterator.meta_instance:__call() return self:step() end
+
+-- Map method, a wrapper around map function. Multiple results are possible
+-- from one map call using coroutine.yield function.
+function iterator_methods:map(func)
+  return iterator(map(func, self:get()))
+end
+
+-- Filter method, a wrapper around filter function.
+function iterator_methods:filter(func)
+  return iterator(filter(func, self:get()))
+end
+
+-- Apply method, a wrapper around apply function.
+function iterator_methods:apply(func)
+  apply(func, self:get())
+end
+
+-- Reduce method, a wrapper around reduce function.
+function iterator_methods:reduce(func, initial_value)
+  return reduce(func, initial_value, self:get())
+end
+
+-- Enumerate method, returns another iterator object which appends as a first
+-- element of every iteration a enumeration number.
+function iterator_methods:enumerate()
+  local id = 0
+  return self:map(function(...)
+      id = id + 1
+      return id, ...
+  end)
+end
+
+-- Calls a function for every iteration value. The function is a name, and this
+-- name must be declared in every iteration value (as table keys, or in its
+-- metatable).
+function iterator_methods:call(funcname, ...)
+  local func_args = pack(...)
+  return self:map(function(...)
+      local arg    = pack(...)
+      local result = {}
+      for i=1,#arg do
+        local t = pack(arg[i][funcname](arg[i],unpack(func_args)))
+        for j=1,#t do insert(result, t[j]) end
+      end
+      return unpack(result)
+  end)
+end
+
+-- Performs a nested iteration over every result. It receives a Lua function
+-- which returns an iterator (as ipairs, pairs, ...)
+function iterator_methods:iterate(iterator_func)
+  return self:map(function(...)
+      local f,s,v = iterator_func(...)
+      local tmp   = pack(f(s,v))
+      while tmp[1] ~= nil do
+        yield(unpack(tmp))
+        tmp = pack(f(s,tmp[1]))
+      end
+  end)
+end
+
+-- Concats the iterator results: sep1 joins the values returned by a single
+-- iteration step, sep2 (defaults to sep1) joins the successive steps.
+function iterator_methods:concat(sep1,sep2)
+  local sep1,sep2 = sep1 or "",sep2 or sep1 or ""
+  local t = {}
+  self:apply(function(...)
+      -- one string per iteration step; concat already returns a string
+      insert(t, concat(pack(...), sep1))
+  end)
+  return concat(t, sep2)
+end
+
+-- Indexes iteration result by a given set of indices. It assumes that all
+-- the elements in the iterator result are tables.
+function iterator_methods:field(...)
+  local f,s,v = self:get()
+  local arg   = pack(...)
+  return iterator(function(s)
+      local tmp = pack(f(s,v))
+      if tmp[1] == nil then return nil end
+      v = tmp[1]
+      local ret = { }
+      for i=1,#tmp do
+        for j=1,#arg do
+          insert(ret, tmp[i][arg[j]])
+        end
+      end
+      return unpack(ret)
+		  end,
+    s,v)
+end
+
+-- Selects an iteration result by a given set of number indices.
+function iterator_methods:select(...)
+  local f,s,v = self:get()
+  local arg   = pack(...)
+  for i=1,#arg do arg[i]=tonumber(arg[i]) assert(arg[i],"select: expected a number") end
+  return iterator(function(s)
+      local tmp = pack(f(s,v))
+      if tmp[1] == nil then return nil end
+      v = tmp[1]
+      local selected = {}
+      for i=1,#arg do selected[i] = tmp[arg[i]] end
+      return unpack(selected)
+		  end,
+    s,v)
+end
+
+-- Stores the iteration into a table. If every iteration has more than one
+-- result, the first element will be used as key, otherwise, an enumerated
+-- key will be used.
+function iterator_methods:table()
+  local t = {}
+  local idx = 1
+  self:apply(function(...)
+      local v = pack(...)
+      local k = remove(v, 1)
+      if #v == 0 then
+        k,v = idx,k
+      elseif #v == 1 then
+        v = v[1]
+      end
+      t[k] = v
+      idx = idx + 1
+  end)
+  return t
+end
+
+-- Returns the iterator result at nth position.
+function iterator_methods:nth(nth)
+  for i=1,nth-1 do
+    if not self() then break end
+  end
+  return self()
+end
+
+-- Returns the head of the iterator.
+function iterator_methods:head()
+  return self:nth(1)
+end
+
+-- Returns the tail of the iterator.
+function iterator_methods:tail()
+  self() -- skip first value
+  return self
+end
+
+-- Returns the first n elements of the iterator, or (when n is a predicate)
+-- the leading elements up to the first one which does not satisfy it.
+function iterator_methods:take(n)
+  if type(n) == "number" then
+    local i=0
+    return iterator(function() if i < n then i=i+1 return self() end end)
+  else
+    local satisfied = true
+    return iterator(function()
+        if satisfied then
+          local result = pack( self() )
+          if result[1] == nil or not n( unpack(result) ) then
+            satisfied = false -- exhausted or rejected: never step self again
+          else
+            return unpack( result )
+          end
+        end
+    end)
+  end
+end
+
+-- Skips the first n elements of the iterator, or (when n is a predicate) the
+-- leading elements which satisfy it; stops safely if the iterator runs out.
+function iterator_methods:drop(n)
+  if type(n) == "number" then
+    for i=1,n do
+      if not self() then break end
+    end
+    return self
+  else
+    local result
+    repeat result = pack(self()) until result[1] == nil or not n( unpack(result) )
+    return iterator(function()
+        local aux = result
+        if aux[1] ~= nil then result = pack( self() ) end
+        return unpack(aux)
+    end)
+  end
+end
+
+-- Splits an iterator into two iterators, only works with pure functional
+-- iterators.
+function iterator_methods:split(n)
+  return self:clone():take(n),self:clone():drop(n)
+end
+
+-- Only works properly with pure functional iterators.
+function iterator_methods:clone()
+  local f,s,v = self:get()
+  local f = clone_function(f)
+  return iterator(f,s,v)
+end
+
+-- Returns the position of the first iterator index which is equals to the given
+-- arguments.
+function iterator_methods:index(...)
+  local arg = pack(...)
+  local idx=0
+  while true do
+    idx=idx+1
+    local current = pack(self()) if not current[1] then break end
+    assert(#current == #arg, "Incorrect number of arguments")
+    local eq = true
+    for j=1,#current do
+      if current[j] ~= arg[j] then eq = false break end
+    end
+    if eq then return idx end
+  end
+  return nil
+end
+
+-- Returns an iterator to positions which are equal to the given arguments.
+function iterator_methods:indices(...)
+  local arg = pack(...)
+  return iterator(function(self, idx)
+      while true do
+        idx = idx+1
+        local current = pack(self()) if not current[1] then break end
+        local eq = true
+        for j=1,#current do
+          if current[j] ~= arg[j] then eq = false break end
+        end
+        if eq then return idx end
+      end
+                  end, self, 0)
+end
+
+-- Filters by using a regular expression.
+function iterator_methods:grep(regexp_string)
+  assert(type(regexp_string) == "string", "Only valid with string values")
+  return self:filter(function(str,...)
+      assert(not ..., "Only valid for unary iterators")
+      assert(type(str) == "string", "Only valid with string values")
+      return str:find(regexp_string) ~= nil
+  end)
+end
+
+-- Returns two iterators where elements do and not do satisfy the given
+-- predicate.
+function iterator_methods:partition(pred)
+  return self:clone():filter(pred),
+  self:clone():filter(function(...) return not pred(...) end)
+end
+
+-- Returns the number of remaining iteration steps, counted by running the
+-- underlying Lua iterator to its end.
+function iterator_methods:size()
+  return self:reduce(function(acc) return acc + 1 end, 0)
+end
+
+-- Returns true if all return values satisfy the predicate.
+function iterator_methods:all(pred)
+  return self:reduce(function(acc,...) return acc and pred(...) end, true)
+end
+
+-- Returns true if at least one return value satisfies the predicate.
+function iterator_methods:any(pred)
+  return self:reduce(function(acc,...) return acc or pred(...) end, false)
+end
+
+-- Returns the sum.
+function iterator_methods:sum()
+  return self:reduce(function(a,b) return a+b end, 0)
+end
+
+-- Returns the product.
+function iterator_methods:prod()
+  return self:reduce(function(a,b) return a*b end, 1)
+end
+
+-- Returns the max.
+function iterator_methods:max()
+  return self:reduce(math.max, -math.huge)
+end
+
+-- Returns the min.
+function iterator_methods:min()
+  return self:reduce(math.min, math.huge)
+end
+
+-- In APRIL-ANN this module is defined at global environment
+if aprilann_available then
+  _G.apply = apply
+  _G.iterator = iterator
+  _G.iterable_filter = filter
+  _G.iterable_map = map
+  _G.range = iterator.range
+  _G.reduce = reduce
+end
+
+-- UNIT TEST
+function iterator.test()
+  for k,v in filter(function(k,v) return v % 2 == 0 end, ipairs{1,2,3,4}) do
+    assert(v % 2 == 0)
+  end
+  for k,v in map(function(k,v) return k,k+v end, ipairs{1,2,3,4}) do
+    assert(v == 2*k)
+  end
+  local r = reduce(function(acc,a,b,c) return acc+a+b+c end, 0, map(function(k,v) return k,v,v end, ipairs{1,2,3,4}))
+  assert(r == 3 + 6 + 9 + 12)
+  apply(function(a,b,c) assert(a==b and b==c) end,
+    map(function(k,v) return k,v,v end, ipairs{1,2,3,4}))
+end
+
+return iterator
diff --git a/packages/basics/iterator/package.lua b/packages/basics/iterator/package.lua
new file mode 100644
index 000000000..746d669b5
--- /dev/null
+++ b/packages/basics/iterator/package.lua
@@ -0,0 +1,53 @@
+package{ name = "iterator",
+   version = "1.0",
+   depends = { "base", "class" },
+   keywords = { },
+   description = "",
+   -- targets as in ant
+   target{
+     name = "init",
+     mkdir{ dir = "build" },
+     mkdir{ dir = "include" },
+   },
+   target{ 
+     name = "clean",
+     delete{ dir = "build" },
+     delete{ dir = "include" },
+   },
+   target{
+     name = "provide",
+     depends = "init",
+     --copy{ file= "c_src/*.h", dest_dir = "include" },
+     --provide_bind{ file = "binding/bind_util.lua.cc" , dest_dir = "include" },
+   },
+   target{
+     name = "test",
+     lua_unit_test{
+       file={
+	 "test/test-iterator.lua",
+       },
+     },
+   },
+   target{
+     name = "build",
+     depends = "provide",
+     use_timestamp = true,
+     -- object{ 
+     --   file = "c_src/*.cc",
+     --   dest_dir = "build",
+     --   --       flags = "-std=c99",
+     -- },
+     luac{
+       orig_dir = "lua_src",
+       dest_dir = "build",
+     },
+     --build_bind{ file = "binding/bind_util.lua.cc", dest_dir = "build" },
+   },
+   target{
+     name = "document",
+     document_src{
+     },
+     document_bind{
+     },
+   },
+ }
diff --git a/packages/basics/iterator/test/test-iterator.lua b/packages/basics/iterator/test/test-iterator.lua
new file mode 100644
index 000000000..205631c29
--- /dev/null
+++ b/packages/basics/iterator/test/test-iterator.lua
@@ -0,0 +1,57 @@
+local check = utest.check
+local T = utest.test
+-- reduce
+T("ReduceTest", function()
+    check.eq(iterator(ipairs({4,2,1,10})):reduce(math.min, math.huge), 1)
+    check.eq(iterator(string.gmatch("01101",".")):reduce(function(acc,v)return acc*2+v end, 0), 13)
+end)
+-- map
+T("MapTest", function()
+    check.eq(iterator(ipairs({1,2,3,4})):map(function(i,v) return v*2 end):concat(" "),
+             "2 4 6 8")
+end)
+-- filter
+T("FilterTest", function()
+    check.eq(iterator(ipairs{1,2,3,4,5,6,7}):filter(function(i,v) return v%2==0 end):map(function(i,v)return v end):concat(" "),
+             "2 4 6")
+end)
+
+T("IterableMapTest", function()
+    local t = { Lemon = "sour", Cake = "nice", }
+    local expected = {
+      ["lemon is slightly SOUR"]=0,
+      ["cake is slightly NICE"]=0,
+    }
+    for ingredient, modifier, taste in iterator(pairs(t)):map(function(a, b)
+        return a:lower(),"slightly",b:upper()
+    end) do
+      local str = ingredient .." is ".. modifier .. " " .. taste
+      check.eq(expected[str], 0)
+      expected[str] = expected[str] + 1
+    end
+
+    local t = { Lemon = "sour", Cake = "nice", }
+    local expected = {
+      ["cake is very NICE"]=0,
+      ["Cake is slightly nice"]=0,
+      ["lemon is very SOUR"]=0,
+      ["Lemon is slightly sour"]=0,
+    }
+    for ingredient, modifier, taste in iterator(pairs(t)):map(function(a, b)
+        coroutine.yield(a:lower(),"very",b:upper())
+        return a, "slightly", b
+    end) do
+      local str = ingredient .." is ".. modifier .. " " .. taste
+      check.eq(expected[str], 0)
+      expected[str] = expected[str] + 1
+    end
+
+    local idx=1
+    local expected={2,4,6}
+    for v in iterator(ipairs{1,2,3,4,5,6,7}):filter(function(key,value) return value%2==0 end) do
+      check.eq(v, expected[idx])
+      idx=idx+1
+    end
+    
+    for k,v in iterator(ipairs{1,2,3}) do check.eq(k, v) end
+end)
diff --git a/packages/basics/mathcore/c_src/cblas_headers.h b/packages/basics/mathcore/c_src/cblas_headers.h
index f12327932..6e46fd3bf 100644
--- a/packages/basics/mathcore/c_src/cblas_headers.h
+++ b/packages/basics/mathcore/c_src/cblas_headers.h
@@ -373,9 +373,9 @@ namespace AprilMath {
   /**
    * @brief Template wrapper for sparse MM operation.
    *
-   * SparseMM computes op(C) = alpha * op(A) * op(B) + beta * C where A is a
+   * SparseMM computes C = alpha * op(A) * op(B) + beta * C where A is a
    * sparse matrix given in CSR or CSC formats, B and C are dense matrices, op
-   * is tranposition operator, and alpha and beta are scalars. op(C) is a matrix
+   * is transposition operator, and alpha and beta are scalars. C is a matrix
    * with MxN size. op(A) will be MxK and op(B) will be KxN.
    *
    * @see Basics::SparseMatrix class documentation.
@@ -387,7 +387,6 @@ namespace AprilMath {
    * @param sparse_format - The format can be CSR_FORMAT or CSC_FORMAT.
    * @param a_transpose - Indicates if A matrix must be transposed.
    * @param b_transpose - Indicates if B matrix must be transposed.
-   * @param c_transpose - Indicates if C matrix must be transposed.
    * @param m - The number of rows in C.
    * @param n - The number of columns in C.
    * @param k - The common dimension for A and B.
@@ -409,7 +408,6 @@ namespace AprilMath {
                   SPARSE_FORMAT sparse_format,
                   CBLAS_TRANSPOSE a_transpose,
                   CBLAS_TRANSPOSE b_transpose,
-                  CBLAS_TRANSPOSE c_transpose,
                   int m,
                   int n,
                   int k,
diff --git a/packages/basics/mathcore/c_src/cmath_overloads.h b/packages/basics/mathcore/c_src/cmath_overloads.h
index 78df0cb1e..2e41f033b 100644
--- a/packages/basics/mathcore/c_src/cmath_overloads.h
+++ b/packages/basics/mathcore/c_src/cmath_overloads.h
@@ -576,35 +576,31 @@ namespace AprilMath {
     /// Less than comparison.
     template<typename T>
     struct m_lt {
-      /// Returns @c T(1.0f) or @c T(0.0f) depending in @c a<b
-      APRIL_CUDA_EXPORT T operator()(const T &a, const T &b) const {
-        if (a < b) return T(1.0f);
-        else return T(0.0f);
+      /// Returns @c true or @c false depending in @c a<b
+      APRIL_CUDA_EXPORT bool operator()(const T &a, const T &b) const {
+        return a < b;
       }
     };
     
     /// Greater than comparison.
     template<typename T>
     struct m_gt {
-      /// Returns @c T(1.0f) or @c T(0.0f) depending in @c b<a
-      APRIL_CUDA_EXPORT T operator()(const T &a, const T &b) const {
-        if (b < a) return T(1.0f);
-        else return T(0.0f);
+      /// Returns @c true or @c false depending on @c b<a
+      APRIL_CUDA_EXPORT bool operator()(const T &a, const T &b) const {
+        return b < a;
       }
     };
     
     /// Equals comparison.
     template<typename T>
     struct m_eq {
-      /// Returns @c T(1.0f) or @c T(0.0f) depending in @c b=a
-      APRIL_CUDA_EXPORT T operator()(const T &a, const T &b) const {
+      /// Returns @c true or @c false depending on @c b==a (two NaN values compare equal)
+      APRIL_CUDA_EXPORT bool operator()(const T &a, const T &b) const {
         if (AprilMath::m_isnan(a)) {
-          if (AprilMath::m_isnan(b)) return T(1.0f);
-          else return T(0.0f);
+          return AprilMath::m_isnan(b);
         }
         else {
-          if (a == b) return T(1.0f);
-          else return T(0.0f);
+          return (a == b);
         }
       }
     };
@@ -731,13 +727,13 @@ namespace AprilMath {
   T m_relu(const T &a) { return Functors::m_relu<T>()(a); }
   /// @see Functors::m_lt
   template<typename T> APRIL_CUDA_EXPORT
-  T m_lt(const T &a, const T &b) { return Functors::m_lt<T>()(a,b); }
+  bool m_lt(const T &a, const T &b) { return Functors::m_lt<T>()(a,b); }
   /// @see Functors::m_gt
   template<typename T> APRIL_CUDA_EXPORT
-  T m_gt(const T &a, const T &b) { return Functors::m_gt<T>()(a,b); }
+  bool m_gt(const T &a, const T &b) { return Functors::m_gt<T>()(a,b); }
   /// @see Functors::m_eq
   template<typename T> APRIL_CUDA_EXPORT
-  T m_eq(const T &a, const T &b) { return Functors::m_eq<T>()(a,b); }
+  bool m_eq(const T &a, const T &b) { return Functors::m_eq<T>()(a,b); }
   /// @see Functors::m_relative_equals
   template<typename T> APRIL_CUDA_EXPORT
   bool m_relative_equals(const T &a, const T &b, const float &c) { return Functors::m_relative_equals<T>()(a,b,c); }
@@ -764,9 +760,8 @@ namespace AprilMath {
     template<typename T>
     struct m_neq {
       /// It uses AprilMath::m_eq function.
-      APRIL_CUDA_EXPORT T operator()(const T &a, const T &b) {
-        if (AprilMath::m_eq(a,b) == T(1.0f)) return T(0.0f);
-        else return T(1.0f);
+      APRIL_CUDA_EXPORT bool operator()(const T &a, const T &b) {
+        return !(AprilMath::m_eq(a,b));
       }
     };
     
@@ -834,7 +829,7 @@ namespace AprilMath {
   
   /// @see Functors::m_neq
   template<typename T> APRIL_CUDA_EXPORT
-  T m_neq(const T &a, const T &b) { return Functors::m_neq<T>()(a,b); }
+  bool m_neq(const T &a, const T &b) { return Functors::m_neq<T>()(a,b); }
   /// @see Functors::m_logistic
   template<typename T> APRIL_CUDA_EXPORT
   T m_logistic(const T &a) { return Functors::m_logistic<T>()(a); }
@@ -1225,7 +1220,7 @@ namespace AprilMath {
   struct m_curried_lt {
     const T value;
     m_curried_lt(const T &value) : value(value) { }
-    APRIL_CUDA_EXPORT T operator()(const T &a) {
+    APRIL_CUDA_EXPORT bool operator()(const T &a) {
       return AprilMath::m_lt(a, value);
     }
   };
@@ -1234,7 +1229,7 @@ namespace AprilMath {
   struct m_curried_gt {
     const T value;
     m_curried_gt(const T &value) : value(value) { }
-    APRIL_CUDA_EXPORT T operator()(const T &a) {
+    APRIL_CUDA_EXPORT bool operator()(const T &a) {
       return AprilMath::m_gt(a, value);
     }
   };
@@ -1247,17 +1242,15 @@ namespace AprilMath {
         ERROR_EXIT(128, "For NaN comparison use m_curried_eq_nan\n");
       }
     }
-    APRIL_CUDA_EXPORT T operator()(const T &a) {
-      if (a == value) return T(1.0f);
-      else return T(0.0f);
+    APRIL_CUDA_EXPORT bool operator()(const T &a) {
+      return (a == value);
     }
   };
 
   template<typename T>
   struct m_curried_eq_nan {
-    APRIL_CUDA_EXPORT T operator()(const T &a) {
-      if (AprilMath::m_isnan(a)) return T(1.0f);
-      else return T(0.0f);
+    APRIL_CUDA_EXPORT bool operator()(const T &a) {
+      return AprilMath::m_isnan(a);
     }
   };
 
@@ -1269,17 +1262,15 @@ namespace AprilMath {
         ERROR_EXIT(128, "For NaN comparison use m_curried_eq_nan\n");
       }
     }
-    APRIL_CUDA_EXPORT T operator()(const T &a) {
-      if (a == value) return T(0.0f);
-      else return T(1.0f);
+    APRIL_CUDA_EXPORT bool operator()(const T &a) {
+      return !(a == value);
     }
   };
 
   template<typename T>
   struct m_curried_neq_nan {
-    APRIL_CUDA_EXPORT T operator()(const T &a) {
-      if (AprilMath::m_isnan(a)) return T(0.0f);
-      else return T(1.0f);
+    APRIL_CUDA_EXPORT bool operator()(const T &a) {
+      return !(AprilMath::m_isnan(a));
     }
   };
   
diff --git a/packages/basics/mathcore/c_src/copy.cu b/packages/basics/mathcore/c_src/copy.cu
index 391646d24..c22142498 100644
--- a/packages/basics/mathcore/c_src/copy.cu
+++ b/packages/basics/mathcore/c_src/copy.cu
@@ -181,6 +181,14 @@ namespace AprilMath {
                              unsigned int,
                              bool);
 
+  template void doCopy<bool>(int, const GPUMirroredMemoryBlock<bool>*,
+                             unsigned int,
+                             unsigned int,
+                             GPUMirroredMemoryBlock<bool>*,
+                             unsigned int,
+                             unsigned int,
+                             bool);
+
   template void doCopy<float>(int, const GPUMirroredMemoryBlock<float>*,
                               unsigned int,
                               unsigned int,
diff --git a/packages/basics/mathcore/c_src/gemm.cu b/packages/basics/mathcore/c_src/gemm.cu
index 6b3434d8d..38e5bfa0e 100644
--- a/packages/basics/mathcore/c_src/gemm.cu
+++ b/packages/basics/mathcore/c_src/gemm.cu
@@ -20,6 +20,7 @@
  *
  */
 #include "mathcore.h"
+#include "transpose.h"
 #include "unused_variable.h"
 
 namespace AprilMath {
@@ -30,7 +31,7 @@ namespace AprilMath {
     /***************************************
      ************** CUDA SECTION ***********
      ***************************************/
-
+    
     cublasStatus_t wrapperCublasGemm(cublasHandle_t &handle,
                                      cublasOperation_t &cublas_a_transpose,
                                      cublasOperation_t &cublas_b_transpose,
@@ -268,9 +269,21 @@ namespace AprilMath {
 #endif
 #ifdef USE_CUDA
     if (use_gpu) {
+      AprilUtils::SharedPtr< GPUMirroredMemoryBlock<T> > old_c; // holds the caller's C block while `c` is redirected below
+      int old_c_inc; // only assigned on the non-column-major path
+      if (major_type != CblasColMajor) { // non-column-major input: rewrite the problem before calling cuBLAS
+        AprilUtils::swap(m,n); // from here on m and n hold each other's original value
+        AprilUtils::swap(a,b);
+        AprilUtils::swap(a_inc,b_inc);
+        a_transpose = NEGATE_CBLAS_TRANSPOSE(a_transpose);
+        b_transpose = NEGATE_CBLAS_TRANSPOSE(b_transpose);
+        old_c.reset(c); // remember the real destination block
+        c = new GPUMirroredMemoryBlock<T>(m*n); // scratch block of m*n elements; NOTE(review): GEMM is passed beta and this block as C - confirm beta != 0 callers are handled
+        old_c_inc = c_inc; // stride of the real destination, needed when copying the result back
+        c_inc = m; // stride used for the scratch block
+      }
       cublasStatus_t status;
       cublasHandle_t handle = CUDA::GPUHelper::getHandler();
-      assert(major_type == CblasColMajor);
       //printf("Doing a sgemm with comp=1 & cuda=1\n");
       a_mem = a->getGPUForRead() + a_shift;
       b_mem = b->getGPUForRead() + b_shift;
@@ -289,6 +302,14 @@ namespace AprilMath {
                                        &beta, c_mem, c_inc);
       
       checkCublasError(status);
+      
+      if (major_type != CblasColMajor) { // same test as the setup branch above: the result sits in the scratch block `c`
+        status = CUDA::wrapperTranspose(handle, m, n, // transpose the scratch result into the caller's block
+                                        c->getGPUForRead(), c_inc, // NOTE(review): geam with OP_T needs a source stride >= n; c_inc was set to m - confirm
+                                        old_c->getGPUForWrite(), old_c_inc);
+        checkCublasError(status); // do not silently ignore a failed transpose
+        delete c; // release the scratch block allocated for this call
+      }
     }
     else {
       //printf("Doing a sgemm with comp=1 & cuda=0\n");
@@ -323,7 +344,6 @@ namespace AprilMath {
                   SPARSE_FORMAT sparse_format,
                   CBLAS_TRANSPOSE a_transpose,
                   CBLAS_TRANSPOSE b_transpose,
-                  CBLAS_TRANSPOSE c_transpose,
                   int m,
                   int n,
                   int k,
@@ -354,8 +374,8 @@ namespace AprilMath {
       cusparseHandle_t handle = CUDA::GPUHelper::getSparseHandler();
       if (major_order != CblasColMajor)
         ERROR_EXIT(128, "Column major matrices are expected\n");
-      if (b_transpose == CblasTrans || c_transpose == CblasTrans)
-        ERROR_EXIT(128, "Impossible to transpose B or C matrices "
+      if (b_transpose == CblasTrans)
+        ERROR_EXIT(128, "Impossible to transpose B matrix "
                    "when using CUDA\n");
       if (sparse_format != CSR_FORMAT)
         a_transpose = NEGATE_CBLAS_TRANSPOSE(a_transpose);
@@ -406,7 +426,7 @@ namespace AprilMath {
       // matrix matrix product: C = \alpha op(A) op(B) + \beta C
       wrapperCblasSparseMM(major_order,
                            sparse_format,
-                           a_transpose, b_transpose, c_transpose,
+                           a_transpose, b_transpose, CblasNoTrans,
                            m,            // num rows of A (before transpose)
                            n,            // num rows at B (before transpose)
                            k,            // Common dimension between A and B
@@ -485,7 +505,6 @@ namespace AprilMath {
                                   SPARSE_FORMAT sparse_format,
                                   CBLAS_TRANSPOSE a_transpose,
                                   CBLAS_TRANSPOSE b_transpose,
-                                  CBLAS_TRANSPOSE c_transpose,
                                   int m,
                                   int n,
                                   int k,
@@ -506,7 +525,6 @@ namespace AprilMath {
                                    SPARSE_FORMAT sparse_format,
                                    CBLAS_TRANSPOSE a_transpose,
                                    CBLAS_TRANSPOSE b_transpose,
-                                   CBLAS_TRANSPOSE c_transpose,
                                    int m,
                                    int n,
                                    int k,
@@ -527,7 +545,6 @@ namespace AprilMath {
                                      SPARSE_FORMAT sparse_format,
                                      CBLAS_TRANSPOSE a_transpose,
                                      CBLAS_TRANSPOSE b_transpose,
-                                     CBLAS_TRANSPOSE c_transpose,
                                      int m,
                                      int n,
                                      int k,
diff --git a/packages/basics/mathcore/c_src/lapack_headers.cc b/packages/basics/mathcore/c_src/lapack_headers.cc
index 16ca02d88..841672b9c 100644
--- a/packages/basics/mathcore/c_src/lapack_headers.cc
+++ b/packages/basics/mathcore/c_src/lapack_headers.cc
@@ -26,16 +26,14 @@
 #include "cblas_headers.h"
 int clapack_sgetrf(const int Order, const int M, const int N,
                    float *A, const int lda, int *ipiv) {
-  if (Order != CblasColMajor)
-    ERROR_EXIT(256, "Only col_major order is allowed\n");
+  UNUSED_VARIABLE(Order);
   int INFO;
   sgetrf_(&M,&N,A,&lda,ipiv,&INFO);
   return INFO;
 }
 int clapack_sgetri(const int Order, const int N,
                    float *A, const int lda, int *ipiv) {
-  if (Order != CblasColMajor)
-    ERROR_EXIT(256, "Only col_major order is allowed\n");
+  UNUSED_VARIABLE(Order);
   int INFO;
   int LWORK = N*N;
   float *WORK = new float[LWORK];
@@ -45,8 +43,9 @@ int clapack_sgetri(const int Order, const int N,
 }
 int clapack_sgesdd(const int Order, const int M, const int N, const int LDA,
 		   float *A, float *U, float *S, float *VT) {
-  if (Order != CblasColMajor)
+  if (Order != CblasColMajor) {
     ERROR_EXIT(256, "Only col_major order is allowed\n");
+  }
   const int numSV = (M<N) ? M : N;
   // workspace
   float workSize;
@@ -68,27 +67,29 @@ int clapack_sgesdd(const int Order, const int M, const int N, const int LDA,
 }
 int clapack_spotrf(const int Order, const int Uplo, const int N, float *A,
                    const int LDA) {
-  if (Order != CblasColMajor)
-    ERROR_EXIT(256, "Only col_major order is allowed\n");
   int info = 0;
-  char uplo = (Uplo == CblasLower) ? 'L' : 'U';
-  spotrf_(&uplo, &N, A, &LDA, &info);
+  if (Order == CblasRowMajor) {
+    char uplo = (Uplo == CblasLower) ? 'U' : 'L'; // row-major: hand spotrf_ the opposite triangle letter (presumably because spotrf_ works on column-major storage - confirm)
+    spotrf_(&uplo, &N, A, &LDA, &info);
+  }
+  else { // CblasColMajor
+    char uplo = (Uplo == CblasLower) ? 'L' : 'U'; // any other order: triangle letter is passed through unchanged
+    spotrf_(&uplo, &N, A, &LDA, &info);
+  }
   return info;
 }
 #elif defined(USE_XCODE)
 #include "cblas_headers.h"
 int clapack_sgetrf(int Order, int M, int N,
                    float *A, int lda, int *ipiv) {
-  if (Order != CblasColMajor)
-    ERROR_EXIT(256, "Only col_major order is allowed\n");
+  UNUSED_VARIABLE(Order);
   int INFO;
   sgetrf_(&M,&N,A,&lda,ipiv,&INFO);
   return INFO;
 }
 int clapack_sgetri(int Order, int N,
                    float *A, int lda, int *ipiv) {
-  if (Order != CblasColMajor)
-    ERROR_EXIT(256, "Only col_major order is allowed\n");
+  UNUSED_VARIABLE(Order);
   int INFO;
   int LWORK = N*N;
   float *WORK = new float[LWORK];
@@ -122,11 +123,15 @@ int clapack_sgesdd(int Order, int M, int N, int LDA,
 }
 int clapack_spotrf(int Order, int Uplo, int N, float *A,
                    int LDA) {
-  if (Order != CblasColMajor)
-    ERROR_EXIT(256, "Only col_major order is allowed\n");
   int info = 0;
-  char uplo = (Uplo == CblasLower) ? 'L' : 'U';
-  spotrf_(&uplo, &N, A, &LDA, &info);
+  if (Order == CblasRowMajor) {
+    char uplo = (Uplo == CblasLower) ? 'U' : 'L'; // row-major: hand spotrf_ the opposite triangle letter (presumably because spotrf_ works on column-major storage - confirm)
+    spotrf_(&uplo, &N, A, &LDA, &info);
+  }
+  else { // CblasColMajor
+    char uplo = (Uplo == CblasLower) ? 'L' : 'U'; // any other order: triangle letter is passed through unchanged
+    spotrf_(&uplo, &N, A, &LDA, &info);
+  }
   return info;
 }
 #else
diff --git a/packages/basics/mathcore/c_src/transpose.cu b/packages/basics/mathcore/c_src/transpose.cu
new file mode 100644
index 000000000..013ede803
--- /dev/null
+++ b/packages/basics/mathcore/c_src/transpose.cu
@@ -0,0 +1,61 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2013, Salvador España-Boquera, Francisco Zamora-Martinez
+ * Copyright 2012, Salvador España-Boquera
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#include "transpose.h"
+
+#ifdef USE_CUDA
+namespace CUDA {
+  cublasStatus_t wrapperTranspose(cublasHandle_t &handle, // float overload: forwards to cublasSgeam and returns its status
+                                  int m, int n,
+                                  const float *orig, int orig_inc,
+                                  float *dest, int dest_inc) {
+    float alpha=1.0f, beta=0.0f; // weight 1 on the first operand, weight 0 on the second
+    return cublasSgeam(handle, CUBLAS_OP_T, CUBLAS_OP_T, m, n, // both operands are read transposed
+                       &alpha, orig, orig_inc,
+                       &beta, orig, orig_inc, // second operand is `orig` again; it is weighted by beta == 0
+                       dest, dest_inc);
+  }
+
+  cublasStatus_t wrapperTranspose(cublasHandle_t &handle, // double overload: forwards to cublasDgeam and returns its status
+                                  int m, int n,
+                                  const double *orig, int orig_inc,
+                                  double *dest, int dest_inc) {
+    double alpha=1.0, beta=0.0; // weight 1 on the first operand, weight 0 on the second
+    return cublasDgeam(handle, CUBLAS_OP_T, CUBLAS_OP_T, m, n, // both operands are read transposed
+                       &alpha, orig, orig_inc,
+                       &beta, orig, orig_inc, // second operand is `orig` again; it is weighted by beta == 0
+                       dest, dest_inc);
+  }
+
+  cublasStatus_t wrapperTranspose(cublasHandle_t &handle, // ComplexF overload: forwards to cublasCgeam and returns its status
+                                  int m, int n,
+                                  const ComplexF *orig, int orig_inc,
+                                  ComplexF *dest, int dest_inc) {
+    ComplexF alpha=ComplexF(1.0,0.0), beta=ComplexF(0.0,0.0); // alpha is the real unit 1+0i; 1+1i would multiply every element by (1+i)
+    return cublasCgeam(handle, CUBLAS_OP_T, CUBLAS_OP_T, m, n, // plain transpose of both operands (OP_T, not the conjugating OP_C)
+                       reinterpret_cast<const cuComplex*>(&alpha),
+                       reinterpret_cast<const cuComplex*>(orig), orig_inc, // matrix pointers get the same cuComplex cast as the scalars
+                       reinterpret_cast<const cuComplex*>(&beta),
+                       reinterpret_cast<const cuComplex*>(orig), orig_inc, // second operand is `orig` again; it is weighted by beta == 0
+                       reinterpret_cast<cuComplex*>(dest), dest_inc);
+  }
+}
+#endif // USE_CUDA
diff --git a/packages/basics/mathcore/c_src/transpose.h b/packages/basics/mathcore/c_src/transpose.h
new file mode 100644
index 000000000..b66c90aaf
--- /dev/null
+++ b/packages/basics/mathcore/c_src/transpose.h
@@ -0,0 +1,45 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2013, Salvador España-Boquera, Francisco Zamora-Martinez
+ * Copyright 2012, Salvador España-Boquera
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#ifndef TRANSPOSE_H
+#define TRANSPOSE_H
+#include "mathcore.h"
+
+#ifdef USE_CUDA
+namespace CUDA {
+  cublasStatus_t wrapperTranspose(cublasHandle_t &handle,
+                                  int m, int n,
+                                  const float *orig, int orig_inc,
+                                  float *dest, int dest_inc);
+
+  cublasStatus_t wrapperTranspose(cublasHandle_t &handle,
+                                  int m, int n,
+                                  const double *orig, int orig_inc,
+                                  double *dest, int dest_inc);
+
+  cublasStatus_t wrapperTranspose(cublasHandle_t &handle,
+                                  int m, int n,
+                                  const ComplexF *orig, int orig_inc,
+                                  ComplexF *dest, int dest_inc);
+}
+#endif // USE_CUDA
+
+#endif // TRANSPOSE_H
diff --git a/packages/basics/matrix/binding/bind_matrix.lua.cc b/packages/basics/matrix/binding/bind_matrix.lua.cc
index f9270dcd3..9412a427c 100644
--- a/packages/basics/matrix/binding/bind_matrix.lua.cc
+++ b/packages/basics/matrix/binding/bind_matrix.lua.cc
@@ -20,9 +20,13 @@
  */
 //BIND_HEADER_C
 #include <cmath> // para isfinite
+extern "C" {
+#include <ctype.h>
+}
 #include "bind_april_io.h"
 #include "bind_mtrand.h"
 #include "bind_matrix_int32.h"
+#include "bind_matrix_bool.h"
 #include "bind_sparse_matrix.h"
 #include "luabindutil.h"
 #include "luabindmacros.h"
@@ -31,6 +35,23 @@
 #include "mystring.h"
 #include "utilMatrixFloat.h"
 
+namespace AprilUtils { // LuaTable specializations for Basics::MatrixFloat* values
+  template<> Basics::MatrixFloat *LuaTable:: // read: delegates to lua_toMatrixFloat on stack slot idx
+  convertTo<Basics::MatrixFloat *>(lua_State *L, int idx) {
+    return lua_toMatrixFloat(L, idx);
+  }
+  
+  template<> void LuaTable:: // write: delegates to lua_pushMatrixFloat
+  pushInto<Basics::MatrixFloat *>(lua_State *L, Basics::MatrixFloat *value) {
+    lua_pushMatrixFloat(L, value);
+  }
+
+  template<> bool LuaTable:: // type test: delegates to lua_isMatrixFloat on stack slot idx
+  checkType<Basics::MatrixFloat *>(lua_State *L, int idx) {
+    return lua_isMatrixFloat(L, idx);
+  }
+}
+
 #define FUNCTION_NAME "read_vector"
 static int *read_vector(lua_State *L, const char *key, int num_dim, int add) {
   int *v=0;
@@ -67,23 +88,6 @@ int sliding_window_iterator_function(lua_State *L) {
   return 1;
 }
 
-int matrixfloatset_iterator_function(lua_State *L) {
-  MatrixFloatSetIteratorWrapper *obj = lua_toMatrixFloatSetIteratorWrapper(L,1);
-  if (obj->it == obj->m->end()) {
-    lua_pushnil(L);
-    return 1;
-  }
-  lua_pushstring(L, obj->it->first.c_str());
-  if (obj->it->second.isSparse()) {
-    lua_pushSparseMatrixFloat(L, obj->it->second.getSparse().get());
-  }
-  else {
-    lua_pushMatrixFloat(L, obj->it->second.checkDense().get());
-  }
-  ++obj->it;
-  return 2;
-}
-
 template<typename T>
 static bool check_number(lua_State *L, int i, T &dest) {
   if (lua_isnumber(L,i)) {
@@ -105,7 +109,6 @@ static bool check_number(lua_State *L, int i, T &dest) {
 //BIND_HEADER_H
 #include "bind_april_io.h"
 #include "matrixFloat.h"
-#include "matrixFloatSet.h"
 #include "utilLua.h"
 #include <cmath> // para isfinite
 
@@ -125,34 +128,20 @@ typedef MatrixFloat::sliding_window SlidingWindow;
 
 namespace Basics {
 
-  class MatrixFloatSetIteratorWrapper : public Referenced {
-  public:
-    MatrixFloatSet *m;
-    MatrixFloatSet::iterator it;
-    MatrixFloatSetIteratorWrapper(MatrixFloatSet *m) :
-      Referenced(), m(m), it(m->begin()) {
-      IncRef(m);
-    }
-    virtual ~MatrixFloatSetIteratorWrapper() {
-      DecRef(m);
-    }
-  };
-
   template<typename T>
   Matrix<T> *readMatrixLuaMethod(lua_State *L) {
     AprilIO::StreamInterface *stream =
       lua_toAuxStreamInterface<AprilIO::StreamInterface>(L,1);
     if (stream == 0) luaL_error(L, "Needs a stream as first argument");
     AprilUtils::SharedPtr<AprilIO::StreamInterface> ptr(stream);
-    AprilUtils::LuaTableOptions options(L,2);
-    return Matrix<T>::read(ptr.get(), &options); 
+    AprilUtils::LuaTable options(L,2);
+    return Matrix<T>::read(ptr.get(), options); 
   }
 }
 //BIND_END
 
 //BIND_STRING_CONSTANT matrix.options.tab Basics::MatrixIO::TAB_OPTION
 //BIND_STRING_CONSTANT matrix.options.ascii Basics::MatrixIO::ASCII_OPTION
-//BIND_STRING_CONSTANT matrix.options.order Basics::MatrixIO::ORDER_OPTION
 //BIND_STRING_CONSTANT matrix.options.delim Basics::MatrixIO::DELIM_OPTION
 //BIND_STRING_CONSTANT matrix.options.empty Basics::MatrixIO::EMPTY_OPTION
 //BIND_STRING_CONSTANT matrix.options.default Basics::MatrixIO::DEFAULT_OPTION
@@ -281,60 +270,6 @@ namespace Basics {
 }
 //BIND_END
 
-//BIND_CLASS_METHOD MatrixFloat col_major
-//DOC_BEGIN
-// col_major_matrix(int dim1, int dim2, ..., table mat=nil)
-/// Constructor con una secuencia de valores que son las dimensiones de
-/// la matriz el ultimo argumento puede ser una tabla, en cuyo caso
-/// contiene los valores adecuadamente serializados, si solamente
-/// aparece la matriz, se trata de un vector cuya longitud viene dada
-/// implicitamente.
-//DOC_END
-{
-  int i,argn;
-  argn = lua_gettop(L); // number of arguments
-  LUABIND_CHECK_ARGN(>=, 1);
-  int ndims = (!lua_isnumber(L,argn)) ? argn-1 : argn;
-  int *dim;
-  if (ndims == 0) { // caso matrix{valores}
-    ndims = 1;
-    dim = new int[ndims];
-    LUABIND_TABLE_GETN(1, dim[0]);
-  } else {
-    dim = new int[ndims];
-    for (i=1; i <= ndims; i++) {
-      if (!lua_isnumber(L,i))
-	// TODO: Este mensaje de error parece que no es correcto... y no se todavia por que!!!
-	LUABIND_FERROR2("incorrect argument to matrix dimension (arg %d must"
-			" be a number and is a %s)",
-			i, lua_typename(L,i));
-      dim[i-1] = (int)lua_tonumber(L,i);
-      if (dim[i-1] <= 0)
-	LUABIND_FERROR1("incorrect argument to matrix dimension (arg %d must be >0)",i);
-    }
-  }
-  MatrixFloat* obj;
-  obj = new MatrixFloat(ndims,dim,CblasColMajor);
-  if (lua_istable(L,argn)) {
-    int i=1;
-    int len;
-    LUABIND_TABLE_GETN(argn, len);
-    if (len != obj->size())
-      LUABIND_FERROR2("Incorrect number of elements at the given table, "
-		      "found %d, expected %d", len, obj->size());
-    for (MatrixFloat::iterator it(obj->begin()); it != obj->end(); ++it, ++i) {
-      lua_rawgeti(L,argn,i);
-      if (!check_number(L,-1,*it))
-	LUABIND_FERROR1("The given table has a no number value at position %d, "
-			"the table could be smaller than matrix size", i);
-      lua_remove(L,-1);
-    }
-  }
-  delete[] dim;
-  LUABIND_RETURN(MatrixFloat,obj);
-}
-//BIND_END
-
 //BIND_METHOD MatrixFloat size
 {
   LUABIND_RETURN(int, obj->size());
@@ -555,14 +490,6 @@ namespace Basics {
 }
 //BIND_END
 
-//BIND_METHOD MatrixFloat get_major_order
-{
-  if (obj->getMajorOrder() == CblasRowMajor)
-    LUABIND_RETURN(string, "row_major");
-  else LUABIND_RETURN(string, "col_major");
-}
-//BIND_END
-
 //BIND_METHOD MatrixFloat dim
 {
   LUABIND_CHECK_ARGN(>=, 0);
@@ -645,21 +572,7 @@ namespace Basics {
 /// Devuelve un <em>clon</em> de la matriz.
 //DOC_END
 {
-  LUABIND_CHECK_ARGN(>=, 0);
-  LUABIND_CHECK_ARGN(<=, 1);
-  int argn;
-  argn = lua_gettop(L); // number of arguments
-  MatrixFloat *obj2;
-  if (argn == 0) obj2 = obj->clone();
-  else {
-    const char *major;
-    LUABIND_GET_OPTIONAL_PARAMETER(1, string, major, "row_major");
-    CBLAS_ORDER order=CblasRowMajor;
-    if (strcmp(major, "col_major") == 0) order = CblasColMajor;
-    else if (strcmp(major, "row_major") != 0)
-      LUABIND_FERROR1("Incorrect major order string %s", major);
-    obj2 = obj->clone(order);
-  }
+  MatrixFloat *obj2 = obj->clone();
   LUABIND_RETURN(MatrixFloat,obj2);
 }
 //BIND_END
@@ -676,22 +589,17 @@ namespace Basics {
 
 //BIND_METHOD MatrixFloat transpose
 {
-  LUABIND_RETURN(MatrixFloat, obj->transpose());
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloat in_major_order
-{
-  const char *major;
-  LUABIND_GET_PARAMETER(1, string, major);
-  CBLAS_ORDER order;
-  if (strcmp(major, "col_major") == 0) order = CblasColMajor;
-  else if (strcmp(major, "row_major") == 0) order = CblasRowMajor;
+  int argn;
+  argn = lua_gettop(L); // number of values on the Lua stack for this call
+  if (argn == 0) { // no arguments: use the parameterless transpose()
+    LUABIND_RETURN(MatrixFloat, obj->transpose());
+  }
   else {
-    order = CblasRowMajor; // avoids compiler warning
-    LUABIND_FERROR1("Incorrect major order string %s", major);
+    int d1,d2; // the two dimension numbers given by the caller
+    LUABIND_GET_PARAMETER(1, int, d1);
+    LUABIND_GET_PARAMETER(2, int, d2);
+    LUABIND_RETURN(MatrixFloat, obj->transpose(d1-1, d2-1)); // each value is lowered by one before the C++ call (presumably 1-based Lua -> 0-based C++; confirm)
   }
-  LUABIND_RETURN(MatrixFloat, obj->inMajorOrder(order));
 }
 //BIND_END
 
@@ -855,14 +763,9 @@ namespace Basics {
     LUABIND_ERROR("First argument must be <= second argument");
   if (random == 0) random = new MTRand();
   IncRef(random);
-  if (obj->getIsDataRowOrdered())
-    for (MatrixFloat::iterator it(obj->begin()); it != obj->end(); ++it) {
-      *it = static_cast<float>(random->randInt(upper - lower)) + lower;
-    }
-  else
-    for (MatrixFloat::col_major_iterator it(obj->begin());it!=obj->end();++it) {
-      *it = static_cast<float>(random->randInt(upper - lower)) + lower;
-    }
+  for (MatrixFloat::iterator it(obj->begin()); it != obj->end(); ++it) {
+    *it = static_cast<float>(random->randInt(upper - lower)) + lower;
+  }
   DecRef(random);
   LUABIND_RETURN(MatrixFloat, obj);
 }
@@ -879,12 +782,8 @@ namespace Basics {
     LUABIND_ERROR("First argument must be <= second argument");
   if (random == 0) random = new MTRand();
   IncRef(random);
-  if (obj->getMajorOrder() == CblasRowMajor)
-    for (MatrixFloat::iterator it(obj->begin()); it != obj->end(); ++it)
-      *it = random->rand(upper - lower) + lower;
-  else
-    for (MatrixFloat::col_major_iterator it(obj->begin());it!=obj->end();++it)
-      *it = random->rand(upper - lower) + lower;
+  for (MatrixFloat::iterator it(obj->begin()); it != obj->end(); ++it)
+    *it = random->rand(upper - lower) + lower;
   DecRef(random);
   LUABIND_RETURN(MatrixFloat, obj);
 }
@@ -979,12 +878,6 @@ namespace Basics {
 }
 //BIND_END
 
-//BIND_METHOD MatrixFloat is_transposed
-{
-  LUABIND_RETURN(bool, obj->getTransposedFlag());
-}
-//BIND_END
-
 //BIND_METHOD MatrixFloat prune_subnormal_and_check_normal
 {
   obj->pruneSubnormalAndCheckNormal();
@@ -1402,10 +1295,10 @@ namespace Basics {
   LUABIND_CHECK_ARGN(>=, 0);
   LUABIND_CHECK_ARGN(<=, 2);
   int argn = lua_gettop(L); // number of arguments
-  if (argn >= 1) {
+  if (argn > 0 && !lua_isnil(L,1)) {
     int dim;
-    MatrixFloat *dest;
     LUABIND_GET_PARAMETER(1, int, dim);
+    MatrixFloat *dest;
     LUABIND_GET_OPTIONAL_PARAMETER(2, MatrixFloat, dest, 0);
     if (dim < 1 || dim > obj->getNumDim())
       LUABIND_FERROR2("Incorrect dimension, found %d, expect in [1,%d]",
@@ -1495,10 +1388,10 @@ namespace Basics {
 {
   LUABIND_CHECK_ARGN(==, 1);
   LUABIND_CHECK_PARAMETER(1, table);
-  check_table_fields(L,1, "trans_A", "trans_B", "trans_C",
+  check_table_fields(L,1, "trans_A", "trans_B",
                      "alpha", "A", "B", "beta",
                      (const char *)0);
-  bool trans_A, trans_B, trans_C;
+  bool trans_A, trans_B;
   float alpha;
   float beta;
   SparseMatrixFloat *matA;
@@ -1507,7 +1400,6 @@ namespace Basics {
   LUABIND_GET_TABLE_PARAMETER(1, B, MatrixFloat, matB);
   LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, trans_A, bool, trans_A, false);
   LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, trans_B, bool, trans_B, false);
-  LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, trans_C, bool, trans_C, false);
   LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, alpha, float, alpha, 1.0f);
   LUABIND_GET_TABLE_OPTIONAL_PARAMETER(1, beta, float, beta, 1.0f);
   LUABIND_RETURN(MatrixFloat,
@@ -1515,7 +1407,6 @@ namespace Basics {
                  matSparseMM(obj,
                              trans_A ? CblasTrans : CblasNoTrans,
                              trans_B ? CblasTrans : CblasNoTrans,
-                             trans_C ? CblasTrans : CblasNoTrans,
                              alpha, matA, matB,
                              beta));
 }
@@ -1679,6 +1570,10 @@ namespace Basics {
 {
   char uplo;
   LUABIND_GET_OPTIONAL_PARAMETER(1, char, uplo, 'U');
+  uplo = static_cast<char>(toupper(static_cast<unsigned char>(uplo))); // toupper requires an unsigned-char value (or EOF); a negative plain char is undefined behaviour
+  if (uplo != 'U' && uplo != 'L') { // after upper-casing, only U and L are accepted
+    LUABIND_ERROR("Incorrect argument, expected character L or U");
+  }
   LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
                  matCholesky(obj, uplo));
 }
@@ -1700,13 +1595,13 @@ namespace Basics {
   if (lua_isMatrixFloat(L, 1)) {
     MatrixFloat *value;
     LUABIND_GET_PARAMETER(1, MatrixFloat, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matLT(obj, value));
   }
   else {
     float value;
     LUABIND_GET_PARAMETER(1, float, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matLT(obj, value));
   }
 }
@@ -1717,13 +1612,13 @@ namespace Basics {
   if (lua_isMatrixFloat(L, 1)) {
     MatrixFloat *value;
     LUABIND_GET_PARAMETER(1, MatrixFloat, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matGT(obj, value));
   }
   else {
     float value;
     LUABIND_GET_PARAMETER(1, float, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matGT(obj, value));
   }
 }
@@ -1734,13 +1629,13 @@ namespace Basics {
   if (lua_isMatrixFloat(L, 1)) {
     MatrixFloat *value;
     LUABIND_GET_PARAMETER(1, MatrixFloat, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matEQ(obj, value));
   }
   else {
     float value;
     LUABIND_GET_PARAMETER(1, float, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matEQ(obj, value));
   }
 }
@@ -1751,13 +1646,13 @@ namespace Basics {
   if (lua_isMatrixFloat(L, 1)) {
     MatrixFloat *value;
     LUABIND_GET_PARAMETER(1, MatrixFloat, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matNEQ(obj, value));
   }
   else {
     float value;
     LUABIND_GET_PARAMETER(1, float, value);
-    LUABIND_RETURN(MatrixFloat, AprilMath::MatrixExt::Operations::
+    LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
                    matNEQ(obj, value));
     
   }
@@ -1954,404 +1849,3 @@ namespace Basics {
 //BIND_END
 
 //////////////////////////////////////////////////////////////////////
-
-//BIND_LUACLASSNAME MatrixFloatSet matrix.dict
-//BIND_CPP_CLASS MatrixFloatSet
-
-//BIND_CONSTRUCTOR MatrixFloatSet
-{
-  int argn = lua_gettop(L); // number of arguments
-  obj = new MatrixFloatSet();
-  if (argn == 1) {
-    LUABIND_CHECK_PARAMETER(1, table);
-    lua_pushvalue(L, 1);
-    // stack now contains: -1 => table
-    lua_pushnil(L);
-    // stack now contains: -1 => nil; -2 => table
-    while (lua_next(L, -2)) {
-      // copy the key so that lua_tostring does not modify the original
-      lua_pushvalue(L, -2);
-      // stack now contains: -1 => value; -2 => key; -3 => table
-      const char *key = lua_tostring(L, -1);
-      // stack now contains: -1 => key; -2 => value; -3 => key; -4 => table
-      if (lua_isMatrixFloat(L, -2)) {
-        MatrixFloat *value = lua_toMatrixFloat(L, -2);
-        obj->insert(key, value);
-      }
-      else if (lua_isSparseMatrixFloat(L, -2)) {
-        SparseMatrixFloat *value = lua_toSparseMatrixFloat(L, -2);
-        obj->insert(key, value);
-      }
-      else LUABIND_ERROR("Incorrect matrix type, expected matrix or matrix.sparse\n");
-      // pop value + copy of key, leaving original key
-      lua_pop(L, 2);
-      // stack now contains: -1 => key; -2 => table
-    }
-    // stack now contains: -1 => table (when lua_next returns 0 it pops the key
-    // but does not push anything.)
-  }
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet size
-{
-  LUABIND_RETURN(int, obj->size());
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet insert
-{
-  const char *key;
-  LUABIND_CHECK_ARGN(==, 2);
-  LUABIND_GET_PARAMETER(1, string, key);
-  if (lua_isMatrixFloat(L, 2)) {
-    MatrixFloat *m;
-    LUABIND_GET_PARAMETER(2, MatrixFloat, m);
-    obj->insert(key, m);
-  }
-  else if (lua_isSparseMatrixFloat(L, 2)) {
-    SparseMatrixFloat *m;
-    LUABIND_GET_PARAMETER(2, SparseMatrixFloat, m);
-    obj->insert(key, m);
-  }
-  else LUABIND_ERROR("Incorrect matrix type, expected matrix or matrix.sparse\n");
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet find
-{
-  const char *key;
-  LUABIND_CHECK_ARGN(==, 1);
-  LUABIND_GET_PARAMETER(1, string, key);
-  MatrixFloatSet::Value *v = obj->find(key);
-  if (v != 0) {
-    if (v->isSparse()) {
-      LUABIND_RETURN(SparseMatrixFloat, v->getSparse().get());
-    }
-    else {
-      LUABIND_RETURN(MatrixFloat, v->checkDense().get());
-    }
-  }
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet fill
-{
-  float value;
-  LUABIND_GET_PARAMETER(1, float, value);
-  obj->fill(value);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet scalar_add
-{
-  float value;
-  LUABIND_GET_PARAMETER(1, float, value);
-  obj->scalarAdd(value);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet pow
-{
-  float value;
-  LUABIND_GET_PARAMETER(1, float, value);
-  obj->pow(value);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet scal
-{
-  float value;
-  LUABIND_GET_PARAMETER(1, float, value);
-  obj->scal(value);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet clamp
-{
-  float v1,v2;
-  LUABIND_GET_PARAMETER(1, float, v1);
-  LUABIND_GET_PARAMETER(2, float, v2);
-  obj->clamp(v1,v2);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet zeros
-{
-  obj->zeros();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet ones
-{
-  obj->ones();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet plogp
-{
-  obj->plogp();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet log
-{
-  obj->log();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet log1p
-{
-  obj->log1p();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet exp
-{
-  obj->exp();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet sqrt
-{
-  obj->sqrt();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet tan
-{
-  obj->tan();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet tanh
-{
-  obj->tanh();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet atan
-{
-  obj->atan();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet atanh
-{
-  obj->atanh();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet cos
-{
-  obj->cos();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet cosh
-{
-  obj->cosh();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet acos
-{
-  obj->acos();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet acosh
-{
-  obj->acosh();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet sin
-{
-  obj->sin();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet sinh
-{
-  obj->sinh();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet asin
-{
-  obj->asin();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet asinh
-{
-  obj->asinh();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet abs
-{
-  obj->abs();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet complement
-{
-  obj->complement();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet sign
-{
-  obj->sign();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet inv
-{
-  obj->inv();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet norm2
-{
-  LUABIND_RETURN(float, obj->norm2());
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet prune_subnormal_and_check_normal
-{
-  obj->pruneSubnormalAndCheckNormal();
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet keys
-{
-  lua_createtable(L, 0, 0);
-  int i=1;
-  for (MatrixFloatSet::const_iterator it=obj->begin();
-       it != obj->end(); ++it, ++i) {
-    lua_pushnumber(L, i);
-    lua_pushstring(L, it->first.c_str());
-    lua_settable(L, -3);
-  }
-  LUABIND_INCREASE_NUM_RETURNS(1);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet axpy
-{
-  float alpha;
-  MatrixFloatSet *other;
-  LUABIND_CHECK_ARGN(==,2);
-  LUABIND_CHECK_PARAMETER(1,float);
-  LUABIND_CHECK_PARAMETER(2,MatrixFloatSet);
-  LUABIND_GET_PARAMETER(1, float, alpha);
-  LUABIND_GET_PARAMETER(2, MatrixFloatSet, other);
-  obj->axpy(alpha, other);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet copy
-{
-  MatrixFloatSet *other;
-  LUABIND_GET_PARAMETER(1, MatrixFloatSet, other);
-  obj->copy(other);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet cmul
-{
-  MatrixFloatSet *other;
-  LUABIND_CHECK_ARGN(==,1);
-  LUABIND_CHECK_PARAMETER(1,MatrixFloatSet);
-  LUABIND_GET_PARAMETER(1, MatrixFloatSet, other);
-  obj->cmul(other);
-  LUABIND_RETURN(MatrixFloatSet, obj);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet dot
-{
-  MatrixFloatSet *other;
-  LUABIND_CHECK_ARGN(==,1);
-  LUABIND_CHECK_PARAMETER(1,MatrixFloatSet);
-  LUABIND_GET_PARAMETER(1, MatrixFloatSet, other);
-  float dot_result = obj->dot(other);
-  LUABIND_RETURN(float, dot_result);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet clone
-{
-  MatrixFloatSet *cloned = obj->clone();
-  LUABIND_RETURN(MatrixFloatSet, cloned);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet clone_only_dims
-{
-  MatrixFloatSet *cloned = obj->cloneOnlyDims();
-  LUABIND_RETURN(MatrixFloatSet, cloned);
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet iterate
-{
-  LUABIND_CHECK_ARGN(==, 0);
-  LUABIND_RETURN(cfunction,matrixfloatset_iterator_function);
-  LUABIND_RETURN(MatrixFloatSetIteratorWrapper,
-                 new MatrixFloatSetIteratorWrapper(obj));
-}
-//BIND_END
-
-//BIND_METHOD MatrixFloatSet to_lua_string
-{
-  char *str = obj->toLuaString();
-  LUABIND_RETURN(string, str);
-  delete[] str;
-}
-//BIND_END
-
-//BIND_LUACLASSNAME MatrixFloatSetIteratorWrapper matrix.dict.__iterator__
-//BIND_CPP_CLASS    MatrixFloatSetIteratorWrapper
-
-//BIND_CONSTRUCTOR MatrixFloatSetIteratorWrapper
-{
-  LUABIND_ERROR("Use matrix.dict.iterate method");
-}
-//BIND_END
diff --git a/packages/basics/matrix/binding/bind_matrix_bool.lua.cc b/packages/basics/matrix/binding/bind_matrix_bool.lua.cc
new file mode 100644
index 000000000..e4dcc5d22
--- /dev/null
+++ b/packages/basics/matrix/binding/bind_matrix_bool.lua.cc
@@ -0,0 +1,730 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2013, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+//BIND_HEADER_C
+#include "bind_matrix.h"
+#include "luabindutil.h"
+#include "luabindmacros.h"
+
+namespace Basics {
+#define FUNCTION_NAME "read_vector"
+  static int *read_vector(lua_State *L, const char *key, int num_dim, int add) {
+    // Reads field `key` of the table at stack index 1; a nil field yields 0.
+    lua_getfield(L, 1, key);
+    if (lua_isnil(L, -1)) { lua_pop(L, 1); return 0; }
+    LUABIND_CHECK_PARAMETER(-1, table);
+    int found_len;
+    LUABIND_TABLE_GETN(-1, found_len);
+    if (found_len != num_dim)
+      LUABIND_FERROR3("Table '%s' with incorrect size, expected %d, found %d",
+                      key, num_dim, found_len);
+    int *values = new int[num_dim];
+    for (int pos=1; pos <= num_dim; ++pos) {
+      lua_rawgeti(L, -1, pos);
+      // each entry is converted to int and shifted by `add`
+      values[pos-1] = static_cast<int>(lua_tonumber(L, -1)) + add;
+      lua_pop(L, 1);
+    }
+    lua_pop(L, 1);
+    return values;
+  }
+#undef FUNCTION_NAME
+
+  int sliding_window_matrixBool_iterator_function(lua_State *L) {
+    // Iterator step: pushes the current window matrix of the object at stack
+    // index 1 and advances it, or pushes nil once the window is at its end.
+    SlidingWindowMatrixBool *window = lua_toSlidingWindowMatrixBool(L,1);
+    if (!window->isEnd()) {
+      lua_pushMatrixBool(L, window->getMatrix());
+      window->next();
+    }
+    else lua_pushnil(L);
+    return 1;
+  }
+  
+}
+//BIND_END
+
+//BIND_HEADER_H
+#include "matrixBool.h"
+using namespace Basics;
+typedef MatrixBool::sliding_window SlidingWindowMatrixBool;
+//BIND_END
+
+//BIND_LUACLASSNAME MatrixBool matrixBool
+//BIND_CPP_CLASS MatrixBool
+//BIND_LUACLASSNAME Serializable aprilio.serializable
+//BIND_SUBCLASS_OF MatrixBool Serializable
+
+//BIND_LUACLASSNAME SlidingWindowMatrixBool matrixBool.__sliding_window__
+//BIND_CPP_CLASS SlidingWindowMatrixBool
+
+//BIND_CONSTRUCTOR SlidingWindowMatrixBool
+{
+  LUABIND_ERROR("Use matrixBool.sliding_window"); // calling the constructor always raises this error
+}
+//BIND_END
+
+//BIND_METHOD SlidingWindowMatrixBool get_matrix
+{
+  MatrixBool *dest; // optional argument 1, set to 0 when it is not given
+  LUABIND_GET_OPTIONAL_PARAMETER(1, MatrixBool, dest, 0);
+  LUABIND_RETURN(MatrixBool, obj->getMatrix(dest)); // returns whatever getMatrix(dest) yields
+}
+//BIND_END
+
+//BIND_METHOD SlidingWindowMatrixBool next
+{
+  LUABIND_RETURN(SlidingWindowMatrixBool, obj->next()); // hands the result of next() back to Lua
+}
+//BIND_END
+
+//BIND_METHOD SlidingWindowMatrixBool set_at_window
+{
+  int windex; // window index received from Lua, must be >= 1
+  LUABIND_CHECK_ARGN(==,1);
+  LUABIND_GET_PARAMETER(1, int, windex);
+  if (windex < 1) LUABIND_ERROR("Index must be >= 1\n");
+  obj->setAtWindow(windex-1); // setAtWindow receives the index shifted by -1
+  LUABIND_RETURN(SlidingWindowMatrixBool, obj); // returns the window object itself
+}
+//BIND_END
+
+//BIND_METHOD SlidingWindowMatrixBool num_windows
+{
+  LUABIND_RETURN(int, obj->numWindows()); // value of numWindows() as an int
+}
+//BIND_END
+
+//BIND_METHOD SlidingWindowMatrixBool coords
+{
+  LUABIND_VECTOR_TO_NEW_TABLE(int, obj->getCoords(), obj->getNumDim()); // getNumDim() ints read from getCoords()
+  LUABIND_RETURN_FROM_STACK(-1); // returns the value at stack index -1, presumably the table built above
+}
+//BIND_END
+
+//BIND_METHOD SlidingWindowMatrixBool is_end
+{
+  LUABIND_RETURN(bool, obj->isEnd()); // value of isEnd() as a boolean
+}
+//BIND_END
+
+//BIND_METHOD SlidingWindowMatrixBool iterate
+{
+  LUABIND_CHECK_ARGN(==, 0);
+  LUABIND_RETURN(cfunction,sliding_window_matrixBool_iterator_function); // 1st result: the step function
+  LUABIND_RETURN(SlidingWindowMatrixBool,obj); // 2nd result: this window, which the step function reads at index 1
+}
+//BIND_END
+
+//////////////////////////////////////////////////////////////////////
+
+//BIND_CONSTRUCTOR MatrixBool
+{
+  LUABIND_CHECK_ARGN(>=, 1);
+  if (lua_isMatrixFloat(L,1)) { // conversion from a MatrixFloat holding only 0 and 1
+    MatrixFloat *m;
+    LUABIND_GET_PARAMETER(1, MatrixFloat, m);
+    MatrixBool *obj = new MatrixBool(m->getNumDim(), m->getDimPtr());
+    MatrixBool::iterator bool_it(obj->begin());
+    MatrixFloat::const_iterator float_it(m->begin());
+    while(bool_it != obj->end()) {
+      if (*float_it == 0.0f) *bool_it = false;
+      else if (*float_it == 1.0f) *bool_it = true;
+      else LUABIND_ERROR("Needs a 0/1 matrix argument\n");
+      ++bool_it;
+      ++float_it;
+    }
+    LUABIND_RETURN(MatrixBool, obj);
+  }
+  else { // dimension sizes, optionally followed by a table of boolean values
+    int i,argn;
+    argn = lua_gettop(L); // number of arguments
+    int ndims = (!lua_isnumber(L,argn)) ? argn-1 : argn;
+    int *dim;
+    if (ndims == 0) { // matrixBool{values} case: one dimension sized by the table
+      ndims = 1;
+      dim = new int[ndims];
+      LUABIND_TABLE_GETN(1, dim[0]);
+    } else {
+      dim = new int[ndims];
+      for (i=1; i <= ndims; i++) {
+        if (!lua_isnumber(L,i))
+          // lua_typename takes a type tag, not a stack index: go through lua_type
+          LUABIND_FERROR2("incorrect argument to matrix dimension (arg %d must"
+                          " be a number and is a %s)",
+                          i, lua_typename(L,lua_type(L,i)));
+        dim[i-1] = (int)lua_tonumber(L,i);
+        if (dim[i-1] <= 0)
+          LUABIND_FERROR1("incorrect argument to matrix dimension (arg %d must be >0)",i);
+      }
+    }
+    MatrixBool* obj;
+    obj = new MatrixBool(ndims,dim);
+    if (lua_istable(L,argn)) { // fill in iterator order from table positions 1, 2, ...
+      int i=1;
+      for (MatrixBool::iterator it(obj->begin()); it != obj->end(); ++it) {
+        lua_rawgeti(L,argn,i);
+        if (!lua_isboolean(L,-1))
+          LUABIND_FERROR1("The given table has a no boolean value at position %d, "
+                          "the table could be smaller than matrix size", i);
+        *it = lua_toboolean(L,-1);
+        lua_remove(L,-1);
+        ++i;
+      }
+    }
+    delete[] dim;
+    LUABIND_RETURN(MatrixBool,obj);
+  }
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool size
+{
+  LUABIND_RETURN(int, obj->size()); // value of size() as an int
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool rewrap
+{
+  LUABIND_CHECK_ARGN(>=, 1);
+  // every argument is one (strictly positive) size handed to obj->rewrap
+  const int num_sizes = lua_gettop(L);
+  int *sizes = new int[num_sizes];
+  for (int k=0; k < num_sizes; ++k) {
+    LUABIND_GET_PARAMETER(k+1, int, sizes[k]);
+    if (sizes[k] <= 0)
+      LUABIND_FERROR1("incorrect argument to matrix dimension (arg %d must be >0)",k+1);
+  }
+  MatrixBool *rewrapped = obj->rewrap(sizes, num_sizes);
+  delete[] sizes;
+  LUABIND_RETURN(MatrixBool,rewrapped);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool squeeze
+{
+  LUABIND_RETURN(MatrixBool,obj->squeeze()); // returns the matrix produced by squeeze()
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool get_reference_string
+{
+  // Returns "<address of obj> data= <address returned by getRawDataAccess()>",
+  // both printed with %p.
+  char text[128];
+  sprintf(text,"%p data= %p", (void*)obj, (void*)obj->getRawDataAccess());
+  LUABIND_RETURN(string, text);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool copy_from_table
+{
+  // Overwrites the elements, in iterator order, with table[1..size]; returns obj.
+  LUABIND_CHECK_ARGN(==, 1);
+  LUABIND_CHECK_PARAMETER(1, table);
+  int table_len;
+  LUABIND_TABLE_GETN(1, table_len);
+  if (table_len != obj->size())
+    LUABIND_FERROR2("wrong size %d instead of %d",table_len,obj->size());
+  int pos=0;
+  for (MatrixBool::iterator dst(obj->begin()); dst != obj->end(); ++dst) {
+    lua_rawgeti(L,1,++pos);
+    if (!lua_isboolean(L,-1))
+      LUABIND_FERROR1("The given table has a no boolean value at position %d, "
+                      "the table could be smaller than matrix size", pos);
+    *dst = lua_toboolean(L,-1);
+    lua_pop(L,1);
+  }
+  LUABIND_RETURN(MatrixBool, obj);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool get
+//DOC_BEGIN
+// bool get(coordinates)
+/// Reads one element of the matrix. Needs as many indices as the matrix has dimensions.
+///@param coordinates Position of the element to read: one index per dimension, each in [1, dimension size].
+//DOC_END
+{
+  int argn = lua_gettop(L); // number of arguments
+  if (argn != obj->getNumDim())
+    LUABIND_FERROR2("wrong size %d instead of %d",argn,obj->getNumDim());
+  bool ret;
+  if (obj->getNumDim() == 1) {
+    int v1;
+    LUABIND_GET_PARAMETER(1,int,v1);
+    if (v1<1 || v1 > obj->getDimSize(0)) {
+      LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                      v1, obj->getDimSize(0));
+    }
+    ret = (*obj)(v1-1);
+  }
+  else if (obj->getNumDim() == 2) {
+    int v1, v2;
+    LUABIND_GET_PARAMETER(1,int,v1);
+    LUABIND_GET_PARAMETER(2,int,v2);
+    if (v1<1 || v1 > obj->getDimSize(0)) {
+      LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                      v1, obj->getDimSize(0));
+    }
+    if (v2<1 || v2 > obj->getDimSize(1)) { // the lower bound is 1 for every index
+      LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                      v2, obj->getDimSize(1));
+    }
+    ret = (*obj)(v1-1, v2-1);
+  }
+  else {
+    int *coords = new int[obj->getNumDim()];
+    for (int i=0; i<obj->getNumDim(); ++i) {
+      LUABIND_GET_PARAMETER(i+1,int,coords[i]);
+      if (coords[i]<1 || coords[i] > obj->getDimSize(i)) {
+        LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                        coords[i], obj->getDimSize(i));
+      }
+      coords[i]--; // the element accessor receives each index shifted by -1
+    }
+    ret = (*obj)(coords, obj->getNumDim());
+    delete[] coords;
+  }
+  LUABIND_RETURN(boolean, ret);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool set
+//DOC_BEGIN
+// matrixBool set(coordinates,value)
+/// Changes the value of one element of the matrix. Needs as many
+/// indices as the matrix has dimensions, followed by the boolean
+/// value to store. Returns the matrix itself.
+///@param coordinates Position of the element to change: one index per dimension, each in [1, dimension size].
+//DOC_END
+{
+  int argn = lua_gettop(L); // number of arguments
+  if (argn != obj->getNumDim()+1)
+    LUABIND_FERROR2("wrong size %d instead of %d",argn,obj->getNumDim()+1);
+  bool v;
+  if (obj->getNumDim() == 1) {
+    int v1;
+    LUABIND_GET_PARAMETER(1,int,v1);
+    if (v1<1 || v1 > obj->getDimSize(0)) {
+      LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                      v1, obj->getDimSize(0));
+    }
+    LUABIND_GET_PARAMETER(obj->getNumDim()+1,boolean,v);
+    (*obj)(v1-1) = v;
+  }
+  else if (obj->getNumDim() == 2) {
+    int v1, v2;
+    LUABIND_GET_PARAMETER(1,int,v1);
+    LUABIND_GET_PARAMETER(2,int,v2);
+    if (v1<1 || v1 > obj->getDimSize(0)) {
+      LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                      v1, obj->getDimSize(0));
+    }
+    if (v2<1 || v2 > obj->getDimSize(1)) { // the lower bound is 1 for every index
+      LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                      v2, obj->getDimSize(1));
+    }
+    LUABIND_GET_PARAMETER(obj->getNumDim()+1,boolean,v);
+    (*obj)(v1-1, v2-1) = v;
+  }
+  else {
+    int *coords = new int[obj->getNumDim()];
+    for (int i=0; i<obj->getNumDim(); ++i) {
+      LUABIND_GET_PARAMETER(i+1,int,coords[i]);
+      if (coords[i]<1 || coords[i] > obj->getDimSize(i)) {
+        LUABIND_FERROR2("wrong index parameter: 1 <= %d <= %d is incorrect",
+                        coords[i], obj->getDimSize(i));
+      }
+      coords[i]--; // the element accessor receives each index shifted by -1
+    }
+    LUABIND_GET_PARAMETER(obj->getNumDim()+1,boolean,v);
+    (*obj)(coords, obj->getNumDim()) = v;
+    delete[] coords;
+  }
+  LUABIND_RETURN(MatrixBool, obj);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool offset
+{
+  LUABIND_RETURN(int, obj->getOffset()); // value of getOffset() as an int
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool raw_get
+{
+  int raw_pos; // handed to operator[] as given: no -1 shift and no range check in this binding
+  LUABIND_GET_PARAMETER(1, int, raw_pos);
+  LUABIND_RETURN(bool, (*obj)[raw_pos]);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool raw_set
+{
+  int raw_pos; // handed to operator[] as given: no -1 shift and no range check in this binding
+  bool value;
+  LUABIND_GET_PARAMETER(1, int, raw_pos);
+  LUABIND_GET_PARAMETER(2, boolean, value);
+  (*obj)[raw_pos] = value;
+  LUABIND_RETURN(MatrixBool, obj); // returns the matrix itself
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool fill
+//DOC_BEGIN
+// matrixBool fill(bool value)
+/// Sets every element of the matrix to the same value.
+//DOC_END
+{
+  LUABIND_CHECK_ARGN(==, 1);
+  LUABIND_CHECK_PARAMETER(1, boolean);
+  bool value;
+  LUABIND_GET_PARAMETER(1,boolean,value);
+  LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
+                 matFill(obj, value)); // returns the MatrixBool given back by matFill
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool zeros
+{
+  LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
+                 matFill(obj, false)); // same call as fill(false)
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool ones
+{
+  LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
+                 matFill(obj, true)); // same call as fill(true)
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool dim
+{
+  LUABIND_CHECK_ARGN(<=, 1); // dim() -> table with every size, dim(pos) -> size at position pos
+  int pos;
+  const int *d=obj->getDimPtr();
+  LUABIND_GET_OPTIONAL_PARAMETER(1, int, pos, -1);
+  if (pos > obj->getNumDim()) LUABIND_FERROR2("wrong dimension %d of %d",pos,obj->getNumDim());
+  if (pos < 1) { // no position (or a non-positive one): return all getNumDim() sizes
+    LUABIND_VECTOR_TO_NEW_TABLE(int, d, obj->getNumDim());
+    LUABIND_RETURN_FROM_STACK(-1);
+  }
+  else LUABIND_RETURN(int, d[pos-1]); // pos was range-checked above, so d[pos-1] is in bounds
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool stride
+{
+  LUABIND_CHECK_ARGN(<=, 1); // stride() -> table with every stride, stride(pos) -> stride at position pos
+  int pos;
+  const int *s=obj->getStridePtr();
+  LUABIND_GET_OPTIONAL_PARAMETER(1, int, pos, -1);
+  if (pos > obj->getNumDim()) LUABIND_FERROR2("wrong dimension %d of %d",pos,obj->getNumDim());
+  if (pos < 1) { // no position (or a non-positive one): return all getNumDim() strides
+    LUABIND_VECTOR_TO_NEW_TABLE(int, s, obj->getNumDim());
+    LUABIND_RETURN_FROM_STACK(-1);
+  }
+  else LUABIND_RETURN(int, s[pos-1]); // pos was range-checked above, so s[pos-1] is in bounds
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool slice
+{
+  // slice(coords, sizes [, clone]): both tables need one entry per dimension;
+  // the result comes from the MatrixBool(obj, coords, sizes, clone) constructor.
+  LUABIND_CHECK_ARGN(>=,2);
+  LUABIND_CHECK_ARGN(<=,3);
+  LUABIND_CHECK_PARAMETER(1, table);
+  LUABIND_CHECK_PARAMETER(2, table);
+  int num_coords, num_sizes;
+  LUABIND_TABLE_GETN(1, num_coords);
+  LUABIND_TABLE_GETN(2, num_sizes);
+  if (num_coords != num_sizes || num_coords != obj->getNumDim())
+    LUABIND_FERROR3("Incorrect number of dimensions, expected %d, "
+                    "found %d and %d\n", obj->getNumDim(), num_coords, num_sizes);
+  int *first = new int[num_coords];
+  int *extent = new int[num_sizes];
+  LUABIND_TABLE_TO_VECTOR_SUB1(1, int, first, num_coords);
+  LUABIND_TABLE_TO_VECTOR(2, int, extent, num_sizes);
+  for (int d=0; d<num_sizes; ++d)
+    if (first[d] < 0 || extent[d] < 1 || extent[d]+first[d] > obj->getDimSize(d))
+      LUABIND_FERROR1("Incorrect size or coord at position %d\n", d+1);
+  bool do_clone;
+  LUABIND_GET_OPTIONAL_PARAMETER(3, bool, do_clone, false);
+  MatrixBool *sliced = new MatrixBool(obj, first, extent, do_clone);
+  LUABIND_RETURN(MatrixBool, sliced);
+  delete[] first;
+  delete[] extent;
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool select
+{
+  LUABIND_CHECK_ARGN(>=,2);
+  LUABIND_CHECK_ARGN(<=,3);
+  LUABIND_CHECK_PARAMETER(1, int);
+  LUABIND_CHECK_PARAMETER(2, int);
+  int dim, index; // arguments 1 and 2
+  MatrixBool *dest; // optional argument 3, set to 0 when it is not given
+  LUABIND_GET_PARAMETER(1, int, dim);
+  LUABIND_GET_PARAMETER(2, int, index);
+  LUABIND_GET_OPTIONAL_PARAMETER(3, MatrixBool, dest, 0);
+  MatrixBool *obj2 = obj->select(dim-1, index-1, dest); // select receives dim and index shifted by -1
+  LUABIND_RETURN(MatrixBool, obj2);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool clone
+//DOC_BEGIN
+// matrix *clone()
+/// Returns a <em>clone</em> of the matrix.
+//DOC_END
+{
+  MatrixBool *obj2 = obj->clone();
+  LUABIND_RETURN(MatrixBool,obj2);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool transpose
+{
+  // Without arguments: obj->transpose(). Otherwise arguments 1 and 2 are
+  // read as ints and handed to transpose shifted by -1.
+  if (lua_gettop(L) != 0) {
+    int d1,d2;
+    LUABIND_GET_PARAMETER(1, int, d1);
+    LUABIND_GET_PARAMETER(2, int, d2);
+    LUABIND_RETURN(MatrixBool, obj->transpose(d1-1, d2-1));
+  }
+  else {
+    LUABIND_RETURN(MatrixBool, obj->transpose());
+  }
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool diag
+{
+  LUABIND_CHECK_ARGN(==,1);
+  bool v; // the single boolean argument, forwarded to matDiag
+  LUABIND_GET_PARAMETER(1, boolean, v);
+  LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
+                 matDiag(obj, v)); // returns the MatrixBool given back by matDiag
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool toTable
+// Dumps the matrix into a flat Lua table (positions 1..size, in iterator order)
+// TODO: take the matrix dimensions into account
+  {
+    LUABIND_CHECK_ARGN(==, 0);
+    lua_createtable(L, obj->size(), 0);
+    int index = 1;
+    for (MatrixBool::iterator it(obj->begin()); it != obj->end(); ++it) {
+      lua_pushboolean(L, *it);
+      lua_rawseti(L, -2, index++);
+    }
+    LUABIND_RETURN_FROM_STACK(-1);
+  }
+//BIND_END
+
+//BIND_METHOD MatrixBool sliding_window
+{
+  // sliding_window([params]): params may carry the optional per-dimension
+  // tables offset, size, step, numSteps and orderStep; a missing table is
+  // forwarded to the SlidingWindowMatrixBool constructor as a null pointer.
+  int *win_size=0, *win_offset=0, *win_step=0, *win_nsteps=0, *win_order=0;
+  const int argn = lua_gettop(L); // number of arguments
+  const int ndim = obj->getNumDim();
+  if (argn > 1)
+    LUABIND_ERROR("incorrect number of arguments");
+  if (argn == 1) {
+    LUABIND_CHECK_PARAMETER(1, table);
+    check_table_fields(L, 1,
+                       "offset",
+                       "size",
+                       "step",
+                       "numSteps",
+                       "orderStep",
+                       (const char*)0);
+    win_offset = read_vector(L, "offset", ndim, 0);
+    win_size = read_vector(L, "size", ndim, 0);
+    win_step = read_vector(L, "step", ndim, 0);
+    win_nsteps = read_vector(L, "numSteps", ndim, 0);
+    // orderStep entries are shifted by -1 while they are read
+    win_order = read_vector(L, "orderStep", ndim, -1);
+  }
+  SlidingWindowMatrixBool *window =
+    new SlidingWindowMatrixBool(obj, win_size, win_offset, win_step,
+                                win_nsteps, win_order);
+  LUABIND_RETURN(SlidingWindowMatrixBool, window);
+  delete[] win_size;
+  delete[] win_offset;
+  delete[] win_step;
+  delete[] win_nsteps;
+  delete[] win_order;
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool is_contiguous
+{
+  LUABIND_RETURN(bool, obj->getIsContiguous()); // value of getIsContiguous() as a boolean
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool complement
+{
+  // In-place logical negation of every element; returns the matrix itself.
+  MatrixBool::iterator it(obj->begin());
+  for (; it != obj->end(); ++it) {
+    *it = !(*it);
+  }
+  LUABIND_RETURN(MatrixBool, obj);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool to_float
+{
+  // Builds a MatrixFloat with the same dimensions that holds 1.0f where the
+  // source element is true and 0.0f elsewhere.
+  MatrixFloat *as_float = new MatrixFloat(obj->getNumDim(), obj->getDimPtr());
+  MatrixBool::const_iterator src(obj->begin());
+  MatrixFloat::iterator dst(as_float->begin());
+  for (; src != obj->end(); ++src, ++dst) {
+    if (*src) *dst = 1.0f;
+    else *dst = 0.0f;
+  }
+  LUABIND_RETURN(MatrixFloat, as_float);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool copy
+{
+  // copy(other): takes exactly one MatrixBool and returns matCopy(obj, other)
+  LUABIND_CHECK_ARGN(==, 1);
+  MatrixBool *mat;
+  LUABIND_GET_PARAMETER(1, MatrixBool, mat);
+  LUABIND_RETURN(MatrixBool, AprilMath::MatrixExt::Operations::
+                 matCopy(obj, mat));
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool count_ones
+{
+  // Counts the elements whose value is true.
+  int num_true=0;
+  MatrixBool::const_iterator it(obj->begin());
+  for (; it != obj->end(); ++it)
+    num_true += (*it) ? 1 : 0;
+  LUABIND_RETURN(int, num_true);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool count_zeros
+{
+  // Counts the elements whose value is false.
+  int num_false=0;
+  MatrixBool::const_iterator it(obj->begin());
+  for (; it != obj->end(); ++it)
+    num_false += (*it) ? 0 : 1;
+  LUABIND_RETURN(int, num_false);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool any
+{
+  // true when at least one element is true; the traversal stops at the first
+  // true element. Starts from false, so nothing traversed means false.
+  bool found = false;
+  for (MatrixBool::const_iterator it(obj->begin()); it != obj->end() && !found; ++it)
+    found = *it;
+  LUABIND_RETURN(boolean, found);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool all
+{
+  // true when every element is true; the traversal stops at the first false
+  // element. Starts from true, so nothing traversed means true.
+  bool holds = true;
+  for (MatrixBool::const_iterator it(obj->begin()); it != obj->end() && holds; ++it)
+    holds = *it;
+  LUABIND_RETURN(boolean, holds);
+}
+//BIND_END
+
+//BIND_METHOD MatrixBool map
+{
+  int argn;
+  int N;
+  argn = lua_gettop(L); // number of arguments: N matrices followed by the function
+  N = argn-1;
+  MatrixBool **v = 0;
+  MatrixBool::const_iterator *list_it = 0;
+  if (N > 0) {
+    v = new MatrixBool*[N];
+    list_it = new MatrixBool::const_iterator[N];
+  }
+  for (int i=0; i<N; ++i) {
+    LUABIND_CHECK_PARAMETER(i+1, MatrixBool);
+    LUABIND_GET_PARAMETER(i+1, MatrixBool, v[i]);
+    if (!v[i]->sameDim(obj))
+      LUABIND_ERROR("The given matrices must have the same dimension sizes\n");
+    list_it[i] = v[i]->begin();
+  }
+  LUABIND_CHECK_PARAMETER(argn, function);
+  for (MatrixBool::iterator it(obj->begin()); it!=obj->end(); ++it) {
+    // copy the Lua function, lua_call will pop this copy
+    lua_pushvalue(L, argn);
+    // push the self matrix value
+    lua_pushboolean(L, *it);
+    // push the value of the rest of given matrices
+    for (int j=0; j<N; ++j) {
+      lua_pushboolean(L, *list_it[j]);
+      ++list_it[j];
+    }
+    // call the function with N+1 boolean arguments, expecting one result
+    lua_call(L, N+1, 1);
+    // read the result: nil keeps the element, a boolean replaces it
+    if (!lua_isnil(L, -1)) {
+      if (!lua_isboolean(L, -1))
+        LUABIND_ERROR("Incorrect returned value type, expected NIL or BOOLEAN\n");
+      *it = lua_toboolean(L, -1);
+    }
+    lua_pop(L, 1);
+  }
+  delete[] v;
+  delete[] list_it;
+  LUABIND_RETURN(MatrixBool, obj);
+}
+//BIND_END
+
+//// MATRIX SERIALIZATION ////
+
+//BIND_CLASS_METHOD MatrixBool read
+{
+  MAKE_READ_MATRIX_LUA_METHOD(MatrixBool, bool); // macro body is not visible here; instantiated for MatrixBool/bool
+  LUABIND_INCREASE_NUM_RETURNS(1); // presumably accounts for one value left on the stack by the macro - TODO confirm
+}
+//BIND_END
+
+//////////////////////////////////////////////////////////////////////
+
diff --git a/packages/basics/matrix/binding/bind_matrix_char.lua.cc b/packages/basics/matrix/binding/bind_matrix_char.lua.cc
index f7e127cde..a9e1d0b9c 100644
--- a/packages/basics/matrix/binding/bind_matrix_char.lua.cc
+++ b/packages/basics/matrix/binding/bind_matrix_char.lua.cc
@@ -24,6 +24,23 @@
 #include "luabindutil.h"
 #include "luabindmacros.h"
 
+namespace AprilUtils { // LuaTable specializations for Basics::MatrixChar pointers
+  template<> Basics::MatrixChar *LuaTable::
+  convertTo<Basics::MatrixChar *>(lua_State *L, int idx) {
+    return lua_toMatrixChar(L, idx); // value at stack index idx, as converted by lua_toMatrixChar
+  }
+  // pushInto: pushes `value` with lua_pushMatrixChar
+  template<> void LuaTable::
+  pushInto<Basics::MatrixChar *>(lua_State *L, Basics::MatrixChar *value) {
+    lua_pushMatrixChar(L, value);
+  }
+  // checkType: result of lua_isMatrixChar for the value at stack index idx
+  template<> bool LuaTable::
+  checkType<Basics::MatrixChar *>(lua_State *L, int idx) {
+    return lua_isMatrixChar(L, idx);
+  }
+}
+
 namespace Basics {
 #define FUNCTION_NAME "read_vector"
   static int *read_vector(lua_State *L, const char *key, int num_dim, int add) {
@@ -471,28 +488,24 @@ typedef MatrixChar::sliding_window SlidingWindowMatrixChar;
 /// Devuelve un <em>clon</em> de la matriz.
 //DOC_END
 {
-  LUABIND_CHECK_ARGN(>=, 0);
-  LUABIND_CHECK_ARGN(<=, 1);
-  int argn;
-  argn = lua_gettop(L); // number of arguments
-  MatrixChar *obj2;
-  if (argn == 0) obj2 = obj->clone();
-  else {
-    const char *major;
-    LUABIND_GET_OPTIONAL_PARAMETER(1, string, major, "row_major");
-    CBLAS_ORDER order=CblasRowMajor;
-    if (strcmp(major, "col_major") == 0) order = CblasColMajor;
-    else if (strcmp(major, "row_major") != 0)
-      LUABIND_FERROR1("Incorrect major order char %s", major);
-    obj2 = obj->clone(order);
-  }
+  MatrixChar *obj2 = obj->clone();
   LUABIND_RETURN(MatrixChar,obj2);
 }
 //BIND_END
 
 //BIND_METHOD MatrixChar transpose
 {
-  LUABIND_RETURN(MatrixChar, obj->transpose());
+  int argn;
+  argn = lua_gettop(L);
+  if (argn == 0) {
+    LUABIND_RETURN(MatrixChar, obj->transpose());
+  }
+  else {
+    int d1,d2;
+    LUABIND_GET_PARAMETER(1, int, d1);
+    LUABIND_GET_PARAMETER(2, int, d2);
+    LUABIND_RETURN(MatrixChar, obj->transpose(d1-1, d2-1));
+  }
 }
 //BIND_END
 
diff --git a/packages/basics/matrix/binding/bind_matrix_complex_float.lua.cc b/packages/basics/matrix/binding/bind_matrix_complex_float.lua.cc
index 7575d06a6..392985934 100644
--- a/packages/basics/matrix/binding/bind_matrix_complex_float.lua.cc
+++ b/packages/basics/matrix/binding/bind_matrix_complex_float.lua.cc
@@ -27,6 +27,23 @@
 #include "luabindmacros.h"
 #include "bind_complex.h"
 
+namespace AprilUtils { // LuaTable specializations for Basics::MatrixComplexF pointers
+  template<> Basics::MatrixComplexF *LuaTable::
+  convertTo<Basics::MatrixComplexF *>(lua_State *L, int idx) {
+    return lua_toMatrixComplexF(L, idx); // value at stack index idx, as converted by lua_toMatrixComplexF
+  }
+  // pushInto: pushes `value` with lua_pushMatrixComplexF
+  template<> void LuaTable::
+  pushInto<Basics::MatrixComplexF *>(lua_State *L, Basics::MatrixComplexF *value) {
+    lua_pushMatrixComplexF(L, value);
+  }
+  // checkType: result of lua_isMatrixComplexF for the value at stack index idx
+  template<> bool LuaTable::
+  checkType<Basics::MatrixComplexF *>(lua_State *L, int idx) {
+    return lua_isMatrixComplexF(L, idx);
+  }
+}
+
 namespace Basics {
 #define FUNCTION_NAME "read_vector"
   static int *read_vector(lua_State *L, const char *key, int num_dim, int add) {
@@ -199,57 +216,6 @@ typedef MatrixComplexF::sliding_window SlidingWindowComplexF;
 }
 //BIND_END
 
-//BIND_CLASS_METHOD MatrixComplexF col_major
-//DOC_BEGIN
-// col_major_matrix(int dim1, int dim2, ..., table mat=nil)
-/// Constructor con una secuencia de valores que son las dimensiones de
-/// la matriz el ultimo argumento puede ser una tabla, en cuyo caso
-/// contiene los valores adecuadamente serializados, si solamente
-/// aparece la matriz, se trata de un vector cuya longitud viene dada
-/// implicitamente.
-//DOC_END
-{
-  int i,argn;
-  argn = lua_gettop(L); // number of arguments
-  LUABIND_CHECK_ARGN(>=, 1);
-  int ndims = (!lua_isnumber(L,argn)) ? argn-1 : argn;
-  int *dim;
-  if (ndims == 0) { // caso matrix{valores}
-    ndims = 1;
-    dim = new int[ndims];
-    LUABIND_TABLE_GETN(1, dim[0]);
-  } else {
-    dim = new int[ndims];
-    for (i=1; i <= ndims; i++) {
-      if (!lua_isnumber(L,i))
-	// TODO: Este mensaje de error parece que no es correcto... y no se todavia por que!!!
-	LUABIND_FERROR2("incorrect argument to matrix dimension (arg %d must"
-			" be a number and is a %s)",
-			i, lua_typename(L,i));
-      dim[i-1] = (int)lua_tonumber(L,i);
-      if (dim[i-1] <= 0)
-	LUABIND_FERROR1("incorrect argument to matrix dimension (arg %d must be >0)",i);
-    }
-  }
-  MatrixComplexF* obj;
-  obj = new MatrixComplexF(ndims,dim,CblasColMajor);
-  if (lua_istable(L,argn)) {
-    int len;
-    LUABIND_TABLE_GETN(argn, len);
-    if (len != obj->size())
-      LUABIND_FERROR2("Incorrect number of elements at the given table, "
-		      "found %d, expected %d", len, obj->size());
-    int i=1;
-    for (MatrixComplexF::iterator it(obj->begin()); it != obj->end(); ++it,++i) {
-      lua_rawgeti(L,argn,i);
-      *it = lua_toComplexF(L, -1);
-    }
-  }
-  delete[] dim;
-  LUABIND_RETURN(MatrixComplexF,obj);
-}
-//BIND_END
-
 //BIND_METHOD MatrixComplexF size
 {
   LUABIND_RETURN(int, obj->size());
@@ -273,6 +239,12 @@ typedef MatrixComplexF::sliding_window SlidingWindowComplexF;
 }
 //BIND_END
 
+//BIND_METHOD MatrixComplexF squeeze
+{
+  LUABIND_RETURN(MatrixComplexF,obj->squeeze()); // returns the matrix produced by squeeze()
+}
+//BIND_END
+
 //BIND_METHOD MatrixComplexF get_reference_string
 {
   char buff[128];
@@ -492,14 +464,6 @@ typedef MatrixComplexF::sliding_window SlidingWindowComplexF;
 }
 //BIND_END
 
-//BIND_METHOD MatrixComplexF get_major_order
-{
-  if (obj->getMajorOrder() == CblasRowMajor)
-    LUABIND_RETURN(string, "row_major");
-  else LUABIND_RETURN(string, "col_major");
-}
-//BIND_END
-
 //BIND_METHOD MatrixComplexF dim
 {
   LUABIND_CHECK_ARGN(>=, 0);
@@ -582,28 +546,24 @@ typedef MatrixComplexF::sliding_window SlidingWindowComplexF;
 /// Devuelve un <em>clon</em> de la matriz.
 //DOC_END
 {
-  LUABIND_CHECK_ARGN(>=, 0);
-  LUABIND_CHECK_ARGN(<=, 1);
-  int argn;
-  argn = lua_gettop(L); // number of arguments
-  MatrixComplexF *obj2;
-  if (argn == 0) obj2 = obj->clone();
-  else {
-    const char *major;
-    LUABIND_GET_OPTIONAL_PARAMETER(1, string, major, "row_major");
-    CBLAS_ORDER order=CblasRowMajor;
-    if (strcmp(major, "col_major") == 0) order = CblasColMajor;
-    else if (strcmp(major, "row_major") != 0)
-      LUABIND_FERROR1("Incorrect major order string %s", major);
-    obj2 = obj->clone(order);
-  }
+  MatrixComplexF *obj2 = obj->clone();
   LUABIND_RETURN(MatrixComplexF,obj2);
 }
 //BIND_END
 
 //BIND_METHOD MatrixComplexF transpose
 {
-  LUABIND_RETURN(MatrixComplexF, obj->transpose());
+  int argn;
+  argn = lua_gettop(L);
+  if (argn == 0) {
+    LUABIND_RETURN(MatrixComplexF, obj->transpose());
+  }
+  else {
+    int d1,d2;
+    LUABIND_GET_PARAMETER(1, int, d1);
+    LUABIND_GET_PARAMETER(2, int, d2);
+    LUABIND_RETURN(MatrixComplexF, obj->transpose(d1-1, d2-1));
+  }
 }
 //BIND_END
 
@@ -649,6 +609,52 @@ typedef MatrixComplexF::sliding_window SlidingWindowComplexF;
   }
 //BIND_END
 
+//BIND_METHOD MatrixComplexF map
+{
+  int argn;
+  int N;
+  argn = lua_gettop(L); // number of arguments: N matrices followed by the function
+  N = argn-1;
+  MatrixComplexF **v = 0;
+  MatrixComplexF::const_iterator *list_it = 0;
+  if (N > 0) {
+    v = new MatrixComplexF*[N];
+    list_it = new MatrixComplexF::const_iterator[N];
+  }
+  for (int i=0; i<N; ++i) {
+    LUABIND_CHECK_PARAMETER(i+1, MatrixComplexF);
+    LUABIND_GET_PARAMETER(i+1, MatrixComplexF, v[i]);
+    if (!v[i]->sameDim(obj))
+      LUABIND_ERROR("The given matrices must have the same dimension sizes\n");
+    list_it[i] = v[i]->begin();
+  }
+  LUABIND_CHECK_PARAMETER(argn, function);
+  for (MatrixComplexF::iterator it(obj->begin()); it!=obj->end(); ++it) {
+    // copy the Lua function, lua_call will pop this copy
+    lua_pushvalue(L, argn);
+    // push the self matrix value
+    lua_pushComplexF(L, *it);
+    // push the value of the rest of given matrices
+    for (int j=0; j<N; ++j) {
+      lua_pushComplexF(L, *list_it[j]);
+      ++list_it[j];
+    }
+    // call the function with N+1 complex arguments, expecting one result
+    lua_call(L, N+1, 1);
+    // read the result: nil keeps the element, a complex value replaces it
+    if (!lua_isnil(L, -1)) {
+      if (!lua_isComplexF(L, -1))
+	LUABIND_ERROR("Incorrect returned value type, expected NIL or COMPLEX\n");
+      *it = lua_toComplexF(L, -1);
+    }
+    lua_pop(L, 1);
+  }
+  delete[] v;
+  delete[] list_it;
+  LUABIND_RETURN(MatrixComplexF, obj);
+}
+//BIND_END
+
 //BIND_METHOD MatrixComplexF equals
 {
   MatrixComplexF *other;
@@ -860,16 +866,10 @@ typedef MatrixComplexF::sliding_window SlidingWindowComplexF;
     LUABIND_ERROR("First argument must be <= second argument");
   if (random == 0) random = new MTRand();
   IncRef(random);
-  if (obj->getMajorOrder() == CblasRowMajor)
-    for (MatrixComplexF::iterator it(obj->begin()); it != obj->end(); ++it) {
-      *it = ComplexF(static_cast<float>(random->randInt(upper - lower) + lower),
-		     0.0f);
-    }
-  else
-    for (MatrixComplexF::col_major_iterator it(obj->begin());it!=obj->end();++it) {
-      *it = ComplexF(static_cast<float>(random->randInt(upper - lower) + lower),
-		     0.0f);
-    }
+  for (MatrixComplexF::iterator it(obj->begin()); it != obj->end(); ++it) {
+    *it = ComplexF(static_cast<float>(random->randInt(upper - lower) + lower),
+                   0.0f);
+  }
   DecRef(random);
   LUABIND_RETURN(MatrixComplexF, obj);
 }
diff --git a/packages/basics/matrix/binding/bind_matrix_double.lua.cc b/packages/basics/matrix/binding/bind_matrix_double.lua.cc
index 0b77f9cad..afb64ea1c 100644
--- a/packages/basics/matrix/binding/bind_matrix_double.lua.cc
+++ b/packages/basics/matrix/binding/bind_matrix_double.lua.cc
@@ -24,6 +24,23 @@
 #include "luabindutil.h"
 #include "luabindmacros.h"
 
+namespace AprilUtils { // LuaTable specializations for Basics::MatrixDouble pointers
+  template<> Basics::MatrixDouble *LuaTable::
+  convertTo<Basics::MatrixDouble *>(lua_State *L, int idx) {
+    return lua_toMatrixDouble(L, idx); // value at stack index idx, as converted by lua_toMatrixDouble
+  }
+  // pushInto: pushes `value` with lua_pushMatrixDouble
+  template<> void LuaTable::
+  pushInto<Basics::MatrixDouble *>(lua_State *L, Basics::MatrixDouble *value) {
+    lua_pushMatrixDouble(L, value);
+  }
+  // checkType: result of lua_isMatrixDouble for the value at stack index idx
+  template<> bool LuaTable::
+  checkType<Basics::MatrixDouble *>(lua_State *L, int idx) {
+    return lua_isMatrixDouble(L, idx);
+  }
+}
+
 namespace Basics {
 #define FUNCTION_NAME "read_vector"
   static int *read_vector(lua_State *L, const char *key, int num_dim, int add) {
@@ -199,6 +216,12 @@ typedef MatrixDouble::sliding_window SlidingWindowMatrixDouble;
 }
 //BIND_END
 
+//BIND_METHOD MatrixDouble squeeze
+{
+  LUABIND_RETURN(MatrixDouble,obj->squeeze()); // returns the matrix produced by squeeze()
+}
+//BIND_END
+
 //BIND_METHOD MatrixDouble get_reference_string
 {
   char buff[128];
@@ -477,28 +500,24 @@ typedef MatrixDouble::sliding_window SlidingWindowMatrixDouble;
 /// Devuelve un <em>clon</em> de la matriz.
 //DOC_END
 {
-  LUABIND_CHECK_ARGN(>=, 0);
-  LUABIND_CHECK_ARGN(<=, 1);
-  int argn;
-  argn = lua_gettop(L); // number of arguments
-  MatrixDouble *obj2;
-  if (argn == 0) obj2 = obj->clone();
-  else {
-    const char *major;
-    LUABIND_GET_OPTIONAL_PARAMETER(1, string, major, "row_major");
-    CBLAS_ORDER order=CblasRowMajor;
-    if (strcmp(major, "col_major") == 0) order = CblasColMajor;
-    else if (strcmp(major, "row_major") != 0)
-      LUABIND_FERROR1("Incorrect major order char %s", major);
-    obj2 = obj->clone(order);
-  }
+  MatrixDouble *obj2 = obj->clone();
   LUABIND_RETURN(MatrixDouble,obj2);
 }
 //BIND_END
 
 //BIND_METHOD MatrixDouble transpose
 {
-  LUABIND_RETURN(MatrixDouble, obj->transpose());
+  int argn;
+  argn = lua_gettop(L);
+  if (argn == 0) {
+    LUABIND_RETURN(MatrixDouble, obj->transpose());
+  }
+  else {
+    int d1,d2;
+    LUABIND_GET_PARAMETER(1, int, d1);
+    LUABIND_GET_PARAMETER(2, int, d2);
+    LUABIND_RETURN(MatrixDouble, obj->transpose(d1-1, d2-1));
+  }
 }
 //BIND_END
 
@@ -527,6 +546,52 @@ typedef MatrixDouble::sliding_window SlidingWindowMatrixDouble;
   }
 //BIND_END
 
+//BIND_METHOD MatrixDouble map
+{
+  // Arguments: [m1, m2, ...,] func. For every position of obj, func receives
+  // the value of obj followed by the values of m1, m2, ...; a non-nil result
+  // is stored back into obj. The (modified) obj itself is returned.
+  int argn, N;
+  MatrixDouble::const_iterator *list_it = 0;
+  LUABIND_CHECK_ARGN(>=, 1); // with no arguments stack index 0 would be read
+  argn = lua_gettop(L); // number of arguments
+  N = argn-1;           // number of extra matrices
+  // validate everything BEFORE allocating, so a failed check cannot leak
+  LUABIND_CHECK_PARAMETER(argn, function);
+  for (int i=0; i<N; ++i) {
+    LUABIND_CHECK_PARAMETER(i+1, MatrixDouble);
+    if (!lua_toMatrixDouble(L, i+1)->sameDim(obj))
+      LUABIND_ERROR("The given matrices must have the same dimension sizes\n");
+  }
+  if (N > 0) list_it = new MatrixDouble::const_iterator[N];
+  for (int i=0; i<N; ++i) list_it[i] = lua_toMatrixDouble(L, i+1)->begin();
+  for (MatrixDouble::iterator it(obj->begin()); it!=obj->end(); ++it) {
+    // copy the Lua function, lua_call will pop this copy
+    lua_pushvalue(L, argn);
+    // push the self matrix value
+    lua_pushdouble(L, *it);
+    // push the value of the rest of given matrices
+    for (int j=0; j<N; ++j) {
+      lua_pushdouble(L, *list_it[j]);
+      ++list_it[j];
+    }
+    // NOTE(review): an error raised inside the callback still skips the cleanup
+    lua_call(L, N+1, 1);
+    // inspect the single result; nil leaves the current value untouched
+    if (!lua_isnil(L, -1)) {
+      if (!lua_isdouble(L, -1)) {
+        delete[] list_it; // release before the error leaves this function
+        LUABIND_ERROR("Incorrect returned value type, expected NIL or DOUBLE\n");
+      }
+      *it = lua_todouble(L, -1);
+    }
+    lua_pop(L, 1);
+  }
+  delete[] list_it;
+  LUABIND_RETURN(MatrixDouble, obj);
+}
+//BIND_END
+
 //BIND_METHOD MatrixDouble sliding_window
 {
   int *sub_matrix_size=0, *offset=0, *step=0, *num_steps=0, *order_step=0;
@@ -573,10 +638,7 @@ typedef MatrixDouble::sliding_window SlidingWindowMatrixDouble;
 
 //BIND_METHOD MatrixDouble to_float
 {
-  bool col_major;
-  LUABIND_GET_OPTIONAL_PARAMETER(1, bool, col_major, false);
-  LUABIND_RETURN(MatrixFloat,
-		 convertFromMatrixDoubleToMatrixFloat(obj, col_major));
+  LUABIND_RETURN(MatrixFloat, convertFromMatrixDoubleToMatrixFloat(obj));
 }
 //BIND_END
 
diff --git a/packages/basics/matrix/binding/bind_matrix_int32.lua.cc b/packages/basics/matrix/binding/bind_matrix_int32.lua.cc
index 949e052b8..9fe7ead7d 100644
--- a/packages/basics/matrix/binding/bind_matrix_int32.lua.cc
+++ b/packages/basics/matrix/binding/bind_matrix_int32.lua.cc
@@ -20,10 +20,28 @@
  */
 //BIND_HEADER_C
 #include "bind_matrix.h"
+#include "bind_mtrand.h"
 #include "utilMatrixInt32.h"
 #include "luabindutil.h"
 #include "luabindmacros.h"
 
+namespace AprilUtils { // LuaTable specializations for Basics::MatrixInt32 pointers
+  template<> Basics::MatrixInt32 *LuaTable::
+  convertTo<Basics::MatrixInt32 *>(lua_State *L, int idx) {
+    return lua_toMatrixInt32(L, idx); // read stack slot idx as a MatrixInt32
+  }
+  // pushInto: places the given MatrixInt32 on the Lua stack of L
+  template<> void LuaTable::
+  pushInto<Basics::MatrixInt32 *>(lua_State *L, Basics::MatrixInt32 *value) {
+    lua_pushMatrixInt32(L, value);
+  }
+
+  template<> bool LuaTable::
+  checkType<Basics::MatrixInt32 *>(lua_State *L, int idx) {
+    return lua_isMatrixInt32(L, idx); // true when slot idx holds a MatrixInt32
+  }
+}
+
 namespace Basics {
 
 #define FUNCTION_NAME "read_vector"
@@ -207,6 +225,12 @@ typedef MatrixInt32::sliding_window SlidingWindowMatrixInt32;
 }
 //BIND_END
 
+//BIND_METHOD MatrixInt32 squeeze
+{
+  LUABIND_RETURN(MatrixInt32,obj->squeeze()); // takes no arguments; returns the result of obj->squeeze()
+}
+//BIND_END
+
 //BIND_METHOD MatrixInt32 get_reference_string
 {
   char buff[128];
@@ -485,28 +509,24 @@ typedef MatrixInt32::sliding_window SlidingWindowMatrixInt32;
 /// Devuelve un <em>clon</em> de la matriz.
 //DOC_END
 {
-  LUABIND_CHECK_ARGN(>=, 0);
-  LUABIND_CHECK_ARGN(<=, 1);
-  int argn;
-  argn = lua_gettop(L); // number of arguments
-  MatrixInt32 *obj2;
-  if (argn == 0) obj2 = obj->clone();
-  else {
-    const char *major;
-    LUABIND_GET_OPTIONAL_PARAMETER(1, string, major, "row_major");
-    CBLAS_ORDER order=CblasRowMajor;
-    if (strcmp(major, "col_major") == 0) order = CblasColMajor;
-    else if (strcmp(major, "row_major") != 0)
-      LUABIND_FERROR1("Incorrect major order char %s", major);
-    obj2 = obj->clone(order);
-  }
+  MatrixInt32 *obj2 = obj->clone();
   LUABIND_RETURN(MatrixInt32,obj2);
 }
 //BIND_END
 
 //BIND_METHOD MatrixInt32 transpose
 {
-  LUABIND_RETURN(MatrixInt32, obj->transpose());
+  int argn;
+  argn = lua_gettop(L); // number of arguments received
+  if (argn == 0) { // no arguments: argument-less transpose()
+    LUABIND_RETURN(MatrixInt32, obj->transpose());
+  }
+  else { // otherwise arguments 1 and 2 are both read as ints
+    int d1,d2; // the two dimension indices handed to transpose(d1-1, d2-1)
+    LUABIND_GET_PARAMETER(1, int, d1);
+    LUABIND_GET_PARAMETER(2, int, d2);
+    LUABIND_RETURN(MatrixInt32, obj->transpose(d1-1, d2-1)); // presumably 1-based (Lua) to 0-based; TODO confirm
+  }
 }
 //BIND_END
 
@@ -535,6 +555,52 @@ typedef MatrixInt32::sliding_window SlidingWindowMatrixInt32;
   }
 //BIND_END
 
+//BIND_METHOD MatrixInt32 map
+{
+  // Arguments: [m1, m2, ...,] func. For every position of obj, func receives
+  // the value of obj followed by the values of m1, m2, ...; a non-nil result
+  // is stored back into obj. The (modified) obj itself is returned.
+  int argn, N;
+  MatrixInt32::const_iterator *list_it = 0;
+  LUABIND_CHECK_ARGN(>=, 1); // with no arguments stack index 0 would be read
+  argn = lua_gettop(L); // number of arguments
+  N = argn-1;           // number of extra matrices
+  // validate everything BEFORE allocating, so a failed check cannot leak
+  LUABIND_CHECK_PARAMETER(argn, function);
+  for (int i=0; i<N; ++i) {
+    LUABIND_CHECK_PARAMETER(i+1, MatrixInt32);
+    if (!lua_toMatrixInt32(L, i+1)->sameDim(obj))
+      LUABIND_ERROR("The given matrices must have the same dimension sizes\n");
+  }
+  if (N > 0) list_it = new MatrixInt32::const_iterator[N];
+  for (int i=0; i<N; ++i) list_it[i] = lua_toMatrixInt32(L, i+1)->begin();
+  for (MatrixInt32::iterator it(obj->begin()); it!=obj->end(); ++it) {
+    // copy the Lua function, lua_call will pop this copy
+    lua_pushvalue(L, argn);
+    // push the self matrix value
+    lua_pushint(L, *it);
+    // push the value of the rest of given matrices
+    for (int j=0; j<N; ++j) {
+      lua_pushint(L, *list_it[j]);
+      ++list_it[j];
+    }
+    // NOTE(review): an error raised inside the callback still skips the cleanup
+    lua_call(L, N+1, 1);
+    // inspect the single result; nil leaves the current value untouched
+    if (!lua_isnil(L, -1)) {
+      if (!lua_isint(L, -1)) {
+        delete[] list_it; // release before the error leaves this function
+        LUABIND_ERROR("Incorrect returned value type, expected NIL or INT\n");
+      }
+      *it = lua_toint(L, -1);
+    }
+    lua_pop(L, 1);
+  }
+  delete[] list_it;
+  LUABIND_RETURN(MatrixInt32, obj);
+}
+//BIND_END
+
 //BIND_METHOD MatrixInt32 sliding_window
 {
   int *sub_matrix_size=0, *offset=0, *step=0, *num_steps=0, *order_step=0;
@@ -581,10 +647,7 @@ typedef MatrixInt32::sliding_window SlidingWindowMatrixInt32;
 
 //BIND_METHOD MatrixInt32 to_float
 {
-  bool col_major;
-  LUABIND_GET_OPTIONAL_PARAMETER(1, bool, col_major, false);
-  LUABIND_RETURN(MatrixFloat,
-		 convertFromMatrixInt32ToMatrixFloat(obj, col_major));
+  LUABIND_RETURN(MatrixFloat, convertFromMatrixInt32ToMatrixFloat(obj));
 }
 //BIND_END
 
@@ -599,6 +662,27 @@ typedef MatrixInt32::sliding_window SlidingWindowMatrixInt32;
 }
 //BIND_END
 
+//BIND_METHOD MatrixInt32 uniform
+{
+  int lower, upper; // range bounds, read from arguments 1 and 2
+  MTRand *random;   // optional generator, read from argument 3
+  LUABIND_GET_PARAMETER(1, int, lower);
+  LUABIND_GET_PARAMETER(2, int, upper);
+  LUABIND_GET_OPTIONAL_PARAMETER(3, MTRand, random, 0); // 0 is the default given for a missing argument
+  // an inverted range is rejected before any generator is created
+  if (lower > upper) {
+    LUABIND_ERROR("First argument must be <= second argument");
+  }
+  if (random == 0) random = new MTRand(); // no generator given: create one for this call
+  IncRef(random); // paired with the DecRef after the loop
+  for (MatrixInt32::iterator it(obj->begin()); it != obj->end(); ++it) {
+    *it = random->randInt(upper - lower) + lower; // NOTE(review): assumes randInt(n) yields [0,n] — confirm; upper - lower can overflow int for extreme bounds
+  }
+  DecRef(random);
+  LUABIND_RETURN(MatrixInt32, obj); // obj itself, now overwritten, is the result
+}
+//BIND_END
+
 //// MATRIX SERIALIZATION ////
 
 //BIND_CLASS_METHOD MatrixInt32 read
diff --git a/packages/basics/matrix/binding/bind_sparse_matrix.lua.cc b/packages/basics/matrix/binding/bind_sparse_matrix.lua.cc
index d7e84db69..dd5981c48 100644
--- a/packages/basics/matrix/binding/bind_sparse_matrix.lua.cc
+++ b/packages/basics/matrix/binding/bind_sparse_matrix.lua.cc
@@ -29,6 +29,24 @@
 #include "luabindmacros.h" // for lua_pushfloat and lua_pushint
 #include "luabindutil.h"   // for lua_pushfloat and lua_pushint
 
+namespace AprilUtils { // LuaTable specializations for Basics::SparseMatrixFloat pointers
+  template<> Basics::SparseMatrixFloat *LuaTable::
+  convertTo<Basics::SparseMatrixFloat *>(lua_State *L, int idx) {
+    return lua_toSparseMatrixFloat(L, idx); // read stack slot idx as a SparseMatrixFloat
+  }
+  // pushInto: places the given SparseMatrixFloat on the Lua stack of L
+  template<> void LuaTable::
+  pushInto<Basics::SparseMatrixFloat *>(lua_State *L,
+                                        Basics::SparseMatrixFloat *value) {
+    lua_pushSparseMatrixFloat(L, value);
+  }
+
+  template<> bool LuaTable::
+  checkType<Basics::SparseMatrixFloat *>(lua_State *L, int idx) {
+    return lua_isSparseMatrixFloat(L, idx); // true when slot idx holds a SparseMatrixFloat
+  }
+}
+
 namespace Basics {
   int sparseMatrixFloatIteratorFunction(lua_State *L) {
     SparseMatrixFloatIterator *obj = lua_toSparseMatrixFloatIterator(L,1);
@@ -87,8 +105,8 @@ namespace Basics {
       luaL_error(L, "Needs a stream as 1st argument");
       return 0;
     }
-    AprilUtils::LuaTableOptions options(L,2);
-    return SparseMatrix<T>::read(ptr.get(), &options);
+    AprilUtils::LuaTable options(L,2);
+    return SparseMatrix<T>::read(ptr.get(), options);
   }
 
 } // namespace Basics
@@ -353,13 +371,7 @@ using namespace Basics;
 
 //BIND_METHOD SparseMatrixFloat to_dense
 {
-  const char *major;
-  LUABIND_GET_OPTIONAL_PARAMETER(1, string, major, "row_major");
-  CBLAS_ORDER order=CblasRowMajor;
-  if (strcmp(major, "col_major") == 0) order = CblasColMajor;
-  else if (strcmp(major, "row_major") != 0)
-    LUABIND_FERROR1("Incorrect major order string %s", major);
-  LUABIND_RETURN(MatrixFloat, obj->toDense(order));
+  LUABIND_RETURN(MatrixFloat, obj->toDense());
 }
 //BIND_END
 
diff --git a/packages/basics/matrix/c_src/matrix-conv.impl.h b/packages/basics/matrix/c_src/matrix-conv.impl.h
index 57e18d885..a73f38ffd 100644
--- a/packages/basics/matrix/c_src/matrix-conv.impl.h
+++ b/packages/basics/matrix/c_src/matrix-conv.impl.h
@@ -45,10 +45,6 @@ namespace AprilMath {
             aux_step[0] = aux_step[1] = 1;
             for (int i=0; i<D; ++i) aux_step[i+2] = step[i];
           }
-          if (mat->getMajorOrder() == CblasColMajor) {
-            order_step = new int[numDim];
-            for (int i=0; i<numDim; ++i) order_step[i] = i;
-          }
           switch(D+2 - numDim) {
           case 2: // numDim == D
             // Kx1xN1xN2x...xNd kernel :: M1xM2x...xMd matrix
@@ -116,7 +112,7 @@ namespace AprilMath {
                           mat_sw->numWindows()/bunch_size,
                           mat_slice->size() };
           Basics::Matrix<T> *unrolled_mat =
-            new Basics::Matrix<T>(3, dims,mat->getMajorOrder());
+            new Basics::Matrix<T>(3, dims);
           AprilUtils::UniquePtr<int []> aux_dims(new int[mat_slice->getNumDim()+2]);
           aux_dims[0] = dims[0];
           aux_dims[1] = dims[1];
@@ -129,10 +125,6 @@ namespace AprilMath {
           aux_dims[0] = 1;
           aux_dims[1] = 1;
           AprilUtils::UniquePtr<int []> order_step;
-          if (mat->getMajorOrder() == CblasColMajor) {
-            order_step = new int[mat_slice->getNumDim()+2];
-            for (int i=0; i<mat_slice->getNumDim()+2; ++i) order_step[i] = i;
-          }
           AprilUtils::SharedPtr< typename Basics::Matrix<T>::sliding_window >
             unrolled_sw( new typename Basics::Matrix<T>::
                          sliding_window(unrolled_mat_rewrapped.get(),
@@ -215,8 +207,7 @@ namespace AprilMath {
           }
           // allocate new result matrix if not given
           if (result == 0) {
-            result = new Basics::Matrix<T>(D+2, result_sizes.get(),
-                                           mat->getMajorOrder());
+            result = new Basics::Matrix<T>(D+2, result_sizes.get());
           }
           // check result matrix sizes (includes number of planes = number of kernels)
           else {
diff --git a/packages/basics/matrix/c_src/matrix-iterators.impl.h b/packages/basics/matrix/c_src/matrix-iterators.impl.h
index 2b4fc3728..b90a34ff4 100644
--- a/packages/basics/matrix/c_src/matrix-iterators.impl.h
+++ b/packages/basics/matrix/c_src/matrix-iterators.impl.h
@@ -31,7 +31,7 @@ namespace Basics {
 
   template <typename T>
   Matrix<T>::iterator::iterator(Matrix<T> *m) : m(m), idx(0), raw_pos(0) {
-    if (!m->getIsContiguous() || !m->getIsDataRowOrdered()) {
+    if (!m->getIsContiguous()) {
       coords = new int[m->getNumDim()];
       for (int i=0; i<m->getNumDim(); ++i) coords[i] = 0;
     }
@@ -43,7 +43,7 @@ namespace Basics {
   template <typename T>
   Matrix<T>::iterator::iterator(Matrix<T> *m, int raw_pos) :
     m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || !m->getIsDataRowOrdered()) {
+    if (!m->getIsContiguous()) {
       coords = new int[m->getNumDim()];
       m->computeCoords(raw_pos, coords);
     }
@@ -54,11 +54,11 @@ namespace Basics {
   template <typename T>
   Matrix<T>::iterator::iterator(Matrix<T> *m, int raw_pos, int *coords) :
     m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || !m->getIsDataRowOrdered()) {
+    if (!m->getIsContiguous()) {
       this->coords = new int[m->getNumDim()];
       for (int i=0; i<m->getNumDim(); ++i) this->coords[i] = coords[i];
     }
-    else coords = 0;
+    else this->coords = 0;
     data = m->getData();
   }
 
@@ -138,163 +138,11 @@ namespace Basics {
   }
 
   /*******************************************************************/
-
-  template <typename T>
-  Matrix<T>::col_major_iterator::col_major_iterator(Matrix<T> *m) :
-    m(m), idx(0), raw_pos(0) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      for (int i=0; i<m->getNumDim(); ++i) coords[i] = 0;
-    }
-    else coords = 0;
-    raw_pos = m->getOffset();
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::col_major_iterator::col_major_iterator(Matrix<T> *m, int raw_pos) :
-    m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      m->computeCoords(raw_pos, coords);
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::col_major_iterator::col_major_iterator(Matrix<T> *m, int raw_pos, int *coords) :
-    m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      for (int i=0; i<m->getNumDim(); ++i) this->coords[i] = coords[i];
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::col_major_iterator::col_major_iterator() :
-    m(0), idx(0), raw_pos(0), coords(0) { }
-
-  template <typename T>
-  Matrix<T>::col_major_iterator::col_major_iterator(const col_major_iterator &other) :
-    m(other.m),
-    idx(other.idx),
-    raw_pos(other.raw_pos) {
-    if (other.coords != 0) {
-      coords = new int[m->getNumDim()];
-      for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::col_major_iterator::col_major_iterator(const iterator &other) :
-    m(other.m),
-    idx(other.idx),
-    raw_pos(other.raw_pos) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      if (other.coords != 0)
-        for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-      else m->computeCoords(raw_pos, coords);
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::col_major_iterator::~col_major_iterator() {
-    delete[] coords;
-  }
-
-  template <typename T>
-  typename Matrix<T>::col_major_iterator &Matrix<T>::col_major_iterator::operator=(const Matrix<T>::col_major_iterator &other) {
-    m = other.m;
-    idx = other.idx;
-    raw_pos = other.raw_pos;
-    data = m->getData();
-    if (other.coords != 0) {
-      if (coords==0 || m->numDim != other.m->numDim) {
-        delete[] coords;
-        coords = new int[other.m->getNumDim()];
-      }
-      for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-    }
-    else {
-      delete[] coords;
-      coords = 0;
-    }
-    return *this;
-  }
-
-  template <typename T>
-  typename Matrix<T>::col_major_iterator &Matrix<T>::col_major_iterator::operator=(const Matrix<T>::iterator &other) {
-    m = other.m;
-    idx = other.idx;
-    idx = other.idx;
-    raw_pos = other.raw_pos;
-    data = m->getData();
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[other.m->getNumDim()];
-      if (other.coords != 0)
-        for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-      else m->computeCoords(raw_pos, coords);
-    }
-    return *this;
-  }
-
-  template <typename T>
-  bool Matrix<T>::col_major_iterator::operator==(const Matrix<T>::col_major_iterator &other) const {
-    return m==other.m && raw_pos == other.raw_pos;
-  }
-
-  template <typename T>
-  bool Matrix<T>::col_major_iterator::operator==(const Matrix<T>::iterator &other) const {
-    return m==other.m && raw_pos == other.raw_pos;
-  }
-
-  template <typename T>
-  bool Matrix<T>::col_major_iterator::operator!=(const Matrix<T>::col_major_iterator &other) const {
-    return !( (*this) == other );
-  }
-
-  template <typename T>
-  bool Matrix<T>::col_major_iterator::operator!=(const Matrix<T>::iterator &other) const {
-    return !( (*this) == other );
-  }
-
-  template <typename T>
-  typename Matrix<T>::col_major_iterator &Matrix<T>::col_major_iterator::operator++() {
-    ++idx;
-    if (coords != 0) m->nextCoordVectorColOrder(coords, raw_pos);
-    else ++raw_pos;
-    return *this;
-  }
-
-  template <typename T>
-  T &Matrix<T>::col_major_iterator::operator*() {
-    return data[raw_pos];
-  }
-
-  template <typename T>
-  T *Matrix<T>::col_major_iterator::operator->() {
-    return &data[raw_pos];
-  }
-
-  template <typename T>
-  int Matrix<T>::col_major_iterator::getRawPos() const {
-    return raw_pos;
-  }
-
-  /*******************************************************************/
-
+  
   template <typename T>
   Matrix<T>::const_iterator::const_iterator(const Matrix<T> *m) :
     m(m), idx(0), raw_pos(0) {
-    if (!m->getIsContiguous() || !m->getIsDataRowOrdered()) {
+    if (!m->getIsContiguous()) {
       coords = new int[m->getNumDim()];
       for (int i=0; i<m->getNumDim(); ++i) coords[i] = 0;
     }
@@ -306,7 +154,7 @@ namespace Basics {
   template <typename T>
   Matrix<T>::const_iterator::const_iterator(const Matrix<T> *m, int raw_pos) :
     m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || !m->getIsDataRowOrdered()) {
+    if (!m->getIsContiguous()) {
       coords = new int[m->getNumDim()];
       m->computeCoords(raw_pos, coords);
     }
@@ -317,11 +165,11 @@ namespace Basics {
   template <typename T>
   Matrix<T>::const_iterator::const_iterator(const Matrix<T> *m, int raw_pos, int *coords) :
     m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || !m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
+    if (!m->getIsContiguous()) {
+      this->coords = new int[m->getNumDim()];
       for (int i=0; i<m->getNumDim(); ++i) this->coords[i] = coords[i];
     }
-    else coords = 0;
+    else this->coords = 0;
     data = m->getData();
   }
 
@@ -442,216 +290,7 @@ namespace Basics {
   int Matrix<T>::const_iterator::getRawPos() const {
     return raw_pos;
   }
-
-  /*******************************************************************/
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::const_col_major_iterator(const Matrix<T> *m) :
-    m(m), idx(0), raw_pos(0) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      for (int i=0; i<m->getNumDim(); ++i) coords[i] = 0;
-    }
-    else coords = 0;
-    raw_pos = m->getOffset();
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::const_col_major_iterator(const Matrix<T> *m,
-                                                                int raw_pos) :
-    m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      m->computeCoords(raw_pos, coords);
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::const_col_major_iterator(const Matrix<T> *m,
-                                                                int raw_pos,
-                                                                int *coords) :
-    m(m), idx(0), raw_pos(raw_pos) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      for (int i=0; i<m->getNumDim(); ++i) this->coords[i] = coords[i];
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::const_col_major_iterator() :
-    m(0), idx(0), raw_pos(0), coords(0) { }
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::
-  const_col_major_iterator(const Matrix<T>::const_col_major_iterator &other) :
-    m(other.m),
-    idx(other.idx), 
-    raw_pos(other.raw_pos) {
-    if (other.coords != 0) {
-      coords = new int[m->getNumDim()];
-      for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::
-  const_col_major_iterator(const Matrix<T>::iterator &other) :
-    m(other.m),
-    idx(other.idx), 
-    raw_pos(other.raw_pos) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      if (other.coords != 0)
-        for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-      else m->computeCoords(raw_pos, coords);
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::
-  const_col_major_iterator(const Matrix<T>::const_iterator &other) :
-    m(other.m),
-    idx(other.idx), 
-    raw_pos(other.raw_pos) {
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[m->getNumDim()];
-      if (other.coords != 0)
-        for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-      else m->computeCoords(raw_pos, coords);
-    }
-    else coords = 0;
-    data = m->getData();
-  }
-
-  template <typename T>
-  Matrix<T>::const_col_major_iterator::~const_col_major_iterator() {
-    delete[] coords;
-  }
-
-  template <typename T>
-  typename Matrix<T>::const_col_major_iterator &Matrix<T>::
-  const_col_major_iterator::
-  operator=(const typename Matrix<T>::const_col_major_iterator &other) {
-    m = other.m;
-    idx = other.idx;
-    raw_pos = other.raw_pos;
-    data = m->getData();
-    if (other.coords != 0) {
-      if (coords==0 || m->numDim != other.m->numDim) {
-        delete[] coords;
-        coords = new int[other.m->getNumDim()];
-      }
-      for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-    }
-    else {
-      delete[] coords;
-      coords = 0;
-    }
-    return *this;
-  }
-
-  template <typename T>
-  typename Matrix<T>::const_col_major_iterator &Matrix<T>::
-  const_col_major_iterator::operator=(const typename Matrix<T>::iterator &other) {
-    m = other.m;
-    idx = other.idx;
-    raw_pos = other.raw_pos;
-    data = m->getData();
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[other.m->getNumDim()];
-      if (other.coords != 0)
-        for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-      else m->computeCoords(raw_pos, coords);
-    }
-    return *this;
-  }
-
-  template <typename T>
-  typename Matrix<T>::const_col_major_iterator &Matrix<T>::
-  const_col_major_iterator::
-  operator=(const typename Matrix<T>::const_iterator &other) {
-    m = other.m;
-    idx = other.idx;
-    raw_pos = other.raw_pos;
-    data = m->getData();
-    if (!m->getIsContiguous() || m->getIsDataRowOrdered()) {
-      coords = new int[other.m->getNumDim()];
-      if (other.coords != 0)
-        for (int i=0; i<m->getNumDim(); ++i) coords[i] = other.coords[i];
-      else m->computeCoords(raw_pos, coords);
-    }
-    return *this;
-  }
-
-  template <typename T>
-  bool Matrix<T>::const_col_major_iterator::
-  operator==(const Matrix<T>::const_col_major_iterator &other) const {
-    return m==other.m && raw_pos == other.raw_pos;
-  }
-
-  template <typename T>
-  bool Matrix<T>::const_col_major_iterator::
-  operator==(const Matrix<T>::iterator &other) const {
-    return m==other.m && raw_pos == other.raw_pos;
-  }
-
-  template <typename T>
-  bool Matrix<T>::const_col_major_iterator::
-  operator==(const Matrix<T>::const_iterator &other) const {
-    return m==other.m && raw_pos == other.raw_pos;
-  }
-
-  template <typename T>
-  bool Matrix<T>::const_col_major_iterator::
-  operator!=(const Matrix<T>::const_col_major_iterator &other) const {
-    return !( (*this) == other );
-  }
-
-  template <typename T>
-  bool Matrix<T>::const_col_major_iterator::
-  operator!=(const Matrix<T>::iterator &other) const {
-    return !( (*this) == other );
-  }
-
-  template <typename T>
-  bool Matrix<T>::const_col_major_iterator::
-  operator!=(const Matrix<T>::const_iterator &other) const {
-    return !( (*this) == other );
-  }
-
-  template <typename T>
-  typename Matrix<T>::const_col_major_iterator
-  &Matrix<T>::const_col_major_iterator::operator++() {
-    ++idx;
-    if (coords != 0) m->nextCoordVectorColOrder(coords, raw_pos);
-    else ++raw_pos;
-    return *this;
-  }
-
-  template <typename T>
-  const T &Matrix<T>::const_col_major_iterator::operator*() const {
-    return data[raw_pos];
-  }
-
-  template <typename T>
-  const T *Matrix<T>::const_col_major_iterator::operator->() const {
-    return &data[raw_pos];
-  }
-
-  template <typename T>
-  int Matrix<T>::const_col_major_iterator::getRawPos() const {
-    return raw_pos;
-  }
-
+  
   /*******************************************************************/
 
   template <typename T>
@@ -680,17 +319,11 @@ namespace Basics {
           order[1] = 0;
         }
         else {
-          // CUATION: this conditions are critical to work with transposed matrices,
-          // in order to ensure the iterator to traverse equally two matrices with
-          // different transposition.
-          if (m->getMajorOrder() == CblasRowMajor) {
-            order[0] = 1;
-            order[1] = 0;
-          }
-          else {
-            order[0] = 0;
-            order[1] = 1;
-          }
+          // CAUTION: these conditions are critical for working with transposed
+          // matrices: they ensure the iterator traverses two matrices with
+          // different transposition in the same order.
+          order[0] = 1;
+          order[1] = 0;
         }
       }
       else {
@@ -874,7 +507,7 @@ namespace Basics {
 
   template <typename T>
   Matrix<T>::pos_iterator::pos_iterator(const Matrix<T> *m) : m(m), idx(0), raw_pos(0) {
-    if (!m->getIsContiguous() || !m->getIsDataRowOrdered()) {
+    if (!m->getIsContiguous()) {
       coords = new int[m->getNumDim()];
       for (int i=0; i<m->getNumDim(); ++i) coords[i] = 0;
     }
@@ -1156,8 +789,7 @@ namespace Basics {
       return new Matrix<T>(m->numDim, m->stride,
                            raw_pos, sub_matrix_size,
                            total_size, last_raw_pos + raw_pos,
-                           m->data.get(), m->major_order, m->use_cuda,
-                           m->transposed);
+                           m->data.get(), m->use_cuda);
     }
     else {
       april_assert(dest->getRawDataAccess() == m->getRawDataAccess());
diff --git a/packages/basics/matrix/c_src/matrix-serialization.impl.h b/packages/basics/matrix/c_src/matrix-serialization.impl.h
index 3f4cecb73..13b1c5cde 100644
--- a/packages/basics/matrix/c_src/matrix-serialization.impl.h
+++ b/packages/basics/matrix/c_src/matrix-serialization.impl.h
@@ -40,8 +40,8 @@ namespace Basics {
   template <typename T>
   Matrix<T>*
   Matrix<T>::read(AprilIO::StreamInterface *stream,
-                  const AprilUtils::GenericOptions *options) {
-    if (options->getOptionalBoolean(MatrixIO::TAB_OPTION, false)) {
+                  const AprilUtils::LuaTable &options) {
+    if (options.opt<bool>(MatrixIO::TAB_OPTION, false)) {
       return readTab(stream, options);
     }
     else {
@@ -52,8 +52,8 @@ namespace Basics {
   template <typename T>
   Matrix<T>*
   Matrix<T>::readNormal(AprilIO::StreamInterface *stream,
-                        const AprilUtils::GenericOptions *options) {
-    const char *given_order = options->getOptionalString(MatrixIO::ORDER_OPTION, 0);
+                        const AprilUtils::LuaTable &options) {
+    UNUSED_VARIABLE(options);
     //
     MatrixIO::AsciiExtractor<T> ascii_extractor;
     MatrixIO::BinaryExtractor<T> bin_extractor;
@@ -64,7 +64,7 @@ namespace Basics {
     AprilUtils::SharedPtr<AprilIO::CStringStream>
       c_str(new AprilIO::CStringStream());;
     april_assert(!c_str.empty());
-    AprilUtils::constString line,format,order,token;
+    AprilUtils::constString line,format,token;
     // First we read the matrix dimensions
     line = readULine(stream, c_str.get());
     if (!line) {
@@ -100,17 +100,11 @@ namespace Basics {
       ERROR_PRINT("impossible to read format token\n");
       return 0;
     }
-    order = line.extract_token();
-    if (given_order != 0) order = given_order;
+    // legacy major order string
+    // order = line.extract_token();
+    // if (given_order != 0) order = given_order;
     if (pos_comodin == -1) { // Normal version
-      if (!order || order=="row_major")
-        mat = new Matrix<T>(n,dims);
-      else if (order == "col_major")
-        mat = new Matrix<T>(n,dims,CblasColMajor);
-      else {
-        ERROR_PRINT("Impossible to determine the order\n");
-        return 0;
-      }
+      mat = new Matrix<T>(n,dims);
       typename Matrix<T>::iterator data_it(mat->begin());
       if (format == "ascii") {
         while (data_it!=mat->end() && (line=readULine(stream, c_str.get()))) {
@@ -173,10 +167,7 @@ namespace Basics {
         delete[] data; return 0;
       }
       dims[pos_comodin] = size / sizesincomodin;
-      if (!order || order == "row_major")
-        mat = new Matrix<T>(n,dims);
-      else if (order == "col_major")
-        mat = new Matrix<T>(n,dims,CblasColMajor);
+      mat = new Matrix<T>(n,dims);
       int i=0;
       for (typename Matrix<T>::iterator it(mat->begin());
            it!=mat->end();
@@ -189,16 +180,16 @@ namespace Basics {
   
   template <typename T>
   void Matrix<T>::write(AprilIO::StreamInterface *stream,
-                        const AprilUtils::GenericOptions *options) {
-    bool is_tab = options->getOptionalBoolean(MatrixIO::TAB_OPTION, false);
+                        const AprilUtils::LuaTable &options) {
+    bool is_tab = options.opt(MatrixIO::TAB_OPTION, false);
     if (is_tab) writeTab(stream, options);
     else writeNormal(stream, options);
   }
 
   template <typename T>
   void Matrix<T>::writeNormal(AprilIO::StreamInterface *stream,
-                              const AprilUtils::GenericOptions *options) {
-    bool is_ascii = options->getOptionalBoolean(MatrixIO::ASCII_OPTION, false);
+                              const AprilUtils::LuaTable &options) {
+    bool is_ascii = options.opt(MatrixIO::ASCII_OPTION, false);
     //
     MatrixIO::AsciiSizer<T> ascii_sizer;
     MatrixIO::BinarySizer<T> bin_sizer;
@@ -222,12 +213,14 @@ namespace Basics {
     if (is_ascii) {
       const int columns = 9;
       stream->printf("ascii");
-      if (this->getMajorOrder() == CblasColMajor) {
+      /* legacy major order string
+        if (this->getMajorOrder() == CblasColMajor) {
         stream->printf(" col_major");
-      }
-      else {
+        }
+        else {
         stream->printf(" row_major");
-      }
+        }
+      */
       stream->printf("\n");
       int i=0;
       for(typename Matrix<T>::const_iterator it(this->begin());
@@ -241,12 +234,14 @@ namespace Basics {
     } else { // binary
       const int columns = 16;
       stream->printf("binary");
-      if (this->getMajorOrder() == CblasColMajor) {
+      /* legacy major order string
+        if (this->getMajorOrder() == CblasColMajor) {
         stream->printf(" col_major");
-      }
-      else {
+        }
+        else {
         stream->printf(" row_major");
-      }
+        }
+      */
       stream->printf("\n");
       // We substract 1 so the final '\0' is not considered
       int i=0;
@@ -270,13 +265,12 @@ namespace Basics {
   template <typename T>
   Matrix<T>*
   Matrix<T>::readTab(AprilIO::StreamInterface *stream,
-                     const AprilUtils::GenericOptions *options) {
-    const char *given_order = options->getOptionalString(MatrixIO::ORDER_OPTION, 0);
-    const char *delim       = options->getOptionalString(MatrixIO::DELIM_OPTION, "\n\r\t,; ");
-    bool read_empty         = options->getOptionalBoolean(MatrixIO::EMPTY_OPTION, false);
-    T default_value         = getTemplateOption(options, MatrixIO::DEFAULT_OPTION, T());
-    int ncols               = options->getOptionalInt32(MatrixIO::NCOLS_OPTION, 0);
-    int nrows               = options->getOptionalInt32(MatrixIO::NROWS_OPTION, 0);
+                     const AprilUtils::LuaTable &options) {
+    const char *delim       = options.opt(MatrixIO::DELIM_OPTION, "\n\r\t,; ");
+    bool read_empty         = options.opt(MatrixIO::EMPTY_OPTION, false);
+    T default_value         = options.opt(MatrixIO::DEFAULT_OPTION, T());
+    int ncols               = options.opt<int>(MatrixIO::NCOLS_OPTION, 0);
+    int nrows               = options.opt<int>(MatrixIO::NROWS_OPTION, 0);
     //
     MatrixIO::AsciiExtractor<T> ascii_extractor;
     if (!stream->good()) {
@@ -322,19 +316,10 @@ namespace Basics {
         return 0;
       }
     }
-    AprilUtils::constString order( (given_order) ? given_order : "row_major"),token;
+    AprilUtils::constString token;
     int dims[2] = { nrows, ncols };
     Matrix<T> *mat = 0;
-    if (order=="row_major") {
-      mat = new Matrix<T>(2,dims);
-    }
-    else if (order == "col_major") {
-      mat = new Matrix<T>(2,dims,CblasColMajor);
-    }
-    else {
-      ERROR_PRINT("Impossible to determine the order\n");
-      return 0;
-    }
+    mat = new Matrix<T>(2,dims);
     int i=0;
     typename Matrix<T>::iterator data_it(mat->begin());
     if (read_empty) {
@@ -387,7 +372,7 @@ namespace Basics {
   
   template <typename T>
   void Matrix<T>::writeTab(AprilIO::StreamInterface *stream,
-                           const AprilUtils::GenericOptions *options) {
+                           const AprilUtils::LuaTable &options) {
     UNUSED_VARIABLE(options);
     MatrixIO::AsciiSizer<T> ascii_sizer;
     MatrixIO::AsciiCoder<T> ascii_coder;
@@ -413,16 +398,6 @@ namespace Basics {
       stream->printf("\n"); 
     }
   }
-
-  template <typename T>
-  T Matrix<T>::getTemplateOption(const AprilUtils::GenericOptions *options,
-                                 const char *name, T default_value) {
-    UNUSED_VARIABLE(options);
-    UNUSED_VARIABLE(name);
-    UNUSED_VARIABLE(default_value);
-    ERROR_EXIT(128, "NOT IMPLEMENTED\n");
-    return T();
-  }
   
 } // namespace Basics
 
diff --git a/packages/basics/matrix/c_src/matrix.h b/packages/basics/matrix/c_src/matrix.h
index 88317309e..28c9993e1 100644
--- a/packages/basics/matrix/c_src/matrix.h
+++ b/packages/basics/matrix/c_src/matrix.h
@@ -49,8 +49,6 @@ namespace Basics {
     const char * const TAB_OPTION   = "tab";
     /// Boolean option key for read/write using ascii format.
     const char * const ASCII_OPTION = "ascii";
-    /// String option key for read/write in 'col_major' or 'row_major'.
-    const char * const ORDER_OPTION = "order";
     /// String option key with a delimitiers list.
     const char * const DELIM_OPTION = "delim";
     /// Boolean option key indicating if empty fields are allowed during read.
@@ -84,8 +82,6 @@ namespace Basics {
     // weight matrices)
     unsigned int shared_count;
   protected:
-    /// Indicator of transposition
-    bool transposed;
     /// Number of dimensions
     int numDim;
     /// Size of each dimension
@@ -100,18 +96,11 @@ namespace Basics {
     /// Pointer to data
     AprilUtils::SharedPtr< AprilMath::GPUMirroredMemoryBlock<T> > data;
     AprilUtils::SharedPtr< AprilUtils::MMappedDataReader > mmapped_data;
-    /// Major type (only when numDim=2)
-    CBLAS_ORDER major_order;
     /// For CUDA purposes
     bool use_cuda;
     /// To know if it is contiguous
     mutable matrix_contiguous_enum_t is_contiguous;
   
-    /// Constructor... -> Integer array with the size of each dimension
-    /*
-      Matrix(int numDim, const int* dim, T* data_vector,
-      CBLAS_ORDER major_order = CblasRowMajor);
-    */
     /// Returns the data pointer for read and write
     T *getData() { return data->getPPALForReadAndWrite(); }
     /// Returns the data pointer for read
@@ -174,8 +163,8 @@ namespace Basics {
       const Matrix<T> *m; ///< A weak reference.
       int idx;
       int raw_pos;
-      /// The coords array is only used when the matrix is not congiuous
-      /// or it is in col_major order, otherwise it is NULL
+      /// The coords array is only used when the matrix is not contiguous,
+      /// otherwise it is NULL
       int *coords;
     public:
       pos_iterator(const Matrix<T> *m);
@@ -191,18 +180,14 @@ namespace Basics {
     };
     // forward declaration
     class const_iterator;
-    class col_major_iterator;
-    class const_col_major_iterator;
     class iterator {
       friend class const_iterator;
-      friend class col_major_iterator;
-      friend class const_col_major_iterator;
       friend class Matrix;
       Matrix<T> *m; ///< A weak reference.
       int idx;
       int raw_pos;
-      /// The coords array is only used when the matrix is not congiuous
-      /// or it is in col_major order, otherwise it is NULL
+      /// The coords array is only used when the matrix is not contiguous,
+      /// otherwise it is NULL
       int *coords;
       T *data;
       iterator(Matrix<T> *m);
@@ -222,44 +207,13 @@ namespace Basics {
       int getIdx() const { return idx; }
     };
     /*******************************************************/
-    class col_major_iterator {
-      friend class Matrix;
-      Matrix<T> *m; ///< A weak reference.
-      int idx;
-      int raw_pos;
-      /// The coords array is only used when the matrix is not congiuous
-      /// or it is in row_major order, otherwise it is NULL
-      int *coords;
-      T *data;
-      col_major_iterator(Matrix<T> *m);
-      col_major_iterator(Matrix<T> *m, int raw_pos);
-      col_major_iterator(Matrix<T> *m, int raw_pos, int *coords);
-    public:
-      col_major_iterator();
-      col_major_iterator(const col_major_iterator &other);
-      col_major_iterator(const iterator &other);
-      ~col_major_iterator();
-      col_major_iterator &operator=(const col_major_iterator &other);
-      col_major_iterator &operator=(const iterator &other);
-      bool      operator==(const col_major_iterator &other) const;
-      bool      operator==(const iterator &other) const;
-      bool      operator!=(const col_major_iterator &other) const;
-      bool      operator!=(const iterator &other) const;
-      col_major_iterator &operator++();
-      T &operator*();
-      T *operator->();
-      int getRawPos() const;
-      int getIdx() const { return idx; }
-    };
-    /*******************************************************/
     class const_iterator {
-      friend class const_col_major_iterator;
       friend class Matrix;
       const Matrix<T> *m; ///< A weak reference.
       int idx;
       int raw_pos;
-      /// The coords array is only used when the matrix is not congiuous
-      /// or it is in col_major order, otherwise it is NULL
+      /// The coords array is only used when the matrix is not contiguous,
+      /// otherwise it is NULL
       int *coords;
       const T *data;
       const_iterator(const Matrix<T> *m);
@@ -283,43 +237,7 @@ namespace Basics {
       int getRawPos() const;
       int getIdx() const { return idx; }
     };
-    /*******************************************************/
-    class const_col_major_iterator {
-      friend class Matrix;
-      const Matrix<T> *m; ///< A weak reference.
-      int idx;
-      int raw_pos;
-      /// The coords array is only used when the matrix is not congiuous
-      /// or it is in row_major order, otherwise it is NULL
-      int *coords;
-      const T *data;
-      const_col_major_iterator(const Matrix<T> *m);
-      const_col_major_iterator(const Matrix<T> *m, int raw_pos);
-      const_col_major_iterator(const Matrix<T> *m, int raw_pos, int *coords);
-    public:
-      const_col_major_iterator();
-      const_col_major_iterator(const const_col_major_iterator &other);
-      const_col_major_iterator(const iterator &other);
-      const_col_major_iterator(const const_iterator &other);
-      /*const_col_major_iterator(const iterator &other);*/
-      ~const_col_major_iterator();
-      const_col_major_iterator &operator=(const const_col_major_iterator &other);
-      const_col_major_iterator &operator=(const iterator &other);
-      const_col_major_iterator &operator=(const const_iterator &other);
-      bool            operator==(const const_col_major_iterator &other) const;
-      bool            operator==(const iterator &other) const;
-      bool            operator==(const const_iterator &other) const;
-      bool            operator!=(const const_col_major_iterator &other) const;
-      bool            operator!=(const iterator &other) const;
-      bool            operator!=(const const_iterator &other) const;
-      const_col_major_iterator &operator++();
-      const T &operator*() const;
-      const T *operator->() const;
-      int getRawPos() const;
-      int getIdx() const { return idx; }
-    };
     
-
     /********************************************************/
     /**
      * The sliding is a kind of iterator which traverses the matrix producing
@@ -394,15 +312,13 @@ namespace Basics {
           const int a_sz = m->matrixSize[a];
           const int b_sz = m->matrixSize[b];
           if (a_sz == b_sz) {
-            if (m->major_order == CblasRowMajor)
-              return b < a;
-            else
-              return a < b;
+            return b < a;
           }
           // Don't use a trade-off between size and stride, it will be unsafe with
           // transposed matrices
-          else
+          else {
             return a_sz > b_sz;
+          }
         }
       };
       //
@@ -554,8 +470,8 @@ namespace Basics {
     //
     Matrix(int numDim, const int *stride, const int offset,
            const int *matrixSize, const int total_size, const int last_raw_pos,
-           AprilMath::GPUMirroredMemoryBlock<T> *data, const CBLAS_ORDER major_order,
-           const bool use_cuda, const bool transposed,
+           AprilMath::GPUMirroredMemoryBlock<T> *data,
+           const bool use_cuda,
            AprilUtils::MMappedDataReader *mmapped_data = 0);
 
     /// Modifies the offset of the matrix. WARNING, this method doesn't check the
@@ -570,15 +486,13 @@ namespace Basics {
 
   public:
     /********** Constructors ***********/
-    /// Full constructor given numDim, dim, and major_order
+    /// Full constructor given numDim, dim, data, offset
     Matrix(int numDim, const int* dim,
-           CBLAS_ORDER major_order = CblasRowMajor,
            AprilMath::GPUMirroredMemoryBlock<T> *data = 0,
-           int offset = 0,
-           bool transposed = false);
+           int offset = 0);
   
-    /// Constructor for CblasRowMajor order
-    Matrix(int numDim, int d1, ...);
+    /// Constructor with variadic arguments.
+    explicit Matrix(int numDim, int d1, ...);
   
     /// Constructor given other matrix, it does a shallow or deep copy (clone). By
     /// default is a deep copy, some code pieces expect this behavior, don't
@@ -590,9 +504,9 @@ namespace Basics {
            bool clone=true);
     /// Sub-matrix constructor of a const matrix. WARNING, this matrices don't
     /// allow writes if clone=false
-    Matrix(const Matrix<T> *other,
-           const int* coords, const int *sizes,
-           bool clone=true);
+    explicit Matrix(const Matrix<T> *other,
+                    const int* coords, const int *sizes,
+                    bool clone=true);
     /// Destructor
     virtual ~Matrix();
   
@@ -619,12 +533,6 @@ namespace Basics {
     int getDimSize(int i) const { return matrixSize[i]; }
     int getStrideSize(int i) const { return stride[i]; }
     int size() const { return total_size; }
-    CBLAS_ORDER getMajorOrder() const { return major_order; }
-    bool getTransposedFlag() const { return transposed; }
-    bool getIsDataRowOrdered() const {
-      return ( (getMajorOrder()==CblasRowMajor && !getTransposedFlag()) ||
-               (getMajorOrder()==CblasColMajor &&  getTransposedFlag()) );
-    }
     void setUseCuda(bool v) {
       use_cuda = v;
 #ifdef USE_CUDA
@@ -633,7 +541,7 @@ namespace Basics {
     }
     bool getCudaFlag() const { return use_cuda; }
     bool isSimple() const {
-      return (getIsContiguous())&&(getIsDataRowOrdered());
+      return (getIsContiguous());
     }
     /// Indicates if it is a contiguous matrix
     bool getIsContiguous() const;
@@ -688,20 +596,16 @@ namespace Basics {
       return end_const_iterator;
     }
 
-    /// Symbolic transposition, changes the flag and preserves the major order
-    /// flag
+    /// Symbolic transposition, reverses the order of strides and sizes
     Matrix<T>* transpose();
-    /// Changing major order is a different way to perform a transposition, but
-    /// taking into account a change in the major_order flag
-    Matrix<T>* inMajorOrder(CBLAS_ORDER new_major_order);
+    /// Symbolic transposition of dim1 and dim2, swaps their strides and sizes
+    Matrix<T>* transpose(int dim1, int dim2);
     /// Copy only sizes, but not data
     Matrix<T>* cloneOnlyDims() const;
     /// Deep copy
     Matrix<T>* clone() const;
-    /// Deep copy with different major_order
-    Matrix<T> *clone(CBLAS_ORDER major_order) const;
     /// Shallow copy
-    Matrix<T>* shallow_copy();
+    Matrix<T>* shallowCopy();
   
     /// Number values check
     void pruneSubnormalAndCheckNormal();
@@ -728,8 +632,8 @@ namespace Basics {
     const T& operator() (int coord0, int coord1, int coord2, ...) const;
     const T& operator() (int *coords, int sz) const;
   
-    /// Function to obtain RAW access to data pointer. Be careful with it, because
-    /// you are losing sub-matrix abstraction, and the major order.
+    /// Function to obtain RAW access to data pointer. Be careful with it, you
+    /// are losing sub-matrix abstraction.
     AprilMath::GPUMirroredMemoryBlock<T> *getRawDataAccess() { return data.get(); }
     const AprilMath::GPUMirroredMemoryBlock<T> *getRawDataAccess() const { return data.get(); }
   
@@ -788,7 +692,7 @@ namespace Basics {
      *   true.
      */
     virtual void write(AprilIO::StreamInterface *stream,
-                       const AprilUtils::GenericOptions *options);
+                       const AprilUtils::LuaTable &options);
     
     /**
      * @brief Reads the Matrix from a stream.
@@ -802,12 +706,6 @@ namespace Basics {
      *   Matrix in a tabulated way (true) or in the APRIL-ANN Matrix format
      *   (false). By default it is false.
      *
-     * - MatrixIO::ORDER_OPTION this key contains a string with "row_major",
-     *   "col_major", or it can be not defined at all. It forces the read()
-     *   method to allocate a Matrix in the indicate major order. By default it
-     *   is not defined and the major order will be taken from the file in case
-     *   @c TAB_OPTION=false or in "row_major" in case @c TAB_OPTION=true.
-     *
      * - MatrixIO::DELIM_OPTION if @c TAB_OPTION=true this key contains a string
      *   value with a list of delimitiers. By default it is "\n\r\t,; ".
      *
@@ -836,7 +734,7 @@ namespace Basics {
      * @note This method throws different kind of errors.
      */
     static Matrix<T> *read(AprilIO::StreamInterface *stream,
-                           const AprilUtils::GenericOptions *options);
+                           const AprilUtils::LuaTable &options);
     
   private:
     void allocate_memory(int size);
@@ -852,19 +750,16 @@ namespace Basics {
     }
 
     void writeNormal(AprilIO::StreamInterface *stream,
-                     const AprilUtils::GenericOptions *options);
+                     const AprilUtils::LuaTable &options);
     
     void writeTab(AprilIO::StreamInterface *stream,
-                  const AprilUtils::GenericOptions *options);
+                  const AprilUtils::LuaTable &options);
 
     static Matrix<T> *readNormal(AprilIO::StreamInterface *stream,
-                                 const AprilUtils::GenericOptions *options);
+                                 const AprilUtils::LuaTable &options);
     
     static Matrix<T> *readTab(AprilIO::StreamInterface *stream,
-                              const AprilUtils::GenericOptions *options);
-    
-    static T getTemplateOption(const AprilUtils::GenericOptions *options,
-                               const char *name, T default_value);
+                              const AprilUtils::LuaTable &options);
   };
 
 } // namespace Basics
@@ -878,4 +773,11 @@ namespace Basics {
 #include "matrix-iterators.impl.h"
 #include "matrix-serialization.impl.h"
 
+#include "matrixFloat.h"
+#include "matrixDouble.h"
+#include "matrixComplexF.h"
+#include "matrixInt32.h"
+#include "matrixChar.h"
+#include "matrixBool.h"
+
 #endif // MATRIX_H
diff --git a/packages/basics/matrix/c_src/matrix.impl.h b/packages/basics/matrix/c_src/matrix.impl.h
index 169e0d8a0..212916862 100644
--- a/packages/basics/matrix/c_src/matrix.impl.h
+++ b/packages/basics/matrix/c_src/matrix.impl.h
@@ -44,25 +44,11 @@ namespace Basics {
   template <typename T>
   void Matrix<T>::initialize(const int *dim) {
     total_size=1;
-    switch(major_order) {
-    case CblasRowMajor:
-      for(int i=numDim-1; i>=0; --i) {
-        stride[i] = total_size;
-        total_size *= dim[i];
-        matrixSize[i] = dim[i];
-        april_assert(matrixSize[i] > 0);
-      }
-      break;
-    case CblasColMajor:
-      for(int i=0; i<numDim; ++i) {
-        stride[i] = total_size;
-        total_size *= dim[i];
-        matrixSize[i] = dim[i];
-        april_assert(matrixSize[i] > 0);
-      }
-      break;
-    default:
-      ERROR_EXIT(128, "Incorrect major order!!!\n");
+    for(int i=numDim-1; i>=0; --i) {
+      stride[i] = total_size;
+      total_size *= dim[i];
+      matrixSize[i] = dim[i];
+      april_assert(matrixSize[i] > 0);
     }
     last_raw_pos = total_size-1;
   }
@@ -91,15 +77,12 @@ namespace Basics {
                     const int total_size,
                     const int last_raw_pos,
                     AprilMath::GPUMirroredMemoryBlock<T> *data,
-                    const CBLAS_ORDER major_order,
                     const bool use_cuda,
-                    const bool transposed,
                     AprilUtils::MMappedDataReader *mmapped_data) :
-    AprilIO::Serializable(), shared_count(0), transposed(transposed),
+    AprilIO::Serializable(), shared_count(0),
     numDim(numDim), stride(new int[numDim]), offset(offset),
     matrixSize(new int[numDim]), total_size(total_size),
     last_raw_pos(last_raw_pos), data(data), mmapped_data(mmapped_data),
-    major_order(major_order),
     use_cuda(use_cuda),
     is_contiguous(NONE),
     end_iterator(), end_const_iterator(), end_span_iterator_() {
@@ -114,17 +97,14 @@ namespace Basics {
   template <typename T>
   Matrix<T>::Matrix(int numDim,
                     const int* dim,
-                    CBLAS_ORDER major_order,
                     AprilMath::GPUMirroredMemoryBlock<T> *data,
-                    int offset,
-                    bool transposed) :
-    AprilIO::Serializable(), shared_count(0), transposed(transposed),
+                    int offset) :
+    AprilIO::Serializable(), shared_count(0),
     numDim(numDim),
     offset(offset),
     data(data),
-    major_order(major_order),
     use_cuda(AprilMath::GPUMirroredMemoryBlockBase::USE_CUDA_DEFAULT),
-    is_contiguous(CONTIGUOUS),
+    is_contiguous(NONE),
     end_iterator(), end_const_iterator(), end_span_iterator_() {
     stride     = new int[numDim];
     matrixSize = new int[numDim];
@@ -145,10 +125,9 @@ namespace Basics {
                     const int* coords, const int *sizes,
                     bool clone) :
     AprilIO::Serializable(),
-    shared_count(0), transposed(other->transposed),
+    shared_count(0),
     numDim(other->numDim),
     offset(0),
-    major_order(other->major_order),
     use_cuda(other->use_cuda),
     is_contiguous(NONE),
     end_iterator(), end_const_iterator(), end_span_iterator_() {
@@ -160,8 +139,6 @@ namespace Basics {
     stride     = new int[numDim];
     matrixSize = new int[numDim];
     if (clone) {
-      transposed    = false;
-      is_contiguous = CONTIGUOUS;
       initialize(sizes);
       allocate_memory(total_size);
       span_iterator it(this);
@@ -203,10 +180,9 @@ namespace Basics {
                     const int* coords, const int *sizes,
                     bool clone) :
     AprilIO::Serializable(),
-    shared_count(0), transposed(other->transposed),
+    shared_count(0),
     numDim(other->numDim),
     offset(0),
-    major_order(other->major_order),
     use_cuda(other->use_cuda),
     is_contiguous(NONE),
     end_iterator(), end_const_iterator(), end_span_iterator_() {
@@ -218,8 +194,6 @@ namespace Basics {
     stride     = new int[numDim];
     matrixSize = new int[numDim];
     if (clone) {
-      transposed    = false;
-      is_contiguous = CONTIGUOUS;
       initialize(sizes);
       allocate_memory(total_size);
       span_iterator it(this), it_other(other, it.getDimOrder());
@@ -301,11 +275,11 @@ namespace Basics {
   /// Constructor with variable arguments
   template <typename T>
   Matrix<T>::Matrix(int numDim, int d1, ...) :
-    AprilIO::Serializable(), shared_count(0), transposed(false),
+    AprilIO::Serializable(), shared_count(0),
     numDim(numDim),
     offset(0),
-    major_order(CblasRowMajor),
-    is_contiguous(CONTIGUOUS),
+    use_cuda(AprilMath::GPUMirroredMemoryBlockBase::USE_CUDA_DEFAULT),
+    is_contiguous(NONE),
     end_iterator(), end_const_iterator(), end_span_iterator_() {
     int *dim   = new int[numDim];
     stride     = new int[numDim];
@@ -328,23 +302,20 @@ namespace Basics {
   template <typename T>
   Matrix<T>::Matrix(Matrix<T> *other, bool clone) :
     AprilIO::Serializable(),
-    shared_count(0), transposed(other->transposed),
+    shared_count(0),
     numDim(other->numDim),
     offset(0),
-    major_order(other->major_order),
     use_cuda(other->use_cuda),
-    is_contiguous(other->is_contiguous),
+    is_contiguous(NONE),
     end_iterator(), end_const_iterator(), end_span_iterator_() {
     stride       = new int[numDim];
     matrixSize   = new int[numDim];
     total_size   = other->total_size;
     last_raw_pos = other->last_raw_pos;
     if (clone) {
-      transposed = false;
       initialize(other->matrixSize);
       allocate_memory(total_size);
       AprilMath::MatrixExt::Operations::matCopy(this, other);
-      is_contiguous = CONTIGUOUS;
     }
     else {
       offset       = other->offset;
@@ -377,8 +348,10 @@ namespace Basics {
     obj->matrixSize    = mmapped_data->get<int>(N);
     obj->total_size    = *(mmapped_data->get<int>());
     obj->last_raw_pos  = *(mmapped_data->get<int>());
-    obj->major_order   = *(mmapped_data->get<CBLAS_ORDER>());
-    obj->transposed    = *(mmapped_data->get<bool>());
+    CBLAS_ORDER dummy1 = *(mmapped_data->get<CBLAS_ORDER>());
+    bool dummy2        = *(mmapped_data->get<bool>()); // legacy transposed flag
+    UNUSED_VARIABLE(dummy1);
+    UNUSED_VARIABLE(dummy2);
     // NON MAPPED DATA
     obj->use_cuda      = AprilMath::GPUMirroredMemoryBlockBase::USE_CUDA_DEFAULT;
     obj->shared_count  = 0;
@@ -401,8 +374,10 @@ namespace Basics {
     mmapped_data->put(matrixSize, numDim);
     mmapped_data->put(&total_size);
     mmapped_data->put(&last_raw_pos);
-    mmapped_data->put(&major_order);
-    mmapped_data->put(&transposed);
+    CBLAS_ORDER dummy1=CblasRowMajor;
+    mmapped_data->put(&dummy1);
+    bool dummy2=false; // legacy transposed flag
+    mmapped_data->put(&dummy2);
   }
 
   template <typename T>
@@ -451,36 +426,45 @@ namespace Basics {
     if (need_clone) {
       AprilMath::GPUMirroredMemoryBlock<T> *new_data =
         new AprilMath::GPUMirroredMemoryBlock<T>(new_size);
-      obj = new Matrix<T>(len, new_dims, major_order, new_data);
+      obj = new Matrix<T>(len, new_dims, new_data);
       AprilUtils::SharedPtr< Matrix<T> > aux( obj->rewrap(this->getDimPtr(),
                                                            this->getNumDim()) );
       AprilMath::MatrixExt::Operations::matCopy(aux.get(),this);
     }
     else {
-      obj = new Matrix<T>(len, new_dims, major_order, data.get(), offset);
+      obj = new Matrix<T>(len, new_dims, data.get(), offset);
     }
 #ifdef USE_CUDA
     obj->setUseCuda(use_cuda);
 #endif
     return obj;
   }
-
+  
   template <typename T>
   Matrix<T> *Matrix<T>::squeeze() {
     int len = 0;
-    int *sizes = new int[getNumDim()];
+    AprilUtils::UniquePtr<int []> sizes(new int[getNumDim()]);
+    AprilUtils::UniquePtr<int []> strides(new int[getNumDim()]);
     for (int i=0; i<getNumDim(); ++i) {
       int sz = getDimSize(i);
       if (sz > 1) {
+        strides[len] = getStrideSize(i);
         sizes[len++] = sz;
       }
     }
+    // matrices with 1x1x1x...x1 dimensions need the following sanity check
+    if (len == 0) {
+      strides[len] = 1;
+      sizes[len++] = 1;
+    }
+    // return this when len==numDim; otherwise build a new matrix over the same data
     Matrix<T> *obj = (len==numDim) ?
-      this : new Matrix<T>(len, sizes, major_order, data.get(), offset);
+      this : new Matrix<T>(len, strides.get(), getOffset(), sizes.get(),
+                           size(), last_raw_pos, data.get(),
+                           use_cuda, mmapped_data.get());
 #ifdef USE_CUDA
     obj->setUseCuda(use_cuda);
 #endif
-    delete[] sizes;
     return obj;
   }
 
@@ -488,8 +472,7 @@ namespace Basics {
   Matrix<T> *Matrix<T>::transpose() {
     Matrix<T> *result;
     if (this->numDim > 1) {
-      result = this->shallow_copy();
-      result->transposed = !result->transposed;
+      result = this->shallowCopy();
       for (int i=0,j=numDim-1; i<numDim; ++i,--j) {
         result->stride[j]     = this->stride[i];
         result->matrixSize[j] = this->matrixSize[i];
@@ -500,47 +483,32 @@ namespace Basics {
     return result;
   }
 
+  /// Symbolic transposition of dim1 and dim2, swaps their strides and sizes
   template<typename T>
-  Matrix<T> *Matrix<T>::inMajorOrder(CBLAS_ORDER new_major_order) {
-    Matrix<T> *result;
-    if (new_major_order == major_order) result = this;
-    else {
-      result = this->transpose();
-      result->transposed  = !result->transposed;
-      result->major_order = new_major_order;
+  Matrix<T>* Matrix<T>::transpose(int dim1, int dim2) {
+    if (dim1 == dim2) return this;
+    if (dim1 < 0 || dim1 >= numDim ||
+        dim2 < 0 || dim2 >= numDim) {
+      ERROR_EXIT4(128, "Incorrect dimensions, exepected to be "
+                  "in range [%d,%d], given dim1=%d, dim2=%d\n",
+                  0, numDim-1, dim1, dim2);
     }
+    Matrix<T> *result;
+    result = this->shallowCopy();
+    AprilUtils::swap(result->stride[dim1], result->stride[dim2]);
+    AprilUtils::swap(result->matrixSize[dim1], result->matrixSize[dim2]);
     return result;
   }
-
+  
   template <typename T>
   Matrix<T>* Matrix<T>::cloneOnlyDims() const {
-    Matrix<T> *obj = new Matrix<T>(numDim, matrixSize, major_order);
+    Matrix<T> *obj = new Matrix<T>(numDim, matrixSize);
 #ifdef USE_CUDA
     obj->setUseCuda(use_cuda);
 #endif
     return obj;
   }
 
-  template<typename T>
-  Matrix<T> *Matrix<T>::clone(CBLAS_ORDER major_order) const {
-    Matrix<T> *resul;
-    if (this->major_order != major_order) {
-      resul = new Matrix<T>(numDim, matrixSize, major_order);
-#ifdef USE_CUDA
-      resul->setUseCuda(use_cuda);
-#endif
-      iterator resul_it(resul->begin());
-      const_iterator this_it(begin());
-      while(resul_it != resul->end()) {
-        *resul_it = *this_it;
-        ++resul_it;
-        ++this_it;
-      }
-    }
-    else resul = this->clone();
-    return resul;
-  }
-
   template <typename T>
   Matrix<T>* Matrix<T>::clone() const {
     Matrix<T> *result = this->cloneOnlyDims();
@@ -549,7 +517,7 @@ namespace Basics {
   }
 
   template <typename T>
-  Matrix<T>* Matrix<T>::shallow_copy() {
+  Matrix<T>* Matrix<T>::shallowCopy() {
     return new Matrix<T>(this,false);
   }
 
@@ -737,12 +705,10 @@ namespace Basics {
       result = new Matrix();
       int d = numDim - 1;
       // Data initialization
-      result->transposed   = this->transposed;
       result->use_cuda     = use_cuda;
       result->numDim       = d;
       result->matrixSize   = new int[d];
       result->stride       = new int[d];
-      result->major_order  = major_order;
       result->offset       = offset + index*stride[dim]; // the select implies an offset
       result->last_raw_pos = result->offset;
       result->data         = data;
@@ -962,37 +928,20 @@ namespace Basics {
     return raw_pos + this->offset;
   }
 
+  /// FIXME: Change it to compute coords traversing strides in descending order?
   template <typename T>
   void Matrix<T>::computeCoords(const int raw_pos, int *coords) const {
     int R = raw_pos - offset;
     switch(numDim) {
     case 1: coords[0] = R / stride[0]; break;
     case 2:
-      switch(major_order) {
-      case CblasRowMajor:
-        coords[0] =  R / stride[0];
-        coords[1] = (R % stride[0]) / stride[1];
-        break;
-      case CblasColMajor:
-        coords[1] =  R / stride[1];
-        coords[0] = (R % stride[1]) / stride[0];
-        break;
-      }
+      coords[0] =  R / stride[0];
+      coords[1] = (R % stride[0]) / stride[1];
       break;
     default:
-      switch(major_order) {
-      case CblasRowMajor:
-        for (int i=0; i<numDim; ++i) {
-          coords[i] = R / stride[i];
-          R = R % stride[i];
-        }
-        break;
-      case CblasColMajor:
-        for (int i=numDim-1; i>=0; --i) {
-          coords[i] = R / stride[i];
-          R = R % stride[i];
-        }
-        break;
+      for (int i=0; i<numDim; ++i) {
+        coords[i] = R / stride[i];
+        R = R % stride[i];
       }
     }
   }
@@ -1000,25 +949,13 @@ namespace Basics {
   template <typename T>
   bool Matrix<T>::getIsContiguous() const {
     if (is_contiguous != NONE) return (is_contiguous==CONTIGUOUS);
-    if (major_order == CblasRowMajor) {
-      int aux = 1;
-      for (int i=numDim-1; i>=0; --i) {
-        if(stride[i] != aux) {
-          is_contiguous = NONCONTIGUOUS;
-          return false;
-        }
-        else aux *= matrixSize[i];
-      }
-    }
-    else {
-      int aux = 1;
-      for (int i=0; i<numDim; ++i) {
-        if(stride[i] != aux) {
-          is_contiguous = NONCONTIGUOUS;
-          return false;
-        }
-        else aux *= matrixSize[i];
+    int aux = 1;
+    for (int i=numDim-1; i>=0; --i) {
+      if(stride[i] != aux) {
+        is_contiguous = NONCONTIGUOUS;
+        return false;
       }
+      else aux *= matrixSize[i];
     }
     is_contiguous = CONTIGUOUS;
     return true;
@@ -1030,14 +967,12 @@ namespace Basics {
     if (numDim != 1)
       ERROR_EXIT(128, "Only one-dimensional matrix is allowed\n");
     const int dims[2] = { matrixSize[0], matrixSize[0] };
-    Matrix<T> *resul  = new Matrix<T>(2, dims, major_order);
+    Matrix<T> *resul  = new Matrix<T>(2, dims);
     // resul_diag is a submatrix of resul, build to do a diagonal traverse
     const int stride  = matrixSize[0] + 1;
     Matrix<T> *resul_diag = new Matrix<T>(1, &stride, 0, dims, dims[0],
                                           resul->last_raw_pos, resul->data.get(),
-                                          resul->major_order,
-                                          resul->use_cuda,
-                                          resul->transposed);
+                                          resul->use_cuda);
     AprilMath::MatrixExt::Operations::matZeros(resul);
     AprilMath::MatrixExt::Operations::matCopy(resul_diag, this);
     delete resul_diag;
@@ -1058,7 +993,7 @@ namespace Basics {
       result_sizes[i] = getDimSize(i) + begin_padding[i] + end_padding[i];
       matrix_pos[i] = begin_padding[i];
     }
-    Matrix<T> *result = new Matrix<T>(getNumDim(), result_sizes, getMajorOrder());
+    Matrix<T> *result = new Matrix<T>(getNumDim(), result_sizes);
     // FIXME: implement fill by several submatrices for large matrix sizes with
     // small padding sizes
     AprilMath::MatrixExt::Operations::matFill(result, default_value);
@@ -1082,7 +1017,7 @@ namespace Basics {
       result_sizes[i] = getDimSize(i) + pad_value*2;
       matrix_pos[i] = pad_value;
     }
-    Matrix<T> *result = new Matrix<T>(getNumDim(), result_sizes, getMajorOrder());
+    Matrix<T> *result = new Matrix<T>(getNumDim(), result_sizes);
     // FIXME: implement fill by several submatrices for large matrix sizes with
     // small padding sizes
     AprilMath::MatrixExt::Operations::matFill(result, default_value);
diff --git a/packages/basics/matrix/c_src/matrixBool.cc b/packages/basics/matrix/c_src/matrixBool.cc
new file mode 100644
index 000000000..a96a478a6
--- /dev/null
+++ b/packages/basics/matrix/c_src/matrixBool.cc
@@ -0,0 +1,81 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2013, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#include "matrixBool.h"
+
+namespace Basics {
+
+  namespace MatrixIO {
+    /////////////////////////////////////////////////////////////////////////
+  
+    template<>
+    bool AsciiExtractor<bool>::operator()(AprilUtils::constString &line,
+                                          bool &destination) {
+      char aux;
+      if (!line.extract_char(&aux)) return false;
+      destination = (aux == '1');
+      return true;
+    }
+  
+    template<>
+    bool BinaryExtractor<bool>::operator()(AprilUtils::constString &line,
+                                           bool &destination) {
+      UNUSED_VARIABLE(line);
+      UNUSED_VARIABLE(destination);
+      ERROR_EXIT(128, "Bool type has not binary option\n");
+      return false;
+
+    }
+  
+    template<>
+    int AsciiSizer<bool>::operator()(const Matrix<bool> *mat) {
+      return mat->size()*2;
+    }
+
+    template<>
+    int BinarySizer<bool>::operator()(const Matrix<bool> *mat) {
+      UNUSED_VARIABLE(mat);
+      ERROR_EXIT(128, "Bool type has not binary option\n");
+      return 0;
+    }
+
+    template<>
+    void AsciiCoder<bool>::operator()(const bool &value,
+                                      AprilIO::StreamInterface *stream) {
+      stream->printf("%c", (value) ? ('1') : ('0'));
+    }
+  
+    template<>
+    void BinaryCoder<bool>::operator()(const bool &value,
+                                       AprilIO::StreamInterface *stream) {
+      UNUSED_VARIABLE(value);
+      UNUSED_VARIABLE(stream);
+      ERROR_EXIT(128, "Bool type has not binary option\n");
+
+    }
+
+    /////////////////////////////////////////////////////////////////////////////
+
+  } // namespace MatrixIO
+
+  ///////////////////////////////////////////////////////////////////////////////
+  template class Matrix<bool>;
+
+} // namespace Basics
diff --git a/packages/basics/matrix/c_src/matrixBool.h b/packages/basics/matrix/c_src/matrixBool.h
new file mode 100644
index 000000000..c2994713c
--- /dev/null
+++ b/packages/basics/matrix/c_src/matrixBool.h
@@ -0,0 +1,61 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2013, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#ifndef MATRIX_BOOL_H
+#define MATRIX_BOOL_H
+#include "matrix.h"
+
+namespace Basics {
+
+
+  namespace MatrixIO {
+
+    /* Specialization of MatrixBool ASCII and binary extractors, sizers and
+       coders */
+    template<>
+    bool AsciiExtractor<bool>::operator()(AprilUtils::constString &line,
+                                          bool &destination);
+  
+    template<>
+    bool BinaryExtractor<bool>::operator()(AprilUtils::constString &line,
+                                           bool &destination);
+  
+    template<>
+    int AsciiSizer<bool>::operator()(const Matrix<bool> *mat);
+
+    template<>
+    int BinarySizer<bool>::operator()(const Matrix<bool> *mat);
+
+    template<>
+    void AsciiCoder<bool>::operator()(const bool &value,
+                                      AprilIO::StreamInterface *stream);
+  
+    template<>
+    void BinaryCoder<bool>::operator()(const bool &value,
+                                       AprilIO::StreamInterface *stream);
+
+  } // namespace MatrixIO
+  
+  ///////////////////////////////////////////////////////////////////////////////
+  typedef Matrix<bool> MatrixBool;
+
+} // namespace Basics
+
+#endif // MATRIX_BOOL_H
diff --git a/packages/basics/matrix/c_src/matrixChar.cc b/packages/basics/matrix/c_src/matrixChar.cc
index 73253c3eb..c8ece64cb 100644
--- a/packages/basics/matrix/c_src/matrixChar.cc
+++ b/packages/basics/matrix/c_src/matrixChar.cc
@@ -73,12 +73,6 @@ namespace Basics {
 
   } // namespace MatrixIO
 
-  template<>
-  char Matrix<char>::getTemplateOption(const AprilUtils::GenericOptions *options,
-                                       const char *name, char default_value) {
-    return options->getOptionalChar(name, default_value);
-  }
-
   ///////////////////////////////////////////////////////////////////////////////
   template class Matrix<char>;
 
diff --git a/packages/basics/matrix/c_src/matrixChar.h b/packages/basics/matrix/c_src/matrixChar.h
index 418976d3b..8f4ac66f3 100644
--- a/packages/basics/matrix/c_src/matrixChar.h
+++ b/packages/basics/matrix/c_src/matrixChar.h
@@ -53,13 +53,23 @@ namespace Basics {
 
   } // namespace MatrixIO
 
-  template<>
-  char Matrix<char>::getTemplateOption(const AprilUtils::GenericOptions *options,
-                                       const char *name, char default_value);
-  
   ///////////////////////////////////////////////////////////////////////////////
   typedef Matrix<char> MatrixChar;
 
 } // namespace Basics
 
+////////////////////////////////////////////////////////////////////////////
+
+namespace AprilUtils {
+
+  template<> Basics::MatrixChar *LuaTable::
+  convertTo<Basics::MatrixChar *>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<Basics::MatrixChar *>(lua_State *L, Basics::MatrixChar *value);
+
+  template<> bool LuaTable::
+  checkType<Basics::MatrixChar *>(lua_State *L, int idx);
+}
+
 #endif // MATRIX_CHAR_H
diff --git a/packages/basics/matrix/c_src/matrixComplexF.cc b/packages/basics/matrix/c_src/matrixComplexF.cc
index 0a151b825..7a45fad31 100644
--- a/packages/basics/matrix/c_src/matrixComplexF.cc
+++ b/packages/basics/matrix/c_src/matrixComplexF.cc
@@ -79,17 +79,6 @@ namespace Basics {
 
   } // namespace MatrixIO
 
-  template<>
-  ComplexF Matrix<ComplexF>::
-  getTemplateOption(const AprilUtils::GenericOptions *options,
-                    const char *name,
-                    ComplexF default_value) {
-    AprilMath::LuaComplexFNumber *c =
-      options->getOptionalReferenced<AprilMath::LuaComplexFNumber>(name, 0);
-    if (c == 0) return default_value;
-    else return c->getValue();
-  }
-
   /////////////////////////////////////////////////////////////////////////////
   
   template class Matrix<ComplexF>;
diff --git a/packages/basics/matrix/c_src/matrixComplexF.h b/packages/basics/matrix/c_src/matrixComplexF.h
index 21ea361e1..9025c7e99 100644
--- a/packages/basics/matrix/c_src/matrixComplexF.h
+++ b/packages/basics/matrix/c_src/matrixComplexF.h
@@ -55,16 +55,24 @@ namespace Basics {
   
   } // namespace MatrixIO
 
-  template<>
-  AprilMath::ComplexF Matrix<AprilMath::ComplexF>::
-  getTemplateOption(const AprilUtils::GenericOptions *options,
-                    const char *name,
-                    AprilMath::ComplexF default_value);
-
   //////////////////////////////////////////////////////////////////////////////
 
   typedef Matrix<AprilMath::ComplexF> MatrixComplexF;
 
 } // namespace Basics
 
+////////////////////////////////////////////////////////////////////////////
+
+namespace AprilUtils {
+
+  template<> Basics::MatrixComplexF *LuaTable::
+  convertTo<Basics::MatrixComplexF *>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<Basics::MatrixComplexF *>(lua_State *L, Basics::MatrixComplexF *value);
+
+  template<> bool LuaTable::
+  checkType<Basics::MatrixComplexF *>(lua_State *L, int idx);
+}
+
 #endif // MATRIXCOMPLEXF_H
diff --git a/packages/basics/matrix/c_src/matrixDouble.cc b/packages/basics/matrix/c_src/matrixDouble.cc
index f866a2d7b..2337a1653 100644
--- a/packages/basics/matrix/c_src/matrixDouble.cc
+++ b/packages/basics/matrix/c_src/matrixDouble.cc
@@ -68,13 +68,6 @@ namespace Basics {
 
   } // namespace MatrixIO
   
-  template<>
-  double Matrix<double>::
-  getTemplateOption(const AprilUtils::GenericOptions *options,
-                    const char *name, double default_value) {
-    return options->getOptionalDouble(name, default_value);
-  }
-
   /////////////////////////////////////////////////////////////////////////
   
   template class Matrix<double>;
diff --git a/packages/basics/matrix/c_src/matrixDouble.h b/packages/basics/matrix/c_src/matrixDouble.h
index 2b731ffbc..6665f0871 100644
--- a/packages/basics/matrix/c_src/matrixDouble.h
+++ b/packages/basics/matrix/c_src/matrixDouble.h
@@ -55,11 +55,20 @@ namespace Basics {
     
   } // namespace MatrixIO
 
-  template<>
-  double Matrix<double>::
-  getTemplateOption(const AprilUtils::GenericOptions *options,
-                    const char *name, double default_value);
+}
+
+////////////////////////////////////////////////////////////////////////////
+
+namespace AprilUtils {
+
+  template<> Basics::MatrixDouble *LuaTable::
+  convertTo<Basics::MatrixDouble *>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<Basics::MatrixDouble *>(lua_State *L, Basics::MatrixDouble *value);
 
+  template<> bool LuaTable::
+  checkType<Basics::MatrixDouble *>(lua_State *L, int idx);
 }
 
 #endif // MATRIX_DOUBLE_H
diff --git a/packages/basics/matrix/c_src/matrixFloat.cc b/packages/basics/matrix/c_src/matrixFloat.cc
index de4275897..eab251403 100644
--- a/packages/basics/matrix/c_src/matrixFloat.cc
+++ b/packages/basics/matrix/c_src/matrixFloat.cc
@@ -77,12 +77,6 @@ namespace Basics {
   
 
   } // namespace MatrixIO
-
-  template<>
-  float Matrix<float>::getTemplateOption(const AprilUtils::GenericOptions *options,
-                                         const char *name, float default_value) {
-    return options->getOptionalFloat(name, default_value);
-  }
   
   template <>
   void Matrix<float>::pruneSubnormalAndCheckNormal() {
diff --git a/packages/basics/matrix/c_src/matrixFloat.h b/packages/basics/matrix/c_src/matrixFloat.h
index 2fd3272b1..bd911be38 100644
--- a/packages/basics/matrix/c_src/matrixFloat.h
+++ b/packages/basics/matrix/c_src/matrixFloat.h
@@ -22,6 +22,7 @@
 #ifndef MATRIXFLOAT_H
 #define MATRIXFLOAT_H
 
+#include "lua_table.h"
 #include "matrix.h"
 
 namespace Basics {
@@ -55,11 +56,7 @@ namespace Basics {
     /**************************************************************************/
  
   } // namespace MatrixIO
-  
-  template<>
-  float Matrix<float>::getTemplateOption(const AprilUtils::GenericOptions *options,
-                                         const char *name, float default_value);
-  
+    
   //////////////////////////////////////////////////////////////////////////
   
   template <>
@@ -71,4 +68,18 @@ namespace Basics {
 
 }
 
+////////////////////////////////////////////////////////////////////////////
+
+namespace AprilUtils {
+
+  template<> Basics::MatrixFloat *LuaTable::
+  convertTo<Basics::MatrixFloat *>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<Basics::MatrixFloat *>(lua_State *L, Basics::MatrixFloat *value);
+
+  template<> bool LuaTable::
+  checkType<Basics::MatrixFloat *>(lua_State *L, int idx);
+}
+
 #endif // MATRIXFLOAT_H
diff --git a/packages/basics/matrix/c_src/matrixInt32.cc b/packages/basics/matrix/c_src/matrixInt32.cc
index d65e207f5..3b41e1f40 100644
--- a/packages/basics/matrix/c_src/matrixInt32.cc
+++ b/packages/basics/matrix/c_src/matrixInt32.cc
@@ -69,13 +69,6 @@ namespace Basics {
 
   } // namespace MatrixIO
   
-  template<>
-  int32_t Matrix<int32_t>::
-  getTemplateOption(const AprilUtils::GenericOptions *options,
-                    const char *name, int32_t default_value) {
-    return options->getOptionalInt32(name, default_value);
-  }
-
   /////////////////////////////////////////////////////////////////////////////
   
   template class Matrix<int32_t>;
diff --git a/packages/basics/matrix/c_src/matrixInt32.h b/packages/basics/matrix/c_src/matrixInt32.h
index e691943d7..00e495705 100644
--- a/packages/basics/matrix/c_src/matrixInt32.h
+++ b/packages/basics/matrix/c_src/matrixInt32.h
@@ -52,11 +52,6 @@ namespace Basics {
                                           AprilIO::StreamInterface *stream);
 
   } // namespace MatrixIO
-
-  template<>
-  int32_t Matrix<int32_t>::
-  getTemplateOption(const AprilUtils::GenericOptions *options,
-                    const char *name, int32_t default_value);
   
   //////////////////////////////////////////////////////////////////////////////
   
@@ -64,4 +59,18 @@ namespace Basics {
 
 } // namespace Basics
 
+////////////////////////////////////////////////////////////////////////////
+
+namespace AprilUtils {
+
+  template<> Basics::MatrixInt32 *LuaTable::
+  convertTo<Basics::MatrixInt32 *>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<Basics::MatrixInt32 *>(lua_State *L, Basics::MatrixInt32 *value);
+
+  template<> bool LuaTable::
+  checkType<Basics::MatrixInt32 *>(lua_State *L, int idx);
+}
+
 #endif // MATRIX_INT_H
diff --git a/packages/basics/matrix/c_src/matrixSet.h b/packages/basics/matrix/c_src/matrixSet.h
deleted file mode 100644
index 86fce2fea..000000000
--- a/packages/basics/matrix/c_src/matrixSet.h
+++ /dev/null
@@ -1,373 +0,0 @@
-/*
- * This file is part of APRIL-ANN toolkit (A
- * Pattern Recognizer In Lua with Artificial Neural Networks).
- *
- * Copyright 2014, Francisco Zamora-Martinez
- *
- * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
- * under the terms of the GNU General Public License version 3 as
- * published by the Free Software Foundation
- *
- * This library is distributed in the hope that it will be useful, but WITHOUT
- * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
- * for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this library; if not, write to the Free Software Foundation,
- * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
- *
- */
-
-#ifndef MATRIXSET_H
-#define MATRIXSET_H
-
-#include <cmath>
-
-#include "aux_hash_table.h"
-#include "hash_table.h"
-#include "matrix.h"
-#include "matrixFloat.h"
-#include "maxmin.h"
-#include "mystring.h"
-#include "referenced.h"
-#include "smart_ptr.h"
-#include "sparse_matrix.h"
-#include "sparse_matrixFloat.h"
-
-namespace Basics {
-
-  /**
-   * The class MatrixSet is a hash map of string=>Matrix<T>, allowing to compute
-   * math operations to all the underlying matrices, or between two MatrixSet.
-   */
-  template<typename T>
-    class MatrixSet : public Referenced {
-  public:
-
-    ///////////////////////////////////////////////////////////////////////
-    
-    class Value {
-    public:
-      Value() {}
-      Value(Matrix<T> *m) : dense(m) {}
-      Value(SparseMatrix<T> *m) : sparse(m) {}
-      bool isSparse() const { return !sparse.empty(); }
-      bool empty() const { return sparse.empty() && dense.empty(); }
-      void assign(Matrix<T> *m) {
-        dense.reset(m);
-        sparse.reset();
-      }
-      void assign(SparseMatrix<T> *m) {
-        sparse.reset(m);
-        dense.reset();
-      }
-      AprilUtils::SharedPtr< Matrix<T> > &checkDense() {
-        if (dense.empty()) ERROR_EXIT(128, "Impossible to retrive a dense matrix\n");
-        return dense;
-      }
-      AprilUtils::SharedPtr< SparseMatrix<T> > &checkSparse() {
-        if (sparse.empty()) ERROR_EXIT(128, "Impossible to retrive a sparse matrix\n");
-        return sparse;
-      }
-      AprilUtils::SharedPtr< Matrix<T> > &getDense() {
-        return dense;
-      }
-      AprilUtils::SharedPtr< SparseMatrix<T> > &getSparse() {
-        return sparse;
-      }
-      const AprilUtils::SharedPtr< Matrix<T> > &getDense() const {
-        return dense;
-      }
-      const AprilUtils::SharedPtr< SparseMatrix<T> > &getSparse() const {
-        return sparse;
-      }
-    private:
-      AprilUtils::SharedPtr< Matrix<T> > dense;
-      AprilUtils::SharedPtr< SparseMatrix<T> > sparse;
-    };
-    
-    ///////////////////////////////////////////////////////////////////////
-    
-  private:
-    typedef AprilUtils::hash<AprilUtils::string, Value> DictType;
-    DictType matrix_dict;
-  
-  public:
-    typedef typename DictType::iterator       iterator;
-    typedef typename DictType::const_iterator const_iterator;
-
-    //
-
-    MatrixSet() : matrix_dict(32, 2.0f) { }
-    virtual ~MatrixSet() { }
-
-    iterator begin() { return matrix_dict.begin(); }
-
-    iterator end()   { return matrix_dict.end(); }
-
-    MatrixSet<T> *clone() {
-      MatrixSet<T> *cloned = new MatrixSet<T>();
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        if (it->second.isSparse()) {
-          cloned->insert(it->first, it->second.getSparse()->clone());
-        }
-        else {
-          cloned->insert(it->first, it->second.checkDense()->clone());
-        }
-      }
-      return cloned;
-    }
-
-    MatrixSet<T> *cloneOnlyDims() {
-      MatrixSet<T> *cloned = new MatrixSet<T>();
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        if (it->second.isSparse())
-          ERROR_EXIT(256, "Impossible to cloneOnlyDims of MatrixSet objects "
-                     "with sparse matrices\n");
-        cloned->insert(it->first, it->second.checkDense()->cloneOnlyDims());
-      }
-      return cloned;
-    }
-
-    // operator[]
-    Value &operator[](const char *k) {
-      return matrix_dict[AprilUtils::string(k)];
-    }
-    Value &operator[](const AprilUtils::string &k) {
-      return matrix_dict[k];
-    }
-    // insert operation
-    void insert(const char *k, Matrix<T> *v) {
-      return insert(AprilUtils::string(k), v);
-    }
-    void insert(const AprilUtils::string &k, Matrix<T> *v) {
-      Value &old = matrix_dict[k];
-      old.assign(v);
-    }
-    void insert(const char *k, SparseMatrix<T> *v) {
-      return insert(AprilUtils::string(k), v);
-    }
-    void insert(const AprilUtils::string &k, SparseMatrix<T> *v) {
-      Value &old = matrix_dict[k];
-      old.assign(v);
-    }
-    // find operation
-    Value *find(const char *k) const {
-      return find(AprilUtils::string(k));
-    }
-    Value *find(const AprilUtils::string &k) const {
-      Value *ptr = matrix_dict.find(k);
-      return (ptr!=0) ? ptr : 0;
-    }
-    // matrix component-wise operators macros
-#define MAKE_N0_OPERATOR(NAME,FUNC)                                         \
-    void NAME() {                                                       \
-      for (iterator it = matrix_dict.begin();                           \
-           it!=matrix_dict.end(); ++it) {                               \
-        if (it->second.isSparse())                                      \
-          ERROR_EXIT(256, "Impossible to execute operators with sparse matrices\n"); \
-        AprilMath::MatrixExt::Operations::FUNC(it->second.checkDense().get()); \
-      }                                                                 \
-    }
-#define MAKE_N1_OPERATOR(NAME,FUNC,TYPE1)                               \
-    void NAME(const TYPE1 &v1) {                                        \
-      for (iterator it = matrix_dict.begin();                           \
-           it!=matrix_dict.end(); ++it) {                               \
-        if (it->second.isSparse())                                      \
-          ERROR_EXIT(256, "Impossible to execute operators with sparse matrices\n"); \
-        AprilMath::MatrixExt::Operations::FUNC(it->second.checkDense().get(), v1); \
-      }                                                                 \
-    }
-#define MAKE_N2_OPERATOR(NAME,FUNC,TYPE1,TYPE2)                         \
-    void NAME(const TYPE1 &v1, const TYPE2 &v2) {                       \
-      for (iterator it = matrix_dict.begin();                           \
-           it!=matrix_dict.end(); ++it) {                               \
-        if (it->second.isSparse())                                      \
-          ERROR_EXIT(256, "Impossible to execute operators with sparse matrices\n"); \
-        AprilMath::MatrixExt::Operations::FUNC(it->second.checkDense().get(),v1,v2); \
-      }                                                                 \
-    }
-    // matrix component-wise operators declaration
-    MAKE_N1_OPERATOR(fill,matFill,T);
-    MAKE_N2_OPERATOR(clamp,matClamp,T,T);
-    MAKE_N0_OPERATOR(zeros,matZeros);
-    MAKE_N0_OPERATOR(ones,matOnes);
-    MAKE_N1_OPERATOR(scalarAdd,matScalarAdd,T);
-    MAKE_N0_OPERATOR(plogp,matPlogp);
-    MAKE_N0_OPERATOR(log,matLog);
-    MAKE_N0_OPERATOR(log1p,matLog1p);
-    MAKE_N0_OPERATOR(exp,matExp);
-    MAKE_N0_OPERATOR(sqrt,matSqrt);
-    MAKE_N1_OPERATOR(pow,matPow,T);
-    MAKE_N0_OPERATOR(tan,matTan);
-    MAKE_N0_OPERATOR(tanh,matTanh);
-    MAKE_N0_OPERATOR(atan,matAtan);
-    MAKE_N0_OPERATOR(atanh,matAtanh);
-    MAKE_N0_OPERATOR(cos,matCos);
-    MAKE_N0_OPERATOR(cosh,matCosh);
-    MAKE_N0_OPERATOR(acos,matAcos);
-    MAKE_N0_OPERATOR(acosh,matAcosh);
-    MAKE_N0_OPERATOR(sin,matSin);
-    MAKE_N0_OPERATOR(sinh,matSinh);
-    MAKE_N0_OPERATOR(asin,matAsin);
-    MAKE_N0_OPERATOR(asinh,matAsinh);
-    MAKE_N0_OPERATOR(abs,matAbs);
-    MAKE_N0_OPERATOR(complement,matComplement);
-    MAKE_N0_OPERATOR(sign,matSign);
-    MAKE_N1_OPERATOR(scal,matScal,T);
-    MAKE_N2_OPERATOR(adjustRange,matAdjustRange,T,T);
-    MAKE_N0_OPERATOR(inv,matInv);
-#undef MAKE_N1_OPERATOR
-#undef MAKE_N2_OPERATOR
-
-    void pruneSubnormalAndCheckNormal() {
-      for (iterator it = matrix_dict.begin();
-           it!=matrix_dict.end(); ++it) {
-        if (it->second.isSparse())
-          ERROR_EXIT(256, "Impossible to execute operators with sparse matrices\n");
-        it->second.checkDense()->pruneSubnormalAndCheckNormal();
-      }
-    }
-    
-    // two matrix basic math operator macros
-#define MAKE_OPERATOR(NAME,FUNC)                                            \
-    void NAME(const MatrixSet<T> *other) {                              \
-      for (iterator it = matrix_dict.begin();                           \
-           it!=matrix_dict.end(); ++it) {                               \
-        Value &a = it->second;                                          \
-        const Value *b = other->find(it->first);                        \
-        if (a.isSparse() || b->isSparse())                              \
-          ERROR_EXIT(256, "Impossible to execute operators with sparse matrices\n"); \
-        if (b->empty())                                                 \
-          ERROR_EXIT1(128, "Matrix with name %s not found\n",           \
-                      it->first.c_str());                               \
-        AprilMath::MatrixExt::Operations::FUNC(a.getDense().get(),      \
-                                               b->getDense().get());    \
-      }                                                                 \
-    }
-    // two matrix basic math operator declarations
-    MAKE_OPERATOR(cmul,matCmul);
-    MAKE_OPERATOR(copy,matCopy);
-#undef MAKE_OPERATOR
-
-    // AXPY
-    void axpy(T alpha, const MatrixSet<T> *other) {
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        Value &a = it->second;
-        const Value *b = other->find(it->first);
-        if (b->empty())
-          ERROR_EXIT1(128, "Matrix with name %s not found\n",
-                      it->first.c_str());
-        if (a.isSparse() || b->isSparse())
-          ERROR_EXIT(256, "Impossible to execute operators with sparse matrices\n");
-        AprilMath::MatrixExt::Operations::matAxpy(a.getDense().get(), alpha,
-                                                  b->getDense().get());
-      }
-    }
-
-    // EQUALS
-    void equals(const MatrixSet<T> *other, T epsilon) {
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        const Value &a = it->second;
-        const Value *b = other->find(it->first);
-        if (b->empty())
-          ERROR_EXIT1(128, "Matrix with name %s not found\n",
-                      it->first.c_str());
-        if (a.isSparse() != b->isSparse())
-          ERROR_EXIT(256, "Impossible to execute operators with different matrix types\n");
-        if (a.isSparse())
-          AprilMath::MatrixExt::Operations::matEquals(a.getSparse().get(),
-                                                      b->getSparse().get(),
-                                                      epsilon);
-        else
-          AprilMath::MatrixExt::Operations::matEquals(a.getDense().get(),
-                                                      b->getDense().get(),
-                                                      epsilon);
-      }
-    }
-
-    // matrix math reductions
-    T norm2() {
-      T result_norm2 = T();
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        T current_norm2;
-        Value &a = it->second;
-        if (a.isSparse()) {
-          current_norm2 = AprilMath::MatrixExt::Operations::
-            matNorm2(it->second.getSparse().get());
-        }
-        else {
-          current_norm2 = AprilMath::MatrixExt::Operations::
-            matNorm2(it->second.checkDense().get());
-        }
-        result_norm2 = result_norm2 + current_norm2*current_norm2;
-      }
-      return result_norm2;
-    }
-
-    // matrix math reductions
-    int size() {
-      int total_size = 0;
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        Value &a = it->second;
-        if (a.isSparse())
-          total_size += it->second.getSparse()->size();
-        else
-          total_size += it->second.checkDense()->size();
-      }
-      return total_size;
-    }
-
-    // dot reduction
-    T dot(MatrixSet<T> *other) {
-      T result = T();
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        Value &va = it->second;
-        Value *vb = other->find(it->first);
-        if (vb->empty())
-          ERROR_EXIT1(128, "Matrix with name %s not found\n",
-                      it->first.c_str());
-        if (va.isSparse() || vb->isSparse())
-          ERROR_EXIT(256, "Impossible to execute operators with sparse matrices\n");
-        AprilUtils::SharedPtr< Matrix<T> > a = va.checkDense(), b = vb->checkDense();
-        if (!a->getIsContiguous()) a = a->clone();
-        if (!b->getIsContiguous()) b = b->clone();
-        int a_size = a->size();
-        int b_size = b->size();
-        a = a->rewrap(&a_size, 1);
-        b = b->rewrap(&b_size, 1);
-        result = result + AprilMath::MatrixExt::Operations::matDot(a.get(),
-                                                                   b.get());
-      }
-      return result;
-    }
-
-    char *toLuaString() {
-      AprilUtils::SharedPtr<AprilIO::CStringStream> stream(new AprilIO::CStringStream());
-      AprilUtils::HashTableOptions options;
-      options.putBoolean("ascii", false);
-      stream->put("matrix.dict{ ");
-      for (iterator it = matrix_dict.begin(); it!=matrix_dict.end(); ++it) {
-        stream->printf("[\"%s\"] = ", it->first.c_str());
-        Value &a = it->second;
-        if (a.isSparse()) {
-          stream->put("matrix.sparse.fromString[[");
-          a.getSparse()->write(stream.get(), &options);
-          stream->put("]],");
-        }
-        else {
-          stream->put("matrix.fromString[[");
-          a.getDense()->write(stream.get(), &options);
-          stream->put("]],");
-        }
-      }
-      stream->put(" }\0", 3); // forces a \0 at the end of the buffer
-      return stream->releaseString();
-    }
-    
-  };
-
-} // namespace Basics
-
-#endif // MATRIXSET_H
diff --git a/packages/basics/matrix/c_src/matrix_operations.cu b/packages/basics/matrix/c_src/matrix_operations.cu
index 1f339237c..468a8efca 100644
--- a/packages/basics/matrix/c_src/matrix_operations.cu
+++ b/packages/basics/matrix/c_src/matrix_operations.cu
@@ -421,9 +421,7 @@ namespace AprilMath {
                          const Matrix<T> *otherA,
                          const Matrix<T> *otherB,
                          T beta) {
-        if (C->getTransposedFlag()) {
-          ERROR_EXIT(128, "GEMM method don't work with transposed C matrix\n");
-        }
+        CBLAS_ORDER order = CblasRowMajor;
         if (C == otherA || C == otherB) {
           ERROR_EXIT(128, "GEMM method couldn't receive as A or B argument "
                      "the C argument\n");
@@ -433,42 +431,48 @@ namespace AprilMath {
             otherB->getNumDim() != 2) {
           ERROR_EXIT(128,"Incorrect number of dimensions, only allowed for numDim=2\n");
         }
-        int row_idx_A = 0, col_idx_A = 1, row_idx_B = 0, col_idx_B = 1;
+        int row_idx_A = 0, col_idx_A = 1;
+        int row_idx_B = 0, col_idx_B = 1;
+        //
+        const int *A_stride = otherA->getStridePtr();
+        const int *B_stride = otherB->getStridePtr();
+        const int *C_stride = C->getStridePtr();
+        if (C_stride[1] != 1) order = CblasColMajor;
+        //
+        int lda = AprilUtils::max(A_stride[0], A_stride[1]);
+        int ldb = AprilUtils::max(B_stride[0], B_stride[1]);
+        int ldc = AprilUtils::max(C_stride[0], C_stride[1]);
+        if (A_stride[0] + A_stride[1] != lda+1 ||
+            B_stride[0] + B_stride[1] != ldb+1 ||
+            C_stride[0] + C_stride[1] != ldc+1) {
+          ERROR_EXIT(128, "Only allowed with contiguous matrices in leading dimension\n");
+        }
+        //
+        const int *A_dim = otherA->getDimPtr();
+        const int *B_dim = otherB->getDimPtr();
+        const int *C_dim = C->getDimPtr();
+        //
         if (trans_A == CblasTrans) AprilUtils::swap(row_idx_A, col_idx_A);
         if (trans_B == CblasTrans) AprilUtils::swap(row_idx_B, col_idx_B);
-        if (C->getDimSize(0) != otherA->getDimSize(row_idx_A) ||
-            C->getDimSize(1) != otherB->getDimSize(col_idx_B) ||
-            otherA->getDimSize(col_idx_A) != otherB->getDimSize(row_idx_B)) {
+        if (C_dim[0] != A_dim[row_idx_A] ||
+            C_dim[1] != B_dim[col_idx_B] ||
+            A_dim[col_idx_A] != B_dim[row_idx_B]) {
           ERROR_EXIT6(128, "Incorrect matrixes dimensions: %dx%d + %dx%d * %dx%d\n",
-                      C->getDimSize(0), C->getDimSize(1),
-                      otherA->getDimSize(row_idx_A), otherA->getDimSize(col_idx_A),
-                      otherB->getDimSize(row_idx_B), otherB->getDimSize(col_idx_B));
+                      C_dim[0], C_dim[1],
+                      A_dim[row_idx_A], A_dim[col_idx_A],
+                      B_dim[row_idx_B], B_dim[col_idx_B]);
         }
-        if (C->getMajorOrder() != otherA->getMajorOrder() ||
-            otherA->getMajorOrder() != otherB->getMajorOrder()) {
-          ERROR_EXIT(128, "Matrices with different major orders\n");
-        }
-  
-        int M=C->getDimSize(0), N=C->getDimSize(1), K=otherA->getDimSize(col_idx_A);
-        int lda, ldb, ldc;
-        if (C->getMajorOrder() == CblasRowMajor) {
-          lda = (!otherA->getTransposedFlag())?(otherA->getStrideSize(0)):(otherA->getStrideSize(1));
-          ldb = (!otherB->getTransposedFlag())?(otherB->getStrideSize(0)):(otherB->getStrideSize(1));
-          ldc = (!C->getTransposedFlag())?(C->getStrideSize(0)):(C->getStrideSize(1));
+        int M = C_dim[0], N=C_dim[1];
+        int K = A_dim[col_idx_A];
+        if (order == CblasRowMajor) {
+          if (A_stride[1] != 1) trans_A = NEGATE_CBLAS_TRANSPOSE(trans_A);
+          if (B_stride[1] != 1) trans_B = NEGATE_CBLAS_TRANSPOSE(trans_B);
         }
         else {
-          lda = (!otherA->getTransposedFlag())?(otherA->getStrideSize(1)):(otherA->getStrideSize(0));
-          ldb = (!otherB->getTransposedFlag())?(otherB->getStrideSize(1)):(otherB->getStrideSize(0));
-          ldc = (!C->getTransposedFlag())?(C->getStrideSize(1)  ):(C->getStrideSize(0));
-        }
-        if (otherA->getStrideSize(0) + otherA->getStrideSize(1) != lda+1 ||
-            otherB->getStrideSize(0) + otherB->getStrideSize(1) != ldb+1 ||
-            C->getStrideSize(0)      + C->getStrideSize(1)      != ldc+1) {
-          ERROR_EXIT(128, "Contiguous matrices are needed\n");
-        }
-        if (otherA->getTransposedFlag()) trans_A=NEGATE_CBLAS_TRANSPOSE(trans_A);
-        if (otherB->getTransposedFlag()) trans_B=NEGATE_CBLAS_TRANSPOSE(trans_B);
-        doGemm(C->getMajorOrder(), trans_A, trans_B,
+          if (A_stride[0] != 1) trans_A = NEGATE_CBLAS_TRANSPOSE(trans_A);
+          if (B_stride[0] != 1) trans_B = NEGATE_CBLAS_TRANSPOSE(trans_B);
+        }
+        doGemm(order, trans_A, trans_B,
                M, N, K,
                alpha, otherA->getRawDataAccess(), lda,
                otherB->getRawDataAccess(), ldb,
@@ -483,11 +487,11 @@ namespace AprilMath {
       Matrix<T> *matSparseMM(Matrix<T> *C,
                              CBLAS_TRANSPOSE trans_A,
                              CBLAS_TRANSPOSE trans_B,
-                             CBLAS_TRANSPOSE trans_C,
                              const T alpha,
                              const SparseMatrix<T> *otherA,
                              const Matrix<T> *otherB,
                              T beta) {
+        CBLAS_ORDER order = CblasRowMajor;
         if (C == otherB) {
           ERROR_EXIT(128, "Sparse GEMM method couldn't receive as A or B argument "
                      "the C argument\n");
@@ -497,43 +501,47 @@ namespace AprilMath {
             otherB->getNumDim() != 2) {
           ERROR_EXIT(128,"Incorrect number of dimensions, only allowed for numDim=2\n");
         }
-        int row_idx_A = 0, col_idx_A = 1, row_idx_B = 0, col_idx_B = 1;
-        int row_idx_C = 0, col_idx_C = 1;
+        int row_idx_A = 0, col_idx_A = 1;
+        int row_idx_B = 0, col_idx_B = 1;
+        //
+        const int *B_stride = otherB->getStridePtr();
+        const int *C_stride = C->getStridePtr();
+        if (C_stride[1] != 1) order = CblasColMajor;
+        //
+        int ldb = AprilUtils::max(B_stride[0], B_stride[1]);
+        int ldc = AprilUtils::max(C_stride[0], C_stride[1]);
+        if (B_stride[0] + B_stride[1] != ldb+1 ||
+            C_stride[0] + C_stride[1] != ldc+1) {
+          ERROR_EXIT(128, "Only allowed with contiguous matrices in leading dimension\n");
+        }
+        //
+        const int *A_dim = otherA->getDimPtr();
+        const int *B_dim = otherB->getDimPtr();
+        const int *C_dim = C->getDimPtr();
+        //
         if (trans_A == CblasTrans) AprilUtils::swap(row_idx_A, col_idx_A);
         if (trans_B == CblasTrans) AprilUtils::swap(row_idx_B, col_idx_B);
-        if (trans_C == CblasTrans) AprilUtils::swap(row_idx_C, col_idx_C);
-        if (C->getDimSize(row_idx_C) != otherA->getDimSize(row_idx_A) ||
-            C->getDimSize(col_idx_C) != otherB->getDimSize(col_idx_B) ||
-            otherA->getDimSize(col_idx_A) != otherB->getDimSize(row_idx_B)) {
+        //
+        if (C_dim[0] != A_dim[row_idx_A] ||
+            C_dim[1] != B_dim[col_idx_B] ||
+            A_dim[col_idx_A] != B_dim[row_idx_B]) {
           ERROR_EXIT6(128, "Incorrect matrixes dimensions: %dx%d + %dx%d * %dx%d\n",
-                      C->getDimSize(row_idx_C), C->getDimSize(col_idx_C),
-                      otherA->getDimSize(row_idx_A), otherA->getDimSize(col_idx_A),
-                      otherB->getDimSize(row_idx_B), otherB->getDimSize(col_idx_B));
+                      C_dim[0], C_dim[1],
+                      A_dim[row_idx_A], A_dim[col_idx_A],
+                      B_dim[row_idx_B], B_dim[col_idx_B]);
         }
-        if (C->getMajorOrder() != otherB->getMajorOrder()) {
-          ERROR_EXIT(128, "Matrices with different major orders\n"); 
-        }
-        int M=C->getDimSize(row_idx_C), N=C->getDimSize(col_idx_C), K=otherB->getDimSize(row_idx_B);
-        int ldb, ldc;
-        if (C->getMajorOrder() == CblasRowMajor) {
-          ldb = (!otherB->getTransposedFlag())?(otherB->getStrideSize(0)):(otherB->getStrideSize(1));
-          ldc = (!C->getTransposedFlag())?(C->getStrideSize(0)):(C->getStrideSize(1));
+        int M=C_dim[0], N=C_dim[1];
+        int K=B_dim[row_idx_B];
+        if (order == CblasRowMajor) {
+          if (B_stride[1] != 1) trans_B = NEGATE_CBLAS_TRANSPOSE(trans_B);
         }
         else {
-          ldb = (!otherB->getTransposedFlag())?(otherB->getStrideSize(1)):(otherB->getStrideSize(0));
-          ldc = (!C->getTransposedFlag())?(C->getStrideSize(1)):(C->getStrideSize(0));
-        }
-        if (otherB->getStrideSize(0)+ otherB->getStrideSize(1) != ldb+1 ||
-            C->getStrideSize(0)     + C->getStrideSize(1)      != ldc+1) {
-          ERROR_EXIT(128, "Contiguous matrices are needed\n");
+          if (B_stride[0] != 1) trans_B = NEGATE_CBLAS_TRANSPOSE(trans_B);
         }
-        if (otherB->getTransposedFlag()) trans_B=NEGATE_CBLAS_TRANSPOSE(trans_B);
-        if (C->getTransposedFlag())      trans_C=NEGATE_CBLAS_TRANSPOSE(trans_C);
-        doSparseMM<T>(C->getMajorOrder(),
+        doSparseMM<T>(order,
                       otherA->getSparseFormat(),
                       trans_A,
                       trans_B,
-                      trans_C,
                       M, N, K,
                       alpha,
                       otherA->getRawValuesAccess(),
@@ -554,42 +562,36 @@ namespace AprilMath {
                          const Matrix<T> *otherA,
                          const Matrix<T> *otherX,
                          const T beta) {
+        CBLAS_ORDER order = CblasRowMajor;
         if (!Y->isVector() || !otherX->isVector() || otherA->getNumDim() != 2) {
           ERROR_EXIT(128,"Incorrect number of dimensions\n");
         }
-        int M,N;
-        if (otherA->getTransposedFlag()) {
-          trans_A=NEGATE_CBLAS_TRANSPOSE(trans_A);
-          M=otherA->getDimSize(1);
-          N=otherA->getDimSize(0);
-        }else {
-          M=otherA->getDimSize(0);
-          N=otherA->getDimSize(1);
+        int M, N;
+        const int *A_stride = otherA->getStridePtr();
+        int lda = AprilUtils::max(A_stride[0],A_stride[1]);
+        if (A_stride[0]+A_stride[1] != lda+1) {
+          ERROR_EXIT(128, "Only allowed with contiguous matrices in leading dimension\n");
         }
+        if (A_stride[1] != 1) order = CblasColMajor;
+        M = otherA->getDimSize(0);
+        N = otherA->getDimSize(1);
         // SANITY CHECK
-        if (trans_A == CblasNoTrans) {
-          if (M != Y->size() || N != otherX->size()) {
+        if (trans_A == CblasTrans) {
+          if (N != Y->size() || M != otherX->size()) {
             ERROR_EXIT4(128, "Incorrect matrixes dimensions: %dx1 + %dx%d * %dx1\n",
-                        Y->size(), M, N, otherX->size());
+                        Y->size(), N, M, otherX->size());
           }
         }
         else {
-          if (N != Y->size() || M != otherX->size())
+          if (M != Y->size() || N != otherX->size()) {
             ERROR_EXIT4(128, "Incorrect matrixes dimensions: %dx1 + %dx%d * %dx1\n",
-                        Y->size(), N, M, otherX->size());
-        }
-        if (Y->getMajorOrder() != otherA->getMajorOrder() ||
-            otherA->getMajorOrder() != otherX->getMajorOrder()) {
-          ERROR_EXIT(128, "Matrices with different major orders\n");
+                        Y->size(), M, N, otherX->size());
+          }
         }
         //
-        int lda=(otherA->getIsDataRowOrdered())?otherA->getStrideSize(0):otherA->getStrideSize(1);
         int ldx=otherX->getVectorStride();
         int ldy=Y->getVectorStride();
-        if (otherA->getStrideSize(0) + otherA->getStrideSize(1) != lda+1) {
-          ERROR_EXIT(128, "Only allowed with contiguous matrices\n");
-        }
-        doGemv(Y->getMajorOrder(), trans_A,
+        doGemv(order, trans_A,
                M, N,
                alpha, otherA->getRawDataAccess(), lda,
                otherX->getRawDataAccess(), ldx,
@@ -649,25 +651,21 @@ namespace AprilMath {
                         const T alpha,
                         const Matrix<T> *otherX,
                         const Matrix<T> *otherY) {
-        if (A->getTransposedFlag()) {
-          ERROR_EXIT(128, "GER method don't work with transposed A matrix\n");
-        }
+        CBLAS_ORDER order = CblasRowMajor;
         if (!otherX->isVector() || !otherY->isVector() || A->getNumDim()!=2) {
           ERROR_EXIT(128,"Incorrect number of dimensions\n");
         }
+        const int *A_stride = A->getStridePtr();
+        int lda = AprilUtils::max(A_stride[0],A_stride[1]);
+        if (A->getStrideSize(1) != 1) order = CblasColMajor;
         int M=otherX->size(), N=otherY->size();
         if (A->getDimSize(0) != M || A->getDimSize(1) != N) {
           ERROR_EXIT4(128, "Incorrect matrixes dimensions: %dx%d + %dx1 * 1x%d\n",
                       A->getDimSize(0), A->getDimSize(1), M, N);
         }
-        if (A->getMajorOrder() != otherX->getMajorOrder() ||
-            otherX->getMajorOrder() != otherY->getMajorOrder()) {
-          ERROR_EXIT(128, "Matrices with different major orders\n");
-        }
-        int lda=(A->getIsDataRowOrdered())?A->getStrideSize(0):A->getStrideSize(1);
         int ldx=otherX->getVectorStride();
         int ldy=otherY->getVectorStride();
-        doGer(A->getMajorOrder(),
+        doGer(order,
               M, N,
               alpha, otherX->getRawDataAccess(), otherX->getOffset(), ldx,
               otherY->getRawDataAccess(), otherY->getOffset(), ldy,
@@ -683,9 +681,6 @@ namespace AprilMath {
           ERROR_EXIT2(128, "Incorrect dimensions: %d dot %d\n",
                       X->size(), Y->size());
         }
-        if (X->getMajorOrder() != Y->getMajorOrder()) {
-          ERROR_EXIT(128, "Matrices with different major orders\n");
-        }
         return MatrixSpanReduce2(X, Y, doDot< T, AprilMath::Functors::r_add<T,T> >,
                                  AprilMath::Functors::r_add<T,T>(),
                                  T(0.0f));
@@ -948,26 +943,15 @@ namespace AprilMath {
       // FIXME: using WRAPPER
       template<typename T>
       void matMinAndMax(const Matrix<T> *obj, T &min, T &max) {
-        if (obj->getMajorOrder() == CblasRowMajor) {
-          typename Matrix<T>::const_iterator it(obj->begin());
-          min = *it;
-          max = *it;
-          for (; it!=obj->end(); ++it) {
-            if (*it < min) min = *it;
-            if (*it > max) max = *it;
-          }
-        }
-        else {
-          typename Matrix<T>::const_col_major_iterator it(obj->begin());
-          min = *it;
-          max = *it;
-          for (; it!=obj->end(); ++it) {
-            if (*it < min) min = *it;
-            if (*it > max) max = *it;
-          }
+        typename Matrix<T>::const_iterator it(obj->begin());
+        min = *it;
+        max = *it;
+        for (; it!=obj->end(); ++it) {
+          if (*it < min) min = *it;
+          if (*it > max) max = *it;
         }
       }
-    
+      
       template<typename T>
       void matMinAndMax(const SparseMatrix<T> *obj, T &min, T &max) {
         typename SparseMatrix<T>::const_iterator it(obj->begin());
@@ -990,8 +974,7 @@ namespace AprilMath {
                       dim, obj->getNumDim());
         }
         if (result == 0) {
-          result = new Matrix<T>(1, obj->getDimSize(dim),
-                                 obj->getMajorOrder());
+          result = new Matrix<T>(1, obj->getDimSize(dim));
         }
         else {
           if (result->size()!=obj->getDimSize(dim) || result->getNumDim()!=1) {
@@ -1112,77 +1095,101 @@ namespace AprilMath {
          ZERO/ONE matrix, depending in the truth of the given condition */
     
       template <typename T>
-      Matrix<T> *matLT(Matrix<T> *obj, const T &value,
-                       Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
-        return MatrixScalarMap1<T,T>(obj, m_curried_lt<T>(value), dest);
+      Matrix<bool> *matLT(Matrix<T> *obj, const T &value,
+                          Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
+        return MatrixScalarMap1<T,bool>(obj, m_curried_lt<T>(value), dest);
       }
 
       template <typename T>
-      Matrix<T> *matLT(Matrix<T> *obj,
-                       const Matrix<T> *other,
-                       Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
-        return MatrixScalarMap2<T,T,T>(obj, other,
-                                       AprilMath::Functors::m_lt<T>(), dest);
+      Matrix<bool> *matLT(Matrix<T> *obj,
+                          const Matrix<T> *other,
+                          Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
+        return MatrixScalarMap2<T,T,bool>(obj, other,
+                                          AprilMath::Functors::m_lt<T>(), dest);
       }
 
       template <typename T>
-      Matrix<T> *matGT(Matrix<T> *obj, const T &value,
-                       Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
-        return MatrixScalarMap1<T,T>(obj, m_curried_gt<T>(value), dest);
+      Matrix<bool> *matGT(Matrix<T> *obj, const T &value,
+                          Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
+        return MatrixScalarMap1<T,bool>(obj, m_curried_gt<T>(value), dest);
       }
 
       template <typename T>
-      Matrix<T> *matGT(Matrix<T> *obj,
+      Matrix<bool> *matGT(Matrix<T> *obj,
                        const Matrix<T> *other,
-                       Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
-        return MatrixScalarMap2<T,T,T>(obj, other,
-                                       AprilMath::Functors::m_gt<T>(), dest);
+                       Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
+        return MatrixScalarMap2<T,T,bool>(obj, other,
+                                          AprilMath::Functors::m_gt<T>(), dest);
       }
 
       template <typename T>
-      Matrix<T> *matEQ(Matrix<T> *obj, const T &value,
-                       Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
+      Matrix<bool> *matEQ(Matrix<T> *obj, const T &value,
+                          Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
         if (m_isnan(value)) {
-          return MatrixScalarMap1<T,T>(obj, m_curried_eq_nan<T>(), dest);
+          return MatrixScalarMap1<T,bool>(obj, m_curried_eq_nan<T>(), dest);
         }
         else {
-          return MatrixScalarMap1<T,T>(obj, m_curried_eq<T>(value), dest);
+          return MatrixScalarMap1<T,bool>(obj, m_curried_eq<T>(value), dest);
         }
       }
     
       template <typename T>
-      Matrix<T> *matEQ(Matrix<T> *obj,
-                       const Matrix<T> *other,
-                       Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
-        return MatrixScalarMap2<T,T>(obj, other,
-                                     AprilMath::Functors::m_eq<T>(), dest);
+      Matrix<bool> *matEQ(Matrix<T> *obj,
+                          const Matrix<T> *other,
+                          Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
+        return MatrixScalarMap2<T,T,bool>(obj, other,
+                                          AprilMath::Functors::m_eq<T>(), dest);
       }
     
       template <typename T>
-      Matrix<T> *matNEQ(Matrix<T> *obj, const T &value,
-                        Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
+      Matrix<bool> *matNEQ(Matrix<T> *obj, const T &value,
+                           Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
         if (m_isnan(value)) {
-          return MatrixScalarMap1<T,T>(obj, m_curried_neq_nan<T>(), dest);
+          return MatrixScalarMap1<T,bool>(obj, m_curried_neq_nan<T>(), dest);
         }
         else {
-          return MatrixScalarMap1<T,T>(obj, m_curried_neq<T>(value), dest);
+          return MatrixScalarMap1<T,bool>(obj, m_curried_neq<T>(value), dest);
         }
       }
     
       template <typename T>
-      Matrix<T> *matNEQ(Matrix<T> *obj,
-                        const Matrix<T> *other,
-                        Matrix<T> *dest) {
-        if (dest == 0) dest = obj;
-        return MatrixScalarMap2<T,T>(obj, other,
-                                     AprilMath::Functors::m_neq<T>(), dest);
+      Matrix<bool> *matNEQ(Matrix<T> *obj,
+                           const Matrix<T> *other,
+                           Matrix<bool> *dest) {
+        if (dest == 0) {
+          dest = new Matrix<bool>(obj->getNumDim(),
+                                  obj->getDimPtr());
+        }
+        return MatrixScalarMap2<T,T,bool>(obj, other,
+                                          AprilMath::Functors::m_neq<T>(), dest);
       }
     
       //////////////////// OTHER MATH OPERATIONS ////////////////////
@@ -1212,7 +1219,7 @@ namespace AprilMath {
             // OUTER product
             int dim[2] = {a->size(),b->size()};
             if (c == 0) {
-              c = new Matrix<T>(2, dim, a->getMajorOrder());
+              c = new Matrix<T>(2, dim);
 #ifdef USE_CUDA
               c->setUseCuda(a->getCudaFlag() || b->getCudaFlag());
 #endif
@@ -1227,7 +1234,7 @@ namespace AprilMath {
             // Matrix-Vector product
             int dim[2] = {a->getDimSize(0),1};
             if (c == 0) {
-              c = new Matrix<T>(b->getNumDim(), dim, a->getMajorOrder());
+              c = new Matrix<T>(b->getNumDim(), dim);
 #ifdef USE_CUDA
               c->setUseCuda(a->getCudaFlag() || b->getCudaFlag());
 #endif
@@ -1242,7 +1249,7 @@ namespace AprilMath {
             // DOT product
             int dim[2] = {1,1};
             if (c == 0) {
-              c = new Matrix<T>(a->getNumDim(), dim, a->getMajorOrder());
+              c = new Matrix<T>(a->getNumDim(), dim);
 #ifdef USE_CUDA
               c->setUseCuda(a->getCudaFlag() || b->getCudaFlag());
 #endif
@@ -1259,7 +1266,7 @@ namespace AprilMath {
           // Matrix-Matrix product
           int dim[2] = {a->getDimSize(0), b->getDimSize(1)};
           if (c == 0) {
-            c = new Matrix<T>(2,dim,a->getMajorOrder());
+            c = new Matrix<T>(2,dim);
 #ifdef USE_CUDA
               c->setUseCuda(a->getCudaFlag() || b->getCudaFlag());
 #endif
@@ -1444,21 +1451,21 @@ namespace AprilMath {
       
       Matrix<float> *matInv(const Matrix<float> *obj) {
         if (obj->getNumDim() != 2 || obj->getDimSize(0) != obj->getDimSize(1)) {
-          ERROR_EXIT(128, "Only bi-dimensional matrices are allowed\n");
+          ERROR_EXIT(128, "Only squared bi-dimensional matrices are allowed\n");
         }
-        Matrix<float> *A = obj->clone(CblasColMajor);
+        Matrix<float> *A = obj->clone();
         AprilUtils::UniquePtr<int []> IPIV( new int[obj->getDimSize(0)] );
         int INFO;
-        INFO = clapack_sgetrf(CblasColMajor,
+        INFO = clapack_sgetrf(CblasRowMajor,
                               A->getDimSize(0), A->getDimSize(1),
                               A->getRawDataAccess()->getPPALForReadAndWrite(),
-                              A->getStrideSize(1),
+                              A->getStrideSize(0),
                               IPIV.get());
         checkLapackInfo(INFO);
-        INFO = clapack_sgetri(CblasColMajor,
+        INFO = clapack_sgetri(CblasRowMajor,
                               A->getDimSize(0),
                               A->getRawDataAccess()->getPPALForReadAndWrite(),
-                              A->getStrideSize(1),
+                              A->getStrideSize(0),
                               IPIV.get());
         checkLapackInfo(INFO);
         return A;
@@ -1470,22 +1477,38 @@ namespace AprilMath {
         if (obj->getNumDim() != 2) {
           ERROR_EXIT(128, "Only bi-dimensional matrices are allowed\n");
         }
-        AprilUtils::SharedPtr< Matrix<float> > A( obj->clone(CblasColMajor) );
+        AprilUtils::SharedPtr< Matrix<float> > A( obj->clone() );
+        AprilUtils::SharedPtr< Matrix<float> > AT( A->transpose() );
         int INFO;
         const int m = A->getDimSize(0); // cols
         const int n = A->getDimSize(1); // rows
-        const int lda = A->getStrideSize(1);
         const int numSV = (m<n) ? m : n;
         const int dimsU[2]  = {m, m};
         const int dimsVT[2] = {n, n};
-        *U  = new Matrix<float>(2, dimsU,  CblasColMajor);
-        *S  = SparseMatrix<float>::diag(numSV, 0.0f, CSR_FORMAT);
-        *VT = new Matrix<float>(2, dimsVT, CblasColMajor);
-        INFO = clapack_sgesdd(CblasColMajor, m, n, lda,
-                              A->getRawDataAccess()->getPPALForReadAndWrite(),
-                              (*U)->getRawDataAccess()->getPPALForWrite(),
-                              (*S)->getRawValuesAccess()->getPPALForWrite(),
-                              (*VT)->getRawDataAccess()->getPPALForWrite());
+        GPUMirroredMemoryBlock<float> *S_values =
+          new GPUMirroredMemoryBlock<float>(numSV);
+        GPUMirroredMemoryBlock<int32_t> *S_indices =
+          new GPUMirroredMemoryBlock<int32_t>(numSV);
+        GPUMirroredMemoryBlock<int32_t> *S_first =
+          new GPUMirroredMemoryBlock<int32_t>(m+1);
+        for (int i=0; i<numSV; ++i) {
+          (*S_indices)[i]=i;
+          (*S_first)[i]=i;
+        }
+        for (int i=numSV; i<=m; ++i) {
+          (*S_first)[i]=numSV;
+        }
+        *U  = new Matrix<float>(2, dimsU);
+        *S  = new SparseMatrix<float>(m,n,S_values,S_indices,S_first);
+        *VT = new Matrix<float>(2, dimsVT);
+        AprilUtils::SharedPtr< Matrix<float> > UT( (*VT)->transpose() );
+        AprilUtils::SharedPtr< Matrix<float> > V( (*U)->transpose() );
+        // m,n are changed by n,m because the tranposition of the matrices
+        INFO = clapack_sgesdd(CblasColMajor, n, m, AT->getStrideSize(1),
+                              AT->getRawDataAccess()->getPPALForReadAndWrite(),
+                              UT->getRawDataAccess()->getPPALForWrite(),
+                              S_values->getPPALForWrite(),
+                              V->getRawDataAccess()->getPPALForWrite());
         checkLapackInfo(INFO);
       }
 
@@ -1495,13 +1518,14 @@ namespace AprilMath {
         if (obj->getNumDim() != 2 || obj->getDimSize(0) != obj->getDimSize(1)) {
           ERROR_EXIT(128, "Only squared bi-dimensional matrices are allowed\n");
         }
-        AprilUtils::SharedPtr< Matrix<float> > A( obj->clone(CblasColMajor) );
+        AprilUtils::SharedPtr< Matrix<float> > A( obj->clone() );
+        AprilUtils::SharedPtr< Matrix<float> > AT( A->transpose() ); // in col major
         AprilUtils::UniquePtr<int []> IPIV( new int[A->getDimSize(0)] );
         int INFO;
         INFO = clapack_sgetrf(CblasColMajor,
-                              A->getDimSize(0), A->getDimSize(1),
-                              A->getRawDataAccess()->getPPALForReadAndWrite(),
-                              A->getStrideSize(1),
+                              AT->getDimSize(0), AT->getDimSize(1),
+                              AT->getRawDataAccess()->getPPALForReadAndWrite(),
+                              AT->getStrideSize(1),
                               IPIV.get());
         checkLapackInfo(INFO);
         Matrix<float>::const_random_access_iterator it(A.get());
@@ -1539,13 +1563,14 @@ namespace AprilMath {
         if (obj->getNumDim() != 2 || obj->getDimSize(0) != obj->getDimSize(1)) {
           ERROR_EXIT(128, "Only squared bi-dimensional matrices are allowed\n");
         }
-        AprilUtils::SharedPtr< Matrix<float> > A( obj->clone(CblasColMajor) );
+        AprilUtils::SharedPtr< Matrix<float> > A( obj->clone() );
+        AprilUtils::SharedPtr< Matrix<float> > AT( A->transpose() ); // in col major
         AprilUtils::UniquePtr<int []> IPIV( new int[A->getDimSize(0)] );
         int INFO;
         INFO = clapack_sgetrf(CblasColMajor,
-                              A->getDimSize(0), A->getDimSize(1),
-                              A->getRawDataAccess()->getPPALForReadAndWrite(),
-                              A->getStrideSize(1),
+                              AT->getDimSize(0), AT->getDimSize(1),
+                              AT->getRawDataAccess()->getPPALForReadAndWrite(),
+                              AT->getStrideSize(1),
                               IPIV.get());
         checkLapackInfo(INFO);
         Matrix<float>::const_random_access_iterator it(A.get());
@@ -1586,12 +1611,12 @@ namespace AprilMath {
         if (obj->getNumDim() != 2 || obj->getDimSize(0) != obj->getDimSize(1)) {
           ERROR_EXIT(128, "Only squared bi-dimensional matrices are allowed\n");
         }
-        Matrix<float> *A = obj->clone(CblasColMajor);
-        int INFO = clapack_spotrf(CblasColMajor,
+        Matrix<float> *A = obj->clone();
+        int INFO = clapack_spotrf(CblasRowMajor,
                                   (uplo == 'U') ? CblasUpper : CblasLower,
                                   A->getDimSize(0),
                                   A->getRawDataAccess()->getPPALForReadAndWrite(),
-                                  A->getStrideSize(1));
+                                  A->getStrideSize(0));
         checkLapackInfo(INFO);
         switch(uplo) {
         case 'U':
@@ -1638,7 +1663,7 @@ namespace AprilMath {
 	  }
 	}
 	else {
-	  dest = new Matrix<float>(N+1, dest_size.get(), obj->getMajorOrder());
+	  dest = new Matrix<float>(N+1, dest_size.get());
 #ifdef USE_CUDA
 	  dest->setUseCuda(obj->getCudaFlag());
 #endif
@@ -1720,7 +1745,6 @@ namespace AprilMath {
                                       const Matrix<float> *otherB,
                                       float beta);
       template Matrix<float> *matSparseMM(Matrix<float> *,
-                                          CBLAS_TRANSPOSE,
                                           CBLAS_TRANSPOSE,
                                           CBLAS_TRANSPOSE,
                                           const float,
@@ -1763,24 +1787,24 @@ namespace AprilMath {
                                            Int32GPUMirroredMemoryBlock *,
                                            const int,
                                            Basics::Matrix<float> *);
-      template Matrix<float> *matLT(Matrix<float> *, const float &,
-                                    Matrix<float> *);
+      template Matrix<bool> *matLT(Matrix<float> *, const float &,
+                                   Matrix<bool> *);
 
-      template Matrix<float> *matLT(Matrix<float> *,
-                                    const Matrix<float> *,
-                                    Matrix<float> *);
-      template Matrix<float> *matGT(Matrix<float> *, const float &, Matrix<float> *);
-      template Matrix<float> *matGT(Matrix<float> *,
-                                    const Matrix<float> *, Matrix<float> *);
-      template Matrix<float> *matEQ(Matrix<float> *, const float &, Matrix<float> *);
-      template Matrix<float> *matEQ(Matrix<float> *,
+      template Matrix<bool> *matLT(Matrix<float> *,
+                                   const Matrix<float> *,
+                                   Matrix<bool> *);
+      template Matrix<bool> *matGT(Matrix<float> *, const float &, Matrix<bool> *);
+      template Matrix<bool> *matGT(Matrix<float> *,
+                                   const Matrix<float> *, Matrix<bool> *);
+      template Matrix<bool> *matEQ(Matrix<float> *, const float &, Matrix<bool> *);
+      template Matrix<bool> *matEQ(Matrix<float> *,
+                                   const Matrix<float> *,
+                                   Matrix<bool> *);
+      template Matrix<bool> *matNEQ(Matrix<float> *, const float &,
+                                    Matrix<bool> *);
+      template Matrix<bool> *matNEQ(Matrix<float> *,
                                     const Matrix<float> *,
-                                    Matrix<float> *);
-      template Matrix<float> *matNEQ(Matrix<float> *, const float &,
-                                     Matrix<float> *);
-      template Matrix<float> *matNEQ(Matrix<float> *,
-                                     const Matrix<float> *,
-                                     Matrix<float> *);
+                                    Matrix<bool> *);
       template Matrix<float> *matAddition(const Matrix<float> *,
                                           const Matrix<float> *,
                                           Matrix<float> *);
@@ -1834,85 +1858,84 @@ namespace AprilMath {
       template Matrix<double> *matComplement(Matrix<double> *, Matrix<double> *);
       template Matrix<double> *matSign(Matrix<double> *, Matrix<double> *);
       template Matrix<double> *matClamp(Matrix<double> *, const double,
-                                       const double, Matrix<double> *);
+                                        const double, Matrix<double> *);
       template Matrix<double> *matFill(Matrix<double> *, const double);
       template Matrix<double> *matZeros(Matrix<double> *);
       template Matrix<double> *matOnes(Matrix<double> *);
       template Matrix<double> *matDiag(Matrix<double> *, const double);
       template Matrix<double> *matCopy(Matrix<double> *, const Matrix<double> *);
       template Matrix<double> *matAxpy(Matrix<double> *, const double,
-                                      const Matrix<double> *);
+                                       const Matrix<double> *);
       template Matrix<double> *matAxpy(Matrix<double> *, const double,
-                                      const SparseMatrix<double> *);
+                                       const SparseMatrix<double> *);
       template Matrix<double> *matGemm(Matrix<double> *,
-                                      CBLAS_TRANSPOSE,
-                                      CBLAS_TRANSPOSE,
-                                      const double,
-                                      const Matrix<double> *otherA,
-                                      const Matrix<double> *otherB,
-                                      double beta);
+                                       CBLAS_TRANSPOSE,
+                                       CBLAS_TRANSPOSE,
+                                       const double,
+                                       const Matrix<double> *otherA,
+                                       const Matrix<double> *otherB,
+                                       double beta);
       template Matrix<double> *matSparseMM(Matrix<double> *,
-                                          CBLAS_TRANSPOSE,
-                                          CBLAS_TRANSPOSE,
-                                          CBLAS_TRANSPOSE,
-                                          const double,
-                                          const SparseMatrix<double> *,
-                                          const Matrix<double> *,
-                                          double);
+                                           CBLAS_TRANSPOSE,
+                                           CBLAS_TRANSPOSE,
+                                           const double,
+                                           const SparseMatrix<double> *,
+                                           const Matrix<double> *,
+                                           double);
       template Matrix<double> *matGemv(Matrix<double> *Y,
-                                      CBLAS_TRANSPOSE,
-                                      const double,
-                                      const Matrix<double> *,
-                                      const Matrix<double> *,
-                                      const double);
+                                       CBLAS_TRANSPOSE,
+                                       const double,
+                                       const Matrix<double> *,
+                                       const Matrix<double> *,
+                                       const double);
       template Matrix<double> *matGemv(Matrix<double> *Y,
-                                      CBLAS_TRANSPOSE,
+                                       CBLAS_TRANSPOSE,
+                                       const double,
+                                       const SparseMatrix<double> *,
+                                       const Matrix<double> *,
+                                       const double);
+      template Matrix<double> *matGer(Matrix<double> *,
                                       const double,
-                                      const SparseMatrix<double> *,
                                       const Matrix<double> *,
-                                      const double);
-      template Matrix<double> *matGer(Matrix<double> *,
-                                     const double,
-                                     const Matrix<double> *,
-                                     const Matrix<double> *);
+                                      const Matrix<double> *);
       template double matDot(const Matrix<double> *, const Matrix<double> *);
       template double matDot(const Matrix<double> *, const SparseMatrix<double> *);
       template Matrix<double> *matScal(Matrix<double> *, const double);
       template float matNorm2(Matrix<double> *);
       template Matrix<double> *matMin(Matrix<double> *,
-                                     int,
-                                     Matrix<double> *,
-                                     Matrix<int32_t> *);
+                                      int,
+                                      Matrix<double> *,
+                                      Matrix<int32_t> *);
       template Matrix<double> *matMax(Matrix<double> *,
-                                     int,
-                                     Matrix<double> *,
-                                     Matrix<int32_t> *);
+                                      int,
+                                      Matrix<double> *,
+                                      Matrix<int32_t> *);
       template double matMin(const Matrix<double> *, int &, int &);
       template double matMax(const Matrix<double> *, int &, int &);
       template void matMinAndMax(const Matrix<double> *, double &, double &);
       template Matrix<double> *matMaxSelDim(const Matrix<double> *,
-                                           const int,
-                                           Int32GPUMirroredMemoryBlock *,
-                                           const int,
-                                           Basics::Matrix<double> *);
-      template Matrix<double> *matLT(Matrix<double> *, const double &,
-                                    Matrix<double> *);
+                                            const int,
+                                            Int32GPUMirroredMemoryBlock *,
+                                            const int,
+                                            Basics::Matrix<double> *);
+      template Matrix<bool> *matLT(Matrix<double> *, const double &,
+                                   Matrix<bool> *);
 
-      template Matrix<double> *matLT(Matrix<double> *,
-                                    const Matrix<double> *,
-                                    Matrix<double> *);
-      template Matrix<double> *matGT(Matrix<double> *, const double &, Matrix<double> *);
-      template Matrix<double> *matGT(Matrix<double> *,
-                                    const Matrix<double> *, Matrix<double> *);
-      template Matrix<double> *matEQ(Matrix<double> *, const double &, Matrix<double> *);
-      template Matrix<double> *matEQ(Matrix<double> *,
+      template Matrix<bool> *matLT(Matrix<double> *,
+                                   const Matrix<double> *,
+                                   Matrix<bool> *);
+      template Matrix<bool> *matGT(Matrix<double> *, const double &, Matrix<bool> *);
+      template Matrix<bool> *matGT(Matrix<double> *,
+                                   const Matrix<double> *, Matrix<bool> *);
+      template Matrix<bool> *matEQ(Matrix<double> *, const double &, Matrix<bool> *);
+      template Matrix<bool> *matEQ(Matrix<double> *,
+                                   const Matrix<double> *,
+                                   Matrix<bool> *);
+      template Matrix<bool> *matNEQ(Matrix<double> *, const double &,
+                                    Matrix<bool> *);
+      template Matrix<bool> *matNEQ(Matrix<double> *,
                                     const Matrix<double> *,
-                                    Matrix<double> *);
-      template Matrix<double> *matNEQ(Matrix<double> *, const double &,
-                                     Matrix<double> *);
-      template Matrix<double> *matNEQ(Matrix<double> *,
-                                     const Matrix<double> *,
-                                     Matrix<double> *);
+                                    Matrix<bool> *);
       template Matrix<double> *matAddition(const Matrix<double> *,
                                           const Matrix<double> *,
                                           Matrix<double> *);
@@ -1958,7 +1981,6 @@ namespace AprilMath {
                                       const Matrix<ComplexF> *otherB,
                                       ComplexF beta);
       template Matrix<ComplexF> *matSparseMM(Matrix<ComplexF> *,
-                                          CBLAS_TRANSPOSE,
                                           CBLAS_TRANSPOSE,
                                           CBLAS_TRANSPOSE,
                                           const ComplexF,
@@ -2015,6 +2037,13 @@ namespace AprilMath {
       template Matrix<char> *matZeros(Matrix<char> *);
       template Matrix<char> *matOnes(Matrix<char> *);
       template Matrix<char> *matDiag(Matrix<char> *, const char);
+
+      // INSTANTIATIONS (bool type, dense matrix)
+      template Matrix<bool> *matCopy(Matrix<bool> *, const Matrix<bool> *);
+      template Matrix<bool> *matFill(Matrix<bool> *, const bool);
+      template Matrix<bool> *matZeros(Matrix<bool> *);
+      template Matrix<bool> *matOnes(Matrix<bool> *);
+      template Matrix<bool> *matDiag(Matrix<bool> *, const bool);
       
       // INSTANTIATIONS (int32_t type, dense matrix)
       template Matrix<int32_t> *matCopy(Matrix<int32_t> *, const Matrix<int32_t> *);
diff --git a/packages/basics/matrix/c_src/matrix_operations.h b/packages/basics/matrix/c_src/matrix_operations.h
index 1221ac9b0..34c343f5c 100644
--- a/packages/basics/matrix/c_src/matrix_operations.h
+++ b/packages/basics/matrix/c_src/matrix_operations.h
@@ -248,7 +248,6 @@ namespace AprilMath {
       Basics::Matrix<T> *matSparseMM(Basics::Matrix<T> *C,
                                      CBLAS_TRANSPOSE trans_A,
                                      CBLAS_TRANSPOSE trans_B,
-                                     CBLAS_TRANSPOSE trans_C,
                                      const T alpha,
                                      const Basics::SparseMatrix<T> *otherA,
                                      const Basics::Matrix<T> *otherB,
@@ -366,40 +365,40 @@ namespace AprilMath {
          ZERO/ONE matrix, depending in the truth of the given condition */
     
       template <typename T>
-      Basics::Matrix<T> *matLT(Basics::Matrix<T> *obj, const T &value,
-                               Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matLT(Basics::Matrix<T> *obj, const T &value,
+                                  Basics::Matrix<bool> *dest=0);
 
       template <typename T>
-      Basics::Matrix<T> *matLT(Basics::Matrix<T> *obj,
-                               const Basics::Matrix<T> *other,
-                               Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matLT(Basics::Matrix<T> *obj,
+                                  const Basics::Matrix<T> *other,
+                                  Basics::Matrix<bool> *dest=0);
 
       template <typename T>
-      Basics::Matrix<T> *matGT(Basics::Matrix<T> *obj, const T &value,
-                               Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matGT(Basics::Matrix<T> *obj, const T &value,
+                                  Basics::Matrix<bool> *dest=0);
 
       template <typename T>
-      Basics::Matrix<T> *matGT(Basics::Matrix<T> *obj,
-                               const Basics::Matrix<T> *other,
-                               Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matGT(Basics::Matrix<T> *obj,
+                                  const Basics::Matrix<T> *other,
+                                  Basics::Matrix<bool> *dest=0);
 
       template <typename T>
-      Basics::Matrix<T> *matEQ(Basics::Matrix<T> *obj, const T &value,
-                               Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matEQ(Basics::Matrix<T> *obj, const T &value,
+                                  Basics::Matrix<bool> *dest=0);
     
       template <typename T>
-      Basics::Matrix<T> *matEQ(Basics::Matrix<T> *obj,
-                               const Basics::Matrix<T> *other,
-                               Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matEQ(Basics::Matrix<T> *obj,
+                                  const Basics::Matrix<T> *other,
+                                  Basics::Matrix<bool> *dest=0);
     
       template <typename T>
-      Basics::Matrix<T> *matNEQ(Basics::Matrix<T> *obj, const T &value,
-                                Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matNEQ(Basics::Matrix<T> *obj, const T &value,
+                                   Basics::Matrix<bool> *dest=0);
     
       template <typename T>
-      Basics::Matrix<T> *matNEQ(Basics::Matrix<T> *obj,
-                                const Basics::Matrix<T> *other,
-                                Basics::Matrix<T> *dest=0);
+      Basics::Matrix<bool> *matNEQ(Basics::Matrix<T> *obj,
+                                   const Basics::Matrix<T> *other,
+                                   Basics::Matrix<bool> *dest=0);
     
       //////////////////// OTHER MATH OPERATIONS ////////////////////
     
@@ -504,9 +503,9 @@ namespace AprilMath {
        *
        * @param uplo - A char with 'U' or 'L'.
        */
-      Basics::Matrix<float> *matCholesky(const Basics::Matrix<float> *obj,
-                                         char uplo);
-
+      Basics::Matrix<float> * matCholesky(const Basics::Matrix<float> *obj,
+                                          char uplo);
+      
       Basics::Matrix<float> *matRealFFTwithHamming(Basics::Matrix<float> *obj,
 						   int wsize,
 						   int wadvance,
diff --git a/packages/basics/matrix/c_src/reduce_matrix.impl.h b/packages/basics/matrix/c_src/reduce_matrix.impl.h
index 985a6368e..26b2fd02e 100644
--- a/packages/basics/matrix/c_src/reduce_matrix.impl.h
+++ b/packages/basics/matrix/c_src/reduce_matrix.impl.h
@@ -163,8 +163,7 @@ namespace AprilMath {
       Basics::Matrix<T> *result  = dest;
       Basics::Matrix<int32_t> *result2 = which;
       if (result == 0) {
-        result = new Basics::Matrix<T>(numDim, result_dims.get(),
-                                       input->getMajorOrder());
+        result = new Basics::Matrix<T>(numDim, result_dims.get());
         set_dest_to_zero = true;
       }
       if (result2 == 0) {
@@ -256,8 +255,7 @@ namespace AprilMath {
       /******************************/
       Basics::Matrix<O> *result = dest;
       if (result == 0) {
-        result = new Basics::Matrix<O>(numDim, result_dims.get(),
-                                       input->getMajorOrder());
+        result = new Basics::Matrix<O>(numDim, result_dims.get());
         set_dest_to_zero = true;
       }
       else if (result->size() != result_size) {
@@ -666,8 +664,7 @@ namespace AprilMath {
       /******************************/
       Basics::Matrix<O> *result = dest;
       if (result == 0) {
-        result = new Basics::Matrix<O>(numDim, result_dims.get(),
-                                       input1->getMajorOrder());
+        result = new Basics::Matrix<O>(numDim, result_dims.get());
         set_dest_to_zero = true;
       }
       else if (result->size() != result_size) {
diff --git a/packages/basics/matrix/c_src/sparse_matrix-serialization.impl.h b/packages/basics/matrix/c_src/sparse_matrix-serialization.impl.h
index be70d5692..9d32ca940 100644
--- a/packages/basics/matrix/c_src/sparse_matrix-serialization.impl.h
+++ b/packages/basics/matrix/c_src/sparse_matrix-serialization.impl.h
@@ -43,7 +43,7 @@ namespace Basics {
   template <typename T>
   SparseMatrix<T>*
   SparseMatrix<T>::read(AprilIO::StreamInterface *stream,
-                        const AprilUtils::GenericOptions *options) {
+                        const AprilUtils::LuaTable &options) {
     UNUSED_VARIABLE(options);
     MatrixIO::AsciiExtractor<T> ascii_extractor;
     MatrixIO::BinaryExtractor<T> bin_extractor;
@@ -177,8 +177,8 @@ namespace Basics {
   
   template <typename T>
   void SparseMatrix<T>::write(AprilIO::StreamInterface *stream,
-                              const AprilUtils::GenericOptions *options) {
-    bool is_ascii = options->getOptionalBoolean(MatrixIO::ASCII_OPTION, false);
+                              const AprilUtils::LuaTable &options) {
+    bool is_ascii = options.opt(MatrixIO::ASCII_OPTION, false);
     //
     MatrixIO::SparseAsciiSizer<T> ascii_sizer;
     MatrixIO::SparseBinarySizer<T> bin_sizer;
diff --git a/packages/basics/matrix/c_src/sparse_matrix.h b/packages/basics/matrix/c_src/sparse_matrix.h
index eee644a5c..3140214d1 100644
--- a/packages/basics/matrix/c_src/sparse_matrix.h
+++ b/packages/basics/matrix/c_src/sparse_matrix.h
@@ -176,7 +176,7 @@ namespace Basics {
 
     /// Constructor given a dense matrix, it does constructs a sparse matrix
     /// (cloned).
-    SparseMatrix(const Matrix<T> *other,
+    SparseMatrix(Matrix<T> *other,
                  const SPARSE_FORMAT sparse_format = CSR_FORMAT,
                  const T zero = T());
     /// Constructor given other matrix, it does a deep copy (clone).
@@ -278,7 +278,7 @@ namespace Basics {
     SparseMatrix<T> *clone(SPARSE_FORMAT sparse_format = NONE_FORMAT) const;
   
     /// Returns an equivalent dense matrix
-    Matrix<T> *toDense(CBLAS_ORDER order=CblasRowMajor) const;
+    Matrix<T> *toDense() const;
   
     /// Number values check
     void pruneSubnormalAndCheckNormal();
@@ -300,7 +300,7 @@ namespace Basics {
     const T operator() (int row, int col) const;
   
     /// Function to obtain RAW access to data pointer. Be careful with it, because
-    /// you are losing sub-matrix abstraction, and the major order.
+    /// you are losing sub-matrix abstraction.
     AprilMath::GPUMirroredMemoryBlock<T> *getRawValuesAccess() { return values.get(); }
     AprilMath::Int32GPUMirroredMemoryBlock *getRawIndicesAccess() { return indices.get(); }
     AprilMath::Int32GPUMirroredMemoryBlock *getRawFirstIndexAccess() { return first_index.get(); }
@@ -412,7 +412,7 @@ namespace Basics {
      * Any key/value in @c options dictionary will be ignored.
      */
     static SparseMatrix<T> *read(AprilIO::StreamInterface *stream,
-                                 const AprilUtils::GenericOptions *options);
+                                 const AprilUtils::LuaTable &options);
 
     /**
      * @brief Writes the SparseMatrix into a stream.
@@ -424,7 +424,7 @@ namespace Basics {
      *   binarization purposes. By default it is true.
      */
     virtual void write(AprilIO::StreamInterface *stream,
-                       const AprilUtils::GenericOptions *options);
+                       const AprilUtils::LuaTable &options);
 
     
   private:
@@ -450,4 +450,6 @@ namespace Basics {
 #include "sparse_matrix-iterators.impl.h"
 #include "sparse_matrix-serialization.impl.h"
 
+#include "sparse_matrixFloat.h"
+
 #endif // SPARSE_MATRIX_H
diff --git a/packages/basics/matrix/c_src/sparse_matrix.impl.h b/packages/basics/matrix/c_src/sparse_matrix.impl.h
index 97823d8a3..b65753ab0 100644
--- a/packages/basics/matrix/c_src/sparse_matrix.impl.h
+++ b/packages/basics/matrix/c_src/sparse_matrix.impl.h
@@ -202,8 +202,9 @@ namespace Basics {
     checkSortedIndices(sort);
   }
 
+  // FIXME: Matrix<T> *other cannot be const because of transpose() method.
   template <typename T>
-  SparseMatrix<T>::SparseMatrix(const Matrix<T> *other,
+  SparseMatrix<T>::SparseMatrix(Matrix<T> *other,
                                 const SPARSE_FORMAT sparse_format,
                                 const T zero) :
     AprilIO::Serializable(), shared_count(0), mmapped_data(0),
@@ -231,7 +232,8 @@ namespace Basics {
     switch(sparse_format) {
     case CSC_FORMAT:
       {
-        typename Matrix<T>::const_col_major_iterator it(other->begin());
+        AprilUtils::SharedPtr< Matrix<T> > aux(other->transpose());
+        typename Matrix<T>::const_iterator it(aux->begin());
         for (int c1=0; c1<other->getDimSize(1); ++c1) {
           for (int c0=0; c0<other->getDimSize(0); ++c0, ++it) {
             if (zero < *it || *it < -zero) {
@@ -462,8 +464,8 @@ namespace Basics {
   }
 
   template <typename T>
-  Matrix<T> *SparseMatrix<T>::toDense(CBLAS_ORDER order) const {
-    Matrix<T> *result = new Matrix<T>(2, matrixSize, order);
+  Matrix<T> *SparseMatrix<T>::toDense() const {
+    Matrix<T> *result = new Matrix<T>(2, matrixSize);
     typename Matrix<T>::random_access_iterator result_it(result);
     AprilMath::MatrixExt::Operations::matZeros(result);
     int x0=0,x1=0;
diff --git a/packages/basics/matrix/c_src/sparse_matrixFloat.h b/packages/basics/matrix/c_src/sparse_matrixFloat.h
index 5aba34722..bab40c2ef 100644
--- a/packages/basics/matrix/c_src/sparse_matrixFloat.h
+++ b/packages/basics/matrix/c_src/sparse_matrixFloat.h
@@ -46,4 +46,19 @@ namespace Basics {
 
 }
 
+////////////////////////////////////////////////////////////////////////////
+
+namespace AprilUtils {
+
+  template<> Basics::SparseMatrixFloat *LuaTable::
+  convertTo<Basics::SparseMatrixFloat *>(lua_State *L, int idx);
+  
+  template<> void LuaTable::
+  pushInto<Basics::SparseMatrixFloat *>(lua_State *L,
+                                        Basics::SparseMatrixFloat *value);
+
+  template<> bool LuaTable::
+  checkType<Basics::SparseMatrixFloat *>(lua_State *L, int idx);
+}
+
 #endif // SPARSEMATRIXFLOAT_H
diff --git a/packages/basics/matrix/c_src/utilMatrixComplexF.cc b/packages/basics/matrix/c_src/utilMatrixComplexF.cc
index d04e534d3..e740b01a1 100644
--- a/packages/basics/matrix/c_src/utilMatrixComplexF.cc
+++ b/packages/basics/matrix/c_src/utilMatrixComplexF.cc
@@ -29,21 +29,13 @@ namespace Basics {
     MatrixFloat *new_mat;
     int N     = mat->getNumDim();
     int *dims = new int[N+1];
-    if (mat->getMajorOrder() == CblasRowMajor) {
-      // the real and imaginary part are the last dimension (they are stored
-      // together in row major)
-      for (int i=0; i<N; ++i) dims[i] = mat->getDimPtr()[i];
-      dims[N] = 2;
-    }
-    else {
-      // the real and imaginary part are the first dimension (they are stored
-      // together in col major)
-      dims[0] = 2;
-      for (int i=0; i<N; ++i) dims[i+1] = mat->getDimPtr()[i];
-    }
+    // the real and imaginary part are the last dimension (they are stored
+    // together in row major)
+    for (int i=0; i<N; ++i) dims[i] = mat->getDimPtr()[i];
+    dims[N] = 2;
     AprilMath::FloatGPUMirroredMemoryBlock *new_mat_memory;
     new_mat_memory = mat->getRawDataAccess()->reinterpretAs<float>();
-    new_mat=new MatrixFloat(N+1, dims, mat->getMajorOrder(), new_mat_memory);
+    new_mat=new MatrixFloat(N+1, dims, new_mat_memory);
 #ifdef USE_CUDA
     new_mat->setUseCuda(mat->getCudaFlag());
 #endif
@@ -60,8 +52,7 @@ namespace Basics {
 
   MatrixFloat *realPartFromMatrixComplexFToMatrixFloat(MatrixComplexF *mat) {
     MatrixFloat *new_mat = new MatrixFloat(mat->getNumDim(),
-                                           mat->getDimPtr(),
-                                           mat->getMajorOrder());
+                                           mat->getDimPtr());
 #ifdef USE_CUDA
     new_mat->setUseCuda(mat->getCudaFlag());
 #endif
@@ -77,8 +68,7 @@ namespace Basics {
 
   MatrixFloat *imgPartFromMatrixComplexFToMatrixFloat(MatrixComplexF *mat) {
     MatrixFloat *new_mat = new MatrixFloat(mat->getNumDim(),
-                                           mat->getDimPtr(),
-                                           mat->getMajorOrder());
+                                           mat->getDimPtr());
 #ifdef USE_CUDA
     new_mat->setUseCuda(mat->getCudaFlag());
 #endif
@@ -94,8 +84,7 @@ namespace Basics {
 
   MatrixFloat *absFromMatrixComplexFToMatrixFloat(MatrixComplexF *mat) {
     MatrixFloat *new_mat = new MatrixFloat(mat->getNumDim(),
-                                           mat->getDimPtr(),
-                                           mat->getMajorOrder());
+                                           mat->getDimPtr());
 #ifdef USE_CUDA
     new_mat->setUseCuda(mat->getCudaFlag());
 #endif
@@ -111,8 +100,7 @@ namespace Basics {
 
   MatrixFloat *angleFromMatrixComplexFToMatrixFloat(MatrixComplexF *mat) {
     MatrixFloat *new_mat = new MatrixFloat(mat->getNumDim(),
-                                           mat->getDimPtr(),
-                                           mat->getMajorOrder());
+                                           mat->getDimPtr());
 #ifdef USE_CUDA
     new_mat->setUseCuda(mat->getCudaFlag());
 #endif
diff --git a/packages/basics/matrix/c_src/utilMatrixDouble.cc b/packages/basics/matrix/c_src/utilMatrixDouble.cc
index d72a0e3d6..2b7a0956e 100644
--- a/packages/basics/matrix/c_src/utilMatrixDouble.cc
+++ b/packages/basics/matrix/c_src/utilMatrixDouble.cc
@@ -24,11 +24,9 @@
 
 namespace Basics {
   
-  MatrixFloat *convertFromMatrixDoubleToMatrixFloat(MatrixDouble *mat,
-                                                    bool col_major) {
+  MatrixFloat *convertFromMatrixDoubleToMatrixFloat(MatrixDouble *mat) {
     MatrixFloat *new_mat=new MatrixFloat(mat->getNumDim(),
-                                         mat->getDimPtr(),
-                                         (col_major)?CblasColMajor:CblasRowMajor);
+                                         mat->getDimPtr());
 #ifdef USE_CUDA
     new_mat->setUseCuda(mat->getCudaFlag());
 #endif
diff --git a/packages/basics/matrix/c_src/utilMatrixDouble.h b/packages/basics/matrix/c_src/utilMatrixDouble.h
index f25170f66..8e653622c 100644
--- a/packages/basics/matrix/c_src/utilMatrixDouble.h
+++ b/packages/basics/matrix/c_src/utilMatrixDouble.h
@@ -26,8 +26,7 @@
 
 namespace Basics {
 
-  MatrixFloat *convertFromMatrixDoubleToMatrixFloat(MatrixDouble *mat,
-                                                    bool col_major);
+  MatrixFloat *convertFromMatrixDoubleToMatrixFloat(MatrixDouble *mat);
   
 
 } // namespace Basics
diff --git a/packages/basics/matrix/c_src/utilMatrixInt32.cc b/packages/basics/matrix/c_src/utilMatrixInt32.cc
index 889dba11b..304e53810 100644
--- a/packages/basics/matrix/c_src/utilMatrixInt32.cc
+++ b/packages/basics/matrix/c_src/utilMatrixInt32.cc
@@ -22,11 +22,9 @@
 
 namespace Basics {
 
-  MatrixFloat *convertFromMatrixInt32ToMatrixFloat(MatrixInt32 *mat,
-                                                   bool col_major) {
+  MatrixFloat *convertFromMatrixInt32ToMatrixFloat(MatrixInt32 *mat) {
     MatrixFloat *new_mat=new MatrixFloat(mat->getNumDim(),
-                                         mat->getDimPtr(),
-                                         (col_major)?CblasColMajor:CblasRowMajor);
+                                         mat->getDimPtr());
 #ifdef USE_CUDA
     new_mat->setUseCuda(mat->getCudaFlag());
 #endif
diff --git a/packages/basics/matrix/c_src/utilMatrixInt32.h b/packages/basics/matrix/c_src/utilMatrixInt32.h
index d3ace99f9..d7a20540e 100644
--- a/packages/basics/matrix/c_src/utilMatrixInt32.h
+++ b/packages/basics/matrix/c_src/utilMatrixInt32.h
@@ -26,8 +26,7 @@
 
 namespace Basics {
   
-  MatrixFloat *convertFromMatrixInt32ToMatrixFloat(MatrixInt32 *mat,
-                                                   bool col_major);
+  MatrixFloat *convertFromMatrixInt32ToMatrixFloat(MatrixInt32 *mat);
   
 } // namespace Basics
 
diff --git a/packages/basics/matrix/lua_src/generic_call.lua b/packages/basics/matrix/lua_src/generic_call.lua
index d2ccd54e0..9cc9135a5 100644
--- a/packages/basics/matrix/lua_src/generic_call.lua
+++ b/packages/basics/matrix/lua_src/generic_call.lua
@@ -3,6 +3,7 @@ matrix.__generic__ = matrix.__generic__ or {}
 
 matrix.__generic__.__make_generic_call__ = function()
   return function(self,...)
+    if ... == nil then return self end
     local arg      = table.pack(...)
     local dims     = self:dim()
     local pos,size = {},{}
@@ -12,8 +13,12 @@ matrix.__generic__.__make_generic_call__ = function()
       local a,b
       if tt == "table" then
 	a,b = table.unpack(t)
-	april_assert(tonumber(a) and tonumber(b),
-		     "The table for component %d must contain two numbers",i)
+        if not a and not b then
+          a,b = 1,dims[i]
+        else
+          april_assert(tonumber(a) and tonumber(b),
+                       "The table for component %d must contain two numbers or none",i)
+        end
       elseif tt == "string" then
 	a = t:match("^(%d+)%:.*$") or 1
 	b = t:match("^.*%:(%d+)$") or dims[i]
@@ -38,3 +43,27 @@ matrix.__generic__.__make_generic_call__ = function()
     return self:slice(pos,size)
   end
 end
+
+-- Builds the generic indexed-assignment function for the given matrix class.
+--
+-- The returned function(self,key,value) calls self with the components
+-- stored in the key table (self(table.unpack(key))) and then either fills
+-- the result with value, when type(value) is "number" or "complex", or
+-- copies value into it, when value is an instance of matrix_class.
+matrix.__generic__.__make_generic_newindex__ = function(matrix_class)
+  assert(matrix_class and class.is_class(matrix_class),
+         "Needs a class table as argument")
+  return function(self,key,value)
+    assert(type(key) == "table", "Needs a table as key")
+    local m  = self(table.unpack(key))
+    local tv = type(value)
+    if tv == "number" or tv == "complex" then
+      m:fill(value)
+    else
+      -- validate the assigned value; m is derived from self, so checking m
+      -- would say nothing about what is being copied into it
+      assert(class.is_a(value, matrix_class), "Needs a number or a matrix as value")
+      m:copy(value)
+    end
+  end
+end
diff --git a/packages/basics/matrix/lua_src/generic_join.lua b/packages/basics/matrix/lua_src/generic_join.lua
index 35607d04d..dacb4cbf7 100644
--- a/packages/basics/matrix/lua_src/generic_join.lua
+++ b/packages/basics/matrix/lua_src/generic_join.lua
@@ -28,12 +28,7 @@ matrix.__generic__.__make_generic_join__ = function(constructor)
       end
     end
     -- JOIN
-    local outm
-    if arg[1].get_major_order and arg[1]:get_major_order() == "col_major" then
-      outm = constructor.col_major(table.unpack(size))
-    else
-      outm = constructor(table.unpack(size))
-    end
+    local outm = constructor(table.unpack(size))
     local first = matrix(#size):ones():toTable()
     for i=1,#arg do
       local m = arg[i]
diff --git a/packages/basics/matrix/lua_src/generic_print.lua b/packages/basics/matrix/lua_src/generic_print.lua
index 77b229b4a..0e46e24ff 100644
--- a/packages/basics/matrix/lua_src/generic_print.lua
+++ b/packages/basics/matrix/lua_src/generic_print.lua
@@ -4,40 +4,46 @@ matrix.__generic__ = matrix.__generic__ or {}
 matrix.__generic__.__make_generic_print__ = function(name,getter)
   assert(name and getter)
   return function(self)
-    local dims   = self:dim()
-    local major  = (self.get_major_order and self:get_major_order()) or "row_major"
-    local coords = {}
-    local out    = {}
-    local row    = {}
-    local so_large = false
-    for i=1,#dims do 
-      coords[i]=1
-      if dims[i] > 20 then so_large = true end
-    end
-    if not so_large then
-      for i=1,self:size() do
-	if #dims > 2 and coords[#dims] == 1 and coords[#dims-1] == 1 then
-	  table.insert(out,
-		       string.format("\n# pos [%s]",
-				     table.concat(coords, ",")))
-	end
-	table.insert(row, getter(self:get(table.unpack(coords))))
-	local j=#dims+1
-	repeat
-	  j=j-1
-	  coords[j] = coords[j] + 1
-	  if coords[j] > dims[j] then coords[j] = 1 end
-	until j==1 or coords[j] ~= 1
-	if coords[#coords] == 1 then
-	  table.insert(out, table.concat(row, " ")) row={}
-	end
+    local MAX_ROW_LEN,MAX_ROWS = 60,6
+    local dims     = self:dim()
+    local coords   = {}
+    local out      = {}
+    local row      = {}
+    local row_len  = 0
+    for i=1,#dims do coords[i]=1 end
+    for i=1,self:size() do
+      if #dims > 2 and coords[#dims] == 1 and coords[#dims-1] == 1 then
+        table.insert(out,
+                     string.format("\n# pos [%s]",
+                                   table.concat(coords, ",")))
+      end
+      if not coords[#coords-1] or coords[#coords-1] < MAX_ROWS or coords[#coords-1] == dims[#coords-1] then
+        if row_len < MAX_ROW_LEN or coords[#coords] == dims[#coords] then
+          local str = getter(self:get(table.unpack(coords)))
+          row_len = row_len + #str + 1
+          if row_len < MAX_ROW_LEN  or coords[#coords] == dims[#coords] then
+            table.insert(row, str)
+          else
+            table.insert(row, "...")
+          end
+        end
+      elseif coords[#coords-1] == MAX_ROWS then
+        row = { "..." }
+      end
+      local j=#dims+1
+      repeat
+        j=j-1
+        coords[j] = coords[j] + 1
+        if coords[j] > dims[j] then coords[j] = 1 end
+      until j==1 or coords[j] ~= 1
+      if coords[#coords] == 1 then
+        if #row > 0 then table.insert(out, table.concat(row, " ")) row={} row_len = 0 end
       end
-    else
-      table.insert(out, "Large matrix, not printed to display")
     end
-    table.insert(out, string.format("# %s of size [%s] in %s [%s]\n",
+    table.insert(out, string.format("# %s of size [%s] stride [%s] ref [%s]\n",
 				    name,
-				    table.concat(dims, ","), major,
+				    table.concat(dims, ","),
+                                    table.concat(self:stride(), ","),
 				    self:get_reference_string()))
     return table.concat(out, "\n")
   end
diff --git a/packages/basics/matrix/lua_src/generic_serialization.lua b/packages/basics/matrix/lua_src/generic_serialization.lua
index 1130e8440..6fbeb5516 100644
--- a/packages/basics/matrix/lua_src/generic_serialization.lua
+++ b/packages/basics/matrix/lua_src/generic_serialization.lua
@@ -9,22 +9,22 @@ end
 
 matrix.__generic__ = matrix.__generic__ or {}
 
-matrix.__generic__.__make_generic_to_lua_string__ = function(matrix_class)
+matrix.__generic__.__make_generic_to_lua_string__ = function(matrix_class,
+                                                             defmode)
   local name = matrix_class.meta_instance.id
   class.extend(matrix_class, "to_lua_string",
                function(self, format)
                  return string.format("%s.fromString[[%s]]",
-                                      name, self:toString(format or "binary"))
+                                      name, self:toString(format or defmode))
   end)
 end
 
 -- GENERIC FROM FILENAME
 matrix.__generic__.__make_generic_fromFilename__ = function(matrix_class)
-  matrix_class.fromFilename = function(filename,order)
+  matrix_class.fromFilename = function(filename)
     local f = april_assert(io.open(filename),
                            "Unable to open %s", filename)
-    local ret = table.pack(matrix_class.read(archive_wrapper( f ),
-                                             { [matrix.options.order]=order }))
+    local ret = table.pack(matrix_class.read(archive_wrapper( f )))
     f:close()
     return table.unpack(ret)
   end
@@ -32,12 +32,11 @@ end
 
 -- GENERIC FROM TAB FILENAME
 matrix.__generic__.__make_generic_fromTabFilename__ = function(matrix_class)
-  matrix_class.fromTabFilename = function(filename,order)
+  matrix_class.fromTabFilename = function(filename)
     local f = april_assert(io.open(filename),
                            "Unable to open %s", filename)
     local ret = table.pack(matrix_class.read(archive_wrapper( f ),
-                                             { [matrix.options.order] = order,
-                                               [matrix.options.tab] = true }))
+                                             { [matrix.options.tab] = true }))
     f:close()
     return table.unpack(ret)
   end
@@ -46,7 +45,6 @@ end
 matrix.__generic__.__make_generic_fromCSVFilename__ = function(matrix_class)
   matrix_class.fromCSVFilename = function(filename,args)
     local args = get_table_fields({
-        [matrix.options.order]   = { mandatory=false, type_match="string" },
         [matrix.options.delim]   = { mandatory=true, type_match="string", default="," },
         [matrix.options.default] = { mandatory=false } }, args)
     args[matrix.options.empty] = true
@@ -67,9 +65,11 @@ matrix.__generic__.__make_generic_fromString__ = function(matrix_class)
 end
 
 -- GENERIC TO FILENAME
-matrix.__generic__.__make_generic_toFilename__ = function(matrix_class)
+matrix.__generic__.__make_generic_toFilename__ = function(matrix_class,
+                                                          defmode)
   class.extend(matrix_class, "toFilename",
                function(self,filename,mode)
+                 local mode = mode or defmode
                  local f = april_assert(io.open(filename,"w"),
                                         "Unable to open %s", filename)
                  local ret = table.pack(self:write(f,
@@ -94,20 +94,23 @@ matrix.__generic__.__make_generic_toTabFilename__ = function(matrix_class)
 end
 
 -- GENERIC TO STRING
-matrix.__generic__.__make_generic_toString__ = function(matrix_class)
+matrix.__generic__.__make_generic_toString__ = function(matrix_class, defmode)
   class.extend(matrix_class, "toString",
                function(self,mode)
+                 local mode = mode or defmode
                  return self:write({ [matrix.options.ascii] = (mode=="ascii") })
   end)
 end
 
-function matrix.__generic__.__make_all_serialization_methods__(matrix_class)
+function matrix.__generic__.__make_all_serialization_methods__(matrix_class,
+                                                               defmode)
+  local defmode = defmode or "binary"
   matrix.__generic__.__make_generic_fromFilename__(matrix_class)
   matrix.__generic__.__make_generic_fromTabFilename__(matrix_class)
   matrix.__generic__.__make_generic_fromString__(matrix_class)
   matrix.__generic__.__make_generic_fromCSVFilename__(matrix_class)
-  matrix.__generic__.__make_generic_toFilename__(matrix_class)
+  matrix.__generic__.__make_generic_toFilename__(matrix_class, defmode)
   matrix.__generic__.__make_generic_toTabFilename__(matrix_class)
-  matrix.__generic__.__make_generic_toString__(matrix_class)
-  matrix.__generic__.__make_generic_to_lua_string__(matrix_class)
+  matrix.__generic__.__make_generic_toString__(matrix_class, defmode)
+  matrix.__generic__.__make_generic_to_lua_string__(matrix_class, defmode)
 end
diff --git a/packages/basics/matrix/lua_src/matrix.lua b/packages/basics/matrix/lua_src/matrix.lua
index eccdafb42..bee4802cc 100644
--- a/packages/basics/matrix/lua_src/matrix.lua
+++ b/packages/basics/matrix/lua_src/matrix.lua
@@ -1,4 +1,6 @@
--- ADDING PSEUDO-INVERSE METHOD
+class.extend(matrix, "t", matrix.."transpose")
+
+-- ADDING PSEUDO-INVERSE METHOD
 class.extend(matrix, "pinv",
              function(self)
                local u,s,vt = self:svd()
@@ -16,26 +18,343 @@ class.extend(matrix, "pinv",
                  }
 end)
 
--- the constructor
-matrix.row_major = function(...)
-  return matrix(...)
-end
+matrix.ext.iterate =
+  april_doc{
+    class = "method",
+    summary = "Returns an iterator which traverses a dimension",
+    description = {
+      "The iterator uses m:select() method to traverse the given",
+      "dimension number. The iterator returns the pair pos,slice",
+      "where pos is the position inside the dimension and slice",
+      "is a matrix with the result of m:select(dim,pos).",
+      "Note that slice is reused between different iterations.",
+      "Note that slice is a reference to the original matrix, any",
+      "change to slice will be reflected into m."
+    },
+    params = {
+      "A matrix instance (any kind of matrix type)",
+      "A dimension number [optional], by default it is 1 (row traversal)",
+    },
+    outputs = {
+      "An instance of iterator class",
+    },
+  } ..
+  function(self,dim)
+    local dim = dim or 1
+    local d = self:dim()
+    assert(dim > 0 and dim <= #d, "Out-of-bounds dimension number") -- last dimension is valid too
+    local slice = self:select(dim,1)
+    return iterator(function(state,pos)
+        local self,slice,dim,sz = table.unpack(state)
+        pos = pos + 1
+        if pos <= sz then -- sz is the length of the traversed dimension
+          slice = (pos == 1 and slice) or self:select(dim,pos)
+          return pos,slice
+        end -- falling through returns nil, which ends the iteration
+                    end, {self,slice,dim,d[dim]}, 0)
+  end
+
+class.extend(matrix, "order",
+             april_doc{
+               class = "method",
+               summary = "Returns a permutation of the matrix which sorts its data",
+               outputs = { "A matrixInt32 instance" },
+             } ..
+               function(self)
+                 local self = self:squeeze()
+                 assert(#self:dim() == 1, "Needs a rank 1 tensor")
+                 local t = iterator(range(1,self:size())):table()
+                 table.sort(t, function(a,b)
+                              return self:get(a) < self:get(b)
+                 end)
+                 return matrixInt32(t)
+end)
+
+class.extend(matrix, "order_rank",
+             april_doc{
+               class = "method",
+               summary = "Returns the sorted rank of the matrix values",
+               outputs = { "A matrixInt32 instance" },
+             } ..
+               function(self)
+                 local self = self:squeeze()
+                 assert(#self:dim() == 1, "Needs a rank 1 tensor")
+                 local t = iterator(range(1,self:size())):table()
+                 table.sort(t, function(a,b)
+                              return self:get(a) < self:get(b)
+                 end)
+                 return matrixInt32(table.invert(t))
+end)
+
+class.extend(matrix, "index",
+             april_doc{
+               class = "method",
+               summary = {
+                 "Returns new allocated matrix filtered by the given dim and",
+                 "index matrix parameters.",
+               },
+               params = {
+                 "A dimension number",
+                 { "A table, matrixBool or matrixInt32 indicating which",
+                   "indices will be taken." },
+               },
+               outputs = {
+                 { "A new allocated matrix instance, or nil if 2nd argument",
+                   "has zero selected components", },
+               },
+             } ..
+               function(self,dim,idx)
+                 assert(type(dim) == "number",
+                        "Needs a number as second argument")
+                 if type(idx) == "table" then idx = matrixInt32(idx)
+                 elseif class.is_a(idx, matrixBool) then idx = idx:to_index()
+                 end
+                 if not idx then return nil end -- to_index() gave nothing selected
+                 assert(class.is_a(idx, matrixInt32),
+                        "Needs a matrixInt32 second argument (index)")
+                 local idx = idx:squeeze()
+                 assert(#idx:dim() == 1, "Needs a rank 1 tensor as second argument (index)")
+                 local d = self:dim()
+                 assert(dim >= 1 and dim <= #d, "Dimension argument out-of-bounds")
+                 local dim_bound = d[dim]
+                 d[dim] = idx:size() -- result has one slice per selected index
+                 local constructor = class.of(self)
+                 local result = constructor(table.unpack(d))
+                 d[dim] = 1 -- from here d is the shape of a single slice along dim
+                 local self_sw = self:sliding_window{ size=d, step=d }
+                 local dest_sw   = result:sliding_window{ size=d, step=d }
+                 local result_submat,self_submat
+                 idx:map(function(p)
+                     april_assert(p >= 1 and p <= dim_bound,
+                                  "Index number %d out-of-bounds", p)
+                     assert(not dest_sw:is_end())
+                     self_sw:set_at_window(p)
+                     result_submat = dest_sw:get_matrix(result_submat)
+                     self_submat = self_sw:get_matrix(self_submat)
+                     result_submat:copy(self_submat)
+                     dest_sw:next()
+                 end)
+                 return result
+end)
+
+
+class.extend(matrix, "indexed_fill",
+             april_doc{
+               class = "method",
+               summary = {
+                 "Fills the indexed dim,index components of the caller matrix.",
+               },
+               params = {
+                 "A dimension number",
+                 { "A table, matrixBool or matrixInt32 indicating which",
+                   "indices will be taken." },
+                 "A number value for filling.",
+               },
+               outputs = {
+                 "The caller matrix.",
+               },
+             } ..
+             function(self,dim,idx,val)
+               if type(idx) == "table" then idx = matrixInt32(idx)
+               elseif class.is_a(idx, matrixBool) then idx = idx:to_index()
+               end
+               if not idx then return self end -- nothing selected, nothing to fill
+               assert(class.is_a(idx, matrixInt32),
+                      "Needs a matrixInt32 second argument (index)")
+               local idx = idx:squeeze()
+               assert(#idx:dim() == 1,
+                      "Needs a rank 1 tensor as second argument (index)")
+               local d = self:dim()
+               assert(dim >= 1 and dim <= #d,"Dimension argument out-of-bounds")
+               local dim_bound = d[dim]
+               d[dim] = 1 -- d becomes the shape of a single slice along dim
+               local sw = self:sliding_window{ size=d, step=d }
+               local mat
+               idx:map(function(p)
+                   april_assert(p >= 1 and p <= dim_bound,
+                                "Index number %d out-of-bounds", p)
+                   sw:set_at_window(p)
+                   mat = sw:get_matrix(mat)
+                   mat:fill(val)
+               end)
+               return self
+end)
+
+class.extend(matrix, "indexed_copy",
+             april_doc{
+               class = "method",
+               summary = {
+                 "Copies a matrix into the indexed dim,index components of the caller matrix.",
+               },
+               params = {
+                 "A dimension number",
+                 { "A table, matrixBool or matrixInt32 indicating which",
+                   "indices will be taken." },
+                 "A matrix with data to be copied.",
+               },
+               outputs = {
+                 "The caller matrix.",
+               },
+             } ..
+             function(self,dim,idx,other)
+               if type(idx) == "table" then idx = matrixInt32(idx)
+               elseif class.is_a(idx, matrixBool) then idx = idx:to_index()
+               end
+               if not idx then return self end -- nothing selected, nothing to copy
+               assert(class.is_a(idx, matrixInt32),
+                      "Needs a matrixInt32 second argument (index)")
+               assert(class.of(self) == class.of(other),
+                      "Self and other must be same matrix type")
+               local idx = idx:squeeze()
+               assert(#idx:dim() == 1,
+                      "Needs a rank 1 tensor as second argument (index)")
+               local d = self:dim()
+               assert(dim >= 1 and dim <= #d,"Dimension argument out-of-bounds")
+               local dim_bound = d[dim]
+               d[dim] = 1 -- d becomes the shape of a single slice along dim
+               local other_sw = other:sliding_window{ size=d, step=d }
+               local self_sw = self:sliding_window{ size=d, step=d }
+               local other_submat,self_submat
+               idx:map(function(p)
+                   april_assert(p >= 1 and p <= dim_bound,
+                                "Index number %d out-of-bounds", p)
+                   assert(not other_sw:is_end())
+                   self_sw:set_at_window(p)
+                   other_submat = other_sw:get_matrix(other_submat)
+                   self_submat = self_sw:get_matrix(self_submat)
+                   self_submat:copy(other_submat)
+                   other_sw:next() -- other is consumed sequentially, one slice per index
+               end)
+               return self
+end)
 
 -- static methods which return a new matrix instead of operate in-place
+matrix.op = {}
 for _,method in ipairs{"adjust_range", "clamp", "cmul",
                        "plogp", "log", "log1p", "exp",
                        "sqrt", "pow",
                        "tan", "tanh", "atan",
                        "sin", "sinh", "asin", "asinh",
                        "cos", "cosh", "acos", "acosh",
-                       "abs", "complement", "sign", "scal", "div",
-                       "lt", "gt", "eq", "neq" } do
-  matrix[method] = function(self,...)
+                       "abs", "complement", "sign", "scal", "div" } do
+  matrix.op[method] = function(self,...)
     local clone = self:clone()
     return clone[method](clone,...)
   end
 end
 
+function matrix.op.repmat(x, ...)
+  local arg = table.pack(...)
+  local dim = x:dim()
+  local result_dim = {}
+  assert(#arg >= #dim, "Underflow given number of dimensions")
+  for i=1,#arg do dim[i] = dim[i] or 1 result_dim[i] = dim[i] * arg[i] end
+  local x = x:rewrap(table.unpack(dim))
+  local result = matrix(table.unpack(result_dim))
+  local result_sw = result:sliding_window{ size=dim, step=dim }
+  local mat
+  while not result_sw:is_end() do
+    mat = result_sw:get_matrix(mat)
+    mat:copy(x)
+    result_sw:next()
+  end
+  return result
+end
+
+matrix.op.diag =
+  april_doc{
+    class = "function",
+    summary = "Returns a matrix with diagonal elements of the given matrix",
+    params = {
+      "A 2D matrix",
+      "The k-th diagonal number [optional], by default k=0",
+    },
+    outputs = {
+      "A new matrix instance",
+    }
+  } ..
+  function(m,k)
+    local k=k or 0
+    local dim = m:dim()
+    assert(#dim == 2, "Needs a 2D matrix")
+    local N = dim[1]
+    assert(dim[2] == N, "Needs a square matrix")
+    local get_map
+    if k == 0 then
+      get_map = function(i) return m:get(i,i) end
+    elseif k>0 then
+      assert(k < N, "Out-of-bounds k argument")
+      get_map = function(i) return m:get(i,i+k) end
+    else -- k<0
+      assert(k > -N, "Out-of-bounds k argument")
+      get_map = function(i) return m:get(i-k,i) end
+    end
+    local ctor = class.of(m)
+    if rawequal(ctor,matrix.sparse) then ctor = matrix end
+    return ctor(N-math.abs(k)):linspace():map(get_map)
+  end
+
+matrix.op.triu =
+  april_doc{
+    class = "function",
+    summary = "Returns upper triangular matrix taken from given matrix",
+    params = {
+      "A 2D matrix",
+      "The start k-th diagonal number [optional], by default k=0",
+    },
+    outputs = {
+      "A new matrix instance",
+    }
+  } ..
+  function(m,k)
+    local k=k or 0
+    local dim = m:dim()
+    local N = dim[1]
+    assert(#dim == 2, "Needs a 2D matrix")
+    assert(dim[2] == N, "Needs a square matrix")
+    assert(k <= 0 or k <  N, "Out-of-bounds k argument")
+    assert(k >= 0 or k > -N, "Out-of-bounds k argument")
+    local ctor = class.of(m)
+    local triu = ctor(table.unpack(dim)):zeros()
+    -- for each row which still has columns at or right of the k-th diagonal
+    for i=1,math.min(N,N-k) do
+      local cols = { math.max(1,i+k), N } -- column range i+k..N, clipped to 1
+      triu[{ i, cols }] = m(i, cols)
+    end
+    return triu
+  end
+
+matrix.op.tril =
+  april_doc{
+    class = "function",
+    summary = "Returns lower triangular matrix taken from given matrix",
+    params = {
+      "A 2D matrix",
+      "The start k-th diagonal number [optional], by default k=0",
+    },
+    outputs = {
+      "A new matrix instance",
+    }
+  } ..
+  function(m,k)
+    local k=k or 0
+    local shape = m:dim()
+    local N = shape[1]
+    assert(#shape == 2, "Needs a 2D matrix")
+    assert(shape[2] == N, "Needs a square matrix")
+    assert(k <= 0 or k <  N, "Out-of-bounds k argument")
+    assert(k >= 0 or k > -N, "Out-of-bounds k argument")
+    local tril = class.of(m)(table.unpack(shape)):zeros()
+    -- rows above the k-th diagonal (only when k<0) hold no data and stay zero
+    local first_row = math.max(1,1-k)
+    for row=first_row,N do
+      -- each row keeps columns 1..row+k, clipped to the matrix width
+      local span = { 1, math.min(N,row+k) }
+      tril[{ row, span }] = m(row, span)
+    end
+    return tril
+  end
+
 -- serialization
 matrix.__generic__.__make_all_serialization_methods__(matrix)
 
@@ -44,10 +363,14 @@ matrix.__generic__.__make_all_serialization_methods__(matrix)
 matrix.meta_instance.__call =
   matrix.__generic__.__make_generic_call__()
 
+-- define left side operator [{}]
+matrix.meta_instance.__newindex =
+  matrix.__generic__.__make_generic_newindex__(matrix)
+
 matrix.meta_instance.__tostring =
   matrix.__generic__.__make_generic_print__("Matrix",
                                             function(value)
-                                              return string.format("% -11.6g", value)
+                                              return string.format("% -13.6g", value)
   end)
 
 matrix.join =
@@ -80,12 +403,12 @@ end
 matrix.meta_instance.__mul = function(op1, op2)
   if class.is_a(op1,matrix.sparse) or class.is_a(op2,matrix.sparse) then
     if class.is_a(op2,matrix.sparse) then
-      local res = matrix[op1:get_major_order()](op1:dim(1),op2:dim(2))
-      res:sparse_mm{ alpha=1.0, beta=0.0, A=op2, B=op1,
-		     trans_A=true, trans_B=true, trans_C=true }
+      local res = matrix(op1:dim(1),op2:dim(2))
+      res:transpose():sparse_mm{ alpha=1.0, beta=0.0, A=op2, B=op1,
+                                 trans_A=true, trans_B=true }
       return res
     else
-      local res = matrix[op2:get_major_order()](op1:dim(1),op2:dim(2))
+      local res = matrix(op1:dim(1),op2:dim(2))
       res:sparse_mm{ alpha=1.0, beta=0.0, A=op1, B=op2 }
       return res
     end
@@ -174,40 +497,148 @@ end
 -----------------------------------------------------------------------------
 -----------------------------------------------------------------------------
 
-function matrix.dict.wrap_matrices(m)
-  local tt = type(m)
-  local unwrap
-  if tt == "table" then
-    m = matrix.dict(m)
-    unwrap = function(m) return iterator(pairs(m)):table() end
-  elseif tt == "matrix" then
-    m = matrix.dict():insert("1",m)
-    unwrap = function(m) return m("1") end
+matrix.dict = matrix.dict or {}
+setmetatable(matrix.dict, { __call =
+                              function(self,v)
+                                if v then
+                                  return type(v) == "table" and v or {v}
+                                else
+                                  return {}
+                                end
+                              end
+})
+
+local mmap = function(tbl,func,...)
+  if type(tbl) == "table" then
+    for name,w in pairs(tbl) do func(w,...) end
   else
-    unwrap = function(m) return m end
+    func(tbl,...)
+  end
+  return tbl
+end
+
+-- Folds func(acc,w,...) over every value of tbl, starting the accumulator at
+-- start; a non-table tbl is treated as the single value to reduce.
+local mreduce = function(tbl,func,start,...)
+  if type(tbl) ~= "table" then
+    return func(start,tbl,...) -- tbl itself is the lone element
+  end
+  for _,w in pairs(tbl) do start = func(start,w,...) end
+  return start
+end
+
+-- Returns an iterator over the name,value pairs of tbl whose name matches the
+-- Lua pattern name_match (by default ".*", which matches every name).
+-- Fails with "Needs a table" when tbl is not a table.
+matrix.dict.iterator = function(tbl,name_match)
+  assert(type(tbl) == "table", "Needs a table")
+  local name_match = name_match or ".*"
+  return iterator(pairs(tbl)):
+  filter(function(name,w) return name:find(name_match) end)
+end
+
+for _,name in ipairs{ "scal", "fill", "scalar_add", "pow", "clamp",
+                      "zeros", "ones", "plogp", "log", "log1p", "exp", "sqrt",
+                      "tan", "tanh", "atan", "atanh",
+                      "cos", "cosh", "acos", "acosh",
+                      "sin", "sinh", "asin", "asinh",
+                      "abs", "complement", "sign", "inv",
+                      "prune_subnormal_and_check_normal", } do
+  matrix.dict[name] = function(tbl,...)
+    return mmap(tbl, function(w, name, ...) w[name](w,...) end, name, ...)
   end
-  assert(class.is_a(m, matrix.dict), "Needs a matrix.dict, a matrix, or a table")
-  return m,unwrap
 end
 
-function matrix.dict.meta_instance.__index:to_lua_string(format)
-  local str_tbl = { "matrix.dict{\n" }
-  for name,w in pairs(self) do
-    table.insert(str_tbl,
-		 string.format("[%q] = %s,\n", name, w:to_lua_string(format)))
+matrix.dict.replace = function(tbl1, tbl2)
+  assert(type(tbl1) == "table", "Needs a table as 1st argument")
+  assert(type(tbl2) == "table", "Needs a table as 2nd argument")
+  for name,w1 in pairs(tbl1) do
+    local w2 = tbl2[name]
+    if w2 then tbl1[name] = w2 end
   end
-  table.insert(str_tbl, "}")
-  return table.concat(str_tbl, " ")
+  return tbl1
 end
 
-function matrix.dict.meta_instance:__call(key)
-  return self:find(key)
+matrix.dict.clone = function(tbl)
+  if type(tbl) == "table" then
+    return iterator(pairs(tbl)):
+    map(function(name,w) return name,w:clone() end):table()
+  else
+    return tbl:clone()
+  end
 end
-function matrix.dict.meta_instance:__newindex(key,value)
-  return self:insert(key, value)
+
+matrix.dict.clone_only_dims = function(tbl)
+  if type(tbl) == "table" then
+    return iterator(pairs(tbl)):
+    map(function(name,w) return name,matrix.as(w) end):
+      table()
+  else
+    return matrix.as(tbl)
+  end
 end
-function matrix.dict.meta_instance:__pairs()
-  return self:iterate()
+
+matrix.dict.axpy = function(tbl1,value,tbl2)
+  assert(type(value) == "number", "Needs a number as 2nd argument")
+  if type(tbl1) == "table" and type(tbl2) == "table" then
+    for name,w1 in pairs(tbl1) do
+      local w2 = april_assert(tbl2[name], "Unable to find key %s", name)
+      w1:axpy(value,w2)
+    end
+  else
+    tbl1:axpy(value, tbl2)
+  end
+  return tbl1
+end
+
+matrix.dict.copy = function(tbl1,tbl2)
+  if type(tbl1) == "table" and type(tbl2) == "table" then
+    for name,w1 in pairs(tbl1) do
+      local w2 = april_assert(tbl2[name], "Unable to find key %s", name)
+      w1:copy(w2)
+    end
+  else
+    tbl1:copy(tbl2)
+  end
+  return tbl1
+end
+
+matrix.dict.cmul = function(tbl1,tbl2)
+  if type(tbl1) == "table" and type(tbl2) == "table" then
+    for name,w1 in pairs(tbl1) do
+      local w2 = april_assert(tbl2[name], "Unable to find key %s", name)
+      w1:cmul(w2)
+    end
+  else
+    tbl1:cmul(tbl2)
+  end
+  return tbl1
+end
+
+matrix.dict.norm2 = function(tbl)
+  if type(tbl) == "table" then
+    local n2 = mreduce(tbl, function(acc,w) return acc + w:norm2()^2 end, 0)
+    return math.sqrt(n2)
+  else
+    return tbl:norm2()
+  end
+end
+
+matrix.dict.size = function(tbl)
+  return mreduce(tbl, function(acc,w) return acc + w:size() end, 0)
+end
+
+matrix.dict.dot = function(tbl1,tbl2)
+  if type(tbl1) == "table" and type(tbl2) == "table" then
+    local dot=0
+    for name,w1 in pairs(tbl1) do
+      local w2 = april_assert(tbl2[name], "Unable to find %s key", name)
+      dot = dot + w1:dot(w2)
+    end
+    return dot
+  else
+    return tbl1:dot(tbl2)
+  end
 end
 
 -----------------------------------------------------------------------------
@@ -273,26 +704,6 @@ april_set_doc(matrix, {
 		},
 		outputs = { "A matrix instantiated object" }, })
 
-april_set_doc(matrix.col_major, {
-		class = "function", summary = "constructor",
-		description ={
-		  "Constructor of a multidimensional matrix.",
-		  "The data is stored at col_major order, but from",
-		  "outside is viewed as row_major (for compatibility",
-		  "purposes).",
-		},
-		params = {
-		  "First dimension size",
-		  "Second dimension size",
-		  "...",
-		  "ith dimension size",
-		  "...",
-		  "nth dimension size",
-		  { "A table with values [optional]. The values must be",
-		    "in row major order", }
-		},
-		outputs = { "A matrix instantiated object" }, })
-
 april_set_doc(matrix.read, {
 		class = "method",
 		summary = "It allows to read a matrix from a stream.",
@@ -502,13 +913,6 @@ april_set_doc(matrix.."set_use_cuda", {
 		  "The caller object (itself)",
 		}, })
 
-april_set_doc(matrix.."get_major_order", {
-		class = "method",
-		summary = "Returns the major order of internal data.",
-		outputs = {
-		  "A string with the major order",
-		}, })
-
 april_set_doc(matrix.."dim", {
 		class = "method",
 		summary = "Returns a table with the size of each dimension.",
@@ -618,15 +1022,6 @@ april_set_doc(matrix.join, {
 april_set_doc(matrix.."clone", {
 		class = "method",
 		summary = "Returns a deep copy (clone) of the caller matrix.",
-		description = {
-		  "Returns a deep copy (clone) of the caller matrix.",
-		  "It has the possibility of indicate the major order,",
-		  "and the data will be reordered if necessary.",
-		},
-		params = {
-		  { "A string: col_major or row_major [optional]. By",
-		    "default it is the same major order as the caller matrix" },
-		},
 		outputs = {
 		  "A matrix object (cloned)",
 		}, })
@@ -642,6 +1037,21 @@ april_set_doc(matrix.."transpose", {
 		  "A matrix object (transposed)",
 		}, })
 
+april_set_doc(matrix.."transpose", {
+		class = "method",
+		summary = "Transposes two dimensions.",
+		description = {
+		  "Transposes two dimensions of the caller matrix.",
+		  "The returned matrix is a reference to the original.",
+		},
+                params = {
+                  "One dimension number",
+                  "Second dimension number",
+                },
+		outputs = {
+		  "A matrix object (transposed)",
+		}, })
+
 april_set_doc(matrix.."adjust_range", {
 		class = "method",
 		summary = "Modifies the matrix values IN-PLACE to be at given range",
@@ -1119,10 +1529,6 @@ april_set_doc(matrix.."inv",
 		  "This method computes the inverse of matrix.",
 		  "Check that your matrix is not singular, otherwise",
 		  "the returned matrix won't be correct.",
-		  "It is adapted to work with row_major matrices, but",
-		  "internally they are transformed to col_major, so",
-		  "it is more efficient to compute the inverse over",
-		  "col_major matrices.",
 		},
 		outputs = { "The matrix inverse" },
 	      })
@@ -1133,11 +1539,8 @@ april_set_doc(matrix.."svd",
 		summary = "Computes the SVD of a matrix",
 		description = {
 		  "This method computes the SVD of matrix.",
-		  "It is adapted to work with row_major matrices, but",
-		  "internally they are transformed to col_major, so",
-		  "it is more efficient to compute the SVD over",
-		  "col_major matrices. The computation returns three matrices",
-		  "in col_major, so A=U * S * V'.",
+                  "The computation returns three matrices",
+		  ", so A=U * S * V'.",
 		},
 		outputs = {
 		  "The matrix U",
@@ -1196,21 +1599,21 @@ april_set_doc(matrix.."map",
 april_set_doc(matrix.."lt",
 	      {
 		class = "method",
-		summary = "Returns a 0/1 matrix where values are less than given param. IN-PLACE operation",
+		summary = "Returns a matrixBool with true where values are less than given param.",
 		params = {
 		  "A matrix or a number",
 		},
-		outputs = { "The caller matrix" },
+		outputs = { "A matrixBool instance" },
 	      })
 
 april_set_doc(matrix.."gt",
 	      {
 		class = "method",
-		summary = "Returns a 0/1 matrix where values are greater than given param. IN-PLACE operation",
+		summary = "Returns a  matrixBool with true where values are greater than given param.",
 		params = {
 		  "A matrix or a number",
 		},
-		outputs = { "The caller matrix" },
+		outputs = { "A matrixBool instance" },
 	      })
 
 -------------------------------------------------------------------------
@@ -1264,3 +1667,12 @@ april_set_doc(matrix.__sliding_window__.."iterate",
 		summary     = "Returns an iterator function: for mat in s:iterate() do ... end",
 		outputs     = { "An iterator function" },
 	      })
+
+-----------------------------
+-- DEPRECATED CONSTRUCTORS --
+matrix.row_major = make_deprecated_function("matrix.row_major", "matrix", matrix)
+matrix.col_major = make_deprecated_function("matrix.col_major", "matrix", matrix)
+class.extend(matrix, "get_major_order",
+             make_deprecated_function("matrix.get_major_order", nil,
+                                      function(self) return "row_major" end))
+-----------------------------
diff --git a/packages/basics/matrix/lua_src/matrixBool.lua b/packages/basics/matrix/lua_src/matrixBool.lua
new file mode 100644
index 000000000..426f1494a
--- /dev/null
+++ b/packages/basics/matrix/lua_src/matrixBool.lua
@@ -0,0 +1,105 @@
+class.extend(matrixBool, "t", matrixBool.."transpose")
+
+-- serialization
+matrix.__generic__.__make_all_serialization_methods__(matrixBool, "ascii")
+
+matrixBool.meta_instance.__call =
+  matrix.__generic__.__make_generic_call__()
+
+matrixBool.meta_instance.__newindex =
+  matrix.__generic__.__make_generic_newindex__(matrixBool)
+
+matrixBool.meta_instance.__tostring =
+  matrix.__generic__.__make_generic_print__("MatrixBool",
+                                            function(value)
+                                              return string.format("%s", value and "T" or "F")
+  end)
+
+matrixBool.join =
+  matrix.__generic__.__make_generic_join__(matrixBool)
+
+class.extend(matrixBool, "to_index",
+             april_doc{
+               class = "method",
+               summary = "Returns a matrixInt32 with the list of true indices",
+               description = "Requires a matrix which is rank 1 after squeeze",
+               outputs = { "A matrixInt32 instance, or nil if no value is true", },
+             } ..
+               function(self)
+                 local vec = self:squeeze() -- the rank check applies to the squeezed matrix
+                 assert(#vec:dim() == 1, "Needs a rank 1 matrix")
+                 local ones = vec:count_ones()
+                 if ones == 0 then return nil end -- no true values: there is nothing to index
+                 local result = matrixInt32(ones)
+                 local idx,pos=0,0 -- idx counts visited elements, pos counts true ones
+                 vec:map(function(x)
+                     idx=idx+1
+                     if x then pos=pos+1 result:set(pos,idx) end
+                 end)
+                 assert(pos == ones) -- sanity check: one index stored per true value
+                 return result
+end)
+
+class.extend(matrixBool, "land",
+             april_doc{
+               class = "method",
+               summary = "Computes component-wise AND operation IN-PLACE",
+               params  = {"Another matrixBool instance",},
+               outputs = {"The caller matrix",}
+             } ..
+               function(self,other)
+                 assert(class.is_a(other,matrixBool),
+                        "Needs a matrixBool as argument")
+                 self:map(other,function(x,y)
+                            return x and y
+                 end)
+                 return self
+end)
+
+class.extend(matrixBool, "lor",
+             april_doc{
+               class = "method",
+               summary = "Computes component-wise OR operation IN-PLACE",
+               params  = {"Another matrixBool instance",},
+               outputs = {"The caller matrix",}
+             } ..
+               function(self,other)
+                 assert(class.is_a(other,matrixBool),
+                        "Needs a matrixBool as argument")
+                 self:map(other,function(x,y)
+                            return x or y
+                 end)
+                 return self
+end)
+
+matrixBool.meta_instance.__unm = function(op)
+  return op:clone():complement()
+end
+
+matrixBool.meta_instance.__add = function(op1, op2)
+  assert(class.is_a(op1, matrixBool), "Needs two matrixBool arguments")
+  assert(class.is_a(op2, matrixBool), "Needs two matrixBool arguments")
+  return op1:clone():lor(op2)
+end
+
+matrixBool.meta_instance.__mul = function(op1, op2)
+  assert(class.is_a(op1, matrixBool), "Needs two matrixBool arguments")
+  assert(class.is_a(op2, matrixBool), "Needs two matrixBool arguments")
+  return op1:clone():land(op2)
+end
+
+matrixBool.meta_instance.__eq = function(op1, op2)
+  -- a `matrix` operand on one side is converted to matrixBool before comparing
+  if class.is_a(op1, matrix) then op1 = matrixBool(op1)
+  elseif class.is_a(op2, matrix) then op2 = matrixBool(op2) end
+  assert(class.is_a(op1, matrixBool) and class.is_a(op2, matrixBool),
+         "Needs two matrixBool arguments")
+  local dims1,dims2 = op1:dim(),op2:dim()
+  if #dims1 ~= #dims2 then return false end
+  for i=1,#dims1 do
+    if dims1[i] ~= dims2[i] then return false end
+  end
+  local all_equal = true
+  op1:map(op2,function(x,y) all_equal = all_equal and (x == y) end)
+  return all_equal
+end
diff --git a/packages/basics/matrix/lua_src/matrixChar.lua b/packages/basics/matrix/lua_src/matrixChar.lua
index 03f0c5ec1..c28f0ac19 100644
--- a/packages/basics/matrix/lua_src/matrixChar.lua
+++ b/packages/basics/matrix/lua_src/matrixChar.lua
@@ -1,5 +1,7 @@
+class.extend(matrixChar, "t", matrixChar.."transpose")
+
 -- serialization
-matrix.__generic__.__make_all_serialization_methods__(matrixChar)
+matrix.__generic__.__make_all_serialization_methods__(matrixChar, "ascii")
 
 matrixChar.meta_instance.__tostring = function(self)
   local dims   = self:dim()
diff --git a/packages/basics/matrix/lua_src/matrixComplex.lua b/packages/basics/matrix/lua_src/matrixComplex.lua
index 586017f21..e7722bcc6 100644
--- a/packages/basics/matrix/lua_src/matrixComplex.lua
+++ b/packages/basics/matrix/lua_src/matrixComplex.lua
@@ -1,13 +1,18 @@
+class.extend(matrixComplex, "t", matrixComplex.."transpose")
+
 -- serialization
 matrix.__generic__.__make_all_serialization_methods__(matrixComplex)
 
 matrixComplex.meta_instance.__call =
   matrix.__generic__.__make_generic_call__()
 
+matrixComplex.meta_instance.__newindex =
+  matrix.__generic__.__make_generic_newindex__(matrixComplex)
+
 matrixComplex.meta_instance.__tostring =
   matrix.__generic__.__make_generic_print__("MatrixComplex",
                                             function(value)
-                                              return string.format("%12s",tostring(value))
+                                              return string.format("%26s",tostring(value))
   end)
 
 matrixComplex.join =
@@ -93,28 +98,6 @@ april_set_doc(matrixComplex, {
 		},
 		outputs = { "A matrixComplex instantiated object" }, })
 
-april_set_doc(matrixComplex.col_major, {
-		class = "function", summary = "constructor",
-		description ={
-		  "Constructor of a multidimensional matrixComplex.",
-		  "The data is stored at col_major order, but from",
-		  "outside is viewed as row_major (for compatibility",
-		  "purposes).",
-		},
-		params = {
-		  "First dimension size",
-		  "Second dimension size",
-		  "...",
-		  "ith dimension size",
-		  "...",
-		  "nth dimension size",
-		  { "A table with values [optional]. The values must be",
-		    "in row major order. A valid value is a number, which is",
-		    "taken as real part only, a complex object instance, or a",
-		    "string with the complex number.", },
-		},
-		outputs = { "A matrixComplex instantiated object" }, })
-
 april_set_doc(matrixComplex.."to_lua_string", {
 		class = "method",
 		summary = "It returns a Lua chunk string which is loadable.",
@@ -222,13 +205,6 @@ april_set_doc(matrixComplex.."set_use_cuda", {
 		  "The caller object (itself)",
 		}, })
 
-april_set_doc(matrixComplex.."get_major_order", {
-		class = "method",
-		summary = "Returns the major order of internal data.",
-		outputs = {
-		  "A string with the major order",
-		}, })
-
 april_set_doc(matrixComplex.."dim", {
 		class = "method",
 		summary = "Returns a table with the size of each dimension.",
@@ -319,15 +295,6 @@ april_set_doc(matrixComplex.."select", {
 april_set_doc(matrixComplex.."clone", {
 		class = "method",
 		summary = "Returns a deep copy (clone) of the caller matrixComplex.",
-		description = {
-		  "Returns a deep copy (clone) of the caller matrixComplex.",
-		  "It has the possibility of indicate the major order,",
-		  "and the data will be reordered if necessary.",
-		},
-		params = {
-		  { "A string: col_major or row_major [optional]. By",
-		    "default it is the same major order as the caller matrixComplex" },
-		},
 		outputs = {
 		  "A matrixComplex object (cloned)",
 		}, })
@@ -550,8 +517,7 @@ april_set_doc(matrixComplex.."to_float",
 		  "Converts the given matrixComplex to a matrix (with float)",
 		  "with the one additional dimension of size two, where the",
 		  "real and imaginary part will be stored together.",
-		  "The extra dimension will be the last if the original",
-		  "matrix is in row_major, or the first if its in col_major.",
+		  "The extra dimension will be the last.",
 		},
 		outputs = { "A matrix instance" },
 })
diff --git a/packages/basics/matrix/lua_src/matrixDouble.lua b/packages/basics/matrix/lua_src/matrixDouble.lua
index 78dbbac7b..378eee16d 100644
--- a/packages/basics/matrix/lua_src/matrixDouble.lua
+++ b/packages/basics/matrix/lua_src/matrixDouble.lua
@@ -1,13 +1,18 @@
+class.extend(matrixDouble, "t", matrixDouble.."transpose")
+
 -- serialization
 matrix.__generic__.__make_all_serialization_methods__(matrixDouble)
 
 matrixDouble.meta_instance.__call =
   matrix.__generic__.__make_generic_call__()
 
+matrixDouble.meta_instance.__newindex =
+  matrix.__generic__.__make_generic_newindex__(matrixDouble)
+
 matrixDouble.meta_instance.__tostring =
   matrix.__generic__.__make_generic_print__("MatrixDouble",
                                             function(value)
-                                              return string.format("% -11.6g", value)
+                                              return string.format("% -15.6g", value)
   end)
 
 matrixDouble.join =
diff --git a/packages/basics/matrix/lua_src/matrixInt32.lua b/packages/basics/matrix/lua_src/matrixInt32.lua
index df72cf200..93851c04c 100644
--- a/packages/basics/matrix/lua_src/matrixInt32.lua
+++ b/packages/basics/matrix/lua_src/matrixInt32.lua
@@ -1,9 +1,14 @@
+class.extend(matrixInt32, "t", matrixInt32.."transpose")
+
 -- serialization
 matrix.__generic__.__make_all_serialization_methods__(matrixInt32)
 
 matrixInt32.meta_instance.__call =
   matrix.__generic__.__make_generic_call__()
 
+matrixInt32.meta_instance.__newindex =
+  matrix.__generic__.__make_generic_newindex__(matrixInt32)
+
 matrixInt32.meta_instance.__tostring =
   matrix.__generic__.__make_generic_print__("MatrixInt32",
                                             function(value)
@@ -12,3 +17,16 @@ matrixInt32.meta_instance.__tostring =
 
 matrixInt32.join =
   matrix.__generic__.__make_generic_join__(matrixInt32)
+
+matrixInt32.meta_instance.__eq = function(op1, op2)
+  -- a plain number never compares equal to a matrixInt32
+  if type(op1) == "number" or type(op2) == "number" then return false end
+  local dims1,dims2 = op1:dim(),op2:dim()
+  if #dims1 ~= #dims2 then return false end
+  for i=1,#dims1 do
+    if dims1[i] ~= dims2[i] then return false end
+  end
+  local all_equal = true
+  op1:map(op2, function(x,y) all_equal = all_equal and (x==y) end)
+  return all_equal
+end
diff --git a/packages/basics/matrix/lua_src/sparse_matrix.lua b/packages/basics/matrix/lua_src/sparse_matrix.lua
index 62f961c90..808e72ae1 100644
--- a/packages/basics/matrix/lua_src/sparse_matrix.lua
+++ b/packages/basics/matrix/lua_src/sparse_matrix.lua
@@ -58,7 +58,18 @@ matrix.sparse.meta_instance.__mul = function(op1, op2)
   if type(op2) == "number" then return op1:clone():scal(op2)
   elseif type(op1) == "number" then return op2:clone():scal(op1)
   else
-    error("matrix.sparse only could be multiplied by scalars")
+    if class.is_a(op1,matrix) then
+      local res = matrix(op1:dim(1),op2:dim(2))
+      res:transpose():sparse_mm{ alpha=1.0, beta=0.0, A=op2, B=op1,
+                                 trans_A=true, trans_B=true }
+      return res
+    elseif class.is_a(op2,matrix) then
+      local res = matrix(op1:dim(1),op2:dim(2))
+      res:sparse_mm{ alpha=1.0, beta=0.0, A=op1, B=op2 }
+      return res
+    else
+      error("matrix.sparse only could be multiplied by scalars or matrix")
+    end
   end
 end
 
diff --git a/packages/basics/matrix/package.lua b/packages/basics/matrix/package.lua
index aea9d5a3f..b5bc193e5 100644
--- a/packages/basics/matrix/package.lua
+++ b/packages/basics/matrix/package.lua
@@ -17,7 +17,10 @@
      name = "test",
      lua_unit_test{
        file={
+         "test/test_gemm.lua",
+         "test/test_gemv.lua",
 	 "test/test_matrix_inv_solve.lua",
+	 "test/test_matrix_fft.lua",
 	 "test/test_matrix_math.lua",
 	 "test/test_sparse_matrix.lua",
 	 "test/test_convolution.lua",
@@ -34,6 +37,7 @@
      provide_bind{ file = "binding/bind_matrix_double.lua.cc", dest_dir = "include" },
      provide_bind{ file = "binding/bind_matrix_int32.lua.cc", dest_dir = "include" },
      provide_bind{ file = "binding/bind_matrix_char.lua.cc", dest_dir = "include" },
+     provide_bind{ file = "binding/bind_matrix_bool.lua.cc", dest_dir = "include" },
      provide_bind{ file = "binding/bind_referenced_vector.lua.cc", dest_dir = "include" }
    },
    target{
@@ -78,6 +82,10 @@
         file = "binding/bind_matrix_char.lua.cc",
         dest_dir = "build",
      },
+     build_bind{
+        file = "binding/bind_matrix_bool.lua.cc",
+        dest_dir = "build",
+     },
      build_bind{
         file = "binding/bind_referenced_vector.lua.cc",
         dest_dir = "build",
diff --git a/packages/basics/matrix/test/test_convolution.lua b/packages/basics/matrix/test/test_convolution.lua
index 8f2881c9d..ff1aaa621 100644
--- a/packages/basics/matrix/test/test_convolution.lua
+++ b/packages/basics/matrix/test/test_convolution.lua
@@ -7,8 +7,8 @@ local aux = matrix(1,1,3,3):linear()
 local aux = matrix.join(1,aux,aux)
 local k = matrix(2,1,2,2):linear()
 local o = matrix.ext.convolution(aux, { kernel=k, D=2 })
-local o2 = matrix.ext.convolution(aux:clone("col_major"),
-				  { kernel=k:clone("col_major"), D=2 })
+local o2 = matrix.ext.convolution(aux:clone(),
+				  { kernel=k:clone(), D=2 })
 
 --print(o)
 --print(o2)
@@ -28,13 +28,9 @@ T("MatrixConvolutionBasicTest",
     local target_o = matrix.join(1, target_o, target_o, target_o)
     --
     local o  = matrix.ext.convolution(m, { kernel=k, D=2 })
-    local o2 = matrix.ext.convolution(m:clone("col_major"),
-				      { kernel=k:clone("col_major"), D=2 })
     --
     --print(o)
-    check.eq(o,  target_o)
-    --print(o2)
-    check.eq(o2, target_o:clone("col_major"))
+    check.eq(o, target_o)
 end)
 
 T("MatrixConvolutionMediumTest",
@@ -66,20 +62,15 @@ T("MatrixConvolutionMediumTest",
                                 -28,   3, -38, -11,
     })
 
-    local target_o2 = target_o:clone("col_major")
-    local m2 = m:clone("col_major")
-    local k2 = k:clone("col_major")
     -------------------------------------------------------------------------
     local o = matrix.ext.convolution(m, { kernel=k, D=2 })
-    local o2 = matrix.ext.convolution(m2, { kernel=k2, D=2 })
     local c = ann.components.convolution{ kernel = { 3,3,3 }, n=2,
                                           weights = "w1" }
-    c:build{ weights = matrix.dict{ w1 = k2:rewrap(2, k:size()/2) } }
-    local cnn_o = c:forward(m2):get_matrix()
+    c:build{ weights = { w1 = k:rewrap(2, k:size()/2) } }
+    local cnn_o = c:forward(m)
     --
     check.eq( o, target_o )
-    check.eq( o2, target_o2 )
-    check.eq( cnn_o, target_o2 )
+    check.eq( cnn_o, target_o )
 end)
 
 if #arg > 0 then
diff --git a/packages/basics/matrix/test/test_gemm.lua b/packages/basics/matrix/test/test_gemm.lua
new file mode 100644
index 000000000..fc003180a
--- /dev/null
+++ b/packages/basics/matrix/test/test_gemm.lua
@@ -0,0 +1,54 @@
+local check=utest.check
+local T=utest.test
+
+T("GEMMTest", function()
+    -- Checks matrix products (operator * and gemm) against hand-computed results.
+    local t1 = { 1, 2, 3,
+		 4, 5, 6 }
+    local t2 = { 3, 4,
+		 1, 7,
+		 9, 6 }
+    -- expected products; the "p" suffix marks a transposed operand
+    local t1_t2   = matrix(2,2,{ 32, 36,
+				 71, 87 })
+    local t2_t1   = matrix(3,3,{ 19, 26, 33,
+				 29, 37, 45,
+				 33, 48, 63 })
+    local t1p_t2p = matrix(3,3,{ 19, 29, 33,
+				 26, 37, 48,
+				 33, 45, 63 })
+    local t2p_t1p = matrix(2,2,{ 32, 71,
+				 36, 87 })
+
+    local A = matrix(2,3,t1)
+    local B = matrix(3,2,t2)
+    -- operator *
+    check.eq(A*B, t1_t2)
+    check.eq(B*A, t2_t1)
+    check.eq(A:t()*B:t(), t1p_t2p)
+    check.eq(B:t()*A:t(), t2p_t1p)
+    -- gemm over plain destination matrices
+    check.eq(matrix(2,2):gemm{ A=A, B=B, alpha=1, beta=0 }, t1_t2)
+    check.eq(matrix(3,3):gemm{ A=B, B=A, alpha=1, beta=0 }, t2_t1)
+    check.eq(matrix(3,3):gemm{ A=A:t(), B=B:t(), alpha=1, beta=0 }, t1p_t2p)
+    check.eq(matrix(2,2):gemm{ A=B:t(), B=A:t(), alpha=1, beta=0 }, t2p_t1p)
+    -- gemm with trans_A/trans_B flags
+    check.eq(matrix(2,2):gemm{ A=A:t(), B=B:t(), trans_A=true, trans_B=true, alpha=1, beta=0 }, t1_t2)
+    check.eq(matrix(3,3):gemm{ A=B:t(), B=A:t(), trans_A=true, trans_B=true, alpha=1, beta=0 }, t2_t1)
+    check.eq(matrix(3,3):gemm{ A=A, B=B, trans_A=true, trans_B=true, alpha=1, beta=0 }, t1p_t2p)
+    check.eq(matrix(2,2):gemm{ A=B, B=A, trans_A=true, trans_B=true, alpha=1, beta=0 }, t2p_t1p)
+    -- gemm writing into a transposed destination
+    check.eq(matrix(2,2):transpose():gemm{ A=A, B=B, alpha=1, beta=0 }, t1_t2)
+    check.eq(matrix(3,3):transpose():gemm{ A=B, B=A, alpha=1, beta=0 }, t2_t1)
+    check.eq(matrix(3,3):transpose():gemm{ A=A:t(), B=B:t(), alpha=1, beta=0 }, t1p_t2p)
+    check.eq(matrix(2,2):transpose():gemm{ A=B:t(), B=A:t(), alpha=1, beta=0 }, t2p_t1p)
+    -- transposed destination combined with trans_A/trans_B flags
+    check.eq(matrix(2,2):transpose():gemm{ A=A:t(), B=B:t(), trans_A=true, trans_B=true, alpha=1, beta=0 }, t1_t2)
+    check.eq(matrix(3,3):transpose():gemm{ A=B:t(), B=A:t(), trans_A=true, trans_B=true, alpha=1, beta=0 }, t2_t1)
+    check.eq(matrix(3,3):transpose():gemm{ A=A, B=B, trans_A=true, trans_B=true, alpha=1, beta=0 }, t1p_t2p)
+    check.eq(matrix(2,2):transpose():gemm{ A=B, B=A, trans_A=true, trans_B=true, alpha=1, beta=0 }, t2p_t1p)
+    -- incompatible shapes (2x3 * 2x3 and 3x2 * 3x2) must raise an error
+    check.errored(function() return A*A end)
+    check.errored(function() return B*B end)
+    
+end)
diff --git a/packages/basics/matrix/test/test_gemv.lua b/packages/basics/matrix/test/test_gemv.lua
new file mode 100644
index 000000000..83712f4f3
--- /dev/null
+++ b/packages/basics/matrix/test/test_gemv.lua
@@ -0,0 +1,26 @@
+local check=utest.check
+local T=utest.test
+
+T("GEMVTest", function()
+    -- Checks gemv against hand-computed products of a 2x3 matrix and two vectors.
+    local t1 = { 1, 2, 3,
+		 4, 5, 6 }
+    local t2 = { 3, 1, 9 }
+    local t3 = { 9, 7 }
+    -- expected results: t1_t2 = A*t2 and t1p_t3 = A'*t3
+    local t1_t2  = matrix(2,{ 32, 71 })
+    local t1p_t3 = matrix(3,{ 37, 53, 69 })
+
+    local A = matrix(2,3,t1)
+    local B = matrix(t2)
+    local C = matrix(t3)
+    -- plain A, and A transposed explicitly with A:t()
+    check.eq(matrix(2):gemv{ A=A, X=B, alpha=1, beta=0 }, t1_t2)
+    check.eq(matrix(3):gemv{ A=A:t(), X=C, alpha=1, beta=0 }, t1p_t3)
+    -- trans_A=true: A:t() is expected to act as A, and A as A'
+    check.eq(matrix(2):gemv{ A=A:t(), X=B, trans_A=true, alpha=1, beta=0 }, t1_t2)
+    check.eq(matrix(3):gemv{ A=A, X=C, trans_A=true, alpha=1, beta=0 }, t1p_t3)
+    -- mismatched shapes must raise an error
+    check.errored(function() return matrix(3):gemv{ A=A:t(), X=C, trans_A=true, alpha=1, beta=0 } end)
+    check.errored(function() return matrix(3):gemv{ A=A, X=C, alpha=1, beta=0 } end)
+end)
diff --git a/packages/basics/matrix/test/test_matrix_fft.lua b/packages/basics/matrix/test/test_matrix_fft.lua
new file mode 100644
index 000000000..4a1fc83d9
--- /dev/null
+++ b/packages/basics/matrix/test/test_matrix_fft.lua
@@ -0,0 +1,14 @@
+local check = utest.check
+local T = utest.test
+
+T("FFTTest", function() -- expects peaks at positions 1, 2, 3, 4 and 256 for a sum of five sines
+    local sin1 = matrix(512):linspace(0,1*math.pi):sin()
+    local sin2 = matrix(512):linspace(0,2*math.pi):sin()
+    local sin3 = matrix(512):linspace(0,3*math.pi):sin()
+    local sin4 = matrix(512):linspace(0,4*math.pi):sin()
+    local sin256 = matrix(512):linspace(0,512*math.pi):sin()
+    local sum  = (sin1 + sin2 + sin3 + sin4 + sin256)/5 -- average of the five signals
+    local fft  = matrix.ext.real_fftwh(sum, 512, 512):log():clamp(0,math.huge) -- log of the transform, clamped to [0, inf)
+    local peaks = fft:gt(3):to_index() -- positions whose value is greater than 3
+    check.eq( peaks, matrixInt32{1, 2, 3, 4, 256} )
+end)
diff --git a/packages/basics/matrix/test/test_matrix_inv_solve.lua b/packages/basics/matrix/test/test_matrix_inv_solve.lua
index 287ebd977..149c56ea6 100644
--- a/packages/basics/matrix/test/test_matrix_inv_solve.lua
+++ b/packages/basics/matrix/test/test_matrix_inv_solve.lua
@@ -2,19 +2,20 @@ mathcore.set_use_cuda_default(util.is_cuda_available())
 --
 local check = utest.check
 local T = utest.test
--- inverse
-local M = matrix.col_major
-local m = M(2,2, {
-		-2, 1,
-		-1, 1,
-		 })
-local b = M(2,1, {
-	      4,
-	      1
-		 })
-local c = m:inv()*b
-T("InverseTest", function() check.eq(c, M(2,1,{-3,-2})) end)
-
--- pseudo-inverse
-local c = m:pinv()*b
-T("PseudoInverseTest", function() check.eq(c, M(2,1,{-3,-2})) end)
+T("InverseTest", function()
+    -- inverse
+    local M = matrix
+    local m = M(2,2, {
+                    -2, 1,
+                    -1, 1,
+    })
+    local b = M(2,1, {
+                  4,
+                  1
+    })
+    local c = m:inv()*b
+    check.eq(c, M(2,1,{-3,-2}), "inverse")
+    -- pseudo-inverse
+    local c = m:pinv()*b
+    check.eq(c, M(2,1,{-3,-2}), "pseudo-inverse")
+end)
diff --git a/packages/basics/matrix/test/test_matrix_math.lua b/packages/basics/matrix/test/test_matrix_math.lua
index e2e5077bb..e654f2178 100644
--- a/packages/basics/matrix/test/test_matrix_math.lua
+++ b/packages/basics/matrix/test/test_matrix_math.lua
@@ -1,3 +1,5 @@
+-- TODO: implement unit tests for index, indexCopy, indexFill, operator [{}]
+
 -- forces the use of CUDA
 mathcore.set_use_cuda_default(util.is_cuda_available())
 --
@@ -5,7 +7,7 @@ local check = utest.check
 local T = utest.test
 --
 
-if not util.is_cuda_available() then
+-- if not util.is_cuda_available() then
   T("MathOpTest",
     function()
       local a = matrix(2,4,3,{
@@ -23,13 +25,13 @@ if not util.is_cuda_available() then
       
       local a = matrix.fromString[[
 1 3
-ascii col_major
+ascii
 1 2 3
 ]]
 
       local b = matrix.fromString[[
 3 1
-ascii col_major
+ascii
 1
 4
 7
@@ -38,11 +40,11 @@ ascii col_major
       local c = a*b
       check.eq(c:get(1,1), 1*1+2*4+3*7, "dot product")
       
-      check.eq(b*a, matrix.col_major(3,3,{
-                                       1,  2,  3,
-                                       4,  8, 12,
-                                       7, 14, 21,
-                                    }),
+      check.eq(b*a, matrix(3,3,{
+                             1,  2,  3,
+                             4,  8, 12,
+                             7, 14, 21,
+                          }),
                "cross product")
 
       local d = matrix.fromString[[
@@ -53,12 +55,12 @@ ascii
 7 8 9
 ]]
 
-      check.eq(d:clone("col_major"), matrix.col_major(3,3,{
-                                                        1, 2, 3,
-                                                        4, 5, 6,
-                                                        7, 8, 9,
-                                                     }),
-               "col_major clone")
+      check.eq(d:clone(), matrix(3,3,{
+                                   1, 2, 3,
+                                   4, 5, 6,
+                                   7, 8, 9,
+                                }),
+               "clone")
       
       check(d:transpose(), matrix(3,3,{
                                     1, 4, 7,
@@ -66,6 +68,13 @@ ascii
                                     3, 6, 9,
                                  }),
             "transpose")
+
+      check(d:transpose():clone(), matrix(3,3,{
+                                            1, 4, 7,
+                                            2, 5, 8,
+                                            3, 6, 9,
+                                         }),
+            "transpose clone")
       
       local e = d * d 
       check(e, matrix(3,3,{
@@ -75,63 +84,68 @@ ascii
                      }),
             "matrix mult *")
 
-      local d = d:clone("col_major")
-      local e = d * d
-      check(e, matrix.col_major(3,3,{
-                                  30,   36,  42,
-                                  66,   81,  96,
-                                  102, 126, 150,
-                               }),
-            "matrix mult * in col_major")
-
       local h = d:slice({2,2},{2,2})
-      check(h, matrix.col_major(2,2,{
-                                  5, 6,
-                                  8, 9,
-                               }),
+      check(h, matrix(2,2,{
+                        5, 6,
+                        8, 9,
+                     }),
             "matrix slice")
 
       local h = d:slice({2,2},{2,2},true)
-      check(h, matrix.col_major(2,2,{
-                                  5, 6,
-                                  8, 9,
-                               }),
+      check(h, matrix(2,2,{
+                        5, 6,
+                        8, 9,
+                     }),
             "matrix slice clone")
 
       local e = h * h
-      check(e, matrix.col_major(2,2,{
-                                  73,  84,
-                                  112, 129,
-                               }),
+      check(e, matrix(2,2,{
+                        73,  84,
+                        112, 129,
+                     }),
             "matrix slice mul *")
 
-      local l = matrix.col_major(2,2):fill(4) + h
-      check(l, matrix.col_major(2,2,{
-                                  9, 10,
-                                  12, 13,
-                               }),
+      local l = matrix(2,2):fill(4) + h
+      check(l, matrix(2,2,{
+                        9, 10,
+                        12, 13,
+                     }),
             "matrix fill and slice add +")
 
       local g = matrix(3,2,{1,2,
                             3,4,
                             5,6})
-      check(g:transpose():clone("col_major"), matrix.col_major(2,3,{
-                                                                 1, 3, 5,
-                                                                 2, 4, 6,
-                                                              }),
-            "transpose + col_major clone")
+      check(g:transpose():clone(), matrix(2,3,{
+                                            1, 3, 5,
+                                            2, 4, 6,
+                                         }),
+            "transpose + clone")
       
-      check(g:transpose():clone("col_major"):clone("row_major"), matrix(2,3,{
-                                                                          1, 3, 5,
-                                                                          2, 4, 6,
-                                                                       }),
-            "transpose + col_major clone + row_major clone")
+      check(g:transpose():clone():transpose():clone(), matrix(2,3,{
+                                                                1, 3, 5,
+                                                                2, 4, 6,
+                                                             }),
+            "transpose + clone + transpose + clone")
       
       check(g:transpose(), matrix(2,3,{
                                     1, 3, 5,
                                     2, 4, 6,
                                  }),
             "transpose")
+
+      check(g:transpose():clone(), matrix(2,3,{
+                                            1, 3, 5,
+                                            2, 4, 6,
+                                         }),
+            "transpose clone")
+
+      local h = matrix(table.unpack(g:transpose():dim()))
+      
+      check(h:copy(g:transpose()), matrix(2,3,{
+                                            1, 3, 5,
+                                            2, 4, 6,
+                                         }),
+            "copy transposed")
       
       local j = g:transpose() * g
       check(j, matrix(2,2,{
@@ -149,143 +163,143 @@ ascii
                         35, 44,
                         44, 56,
                      }),
-            "gemm in row_major")
+            "gemm")
       
-      local j = matrix.col_major(2,2):gemm{
+      local j = matrix(2,2):transpose():gemm{
         trans_A=true, trans_B=false,
-        alpha=1.0, A=g:clone("col_major"), B=g:clone("col_major"),
+        alpha=1.0, A=g, B=g,
         beta=0.0
-                                          }
-      check(j, matrix.col_major(2,2,{
-                                  35, 44,
-                                  44, 56,
-                               }),
+                                            }
+      check(j, matrix(2,2,{
+                        35, 44,
+                        44, 56,
+                     }),
             "gemm in col_major")
   end)
-else
-  T("CudaMathOpTest",
-    function()
-      local a = matrix.col_major(2,4,3,{
-                                   0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0, 0.1, 0.2,
-                                   0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 0.8, 0.7, 0.6, 0.5, 0.4,
-      })
-      ca = a:select(2,2):complement()
-      check.eq(ca,
-               matrix.col_major(2,4,3,{
-                                  0.9, 0.8, 0.7, 0.6, 0.5, 0.4, 0.3, 0.2, 0.1, 0.0, 0.9, 0.8,
-                                  0.7, 0.6, 0.5, 0.4, 0.3, 0.2, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6,
-               }):select(2,2),
-               "CUDA select")
+-- else
+--   T("CudaMathOpTest",
+--     function()
+--       local a = matrix(2,4,3,{
+--                          0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0, 0.1, 0.2,
+--                          0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 0.8, 0.7, 0.6, 0.5, 0.4,
+--       })
+--       ca = a:select(2,2):complement()
+--       check.eq(ca,
+--                matrix(2,4,3,{
+--                         0.9, 0.8, 0.7, 0.6, 0.5, 0.4, 0.3, 0.2, 0.1, 0.0, 0.9, 0.8,
+--                         0.7, 0.6, 0.5, 0.4, 0.3, 0.2, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6,
+--                }):select(2,2),
+--                "CUDA select")
       
       
-      local a = matrix.fromString[[
-1 3
-ascii col_major
-1 2 3
-]]
-
-      local b = matrix.fromString[[
-3 1
-ascii col_major
-1
-4
-7
-]]
-      local c = a*b
-      check.eq(c:get(1,1), 1*1+2*4+3*7, "CUDA dot product")
+--       local a = matrix.fromString[[
+-- 1 3
+-- ascii col_major
+-- 1 2 3
+-- ]]
+
+--       local b = matrix.fromString[[
+-- 3 1
+-- ascii col_major
+-- 1
+-- 4
+-- 7
+-- ]]
+--       local c = a*b
+--       check.eq(c:get(1,1), 1*1+2*4+3*7, "CUDA dot product")
       
-      check.eq(b*a, matrix.col_major(3,3,{
-                                       1,  2,  3,
-                                       4,  8, 12,
-                                       7, 14, 21,
-                                    }),
-               "CUDA cross product")
+--       check.eq(b*a, matrix.col_major(3,3,{
+--                                        1,  2,  3,
+--                                        4,  8, 12,
+--                                        7, 14, 21,
+--                                     }),
+--                "CUDA cross product")
       
-      local d = matrix.fromString[[
-3 3
-ascii col_major
-1 2 3
-4 5 6
-7 8 9
-]]
-      check.eq(d:transpose(), matrix.col_major(3,3,{
-                                                 1, 4, 7,
-                                                 2, 5, 8,
-                                                 3, 6, 9,
-                                              }),
-               "CUDA transpose")
+--       local d = matrix.fromString[[
+-- 3 3
+-- ascii col_major
+-- 1 2 3
+-- 4 5 6
+-- 7 8 9
+-- ]]
+--       check.eq(d:transpose(), matrix.col_major(3,3,{
+--                                                  1, 4, 7,
+--                                                  2, 5, 8,
+--                                                  3, 6, 9,
+--                                               }),
+--                "CUDA transpose")
       
-      check(d:clone(), matrix(3,3,{
-                                1, 2, 3,
-                                4, 5, 6,
-                                7, 8, 9,
-                                 }),
-            "CUDA clone")
+--       check(d:clone(), matrix(3,3,{
+--                                 1, 2, 3,
+--                                 4, 5, 6,
+--                                 7, 8, 9,
+--                                  }),
+--             "CUDA clone")
       
-      local e = d * d 
-      check(e, matrix.col_major(3,3,{
-                                  30,   36,  42,
-                                  66,   81,  96,
-                                  102, 126, 150,
-                               }),
-            "CUDA matrix mult *")
+--       local e = d * d 
+--       check(e, matrix.col_major(3,3,{
+--                                   30,   36,  42,
+--                                   66,   81,  96,
+--                                   102, 126, 150,
+--                                }),
+--             "CUDA matrix mult *")
       
-      local h = d:slice({2,2},{2,2})
-      check(h, matrix.col_major(2,2,{
-                                  5, 6,
-                                  8, 9,
-                               }),
-            "CUDA matrix slice")
-
-      local h = d:slice({2,2},{2,2},true)
-      check(h, matrix.col_major(2,2,{
-                                  5, 6,
-                                  8, 9,
-                               }),
-            "CUDA matrix slice clone")
-
-      local e = h * h
-      check(e, matrix.col_major(2,2,{
-                                  73,  84,
-                                  112, 129,
-                               }),
-            "CUDA matrix slice mul *")
+--       local h = d:slice({2,2},{2,2})
+--       check(h, matrix.col_major(2,2,{
+--                                   5, 6,
+--                                   8, 9,
+--                                }),
+--             "CUDA matrix slice")
+
+--       local h = d:slice({2,2},{2,2},true)
+--       check(h, matrix.col_major(2,2,{
+--                                   5, 6,
+--                                   8, 9,
+--                                }),
+--             "CUDA matrix slice clone")
+
+--       local e = h * h
+--       check(e, matrix.col_major(2,2,{
+--                                   73,  84,
+--                                   112, 129,
+--                                }),
+--             "CUDA matrix slice mul *")
       
-      local l = matrix.col_major(2,2):fill(4) + h
-      check(l, matrix.col_major(2,2,{
-                                  9, 10,
-                                  12, 13,
-                               }),
-            "CUDA matrix fill and slice add +")
-
-      local g = matrix.col_major(3,2,{1,2,
-                                      3,4,
-                                      5,6})
-      check(g:transpose():clone(), matrix.col_major(2,3,{
-                                                      1, 3, 5,
-                                                      2, 4, 6,
-                                                   }),
-            "CUDA transpose + clone")
+--       local l = matrix.col_major(2,2):fill(4) + h
+--       check(l, matrix.col_major(2,2,{
+--                                   9, 10,
+--                                   12, 13,
+--                                }),
+--             "CUDA matrix fill and slice add +")
+
+--       local g = matrix.col_major(3,2,{1,2,
+--                                       3,4,
+--                                       5,6})
+--       check(g:transpose():clone(), matrix.col_major(2,3,{
+--                                                       1, 3, 5,
+--                                                       2, 4, 6,
+--                                                    }),
+--             "CUDA transpose + clone")
             
-      local j = g:transpose() * g
-      check(j, matrix.col_major(2,2,{
-                                  35, 44,
-                                  44, 56,
-                               }),
-            "CUDA transpose mul *")
-
-      local j = matrix.col_major(2,2):gemm{
-        trans_A=true, trans_B=false,
-        alpha=1.0, A=g, B=g,
-        beta=0.0
-                                          }
-      check(j, matrix.col_major(2,2,{
-                                  35, 44,
-                                  44, 56,
-                               }),
-            "CUDA gemm")
-  end)
-end
+--       local j = g:transpose() * g
+--       check(j, matrix.col_major(2,2,{
+--                                   35, 44,
+--                                   44, 56,
+--                                }),
+--             "CUDA transpose mul *")
+
+--       local j = matrix.col_major(2,2):gemm{
+--         trans_A=true, trans_B=false,
+--         alpha=1.0, A=g, B=g,
+--         beta=0.0
+--                                           }
+--       check(j, matrix.col_major(2,2,{
+--                                   35, 44,
+--                                   44, 56,
+--                                }),
+--             "CUDA gemm")
+--   end)
+-- end
 
 ---------------------------------------------------------------
 ---------------------------------------------------------------
@@ -293,30 +307,30 @@ end
 
 T("SVDTest",
   function()
-    local m = matrix.col_major(4,5,{1,0,0,0,2,
-                                    0,0,3,0,0,
-                                    0,0,0,0,0,
-                                    0,4,0,0,0})
+    local m = matrix(4,5,{1,0,0,0,2,
+                          0,0,3,0,0,
+                          0,0,0,0,0,
+                          0,4,0,0,0})
     local U,S,V = m:svd()
-    check(U, matrix.col_major(4,4,
-                              {
-                                0,0,1, 0,
-                                0,1,0, 0,
-                                0,0,0,-1,
-                                1,0,0, 0,
-    }),
-    "SVD U matrix")
-    check(S:to_dense(), matrix.col_major(4,{4,3,2.23607,0}):diagonalize(),
+    check(U, matrix(4,4,
+                    {
+                      0,0,1, 0,
+                      0,1,0, 0,
+                      0,0,0,-1,
+                      1,0,0, 0,
+                   }),
+          "SVD U matrix")
+    check(S:to_dense(), matrix(4,{4,3,2.23607,0}):diagonalize(),
           "SVD S matrix")
-    check(V, matrix.col_major(5,5,
-                              {
-                                0,1,0,0,0,
-                                0,0,1,0,0,
-                                0.447214,0,0,0,0.894427,
-                                0,0,0,1,0,
-                                  -0.894427,0,0,0,0.447214,
-    }),
-    "SVD V matrix")
+    check(V, matrix(5,5,
+                    {
+                      0,1,0,0,0,
+                      0,0,1,0,0,
+                      0.447214,0,0,0,0.894427,
+                      0,0,0,1,0,
+                        -0.894427,0,0,0,0.447214,
+                   }),
+          "SVD V matrix")
 end)
 
 ---------------------------------------------------------------
@@ -332,11 +346,11 @@ T("SliceTest",
     local subm = m:slice({1,4},{6,m:dim(2)-3})
     check.eq(subm, m(":6","4:"), "slice() 3")
     --
-    local m = matrix.col_major(1,4):linear()
-    check.eq(m:slice({1,1},{1,2},true), matrix.col_major(1,2,{0,1}), "slice 4")
-    check.eq(m:slice({1,3},{1,2},true), matrix.col_major(1,2,{2,3}), "slice 5")
-    check.eq(m:slice({1,1},{1,2}), matrix.col_major(1,2,{0,1}), "slice 6")
-    check.eq(m:slice({1,3},{1,2}), matrix.col_major(1,2,{2,3}), "slice 7")
+    local m = matrix(1,4):transpose():linear()
+    check.eq(m:slice({1,1},{2,1},true), matrix(2,1,{0,1}), "slice 4")
+    check.eq(m:slice({3,1},{2,1},true), matrix(2,1,{2,3}), "slice 5")
+    check.eq(m:slice({1,1},{2,1}), matrix(2,1,{0,1}), "slice 6")
+    check.eq(m:slice({3,1},{2,1}), matrix(2,1,{2,3}), "slice 7")
     --
     local m = matrix(1,4):linear()
     check.eq(m:slice({1,1},{1,2},true), matrix(1,2,{0,1}), "slice 8")
@@ -379,18 +393,18 @@ os.remove(tmpname)
 T("EQandNEQTest", function()
     local m   = load_csv()
     local def = 0.0/0.0
-    check.eq(m:clone():eq(def),
-             matrix(3,5,{0,0,0,1,0,0,0,0,0,1,0,1,1,1,0}), "NAN eq")
-    check.eq(m:clone():neq(def),
-             matrix(3,5,{1,1,1,0,1,1,1,1,1,0,1,0,0,0,1}), "NAN neq")
+    check.eq(m:eq(def),
+             matrixBool(matrix(3,5,{0,0,0,1,0,0,0,0,0,1,0,1,1,1,0})), "NAN eq")
+    check.eq(m:neq(def),
+             matrixBool(matrix(3,5,{1,1,1,0,1,1,1,1,1,0,1,0,0,0,1})), "NAN neq")
     
-    check.eq(m:clone():eq(4),
-             matrix(3,5,{0,0,0,0,1,0,0,0,0,0,1,0,0,0,0}), "4 eq")
-    check.eq(m:clone():neq(4),
-             matrix(3,5,{1,1,1,1,0,1,1,1,1,1,0,1,1,1,1}), "4 neq")
+    check.eq(m:eq(4),
+             matrixBool(matrix(3,5,{0,0,0,0,1,0,0,0,0,0,1,0,0,0,0})), "4 eq")
+    check.eq(m:neq(4),
+             matrixBool(matrix(3,5,{1,1,1,1,0,1,1,1,1,1,0,1,1,1,1})), "4 neq")
 
-    check.eq(m:clone():eq(m), matrix(3,5):ones(), "eq m")
-    check.eq(m:clone():neq(m), matrix(3,5):zeros(), "neq m")
+    check.eq(m:eq(m), matrixBool(3,5):ones(), "eq m")
+    check.eq(m:neq(m), matrixBool(3,5):zeros(), "neq m")
 end)
 
 T("SumTest", function()
@@ -418,7 +432,6 @@ T("SumTest", function()
 end)
 
 T("MaxTest", function()
-    -- IN ROW MAJOR ORDER
     local m = matrix(2, 3, {1, 4, 2,
                             6, 3, 5})
     check.eq(m:max(), 6, "max()")
@@ -452,41 +465,6 @@ T("MaxTest", function()
                                   15, 17, 21, 23 }), "max(3) a")
     check.eq(b:to_float(), matrix(2, 4, 1, { 3, 1, 2, 2,
                                              3, 2, 3, 2 }), "max(3) b")
-    -- IN COL MAJOR ORDER
-    local m = matrix.col_major(2, 3, {1, 4, 2,
-                                      6, 3, 5})
-    check.eq(m:max(), 6, "max() col_major")
-    check.eq(m:max(1), matrix.col_major(1, 3, {6, 4, 5}), "max(1) col_major")
-    check.eq(m:max(2), matrix.col_major(2, 1, {4, 6}), "max(2) col_major")
-
-    local m = matrix.col_major(2, 4, 3, { 12, 14, 18,   8,  5, 6,    7, 16,  9,   10, 24, 1,
-                                          13,  2, 15,   4, 17, 3,   19, 20, 21,   22, 23, 11})
-    check.eq(m:max(), 24, "max() 2 col_major")
-    local a,b = m:max(1)
-    check.eq(a, matrix.col_major(1, 4, 3, { 13,  14, 18,
-                                            8,   17,  6,
-                                            19,  20, 21,
-                                            22,  24, 11 }),
-             "max(1) a col_major")
-    check.eq(b:to_float(), matrix(1, 4, 3, { 2, 1, 1,
-                                             1, 2, 1,
-                                             2, 2, 2,
-                                             2, 1, 2 }),
-             "max(1) b col_major")
-    local a,b = m:max(2)
-    check.eq(a, matrix.col_major(2, 1, 3, { 12, 24, 18,
-                                            22, 23, 21 }),
-             "max(2) a col_major")
-    check.eq(b:to_float(), matrix(2, 1, 3, { 1, 4, 1,
-                                             4, 4, 3 }),
-             "max(2) b col_major")
-    local a,b = m:max(3)
-    check.eq(a, matrix.col_major(2, 4, 1, { 18, 8, 16, 24,
-                                            15, 17, 21, 23 }),
-             "max(3) a col_major")
-    check.eq(b:to_float(), matrix(2, 4, 1, { 3, 1, 2, 2,
-                                             3, 2, 3, 2 }),
-             "max(3) b col_major")
 end)
 
 T("MinTest", function()
diff --git a/packages/basics/stats/binding/bind_stats.lua.cc b/packages/basics/stats/binding/bind_stats.lua.cc
index 69c545af0..069a248e3 100644
--- a/packages/basics/stats/binding/bind_stats.lua.cc
+++ b/packages/basics/stats/binding/bind_stats.lua.cc
@@ -72,7 +72,7 @@ using namespace Stats;
   if (N > 0) {
     if (dest == 0) {
       int dims[2] = { N, static_cast<int>(obj->getSize()) };
-      dest = new MatrixFloat(2, dims, CblasColMajor);
+      dest = new MatrixFloat(2, dims);
     }
     else {
       if (N != dest->getDimSize(0))
@@ -97,7 +97,7 @@ using namespace Stats;
     LUABIND_GET_PARAMETER(1, float, xf);
     dest = 0;
     int dims[2] = {1,1};
-    x = new MatrixFloat(2, dims, CblasColMajor);
+    x = new MatrixFloat(2, dims);
     (*x)(0,0) = xf;
   }
   IncRef(x);
@@ -119,7 +119,7 @@ using namespace Stats;
     LUABIND_GET_PARAMETER(1, float, xf);
     dest = 0;
     int dims[2] = {1,1};
-    x = new MatrixFloat(2, dims, CblasColMajor);
+    x = new MatrixFloat(2, dims);
     (*x)(0,0) = xf;
   }
   IncRef(x);
@@ -141,7 +141,7 @@ using namespace Stats;
     LUABIND_GET_PARAMETER(1, float, xf);
     grads = 0;
     int dims[2] = {1,1};
-    x = new MatrixFloat(2, dims, CblasColMajor);
+    x = new MatrixFloat(2, dims);
     (*x)(0,0) = xf;
   }
   IncRef(x);
@@ -196,8 +196,8 @@ using namespace Stats;
     LUABIND_GET_PARAMETER(1, float, lowf);
     LUABIND_GET_PARAMETER(2, float, highf);
     int dims[1] = { 1 };
-    low  = new MatrixFloat(1, dims, CblasColMajor);
-    high = new MatrixFloat(1, dims, CblasColMajor);
+    low  = new MatrixFloat(1, dims);
+    high = new MatrixFloat(1, dims);
     (*low)(0)  = lowf;
     (*high)(0) = highf;
   }
@@ -277,7 +277,7 @@ using namespace Stats;
       LUABIND_GET_PARAMETER(1, float, mu);
       LUABIND_GET_PARAMETER(2, float, sigma);
       int dims[1] = { 1 };
-      mean = new MatrixFloat(1, dims, CblasColMajor);
+      mean = new MatrixFloat(1, dims);
       (*mean)(0) = mu;
       cov = SparseMatrixFloat::diag(1, sigma);
       DiagonalNormalDistribution *obj = new DiagonalNormalDistribution(mean, cov);
@@ -359,11 +359,11 @@ using namespace Stats;
     LUABIND_GET_PARAMETER(2, float, sigma);
     LUABIND_GET_OPTIONAL_PARAMETER(3, float, loc, 0.0f);
     int dims[1] = { 1 };
-    mean = new MatrixFloat(1, dims, CblasColMajor);
+    mean = new MatrixFloat(1, dims);
     (*mean)(0) = mu;
     cov = SparseMatrixFloat::diag(1, sigma);
     if (loc != 0.0f) {
-      location = new MatrixFloat(1, dims, CblasColMajor);
+      location = new MatrixFloat(1, dims);
       (*location)(0) = loc;
     }
     else location = 0;
@@ -404,7 +404,7 @@ using namespace Stats;
     float lambdaf;
     LUABIND_GET_PARAMETER(1, float, lambdaf);
     int dims[1] = {1};
-    lambda = new MatrixFloat(1, dims, CblasColMajor);
+    lambda = new MatrixFloat(1, dims);
     AprilMath::MatrixExt::Operations::matFill(lambda, lambdaf);
   }
   obj = new ExponentialDistribution(lambda);
@@ -437,9 +437,9 @@ using namespace Stats;
     LUABIND_GET_PARAMETER(1, float, alphaf);
     LUABIND_GET_PARAMETER(2, float, betaf);
     int dims[1] = {1};
-    alpha = new MatrixFloat(1, dims, CblasColMajor);
+    alpha = new MatrixFloat(1, dims);
     (*alpha)(0) = alphaf;
-    beta = new MatrixFloat(1, dims, CblasColMajor);
+    beta = new MatrixFloat(1, dims);
     (*beta)(0) = betaf;
   }
   obj = new BetaDistribution(alpha, beta);
@@ -474,9 +474,9 @@ using namespace Stats;
     LUABIND_GET_PARAMETER(1, uint, ni);
     LUABIND_GET_PARAMETER(2, float, pf);
     int dims[1] = {1};
-    n = new MatrixFloat(1, dims, CblasColMajor);
+    n = new MatrixFloat(1, dims);
     (*n)(0) = static_cast<float>(ni);
-    p = new MatrixFloat(1, dims, CblasColMajor);
+    p = new MatrixFloat(1, dims);
     (*p)(0) = pf;
   }
   obj = new BinomialDistribution(n, p);
diff --git a/packages/basics/stats/c_src/exponential_distribution.cc b/packages/basics/stats/c_src/exponential_distribution.cc
index ab4aad03a..ff8493811 100644
--- a/packages/basics/stats/c_src/exponential_distribution.cc
+++ b/packages/basics/stats/c_src/exponential_distribution.cc
@@ -40,8 +40,6 @@ namespace Stats {
     lambda(lambda), inv_lambda(0) {
     if (lambda->getNumDim() != 1)
       ERROR_EXIT(128, "Expected one-dimensional lambda matrix\n");
-    if (lambda->getMajorOrder() != CblasColMajor)
-      ERROR_EXIT(128, "Expected col_major matrix\n");
     IncRef(lambda);
     updateParams();
   }
@@ -132,8 +130,8 @@ namespace Stats {
   char *ExponentialDistribution::toLuaString(bool is_ascii) const {
     SharedPtr<CStringStream> stream(new CStringStream());
     stream->put("stats.dist.exponential(matrix.fromString[[");
-    AprilUtils::HashTableOptions options;
-    lambda->write( stream.get(), options.putBoolean("ascii", is_ascii) );
+    AprilUtils::LuaTable options;
+    lambda->write( stream.get(), options.put("ascii", is_ascii) );
     stream->put("]])\0",4); // forces a \0 at the end of the buffer
     return stream->releaseString();
   }
diff --git a/packages/basics/stats/c_src/normal_distribution.cc b/packages/basics/stats/c_src/normal_distribution.cc
index 2bc37d994..0ef450b79 100644
--- a/packages/basics/stats/c_src/normal_distribution.cc
+++ b/packages/basics/stats/c_src/normal_distribution.cc
@@ -51,9 +51,6 @@ namespace Stats {
       ERROR_EXIT(128, "Expected squared bi-dimensional cov matrix\n");
     if (mean->getDimSize(0) != cov->getDimSize(0))
       ERROR_EXIT(128, "Expected mean and cov matrix with same size\n");
-    if (mean->getMajorOrder() != CblasColMajor ||
-        cov->getMajorOrder() != CblasColMajor)
-      ERROR_EXIT(128, "Expected col_major matrices\n");
     IncRef(mean);
     IncRef(cov);
     updateParams();
@@ -104,7 +101,7 @@ namespace Stats {
                                                 MatrixFloat *result) {
     SharedPtr<MatrixFloat> diff( x->clone() );
     int dims[1] = { x->getDimSize(1) };
-    SharedPtr<MatrixFloat> mult( new MatrixFloat(1, dims, CblasColMajor) );
+    SharedPtr<MatrixFloat> mult( new MatrixFloat(1, dims) );
     // over all samples (bunch_size)
     MatrixFloat::iterator result_it(result->begin());
     SharedPtr<MatrixFloat> diff_row;
@@ -145,12 +142,12 @@ namespace Stats {
   
   char *GeneralNormalDistribution::toLuaString(bool is_ascii) const {
     SharedPtr<CStringStream> stream(new CStringStream());
-    AprilUtils::HashTableOptions options;
-    options.putBoolean("ascii", is_ascii);
+    AprilUtils::LuaTable options;
+    options.put("ascii", is_ascii);
     stream->put("stats.dist.normal(matrix.fromString[[");
-    mean->write(stream.get(), &options);
+    mean->write(stream.get(), options);
     stream->put("]], matrix.fromString[[");
-    cov->write(stream.get(), &options);
+    cov->write(stream.get(), options);
     stream->put("]])\0",4);
     return stream->releaseString();
   }
@@ -167,8 +164,6 @@ namespace Stats {
       ERROR_EXIT(128, "Expected squared bi-dimensional cov matrix\n");
     if (mean->getDimSize(0) != cov->getDimSize(0))
       ERROR_EXIT(128, "Expected mean and cov matrix with same size\n");
-    if (mean->getMajorOrder() != CblasColMajor)
-      ERROR_EXIT(128, "Expected col_major mean matrix\n");
     IncRef(mean);
     IncRef(cov);
     updateParams();
@@ -220,7 +215,8 @@ namespace Stats {
     for (MatrixFloat::iterator z_it = z->begin(); z_it != z->end(); ++z_it) {
       *z_it = static_cast<float>(rng->randNorm(0.0, 1.0));
     }
-    matSparseMM(result, CblasTrans, CblasTrans, CblasTrans,
+    SharedPtr<MatrixFloat> rT(result->transpose());
+    matSparseMM(rT.get(), CblasTrans, CblasTrans,
                 1.0f, L, z.get(), 0.0f);
     SharedPtr<MatrixFloat> result_row;
     for (int i=0; i<result->getDimSize(0); ++i) {
@@ -233,7 +229,7 @@ namespace Stats {
                                                  MatrixFloat *result) {
     SharedPtr<MatrixFloat> diff( x->clone() );
     int dims[1] = { x->getDimSize(1) };
-    SharedPtr<MatrixFloat> mult( new MatrixFloat(1, dims, CblasColMajor) );
+    SharedPtr<MatrixFloat> mult( new MatrixFloat(1, dims) );
     // over all samples (bunch_size)
     MatrixFloat::iterator result_it(result->begin());
     SharedPtr<MatrixFloat> diff_row;
@@ -274,12 +270,12 @@ namespace Stats {
   
   char *DiagonalNormalDistribution::toLuaString(bool is_ascii) const {
     SharedPtr<CStringStream> stream(new CStringStream());
-    AprilUtils::HashTableOptions options;
-    options.putBoolean("ascii", is_ascii);
+    AprilUtils::LuaTable options;
+    options.put("ascii", is_ascii);
     stream->put("stats.dist.normal(matrix.fromString[[");
-    mean->write(stream.get(), &options);
+    mean->write(stream.get(), options);
     stream->put("]], matrix.sparse.fromString[[");
-    cov->write(stream.get(), &options);
+    cov->write(stream.get(), options);
     stream->put("]])\0",4); // forces a \0 at the end of the buffer
     return stream->releaseString();
   }
@@ -402,14 +398,14 @@ namespace Stats {
   
   char *GeneralLogNormalDistribution::toLuaString(bool is_ascii) const {
     SharedPtr<CStringStream> stream(new CStringStream());
-    AprilUtils::HashTableOptions options;
-    options.putBoolean("ascii", is_ascii);
+    AprilUtils::LuaTable options;
+    options.put("ascii", is_ascii);
     stream->put("stats.dist.lognormal(matrix.fromString[[");
-    mean->write(stream.get(), &options);
+    mean->write(stream.get(), options);
     stream->put("]], matrix.fromString[[");
-    cov->write(stream.get(), &options);
+    cov->write(stream.get(), options);
     stream->put("]], matrix.fromString[[");
-    location->write(stream.get(), &options);
+    location->write(stream.get(), options);
     stream->put("]])\0",4); // forces a \0 at the end of the buffer
     return stream->releaseString();
   }
@@ -482,14 +478,14 @@ namespace Stats {
   
   char *DiagonalLogNormalDistribution::toLuaString(bool is_ascii) const {
     SharedPtr<CStringStream> stream(new CStringStream());
-    AprilUtils::HashTableOptions options;
-    options.putBoolean("ascii", is_ascii);
+    AprilUtils::LuaTable options;
+    options.put("ascii", is_ascii);
     stream->put("stats.dist.lognormal(matrix.fromString[[");
-    mean->write(stream.get(), &options);
+    mean->write(stream.get(), options);
     stream->put("]], matrix.sparse.fromString[[");
-    cov->write(stream.get(), &options);
+    cov->write(stream.get(), options);
     stream->put("]], matrix.fromString[[");
-    location->write(stream.get(), &options);
+    location->write(stream.get(), options);
     stream->put("]])\0",4); // forces a \0 at the end of the buffer
     return stream->releaseString();
   }
diff --git a/packages/basics/stats/c_src/statistical_distribution.h b/packages/basics/stats/c_src/statistical_distribution.h
index b1ce5402c..b334beb35 100644
--- a/packages/basics/stats/c_src/statistical_distribution.h
+++ b/packages/basics/stats/c_src/statistical_distribution.h
@@ -24,7 +24,6 @@
 #include "error_print.h"
 #include "logbase.h"
 #include "matrixFloat.h"
-#include "matrixFloatSet.h"
 #include "MersenneTwister.h"
 #include "referenced.h"
 
@@ -36,9 +35,8 @@ namespace Stats {
    * statistical distributions and defines a private API for new classes
    * derivation.
    
-   * All the methods work with col_major matrices (like ANN components), and
-   * with two-dimensional matrices where first dimension is the bunch_size (like
-   * ANN components).
+   * All the methods work with two-dimensional matrices whose first dimension
+   * is the bunch_size (like ANN components).
    */
   class StatisticalDistributionBase : public Referenced {
     unsigned int size;
@@ -105,13 +103,11 @@ namespace Stats {
                                 Basics::MatrixFloat *result=0) {
       int dims[2] = { 1, static_cast<int>(size) };
       if (result == 0) {
-        result = new Basics::MatrixFloat(2, dims, CblasColMajor);
+        result = new Basics::MatrixFloat(2, dims);
       }
       else if (result->getNumDim() != 2 || result->getDimSize(1) != static_cast<int>(size))
         ERROR_EXIT1(128, "Incorrect result matrix size, expected "
                     "bi-dimensional matrix with Nx%u shape\n", size);
-      else if (result->getMajorOrder() != CblasColMajor)
-        ERROR_EXIT(128, "Expected col_major order in result matrix\n");
       // virtual call
       privateSample(rng, result);
       return result;
@@ -131,17 +127,13 @@ namespace Stats {
       if (x->getNumDim() != 2 || x->getDimSize(1) != static_cast<int>(size))
         ERROR_EXIT1(128, "Incorrect x matrix size, expected bi-dimensional "
                     "matrix with Nx%u shape\n", size);
-      if (x->getMajorOrder() != CblasColMajor)
-        ERROR_EXIT(128, "Expected col_major in x matrix\n");
       int dims[1] = { x->getDimSize(0) };
       if (result == 0) {
-        result = new Basics::MatrixFloat(1, dims, CblasColMajor);
+        result = new Basics::MatrixFloat(1, dims);
       }
       else if (result->getNumDim() != 1 || result->getDimSize(0) != dims[0])
         ERROR_EXIT1(128, "Incorrect result matrix size, expected "
                     "one-dimensional matrix with %d size\n", dims[0]);
-      else if (result->getMajorOrder() != CblasColMajor)
-        ERROR_EXIT(128, "Expected col_major order in result matrix\n");
       // virtual call
       privateLogpdf(x, result);
       return result;
@@ -161,17 +153,13 @@ namespace Stats {
       if (x->getNumDim() != 2 || x->getDimSize(1) != static_cast<int>(size))
         ERROR_EXIT1(128, "Incorrect x matrix size, expected bi-dimensional "
                     "matrix with Nx%u shape\n", size);
-      if (x->getMajorOrder() != CblasColMajor)
-        ERROR_EXIT(128, "Expected col_major in x matrix\n");
       int dims[1] = { x->getDimSize(0) };
       if (result == 0) {
-        result = new Basics::MatrixFloat(1, dims, CblasColMajor);
+        result = new Basics::MatrixFloat(1, dims);
       }
       else if (result->getNumDim() != 1 || result->getDimSize(0) != dims[0])
         ERROR_EXIT1(128, "Incorrect result matrix size, expected "
                     "one-dimensional matrix with %d size\n", dims[0]);
-      else if (result->getMajorOrder() != CblasColMajor)
-        ERROR_EXIT(128, "Expected col_major order in result matrix\n");
       // virtual call
       privateLogcdf(x, result);
       return result;
@@ -192,19 +180,15 @@ namespace Stats {
       if (x->getNumDim() != 2 || x->getDimSize(1) != static_cast<int>(size))
         ERROR_EXIT1(128, "Incorrect x matrix size, expected bi-dimensional "
                     "matrix with Nx%u shape\n", size);
-      if (x->getMajorOrder() != CblasColMajor)
-        ERROR_EXIT(128, "Expected col_major in x matrix\n");
       const int *dims = x->getDimPtr();
       if (grads == 0) {
-        grads = new Basics::MatrixFloat(2, dims, CblasColMajor);
+        grads = new Basics::MatrixFloat(2, dims);
         AprilMath::MatrixExt::Operations::matZeros(grads);
       }
       else if (grads->getNumDim() != 2 || grads->getDimSize(0) != dims[0] ||
                grads->getDimSize(1) != dims[1])
         ERROR_EXIT2(128, "Incorrect grads matrix size, expected "
                     "bidimensional matrix with %dx%d size\n", dims[0], dims[1]);
-      else if (grads->getMajorOrder() != CblasColMajor)
-        ERROR_EXIT(128, "Expected col_major order in grads matrix\n");
       // virtual call
       IncRef(grads);
       privateLogpdfDerivative(x, grads);
diff --git a/packages/basics/stats/c_src/uniform_distribution.cc b/packages/basics/stats/c_src/uniform_distribution.cc
index 0341db4e1..07ed81fd4 100644
--- a/packages/basics/stats/c_src/uniform_distribution.cc
+++ b/packages/basics/stats/c_src/uniform_distribution.cc
@@ -38,9 +38,6 @@ namespace Stats {
     IncRef(high);
     if (!low->sameDim(high))
       ERROR_EXIT(128, "Expected same sizes in low and high matrices\n");
-    if (low->getMajorOrder() != CblasColMajor ||
-        high->getMajorOrder() != CblasColMajor)
-      ERROR_EXIT(128, "Expected col_major matrices\n");
     MatrixFloat::const_iterator low_it(low->begin());
     MatrixFloat::const_iterator high_it(high->begin());
     while(low_it != low->end()) {
@@ -140,12 +137,12 @@ namespace Stats {
 
   char *UniformDistribution::toLuaString(bool is_ascii) const {
     SharedPtr<CStringStream> stream(new CStringStream());
-    AprilUtils::HashTableOptions options;
-    options.putBoolean("ascii", is_ascii);
+    AprilUtils::LuaTable options;
+    options.put("ascii", is_ascii);
     stream->put("stats.dist.uniform(matrix.fromString[[");
-    low->write(stream.get(), &options);
+    low->write(stream.get(), options);
     stream->put("]], matrix.fromString[[");
-    high->write(stream.get(), &options);
+    high->write(stream.get(), options);
     stream->put("]])\0",4);
     return stream->releaseString();
   }
diff --git a/packages/basics/stats/lua_src/pca.lua b/packages/basics/stats/lua_src/pca.lua
index f75315c13..2fcba5538 100644
--- a/packages/basics/stats/lua_src/pca.lua
+++ b/packages/basics/stats/lua_src/pca.lua
@@ -1,4 +1,15 @@
 stats = get_table_from_dotted_string("stats", true)
+stats.pca = stats.pca or {}
+stats.zca = stats.zca or {}
+
+april_set_doc(stats.pca,{
+                class = "namespace",
+                summary = "Table with PCA related stuff",
+})
+april_set_doc(stats.zca,{
+                class = "namespace",
+                summary = "Table with ZCA related stuff",
+})
 
 local function normalize(m,norm)
   local norm = norm or m:norm2()
@@ -13,11 +24,12 @@ end
 -------------------------------------------------------------------------------
 
--- WARNING IN PLACE OPERATION
+-- NOT IN-PLACE (X is cloned before being centered)
-function stats.mean_centered_by_pattern(X)
+function stats.pca.center_by_pattern(X)
+  local X=X:clone()
   local dim = X:dim()
   assert(#dim == 2, "Expected a bi-dimensional matrix")
   local M,N = table.unpack(dim)
-  -- U is the mean over all rows
+  -- U is the mean over all columns
   local U,auxX = X:sum(2):rewrap(M):scal(1/N)
   -- X is centered subtracting by -U
   for i=1,X:dim(2) do auxX=X:select(2,i,auxX):axpy(-1, U) end
@@ -27,9 +39,9 @@ end
 -------------------------------------------------------------------------------
 
 -- NOT IN-PLACE
-function stats.pca_whitening(X,U,S,epsilon)
+function stats.pca.whitening(X,U,S,epsilon)
   local epsilon = epsilon or 0.0
-  local result = matrix[X:get_major_order()](X:dim(1), S:dim(1))
+  local result = matrix(X:dim(1), S:dim(1))
   result:gemm{ A=X, B=U, trans_B=false, beta=0, alpha=1}
   for v,i in S:iterate() do
     result:select(2,i):scal( 1/math.sqrt(v + epsilon) )
@@ -38,60 +50,100 @@ function stats.pca_whitening(X,U,S,epsilon)
 end
 
 -- WARNING IN PLACE OPERATION
-function stats.zca_whitening(X,U,S,epsilon)
-  local aux = stats.pca_whitening(X,U,S,epsilon)
+function stats.zca.whitening(X,U,S,epsilon)
+  local aux = stats.pca.whitening(X,U,S,epsilon)
   X:gemm{ A=aux, B=U, trans_B=true, beta=0, alpha=1 }
   return X
 end
 
 -- compute PCA mass
-function stats.pca_mass(S,mass)
-  local acc = 0
-  local acc_mat = matrix.col_major(S:size())
-  for v,i in S:iterate() do
-    acc=acc + v
-    acc_mat:set(i, acc)
+stats.pca.mass =
+  april_doc{
+    class = "function",
+    summary = "Computes PCA mass probability given S diagonal sparse matrix",
+    params = { "S diagonal sparse matrix" },
+    outputs = { "A matrix with probability mass" },
+  } ..
+  function(S)
+    local acc = 0
+    local acc_mat = S:clone()
+    for v,i in S:iterate() do acc=acc + v end
+    acc_mat:scal(1.0/acc)
+    return acc_mat
   end
-  acc_mat:scal(1.0/acc)
-  return acc_mat
-end
 
 -- show PCA threshold
-function stats.pca_threshold(S,mass)
-  local mass = mass or 0.99
-  local acc = 0
-  local sum = S:sum()
-  local acc_th,th,vth = 0,1
-  for v,i in S:iterate() do
-    acc=acc + v
-    if acc/sum < mass then vth,acc_th,th=v,acc,i end
+stats.pca.threshold =
+  april_doc{
+    class = "function",
+    summary = "Computes the PCA threshold for a given mass probability",
+    params = {
+      "The S diagonal sparse matrix with singular values",
+      "A number in [0,1] range indicating the mass probability [optional]. 0.99 by default",
+    },
+    outputs = {
+      "The number of components",
+      "The threshold singular value",
+      "The accumulated probability",
+    },
+  } ..
+  function(S,mass)
+    local mass = mass or 0.99
+    local acc = 0
+    local sum = S:sum()
+    local acc_th,th,vth = 0,1
+    for v,i in S:iterate() do
+      acc=acc + v
+      vth,acc_th,th=v,acc,i
+      if acc/sum > mass then break end
+    end
+    assert(acc_th > 0, "The probability mass needs to be larger")
+    return th,vth,acc_th/sum
   end
-  assert(acc_th > 0, "The probability mass needs to be larger")
-  return th,vth,acc_th/sum
-end
 
 -------------------------------------------------------------------------------
 
 -- PCA algorithm based on covariance matrix and SVD decomposition the matrix Xc
 -- must be zero mean centerd for each pattern. Patterns are ordered by rows.
-function stats.pca(Xc)
-  local dim    = Xc:dim()
-  assert(#dim == 2, "Expected a bi-dimensional matrix")
-  local aux = Xc:sum(2):scal(1/Xc:dim(2)):rewrap(Xc:dim(1))
-  local M,N    = table.unpack(dim)
-  local sigma  = matrix.col_major(N,N)
-  sigma:gemm{ A=Xc, B=Xc,
-	      trans_A=true,
-	      trans_B=false,
-	      alpha=1/M,
-	      beta=0, }
-  local U,S,VT = sigma:svd()
-  return U,S,VT
-end
+stats.pca =
+  april_doc{
+    class = "function",
+    summary = "Computes PCA using SVD decomposition of covariance matrix",
+    description = { "Data is ordered by rows, features by columns.",
+                    "If not centered, the data is centered by columns instead",
+                    "that by rows (using stats.pca.center_by_pattern function",
+                    "instead of stats.center function)." },
+    params = {
+      "A 2D matrix",
+      "An [optional] table with 'centered' boolean, by default centered=false",
+    },
+    outputs = {
+      "U matrix with left singular vectors",
+      "S diagonal sparse matrix with  singular values",
+      "VT transpose of right singular vectors",
+      "In case centered=false, fourth result is the center vector [optional]",
+    },
+  }..
+  setmetatable(stats.pca, {
+                 __call = function(self, Xc, params)
+                   local params = get_table_fields(
+                     {
+                       centered = { type_match = "boolean", default = nil },
+                     }, params)
+                   assert(#Xc:dim() == 2, "Expected a bi-dimensional matrix")
+                   local center
+                   if not params.centered then
+                     Xc,center = stats.pca.center_by_pattern(Xc)
+                   end
+                   local sigma = stats.cov(Xc,{ centered=true })
+                   local U,S,VT = sigma:svd()
+                   return U,S,VT,center
+                 end
+  })
 
 -------------------------------------------------------------------------------
 
-stats.iterative_pca =
+stats.pca.gs_pca =
   april_doc{
     class = "function",
     summary = "Computes PCA using GS-PCA (iterative PCA algorithm)",
@@ -142,10 +194,9 @@ stats.iterative_pca =
     if M < N then
       print("# Warning, M < N, probably matrix need to be transposed")
     end
-    local major_order = X:get_major_order()
-    local T = matrix[major_order](M,K):zeros() -- left eigenvectors
-    local P = matrix[major_order](N,K):zeros() -- right eigenvectors
-    local L = matrix[major_order](K):zeros()   -- eigenvalues
+    local T = matrix(M,K):zeros() -- left eigenvectors
+    local P = matrix(N,K):zeros() -- right eigenvectors
+    local L = matrix(K):zeros()   -- eigenvalues
     local R = X:clone()
     local U = R:sum(2):scal(1/R:dim(2)):rewrap(R:dim(1))
     assert( math.abs(U:sum() / U:size()) < 1e-03,
diff --git a/packages/basics/stats/lua_src/statistics.lua b/packages/basics/stats/lua_src/statistics.lua
index c8f8c7240..e125bcb60 100644
--- a/packages/basics/stats/lua_src/statistics.lua
+++ b/packages/basics/stats/lua_src/statistics.lua
@@ -1,8 +1,296 @@
 stats = stats or {} -- global environment
-local mean_var,mean_var_methods = class("stats.mean_var")
-stats.mean_var = mean_var -- global environment
+stats.running = stats.running or {}
 
-april_set_doc(stats.mean_var, {
+april_set_doc(stats.running,{
+                class = "namespace",
+                summary = "Table with running statistics classes",
+})
+
+-----------------------------------------------------------------------------
+
+local mop = matrix.op
+local sdiag = matrix.sparse.diag
+
+-- x must be a vector or a 2D matrix; returns the centered data and the mean
+local function center(x)
+  local x_dim = x:dim()
+  local N = x_dim[1] -- size of the first dimension
+  local x_mu,mu
+  if #x_dim == 1 then
+    mu   = x:sum()/N -- vector case: one mean for all the elements
+    x_mu = mu
+  else
+    mu = x:sum(1):scal(1/N) -- sum over dimension 1 scaled by 1/N
+    x_mu = mop.repmat(mu,N,1) -- presumably tiles mu N times to match the shape of x
+  end
+  return x - x_mu,mu
+end
+
+stats.standardize =
+  april_doc{
+    class = "function",
+    summary = "Standardize data to have zero-mean one-variance",
+    description = "Data is ordered by rows, features by columns.",
+    params = { "A 2D matrix" },
+    outputs = { "Another new allocated matrix", "The mean of every column", "The variance of every column" },
+  } ..
+  function(x)
+    assert(#x:dim() == 2, "Needs a 2D matrix")
+    local N = x:dim(1)
+    local sigma2,mu = stats.var(x,1) -- variance and mean computed over dimension 1
+    local x = x:clone() -- the caller's matrix is left untouched
+    x:axpy(-1.0, mop.repmat(mu,N,1)) -- subtract the mean
+    x:cmul(mop.repmat(1/sigma2:clone():sqrt(),N,1)) -- clone: sqrt() looks in-place, keep sigma2 as variance
+    return x,mu,sigma2
+  end
+
+stats.center =
+  april_doc{
+    class = "function",
+    summary = "Centers data by rows, computing mean of every column",
+    description = "Data is ordered by rows, features by columns.",
+    params = { "A 2D matrix" },
+    outputs = { "Another new allocated matrix", "The mean of every column" },
+  } ..
+  function(x)
+    assert(#x:dim() == 2, "Needs a 2D matrix")
+    return center(x) -- forwards both results of the local helper: centered data and mean
+  end
+
+stats.var =
+  april_doc{
+    class = "function",
+    summary = "Computes variance over a dimension",
+    params = { "A matrix",
+               "A dimension number [optional].", },
+    outputs = {
+      "A new allocated matrix or a number if not dim given",
+      "The mean used to center the data"
+    },
+  } ..
+  function(x,dim)
+    local mean = stats.amean(x,dim) -- mean over dim, or over all the elements when dim is nil
+    local x,x_row,sz = x:clone() -- work on a copy; x_row and sz start as nil
+    if dim then
+      sz = x:dim(dim)
+      for i=1,sz do x_row=x:select(dim,i,x_row):axpy(-1.0, mean) end -- presumably subtracts mean from each slice
+    else
+      x:scalar_add(-mean)
+      sz = x:size()
+    end
+    return x:pow(2):sum(dim)/(sz-1),mean -- squared deviations summed and divided by sz-1
+  end
+
+stats.cov =
+  april_doc{
+    class = "function",
+    summary = "Compute covariance matrix of two matrices.",
+    description = "Data is ordered by rows, features by columns.",
+    params = {
+      "A 2D matrix or a vector (x)",
+      "Another 2D matrix or a vector (y)",
+      "An [optional] table with 'centered' boolean, 'true_mean' boolean",
+    },
+    outputs = { "Covariance matrix" }
+  } ..
+  april_doc{
+    class = "function",
+    summary = "Compute covariance matrix.",
+    description = "Data is ordered by rows, features by columns.",
+    params = {
+      "A 2D matrix or a vector (x)",
+      "An [optional] table with 'centered' boolean, 'true_mean' boolean",
+    },
+    outputs = { "Covariance matrix",
+                "The x center vector if not centered flag [optional]",
+                "The y center vector if not centered flag [optional]" }
+  } ..
+  function(x,...)
+    local y,params = ...
+    if type(y) == "table" or not y then y,params = x,y end -- one-matrix call: y is x, 2nd arg is params
+    collectgarbage("collect")
+    assert(class.is_a(x,matrix) and class.is_a(y,matrix),
+           "Needs at least two matrix arguments")
+    local params = get_table_fields(
+      {
+        centered = { type_match = "boolean", default = nil },
+        true_mean = { type_match = "boolean", default =nil },
+      }, params)
+    assert(not params.true_mean or params.centered,
+           "true_mean=true is mandatory of centered=true")
+    local x_dim,y_dim = x:dim(),y:dim()
+    assert((#x_dim <= 2) and (#y_dim <= 2), "Needs 2D matrices or vectors")
+    assert(x_dim[1] == y_dim[1] and x_dim[2] == y_dim[2],
+           "Require same shape matrices")
+    local mu_x,mu_y -- stay nil when the data is given as already centered
+    local N,M = table.unpack(x_dim) -- M is nil for a vector
+    if not params.centered then
+      local xold = x -- original x, needed to detect the y==x case once x is replaced
+      x,mu_x = center(x)
+      if rawequal(xold,y) then y,mu_y = x,mu_x else y,mu_y = center(y) end -- do not center x twice
+    end
+    local sz = N-1 -- sample normalization by default
+    if params.true_mean then sz = N end -- the mean is known exactly: divide by N
+    return (x:transpose() * y):scal(1/sz):rewrap(M or 1,M or 1),mu_x,mu_y
+  end
+
+stats.cor =
+  april_doc{
+    class = "function",
+    summary = "Compute correlation matrix of two matrices.",
+    description = "Data is ordered by rows, features by columns.",
+    params = {
+      "A 2D matrix or a vector (x)",
+      "Another 2D matrix or a vector (y)",
+      "An [optional] table with 'centered' boolean",
+    },
+    outputs = { "Correlation matrix" }
+  } ..
+  april_doc{
+    class = "function",
+    summary = "Compute correlation matrix.",
+    description = "Data is ordered by rows, features by columns.",
+    params = {
+      "A 2D matrix or a vector (x)",
+      "An [optional] table with 'centered' boolean",
+    },
+    outputs = { "Correlation matrix",
+                "The x center vector if not centered flag [optional]",
+                "The y center vector if not centered flag [optional]" }
+  } ..
+  function(x,...)
+    local y,params = ...
+    if type(y) == "table" or not y then y,params = x,y end -- one-matrix call: y is x, 2nd arg is params
+    local params = params or {}
+    local mu_x,mu_y -- stay nil when the data is given as already centered
+    if not params.centered then
+      local xold = x -- original x, needed to detect the y==x case once x is replaced
+      x,mu_x = center(x)
+      if rawequal(xold,y) then y,mu_y = x,mu_x else y,mu_y = center(y) end
+    end
+    local function cstd(m) return sdiag((m^2):sum(1):scal(1/(m:dim(1)-1)):sqrt():div(1):squeeze()) end
+    local sigma = stats.cov(x,y,{ centered=true }) -- x and y are centered here, cov must not center again
+    local sx = cstd(x)
+    local sy = rawequal(x,y) and sx or cstd(y) -- reuse sx when both arguments are the same matrix
+    return sx * sigma * sy,mu_x,mu_y
+  end
+
+stats.acf =
+  april_doc{
+    class = "function",
+    summary = "Compute auto-correlation of one or more series.",
+    description = "Data is ordered by rows, series by columns.",
+    params = {
+      "A 2D matrix or a vector (x)",
+      { "An [optional] table with 'lag_max' number,",
+        "'lag_step' number, 'lag_start' number,",
+        "'cor' function (one of stats.cor [default], stats.cov)." },
+    },
+    outputs = { "A matrix with auto-correlation of the series",
+                "A matrixInt32 with lag values" },
+  } ..
+  function(x,params)
+    assert(class.is_a(x, matrix), "Needs a matrix argument")
+    local x_dim = x:dim()
+    assert(x_dim[1] > 1, "Needs two or more rows")
+    assert(#x_dim <= 2, "Requires 2D matrix or a vector")
+    local params = get_table_fields(
+      {
+        lag_max = { type_match = "number", default = x_dim[1]-2 },
+        lag_step = { type_match = "number", default = 1 },
+        lag_start = { type_match = "number", default = 1 },
+        cor = { type_match = "function", default = stats.cor },
+      }, params)
+    local lag_start,lag_max,lag_step = params.lag_start,params.lag_max,params.lag_step
+    if #x_dim == 1 then x = x:rewrap(x:size(),1) end -- a vector is handled as a single column
+    local N,M = x_dim[1],x:dim(2)
+    local result = matrix(math.floor((lag_max - lag_start) / lag_step) + 1, M) -- one row per lag visited below
+    local acf_func = params.cor
+    for j=1,M do
+      local i=1 -- row of result that receives the next lag
+      for lag = lag_start, lag_max, lag_step do
+        local a,b = x({1,N-lag},j), x({lag+1,N},j) -- column j and the same column shifted by lag rows
+        local y = acf_func(a,b) -- only the first returned value is kept
+        result[{i,j}] = y
+        i=i+1
+      end
+    end
+    local lags = matrixInt32(iterator(range(lag_start,lag_max,lag_step)):table())
+    return result,lags
+  end
+
+-- arithmetic mean: over one dimension when D is given, over all the elements otherwise
+stats.amean =
+  april_doc{
+    class = "function",
+    summary = "Computes the arithmetic mean over a given dimension",
+    params = {
+      "A matrix",
+      "A dimension number [optional]",
+    },
+    outputs = {
+      "A matrix if given a dimension, a number otherwise",
+    },
+  } ..
+  function(m, D)
+    local total = m:sum(D)
+    if not D then
+      -- no dimension given: the whole sum is divided by the element count
+      return total/m:size()
+    end
+    return total:scal(1/m:dim(D))
+  end
+
+-- geometric mean (positive elements): exponential of the mean of the logarithms
+stats.gmean =
+  april_doc{
+    class = "function",
+    summary = "Computes the geometric mean over a given dimension",
+    params = {
+      "A matrix with positive elements",
+      "A dimension number [optional]",
+    },
+    outputs = {
+      "A matrix if given a dimension, a number otherwise",
+    },
+  } ..
+  function(m, D)
+    local log_sum = mop.log(m):sum(D)
+    if not D then
+      -- no dimension given: the summed logarithms are averaged over all the elements
+      return math.exp(log_sum / m:size())
+    end
+    return log_sum:scal(1.0/m:dim(D)):exp()
+  end
+
+-- harmonic mean (non-zero elements): element count over the sum of reciprocals
+stats.hmean =
+  april_doc{
+    class = "function",
+    summary = "Computes the harmonic mean over a given dimension",
+    params = {
+      "A matrix with non-zero elements",
+      "A dimension number [optional]",
+    },
+    outputs = {
+      "A matrix if given a dimension, a number otherwise",
+    },
+  } ..
+  function(m, D)
+    local inv_sum = (1 / m):sum(D)
+    if not D then
+      -- no dimension given: total element count over the summed reciprocals
+      return m:size() / inv_sum
+    end
+    return inv_sum:div( m:dim(D) )
+  end
+
+-----------------------------------------------------------------------------
+
+local mean_var,mean_var_methods = class("stats.running.mean_var")
+stats.running.mean_var = mean_var -- global environment
+
+april_set_doc(stats.running.mean_var, {
 		class       = "class",
 		summary     = "Class to compute mean and variance",
 		description ={
@@ -12,7 +300,7 @@ april_set_doc(stats.mean_var, {
 
 -----------------------------------------------------------------------------
 
-april_set_doc(stats.mean_var, {
+april_set_doc(stats.running.mean_var, {
 		class = "method", summary = "Constructor",
 		description ={
 		  "Constructor of a mean_var object",
@@ -614,25 +902,24 @@ april_set_doc(stats.boot,
 		description= {
 		  "This function is useful to compute confidence intervals",
 		  "by using bootstrapping technique. The function receives",
-		  "a data table or matrix, a function which returns statistics",
-                  "of a sample given an iterator.",
+		  "the population size and a function which returns statistics",
+                  "of a sample.",
 		  "A table with the computation of the post-process function",
 		  "for every repetition will be returned.",
 		},
 		params = {
-		  data = "A table with the data",
+		  size = "Population size",
 		  R = "Number of repetitions, recommended minimum of 1000",
 		  statistic = {
-		    "A function witch receives an iterator and computes",
-                    "statistics (k>=1 statistics) over all the iterator results.",
-                    "The iterator produces a key which is a row in data",
-                    "and a value which is the corresponding row.",
+		    "A function witch receives a matrixInt32 with sample indices and computes",
+                    "statistics (k>=1 statistics) over the sample.",
                     "If k>1, statistic must return a table with the desired",
                     "k statistics."
 		  },
 		  verbose = "True or false",
                   ncores = "Number of cores [optional], by default it is 1",
                   seed = "A random seed [optional], by default it is os.time()",
+                  [2] = "As second parameter it accepts extra arguments for statistic function.",
 		},
 		outputs = {
 		  "A table with the k statistics for every repetition."
@@ -640,10 +927,10 @@ april_set_doc(stats.boot,
 })
 
 -- self is needed because of __call metamethod, but it will be ignored
-local function boot(self,params)
+local function boot(self,params,...)
   local params = get_table_fields(
     {
-      data        = { mandatory = true },
+      size        = { type_match = "number",   mandatory = true, },
       R           = { type_match = "number",   mandatory = true },
       statistic   = { type_match = "function", mandatory = true },
       verbose     = { mandatory = false },
@@ -651,35 +938,19 @@ local function boot(self,params)
       seed        = { mandatory = false, type_match = "number", default = os.time() },
     },
     params)
-  local data        = params.data
+  local extra       = table.pack(...)
+  local size        = params.size
   local repetitions = params.R
   local statistic   = params.statistic
   local ncores      = params.ncores
   local seed        = params.seed
   local get_row,N
-  -- prepare N and get_row function depending in the type of data parameter
-  if type(data) == "table" then
-    N = #data
-    get_row = function(i) return data[i] end
-  elseif class.is_a(data, matrix) or class.is_a(data, matrixInt32) or class.is_a(data, matrixComplex) then
-    N = data:dim(1)
-    local row
-    get_row = function(i) row=data:select(1,i,row) return row end
-  else
-    errro("Incorrect type, needs a table, a matrix, matrixInt32 or matrixComplex")
-  end
-  -- returns an iterator of random samples using rnd random object
-  local make_iterator = function(rnd)
-    local p=0
-    return function()
-      if p<N then p=p+1 j=rnd:randInt(1,p) return j,get_row(j) end
-    end
-  end
   -- resample function executed in parallel using parallel_foreach
   local resample = function(i, id)
     collectgarbage("collect")
     local rnd = random(seed + i - 1)
-    local r,_ = statistic(make_iterator(rnd))
+    local sample = matrixInt32(size):uniform(1,size,rnd)
+    local r,_ = statistic(sample,table.unpack(extra))
     assert(not _, "statistic must return one value (it can be a table")
     assert(type(r) == "number" or type(r) == "table",
            "statistic function must return a number or a table")
@@ -738,10 +1009,10 @@ stats.boot.ci =
 stats.boot.percentil =
   april_doc{
     class = "function",
-    summary = "Returns a percentil value",
+    summary = "Returns a percentil value from bootstrap output",
     description= {
       "This function returns a percentil value",
-      "given the result of stats.boot function and the confidence value.",
+      "given the result of stats.boot function and the percentil number.",
       "It could compute the percentil over a slice of the table.",
     },
     params = {
@@ -780,13 +1051,12 @@ stats.boot.percentil =
 -----------------------------------------------------------------------------
 -----------------------------------------------------------------------------
 
-local pearson,pearson_methods = class("stats.correlation.pearson")
-get_table_from_dotted_string("stats.correlation", true)
-stats.correlation.pearson = pearson
+local pearson,pearson_methods = class("stats.running.pearson")
+stats.running.pearson = pearson
 
 function pearson:constructor(x,y)
-  self.mean_var_x  = stats.mean_var()
-  self.mean_var_y  = stats.mean_var()
+  self.mean_var_x  = stats.running.mean_var()
+  self.mean_var_y  = stats.running.mean_var()
   self.xy_sum      = 0
   if x then self:add(x,y) end
 end
@@ -822,9 +1092,30 @@ end
 
 stats.dist.bernoulli = function(p)
   if class.is_a(p, matrix) then
-    return stats.dist.binomial(matrix.col_major(1,{1}),p)
+    return stats.dist.binomial(matrix(1,{1}),p)
   else
     return stats.dist.binomial(1,p)
   end
 end
 
+-------------------------------------------------------------------------------
+-------------------------------------------------------------------------------
+
+april_set_doc(stats.comb,{
+                class = "function", 
+                summary = "Computes k-combination",
+                params = {
+                  "Total number of elements (n)",
+                  "How many selected elements (k)",
+                },
+                outputs = { "A number with (n over k)" },
+})
+
+stats.mean_var = make_deprecated_function("stats.mean_var", -- old name kept next to the new one
+                                          "stats.running.mean_var",
+                                          stats.running.mean_var) -- presumably warns and forwards; TODO confirm
+
+stats.correlation = {} -- deprecated table, it only holds the old pearson name
+stats.correlation.pearson = make_deprecated_function("stats.correlation.pearson",
+                                                     "stats.running.pearson",
+                                                     stats.running.pearson)
diff --git a/packages/basics/stats/package.lua b/packages/basics/stats/package.lua
index 71e0b744e..53582f201 100644
--- a/packages/basics/stats/package.lua
+++ b/packages/basics/stats/package.lua
@@ -25,8 +25,10 @@
        file={
 	 "test/test_bootstrap.lua",
 	 "test/test_comb.lua",
+	 "test/test_covariance.lua",
 	 "test/test_distributions.lua",
 	 "test/test-gs-pca.lua",
+	 "test/test_means.lua",
 	 "test/test-zca-whitening.lua",
        },
      },
diff --git a/packages/basics/stats/test/test-gs-pca.lua b/packages/basics/stats/test/test-gs-pca.lua
index 2d824066b..3697e5961 100644
--- a/packages/basics/stats/test/test-gs-pca.lua
+++ b/packages/basics/stats/test/test-gs-pca.lua
@@ -3,15 +3,6 @@ local T = utest.test
 --
 local base_dir = string.get_path(arg[0])
 
-function compute_cov(X,dim)
-  local other = 3 - dim
-  local major_order = X:get_major_order()
-  return matrix[major_order](X:dim(dim),X:dim(dim)):gemm{ A=X, B=X,
-							  trans_A=true,
-							  alpha=1/X:dim(other),
-							  beta=0 }
-end
-
 --------------------------------------------------------------------------
 
 local ok,m = pcall(matrix.fromTabFilename, "/tmp/sample.txt.gz")
@@ -34,27 +25,27 @@ end
 
 --------------------------------------------------------------------------
 
-local aR = stats.mean_centered_by_pattern(m:clone("col_major"))
+local aR = stats.pca.center_by_pattern(m:clone())
 
 T("PCATest",
   function()
     local aU,aS,aVT = stats.pca(aR)
 
     -- check regeneration of original covariance matrix
-    local cov = compute_cov(aR, 2)
+    local cov = stats.cov(aR, aR, { centered=true })
     check(function()
-        return cov:equals(aU * aS:to_dense("col_major") * aVT)
+        return cov:equals(aU * aS:to_dense() * aVT)
     end, "Regeneration of covariance matrix")
 
     -- ROTATION
     local amRot = aR * aU
     -- check covariance of rotated data
-    local cov = compute_cov(amRot, 2)
+    local cov = stats.cov(amRot, amRot, { centered=true })
     -- adjusting the data to be between 0 and 1
     for sw in cov:sliding_window():iterate() do sw:adjust_range(0,1) end
     -- the adjusted covariance must be an identity matrix
     -- assert(cov:equals( cov:clone():zeros():diag(1), 0.1 ))
-
+    
     -- U matrix orthogonality check
     local aUmul = aU:clone():gemm{ A=aU, B=aU, trans_B=true,
                                    alpha=1.0, beta=0.0, }
@@ -69,24 +60,24 @@ T("PCATest",
     end, "V orthogonality test")
 
     -- check U matrix with octave computation
-    local refU = matrix.fromTabFilename(base_dir.."data/U.gz", "col_major"):
+    local refU = matrix.fromTabFilename(base_dir.."data/U.gz"):
       abs()
     check(function() return refU:equals(aU:clone():abs(), 0.06) end,
       "U matrix comparison with octave")
 
     -- check V matrix with octave computation
-    local refV = matrix.fromTabFilename(base_dir.."data/V.gz", "col_major"):
+    local refV = matrix.fromTabFilename(base_dir.."data/V.gz"):
       transpose():abs()
     check(function() return refV:equals(aVT:clone():abs(), 0.06) end,
       "V matrix comparison with octave")
 
     -- check S matrix with octave computation
-    local refS = matrix.fromFilename(base_dir.."data/S.gz", "col_major")
+    local refS = matrix.fromFilename(base_dir.."data/S.gz")
     check(function()
         -- FIXME: the last value is weird... we need to remove it for pass the
         -- test (both matrices are of (1:144,1:144)
         return refS:diagonalize()('1:143','1:143'):
-          equals(aS:to_dense("col_major")('1:143','1:143') )
+          equals(aS:to_dense()('1:143','1:143') )
     end,
     "S matrix comparison with octave")
 end)
@@ -97,14 +88,14 @@ end)
 
 T("GS-PCATest",
   function()
-    local aR = stats.mean_centered_by_pattern(m:clone("col_major"))
-    local bT,bP,bR,bV,bS = stats.iterative_pca{ X = aR, K = 144, }
+    local aR = stats.pca.center_by_pattern(m:clone())
+    local bT,bP,bR,bV,bS = stats.pca.gs_pca{ X = aR, K = 144, }
 
     -- check regeneration of original matrix
     check(function() return aR:equals( bT * bP:transpose() + bR ) end)
 
     -- check covariance of rotated data
-    local cov = compute_cov(bT, 2)
+    local cov = stats.cov(bT, bT, { centered=true })
     -- adjusting the data to be between 0 and 1
     for sw in cov:sliding_window():iterate() do sw:adjust_range(0,1) end
     -- the adjusted covariance must be an identity matrix
diff --git a/packages/basics/stats/test/test-zca-whitening.lua b/packages/basics/stats/test/test-zca-whitening.lua
index 0eae03adb..393d5559d 100644
--- a/packages/basics/stats/test/test-zca-whitening.lua
+++ b/packages/basics/stats/test/test-zca-whitening.lua
@@ -12,16 +12,16 @@ local ds = dataset.matrix(m,
 			    orderStep   = {1,0}
 			  })
 local m = ds:toMatrix()
-local aux = stats.mean_centered_by_pattern(m:clone("col_major"))
+local aux = stats.pca.center_by_pattern(m:clone())
 local aU,aS,aVT = stats.pca(aux)
 
 -- PCA THRESHOLD STATISTICS
 T("PCAThresholdTest",
   function()
-    local takeN,eigen_value,prob_mass=stats.pca_threshold(aS, 0.99)
-    check.eq(takeN, 192)
-    check.lt(math.abs(eigen_value-0.01752162), 1e-03)
-    check.lt(math.abs(prob_mass-0.9897367), 1e-03)
+    local takeN,eigen_value,prob_mass=stats.pca.threshold(aS, 0.99)
+    check.eq(takeN, 193)
+    check.number_eq(eigen_value,0.017318)
+    check.number_eq(prob_mass,0.990025)
 end)
 
 local zca_whitening,new
@@ -30,20 +30,20 @@ if ann.components.zca_whitening then
     U=aU,
     S=aS,
     epsilon=0.017,
-    takeN=192,
+    takeN=193,
   }
-  new = zca_whitening:forward(aux):get_matrix()
+  new = zca_whitening:forward(aux)
 end
 
-local new2 = stats.zca_whitening(aux:clone(), aU(':','1:192'),
-				 aS('1:192','1:192'), 0.017)
+local new2 = stats.zca.whitening(aux:clone(), aU(':','1:193'),
+				 aS('1:193','1:193'), 0.017)
 
 if new then
   T("ZCAWhiteningTest",
     function()
       for i=1,new:dim(1) do
-        local d = new(i,':'):clone("row_major"):rewrap(16,16):adjust_range(0,1)
-        local d2 = new2(i,':'):clone("row_major"):rewrap(16,16):adjust_range(0,1)
+        local d = new(i,':'):clone():rewrap(16,16):adjust_range(0,1)
+        local d2 = new2(i,':'):clone():rewrap(16,16):adjust_range(0,1)
         check.eq(d, d2)
         -- ImageIO.write(Image(d), "wop-" .. string.format("%03d",i) .. ".png")
       end
@@ -52,6 +52,6 @@ end
 
 -- PCA FILTERS
 -- for i=1,aU:dim(1) do
---   local d = aU:select(2,i):clone("row_major"):rewrap(16,16):adjust_range(0,1)
+--   local d = aU:select(2,i):clone():rewrap(16,16):adjust_range(0,1)
 --   ImageIO.write(Image(d), "filter-" .. string.format("%03d",i) .. ".png")
 -- end
diff --git a/packages/basics/stats/test/test_bootstrap-output.log b/packages/basics/stats/test/test_bootstrap-output.log
index fe59e719c..bde8fc32f 100644
--- a/packages/basics/stats/test/test_bootstrap-output.log
+++ b/packages/basics/stats/test/test_bootstrap-output.log
@@ -1,1000 +1,1000 @@
--0.099173416414325	1.0451668220883
--0.098400892352358	1.0020156339997
--0.094721095314375	0.95595890804428
--0.087549116258934	1.0115291159222
--0.072949525135802	1.0274507115672
--0.071902029003092	1.0550019486267
--0.071820996517336	0.96207857415103
--0.071725057213935	1.0895223149051
--0.07083359428959	1.0161686036111
--0.070581008649784	0.93918019040868
--0.069920523121135	1.0395533192777
--0.068424635280829	1.0087692575631
--0.067912352426936	1.0090987641921
--0.067496047438062	1.0817760545907
--0.066675529604163	0.97548611997191
--0.066202931865909	1.0590405785124
--0.065885022564883	1.049583193891
--0.065338163275298	1.1091665702362
--0.065004411948577	0.94800815273036
--0.062792658611307	1.0745901618824
--0.060140193829468	1.0053096107444
--0.060022315855092	1.0956475930874
--0.060013438211171	1.0213133702282
--0.059433163380361	1.0946353262324
--0.058701825133759	1.1109662343316
--0.058496427339014	1.0017718199106
--0.058429386471135	0.97454726474096
--0.057912199252041	1.1226515078125
--0.057847528414633	1.0343638179275
--0.057811344908386	1.0262921830711
--0.057799304624309	1.0069081947421
--0.057629068076313	0.9540217326488
--0.05742070273804	0.97105523441595
--0.05702517096443	1.0328976068751
--0.056032341445253	1.0682415531142
--0.055426845187651	1.0550104714073
--0.055236734207057	1.0784094645485
--0.055021721221176	1.0651627684423
--0.054727789374251	0.96388328213133
--0.053934645802181	0.92618405115789
--0.05335472007767	1.0699865384177
--0.052965794493128	1.1159929185845
--0.052877086421755	1.0036373667192
--0.051038331936151	0.98488735939327
--0.05091728319512	1.0811414324082
--0.050888941393849	1.09370599774
--0.050274045433878	1.011584533611
--0.050232149059929	1.0815298053371
--0.049747978789077	1.0116388190055
--0.049550850263437	1.0584831025978
--0.048854539571585	1.0111606873976
--0.048667639608802	0.9908919651846
--0.048442528499904	1.0216292300037
--0.047752703556472	1.0397878163822
--0.047581528090405	1.0539130630526
--0.047461110725154	1.0413758630365
--0.047336934927256	0.96362224971514
--0.047266494192134	1.102647621608
--0.04695467880296	1.1316936048364
--0.046918857316533	1.0282003239372
--0.046903523567744	0.98325505924141
--0.046418980182329	1.0205594401815
--0.046174988198647	0.96426197189158
--0.045589099821764	1.0119222472817
--0.045329794479582	1.060007824876
--0.045112543058728	0.98096639671971
--0.044766645757664	1.0428175895874
--0.044680680726508	1.0491798620698
--0.044558734474343	1.0776907227687
--0.044225606963246	0.98213070631689
--0.043749182823206	1.0420604189759
--0.043206584380241	1.0979794849084
--0.042700242304669	1.0437515153385
--0.042598651238702	1.0595253714892
--0.041672827389055	1.0843322585385
--0.041565534785066	0.95262107988295
--0.041512735217451	1.0159762568097
--0.041192449079926	1.0450793644125
--0.041037512996184	0.98417909428056
--0.040962512568302	1.0648538364464
--0.040897282350289	0.98779215037456
--0.040336170066034	0.90172559183862
--0.040203775184254	1.0888328695872
--0.040176817520013	1.0432507353696
--0.039886406435057	1.0385793659365
--0.039497566749671	1.1103266940618
--0.039246473721234	1.0381799918076
--0.039181565166029	1.0128175365233
--0.038800497941906	1.1152049159257
--0.038729227583168	1.0634245348443
--0.038722367251186	1.06327527843
--0.038017176763059	1.0937155837905
--0.037945722945123	1.0641643677386
--0.037939484742719	1.0417558577224
--0.037905669864737	1.0087298097196
--0.037840262659511	1.0089502083319
--0.037788800876517	1.0116984455204
--0.037602384389705	1.0063961059686
--0.037205894747324	0.94792733701659
--0.037170046207544	0.98932107172102
--0.036872555243307	1.0264804268485
--0.036493546935366	1.1488496840726
--0.036455366850645	0.97744334163377
--0.036273443987352	1.1235531600368
--0.036026611778408	1.0109440014991
--0.035955226456947	1.0822336816232
--0.035851955477506	0.99975541724307
--0.035409788785194	1.0372605190165
--0.03521793235626	1.0671306348151
--0.035128032672626	1.09859501106
--0.035079310468376	1.076055231523
--0.034796545810128	0.97437939825448
--0.034539295579803	0.96007417335012
--0.034529669112847	1.014134536046
--0.034518960212032	1.038304525369
--0.034342706762213	1.0215469348606
--0.034256985866139	1.0110487599173
--0.034159829535566	1.0737404038002
--0.034140507892735	1.0506219505938
--0.034111896716092	1.0987641171471
--0.033957485255869	1.1036411711232
--0.033431479935806	1.0145128676337
--0.0332296878777	0.9886111213292
--0.03316272978426	1.1433545765443
--0.033127878683758	1.0728586644865
--0.033110705969025	1.0791336144292
--0.033107781788906	1.1327202654014
--0.032706886934527	1.0802150715606
--0.032542989673351	1.0995148068099
--0.032514522428026	1.0323623043179
--0.032366537229729	1.0132316133633
--0.032030599878251	1.0714898406705
--0.032019161141088	1.0663941174213
--0.032002833017972	0.95787702358901
--0.031757429187212	1.0553726624
--0.031671065945501	1.0364983754372
--0.031438836051327	1.1008748311312
--0.031395819809367	1.0093867534562
--0.031212431773307	1.0053160450314
--0.030958331257078	1.0854814459277
--0.030696506245976	1.0137077870375
--0.030623763124814	1.1153240948284
--0.030619726899827	1.0466965089746
--0.030457719712835	1.1083998883033
--0.030342890637863	1.136088783799
--0.030234585304634	1.0470541448667
--0.030059981527035	1.051298327338
--0.029978458787333	1.0265713336827
--0.029875115047209	1.0345202570936
--0.029749802290585	1.0075653975858
--0.029689197425863	1.027031823859
--0.029662276165533	1.0478146803109
--0.029480754009733	1.0363395094324
--0.029313713899101	0.97951886053766
--0.029261830690581	1.0382607913082
--0.029228128289794	1.0489950122189
--0.029164691979952	0.97925419643517
--0.028917219585834	0.99612789044887
--0.028799758686443	0.96346935932012
--0.028767497655924	1.0238824903483
--0.028529296144076	0.96593310766018
--0.028501972847052	1.0639506715629
--0.028368481754517	1.0154668790927
--0.028335713417467	1.0086527664073
--0.028322208560352	0.96118913586083
--0.028309306579457	1.0261729169365
--0.02830657641114	1.0471352640043
--0.028278274162873	0.96641407615153
--0.028129903984087	1.0805087940045
--0.027889082869516	1.033351373609
--0.027783627107087	1.1011184674845
--0.027671394692265	0.97271458252103
--0.027630475344186	0.99339305911987
--0.027626348986606	1.002370478023
--0.027548815708123	1.0968817083115
--0.027489694431737	1.0356636474211
--0.027392968011863	1.1202416244956
--0.027302006375863	1.1061806358216
--0.027261145808483	0.98490410108279
--0.027195798556694	0.99670855499079
--0.027010036259205	0.97223775115803
--0.026918360573223	1.0594793241318
--0.026746680700148	1.0195312086802
--0.026632417015284	1.0666633391711
--0.02631541796827	1.0726254736035
--0.026205158418802	1.0147084491794
--0.026120968110117	1.018953930258
--0.026077191978254	1.0928269391664
--0.026003421029984	1.0734225852221
--0.025964799164134	1.1086378079442
--0.025901026188324	1.0465996782042
--0.025642064581621	1.0746530899337
--0.025460912807135	1.1341625097036
--0.025417314789781	0.96012344213433
--0.025385851449285	0.97036274509377
--0.025373337850076	1.1153135736352
--0.025227274690419	1.0686618610592
--0.02518968052475	1.1525654741067
--0.025033837068104	1.0042163473205
--0.024741395405238	0.97970665213074
--0.024727169977757	1.0051141092366
--0.024586414967621	1.0213424365303
--0.024583344735447	1.097370304149
--0.024241477784194	0.9928172044431
--0.024148320817005	1.0116731658116
--0.024104546548785	1.0243810778315
--0.024004297927769	1.0087108415143
--0.023987889233434	1.04035465575
--0.023977040281248	1.0569975285089
--0.023952471874957	0.97843654183675
--0.023925509609146	1.1161758644592
--0.023923669061226	0.96276744139484
--0.023850320778456	1.0195966299038
--0.023837703021271	1.0085384577617
--0.023666719108985	1.0737708476822
--0.023644112913458	1.0431488869046
--0.02360175937968	1.1317895719891
--0.023523139365529	1.1251477707354
--0.023484377839099	1.0662915064024
--0.023387771269313	1.0399772711271
--0.023366849999069	1.0836799191733
--0.023356938321676	1.0839465137211
--0.023278329805965	0.98558936927927
--0.022966835523502	0.97970072904608
--0.022920676500055	1.0402206723479
--0.022874507299817	1.1074938671326
--0.022861361903135	1.0099613620545
--0.022791486704606	1.0282022645714
--0.022753220067866	1.1087568257005
--0.02272604953378	1.0484674019523
--0.02233747815915	1.0593766088595
--0.022300543490376	1.0243902945992
--0.022238439357473	1.0737390723921
--0.022116173470942	1.0457237299813
--0.021922569712483	1.0267872223916
--0.021793630448082	1.1072135016748
--0.021721583309532	1.0642473167195
--0.021684405528814	1.0803751194154
--0.021671525076541	1.0290592238086
--0.021586681844542	1.126802963703
--0.021506857458496	1.0561680866624
--0.021454336848886	1.0431799961609
--0.021241572632923	1.0564386453772
--0.021132204372112	1.0115961505885
--0.021108478046342	1.0352757369071
--0.021065021268355	1.1291863726498
--0.021061352772553	1.1698508411985
--0.021013867217918	1.0553358275073
--0.020981559512326	1.0656363825657
--0.020975938721426	1.0578160872803
--0.020948724425542	1.025491893567
--0.020923011892439	1.0588338170696
--0.020554913889665	1.0658136208779
--0.020553775626095	0.94458880953027
--0.019878712121643	1.0102544757398
--0.019620191196759	1.0444735933711
--0.019600663132017	1.0133727790985
--0.019576769188327	1.0463272488428
--0.019503774224635	1.0617807580049
--0.019490420097907	1.0360908684296
--0.019211829561011	1.0732856308215
--0.019053738219415	1.0122291857294
--0.01895252156926	1.1022629383182
--0.018802878403832	1.0724157031208
--0.018659388690687	0.99623275876205
--0.018591321454111	1.0290731577003
--0.018397982661665	1.0206616708216
--0.018338360836468	1.0268422661817
--0.01821410785648	1.0405018581217
--0.018102501561065	1.0242307779596
--0.018032293248348	1.0104262773341
--0.017952599503915	0.96314710346777
--0.017946861006665	1.0223558836446
--0.017818561383994	0.92728887071214
--0.017632768067937	0.94177706140275
--0.017532879437489	1.0424364122013
--0.017509741139533	1.061162554674
--0.017496818042168	1.1103127826414
--0.017482641506697	1.0586064363797
--0.017288325953277	0.98584640863792
--0.017264488963033	1.1163106298001
--0.017158979359959	0.9991322747989
--0.017109403701535	0.98790964998951
--0.016969288166019	1.0215734233514
--0.016866753970901	1.1012682828257
--0.016859453402222	1.0154272542031
--0.016564615849643	0.90697862980486
--0.016468967121913	1.098899464817
--0.016439062144788	0.94734017147917
--0.01643851844041	1.0278482688027
--0.016436009548338	1.1502126495187
--0.016217068400705	1.0571611106201
--0.016205375894529	1.0461069924615
--0.016152781114062	1.0523622103539
--0.016125309524624	1.0235149624668
--0.016080766641985	1.1024442465856
--0.015970330623914	0.94830547566499
--0.015951695417696	1.0567200306286
--0.015895922325248	1.0426913429534
--0.015816990547031	1.0995781098562
--0.015770988241631	1.061854702012
--0.01568858113965	1.0234048407342
--0.015634395946019	1.1340569901186
--0.015614518616477	1.0231230378291
--0.015606389559026	1.0494385412266
--0.015598664589645	1.0120759714538
--0.015547113786001	1.0636068576329
--0.015437310407125	0.98445658551047
--0.015300685713257	1.0405453816615
--0.015298658307972	1.0568404170176
--0.015096217812292	1.0414876290128
--0.014888932241435	1.0352246675473
--0.014828886137877	1.0051131113681
--0.014752182239065	0.97678443473487
--0.014537306369185	1.0478653656242
--0.014499096781853	1.0961418196834
--0.014421007068514	1.021009884438
--0.014292335554194	1.0585505321497
--0.014146184141543	1.1068309958342
--0.013909709334611	0.94226395918407
--0.013885321672337	0.98890689305121
--0.01376761230051	0.97444389859079
--0.013749595048122	0.97888947098034
--0.013522818895109	1.0880718840894
--0.013497960799851	1.072386212548
--0.013197207500496	1.0817648140139
--0.01273968493556	1.0789693945215
--0.012666129206095	1.0112542686625
--0.012520247430466	1.0417804239374
--0.012397962808629	1.0925161500678
--0.012321026518864	1.0914604693111
--0.01231720099839	1.0271388700915
--0.012091928256369	1.0269356848329
--0.012052137670075	1.0813897304521
--0.011815232872817	1.0057680853301
--0.011646897812088	1.0386578568151
--0.011583562161	1.0533195152853
--0.011339938697498	0.99154904571415
--0.011217169898654	0.98515408956877
--0.011021471030869	1.1631260604534
--0.010943366544862	0.97644097403703
--0.010920496610902	1.0904437093687
--0.010877972716658	1.0184574653598
--0.01084645496366	0.97916642866446
--0.010745650317134	1.1676580854452
--0.010727110432016	0.98834605009
--0.010661638723137	1.0221410455646
--0.010627374695363	1.0780266170996
--0.010392874720284	0.96499144410573
--0.010258676632142	1.0094515636468
--0.010201246055201	1.085289596484
--0.010173864973889	1.0207724973337
--0.010086677109084	1.0479743403702
--0.009980648939559	1.0183625026041
--0.0098961388672496	1.08753504998
--0.0098354700603622	1.0641724717393
--0.0097992348601492	1.0441577688416
--0.0097879183042595	1.0021594100438
--0.009753931333296	1.0283727947023
--0.0096188647647124	1.0713851480434
--0.0095038354515468	1.0466357705162
--0.0095029356514408	1.0512896788771
--0.0094972005059355	1.0589175906757
--0.009485672577202	1.0952930984052
--0.0094254568480638	1.0169586606043
--0.0093633535725954	1.1010343082872
--0.0093236027131996	1.0329849330027
--0.0093002421260962	1.0861560435138
--0.0092372958907962	0.957276110138
--0.0092043564698223	1.0675694083875
--0.0091328442258259	1.0868635006644
--0.0091062875245978	1.044506945826
--0.009102853141116	1.1625247227752
--0.0090958006142473	1.0554290801778
--0.0090749345131316	0.9907955206153
--0.0087573917958014	1.1037788874241
--0.0086260860019406	1.181905368031
--0.0085969665018086	1.0560552945472
--0.0084258925658109	0.92318595176531
--0.0083765658645895	1.071668738677
--0.0081556794909978	0.97623351287368
--0.0079858112948992	1.0224721204004
--0.0078309487207852	1.0374510794319
--0.0076187038777562	1.0440436128564
--0.0074441308235832	1.0651089754325
--0.0073757852860804	1.1200126045182
--0.0073036713867316	1.0873408792086
--0.0072518112382617	1.0799424675719
--0.0072074061969208	1.0443646885659
--0.0070378559360103	1.0780703829929
--0.0069950794731492	1.0893160360917
--0.0069921730039544	1.0061773205483
--0.006947473126379	0.9974835322922
--0.0069125157536629	1.0194222881502
--0.0068788559391388	1.0495992211388
--0.0067022475387748	1.0374998545202
--0.0066255553585386	1.1177500718113
--0.0064519019481178	1.0222285693066
--0.0064089880032541	1.1029944702809
--0.006305157847216	1.0443469719952
--0.0062153137738811	1.0315252890146
--0.0061190413703085	1.0163768665398
--0.0060829282371001	1.1283174162812
--0.0058901703226169	0.99766311291538
--0.0058874151082406	1.1338684053646
--0.0057941768635546	1.0261836228198
--0.0057735141147161	0.9167541889492
--0.0057606772665386	1.0097201579765
--0.0054709879943039	0.96913943051023
--0.0053578440694546	1.0297623204078
--0.0053115515810525	1.0685275426251
--0.0053030121699763	1.1004971934519
--0.0052430775311409	1.0176095526293
--0.0051914997741413	0.96000934534059
--0.0049580534251201	1.0653630408226
--0.0048204454412891	1.0474196875273
--0.0045045512146381	1.015903702009
--0.0043696514803841	0.94607285831142
--0.0042374997909196	0.99689576632995
--0.0039521634729388	1.1448545543839
--0.0038632395007752	1.0635428589435
--0.0038627971374791	0.96098651416422
--0.0038257173970624	0.97976057334045
--0.0037920659680177	1.1299977348134
--0.0037831661699115	1.094784455276
--0.0037589214810001	1.0297980815504
--0.0037167252227012	1.1039668052981
--0.0036786723085907	1.0863370910464
--0.0035569143164507	0.98655349564903
--0.0034553562881108	1.1048499261477
--0.003437475312429	1.0069492534737
--0.0034153781276191	1.0121896984987
--0.003264319642635	1.0567940491392
--0.0032409654249518	1.0528372688643
--0.0032244199095692	1.0447829963098
--0.003195491350131	1.088946304694
--0.0030374251195593	1.1361433105136
--0.0030322407225109	1.1416534857233
--0.0029301360865695	1.0550809743414
--0.0028972531922454	0.92964087852651
--0.0028154957239143	1.0319599178366
--0.002761151148771	1.0138916833198
--0.0027019250829514	0.97828647096001
--0.0024742594584755	1.0161546216572
--0.0023166026476833	0.96570283303937
--0.0022573353380595	1.042753287233
--0.0019965180996106	1.1031989729782
--0.0017243563626029	1.0322973517933
--0.0016299599834297	1.0821228927324
--0.001555808073308	1.1021619418271
--0.0013857769312249	0.99801974939897
--0.0013289671813985	0.9879824401236
--0.0010712997843154	1.0275897953634
--0.00085562234451449	1.0945567071888
--0.00064203712770765	1.0370335836075
--0.00036572138577897	0.98795517262379
--0.00020404541392297	1.0768619674576
--0.00014461435459039	1.0450424166484
--0.00012785779094644	1.044958000631
-3.0451636468439e-05	0.97634139571987
-0.00010034235653916	1.0458056996227
-0.0001365050946843	0.95032687375956
-0.00031463861122248	1.0662083774143
-0.00037340091172062	1.0624769950539
-0.00048891580034857	1.1318728920646
-0.00054625416171238	1.0676996724128
-0.00055641367409564	0.97265706855278
-0.00085780183283054	1.006198389057
-0.0010101613235592	1.1308167271765
-0.0011474504673446	1.1591524947083
-0.0012496406642243	1.0340766144818
-0.0013466305350471	1.0726856614754
-0.0013687219827648	0.99532024856222
-0.0014014328618075	1.0784316307611
-0.0015518297323897	1.0271693691368
-0.0015748726731165	0.97884563879504
-0.0016717436220699	1.1046463467277
-0.0016811596236973	1.0326368376635
-0.0016855226312212	1.0078313941699
-0.001739907645676	1.1504122190039
-0.0017494525784893	0.97526620749798
-0.0017631416502778	1.0038218430129
-0.0017727186694121	1.0292399180274
-0.0018151646390339	0.94042370726906
-0.0018647161881519	1.0147436065762
-0.0018770762291975	1.0606955614611
-0.0020190999574167	1.0397719890554
-0.0021666878486792	1.0199624079767
-0.0022056765965103	1.0942782352917
-0.0022145278829564	1.090251139374
-0.0023263990011021	1.0323424607895
-0.0023469855896837	1.0510068272444
-0.0025389170680218	1.0047034338363
-0.0026219302066843	0.96778990466941
-0.0026933187107378	1.0585521634338
-0.0027407608643399	1.0418609243863
-0.0030054336803422	1.0278130417992
-0.0032648442697112	1.0948578343346
-0.003378714735529	1.0569512948082
-0.0036366917659211	1.0753808018891
-0.0036611030091583	1.047989039266
-0.0037246637346128	1.0330781415317
-0.0037407588610184	1.0139207306403
-0.0038096471943166	1.0336151075037
-0.0038111283005024	1.0153781254059
-0.0038784704259733	1.0803087351048
-0.0039361444930823	1.0991654927863
-0.0039679935267842	1.0704388184719
-0.0041113192319249	1.0279412555237
-0.0041495058789189	1.0532828835596
-0.0041703455421212	1.0523408876431
-0.0041877025883431	0.99384635504204
-0.0042025863924496	0.97977022317388
-0.0042476141868871	1.0554688891129
-0.0042514625698632	1.0820826533491
-0.0042828210763498	0.9715438993378
-0.004338637334195	1.0337735975646
-0.0044405949682982	1.0779009223863
-0.0044576990496795	1.0259187179036
-0.0046318006155755	1.0510432267172
-0.0047586969336313	1.0538903751046
-0.0048268118623613	1.0075497949356
-0.0049257006251251	1.0114023797745
-0.0049513497593843	1.0122320342048
-0.0049619935360498	1.0362216448881
-0.0050054978605388	1.1055421361197
-0.005020404762432	1.0350070206785
-0.0050396985454473	1.0158656303293
-0.0050418898364327	1.050055523948
-0.0051332787341775	1.0826573445653
-0.0053294740939407	1.043517551387
-0.0053826542610931	1.0246390431656
-0.0053924976626879	1.0528496423718
-0.0055384700681846	1.0624445411507
-0.005601506023047	0.99840258029771
-0.0056785060544104	1.0173411679499
-0.0056800593267945	1.0263704255931
-0.005703616351883	1.0287186770257
-0.0059939483163781	1.0557058758089
-0.0060922294309123	1.0714714941002
-0.0060927433289082	0.99044951696252
-0.0062154119207317	1.0209922466966
-0.006295166889835	0.96019947710075
-0.0064559953135295	1.017901049857
-0.0065065656975912	1.0063170125843
-0.0065328556949555	1.0127278369764
-0.0066003046542705	1.0193977953034
-0.0067134256017322	1.1031091584507
-0.0067418331589086	1.0658669926392
-0.0067928758044076	1.042213958146
-0.0068688344665313	1.0782970067197
-0.0071244413889128	1.0666043799901
-0.0071789648746449	1.1449453433914
-0.0073806854471135	1.0533941885832
-0.0073994549126046	1.1711266362701
-0.0074513058257942	1.0872649944347
-0.0075207261905099	1.0411645263893
-0.0077202453935618	1.0347044730349
-0.0077333738833805	1.1180019105314
-0.0077363120444507	0.99969617513142
-0.0078950274043774	0.97023852655436
-0.0079411886062912	1.015149385803
-0.007990322146646	1.0872240043301
-0.0081711320665125	0.94090537431428
-0.0082204987669678	1.1292409284438
-0.008275117893945	1.0814592255439
-0.0083524940441323	1.0434689237926
-0.0084069709057476	1.0854108975338
-0.0084573924770809	1.0744520229922
-0.0086244691001316	1.079269453753
-0.0087183826126773	1.0673411230576
-0.0087887450671453	0.96661288773705
-0.0087983001664665	0.93697765583316
-0.0089174202550519	0.95015498275197
-0.0090321513641956	1.1060305616075
-0.0090414921805091	1.0854884217944
-0.0091037177521533	1.0199358549997
-0.0093487977870841	0.98893146436792
-0.0094714996254597	0.96235102751438
-0.0096363867244496	1.0001753915163
-0.0098315485905978	1.0398399974397
-0.0098592983395631	0.98452569920322
-0.010017606211281	0.94827105392727
-0.01004336217895	1.0024030726156
-0.010226382813888	0.99374916418919
-0.010255005622313	1.0636044969465
-0.010302037400572	1.0930652455947
-0.010330150123576	1.1166010669909
-0.01036270383405	1.0422864944635
-0.01059440188966	1.016320809349
-0.010751398141769	0.93363482536589
-0.010774932073694	1.0039861945745
-0.010783393922936	1.0262307178783
-0.010838122774172	1.1211117227477
-0.010852413429825	1.0145631249612
-0.010976820554971	1.0030267934633
-0.011022971752684	1.0463625523209
-0.011093045695756	1.1858921898452
-0.011316683420128	1.0201676794416
-0.011341360429169	1.0294874980036
-0.011387876262849	1.0675837433211
-0.011441759806075	1.0500628786825
-0.011454866674432	1.0686022723077
-0.01147334734453	1.0189231237557
-0.011794233569737	1.0088860438585
-0.011869811905734	1.024759444136
-0.011957432396859	1.0339146227354
-0.011980071319944	1.1037406052714
-0.012022039020959	1.0995553398304
-0.012220423778485	1.075181657183
-0.012534879468834	1.0118716759739
-0.012842690656585	1.0231138647337
-0.01295580520452	0.93560868522767
-0.012984767706844	1.1050141430714
-0.013008056086399	0.96631589739239
-0.013044079149104	1.0127934085754
-0.013072741085263	1.0856646654202
-0.013099832830648	1.0152744636183
-0.013112680667496	1.0292752175857
-0.013193110139412	1.0296664787982
-0.013375306419283	1.0086267943053
-0.013454143584836	1.0579064200536
-0.013596215238227	1.0243378248513
-0.013655267231762	1.0743843805979
-0.013661401212067	1.0673695558737
-0.013667529284363	1.0243697027189
-0.013753540273315	1.0644425934443
-0.013754588155765	1.0962425179631
-0.013755529303192	1.0124587803058
-0.013763666905121	1.0600501023188
-0.01381311555932	0.99455807284379
-0.013928896223212	1.0075482629011
-0.014297381427072	0.97716096023975
-0.014324159811855	0.95952723229952
-0.014399006453229	1.001974073042
-0.014425711078208	0.97968510249942
-0.014439730069494	1.0805570668592
-0.014990350801211	1.0006525243073
-0.014990582118471	1.149583321857
-0.015065711022937	1.0388267521965
-0.015297326586431	0.97362844946423
-0.015334650879322	1.0747775986163
-0.015523255083142	1.0265554008317
-0.015660879316913	1.0783360886319
-0.015777226873099	1.0046138344266
-0.015860810102479	1.0322821892431
-0.015920439242882	1.0739639089438
-0.015942654689341	1.0779914751202
-0.015950109875394	1.0616388073888
-0.01603175360998	1.0961725466159
-0.016069843087206	0.99371488436407
-0.016070942628637	1.0062540957824
-0.016319844800388	1.0712019410676
-0.016380728103938	1.0558157521136
-0.016612209484602	1.1001878555141
-0.016775672870391	1.0169048314526
-0.016776295099463	1.1565449522799
-0.017027275889956	0.93659936236398
-0.017031438589734	1.0960454545701
-0.017287672219752	1.1173123817117
-0.017343673965741	0.98395638833198
-0.017464031554054	1.0505264919603
-0.017479321396528	1.0574455372893
-0.017501961118148	0.98318587202303
-0.017536955894641	1.0250672896501
-0.017557054768225	0.96765893646759
-0.017679871789278	1.0706444679515
-0.017863466829156	1.0479865042553
-0.017955400529813	1.0886200453946
-0.018048468852553	1.0668082861191
-0.018082379203388	1.093332459386
-0.018153033206676	1.0277909607653
-0.018205612634809	1.0613851310784
-0.01836032111025	1.0408039600566
-0.018510440946717	0.963421284415
-0.018637175671142	1.0723148093524
-0.018993407058199	1.0059068573321
-0.019043996290968	1.053018825199
-0.019097273931851	0.99915946011714
-0.01932988288984	1.1951156641726
-0.019427523843415	1.1079775890225
-0.019657109903763	1.0671787882594
-0.019714209243048	1.0525623180667
-0.019774853164027	1.0708785306866
-0.019886819912479	1.093818615152
-0.019964049255872	1.1176563719514
-0.020107508577507	0.98575503516188
-0.020274603545903	1.0529254979754
-0.020526896087428	1.0670755914564
-0.020567789823691	1.0290160143453
-0.020751962745919	1.0360239153067
-0.020918835466069	1.0511512125447
-0.021094007477743	1.023660646869
-0.021103374455069	1.0289621048294
-0.021132241311318	1.0773131845723
-0.021363766158654	1.0743587504426
-0.021571461896306	0.9656684047319
-0.021624602067503	1.0390680743007
-0.021657167715424	0.99078825499689
-0.021679828185353	1.101574840235
-0.021707898394668	0.93933361420726
-0.021876012922893	1.0638529330419
-0.021900366321131	1.0785503414352
-0.021944989426037	1.0830114799852
-0.021964327160545	1.0955567662283
-0.021969159730837	0.99620039375001
-0.022176776601586	1.0665055509213
-0.022215952708065	1.0462117515789
-0.022398248096982	1.0410533624065
-0.02269256602995	1.0265243112698
-0.022693623750998	1.0604200748549
-0.022740704410908	1.080173673714
-0.022828677356958	1.0066824671494
-0.022831725120409	1.038690915692
-0.022840276325398	0.970482497019
-0.023025100776751	1.0282284281422
-0.023067338142596	1.0222608291284
-0.023195681414743	1.1285573609816
-0.023331693583614	1.0221153834759
-0.023382704750576	1.105443698301
-0.023389427832524	1.0520875307269
-0.023537555510167	1.0133442199994
-0.023541149691425	1.0604037551075
-0.023632428851655	1.0808052729169
-0.023729099442437	1.0350088519443
-0.023769935160175	1.0438163015124
-0.023932244921849	1.0942718091859
-0.023997141529155	1.0710805954332
-0.024009591311037	0.96872810844793
-0.024012869126144	0.99440249144642
-0.024045665550765	1.080557608052
-0.024059241973725	1.0247740472972
-0.024099217685729	0.97348336782522
-0.024127572186049	1.0039081028264
-0.024145954559015	1.0061650535412
-0.0241616988709	0.94192269360134
-0.02424528212821	1.0100663775354
-0.02427990704912	1.0346679697076
-0.024345455740108	1.0360634416321
-0.024387585968642	1.0926437778717
-0.024389969141504	1.0161740486296
-0.024546095122874	1.0169518850444
-0.024563295982392	1.0279559132865
-0.024751657544007	0.96837209316963
-0.024761023406684	1.0514173982463
-0.024841449071882	1.0524679132439
-0.025161925370811	0.95456759218417
-0.025253816413861	1.1050922994861
-0.025340634442991	1.1319064107677
-0.025493961199519	1.0627508991212
-0.025513813938471	1.0972989776012
-0.025527405137699	0.99368693979506
-0.025671865063531	1.0308676067389
-0.025710907226113	1.0224286809624
-0.025753788938306	1.0307170588271
-0.025753815871206	1.0225398712066
-0.025961888021143	1.0381055000709
-0.025978605051632	1.0853152654366
-0.02606279695605	0.99997967311024
-0.026100476692282	0.99651520959199
-0.026140147130115	0.98101470904722
-0.026330861668927	1.0518626531631
-0.02639764601549	1.0717650954535
-0.026408851464372	1.0006100227901
-0.026538897981398	1.028797894506
-0.026591039966113	1.0230616881649
-0.026614257365637	1.0075577659408
-0.026639824900268	1.0919042205457
-0.026754100445468	1.0829549651368
-0.026887891471394	1.1189215521332
-0.02708215391282	1.0678913540864
-0.027091650836627	1.0582840369003
-0.027216911437652	0.97831748873686
-0.027649817970084	1.0860079102208
-0.027652099933186	1.0485506923236
-0.027712871004056	1.0583075762017
-0.027782523158018	1.0248196240829
-0.027785688917067	1.1282145274262
-0.027927008628149	1.0249833346445
-0.027952404641264	1.0613228093088
-0.027965944065008	1.0779275872631
-0.028036943529055	1.0750951237193
-0.028141010967157	1.0356108739166
-0.028258958919937	1.1272153194367
-0.028364114761924	1.0499504430947
-0.028463486676016	1.0425922463732
-0.028525834404042	1.0627994290237
-0.028761357192293	1.0500745311632
-0.028979171219341	0.99706329266878
-0.028993393231664	1.0169153145543
-0.029408392199627	1.0114919507966
-0.029409282947163	1.1075090137401
-0.029495698034404	1.0420359301845
-0.02955199977579	0.98720758143854
-0.029709726471075	0.99447884671534
-0.029756695440159	0.95321075501576
-0.029872091214958	1.0165928632888
-0.029931936071492	1.1215540506631
-0.029991741995135	1.0959740744974
-0.030076801584586	1.0028911461513
-0.030208070749177	1.0936426214359
-0.030249583765852	1.0346304982574
-0.030329647941561	0.94148169443134
-0.030505567894078	1.119565260247
-0.030527935981961	0.97961001514877
-0.03053465116449	0.99689830927643
-0.030545570930285	1.0480990318956
-0.030774128009726	1.0467268798234
-0.030904749229324	1.0894378654144
-0.031147704799171	1.060107464179
-0.031273129602914	1.0656013740992
-0.031286935201579	1.0105269992374
-0.031294123187912	1.0489663905147
-0.031487850583375	0.97366496450837
-0.031584230307376	0.98544862718314
-0.031837332964879	1.0370091672262
-0.0320377193184	1.0671101167267
-0.032288184379672	0.979502653366
-0.032311803866986	1.0329165770243
-0.032456313006016	1.0307955471439
-0.032467228757409	1.1057619538923
-0.032615703026347	0.97537688909435
-0.032962626893869	0.98119230461184
-0.033059618328508	1.0243593627334
-0.033098163716758	0.99081274230406
-0.033423719097416	1.1905553035081
-0.03344393179216	1.0261125259439
-0.033537514328376	0.96338566512284
-0.033704265472923	1.020754350797
-0.033745345147579	1.0235899422349
-0.033825005860061	1.0117708707683
-0.033835525689264	1.0431514649376
-0.034032639428565	1.1119886724853
-0.034051774591484	1.1154902755237
-0.034091097806847	1.0765813925359
-0.03441936436462	1.0203311806186
-0.034598609689185	1.0055297490034
-0.034609898993041	1.0155396481067
-0.034831634672744	1.0068159279995
-0.03483655003493	1.1509646325537
-0.034910360961448	1.102458799365
-0.03494205121865	1.0483857436496
-0.035010331756542	1.1023987423586
-0.035186469467152	0.96540123544521
-0.035308046592774	1.1482414186103
-0.035340043714924	0.96744240881184
-0.0354401017781	0.98745579223973
-0.035528980066015	1.0658683413068
-0.035530699844607	1.022345203508
-0.035534929347216	1.0062316968405
-0.035751554140686	1.0641260241591
-0.03615464869644	1.1012930042451
-0.036220965032123	0.99245027521674
-0.036255884355359	1.0310400826529
-0.036259863784234	1.055889075147
-0.03629813707692	1.0364084807861
-0.036312570005177	1.0602920688421
-0.036416364440704	1.0430323098521
-0.036459679021477	1.0410468567835
-0.036508618007838	1.0269982984701
-0.03662656069514	1.0098939475175
-0.036996836524584	1.0443374032984
-0.037297593855353	1.0741834867665
-0.037374515853487	0.96821899814057
-0.037389225705184	1.0137209263798
-0.037392048021854	1.0263190054203
-0.037552551430835	1.0258679378837
-0.037594460415065	1.0821531041231
-0.037717258575685	1.0403598499208
-0.037935418201943	1.0676657137743
-0.037970281489394	1.046400344462
-0.038085471365546	1.1630774813468
-0.038152564958837	1.0807554030115
-0.038305805922763	1.0582419839047
-0.038477426828936	1.0924713655635
-0.038505954273475	1.0287248732099
-0.038678058859252	1.0294806105466
-0.038803481502152	1.0442654193041
-0.038939075039149	0.94114888489678
-0.038987897929502	1.0772714049433
-0.039174127083481	0.96546417420143
-0.03949853215609	1.0044860829975
-0.03956943199333	1.0401109688515
-0.039804083629606	1.0725555848744
-0.040112354632656	1.0439326541563
-0.04028121264635	1.085499760065
-0.040544477112506	1.0879611067442
-0.040859858911371	1.0056605543696
-0.040919835523674	1.0575031417829
-0.041028081748606	0.99689528272964
-0.041611687948391	1.0783813974758
-0.041806501607356	1.0443698479478
-0.042029541377977	1.0325720297871
-0.042031458365487	1.0761351678211
-0.042068452024837	1.0502347328691
-0.042071117479906	1.0843742291616
-0.042088427059775	1.0437225517247
-0.042126969432741	1.0872956704043
-0.042269698587575	1.0380517347201
-0.042328204119307	1.1048061323968
-0.042534702569118	1.0844051033406
-0.042608997894787	0.98216124035345
-0.042643339998804	1.0349023074604
-0.043636405774263	1.0243893178205
-0.043942808041947	1.0558646544488
-0.044197840506814	1.0536434836221
-0.044300450721935	1.0455447222152
-0.04455427651688	1.0027852911473
-0.045096283293461	1.1239075670322
-0.045178824676883	1.0303803616832
-0.045222075664767	1.1273190405966
-0.045277002507163	1.0525109241987
-0.045348700342496	1.03261116836
-0.045513247210923	0.93456118373981
-0.045552181567436	1.0646184203907
-0.04564276620418	1.0456408708008
-0.045695308238338	1.0059232747479
-0.046291341484943	1.0453153135945
-0.046917821272261	1.0438194200538
-0.047163972275964	1.0213231494014
-0.047238649947519	1.0091430271634
-0.047787963540262	0.97478302408347
-0.048186500456359	1.0972077859002
-0.048205130687965	0.94309596402991
-0.04857520695041	1.0621253696246
-0.049861836226309	1.0565609041579
-0.04992880160437	1.0609841630796
-0.050477065141517	1.0516616077274
-0.050568057809856	1.0634061937724
-0.051062886659889	1.021175789179
-0.051089357295406	0.99927185393007
-0.051163261174614	1.0625981363385
-0.051260289179963	1.1124291863953
-0.051574900012381	1.0198926006218
-0.051813323256537	1.018156642247
-0.051917292479213	1.0522454187568
-0.051986572944286	1.0930986412041
-0.052512014520906	0.99422727361335
-0.052734468237537	1.0338765174929
-0.052791003093597	0.99709694878288
-0.05283179718349	1.0800491308174
-0.052867595789631	1.0362425577711
-0.0533973097802	1.0722758961144
-0.053598708621061	1.0389491493418
-0.053872548134341	1.0254834803533
-0.053884575159546	1.089025669963
-0.054007384959782	0.9976606501746
-0.054120031418466	1.0241296517159
-0.054803335273104	1.0925853594967
-0.054972644694337	1.128142403997
-0.054981185271706	1.115990330475
-0.055581046322645	1.0177394154902
-0.055809122669018	1.1189799517722
-0.056270609777831	1.0728221089378
-0.056314513787795	1.0702880731265
-0.056918591859989	1.0314631620425
-0.057054721917153	1.030381183978
-0.059215751667604	1.0526592281133
-0.059243655864089	0.96616271972476
-0.060149692151068	1.1410075624902
-0.060443872474845	1.0030402655554
-0.060613522785631	1.0323462812733
-0.061485516430101	1.0230443278616
-0.061644500776623	1.0430966321384
-0.062800108683081	0.96831604912625
-0.063313462276424	1.0471838328317
-0.063349958052368	1.0052798460146
-0.063618584045097	1.0444920064492
-0.064324828686573	1.1737747122642
-0.064481456820764	1.1201404550867
-0.065413040770848	1.0420338965249
-0.06567187182579	1.0173546973385
-0.066355550975036	1.0807742825318
-0.06665510867807	1.0157272929725
-0.067282439665865	1.0971232480732
-0.067469333924031	1.0141328358045
-0.067928494595022	1.0158655606695
-0.068358969295044	1.0667701422861
-0.06892339276401	1.0211621551726
-0.068963346069058	1.0448300910919
-0.069215290357532	1.0944997026357
-0.069229468342028	1.1086254817589
-0.070280824426845	1.0829895079412
-0.071638120894839	1.1123318965685
-0.071985105840588	0.99646067253113
-0.072679252688938	1.1536242254462
-0.077374661911026	1.0796010102122
-0.07781751145817	1.0355769051255
-0.079844900565023	1.0145191923501
-0.079946225159076	1.0391076879142
-0.080196476802703	1.0772787821381
-0.080354931253449	1.0049139811011
-0.081729153765545	0.99322214679801
-0.083056711566111	1.0414723550234
-0.088499028574951	0.99791100031666
-0.090256213591909	1.0630167585133
-0.094759071221866	0.98297688227792
-0.097573533047283	1.0013399168592
-0.1072015593282	0.95183876643946
-0.11226721874715	1.1478700225589
+-0.10497045712461 0.92908626816169
+-0.10303726521254 1.0839316738048
+-0.098471726916423 1.0732768075083
+-0.094706867247905 0.92415201289011
+-0.091233284993305 0.99784907309092
+-0.090950250630774 1.045528772476
+-0.085191067431077 0.97373109001266
+-0.083693952372356 1.069512893715
+-0.082997016937968 1.000031796313
+-0.0822700390127 0.99293951815895
+-0.0820739045782 1.0585070089127
+-0.077267295263318 0.98506808258966
+-0.077117465587113 1.0336707165228
+-0.076912546601461 1.0468179906945
+-0.074179868909128 0.98147050281715
+-0.07403456723398 0.99715034389517
+-0.07358261821014 1.1359777201128
+-0.073290211151814 0.98064426913718
+-0.073175116994201 0.96345663743462
+-0.072983667191032 0.99300322800777
+-0.072926805413777 0.97046509607858
+-0.072588648723905 1.1119248316009
+-0.072588179994 1.0511425373231
+-0.072049617391279 1.016617538186
+-0.071339398099482 1.0012991109315
+-0.070837215866205 1.0509567229172
+-0.070582854038817 1.0867928655542
+-0.07040540481939 1.0131055251096
+-0.069356601411579 1.0157885565374
+-0.068512080442675 1.0269249169117
+-0.068045582445813 1.1038491741538
+-0.067052901397287 0.98772165547191
+-0.066310743227343 1.0796343355435
+-0.066184501541924 1.1492781678548
+-0.066025479438527 1.0640927362911
+-0.065766675893958 0.98125781821915
+-0.065528469854491 0.94100690320696
+-0.064532035456792 1.0209864576566
+-0.064323393243902 1.07896340234
+-0.064183404650338 1.0812008005858
+-0.064137576792222 0.97164369270275
+-0.06413069572589 1.0407031128918
+-0.063324704868038 0.96616463193002
+-0.06329904795504 1.0270145193473
+-0.063073300537916 1.0160585512014
+-0.062241904371072 1.145136759412
+-0.062161203292393 1.0279984523388
+-0.062062032756728 1.0718661146065
+-0.061988066472765 0.99622797843863
+-0.061859319822518 0.99326643153952
+-0.061748267615001 1.0250212006836
+-0.061723534218994 1.0076570987663
+-0.061047619067581 0.94882117084581
+-0.060775752953243 1.0131133725309
+-0.060706745568602 1.0229222107971
+-0.060558285167175 1.0035759887007
+-0.060455959744898 1.0234268768251
+-0.060444820723913 1.0487760287579
+-0.060108809052494 0.98524986923062
+-0.060105691513507 1.0137800084038
+-0.060050580329199 0.97345806417757
+-0.059959143400439 0.96628358355269
+-0.05986403760967 1.0193615277981
+-0.059756742429742 1.0245632370487
+-0.058891057139535 1.0190012653231
+-0.058560948121718 0.97444302060849
+-0.058535896855147 0.97820489673807
+-0.058373015210858 1.1709341371993
+-0.057819312016993 1.0243627788954
+-0.057289802374969 1.083624220288
+-0.057183023900624 1.0966927383724
+-0.057163532983601 1.0171111354192
+-0.05676229717485 1.0423136123322
+-0.056471356421967 0.94548782690979
+-0.056233745258658 1.009225174993
+-0.056192144808518 1.0768828794636
+-0.056155018001824 1.05117464323
+-0.055881906923415 1.0296007041592
+-0.055483613665278 0.99915092967419
+-0.054910423230185 1.0066822918584
+-0.054702599677133 1.0399449184422
+-0.054383495490468 1.0709943750635
+-0.054244539428788 1.0854697337518
+-0.053933419555653 1.0318965911962
+-0.053918182534811 1.0736391833733
+-0.053737668078972 1.0297041331457
+-0.053651165598871 1.0117932088873
+-0.053635828052285 0.98611718759074
+-0.053616457155631 0.97879262639703
+-0.053608158432034 1.0250709784091
+-0.053174591420227 1.0066059765305
+-0.052682451371402 1.0043216727631
+-0.05258330748579 1.0159769056857
+-0.052349040485672 1.1003797228708
+-0.051976374064461 1.0480402055563
+-0.051852008927111 0.97727397468016
+-0.051657781896293 1.0643473152666
+-0.051154113849233 1.0060316974451
+-0.050952025809543 1.0302058209275
+-0.050897307614132 0.99160961525097
+-0.050262955743043 0.95540877233616
+-0.05006019172846 1.0695864234241
+-0.049903666923695 1.1121951969714
+-0.049175941112373 1.0432000531582
+-0.048799191421009 0.97268008689488
+-0.04876030680714 1.0523377469024
+-0.048759777762721 1.0996179864493
+-0.048650217648164 1.081409819496
+-0.048539004023917 0.97128197271013
+-0.048521642097026 1.0130030295809
+-0.048383650071117 1.0321770309542
+-0.048227758980079 0.96201737954439
+-0.048092269450189 1.0302849061891
+-0.047746824413724 0.92808692190851
+-0.047339786310493 0.96199285303766
+-0.047004525867081 1.0087007054347
+-0.046941917793638 1.1115454689525
+-0.046879714097497 1.0035860979879
+-0.046594429314278 1.1013875064224
+-0.046542973678832 1.0458622796117
+-0.046335392197949 1.0172000559349
+-0.046207509561646 0.99108156102389
+-0.046204409228854 1.0446190127707
+-0.045993726122153 0.96312162228716
+-0.04593370453955 1.1056201164926
+-0.045684827799559 1.0700638868206
+-0.04512536050205 0.96645988058432
+-0.044639480833196 1.0643470720894
+-0.044547871595823 1.0185106314833
+-0.04419444511834 0.96725946291752
+-0.044141540885962 0.99145833742285
+-0.044125803224583 1.0063738447259
+-0.044086761707227 1.0125433446095
+-0.044020641410534 1.0525849726422
+-0.043831257494653 0.99102808845512
+-0.043534910123178 1.0039511988808
+-0.04345733914761 1.0012489301408
+-0.043279401784366 1.0299002748735
+-0.043003515643771 1.0260068261965
+-0.042959774421611 1.0086671673322
+-0.042910263802177 0.98551900687285
+-0.042812779372828 1.0363723102156
+-0.042651734181269 0.98279791317078
+-0.042546058886007 1.0959340409787
+-0.042334091255095 0.97585806723882
+-0.042126255586853 1.0041838161185
+-0.042008201602932 0.9524793814944
+-0.042007281965931 0.99034984021702
+-0.041820821299955 0.94725594934378
+-0.04178486145227 1.0469280572138
+-0.041513204298778 0.9890368242605
+-0.041465432599775 1.0216504006662
+-0.041335252232218 1.0545583356563
+-0.041238556301838 1.0329670592567
+-0.040738915119789 1.1352270886907
+-0.040703441547414 1.0553252940704
+-0.040664486006701 1.0076052437917
+-0.04065811403295 0.94673489480232
+-0.040281828586785 1.0167105498076
+-0.040131719656175 1.0113645255427
+-0.040081688825079 0.97025767282402
+-0.039734207638795 1.0968079063039
+-0.039687432876268 1.0462796577234
+-0.039359831334346 1.0799273923893
+-0.03929338528937 1.0149878428859
+-0.039260536344305 1.0054281829547
+-0.039149548354668 1.014613299911
+-0.039051139701768 1.0650066978528
+-0.038952104250859 0.97026600687399
+-0.038912462191757 1.028643539205
+-0.038859476543986 1.0590583910668
+-0.038836381077756 0.95842179005068
+-0.038619623178723 1.11632336764
+-0.038516168775921 1.0286192346473
+-0.038146277413205 1.04955835522
+-0.038124986844493 0.96313579832451
+-0.038022575801754 0.91789074984538
+-0.037910460393695 1.0363455463322
+-0.037888062181152 1.021534914222
+-0.037780990859406 1.0466836965184
+-0.03754588652473 1.0519588969578
+-0.037540566227516 0.97885646898797
+-0.037528838555186 1.0240879228357
+-0.037507859100106 1.0580057104079
+-0.037422623032665 0.97053467004369
+-0.037403974382316 1.0894183791197
+-0.037390824845431 1.0562014397788
+-0.037366414955852 1.0580181764219
+-0.037319518429576 1.1315667988178
+-0.037294998361125 1.0966352295161
+-0.036899181739935 0.97961499626674
+-0.036655964073581 0.99875523436902
+-0.036259013912257 1.0645077781724
+-0.036218260066323 1.1432896666333
+-0.036091399607235 0.97046270885559
+-0.035975498135068 0.97788973080067
+-0.035950981467954 1.0360310697608
+-0.035871382547455 1.0913914987488
+-0.035692287648859 1.0527169831726
+-0.035494323896533 1.0580401880598
+-0.035141126040897 0.98190885570018
+-0.034831177483392 0.99465771316146
+-0.03479702059797 1.0065710584259
+-0.034783292101622 1.0402088229936
+-0.034653046400903 1.0877308343663
+-0.034621201693629 1.0813790260583
+-0.034481232734955 0.96884660944316
+-0.034478739526987 0.96337117446489
+-0.034413916112182 1.0199007912494
+-0.034374238325709 0.96268696700339
+-0.034155774878379 1.034555338895
+-0.034073647085271 1.0110064279398
+-0.03396123670827 1.0635613602392
+-0.033954512720544 1.0759123975813
+-0.033675573590008 1.0837134902386
+-0.033672478509882 1.0832328293034
+-0.033634613970103 0.92482400399532
+-0.033608325357852 1.0925469610292
+-0.033590546661138 0.99060561096926
+-0.033587463273035 1.0205801658138
+-0.033480451338049 0.92877321243235
+-0.03316554421449 0.98877454122315
+-0.033060719503664 1.0561086731981
+-0.033018223339228 0.91466947871088
+-0.032974495095473 1.0336044213078
+-0.0328263523703 1.0024292353162
+-0.032633807789251 0.91041220171225
+-0.032622350206647 0.90764424432003
+-0.032607511083764 0.91724474159028
+-0.032561141536541 1.0335192072632
+-0.032378838215573 0.9942487755622
+-0.032327921553556 1.0618730768019
+-0.032297586504015 1.0356684009443
+-0.032203486492581 1.01368611568
+-0.032188692525851 1.0742555964198
+-0.032188454074764 1.0557240004219
+-0.03218637506197 1.0558352062705
+-0.032092628484307 1.110763585119
+-0.032090206182309 1.0124992212152
+-0.031999296865362 0.95783169309444
+-0.031975243659399 1.0510778303481
+-0.031723304898687 1.1067226190278
+-0.031701013536658 1.0127696290968
+-0.031621480588463 0.95635178216515
+-0.031576018095114 1.0193147150458
+-0.031451325000285 1.0140350904647
+-0.031412827608237 1.0232976998608
+-0.031406511704013 1.0374917515227
+-0.031336923042976 0.91576933846181
+-0.031317590118049 0.97477334241274
+-0.031114665538427 0.95808119831011
+-0.03108691612334 1.0858020008845
+-0.030926876493418 0.98654114263611
+-0.030836104240187 1.0065187884884
+-0.0308271465158 1.0409286151552
+-0.030784555210126 1.0613612481147
+-0.030756950444893 1.0281193190024
+-0.030737919997484 1.0556624734539
+-0.030319247089703 0.98283456420165
+-0.030154749131306 1.1028466643153
+-0.030123515771326 0.96361570947946
+-0.030085243133682 1.0557471780551
+-0.029986352829061 0.9216481133114
+-0.029961285924075 0.97672772386225
+-0.029655221934001 1.0191198240922
+-0.029627656357291 1.0534434426966
+-0.029390798487453 1.0496120064727
+-0.029277881943951 1.0917462138384
+-0.029226157419043 1.0502556158883
+-0.029179942387618 0.99746609478346
+-0.029094794936236 0.98936034814183
+-0.028992815367827 0.99646215488088
+-0.028829128185905 1.0591409396992
+-0.028763627846049 1.0657959157304
+-0.028732643635094 1.0160402353908
+-0.028675860377554 1.0714351268656
+-0.028616278330358 0.93637268187864
+-0.028611007302951 1.0479466939761
+-0.028558827055277 0.94729527012539
+-0.028526633246233 1.0181081920496
+-0.028455733116593 0.96040179960882
+-0.028239222028544 1.0524024651679
+-0.028225229783327 0.95857329635328
+-0.028196774260124 0.97152368339716
+-0.028176049704029 1.0438606132484
+-0.028094924821371 1.0219618396017
+-0.027982297165631 1.0196925153987
+-0.027963373228121 0.93239006907207
+-0.027908001268364 0.95989501997361
+-0.027904226802938 1.0599901411192
+-0.027902971489866 1.0225323851314
+-0.027817810113988 1.0178039300563
+-0.027729339972219 1.0215938469675
+-0.027587247032146 1.0388526925617
+-0.027420509510694 1.027444709996
+-0.027326686892709 0.99729950529453
+-0.027151761975042 0.97796274150186
+-0.026964198681329 1.0582435920554
+-0.026961534238201 1.013786502423
+-0.026943989790685 1.0171218311615
+-0.026897827288411 1.0123204255764
+-0.026699163528381 1.0707295987954
+-0.026666016874643 1.1197987160722
+-0.026175903073662 1.0414656164452
+-0.02606954104619 1.0641861618091
+-0.026064787811289 0.99399420914523
+-0.025989351303624 1.0046291028473
+-0.025881108695245 1.1155102586592
+-0.025821458190623 0.99299493233546
+-0.025776322988806 0.97924149959787
+-0.025749614877921 1.0420941094905
+-0.025723824577302 1.0645489242423
+-0.025616403400458 1.0334138291043
+-0.025611256720821 1.044873066123
+-0.02542805969796 1.1061637667179
+-0.025353002382245 1.0408460911938
+-0.025012317864542 1.0132870053696
+-0.024971042350831 1.0012501834299
+-0.02494615461588 1.0136310677523
+-0.02484721790335 1.0104483791678
+-0.024842072257179 1.0791717971082
+-0.024799959799419 0.97905588015105
+-0.02469917305257 1.078595799849
+-0.024691655105333 1.0445358037373
+-0.024511211129257 0.9690821427267
+-0.024441035630287 0.98608441254722
+-0.024336734503218 0.99910436813364
+-0.024217232547993 1.0331004373167
+-0.024160504080583 1.0479713518679
+-0.023992058564942 1.0845538996125
+-0.023904078242015 0.95119734708475
+-0.023872500260985 1.0079264470428
+-0.023840036411108 1.0388498805722
+-0.023500571896346 1.107244376909
+-0.023468993103209 1.0547020424261
+-0.023458039436778 1.0978345894659
+-0.023357758966204 1.011224162916
+-0.023327077604343 1.0355166882032
+-0.023281507090719 0.99015563851809
+-0.023165912544639 1.1909042950649
+-0.023080405390373 0.99247968917808
+-0.023041245458203 0.97325423513304
+-0.022947501241347 0.97070643446144
+-0.02285762659749 1.0134435815438
+-0.022736442177571 1.0926125834659
+-0.022698313077573 1.0400943808553
+-0.022621601297921 1.0837219827349
+-0.022575421549088 1.0877892016167
+-0.022480428960748 1.082021342697
+-0.022470113374153 1.0744811533677
+-0.022448793542287 0.99574200450726
+-0.022429634229642 1.0429787643594
+-0.022264800429178 1.0420076522534
+-0.022198119421939 1.0565421143389
+-0.022020872370803 1.0445218305777
+-0.022014988571173 1.0946771027929
+-0.022010472995742 1.0532659379913
+-0.021858768673729 0.98400369253584
+-0.021517744402227 1.0377554580723
+-0.021479754544625 1.0656582187385
+-0.021471969753387 1.016008563945
+-0.021335290863833 1.0039468070907
+-0.021269222012056 1.1036048500712
+-0.021078251823029 1.0560826136853
+-0.021028567746589 1.0831667773126
+-0.020992458492643 1.0114632004065
+-0.02097156147273 1.0409960760381
+-0.020895525066198 0.96951914785147
+-0.020821361247207 1.0878752035818
+-0.020740777455318 1.0055079656522
+-0.020286214260355 0.93938424571419
+-0.020249694350094 1.0577874058522
+-0.020200164746334 0.97942365808069
+-0.020140470692117 0.99775881186079
+-0.020076235166158 1.0303207105411
+-0.020049113716883 0.98570559619142
+-0.019972919787209 1.0654739647899
+-0.019943726087713 1.0589178048181
+-0.019895132803465 1.089004477507
+-0.019891559802248 1.0668776370411
+-0.019846886319224 1.0693746714883
+-0.019685064485263 1.1267817238331
+-0.019624873871247 1.0547324110226
+-0.019533636048962 1.0059191725559
+-0.01951138944568 1.0734734246049
+-0.019504513996075 1.0101220179608
+-0.019490739606826 1.0176263632377
+-0.019444285941841 1.0391965144761
+-0.019249972932026 0.98993611760071
+-0.019129070077263 1.0881693353508
+-0.01898993868313 1.0688968803526
+-0.018905638679385 1.0679412423907
+-0.018702492962105 1.0501233882577
+-0.018501560889978 1.0676059345912
+-0.018405992727215 1.0472413664276
+-0.018325395016175 1.0122787949302
+-0.018317688936775 1.0083997673664
+-0.018304087535698 1.0485057164289
+-0.01828614773301 1.087487353546
+-0.018285540096277 1.0814739427681
+-0.018214224609835 0.94333202043238
+-0.018154559817979 1.0270749529691
+-0.01814561878803 1.0222765969467
+-0.017902941312253 1.1270651211624
+-0.017831848754685 1.031339210759
+-0.017828007346182 0.98451445441574
+-0.017616383335907 1.0439072219616
+-0.017568738024923 1.0455152735444
+-0.017131060301719 1.0294180804256
+-0.017093789769217 1.0943515364891
+-0.01700404093847 0.9908281048111
+-0.016948884971332 0.99502544108339
+-0.016767318493377 1.0647344323668
+-0.016555515871653 1.0892112205639
+-0.016519950419077 1.030579426374
+-0.016445252604509 0.93969790510429
+-0.016433293076635 1.0222090882479
+-0.016429317259292 1.0563276554644
+-0.016351548080802 1.0599677176217
+-0.015991927596073 1.0235111896822
+-0.015941649565883 1.0528083932133
+-0.015899197871088 1.1080987993046
+-0.015795856790939 1.0259380719395
+-0.015723104283504 0.9698757734418
+-0.015661850851131 1.0470739138012
+-0.015659612349352 1.0405444107015
+-0.015511726898901 0.98561352459836
+-0.015345773837706 1.1150666667824
+-0.015186009824343 0.9881179919344
+-0.015116062819054 1.0752092354351
+-0.015003853128526 1.0408519878637
+-0.014991530490462 1.0932166961955
+-0.014885422537347 1.0575898977831
+-0.014832433600702 1.0387248830034
+-0.014765865691152 1.0925361352101
+-0.014754656553838 1.0797128162079
+-0.014744672316802 1.0585027966645
+-0.014713154890488 1.0214479584987
+-0.014703814561812 1.0683269570235
+-0.014667725827882 1.1297561041458
+-0.014588141994276 1.090946539192
+-0.014536385510596 1.0712152063771
+-0.01452881612991 1.0303022362306
+-0.014253950035515 1.0630659277005
+-0.014239771202504 0.9579455579785
+-0.014124631292041 1.0143155744964
+-0.014099536408654 0.99751897200795
+-0.013832426032884 1.0161921281681
+-0.013829018438855 1.0767419601825
+-0.01381784117179 1.0943085189845
+-0.013813800784385 0.96196855792208
+-0.013608199757127 1.0957209892676
+-0.013509875313584 1.115849898207
+-0.013456801292701 1.0274249743694
+-0.013333908849459 0.96399479612411
+-0.01331234291481 1.0384741102099
+-0.013286711451416 0.96590988401672
+-0.013156626916914 0.98064656762192
+-0.01312190133565 1.0349375873949
+-0.013110190854452 1.046330212899
+-0.012980128660658 1.0531953281973
+-0.012956842891863 1.0106124685447
+-0.01265311426895 1.0314187592677
+-0.012639845990399 1.0111781871833
+-0.012566447552532 0.99115237230928
+-0.012373518762612 1.1488371555439
+-0.012371527745937 1.0714177555465
+-0.012357067236548 1.0392791200821
+-0.012318901694837 1.1073145497806
+-0.01217865007551 1.0056788707291
+-0.012155520714426 1.0509819708566
+-0.012129910968964 1.0265947914867
+-0.012005275692402 0.95834382320314
+-0.011903090214018 1.0160394503311
+-0.011814707111192 1.057604363954
+-0.011790985156118 1.0641759873781
+-0.011686554881699 0.99819772594782
+-0.011493579213538 1.0262958889857
+-0.011370820538203 1.044035280035
+-0.011242204402233 1.0766228690285
+-0.011218446016061 1.0639402085791
+-0.01110648140288 1.0563540905883
+-0.011092330787796 1.0391726568588
+-0.011087852820724 1.0739981817649
+-0.011077163849822 1.0489811962836
+-0.011011352452223 0.96763248407142
+-0.010983358033756 0.97146214126719
+-0.010981290888139 1.1041542084088
+-0.01090095940919 1.0673063214533
+-0.010891322382403 1.0115387471371
+-0.010875475699644 1.0262346320891
+-0.010815630074249 0.93213627548027
+-0.010799782252764 1.0196765731689
+-0.010768499821857 1.0297883436824
+-0.010614803501515 1.0746269801158
+-0.010410331464148 1.0819533091822
+-0.010406951239304 1.1162286685203
+-0.010398742728657 1.1643155529631
+-0.010376771759831 1.0146002972255
+-0.010296339535622 1.0457408560236
+-0.010222101206468 1.0671672781118
+-0.010193934524845 1.0478421441015
+-0.010138581870678 0.99227422131023
+-0.010074503819108 0.98548204944306
+-0.010046785054442 1.050345630583
+-0.0099264051199837 0.97297171617083
+-0.0099257485932059 0.99898992847203
+-0.0098873330275924 1.0972485559836
+-0.0098699915015653 1.0310266384902
+-0.0098473667986594 1.0024778779535
+-0.0097721974104093 1.039287948282
+-0.0097389117468614 1.0506901205838
+-0.0097201751761045 1.0561668141272
+-0.0096737431259643 1.0200235852877
+-0.0095861931183453 1.0766824671169
+-0.0095704439689168 0.94936692615187
+-0.0095485281643864 1.057348113644
+-0.0094082950296643 0.99214610174631
+-0.0092373850878761 1.1169307378834
+-0.0091224935571287 0.98426344732374
+-0.0089356045399436 1.0726341717536
+-0.0088929489148988 1.059037877435
+-0.0088361728515265 1.0028924281892
+-0.0087091615406166 0.97185122989086
+-0.0086249474747783 1.0183320460001
+-0.0084682668582967 1.1022496830023
+-0.0082851478526139 0.97646403414159
+-0.0082717356740807 1.0788850935997
+-0.0082078850822809 0.96451426016616
+-0.0081780748337668 1.0044734942857
+-0.0081644174694454 1.0290860906654
+-0.0080628561682311 1.0946860020805
+-0.0080069256517424 1.05806204386
+-0.0079524062455289 1.0065219904392
+-0.0078903661545845 1.1142406824517
+-0.0078498731630513 0.98257374014865
+-0.0078241166690318 1.0435866211196
+-0.0078191008790506 0.93326991776186
+-0.0077886091750153 1.0285830721897
+-0.007775050085234 1.0426863933898
+-0.00750434322521 1.1313508036399
+-0.0074711848612585 1.02102330584
+-0.0073835919474609 1.0495624747308
+-0.0073681354978184 1.0201779400839
+-0.0073043059981654 0.95520223021632
+-0.0071889645128466 1.0793509530163
+-0.0071577815873259 1.052432513244
+-0.0070709494570471 0.9925025257592
+-0.0069688472562636 1.0713870600419
+-0.0069237317164994 1.0350110723476
+-0.0067967347132065 0.94567320197514
+-0.0067057127626171 1.0014748697885
+-0.0066850674226183 0.98595327449843
+-0.0066452614965119 1.0857405482159
+-0.0064168530237541 1.0534362183969
+-0.0064090681645056 1.0762051855546
+-0.0063046140506103 1.1202255055691
+-0.0061508232029456 1.0300581715341
+-0.0060944042062684 1.0102292007362
+-0.0060451599601562 0.97976504260899
+-0.0059153916623788 1.0711241401272
+-0.0058639793464203 1.1209517126917
+-0.0058217420037355 0.98592450423756
+-0.0057145148835638 1.0340528251593
+-0.0056852199838286 1.0744180103287
+-0.0056525522445517 1.0282525471713
+-0.0056317424875835 0.99064977042715
+-0.0056105205111734 1.1238299572429
+-0.0055820204751279 1.0581259456258
+-0.0054280912060044 1.0247384407456
+-0.0053579563246089 1.013976200843
+-0.0052920568479323 1.0532955285987
+-0.0052849174370562 0.96078863835982
+-0.0052533761496337 0.88857229923671
+-0.0052303106925438 1.0363757733618
+-0.0049806227065927 0.93667437960193
+-0.0048832145003547 1.0011240198444
+-0.0047883831326679 1.012593781389
+-0.0045787823943252 1.057270768533
+-0.004466835199046 0.99778384310878
+-0.0044097019019308 1.1191241565445
+-0.0043689459076338 1.0349854071092
+-0.0043424962313935 1.0790253703125
+-0.0042635125884715 1.0118439638151
+-0.0042395769986498 1.0385855505085
+-0.0042157992905755 0.98170453448743
+-0.0041821538663204 1.0595481444248
+-0.0041362154300401 1.1238575666757
+-0.0040744849875401 1.0386412674562
+-0.0038090883406067 1.0511197691943
+-0.0035923126766385 0.98170369006154
+-0.0035614762659156 0.99931037525572
+-0.0035074032780281 1.0475765345515
+-0.0032753000144221 1.082586458141
+-0.0032380057035071 1.0296205857283
+-0.0031926934497024 1.00790025065
+-0.0031383654744926 1.0002304250289
+-0.0029507628796659 0.99467813549386
+-0.0028889661862562 0.99276456961012
+-0.0026747070378167 1.0627680795095
+-0.0025162504797088 0.97123659009997
+-0.0024304402574365 1.1043149592931
+-0.0023904960118018 0.99740671729705
+-0.0023881800089163 1.0711808125772
+-0.0022951509650249 0.98553400603296
+-0.0021788156430745 1.0383562382912
+-0.0020525702350462 1.0717585365745
+-0.002047076172739 1.0389159024345
+-0.0019562225209257 0.99490519916154
+-0.0019042069834845 1.0194033005587
+-0.0018957320320217 0.96350814135143
+-0.0018116562840351 1.0574971152117
+-0.0018060342846091 1.0965105323537
+-0.001746263626117 1.0869696660631
+-0.0017377498407054 0.98953917420793
+-0.0017362222616324 1.0253477565289
+-0.0016629166751756 0.94406002200871
+-0.0014289613145661 1.0176115523118
+-0.0013854875432539 1.015169401849
+-0.0012677467841233 1.078394941997
+-0.0012003688519988 1.0033243629245
+-0.0011566311340297 1.0644533610343
+-0.00095046688964302 1.0758074673653
+-0.00093675858148806 1.0063914565684
+-0.00090087111986436 0.94536397941222
+-0.00084079252075425 1.0461316775305
+-0.00083785302849904 1.0021714687568
+-0.00073377439081922 1.0059956542942
+-0.00070495588237295 1.0415826322842
+-0.00066937304054503 1.0583551696373
+-0.00060276487554776 1.0231157541549
+-0.00045314727213326 0.94037365834064
+-0.00039745953061847 1.0418768679298
+-0.00011660907525311 1.0620112702783
+0.00018311428673569 0.98851029786775
+0.00024779057443452 1.0942645300679
+0.00028810071501718 1.1005413477303
+0.00034998699450025 1.0750252648187
+0.00047019894469747 1.0746642849943
+0.00054953290700935 1.0278540499113
+0.00060129232678208 1.0563619917345
+0.00091335236195988 0.9687510976194
+0.0010224789541182 1.0059486571804
+0.0010473872832747 0.95535714568598
+0.0011557727648575 1.0792920029787
+0.0012313312544328 1.0089346138904
+0.001312366207591 1.024183718647
+0.0014169636813817 0.97370803359461
+0.0014802837865984 1.0149089351699
+0.0014975762961888 1.1388782405966
+0.0016860823470861 0.98006826132258
+0.0017652734145633 1.0266688014804
+0.0017847888414505 0.98315514731407
+0.0018391434504692 1.0082980197485
+0.0018396844961609 1.0629313697182
+0.0018487920026714 1.0017643638412
+0.0019482552687359 1.0369528052974
+0.0019533637882282 0.96411567435939
+0.0019697932252128 0.98624811532771
+0.0019910202581849 0.96541949824179
+0.002058879736643 0.99314870814323
+0.0021273531012959 0.97008620184943
+0.0023589098395924 0.96058061001677
+0.0024433584800133 0.94692329496847
+0.0024857000376957 1.0320996730536
+0.0025257193286905 0.96071100591565
+0.00268261213568 1.0432871635793
+0.0027349840206156 1.0161920874645
+0.0027562940003772 1.0194863805811
+0.002757062124756 0.93462692012799
+0.0028647892762327 0.99863768036708
+0.0032996076569657 1.0104360335827
+0.0033733123956299 1.0247349912448
+0.0034025881687281 1.1195776395069
+0.0034310069750437 0.98756110864657
+0.0035038143330702 1.0115744836911
+0.0035167237984125 1.0107595505206
+0.0037377566174736 1.0699612017026
+0.0037479124614576 1.2051321658154
+0.0037841000206192 1.0483120380928
+0.0038016607330054 0.99800066553044
+0.0038269117877865 1.0423792753584
+0.0038415775032313 1.0783698956652
+0.0038923013144148 1.0353642160838
+0.0039472893642878 1.122397024217
+0.0039571400362133 1.0789574403485
+0.0039947855749546 0.99638888071293
+0.0040042039828814 1.039549849762
+0.0041827094738259 0.92514820571746
+0.0042045656329673 1.111279473025
+0.0042833007039737 1.0558188491492
+0.0043396629882698 1.1000523323678
+0.0043586427947124 0.97023975383831
+0.0046665123834924 1.0266904710397
+0.0046831752515069 1.0748852480603
+0.0047034378436156 1.0287048896857
+0.004728883124768 1.0010705518649
+0.0049373866820471 1.1107838603591
+0.0050674858966902 1.0230906922465
+0.0051126595886928 0.99663030506705
+0.0051141441824814 0.98727015710409
+0.0051883086130636 1.0471899132272
+0.005248828044845 1.1021426084804
+0.005321819318526 1.0024771355733
+0.0056008598593482 1.0306678751828
+0.0058297241022598 1.0017999813403
+0.0059385173252028 0.95446344445318
+0.0061865717378422 1.1182052452802
+0.0062868421265992 1.0418703665767
+0.0063439852656993 1.1079894814115
+0.0064370007725862 1.0181464965338
+0.0067700112827337 1.0284362664964
+0.0072147040026715 1.0075422560958
+0.0072147345866971 1.005141651513
+0.0072552657880536 1.0159068483686
+0.0073955101300139 1.0270836362974
+0.0075601807485764 0.87796486602543
+0.0075846208906619 1.005664672277
+0.0076540426868624 1.0691656726885
+0.0076545709767507 1.0393063126379
+0.0078243392392545 0.9706482030548
+0.0078684015859047 1.0113845386783
+0.0080229991203446 1.0321295807817
+0.0080912048769735 0.92326767300771
+0.0081093274297777 0.91804605744968
+0.0081914564047563 1.0884831568852
+0.0082420799669376 1.0611684772575
+0.0085988620241584 0.97934102833802
+0.0086042700583964 1.0681337569531
+0.0086317565247211 1.0965815077
+0.0086877100883446 1.0613966657742
+0.0090325936723239 1.0642290359794
+0.0091937970742802 0.98847767914243
+0.0093124846369065 1.0309899099924
+0.0093610787196217 0.99150901122198
+0.0095182046125509 0.96156450369581
+0.0098565007172308 1.0231093119236
+0.010085699347547 0.92493012213765
+0.010134284614919 1.0625884470087
+0.010134759761007 1.0114312003025
+0.010137460301897 1.0582028884459
+0.010161484027346 1.0529583645258
+0.010180421225783 1.0124220397017
+0.010272128926572 0.94258736702648
+0.010337444607625 1.0511557043993
+0.010502606827105 0.95620171852664
+0.010602603181501 1.071339744457
+0.010708326531136 1.0990813397727
+0.010770611926688 1.0663070021607
+0.010857444908193 1.0821580894742
+0.01087252409477 1.0102685301875
+0.010879298486783 1.0486842408767
+0.010925016873378 1.0426501691464
+0.011049215681401 0.98405746050785
+0.011141698683219 1.0395943748499
+0.011297037003578 0.99148509160355
+0.01143384317409 1.0408993844554
+0.011504563095799 1.0111969525834
+0.011836532225832 1.0222814371318
+0.011888728932758 1.0498836586742
+0.012029900281952 1.0576116844045
+0.012203513188507 1.0573256242583
+0.012500784622885 0.97516747914589
+0.012777008242192 1.0374631218444
+0.01282075892159 1.0696583889507
+0.012909830803139 0.99729308445196
+0.012941454427996 1.0298626613511
+0.013017273205807 1.0577004792451
+0.01308403868513 0.9539579327229
+0.013102415958702 1.0365102456167
+0.013113346967619 1.0196376398175
+0.01346501865041 1.0354695151069
+0.01350386495236 1.0166011019852
+0.013533992230859 1.1129854139547
+0.013674828477071 0.93834808296201
+0.01406135034296 1.0572362437224
+0.014081813345285 0.97633654963902
+0.014147449341317 1.0105827936211
+0.014150960511119 1.0115171656703
+0.014225558917807 0.99849352864909
+0.014260389091348 1.1683491600407
+0.014418800187395 0.92434205926985
+0.014419750123603 1.14027049672
+0.014507699204776 0.95552993791494
+0.014908668414493 1.1147456854191
+0.015093881115487 0.9631439791273
+0.015098573428855 1.0258490783406
+0.015292770173054 1.071229447711
+0.015368671758418 1.0331479812098
+0.015553589898961 1.0039797046279
+0.0155609732264 1.0800965341895
+0.015725879419026 1.0289355118472
+0.015871912902265 1.0284138375106
+0.015905492877941 1.0348149349955
+0.015941908237059 1.0660404934481
+0.015945634590042 1.0120341881501
+0.016141751978679 1.1052414288306
+0.016160190752488 1.0357755261293
+0.016359980791383 1.0744700333012
+0.01642866847927 0.96288284081881
+0.016583253184364 0.98953340117282
+0.016696550040182 0.94110620852999
+0.016922124800065 1.0424262603562
+0.017030569506559 1.0698041371875
+0.017051705998802 1.0553259182931
+0.017282128754192 1.0039684110328
+0.017417378082143 0.96028178750007
+0.017887710723729 0.9827018245746
+0.017898994443654 1.0241805693287
+0.018037171432874 0.96287628894744
+0.01851032185427 0.98790633991486
+0.018709174810016 1.0281802686356
+0.018727901667061 1.0547319346744
+0.018829528944943 1.0351067313865
+0.018895681257876 1.0179168776503
+0.018903032989451 0.96474723853857
+0.019205572883374 1.0859543613351
+0.019494166670844 0.97232321977605
+0.019507581096314 0.9726625420087
+0.019668554473331 0.94998090567495
+0.0197131700718 1.0008010240421
+0.0198692615434 0.94511834655175
+0.020050016682543 0.95784011264144
+0.02011340231706 0.99705083311697
+0.020211133211749 1.0466655319694
+0.020234294953036 0.98405182863708
+0.02049439219505 1.0172191182221
+0.020637161065652 1.0680309258268
+0.02085387308435 1.0059013670464
+0.020899223469087 0.97040527574945
+0.0210265489618 1.045818331305
+0.021049316550854 1.0149917764653
+0.021116819847902 0.98331521268201
+0.021122651459881 1.0244443094554
+0.021225060154508 1.0276882489486
+0.021257854198092 0.99964709472859
+0.021283631314431 1.0626630294589
+0.021447572973755 1.0782930896598
+0.021922789055741 0.94808935879213
+0.02202858224506 1.0169195998982
+0.022042386758173 1.000558091231
+0.022062427382497 1.002042767849
+0.022263076685167 0.99700105804475
+0.022293994450485 1.1022334608761
+0.022715223628719 1.031899585785
+0.022765974712226 0.96113065010116
+0.022831326921834 1.0048582131613
+0.023074580060181 0.97569985391017
+0.023140941764479 1.006513879428
+0.023143118320972 0.97834394016194
+0.023245132176524 1.0783041675985
+0.023628113265696 1.0141626749386
+0.023981834796485 1.0864858999385
+0.024350126074633 1.0252079874348
+0.024352273480329 1.045486363435
+0.024450523828204 1.0173125290406
+0.024564961162555 0.98442735848749
+0.024608471557522 0.98079815516155
+0.024809058983448 1.054916331769
+0.025228813636827 1.0296586700395
+0.025282524456184 0.95378643514728
+0.02552158011949 1.0189139140356
+0.025669875815051 1.0366452153996
+0.026077530357781 1.0471609732866
+0.026499599299338 1.0104981310846
+0.026615022645137 0.99078384736132
+0.02662590877257 1.0493198105823
+0.026679676368358 0.98824780333697
+0.026751067105868 1.049599368277
+0.026837799845485 1.1178317769583
+0.026953805385285 0.99963462189295
+0.027158453827208 0.97795734721765
+0.027170052679867 0.98624487339856
+0.027358383118237 0.95541900052572
+0.0273738494741 1.0547753185296
+0.027500794822952 1.0805012499818
+0.027659557564461 1.0541612816688
+0.027705556409851 1.1488643105053
+0.028020251328698 1.0045256260893
+0.028036660904329 1.0003127201671
+0.028098786734137 1.0394086475942
+0.028317222818538 1.0112156469072
+0.028421510252491 1.0156392196981
+0.028645207779681 0.94230931753062
+0.028683751912147 1.0877582415913
+0.028768623223295 0.98929788380211
+0.028857484304221 1.0453571070496
+0.02904322563878 1.0848286308982
+0.02919561621358 1.0864857273189
+0.029225190250773 0.98628692890288
+0.029646362469737 1.0261478948922
+0.02964677437912 0.99702761707941
+0.029662871403009 1.005491099253
+0.029926564328208 1.0702366708537
+0.030178929465324 1.0972329952387
+0.030237394599483 1.0535186461771
+0.030313352019638 1.1075158205476
+0.0303157637218 1.0704371460914
+0.030628565197279 1.0151034667186
+0.030644479617132 0.91731772274914
+0.030779774604582 0.97911233384225
+0.030941990399659 0.88752691548246
+0.030953777500026 1.0095430185526
+0.031320107993001 0.96635576560823
+0.031655665330205 1.0331403752718
+0.031673133832858 1.0238293100553
+0.031699042969189 0.97984375833737
+0.03222015525919 1.1151591622605
+0.032433085915793 0.99899500341757
+0.033062888927242 1.0853229848012
+0.033078895638448 1.0303950854167
+0.033327681795111 1.0772972758706
+0.033408983975653 0.98459060501458
+0.033816402421665 1.0154321946522
+0.033929295924365 0.92048653480942
+0.034187104537838 1.0540048652167
+0.034222616178629 0.99811019486802
+0.034346536816875 1.0392815103869
+0.034490123575669 0.9809824508012
+0.034833428296485 1.1031183426062
+0.034869843908933 1.0487851508055
+0.034895395573931 1.078997631104
+0.035259119801695 1.0344023204696
+0.035639885510115 1.0321459192509
+0.035799209278114 1.0839682491541
+0.035958509825295 0.97260296777951
+0.036026300364388 0.9677733039372
+0.036098862748665 1.0803292938465
+0.036375017274307 1.0273313529625
+0.036504598500912 0.96733566064317
+0.03660120981688 1.0601436093779
+0.037603804479863 0.95464202095512
+0.03809112783811 1.0584812880739
+0.038099285601581 1.0395384679374
+0.038189595662354 1.0453903265099
+0.038273268255126 1.0314165000675
+0.038624834679437 1.0204996139523
+0.039168588940156 1.120319555628
+0.039377230759286 0.94766505811834
+0.039591485776566 0.92573388461208
+0.03961808314401 1.0069537422831
+0.039650607737064 1.0636927887308
+0.04003685104011 1.0773335978314
+0.040808651114823 1.0151102990024
+0.041286747134842 1.0851270233913
+0.041548104285585 1.0431682864162
+0.041719825548821 1.0640628297714
+0.041771871050351 1.0134336016919
+0.042193337632687 1.1111498086743
+0.04235047007377 1.0206050563846
+0.042583510690642 1.0667042927321
+0.042772984222355 0.96722499598334
+0.043654621860094 0.95228489540099
+0.044084277978237 1.0909671316556
+0.044463522313928 1.1251823790052
+0.045010522457284 1.0642421667496
+0.045145021425994 0.98488270328995
+0.045560912095109 1.0250297861358
+0.045739209849681 1.0590818576862
+0.045944538592886 1.0285044457061
+0.046592584635802 1.0289484254842
+0.047197709914132 0.99366026588084
+0.047499104665422 1.0377384412091
+0.047525364050753 1.0150969099136
+0.047595345778739 1.0064073729005
+0.048673989489001 0.98711110343051
+0.048831633483705 1.0882450127709
+0.050118652809664 1.0411967871505
+0.050245397163205 1.0106868150147
+0.050436671856146 1.0756116791925
+0.050740072052791 1.0578058969475
+0.050894580790338 0.96810549488535
+0.050988395564919 1.0393614727887
+0.052020069999987 1.0255869041742
+0.052156679731714 0.9925531719253
+0.052165558064237 0.9634536696998
+0.052952612989063 1.052403732257
+0.053234817319711 1.0200011600463
+0.053358337923465 0.95094917947528
+0.053460732745464 1.068520657942
+0.053776899327352 1.0407893642295
+0.054274825328357 1.0335844770488
+0.054446738292654 1.0461657193955
+0.05626028675661 1.0180579100677
+0.056297467244842 0.99402044208965
+0.057659427902007 1.0420357079997
+0.057929593934987 1.0829911299245
+0.06157444016881 1.050187076556
+0.062774743966219 1.0627873235938
+0.06284628250561 1.0027190889251
+0.064440280365611 0.96611386734755
+0.064858039658033 1.005024785914
+0.064907410804515 0.9289389649871
+0.067983347144436 0.97273210974652
+0.069250785223519 0.9979882152955
+0.071494845745689 1.0140234214242
+0.073417721323025 0.9859479082183
+0.073715601110968 1.0629187379046
+0.07823653059819 1.0314634264846
+0.084318640058829 1.0067173360376
diff --git a/packages/basics/stats/test/test_bootstrap.lua b/packages/basics/stats/test/test_bootstrap.lua
index be9453120..d3c73c940 100644
--- a/packages/basics/stats/test/test_bootstrap.lua
+++ b/packages/basics/stats/test/test_bootstrap.lua
@@ -2,16 +2,16 @@ local check = utest.check
 local T = utest.test
 local base_dir = string.get_path(arg[0])
 local rnd = random(567)
-local errors = iterator(range(1,1000)):map(function()return rnd:randNorm(0.0,1.0)end):table()
+local errors = matrix(iterator(range(1,1000)):map(function()return rnd:randNorm(0.0,1.0)end):table())
 
 T("BootstrapTest",
   function()
     local boot_result = stats.boot{
-      data=errors, R=1000, seed=1234,
-      statistic = function(it)
-        local mv = stats.mean_var()
-        for k,v in it do mv:add(v) end
-        return { mv:compute() }
+      size=errors:size(), R=1000, seed=1234,
+      statistic = function(sample)
+        local s = errors:index(1, sample)
+        local var,mean = stats.var(s)
+        return { mean,var }
       end
     }
     table.sort(boot_result, function(a,b) return a[1]<b[1] end)
@@ -19,9 +19,12 @@ T("BootstrapTest",
       map(string.tokenize):
       enumerate():
       apply(function(i,t)
-          check.lt(math.abs(tonumber(t[1]) - boot_result[i][1]), 1e-03)
-          check.lt(math.abs(tonumber(t[2]) - boot_result[i][2]), 1e-03)
+          check.number_eq(tonumber(t[1]), boot_result[i][1])
+          check.number_eq(tonumber(t[2]), boot_result[i][2])
       end)
     local a,b = stats.boot.ci(boot_result, 0.95)
     local m = stats.boot.percentil(boot_result, 0.5)
+    check.number_eq(a, -0.071339398099482)
+    check.number_eq(b,  0.052156679731714)
+    check.number_eq(m, -0.010296339535622)
 end)
diff --git a/packages/basics/stats/test/test_covariance.lua b/packages/basics/stats/test/test_covariance.lua
new file mode 100644
index 000000000..6b33091d8
--- /dev/null
+++ b/packages/basics/stats/test/test_covariance.lua
@@ -0,0 +1,15 @@
+local check = utest.check
+local T = utest.test
+T("CovarianceCorrelationTest", function()
+    local m = matrix(3,3,{1,6,9,
+			  4,5,5,
+			  7,4,1})
+    check.eq(stats.cov(m),
+	     matrix(3,3,{9,-3,-12,
+			   -3,1,4,
+			   -12,4,16}))
+    check.eq(stats.cor(m),
+	     matrix(3,3,{1,-1,-1,
+			 -1,1,1,
+			   -1,1,1}))
+end)
diff --git a/packages/basics/stats/test/test_distributions.lua b/packages/basics/stats/test/test_distributions.lua
index 7db489709..643ad56fa 100644
--- a/packages/basics/stats/test/test_distributions.lua
+++ b/packages/basics/stats/test/test_distributions.lua
@@ -1,6 +1,6 @@
 local check = utest.check
 local T = utest.test
-local M = matrix.col_major
+local M = matrix
 local EPSILON = 0.001
 local N = 1000
 
@@ -39,7 +39,7 @@ T("NormalDistTest", function()
                                  M(3,3):zeros():diag(2):set(1,2,1):set(2,1,1) )
     check.eq(type(d), "stats.dist.normal.general")
     
-    local pdf_result = M(2, { 0.0175621, 0.00572678 })
+    local pdf_result = M(2, { 0.0151933, 0.00832571 })
     
     check.eq( d:logpdf( M(2,3):uniformf(-1,2,random(9427)) ):exp(), pdf_result )
     
@@ -52,7 +52,7 @@ T("NormalDistTest", function()
         -- check(function()
         --     return data:sum(1):scal(1/N):equals( M(1,3):fill(a) )
         -- end, "Multivariate population mean test")
-        local mv = stats.mean_var()
+        local mv = stats.running.mean_var()
         data:map(function(x) mv:add(x) end)
         local mu,sigma = mv:compute()
         check.number_eq(mu, a, ( math.abs(a) < 1.0 ) and 0.4 or nil,
@@ -77,7 +77,7 @@ T("DiagNormalDistTest", function()
         -- check(function()
         --     return data:sum(1):scal(1/N):equals( M(1,3):fill(a) )
         -- end, "Multivariate population mean test")
-        local mv = stats.mean_var()
+        local mv = stats.running.mean_var()
         data:map(function(x) mv:add(x) end)
         local mu,sigma = mv:compute()
         check.number_eq(mu, a, ( math.abs(a) < 1.0 ) and 0.4 or nil,
@@ -98,7 +98,7 @@ T("StdNormalDist", function()
     check(function()
         return math.abs(data:sum()/N) < 0.1
     end)
-    local mv = stats.mean_var()
+    local mv = stats.running.mean_var()
     data:map(function(x) mv:add(x) end)
     local mu,sigma = mv:compute()
     check(function() return math.abs(mu) < 0.04 end)
@@ -201,7 +201,7 @@ T("LogNormalDistTest", function()
         check(function()
             return (data:sum(1):scal(1/N):log() - M(1,3):fill(a + b/2)):abs():sum()/3 < 0.1
         end)
-        local mv = stats.mean_var()
+        local mv = stats.running.mean_var()
         data:map(function(x) mv:add(x) end)
         local mu,sigma = mv:compute()
         check.number_eq(math.log(mu), a + b/2, 0.1)
@@ -223,7 +223,7 @@ T("DiagLogNormalDistTest", function()
         check(function()
             return (data:sum(1):scal(1/N):log() - M(1,3):fill(a + b/2)):abs():sum()/3 < 0.1
         end)
-        local mv = stats.mean_var()
+        local mv = stats.running.mean_var()
         data:map(function(x) mv:add(x) end)
         local mu,sigma = mv:compute()
         check.number_eq(mu, math.exp(a + b/2), 0.1)
diff --git a/packages/basics/stats/test/test_means.lua b/packages/basics/stats/test/test_means.lua
new file mode 100644
index 000000000..e9b2b7ac6
--- /dev/null
+++ b/packages/basics/stats/test/test_means.lua
@@ -0,0 +1,23 @@
+local check = utest.check
+local T = utest.test
+
+T("MeansTest", function()
+    local m = matrix(3,4):linear()
+    check.number_eq(stats.amean(m), m:sum()/m:size())
+    check.TRUE(stats.gmean(m) == 0)
+    check.TRUE(stats.hmean(m) == 0)
+    
+    check.eq(stats.amean(m,1),
+             matrix(1,4,{(0+4+8)/3, (1+5+9)/3, (2+6+10)/3, (3+7+11)/3}))
+    check.eq(stats.gmean(m,1),
+             matrix(1,4,{(0*4*8)^(1/3), (1*5*9)^(1/3), (2*6*10)^(1/3), (3*7*11)^(1/3)}))
+    check.eq(stats.hmean(m,1),
+             matrix(1,4,{0, 3/(1/1+1/5+1/9), 3/(1/2+1/6+1/10), 3/(1/3+1/7+1/11)}))
+    
+    local m = matrix(3,4):linear(1)
+    check.number_eq(stats.amean(m), m:sum()/m:size())
+    check.number_eq(stats.gmean(m),
+                    iterator(range(1,12)):reduce(math.mul(),1)^(1/m:size()))
+    check.number_eq(stats.hmean(m),
+                    m:size() / iterator(range(1,12)):map(function(x) return 1/x end):reduce(math.add(),0))             
+end)
diff --git a/packages/basics/tokens/binding/bind_tokens.lua.cc b/packages/basics/tokens/binding/bind_tokens.lua.cc
index 90b6206a2..c954a5bcc 100644
--- a/packages/basics/tokens/binding/bind_tokens.lua.cc
+++ b/packages/basics/tokens/binding/bind_tokens.lua.cc
@@ -18,6 +18,22 @@
  * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  *
  */
+//BIND_HEADER_H
+#include "token_base.h"
+#include "token_memory_block.h"
+#include "token_matrix.h"
+#include "token_null.h"
+#include "token_sparse_matrix.h"
+#include "token_vector.h"
+#include "smart_ptr.h"
+
+using namespace Basics;
+
+bool lua_isAuxToken(lua_State *L, int n);
+AprilUtils::SharedPtr<Token> lua_toAuxToken(lua_State *L, int n);
+void lua_pushAuxToken(lua_State *L, AprilUtils::SharedPtr<Token> &value);
+//BIND_END
+
 //BIND_HEADER_C
 #include "bind_matrix.h"
 #include "bind_sparse_matrix.h"
@@ -46,10 +62,7 @@ bool lua_isAuxToken(lua_State *L, int n) {
   return lua_isSparseMatrixFloat(L,n) || lua_isMatrixFloat(L,n) || lua_isToken(L,n);
 }
 
-// Be careful, this function returns an object which needs to call IncRef and
-// DecRef ALWAYS, even if the receives is not getting the property. Otherwise, a
-// memory leak will exists.
-Token *lua_toAuxToken(lua_State *L, int n) {
+AprilUtils::SharedPtr<Token> lua_toAuxToken(lua_State *L, int n) {
   if (lua_isMatrixFloat(L, n)) {
     MatrixFloat *mat = lua_toMatrixFloat(L,n);
     return new TokenMatrixFloat(mat);
@@ -60,20 +73,20 @@ Token *lua_toAuxToken(lua_State *L, int n) {
   }
   return lua_toToken(L,n);
 }
-//BIND_END
 
-//BIND_HEADER_H
-#include "token_base.h"
-#include "token_memory_block.h"
-#include "token_matrix.h"
-#include "token_null.h"
-#include "token_sparse_matrix.h"
-#include "token_vector.h"
-
-using namespace Basics;
+void lua_pushAuxToken(lua_State *L, AprilUtils::SharedPtr<Token> &value) {
+  switch(value->getTokenCode()) {
+  case Basics::table_of_token_codes::token_matrix:
+    lua_pushMatrixFloat(L, ((TokenMatrixFloat*)value.get())->getMatrix());
+    break;
+  case Basics::table_of_token_codes::token_sparse_matrix:
+    lua_pushSparseMatrixFloat(L, ((TokenSparseMatrixFloat*)value.get())->getMatrix());
+    break;
+  default:
+    lua_pushToken(L, value.get());
+  }
+}
 
-bool lua_isAuxToken(lua_State *L, int n);
-Token *lua_toAuxToken(lua_State *L, int n);
 //BIND_END
 
 //BIND_LUACLASSNAME Token tokens.base
diff --git a/packages/basics/utest/lua_src/utest.lua b/packages/basics/utest/lua_src/utest.lua
index 6b2c0909b..2e9b5e1ab 100644
--- a/packages/basics/utest/lua_src/utest.lua
+++ b/packages/basics/utest/lua_src/utest.lua
@@ -97,7 +97,6 @@ local check = function (func,error_msg)
               write(1, "%s\n",
                     iterator(ipairs(ret)):select(2):map(tostring):concat(" "))
             end)
-      write(1, "%s\n", debug.traceback())
     end
     write(1, "Test %s %d: %sfail%s", test_name, testn,
           ansi.fg.bright_red, ansi.fg.default)
@@ -109,7 +108,8 @@ local check = function (func,error_msg)
       end
       error_msg = ", msg: %s"%{error_msg}
     end
-    write(1, "%s\n", error_msg or "")
+    write(1, "%s, it follows the traceback\n", error_msg or "")
+    write(1, "%s\n", debug.traceback())
     failed = failed + 1
     if not failed_list[test_name] then
       table.insert(names_order, test_name)
@@ -149,17 +149,25 @@ utest.check.success = check
 utest.check.fail = function(f, ...)
   return check(function() return not f() end, ...)
 end
+utest.check.errored = function(f, ...) -- the check passes when calling f() raises an error
+  local silenced = util.silent_errors(); util.silent_errors(true) -- remember the caller's setting, then mute error output
+  local ok = check(function() local ok=pcall(f) return not ok end, ...)
+  util.silent_errors(silenced) -- restore the previous setting instead of forcing it to false
+  return ok
+end
 utest.check.TRUE = function(a, ...)
   return check(function() return a end, ...)
 end
 utest.check.FALSE = function(a, ...)
   return check(function() return not a end, ...)
 end
---_
+--
+local selected_tests
 utest.test = function(name, test_func)
   assert( test_name == NONAMED )
   assert( type(name) == "string", "Needs a string as first argument" )
   assert( type(test_func) == "function", "Needs a function as second argument")
+  if selected_tests and not selected_tests[name] then return end
   test_name = name
   local ok,msg = xpcall(test_func,debug.traceback)
   if not ok then 
@@ -176,4 +184,10 @@ utest.test = function(name, test_func)
   test_name = NONAMED
 end
 --
+utest.select_tests = function(arg)
+  if #arg > 0 then selected_tests = table.invert(arg)
+  else selected_tests = nil
+  end
+end
+--
 setmetatable(utest.check,{ __call = function(self,...) return check(...) end })
diff --git a/packages/basics/util/binding/bind_util.lua.cc b/packages/basics/util/binding/bind_util.lua.cc
index 9d67c5ae9..5d3ae3424 100644
--- a/packages/basics/util/binding/bind_util.lua.cc
+++ b/packages/basics/util/binding/bind_util.lua.cc
@@ -18,8 +18,33 @@
  * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  *
  */
-//BIND_HEADER_C
+//BIND_HEADER_H
+#include <cmath>
+#include <ctime>
+#include <cstdlib>
+
+#include "mfset.h"
+#include "mmapped_data.h"
+#include "linear_least_squares.h"
+#include "lua_table.h"
+#include "popen2.h"
+#include "signal_handler.h"
+#include "trie_vector.h"
+#include "trie_hash_4_lua.h"
+#include "stopwatch.h"
+#include "words_table.h"
+
+using namespace AprilUtils;
+
+extern const char *__COMMIT_NUMBER__;
 
+int lua_isLuaTable(lua_State *L, int idx);
+AprilUtils::LuaTable lua_toLuaTable(lua_State *L, int idx);
+void lua_pushLuaTable(lua_State *L, AprilUtils::LuaTable &tbl);
+
+//BIND_END
+
+//BIND_HEADER_C
 #include <cmath>
 #include <cstring>
 #include <csignal>
@@ -36,10 +61,51 @@ extern "C" {
 #endif
 #include "binarizer.h"
 #include "error_print.h"
-#include "generic_options.h"
 #include "omp_utils.h"
 #include "smart_ptr.h"
 
+int lua_isLuaTable(lua_State *L, int idx) {
+  return lua_istable(L, idx);
+}
+
+AprilUtils::LuaTable lua_toLuaTable(lua_State *L, int idx) {
+  return AprilUtils::LuaTable(L, idx);
+}
+
+void lua_pushLuaTable(lua_State *L, AprilUtils::LuaTable &tbl) {
+  tbl.pushTable(L);
+}
+
+namespace AprilUtils {
+
+  template<> LuaTable LuaTable::convertTo<LuaTable>(lua_State *L, int idx) {
+    return lua_toLuaTable(L, idx);
+  }
+
+  template<> void LuaTable::pushInto<LuaTable>(lua_State *L, LuaTable value) {
+    value.pushTable(L);
+  }
+
+  template<> bool LuaTable::checkType<LuaTable>(lua_State *L, int idx) {
+    return lua_isLuaTable(L, idx);
+  }
+
+  template<> stopwatch *LuaTable::
+  convertTo<stopwatch *>(lua_State *L, int idx) {
+    return lua_tostopwatch(L, idx);
+  }
+  
+  template<> void LuaTable::
+  pushInto<stopwatch *>(lua_State *L, stopwatch *value) {
+    lua_pushstopwatch(L, value);
+  }
+
+  template<> bool LuaTable::
+  checkType<stopwatch *>(lua_State *L, int idx) {
+    return lua_isstopwatch(L, idx);
+  }
+}
+
 // COPIED FROM liolib.c:168
 static int io_fclose (lua_State *L) {
   luaL_Stream *p = ((luaL_Stream *)luaL_checkudata(L, 1, LUA_FILEHANDLE));
@@ -57,31 +123,10 @@ FILE **newfile (lua_State *L) {
 }
 //BIND_END
 
-//BIND_HEADER_H
-#include "mfset.h"
-#include "trie_vector.h"
-#include "trie_hash_4_lua.h"
-#include "stopwatch.h"
-#include "linear_least_squares.h"
-#include "words_table.h"
-#include <cmath>
-#include <ctime>
-#include "popen2.h"
-#include "signal_handler.h"
-#include <cstdlib>
-#include "mmapped_data.h"
-
-using namespace AprilUtils;
-
-extern const char *__COMMIT_NUMBER__;
-
-//BIND_END
-
 //BIND_STATIC_CONSTRUCTOR utils_static_constructor
 {
   binarizer::init();
   SignalHandler::initialize(L);
-  errorPrintSetLuaState(L);
 }
 //BIND_END
 
@@ -582,6 +627,12 @@ extern const char *__COMMIT_NUMBER__;
 }
 //BIND_END
 
+//BIND_METHOD stopwatch to_lua_string
+{
+  LUABIND_RETURN(string, "stopwatch()");
+}
+//BIND_END
+
 // FIXME: nanosleep puede volver antes, en tal caso para avisar a lua
 // se podría devolver el booleano que devuelve (y que estamos
 // ignorando) y el tiempo restante :P
@@ -831,6 +882,20 @@ extern const char *__COMMIT_NUMBER__;
 
 /////////////////////////////////////////////////////////////////////////////
 
+//BIND_FUNCTION util.silent_errors
+{
+  int argn = lua_gettop(L);
+  if (argn > 0) {
+    bool v;
+    LUABIND_GET_PARAMETER(1, bool, v);
+    setSilentErrorsValue(v);
+  }
+  LUABIND_RETURN(bool, getSilentErrorsValue());
+}
+//BIND_END
+
+/////////////////////////////////////////////////////////////////////////////
+
 //BIND_FUNCTION util.options.test
 {
   AprilUtils::SharedPtr<stopwatch> clock = new stopwatch();
@@ -841,12 +906,11 @@ extern const char *__COMMIT_NUMBER__;
   // stack: table stopwatch
   lua_setfield(L,-2,"clock1");
   // stack: table
-  AprilUtils::UniquePtr<AprilUtils::LuaTableOptions>
-    opt(new AprilUtils::LuaTableOptions(L,1));
-  opt->putReferenced("clock2", clock.get());
+  AprilUtils::LuaTable opt(L,1);
+  opt.put("clock2", clock.get());
   //
-  stopwatch *opt_clock1 = opt->getReferenced<stopwatch>("clock1");
-  stopwatch *opt_clock2 = opt->getReferenced<stopwatch>("clock2");
+  stopwatch *opt_clock1 = opt.get<stopwatch *>("clock1");
+  stopwatch *opt_clock2 = opt.get<stopwatch *>("clock2");
   // stack: table
   lua_getfield(L,-1,"clock1");
   // stack: table stopwatch
@@ -855,21 +919,19 @@ extern const char *__COMMIT_NUMBER__;
   lua_pop(L,1);
   // stack: table
   lua_getfield(L,-1,"clock2");
-  if (lua_type(L,-1) != LUA_TUSERDATA) LUABIND_ERROR("TEST 1 FAILED\n");
+  if (!lua_isstopwatch(L,-1)) LUABIND_ERROR("TEST 1 FAILED\n");
   // stack: table stopwatch
-  Referenced **pre_obj = static_cast<Referenced**>(lua_touserdata(L,-1));
-  Referenced *obj = 0;
-  if (pre_obj != 0) obj = (*pre_obj);
-  else LUABIND_ERROR("TEST 2 FAILED\n");
-  stopwatch *tbl_clock2 = dynamic_cast<stopwatch*>(obj);
-  if (tbl_clock2 == 0) LUABIND_ERROR("TEST 3 FAILED\n");
+  stopwatch *tbl_clock2 = lua_tostopwatch(L,-1);
+  if (tbl_clock2 == 0) LUABIND_ERROR("TEST 2 FAILED\n");
   // stack: table stopwatch
   lua_pop(L,1);
   // stack: table
   if (opt_clock1 != tbl_clock1) LUABIND_ERROR("TEST 1 FAILED\n");
   if (opt_clock2 != tbl_clock2) LUABIND_ERROR("TEST 2 FAILED\n");
   //
-  opt->putString("str", "Hello world!");
-  return 1; // returns the table
+  opt.put("str", "Hello world!");
+  string str(opt.toLuaString());
+  lua_pushstring(L, str.c_str());
+  return 2; // returns the table and its Lua string representation
 }
 //BIND_END
diff --git a/packages/basics/util/c_src/error_print.cc b/packages/basics/util/c_src/error_print.cc
index 77d257379..047d1426c 100644
--- a/packages/basics/util/c_src/error_print.cc
+++ b/packages/basics/util/c_src/error_print.cc
@@ -18,15 +18,16 @@
  * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  *
  */
+#include "base.h"
 #include "error_print.h"
-extern "C" {
-#include "lua.h"
-}
 
-lua_State *error_print_globalL=0;
+bool silent_errors = false;
 
-void errorPrintSetLuaState(lua_State *L) {
-  error_print_globalL = L;
+void setSilentErrorsValue(bool value) {
+  silent_errors = value;
+}
+bool getSilentErrorsValue() {
+  return silent_errors;
 }
 
 #define MAX_FRAMES     256
@@ -43,6 +44,7 @@ void errorPrintSetLuaState(lua_State *L) {
 
 /** Print a demangled stack backtrace of the caller function to FILE* out. */
 void print_CPP_stacktrace(FILE *out) {
+  if (getSilentErrorsValue()) return;
 #ifdef NDEBUG
   UNUSED_VARIABLE(out);
 #else
@@ -128,9 +130,9 @@ void print_CPP_stacktrace(FILE *out) {
 
 void print_CPP_LUA_stacktrace_and_exit(int errorcode) {
   print_CPP_stacktrace();
-  if (error_print_globalL != 0) {
-    lua_pushstring(error_print_globalL, "");
-    lua_error(error_print_globalL);
+  if (Base::getGlobalLuaState() != 0) {
+    lua_pushstring(Base::getGlobalLuaState(), "");
+    lua_error(Base::getGlobalLuaState());
   }
   else {
     exit(errorcode);
diff --git a/packages/basics/util/c_src/error_print.h b/packages/basics/util/c_src/error_print.h
index 5f6d29864..c9d72347a 100644
--- a/packages/basics/util/c_src/error_print.h
+++ b/packages/basics/util/c_src/error_print.h
@@ -22,60 +22,58 @@
 #define ERROR_PRINT_H
 
 #include <cstdio>
-extern "C" {
-#include "lua.h"
-}
 
-void errorPrintSetLuaState(lua_State *L);
+bool getSilentErrorsValue();
+void setSilentErrorsValue(bool value);
 void print_CPP_LUA_stacktrace_and_exit(int errorcode);
 void print_CPP_stacktrace(FILE *out = stderr);
 
 #define ERROR_PRINT(strformat)						\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__)
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__); } while(0) /* do/while(0) keeps the hidden 'if' from capturing a caller's 'else'; same for ERROR_PRINT1..7 */
 
 #define ERROR_PRINT1(strformat, v1)					\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__,(v1))
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__,(v1)); } while(0)
 
 #define ERROR_PRINT2(strformat, v1, v2)					\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2))
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2)); } while(0)
 
 #define ERROR_PRINT3(strformat, v1, v2, v3)				\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3))
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3)); } while(0)
 
 #define ERROR_PRINT4(strformat, v1, v2, v3, v4)				\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4))
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4)); } while(0)
 
 #define ERROR_PRINT5(strformat, v1, v2, v3, v4, v5)			\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4), (v5))
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4), (v5)); } while(0)
 
 #define ERROR_PRINT6(strformat, v1, v2, v3, v4, v5, v6)			\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4), (v5), (v6))
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4), (v5), (v6)); } while(0)
 
 #define ERROR_PRINT7(strformat, v1, v2, v3, v4, v5, v6, v7)		\
-  fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4), (v5), (v6), (v7))
+  do { if (!getSilentErrorsValue()) fprintf(stderr, "Error in file %s in line %d, function %s: "  strformat, __FILE__, __LINE__, __FUNCTION__, (v1), (v2), (v3), (v4), (v5), (v6), (v7)); } while(0)
 
 #define ERROR_EXIT(errorcode, strformat)			\
-  do { ERROR_PRINT(strformat); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT(strformat); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #define ERROR_EXIT1(errorcode, strformat, v1)			\
-  do { ERROR_PRINT1(strformat,(v1)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT1(strformat,(v1)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #define ERROR_EXIT2(errorcode, strformat, v1, v2)			\
-  do { ERROR_PRINT2(strformat,(v1),(v2)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT2(strformat,(v1),(v2)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #define ERROR_EXIT3(errorcode, strformat, v1, v2, v3)			\
-  do { ERROR_PRINT3(strformat,(v1),(v2),(v3)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT3(strformat,(v1),(v2),(v3)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #define ERROR_EXIT4(errorcode, strformat, v1, v2, v3, v4)		\
-  do { ERROR_PRINT4(strformat,(v1),(v2),(v3),(v4)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT4(strformat,(v1),(v2),(v3),(v4)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #define ERROR_EXIT5(errorcode, strformat, v1, v2, v3, v4, v5)		\
-  do { ERROR_PRINT5(strformat,(v1),(v2),(v3),(v4),(v5)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT5(strformat,(v1),(v2),(v3),(v4),(v5)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #define ERROR_EXIT6(errorcode, strformat, v1, v2, v3, v4, v5, v6)	\
-  do { ERROR_PRINT6(strformat,(v1),(v2),(v3),(v4),(v5),(v6)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT6(strformat,(v1),(v2),(v3),(v4),(v5),(v6)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #define ERROR_EXIT7(errorcode, strformat, v1, v2, v3, v4, v5, v6, v7)	\
-  do { ERROR_PRINT7(strformat,(v1),(v2),(v3),(v4),(v5),(v6),(v7)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
+  do { if (!getSilentErrorsValue()) ERROR_PRINT7(strformat,(v1),(v2),(v3),(v4),(v5),(v6),(v7)); print_CPP_LUA_stacktrace_and_exit(errorcode); /*exit(errorcode);*/ } while(0)
 
 #endif // ERROR_EXIT_H
diff --git a/packages/basics/util/c_src/generic_options.cc b/packages/basics/util/c_src/generic_options.cc
deleted file mode 100644
index 45e3f13de..000000000
--- a/packages/basics/util/c_src/generic_options.cc
+++ /dev/null
@@ -1,294 +0,0 @@
-/*
- * This file is part of APRIL-ANN toolkit (A
- * Pattern Recognizer In Lua with Artificial Neural Networks).
- *
- * Copyright 2014, Francisco Zamora-Martinez
- *
- * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
- * under the terms of the GNU General Public License version 3 as
- * published by the Free Software Foundation
- *
- * This library is distributed in the hope that it will be useful, but WITHOUT
- * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
- * for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this library; if not, write to the Free Software Foundation,
- * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
- *
- */
-extern "C" {
-#include "lauxlib.h"
-#include "lualib.h"
-#include "lua.h"
-}
-
-#include "error_print.h"
-#include "generic_options.h"
-
-namespace AprilUtils {
-  
-  /************************************************************************/
-  static char lua_isCHAR(lua_State *L, int i) {
-    return lua_isstring(L,i) && luaL_len(L,i) == 1;
-  }
-  static char lua_toCHAR(lua_State *L, int i) {
-    const char *str = lua_tostring(L,i);
-    return str[0];
-  }
-  static void lua_pushCHAR(lua_State *L, char c) {
-    lua_pushlstring(L, &c, 1u);
-  }
-  /************************************************************************/
-  
-  /************************************************************************/  
-  static Referenced *april_rawgetReferenced(lua_State *L, int index) {
-    Referenced **pre_obj = static_cast<Referenced**>(lua_touserdata(L,index));
-    Referenced *obj = 0;
-    if (pre_obj != 0) obj = (*pre_obj);
-    return obj;
-  }
-  
-  static int april_deleteReferenced(lua_State *L) {
-    // stops garbage collector to avoid problems with reference counting
-    lua_gc(L, LUA_GCSTOP, 0);
-    Referenced *obj = april_rawgetReferenced(L,1);
-    if (obj != 0) {
-      DecRef(obj);
-    }
-    // restart the garbage collector
-    lua_gc(L, LUA_GCRESTART, 0);
-    return 0;
-  }
-  
-  static void april_pushReferenced(lua_State *L, Referenced *obj) {
-    IncRef(obj);
-    Referenced **ptr;
-    ptr = static_cast<Referenced**>
-      (lua_newuserdata(L,sizeof(Referenced*)) );
-    *ptr = obj;
-    // stack: ptr
-    lua_newtable(L); // a metatable
-    // stack: ptr mt
-    lua_pushcfunction(L, april_deleteReferenced);
-    // stack: ptr mt func
-    lua_setfield(L,-2,"__gc");
-    // stack: ptr mt
-    lua_setmetatable(L,-2);
-    // stack: ptr
-  }
-  
-  static Referenced *april_toReferenced(lua_State *L, int index) {
-    return april_rawgetReferenced(L,index);
-  }
-  /************************************************************************/
-  
-  // int HashTableOptions::pushToLua(lua_State *L, const char *name) {
-  //   Value *v = dict.find(name);
-  //   if (v == 0) lua_pushnil(L);
-  //   switch(v->type) {
-  //   case DOUBLE:
-  //     lua_pushnumber(L,v->dbl);
-  //     break;
-  //   case FLOAT:
-  //     lua_pushnumber(L,static_cast<double>(v->flt));
-  //     break;
-  //   case CHAR:
-  //     lua_pushCHAR(L,v->chr);
-  //     break;
-  //   case STRING:
-  //     lua_pushstring(L,v->str.c_str());
-  //     break;
-  //   case INT32:
-  //     lua_pushnumber(L,static_cast<double>(v->i32));
-  //     break;
-  //   case UINT32:
-  //     lua_pushnumber(L,static_cast<double>(v->u32));
-  //     break;
-  //   case INT64:
-  //     lua_pushnumber(L,static_cast<double>(v->i64));
-  //     break;
-  //   case UINT64:
-  //     lua_pushnumber(L,static_cast<double>(v->u64));
-  //     break;
-  //   case BOOL:
-  //     lua_pushboolean(L,v->bl);
-  //     break;
-  //   case REFERENCED:
-  //     april_pushReferenced(L,v->ref_ptr.get());
-  //     break;
-  //   default:
-  //     ERROR_EXIT(128, "Unknown type\n");;
-  //   }
-  //   return 1;
-  // }
-
-#define METHODS_IMPLEMENTATION(method, c_type, enum_type, value_name)   \
-  GenericOptions *HashTableOptions::put##method(const char *name, c_type value) { \
-    Value v;                                                            \
-    v.value_name = value;                                               \
-    v.type = enum_type;                                                 \
-    dict[name] = v;                                                     \
-    return this;                                                        \
-  }                                                                     \
-  c_type HashTableOptions::get##method(const char *name) const {        \
-    Value *v = dict.find(name);                                         \
-    if (v == 0) ERROR_EXIT1(128, "Unable to find field %s\n", name);    \
-    if (v->type != enum_type) {                                         \
-      ERROR_EXIT(128, "Unexpected type error\n");                       \
-    }                                                                   \
-    return v->value_name;                                               \
-  }                                                                     \
-  c_type HashTableOptions::getOptional##method(const char *name,        \
-                                               c_type const opt) const { \
-    Value *v = dict.find(name);                                         \
-    if (v == 0) return opt;                                             \
-    else if (v->type != enum_type) {                                    \
-      ERROR_EXIT(128, "Unexpected type error\n");                       \
-    }                                                                   \
-    return v->value_name;                                               \
-  }
-  
-  METHODS_IMPLEMENTATION(Double, double, DOUBLE, dbl);
-  METHODS_IMPLEMENTATION(Float, float, FLOAT, flt);
-  METHODS_IMPLEMENTATION(Char, char, CHAR, chr);
-  METHODS_IMPLEMENTATION(String, const char *, STRING, str);
-  METHODS_IMPLEMENTATION(Int32, int32_t, INT32, i32);
-  METHODS_IMPLEMENTATION(UInt32, uint32_t, UINT32, u32);
-  METHODS_IMPLEMENTATION(Int64, int64_t, INT64, i64);
-  METHODS_IMPLEMENTATION(UInt64, uint64_t, UINT64, u64);
-  METHODS_IMPLEMENTATION(Boolean, bool, BOOL, bl);
-  
-#undef METHODS_IMPLEMENTATION
-
-  GenericOptions *HashTableOptions::putReferenced(const char *name,
-                                                  Referenced *value) {
-    Value v;
-    v.ref_ptr = value;
-    v.type = REFERENCED;
-    dict[name] = v;
-    return this;
-  }
-  
-  Referenced *HashTableOptions::privateGetReferenced(const char *name) const {
-    Value *v = dict.find(name);
-    if (v == 0) return 0;
-    if (v->type != REFERENCED) {
-      ERROR_EXIT(128, "Unexpected type error\n");
-    }
-    return v->ref_ptr.get();
-  }
-
-  ////////////////////////////////////////////////////////////////////////////
-  
-  LuaTableOptions::LuaTableOptions(lua_State *L) : GenericOptions() {
-    lua_newtable(L);
-    init(L, -1);
-    lua_pop(L,1);
-  }
-  
-  LuaTableOptions::LuaTableOptions(lua_State *L, int i) : GenericOptions() {
-    init(L, i);
-  }
-  
-  LuaTableOptions::~LuaTableOptions() {
-    luaL_unref(L, LUA_REGISTRYINDEX, ref);
-  }
-
-  void LuaTableOptions::init(lua_State *L, int i) {
-    this->L = L;
-    if (lua_isnil(L,i) || lua_type(L,i) == LUA_TNONE) ref = LUA_NOREF;
-    else {
-      lua_pushvalue(L,i);
-      if (!lua_istable(L,-1)) {
-        ERROR_EXIT1(128,"Expected a table parameter at pos %d\n", i);
-      }
-      this->ref = luaL_ref(L, LUA_REGISTRYINDEX);
-    }
-  }
-  
-  // int LuaTableOptions::pushToLua(lua_State *L, const char *name) {
-  //   if (ref == LUA_NOREF) ERROR_EXIT(128, "Unable to get options\n");
-  //   lua_rawgeti(L, LUA_REGISTRYINDEX, ref);
-  //   lua_getfield(L, -1, name);
-  //   return 1;
-  // }
-
-#define METHODS_IMPLEMENTATION(method, c_type, lua_type)                \
-  GenericOptions *LuaTableOptions::put##method(const char *name, c_type value) { \
-    if (ref == LUA_NOREF) ERROR_EXIT(128, "Unable to put options\n");   \
-    lua_rawgeti(L, LUA_REGISTRYINDEX, ref);                             \
-    lua_push##lua_type(L, value);                                       \
-      lua_setfield(L, -2, name);                                        \
-      lua_pop(L,1);                                                     \
-      return this;                                                      \
-  }                                                                     \
-  c_type LuaTableOptions::get##method(const char *name) const {         \
-    if (ref == LUA_NOREF) ERROR_EXIT(128, "Unable to get options\n");   \
-    lua_rawgeti(L, LUA_REGISTRYINDEX, ref);                             \
-    lua_getfield(L, -1, name);                                          \
-    if (lua_isnil(L,-1)) ERROR_EXIT1(128, "Unable to find field %s\n", name); \
-    if (!lua_is##lua_type(L, -1)) {                                     \
-      ERROR_EXIT(128, "Unexpected type error\n");                       \
-    }                                                                   \
-    c_type v = static_cast<c_type>(lua_to##lua_type(L,-1));             \
-    lua_pop(L,2);                                                       \
-    return v;                                                           \
-  }                                                                     \
-  c_type LuaTableOptions::getOptional##method(const char *name,         \
-                                              c_type const opt) const { \
-    if (ref == LUA_NOREF) return opt;                                   \
-    lua_rawgeti(L, LUA_REGISTRYINDEX, ref);                             \
-    lua_getfield(L, -1, name);                                          \
-    if (lua_isnil(L,-1)) {                                              \
-      lua_pop(L,2);                                                     \
-      return opt;                                                       \
-    }                                                                   \
-    if (!lua_is##lua_type(L, -1)) {                                     \
-      ERROR_EXIT(128, "Unexpected type error\n");                       \
-    }                                                                   \
-    c_type v = static_cast<c_type>(lua_to##lua_type(L,-1));             \
-    lua_pop(L,2);                                                       \
-    return v;                                                           \
-  }
-
-  METHODS_IMPLEMENTATION(Double, double, number);
-  METHODS_IMPLEMENTATION(Float, float, number);
-  METHODS_IMPLEMENTATION(Char, char, CHAR);
-  METHODS_IMPLEMENTATION(String, const char *, string);
-  METHODS_IMPLEMENTATION(Int32, int32_t, number);
-  METHODS_IMPLEMENTATION(UInt32, uint32_t, number);
-  METHODS_IMPLEMENTATION(Int64, int64_t, number);
-  METHODS_IMPLEMENTATION(UInt64, uint64_t, number);
-  METHODS_IMPLEMENTATION(Boolean, bool, boolean);
-  
-#undef METHODS_IMPLEMENTATION
-
-  GenericOptions *LuaTableOptions::putReferenced(const char *name,
-                                                 Referenced *value) {
-    if (ref == LUA_NOREF) ERROR_EXIT(128, "Unable to put options\n");
-    lua_rawgeti(L, LUA_REGISTRYINDEX, ref);
-    april_pushReferenced(L, value);
-    lua_setfield(L, -2, name);
-    lua_pop(L,1);
-    return this;
-  }
-  
-  Referenced *LuaTableOptions::privateGetReferenced(const char *name) const {
-    if (ref == LUA_NOREF) ERROR_EXIT(128, "Unable to get options\n");
-    lua_rawgeti(L, LUA_REGISTRYINDEX, ref);
-    lua_getfield(L, -1, name);
-    if (lua_isnil(L,-1)) {
-      lua_pop(L,2);
-      return 0;
-    }
-    Referenced *v = april_toReferenced(L,-1);
-    if (v == 0) {
-      ERROR_EXIT(128, "Unexpected type error\n");
-    }
-    lua_pop(L,2);
-    return v;
-  }
-  
-} // namespace AprilUtils
diff --git a/packages/basics/util/c_src/generic_options.h b/packages/basics/util/c_src/generic_options.h
deleted file mode 100644
index 8b4f673f4..000000000
--- a/packages/basics/util/c_src/generic_options.h
+++ /dev/null
@@ -1,243 +0,0 @@
-/*
- * This file is part of APRIL-ANN toolkit (A
- * Pattern Recognizer In Lua with Artificial Neural Networks).
- *
- * Copyright 2014, Francisco Zamora-Martinez
- *
- * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
- * under the terms of the GNU General Public License version 3 as
- * published by the Free Software Foundation
- *
- * This library is distributed in the hope that it will be useful, but WITHOUT
- * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
- * for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this library; if not, write to the Free Software Foundation,
- * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
- *
- */
-#ifndef GENERIC_OPTIONS_H
-#define GENERIC_OPTIONS_H
-
-#include "error_print.h"
-#include "hash_table.h"
-#include "mystring.h"
-#include "referenced.h"
-#include "smart_ptr.h"
-
-namespace AprilUtils {
-  
-#define METHODS(method, type)                                            \
-  virtual GenericOptions *put##method(const char *name, type value) = 0; \
-  virtual type get##method(const char *name) const = 0;                  \
-  virtual type getOptional##method(const char *name, type const value) const = 0
-
-  /**
-   * @brief Class which contains pairs key,value of standard types.
-   *
-   * The key is always a string and the value can be one of the following:
-   * double, float, char, const char *, int32_t, uint32_t, int64_t, uint64_t,
-   * bool, classes derived from Referenced.
-   *
-   * Three methods are available for each type:
-   *
-   * - The put method as putDouble() which receives a <tt>const char * key</tt>
-   *   and a <tt>double value</tt> and inserts into the set the pair
-   *   (key,value).
-   *
-   * - The get method as getDouble() which receives a <tt>const char * key</tt>
-   *   and returns a @c double value. In case the given @c key doesn't exists,
-   *   this method throws an error.
-   *
-   * - The getOptional method as getOptionalDouble() which receives a <tt>const
-   *   char *key</tt>, an optional value <tt>double opt</tt>, and returns a @c
-   *   double. In case the given @c key doesn't exists, this method returns the
-   *   given @c opt value.
-   *
-   * @note The types can be binded to Lua, allowing to have the same generic
-   * interface for data coming from Lua or from C/C++.
-   *
-   * @note getReferenced() and getOptionalReferenced() are templates which use
-   * @c dynamic_cast to convert from Referenced to the corresponding class.
-   */
-  class GenericOptions {
-  public:
-    
-    /// Constructor.
-    GenericOptions() { }
-    /// Destructor.
-    virtual ~GenericOptions() { }
-
-    // virtual int pushToLua(lua_State *L, const char *name) = 0;
-    
-    METHODS(Double, double);
-    METHODS(Float, float);
-    METHODS(Char, char);
-    METHODS(String, const char *);
-    METHODS(Int32, int32_t);
-    METHODS(UInt32, uint32_t);
-    METHODS(Int64, int64_t);
-    METHODS(UInt64, uint64_t);
-    METHODS(Boolean, bool);
-    
-    virtual GenericOptions *putReferenced(const char *name,
-                                          Referenced *value) = 0;
-    
-    template<typename T>
-    T *getReferenced(const char *name) const {
-      Referenced *aux = privateGetReferenced(name);
-      if (aux == 0) {
-        ERROR_EXIT1(128, "Unable to locate a Referenced class at key %s\n", name);
-      }
-      T *ret = dynamic_cast<T*>(aux);
-      if (ret == 0) {
-        ERROR_EXIT1(128, "Unable dynamic_cast from Referenced at key %s\n", name);
-      }
-      return ret;
-    }
-
-    template<typename T>
-    T *getOptionalReferenced(const char *name, T *opt) const {
-      Referenced *aux = privateGetReferenced(name);
-      if (aux == 0) return opt;
-      T *ret = dynamic_cast<T*>(aux);
-      if (ret == 0) {
-        ERROR_EXIT1(128, "Unable dynamic_cast from Referenced at key %s\n", name);
-      }
-      return ret;
-    }
-    
-  protected:
-    
-    /// Protected method which looks-up for a Referenced object and returns it
-    /// or NULL in the given key name doesn't exits. If the key name exists but
-    /// doesn't contains a Referenced object, this method must throw an error.
-    virtual Referenced *privateGetReferenced(const char *name) const = 0;
-  };
-#undef METHODS
-  
-#define METHODS(method, type)                                           \
-  virtual GenericOptions *put##method(const char *name, type value);    \
-  virtual type get##method(const char *name) const;                     \
-  virtual type getOptional##method(const char *name, type const value) const
-
-  /**
-   * @brief Specialization of GenericOptions for passing data stored at a hash
-   * table in C++.
-   *
-   * This class uses a AprilUtils::hash table where (key,value) pairs will be
-   * stored. To allow multiple value types, a @c union has been declared, and an
-   * enum HashTableOptions::ValueTpyes allows to indicate which type has been
-   * stored.
-   */  
-  class HashTableOptions : public GenericOptions {
-  public:
-    
-    HashTableOptions() : GenericOptions() { }
-    virtual ~HashTableOptions() { }
-
-    // virtual int pushToLua(lua_State *L, const char *name);
-    
-    METHODS(Double, double);
-    METHODS(Float, float);
-    METHODS(Char, char);
-    METHODS(String, const char *);
-    METHODS(Int32, int32_t);
-    METHODS(UInt32, uint32_t);
-    METHODS(Int64, int64_t);
-    METHODS(UInt64, uint64_t);
-    METHODS(Boolean, bool);
-
-    virtual GenericOptions *putReferenced(const char *name, Referenced *value);
-
-  protected:
-    
-    virtual Referenced *privateGetReferenced(const char *name) const;
-    
-  private:
-
-    /// Enumeration with the types which can be stored in the table.
-    enum ValueTypes {
-      DOUBLE, FLOAT, CHAR, STRING, INT32, UINT32, INT64, UINT64, BOOL,
-      REFERENCED, NUM_TYPES
-    };
-    
-    /// Value part of the table elements, it is a union of all the possible
-    /// values and a ValueTypes instance indicating which one it is.
-    struct Value {
-      union {
-        float flt;
-        double dbl; 
-        char chr;
-        int32_t i32;
-        uint32_t u32;
-        int64_t i64;
-        uint64_t u64;
-        bool bl;
-      };
-      AprilUtils::string str; // can't be in the union
-      AprilUtils::SharedPtr<Referenced> ref_ptr;
-      ValueTypes type;
-    };
-    
-    typedef AprilUtils::hash<AprilUtils::string, Value> HashTable;
-    
-    /// The AprilUtils::hash with the key,value pairs.
-    HashTable dict;
-      
-  };
-
-  /**
-   * @brief Specialization of GenericOptions for passing data stored at a Lua
-   * table.
-   *
-   * This class uses Lua references to copy a reference to a Lua table in the
-   * registry. It can receive a Lua table at the constructor, or if not given,
-   * a new empty table will be allocated.
-   */
-  class LuaTableOptions : public GenericOptions {
-  public:
-    
-    /// Constructor from a new allocated Lua table.
-    LuaTableOptions(lua_State *L);
-    /// Constructor from a table allocated at Lua stack position @c i.
-    LuaTableOptions(lua_State *L, int i);
-    /// Destructor, de-references the Lua table for garbage collection.
-    virtual ~LuaTableOptions();
-
-    // virtual int pushToLua(lua_State *L, const char *name);
-    
-    METHODS(Double, double);
-    METHODS(Float, float);
-    METHODS(Char, char);
-    METHODS(String, const char *);
-    METHODS(Int32, int32_t);
-    METHODS(UInt32, uint32_t);
-    METHODS(Int64, int64_t);
-    METHODS(UInt64, uint64_t);
-    METHODS(Boolean, bool);
-
-    virtual GenericOptions *putReferenced(const char *name, Referenced *value);
-    
-  protected:
-    
-    virtual Referenced *privateGetReferenced(const char *name) const;
-
-  private:
-    
-    /// The lua_State where the table is allocated.
-    lua_State *L;
-    /// The reference in the registry where the table can be retrieved.
-    int ref;
-
-    /// Auxiliary method to simplify constructors.
-    void init(lua_State *L, int i);
-  };
-
-#undef METHODS
-
-} // namespace AprilUtils
-
-#endif // GENERIC_OPTIONS_H
diff --git a/packages/basics/util/c_src/lua_table.cc b/packages/basics/util/c_src/lua_table.cc
new file mode 100644
index 000000000..92559ba4d
--- /dev/null
+++ b/packages/basics/util/c_src/lua_table.cc
@@ -0,0 +1,235 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2014, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+extern "C" {
+#include "lauxlib.h"
+#include "lualib.h"
+#include "lua.h"
+}
+#include "lua_table.h"
+
+namespace AprilUtils {
+
+  LuaTable::LuaTable(lua_State *L) {
+    lua_newtable(L);
+    init(L, -1);
+    lua_pop(L, 1);
+  }
+  
+  LuaTable::LuaTable(lua_State *L, int i) {
+    init(L, i);
+  }
+
+  LuaTable::LuaTable(const LuaTable &other) {
+    other.checkAndGetRef();
+    init(other.L, -1);
+    lua_pop(L, 1);
+  }
+
+  LuaTable::~LuaTable() {
+    luaL_unref(L, LUA_REGISTRYINDEX, ref);
+  }
+
+  LuaTable &LuaTable::operator=(const LuaTable &other) {
+    other.checkAndGetRef(); // push other's table BEFORE releasing our slot,
+    luaL_unref(L, LUA_REGISTRYINDEX, ref); // so self-assignment stays valid
+    init(other.L, -1);
+    lua_pop(L, 1);
+    return *this;
+  }
+  
+  void LuaTable::init(lua_State *L, int i) {
+    this->L = L;
+    if (lua_isnil(L,i) || lua_type(L,i) == LUA_TNONE) ref = LUA_NOREF;
+    else {
+      lua_pushvalue(L,i);
+      if (!lua_istable(L,-1)) {
+        ERROR_EXIT1(128,"Expected a table parameter at pos %d\n", i);
+      }
+      this->ref = luaL_ref(L, LUA_REGISTRYINDEX);
+    }
+  }
+
+  string LuaTable::toLuaString() {
+    /* the function name */
+    lua_getglobal(L, "util");
+    lua_getfield(L, -1, "to_lua_string");
+    pushTable(L);
+    lua_pushstring(L, "binary");
+    lua_call(L, 2, 1);
+    string str(lua_tostring(L,-1));
+    lua_pop(L,2);
+    return str;
+  }
+    
+  void LuaTable::pushTable(lua_State *L) {
+    if (this->L != L) ERROR_EXIT(128, "Given incorrect lua_State\n");
+    checkAndGetRef();
+  }
+  
+  bool LuaTable::checkAndGetRef() const {
+    if (ref == LUA_NOREF) {
+      lua_pushnil(L); // just to be coherent, it always pushes a value
+      return false;
+    }
+    else {
+      lua_rawgeti(L, LUA_REGISTRYINDEX, ref);
+      return true;
+    }
+  }
+
+  ///////////////////////////////////////////////////////////////////////////
+  
+  template<>
+  int LuaTable::convertTo<int>(lua_State *L, int idx) {
+    return lua_tointeger(L, idx);
+  }
+
+  template<>
+  float LuaTable::convertTo<float>(lua_State *L, int idx) {
+    return static_cast<float>(lua_tonumber(L, idx));
+  }
+
+  template<>
+  double LuaTable::convertTo<double>(lua_State *L, int idx) {
+    return lua_tonumber(L, idx);
+  }
+  
+  template<>
+  bool LuaTable::convertTo<bool>(lua_State *L, int idx) {
+    return lua_toboolean(L, idx);
+  }
+
+  template<>
+  const char *LuaTable::convertTo<const char *>(lua_State *L, int idx) {
+    UNUSED_VARIABLE(L);
+    UNUSED_VARIABLE(idx);
+    ERROR_EXIT(128, "Not implemented for 'const char *', use 'string'\n");
+    return 0;
+  }
+
+  template<>
+  string LuaTable::convertTo<string>(lua_State *L, int idx) {
+    size_t len = 0; const char *data = lua_tolstring(L, idx, &len);
+    return string(data, len); // one call: no order-dependent luaL_len
+  }
+  
+  template<>
+  void LuaTable::pushInto<int>(lua_State *L, int value) {
+    lua_pushnumber(L, static_cast<double>(value));
+  }
+
+  template<>
+  void LuaTable::pushInto<float>(lua_State *L, float value) {
+    lua_pushnumber(L, static_cast<double>(value));
+  }
+
+  template<>
+  void LuaTable::pushInto<double>(lua_State *L, double value) {
+    lua_pushnumber(L, value);
+  }
+
+  template<>
+  void LuaTable::pushInto<bool>(lua_State *L, bool value) {
+    lua_pushboolean(L, value);
+  }
+
+  template<>
+  void LuaTable::pushInto<const string &>(lua_State *L,
+                                          const string &value) {
+    lua_pushlstring(L, value.c_str(), value.size());
+  }
+
+  template<>
+  void LuaTable::pushInto<const char *>(lua_State *L,
+                                        const char *value) {
+    lua_pushstring(L, value);
+  }
+
+  template<>
+  bool LuaTable::checkType<int>(lua_State *L, int idx) {
+    return lua_isnumber(L, idx);
+  }
+  
+  template<>
+  bool LuaTable::checkType<float>(lua_State *L, int idx) {
+    return lua_isnumber(L, idx);
+  }
+  
+  template<>
+  bool LuaTable::checkType<double>(lua_State *L, int idx) {
+    return lua_isnumber(L, idx);
+  }
+  
+  template<>
+  bool LuaTable::checkType<bool>(lua_State *L, int idx) {
+    return lua_isboolean(L, idx);
+  }
+  
+  template<>
+  bool LuaTable::checkType<const char *>(lua_State *L, int idx) {
+    return lua_isstring(L, idx);
+  }
+  
+  template<>
+  bool LuaTable::checkType<string>(lua_State *L, int idx) {
+    return lua_isstring(L, idx);
+  }
+  
+  // specialization of get for const char *
+  template<>
+  const char *LuaTable::get<const char *>(const char *name) const {
+    if (!checkAndGetRef()) ERROR_EXIT(128, "Invalid reference\n");
+    lua_getfield(L, -1, name);
+    if (lua_isnil(L,-1)) ERROR_EXIT1(128, "Unable to find field %s\n", name);
+    const char *str = lua_tostring(L, -1);
+    // NOTE: it is safe to pop because: 1) garbage collection has been stopped in
+    // C/C++ environment, it has shown to be better in APRIL-ANN binding; 2) the
+    // string is referenced in a table, so, as long as the table exists, the
+    // string will also exist.
+    lua_pop(L, 2);
+    return str;
+  }
+
+  // specialization of opt for const char *
+  template<>
+  const char *LuaTable::opt<const char *>(const char *name, const char *def) const {
+    if (!checkAndGetRef()) {
+      lua_pop(L, 1);
+      return def;
+    }
+    else {
+      lua_getfield(L, -1, name);
+      if (lua_isnil(L,-1)) {
+        lua_pop(L, 2);
+        return def;
+      }
+      const char *str = lua_tostring(L,-1);
+      // NOTE: it is safe to pop because: 1) garbage collection has been stopped in
+      // C/C++ environment, it has shown to be better in APRIL-ANN binding; 2) the
+      // string is referenced in a table, so, as long as the table exists, the
+      // string will also exist.
+      lua_pop(L, 2);
+      return str;
+    }
+    // return T();
+  }
+  
+}
diff --git a/packages/basics/util/c_src/lua_table.h b/packages/basics/util/c_src/lua_table.h
new file mode 100644
index 000000000..9ce112310
--- /dev/null
+++ b/packages/basics/util/c_src/lua_table.h
@@ -0,0 +1,245 @@
+/*
+ * This file is part of APRIL-ANN toolkit (A
+ * Pattern Recognizer In Lua with Artificial Neural Networks).
+ *
+ * Copyright 2014, Francisco Zamora-Martinez
+ *
+ * The APRIL-ANN toolkit is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU General Public License version 3 as
+ * published by the Free Software Foundation
+ *
+ * This library is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
+ * for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this library; if not, write to the Free Software Foundation,
+ * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+#ifndef LUA_TABLE_H
+#define LUA_TABLE_H
+extern "C" {
+#include "lauxlib.h"
+#include "lualib.h"
+#include "lua.h"
+}
+#include <typeinfo>
+
+#include "base.h"
+#include "error_print.h"
+#include "mystring.h"
+#include "referenced.h"
+#include "unused_variable.h"
+
+namespace AprilUtils {
+
+  /**
+   * @brief A class which allows putting and getting data in a Lua table.
+   *
+   * This class allows C++ code to access Lua values stored in a Lua table.
+   * The Lua table is stored in the C registry, and will be removed in the
+   * destructor. Template methods for put(), get(), and opt() operations are
+   * defined. It is possible to extend these methods to new C++ types by
+   * specializing the static template methods: convertTo(), pushInto() and
+   * checkType().
+   *
+   * @note All keys are forced to be strings, so it works with dictionary-style
+   * Lua tables, not with arrays.
+   */
+  class LuaTable {
+  public:
+    
+    /// Constructor for a new LuaTable in the registry.
+    LuaTable(lua_State *L = Base::getGlobalLuaState());
+    
+    /// Constructor for a LuaTable in a given Lua stack position.
+    LuaTable(lua_State *L, int n);
+    
+    /// Copy constructor.
+    LuaTable(const LuaTable &other);
+    
+    /// Destructor.
+    ~LuaTable();
+    
+    /// Copy operator.
+    LuaTable &operator=(const LuaTable &other);
+    
+    /// Returns a C++ string with the Lua representation of the table.
+    string toLuaString();
+    
+    /// Puts a new value into the table, using the given key name.
+    template<typename T>
+    LuaTable &put(const string &name, T value) {
+      return put<T>(name.c_str(), value);
+    }
+    
+    /// Checks if the field at the given key name is nil.
+    bool checkNil(const string &name) const {
+      return checkNil(name.c_str());
+    }
+
+    /// Checks if the field at the given key name is of the given type (a nil
+    /// value will be taken as true).
+    template<typename T>
+    bool checkNilOrType(const string &name) const {
+      return checkNilOrType<T>(name.c_str());
+    }
+
+    /// Returns the value stored at the given key name field.
+    template<typename T>
+    T get(const string &name) const {
+      return get<T>(name.c_str());
+    }
+
+    /// Returns the value stored at the given key name field. In case the field
+    /// is empty, it returns the given def_value argument.
+    template<typename T>
+    T opt(const string &name, const T def_value = T()) const {
+      return opt<T>(name.c_str(), def_value);
+    }
+
+    /// Puts a new value into the table, using the given key name.
+    template<typename T>
+    LuaTable &put(const char *name, T value) {
+      if (!checkAndGetRef()) ERROR_EXIT(128, "Invalid reference\n");
+      pushInto(L, value);
+      lua_setfield(L, -2, name);
+      lua_pop(L, 1);
+      return *this;
+    }
+
+    /// Checks if the field at the given key name is nil.    
+    bool checkNil(const char *name) const {
+      if (!checkAndGetRef()) ERROR_EXIT(128, "Invalid reference\n");
+      lua_getfield(L, -1, name);
+      bool ret =  lua_isnil(L, -1);
+      lua_pop(L, 2);
+      return ret;
+    }
+
+    /// Checks if the field at the given key name is of the given type (a nil
+    /// value will be taken as true).
+    template<typename T>
+    bool checkNilOrType(const char *name) const {
+      if (!checkAndGetRef()) ERROR_EXIT(128, "Invalid reference\n");
+      lua_getfield(L, -1, name);
+      bool ret = lua_isnil(L, -1) || checkType<T>(L, -1);
+      lua_pop(L, 2);
+      return ret;
+    }
+
+    /// Returns the value stored at the given key name field.    
+    template<typename T>
+    T get(const char *name) const {
+      if (!checkAndGetRef()) ERROR_EXIT(128, "Invalid reference\n");
+      lua_getfield(L, -1, name);
+      if (lua_isnil(L,-1)) ERROR_EXIT1(128, "Unable to find field %s\n", name);
+      if (!checkType<T>(L, -1)) ERROR_EXIT(128, "Incorrect type\n");
+      T v = convertTo<T>(L, -1);
+      lua_pop(L,2);
+      return v;
+    }
+
+    /// Returns the value stored at the given key name field. In case the field
+    /// is empty, it returns the given def_value argument.    
+    template<typename T>
+    T opt(const char *name, const T def_value = T()) const {
+      if (!checkAndGetRef()) {
+        lua_pop(L, 1);
+        return def_value;
+      }
+      else {
+        lua_getfield(L, -1, name);
+        T v(def_value);
+        if (!lua_isnil(L,-1)) {
+          if (!checkType<T>(L, -1)) ERROR_EXIT(128, "Incorrect type\n");
+          v = convertTo<T>(L, -1);
+        }
+        lua_pop(L,2);
+        return v;
+      }
+      // return T();
+    }
+    
+    /// Pushes into Lua stack the Lua table associated with the object.
+    void pushTable(lua_State *L);
+    
+    /// Converts the value at the given Lua stack index, without removing it.
+    template<typename T>
+    static T convertTo(lua_State *L, int idx) {
+      UNUSED_VARIABLE(L);
+      UNUSED_VARIABLE(idx);
+      ERROR_EXIT1(128, "NOT IMPLEMENTED FOR TYPE %s\n", typeid(T).name());
+      return T();
+    }
+    
+    /// Pushes a value into the Lua stack.
+    template<typename T>
+    static void pushInto(lua_State *L, T value) {
+      UNUSED_VARIABLE(L);
+      UNUSED_VARIABLE(value);
+      ERROR_EXIT1(128, "NOT IMPLEMENTED FOR TYPE %s\n", typeid(value).name());
+    }
+    
+    /// Checks the expected type of the value at the given Lua stack index.
+    template<typename T>
+    static bool checkType(lua_State *L, int idx) {
+      UNUSED_VARIABLE(L);
+      UNUSED_VARIABLE(idx);
+      ERROR_EXIT1(128, "NOT IMPLEMENTED FOR TYPE %s\n", typeid(T).name());
+      return false;
+    }
+    
+  private:
+    /// The lua_State where the table is allocated.
+    mutable lua_State *L;
+    /// The reference in the registry where the table can be retrieved.
+    int ref;
+    
+    /// Auxiliary method to simplify constructors.
+    void init(lua_State *L, int i);
+    /// Checks ref != LUA_NOREF and pushes it into the Lua stack.
+    bool checkAndGetRef() const;
+    
+  };
+
+  // Basic data types specializations.
+  template<> int LuaTable::convertTo<int>(lua_State *L, int idx);
+  template<> float LuaTable::convertTo<float>(lua_State *L, int idx);
+  template<> double LuaTable::convertTo<double>(lua_State *L, int idx);
+  template<> bool LuaTable::convertTo<bool>(lua_State *L, int idx);
+  template<> const char *LuaTable::convertTo<const char *>(lua_State *L, int idx);
+  template<> string LuaTable::convertTo<string>(lua_State *L, int idx);
+  template<> LuaTable LuaTable::convertTo<LuaTable>(lua_State *L, int idx);
+  
+  template<> void LuaTable::pushInto<int>(lua_State *L, int value);
+  template<> void LuaTable::pushInto<float>(lua_State *L, float value);
+  template<> void LuaTable::pushInto<double>(lua_State *L, double value);
+  template<> void LuaTable::pushInto<bool>(lua_State *L, bool value);
+  template<> void LuaTable::pushInto<const string &>(lua_State *L,
+                                                     const string &value);
+  template<> void LuaTable::pushInto<const char *>(lua_State *L,
+                                                   const char *value);
+  template<> void LuaTable::pushInto<LuaTable>(lua_State *L, LuaTable value);
+
+  template<> bool LuaTable::checkType<int>(lua_State *L, int idx);
+  template<> bool LuaTable::checkType<float>(lua_State *L, int idx);
+  template<> bool LuaTable::checkType<double>(lua_State *L, int idx);
+  template<> bool LuaTable::checkType<bool>(lua_State *L, int idx);
+  template<> bool LuaTable::checkType<const char *>(lua_State *L, int idx);
+  template<> bool LuaTable::checkType<string>(lua_State *L, int idx);
+  template<> bool LuaTable::checkType<LuaTable>(lua_State *L, int idx);
+
+  // specialization of get for const char *
+  template<>
+  const char *LuaTable::get<const char *>(const char *name) const;
+  
+  // specialization of opt for const char *
+  template<>
+  const char *LuaTable::opt<const char *>(const char *name, const char *def) const;
+  
+} // namespace AprilUtils
+
+#endif // LUA_TABLE_H
diff --git a/packages/basics/util/lua_src/april_doc.lua b/packages/basics/util/lua_src/april_doc.lua
index 2c54bb933..19c55a127 100644
--- a/packages/basics/util/lua_src/april_doc.lua
+++ b/packages/basics/util/lua_src/april_doc.lua
@@ -22,12 +22,18 @@ function april_set_doc(object, docblock)
       class       = { mandatory=true,  type_match="string", default=nil },
       summary     = { mandatory=true },
       description = { mandatory=false, default=docblock.summary },
-      params      = { mandatory=false, type_match="table", default=nil },
-      outputs     = { mandatory=false, type_match="table", default=nil },
+      params      = { mandatory=false, default=nil },
+      outputs     = { mandatory=false, default=nil },
     }, docblock)
   assert(allowed_classes[docblock.class], "Incorrect class: " .. docblock.class)
   docblock.summary     = concat(docblock.summary)
   docblock.description = concat(docblock.description)
+  if type(docblock.params) == "string" then docblock.params = { docblock.params } end
+  if type(docblock.outputs) == "string" then docblock.outputs = { docblock.outputs } end
+  assert(not docblock.params or type(docblock.params) == "table",
+         "Params filed needs to be nil, table or string")
+  assert(not docblock.outputs or type(docblock.outputs) == "table",
+         "Outputs filed needs to be nil, table or string")
   --
   local tt = type(object)
   if not object or tt == "string" or tt == "number" or tt == "boolean" then
diff --git a/packages/basics/util/lua_src/util.lua b/packages/basics/util/lua_src/util.lua
index 695f7ceef..33a7b1745 100644
--- a/packages/basics/util/lua_src/util.lua
+++ b/packages/basics/util/lua_src/util.lua
@@ -27,6 +27,31 @@ is_class = make_deprecated_function("is_class",
 
 ------------------------------------------------------------------------------
 
+-- Clones the function and its upvalues
+local function clone_function(func,lookup_table)
+  local lookup_table = lookup_table or {}
+  -- clone by using a string dump
+  local ok,func_dump = pcall(string.dump, func)
+  local func_clone = (ok and loadstring(func_dump)) or func
+  if func_clone ~= func then
+    -- copy upvalues
+    local i = 1
+    while true do
+      local name,value = debug.getupvalue(func,i)
+      if not name then break end
+      if name == "_ENV" then
+        debug.setupvalue(func_clone, i, value)
+      else
+        debug.setupvalue(func_clone, i, util.clone(value, lookup_table))
+      end
+      i = i + 1
+    end
+  end
+  return func_clone
+end
+
+------------------------------------------------------------------------------
+
 function iscallable(obj)
   local t = luatype(obj)
   return t == "function" or (t == "table" and (getmetatable(obj) or {}).__call)
@@ -181,40 +206,6 @@ function multiple_ipairs(...)
   return mult_ipairs_it, t, 0
 end
 
-function iterable_filter(func, f, s, v)
-  return function(s,v)
-    local tmp = table.pack(f(s,v))
-    while tmp[1] ~= nil and not func(table.unpack(tmp)) do
-      v = tmp[1]
-      tmp = table.pack(f(s,v))
-    end
-    return table.unpack(tmp)
-  end, s, v
-end
-
--- FROM: http://www.corsix.org/content/mapping-and-lua-iterators
-function iterable_map(func, f, s, v)
-  local done
-  local function maybeyield(...)
-    if ... ~= nil then
-      coroutine.yield(...)
-    end
-  end
-  local function domap(...)
-    v = ...
-    if v ~= nil then
-      return maybeyield(func(...))
-    else
-      done = true
-    end
-  end
-  return coroutine.wrap(function()
-			  repeat
-			    domap(f(s,v))
-			  until done
-			end)
-end
-
 function filter(func, ...)
   assert(func, "filter: needs a function as first argument")
   local t,key,value = {}
@@ -258,25 +249,6 @@ function mapn(func, f, s, v)
   return t
 end
 
-function reduce(func, initial_value, ...)
-  assert(initial_value ~= nil,
-	 "reduce: needs an initial_value as second argument")
-  local accum,key,value = initial_value
-  for key,value in ... do
-    accum = func(accum, value or key)
-  end
-  return accum
-end
-
-function apply(func, f, s, v)
-  if not func then func = function() end end
-  local tmp = table.pack(f(s,v))
-  while tmp[1] ~= nil do
-    func(table.unpack(tmp))
-    tmp = table.pack(f(s,tmp[1]))
-  end
-end
-
 function glob(...)
   local r = {}
   for i,expr in ipairs(table.pack(...)) do
@@ -364,16 +336,6 @@ function fprintf(file,...)
   file:write(string.format(...))
 end
 
-function range(...)
-  local arg = table.pack(...)
-  local inf,sup,step = arg[1],arg[2],arg[3] or 1
-  local i = inf - step
-  return function()
-    i = i + step
-    if i <= sup then return i end
-  end
-end
-
 function check_mandatory_table_fields(fields, t)
   for _,name in ipairs(fields) do
     table.insert(ret, t[name] or error("The "..name.." field is mandatory"))
@@ -1010,135 +972,6 @@ function io.uncommented_lines(filename)
   end
 end
 
----------------------------------------------------------------
----------------------- ITERATOR CLASS -------------------------
----------------------------------------------------------------
-
--- The iterator class is useful to simplify the syntax of map, filter, reduce,
--- and apply functions, introducing a more natural order of application of the
--- functions.
-
-local iterator, iterator_methods = class("iterator")
-_G.iterator = iterator -- make global
-
-function iterator:constructor(...)
-  self.data = table.pack(...)
-end
-
-function iterator.meta_instance:__call() return table.unpack(self.data) end
-
-function iterator_methods:get() return table.unpack(self.data) end
-
-function iterator_methods:step()
-  return self.data[1](table.unpack(table.slice(self.data,2,#self.data)))
-end
-
-function iterator_methods:map(func)
-  return iterator(iterable_map(func, self:get()))
-end
-
-function iterator_methods:filter(func)
-  return iterator(iterable_filter(func, self:get()))
-end
-
-function iterator_methods:apply(func)
-  apply(func, self:get())
-end
-
-function iterator_methods:reduce(func, initial_value)
-  return reduce(func, initial_value, self:get())
-end
-
-function iterator_methods:enumerate()
-  local id = 0
-  return self:map(function(...)
-		    id = id + 1
-		    return id, ...
-		  end)
-end
-
-function iterator_methods:call(funcname, ...)
-  local func_args = table.pack(...)
-  return self:map(function(...)
-		    local arg    = table.pack(...)
-		    local result = {}
-		    for i=1,#arg do
-		      local t = table.pack(arg[i][funcname](arg[i],table.unpack(func_args)))
-		      for j=1,#t do table.insert(result, t[j]) end
-		    end
-		    return table.unpack(result)
-		  end)
-end
-
-function iterator_methods:iterate(iterator_func)
-  return self:map(function(...)
-		    local f,s,v = iterator_func(...)
-		    local tmp   = table.pack(f(s,v))
-		    while tmp[1] ~= nil do
-		      coroutine.yield(table.unpack(tmp))
-		      tmp = table.pack(f(s,tmp[1]))
-		    end
-		  end)
-end
-
-function iterator_methods:concat(sep1,sep2)
-  local sep1,sep2 = sep1 or "",sep2 or sep1 or ""
-  local t = {}
-  self:apply(function(...)
-	       local arg = table.pack(...)
-	       table.insert(t, string.format("%s", table.concat(arg, sep1)))
-	     end)
-  return table.concat(t, sep2)
-end
-
-function iterator_methods:field(...)
-  local f,s,v = self:get()
-  local arg   = table.pack(...)
-  return iterator(function(s)
-		    local tmp = table.pack(f(s,v))
-		    if tmp[1] == nil then return nil end
-		    v = tmp[1]
-		    local ret = { }
-		    for i=1,#tmp do
-		      for j=1,#arg do
-			table.insert(ret, tmp[i][arg[j]])
-		      end
-		    end
-		    return table.unpack(ret)
-		  end,s)
-end
-
-function iterator_methods:select(...)
-  local f,s,v = self:get()
-  local arg   = table.pack(...)
-  for i=1,#arg do arg[i]=tonumber(arg[i]) assert(arg[i],"select: expected a number") end
-  return iterator(function(s)
-		    local tmp = table.pack(f(s,v))
-		    if tmp[1] == nil then return nil end
-		    v = tmp[1]
-		    local selected = {}
-		    for i=1,#arg do selected[i] = tmp[arg[i]] end
-		    return table.unpack(selected)
-		  end,s)
-end
-
-function iterator_methods:table()
-  local t = {}
-  local idx = 1
-  self:apply(function(...)
-	       local v = table.pack(...)
-	       local k = table.remove(v, 1)
-	       if #v == 0 then
-		 k,v = idx,k
-	       elseif #v == 1 then
-		 v = v[1]
-	       end
-	       t[k] = v
-	       idx = idx + 1
-	     end)
-  return t
-end
-
 ----------------------------------------------------------------------------
 
 function util.function_setupvalues(func, upvalues)
@@ -1176,6 +1009,33 @@ function util.function_to_lua_string(func,format)
   return table.concat(t, "")
 end
 
+-- It clones a data object. lookup_table maps originals to their clones, so
+-- shared references stay shared and tables with loops can be cloned.
+function util.clone(data, lookup_table)
+  if data == nil then return nil end
+  local lookup_table = lookup_table or {}
+  local obj = lookup_table[data]
+  if obj then return obj end
+  local tt = type(data)
+  -- immutable values are not registered (a NaN number is not a valid table key)
+  if tt == "number" or tt == "string" or tt == "thread" or tt == "boolean" then return data
+  elseif tt == "function" then obj = clone_function(data, lookup_table)
+  elseif data.clone then obj = data:clone()
+  elseif luatype(data) == "userdata" then obj = data
+  else
+    assert(luatype(data) == "table", "Expected a table")
+    obj = {}
+    lookup_table[data] = obj -- before recursion, so loops in data terminate
+    for i,v in pairs(data) do
+      local clone_i = util.clone(i, lookup_table)
+      local clone_v = util.clone(v, lookup_table)
+      obj[clone_i] = clone_v
+    end
+  end
+  lookup_table[data] = obj
+  return obj
+end
+
 function util.to_lua_string(data,format)
   local tt = luatype(data)
   if tt == "table" then
diff --git a/packages/basics/util/package.lua b/packages/basics/util/package.lua
index 117d0bfc7..5b407cd06 100644
--- a/packages/basics/util/package.lua
+++ b/packages/basics/util/package.lua
@@ -1,6 +1,6 @@
 package{ name = "util",
    version = "1.0",
-   depends = { "class" },
+   depends = { "class", "iterator" },
    keywords = { },
    description = "",
    -- targets como en ant
diff --git a/packages/basics/util/test/test-functional-programming.lua b/packages/basics/util/test/test-functional-programming.lua
deleted file mode 100644
index 7f87115b0..000000000
--- a/packages/basics/util/test/test-functional-programming.lua
+++ /dev/null
@@ -1,66 +0,0 @@
-value = reduce(math.min, math.huge, ipairs({4, 2, 1, 10}))
-assert(value==1)
-assert( iterator(ipairs({4,2,1,10})):reduce(math.min, math.huge) == 1 )
-
-value = reduce(function(acc,v) return acc*2+v end, 0, string.gmatch("01101", "." ))
-assert(value==13)
-assert( iterator(string.gmatch("01101",".")):reduce(function(acc,v)return acc*2+v end, 0) == 13 )
-
-t = { "a", "c", 3, 2 }
-expected = { {1, "a", "a"}, {2, "c", "c"}, {3, 3, 3}, {4, 2, 2} }
-apply(function(i,v1,v2) assert(i==expected[i][1] and v1==expected[i][2] and v2==expected[i][3]) end, multiple_ipairs(t,t))
-iterator(multiple_ipairs(t,t)):apply(function(i,v1,v2) assert(i==expected[i][1] and v1==expected[i][2] and v2==expected[i][3]) end)
-
-tmapped = map(function(v) return v*2 end, ipairs({1, 2, 3, 4}))
-assert(table.concat(tmapped, " ") == "2 4 6 8")
-assert(iterator(ipairs({1,2,3,4})):map(function(i,v) return v*2 end):concat(" ") == "2 4 6 8")
-
-tmapped = map2(function(k,v) return k+v*2 end, ipairs({1, 2, 3, 4}))
-assert(table.concat(tmapped, " ") == "3 6 9 12")
-
-tmapped = mapn(function(idx, ...) return table.pack(...) end,
-	       multiple_ipairs({1, 2, 3, 4},{5, 6, 7, 8}))
-expected = { {1,5},{2,6},{3,7},{4,8} }
-for i,v in ipairs(tmapped) do assert(v[1]==expected[i][1] and v[2]==expected[i][2]) end
-
-t = filter(function(v) return v%2 == 0 end, ipairs{1,2,3,4,5,6,7})
-assert(table.concat(t, " ") == "2 4 6")
-assert( iterator(ipairs{1,2,3,4,5,6,7}):filter(function(i,v) return v%2==0 end):map(function(i,v)return v end):concat(" ") == "2 4 6")
-
-t = { Lemon = "sour", Cake = "nice", }
-expected = {
-  ["lemon is slightly SOUR"]=0,
-  ["cake is slightly NICE"]=0,
-}
-for ingredient, modifier, taste in iterable_map(function(a, b)
-						  return a:lower(),"slightly",b:upper()
-						end, pairs(t)) do
-  local str = ingredient .." is ".. modifier .. " " .. taste
-  assert(expected[str] == 0)
-  expected[str] = expected[str] + 1
-end
-
-t = { Lemon = "sour", Cake = "nice", }
-expected = {
-  ["cake is very NICE"]=0,
-  ["Cake is slightly nice"]=0,
-  ["lemon is very SOUR"]=0,
-  ["Lemon is slightly sour"]=0,
-}
-for ingredient, modifier, taste in iterable_map(function(a, b)
-                                         coroutine.yield(a:lower(),"very",b:upper())
-                                         return a, "slightly", b
-                                       end, pairs(t)) do
-  local str = ingredient .." is ".. modifier .. " " .. taste
-  assert(expected[str]==0)
-  expected[str] = expected[str] + 1
-end
-
-
-idx=1
-expected={2,4,6}
-for v in iterable_filter(function(key,value) return value%2==0 end,
-                         ipairs{1,2,3,4,5,6,7}) do
-  assert(v == expected[idx])
-  idx=idx+1
-end
diff --git a/packages/basics/util/test/test.lua b/packages/basics/util/test/test.lua
index 678f02097..8f81754aa 100644
--- a/packages/basics/util/test/test.lua
+++ b/packages/basics/util/test/test.lua
@@ -3,8 +3,11 @@ local T = utest.test
 
 T("GenericOptionsTest", function()
     check(function() return util.options.test() end)
-    local tbl = util.options.test()
+    local tbl,str2 = util.options.test()
     check.TRUE(tbl.clock1)
     check.TRUE(tbl.clock2)
+    check.TRUE(class.is_a(tbl.clock1, util.stopwatch))
+    check.TRUE(class.is_a(tbl.clock2, util.stopwatch))
     check.eq(tbl.str, "Hello world!")
+    check.eq(str2, util.to_lua_string(tbl))
 end)
diff --git a/packages/bayesian/lua_src/bayesian.lua b/packages/bayesian/lua_src/bayesian.lua
index e38af1144..c79a291da 100644
--- a/packages/bayesian/lua_src/bayesian.lua
+++ b/packages/bayesian/lua_src/bayesian.lua
@@ -1,7 +1,5 @@
 get_table_from_dotted_string("bayesian", true)
 
-local wrap_matrices = matrix.dict.wrap_matrices
-
 -- modifies model weights to be the MAP model for a given eval function
 function bayesian.get_MAP_weights(eval, samples)
   assert(samples, "Needs a table with samples as 2nd argument")
@@ -43,13 +41,11 @@ function bayesian.build_bayes_comb(t)
       local invN    = 1/N
       local which   = rnd:choose(samples)
       local out     = forward(which, input)
-      if class.is_a(out, tokens.base) then out = out:get_matrix() end
       assert(class.is_a(out, matrix), "The forward function must return a matrix")
       local output  = out:clone():scal(invN)
       for i=2,N do
         local which = rnd:choose(samples)
         local out   = forward(which, input)
-        if class.is_a(out, tokens.base) then out = out:get_matrix() end
         output:axpy(invN, out)
       end
       return output
diff --git a/packages/bayesian/lua_src/hmc.lua b/packages/bayesian/lua_src/hmc.lua
index 4fcae8a1e..f6c118f9f 100644
--- a/packages/bayesian/lua_src/hmc.lua
+++ b/packages/bayesian/lua_src/hmc.lua
@@ -1,7 +1,5 @@
 get_table_from_dotted_string("bayesian.optimizer", true)
 
-local wrap_matrices = matrix.dict.wrap_matrices
-
 -- Hamiltonian Monte-Carlo implementation with a basic on-line adaptation of
 -- epsilon, bounded by [epsilon_min,epsilon_max].
 
@@ -19,17 +17,17 @@ local wrap_matrices = matrix.dict.wrap_matrices
 -- implemented to minimize the negative of the log-likelihood (maximize the
 -- log-likelihood).
 --
--- @param theta is a matrix, a table of matrices or a matrix.dict instance.
+-- @param theta is a matrix or a table of matrices.
 local function hmc(self, eval, theta)
   local state       = self.state
   --
   local energies    = state.energies
   local math_log    = math.log
   local math_clamp  = math.clamp
+  local md          = matrix.dict
   local priors      = state.priors
   local samples     = state.samples
   local origw = theta
-  local theta = wrap_matrices(theta)
   --
   local acc_decay   = self:get_option("acc_decay")
   local alpha       = self:get_option("alpha")
@@ -61,7 +59,7 @@ local function hmc(self, eval, theta)
   --
   -- kinetic energy associated with given velocity
   local kinetic_energy = function(vel)
-    return 0.5 * vel:dot(vel)
+    return 0.5 * md.dot(vel,vel)
   end
   --
   -- executes the simulation chain of HMC using leapfrog updates
@@ -72,21 +70,19 @@ local function hmc(self, eval, theta)
     local leapfrog = function(pos, vel, epsilon, i)
       -- from pos(t) and vel(t - eps/2), compute vel(t + eps/2)
       local _,grads = eval_with_priors(origw, i)
-      grads = wrap_matrices(grads)
-      vel:axpy(-epsilon, grads)
+      md.axpy(vel, -epsilon, grads)
       -- from vel(t + eps/2) compute pos(t + eps)
-      pos:axpy(epsilon*inv_mass, vel)
+      md.axpy(pos, epsilon*inv_mass, vel)
       -- local eval_result,grads = eval_with_priors(origw, i)
-      -- vel:axpy(-epsilon*0.5, grads)
+      -- md.axpy(vel, -epsilon*0.5, grads)
     end
     --
     -- compute velocity at time: t + eps/2
     local initial_energy,grads = eval_with_priors(origw, 0)
     initial_energy = scale*initial_energy + priors:compute_neg_log_prior(pos)
-    grads = wrap_matrices(grads)
-    vel:axpy(-0.5*epsilon, grads)
+    md.axpy(vel, -0.5*epsilon, grads)
     -- compute position at time: t + eps
-    pos:axpy(epsilon*inv_mass, vel)
+    md.axpy(pos, epsilon*inv_mass, vel)
     -- compute from 2 to nsteps leapfrog updates
     for i=2,nsteps do
       leapfrog(pos, vel, epsilon, i-1)
@@ -94,8 +90,7 @@ local function hmc(self, eval, theta)
     -- compute velocity at time: t + nsteps*eps
     local final_energy,grads = eval_with_priors(origw, nsteps)
     final_energy = scale*final_energy + priors:compute_neg_log_prior(pos)
-    grads = wrap_matrices(grads)
-    vel:axpy(-0.5*epsilon, grads)
+    md.axpy(vel, -0.5*epsilon, grads)
     return initial_energy, final_energy
   end
   --
@@ -111,20 +106,20 @@ local function hmc(self, eval, theta)
   --
   -- one HMC sample procedure
   local norm01 = state.norm01 or stats.dist.normal()
-  local theta0 = theta:clone() -- for in case of rejection
+  local theta0 = md.clone(theta) -- for in case of rejection
   local vel    = self.state.vel
   local vel0 -- only if persistent
   -- sample velocity from a standard normal distribution
   if persistence == 0.0 or not vel then
-    vel = vel or theta:clone_only_dims()
-    for name,v in pairs(vel) do
+    vel = vel or md.clone_only_dims(theta)
+    for _,v in pairs(vel) do
       norm01:sample(rng, v:rewrap(v:size(), 1))
     end
   else
-    vel0 = vel:clone() -- for in case of rejection
-    vel:scal(-persistence)
-    for name,v in pairs(vel) do
-      local aux = matrix.col_major(v:size(),1)
+    vel0 = md.clone(vel) -- for in case of rejection
+    md.scal(vel, -persistence)
+    for _,v in pairs(vel) do
+      local aux = matrix(v:size(),1)
       norm01:sample(rng, aux)
       v:rewrap(v:size(),1):axpy(spersistence, aux)
     end
@@ -134,7 +129,7 @@ local function hmc(self, eval, theta)
   local initial_kinetic = kinetic_energy(vel) * inv_mass
   -- simulate the HMC mechanics
   local initial_energy, final_energy = simulation(theta, vel, p_epsilon, nsteps)
-  vel:scal(-1.0)
+  md.scal(vel, -1.0)
   local final_kinetic = kinetic_energy(vel) * inv_mass
   -- rejection based in metropolis hastings
   local accept = metropolis_hastings(initial_energy + initial_kinetic,
@@ -145,8 +140,8 @@ local function hmc(self, eval, theta)
   -- if not ok then print(ok, "PROBLEM") end
   if not accept or not ok then
     energy = initial_energy
-    theta:copy(theta0)
-    if persistent then vel:copy(vel0) end
+    md.copy(theta, theta0)
+    if persistent then md.copy(vel, vel0) end
   end
   local accepted = (accept and 1) or 0
   -- accept rate update (exponential mean)
@@ -154,7 +149,7 @@ local function hmc(self, eval, theta)
   --
   self:count_one()
   if self:get_count() % thin == 0 then
-    table.insert(samples, theta:clone())
+    table.insert(samples, md.clone(theta))
     table.insert(energies, energy)
   end
   local acceptance_rate
diff --git a/packages/bayesian/lua_src/metropolis.lua b/packages/bayesian/lua_src/metropolis.lua
index 6479abb30..6d3ca299b 100644
--- a/packages/bayesian/lua_src/metropolis.lua
+++ b/packages/bayesian/lua_src/metropolis.lua
@@ -1,24 +1,22 @@
 get_table_from_dotted_string("bayesian.optimizer", true)
 
-local wrap_matrices = matrix.dict.wrap_matrices
-
 -- Random walk Metropolis update with normal proposals
 
 -- @param eval is a function a function which returns L(Theta). It is
 -- implemented to minimize the negative of the log-likelihood (maximize the
 -- log-likelihood).
 --
--- @param theta is a matrix, a table of matrices or a matrix.dict instance.
+-- @param theta is a matrix or a table of matrices.
 local function metropolis(self, eval, theta)
   local state       = self.state
   --
   local energies    = state.energies
   local math_log    = math.log
   local math_clamp  = math.clamp
+  local md          = matrix.dict
   local priors      = state.priors
   local samples     = state.samples
-  local origw = theta
-  local theta = wrap_matrices(theta)
+  local origw       = theta
   --
   local acc_decay   = self:get_option("acc_decay")
   local epsilon     = state.epsilon or self:get_option("epsilon")
@@ -40,10 +38,10 @@ local function metropolis(self, eval, theta)
   --
   -- one METROPOLIS sample procedure
   local norm01 = state.norm01 or stats.dist.normal()
-  local theta0 = theta:clone() -- for in case of rejection
+  local theta0 = md.clone(theta) -- for in case of rejection
   local eval0_result = table.pack( eval(origw, 0) )
   local initial_energy = scale*eval0_result[1]
-  for name,v in pairs(theta) do
+  for _,v in pairs(theta) do
     local aux = matrix.as(v)
     norm01:sample(rng, aux:rewrap(v:size(),1))
     v:axpy(epsilon, aux)
@@ -55,12 +53,12 @@ local function metropolis(self, eval, theta)
   --
   local result = eval1_result
   local energy = final_energy
-  local ok =  pcall(theta.prune_subnormal_and_check_normal, theta)
+  local ok =  pcall(md.prune_subnormal_and_check_normal, theta)
   -- if not ok then print(ok, "PROBLEM") end
   if not accept or not ok then
     energy = initial_energy
     result = eval0_result
-    theta:copy(theta0)
+    md.copy(theta,theta0)
   end
   local accepted = (accept and 1) or 0
   -- accept rate update (exponential mean)
@@ -68,7 +66,7 @@ local function metropolis(self, eval, theta)
   --
   self:count_one()
   if self:get_count() % thin == 0 then
-    table.insert(samples, theta:clone())
+    table.insert(samples, md.clone(theta))
     table.insert(energies, energy)
   end
   local acceptance_rate
diff --git a/packages/bayesian/lua_src/nuts.lua b/packages/bayesian/lua_src/nuts.lua
index 2022e1f54..6059c5289 100644
--- a/packages/bayesian/lua_src/nuts.lua
+++ b/packages/bayesian/lua_src/nuts.lua
@@ -1,7 +1,5 @@
 get_table_from_dotted_string("bayesian.optimizer", true)
 
-local wrap_matrices = matrix.dict.wrap_matrices
-
 -- Radford M. Neal. MCMC using Hamiltonian dynamics. 2010
 -- http://www.cs.toronto.edu/~radford/ham-mcmc.abstract.html
 
diff --git a/packages/bayesian/lua_src/priors.lua b/packages/bayesian/lua_src/priors.lua
index dd8c2655a..86367dbea 100644
--- a/packages/bayesian/lua_src/priors.lua
+++ b/packages/bayesian/lua_src/priors.lua
@@ -1,7 +1,5 @@
 get_table_from_dotted_string("bayesian", true)
 
-local wrap_matrices = matrix.dict.wrap_matrices
-
 ------------------------------------------------------------------------------
 
 local make_value = function(value)
@@ -68,7 +66,7 @@ function priors_class:constructor(tree,order,outcomes)
 end
 
 function priors_methods:compute_neg_log_prior(weights)
-  local weights = wrap_matrices(weights or {})
+  error("NOT IMPLEMENTED")
   local logprob = 0.0
   for name,m in pairs(self.outcomes) do
     local d = self.tree[name].obj
@@ -120,7 +118,6 @@ end
 
 function priors_methods:sample(rng, weights)
   local outcomes = {}
-  local weights  = wrap_matrices(weights or {})
   for _,name in ipairs(self.order) do
     local v = assert( self.tree[name] )
     local s = sampling_funcs[v.t](v, outcomes)
@@ -135,8 +132,6 @@ function priors_methods:sample(rng, weights)
 end
 
 function priors_methods:update_gradients_with_priors(weights, grads)
-  local weights  = wrap_matrices(weights or {})
-  local grads  = wrap_matrices(grads or {})
   for name,w in pairs(weights) do
     local wgrads = assert( grads(name) )
     local v = self.tree[name]
diff --git a/packages/bayesian/test/demo_hmc.lua b/packages/bayesian/test/demo_hmc.lua
index 42b2b2b9a..25db2bb6e 100644
--- a/packages/bayesian/test/demo_hmc.lua
+++ b/packages/bayesian/test/demo_hmc.lua
@@ -1,13 +1,13 @@
 local gp = require "april_tools.gnuplot"()
 local rnd = random(1234)
-local x = stats.dist.normal(0,1):sample(rnd, matrix.col_major(2,1)):transpose()
+local x = stats.dist.normal(0,1):sample(rnd, matrix(2,1)):transpose()
 
 -- A = inv([1, 1.98; 1.98, 4]);
-local A = matrix.col_major(2,2,{ 50.251256, -24.874372,
-                                   -24.874372, 12.562814 })
+local A = matrix(2,2,{ 50.251256, -24.874372,
+                         -24.874372, 12.562814 })
 
 function plot_samples(samples)
-  local data = matrix.col_major(#samples,2)
+  local data = matrix(#samples,2)
   for i=1,#samples do
     data(i,':'):copy(samples[i]("x"))
   end
diff --git a/packages/bayesian/test/demo_metropolis.lua b/packages/bayesian/test/demo_metropolis.lua
index dbf677bc6..a9621f3a7 100644
--- a/packages/bayesian/test/demo_metropolis.lua
+++ b/packages/bayesian/test/demo_metropolis.lua
@@ -1,13 +1,13 @@
 local gp = require "april_tools.gnuplot"()
 local rnd = random(1234)
-local x = stats.dist.normal(0,1):sample(rnd, matrix.col_major(2,1)):transpose()
+local x = stats.dist.normal(0,1):sample(rnd, matrix(2,1)):transpose()
 
 -- A = inv([1, 1.98; 1.98, 4]);
-local A = matrix.col_major(2,2,{ 50.251256, -24.874372,
-                                   -24.874372, 12.562814 })
+local A = matrix(2,2,{ 50.251256, -24.874372,
+                         -24.874372, 12.562814 })
 
 function plot_samples(samples)
-  local data = matrix.col_major(#samples,2)
+  local data = matrix(#samples,2)
   for i=1,#samples do
     data(i,':'):copy(samples[i]("x"))
   end
diff --git a/packages/bayesian/test/test_digits_hmc.lua b/packages/bayesian/test/test_digits_hmc.lua
index 6d8f225a3..bfd0f1dad 100644
--- a/packages/bayesian/test/test_digits_hmc.lua
+++ b/packages/bayesian/test/test_digits_hmc.lua
@@ -146,7 +146,7 @@ for j=1,#trainers do
   local bayesian_model = bayesian.build_bayes_comb{
     forward = function(weights, input)
       thenet:build{ weights = weights }
-      return thenet:forward(input):get_matrix()
+      return thenet:forward(input)
     end,
     N=1000,
     shuffle=rnd,
diff --git a/packages/bayesian/test/test_digits_metropolis.lua b/packages/bayesian/test/test_digits_metropolis.lua
index 36f7a2f82..49094cdfe 100644
--- a/packages/bayesian/test/test_digits_metropolis.lua
+++ b/packages/bayesian/test/test_digits_metropolis.lua
@@ -139,7 +139,7 @@ for j=1,#trainers do
   local bayesian_model = bayesian.build_bayes_comb{
     forward = function(weights, input)
       thenet:build{ weights = weights }
-      return thenet:forward(input):get_matrix()
+      return thenet:forward(input)
     end,
     N=1000,
     shuffle=rnd,
diff --git a/packages/clustering/kmeans/matrix/lua_src/kmeans_matrix.lua b/packages/clustering/kmeans/matrix/lua_src/kmeans_matrix.lua
index cde8c67f3..13ecda33f 100644
--- a/packages/clustering/kmeans/matrix/lua_src/kmeans_matrix.lua
+++ b/packages/clustering/kmeans/matrix/lua_src/kmeans_matrix.lua
@@ -19,8 +19,6 @@ function funcs.find_clusters(X,C,T,verbose)
   local Cdim = C:dim()
   assert(#Xdim == 2, "Data matrix must be bi-dimensional")
   assert(#Cdim == 2, "Centroids matrix must be bi-dimensional")
-  assert(X:get_major_order() == C:get_major_order(),
-	 "Given matrices with different major order")
   local N = Xdim[1] -- number of samples
   local D = Xdim[2] -- number of features (dimensions)
   local K = Cdim[1] -- number of clusters
@@ -33,7 +31,7 @@ function funcs.find_clusters(X,C,T,verbose)
 	       N)
   --
   local auxXblock,mins
-  local Mnew       = matrix[X:get_major_order()]
+  local Mnew       = matrix
   local M2Y        = Mnew(BSIZE,K)
   local CScores    = Mnew(K):zeros()
   local CSqScores  = Mnew(K):zeros()
@@ -103,8 +101,6 @@ function funcs.basic(X,C,params)
   local Cdim = C:dim()
   assert(#Xdim == 2, "Data matrix must be bi-dimensional")
   assert(#Cdim == 2, "Centroids matrix must be bi-dimensional")
-  assert(X:get_major_order() == C:get_major_order(),
-	 "Given matrices with different major order")
   local N = Xdim[1] -- number of samples
   local D = Xdim[2] -- number of features (dimensions)
   local K = Cdim[1] -- number of clusters
@@ -113,7 +109,7 @@ function funcs.basic(X,C,params)
 	       D, Cdim[2])
   local max_iter    = params.max_iter
   local threshold   = params.threshold
-  local Mnew        = matrix[X:get_major_order()]
+  local Mnew        = matrix
   local M2Y         = Mnew(BSIZE,K)
   local Csum        = Mnew(K,D)
   local Csq         = Mnew(K,D)
@@ -236,8 +232,6 @@ function funcs.refine(X,C,params)
   local Cdim = C:dim()
   assert(#Xdim == 2, "Data matrix must be bi-dimensional")
   assert(#Cdim == 2, "Centroids matrix must be bi-dimensional")
-  assert(X:get_major_order() == C:get_major_order(),
-	 "Given matrices with different major order")
   local N = Xdim[1] -- number of samples
   local D = Xdim[2] -- number of features (dimensions)
   local K = Cdim[1] -- number of clusters
@@ -247,7 +241,7 @@ function funcs.refine(X,C,params)
 	       "Different columns found between data and centroids: %d ~= %d\n",
 	       D, Cdim[2])
   local num_samples = math.max(K, math.round(N * params.percentage))
-  local Mnew = matrix[X:get_major_order()]
+  local Mnew = matrix
   local S = Mnew(num_samples, D)
   local CM = Mnew(J, K, D)
   local FM = matrix.as(CM)
@@ -329,7 +323,7 @@ local function metatable_call(self,params)
   local distortion
   if not centroids then
     assert(random, "Field random is mandatory when not given centroids")
-    centroids = matrix[data:get_major_order()](params.K,data:dim(2))
+    centroids = matrix(params.K,data:dim(2))
     distortion = funcs.refine(data, centroids, {
 				max_iter   = params.max_iter,
 				random     = params.random,
diff --git a/packages/imaging/Image/binding/bind_image_RGB.lua.cc b/packages/imaging/Image/binding/bind_image_RGB.lua.cc
index 98a91094d..c0ed219db 100644
--- a/packages/imaging/Image/binding/bind_image_RGB.lua.cc
+++ b/packages/imaging/Image/binding/bind_image_RGB.lua.cc
@@ -55,7 +55,6 @@ using namespace Imaging;
   float_rgb_mem = img->getRawDataAccess()->reinterpretAs<FloatRGB>();
   int dims[2] = { img->getDimSize(0), img->getDimSize(1) };
   Basics::Matrix<FloatRGB> *img_rgb = new Basics::Matrix<FloatRGB>(2, dims,
-                                                                   CblasRowMajor,
                                                                    float_rgb_mem);
   //
   obj = new ImageFloatRGB(img_rgb);
@@ -138,7 +137,6 @@ using namespace Imaging;
   mat_mem = img_rgb->getRawDataAccess()->reinterpretAs<float>();
   int dims[3] = { img_rgb->getDimSize(0), img_rgb->getDimSize(1), 3 };
   Basics::MatrixFloat *output = new Basics::MatrixFloat(3, dims,
-                                                        img_rgb->getMajorOrder(),
                                                         mat_mem);
   LUABIND_RETURN(MatrixFloat, output);
 }
diff --git a/packages/imaging/Image/c_src/image.cc b/packages/imaging/Image/c_src/image.cc
index 4f263afe5..4131ece20 100644
--- a/packages/imaging/Image/c_src/image.cc
+++ b/packages/imaging/Image/c_src/image.cc
@@ -42,8 +42,7 @@ namespace Imaging {
   template <typename T>
   Image<T>::Image(Basics::Matrix<T> *mat) {
     if (!mat->isSimple())
-      ERROR_EXIT(128, "Image only works with simple matrices "
-                 "(contiguous, and in row-major\n");
+      ERROR_EXIT(128, "Image only works with contiguous matrices\n");
     // if (mat->numDim != 2) { ... } // <- TODO
     matrix = mat;
     IncRef(matrix); // garbage collection
@@ -101,8 +100,7 @@ namespace Imaging {
     int dims[2];
     dims[0] = h;
     dims[1] = w;
-    Basics::Matrix<T> *mat = new Basics::Matrix<T>(2, dims,
-                                                   matrix->getMajorOrder());
+    Basics::Matrix<T> *mat = new Basics::Matrix<T>(2, dims);
     Image<T>  *img = new Image<T>(mat);
 
     AprilMath::MatrixExt::Operations::matFill(mat, default_color);
@@ -185,7 +183,7 @@ namespace Imaging {
   void Image<T>::projection_v(Basics::Matrix<T> **m) const {
     int dims[1];
     dims[0] = width();
-    *m = new Basics::Matrix<T>(1, dims, matrix->getMajorOrder());
+    *m = new Basics::Matrix<T>(1, dims);
     projection_v((*m)->getRawDataAccess()->getPPALForWrite());
   }
 
@@ -207,7 +205,7 @@ namespace Imaging {
   void Image<T>::projection_h(Basics::Matrix<T> **m) const {
     int dims[1];
     dims[0] = height();
-    *m = new Basics::Matrix<T>(1, dims, matrix->getMajorOrder());
+    *m = new Basics::Matrix<T>(1, dims);
     projection_h((*m)->getRawDataAccess()->getPPALForWrite());
   }
 
@@ -237,8 +235,7 @@ namespace Imaging {
 
     //printf("dims = %dfilas x %dcolumnas\n", dims[0], dims[1]);
 	
-    Basics::Matrix<T> *mat = new Basics::Matrix<T>(2, dims,
-                                                   matrix->getMajorOrder());
+    Basics::Matrix<T> *mat = new Basics::Matrix<T>(2, dims);
     Image<T>  *img = new Image<T>(mat);
   
     if (angle > 0) {
@@ -567,8 +564,7 @@ namespace Imaging {
     dimensions[0] = width();
     dimensions[1] = height();
 
-    Basics::Matrix<T> *new_mat = new Basics::Matrix<T>(2, dimensions,
-                                                       matrix->getMajorOrder());
+    Basics::Matrix<T> *new_mat = new Basics::Matrix<T>(2, dimensions);
     Image<T> *result = new Image<T>(new_mat);
   
     typename Basics::Matrix<T>::const_random_access_iterator
@@ -592,8 +588,7 @@ namespace Imaging {
     dimensions[0] = width();
     dimensions[1] = height();
 
-    Basics::Matrix<T> *new_mat = new Basics::Matrix<T>(2, dimensions,
-                                                       matrix->getMajorOrder());
+    Basics::Matrix<T> *new_mat = new Basics::Matrix<T>(2, dimensions);
     Image<T> *result = new Image<T>(new_mat);
   
     typename Basics::Matrix<T>::const_random_access_iterator
@@ -646,8 +641,7 @@ namespace Imaging {
     dimensions[0]=height();
     dimensions[1]=width() - nblanco;
 	
-    Basics::Matrix<T> *new_mat = new Basics::Matrix<T>(2, dimensions,
-                                                       matrix->getMajorOrder());
+    Basics::Matrix<T> *new_mat = new Basics::Matrix<T>(2, dimensions);
     Image<T> *result = new Image<T>(new_mat);
   
     typename Basics::Matrix<T>::random_access_iterator dst_it(new_mat);
@@ -702,7 +696,6 @@ namespace Imaging {
       new AprilMath::GPUMirroredMemoryBlock<float>(25, k);
     // prepare kernel matrix
     Basics::Matrix<T> *kernel_mat = new Basics::Matrix<T>(4, dimensions,
-                                                          matrix->getMajorOrder(),
                                                           k_mem_block);
     // add padding to image
     Basics::Matrix<T> *padded_this_mat = matrix->padding(2, default_color);
diff --git a/packages/knn/kdtree/test/test-digits.lua b/packages/knn/kdtree/test/test-digits.lua
index 1b3c09657..75db5e76e 100644
--- a/packages/knn/kdtree/test/test-digits.lua
+++ b/packages/knn/kdtree/test/test-digits.lua
@@ -29,14 +29,12 @@ T("KDTreeTest", function()
     end
 
     if DO_PCA then
-      local U,S = stats.pca(train_data:clone("col_major"))
-      U=U:clone("row_major")
-      S=S:clone("row_major")
-      train_data = stats.pca_whitening(train_data,U,S,PCA_EPSILON)
+      local U,S = stats.pca(train_data)
+      train_data = stats.pca.whitening(train_data,U,S,PCA_EPSILON)
       -- print(stats.pca_threshold(S,0.99))
       train_data = train_data(':',{1,TOP_PCA})
       
-      val_data = stats.pca_whitening(val_data,U,S,PCA_EPSILON)
+      val_data = stats.pca.whitening(val_data,U,S,PCA_EPSILON)
       val_data = val_data(':',{1,TOP_PCA})
     end
 
diff --git a/packages/language_model/LM_interface/lua_src/test_set_ppl.lua b/packages/language_model/LM_interface/lua_src/test_set_ppl.lua
index b9985cffc..f07f95870 100644
--- a/packages/language_model/LM_interface/lua_src/test_set_ppl.lua
+++ b/packages/language_model/LM_interface/lua_src/test_set_ppl.lua
@@ -65,7 +65,7 @@ function language_models.get_sentence_prob(params)
     sum = sum + p
   end
 
-  for word_id,word in words_it() do
+  for word_id,word in words_it do
     -- the word which will be passed to print_pw function; a showed_word==nil
     -- means to show nothing
     local printed_word
@@ -250,7 +250,7 @@ function language_models.test_set_ppl(params)
   local lines_it = iterator(io.lines(testset)):
   map( function(line) return line,iterator(line:gmatch("[^%s]+")) end )
 
-  for sentence,words_it in lines_it() do
+  for sentence,words_it in lines_it do
     words_it = words_it:map( function(w) return (vocab:getWordId(w) or unk_id),w end )
     local use_sentence = true
     if train_restriction then
diff --git a/packages/metrics/roc/test/test_roc.lua b/packages/metrics/roc/test/test_roc.lua
index 3937b2b2d..eb49a36b8 100644
--- a/packages/metrics/roc/test/test_roc.lua
+++ b/packages/metrics/roc/test/test_roc.lua
@@ -11,15 +11,9 @@ T("ROCTest", function()
     check.number_eq( metrics.roc( matrix{0.2,0.3,0.4,0.5},
                                   matrix{0,1,0,1} ):compute_area(),
                      0.75 )
-    check.number_eq( metrics.roc( matrix.col_major{0.2,0.3,0.4,0.5},
-                                  matrix.col_major{0,1,0,1} ):compute_area(),
-                     0.75 )
     check.eq( metrics.roc( matrix{0.2,0.3,0.4,0.5},
                            matrix{1,0,0,0} ):compute_area(),
               0.0 )
-    check.eq( metrics.roc( matrix.col_major{0.2,0.3,0.4,0.5},
-                           matrix.col_major{1,0,0,0} ):compute_area(),
-              0.0 )
     check.number_eq( metrics.roc( matrix{0.2,0.3,0.4,0.5},
                                   matrix{0,0,1,0} ):compute_area(),
                      0.66 )
diff --git a/packages/misc/matlab/binding/bind_matlab.lua.cc b/packages/misc/matlab/binding/bind_matlab.lua.cc
index c7202097f..e5418c9fb 100644
--- a/packages/misc/matlab/binding/bind_matlab.lua.cc
+++ b/packages/misc/matlab/binding/bind_matlab.lua.cc
@@ -160,10 +160,8 @@ typedef MatFileReader::StructureDataElement MatStructureDataElement;
 
 //BIND_METHOD MatTaggedDataElement get_matrix
 {
-  bool col_major;
-  LUABIND_GET_OPTIONAL_PARAMETER(1, bool, col_major, false);
   char name[MAX_NAME_SIZE];
-  Basics::MatrixFloat *m = obj->getMatrix(name, MAX_NAME_SIZE, col_major);
+  Basics::MatrixFloat *m = obj->getMatrix(name, MAX_NAME_SIZE);
   if (m != 0) {
     LUABIND_RETURN(MatrixFloat, m);
     LUABIND_RETURN(string, name);
@@ -173,10 +171,8 @@ typedef MatFileReader::StructureDataElement MatStructureDataElement;
 
 //BIND_METHOD MatTaggedDataElement get_matrix_complex
 {
-  bool col_major;
-  LUABIND_GET_OPTIONAL_PARAMETER(1, bool, col_major, false);
   char name[MAX_NAME_SIZE];
-  Basics::MatrixComplexF *m = obj->getMatrixComplexF(name, MAX_NAME_SIZE, col_major);
+  Basics::MatrixComplexF *m = obj->getMatrixComplexF(name, MAX_NAME_SIZE);
   LUABIND_RETURN(MatrixComplexF, m);
   LUABIND_RETURN(string, name);
 }
diff --git a/packages/misc/matlab/c_src/matlab.cc b/packages/misc/matlab/c_src/matlab.cc
index 0b4f709d0..829f10043 100644
--- a/packages/misc/matlab/c_src/matlab.cc
+++ b/packages/misc/matlab/c_src/matlab.cc
@@ -132,8 +132,8 @@ namespace Matlab {
   }
 
   template<typename T>
-  void readMatrixData(MatrixFloat::col_major_iterator &m_it,
-                      MatrixFloat::col_major_iterator &end,
+  void readMatrixData(MatrixFloat::iterator &m_it,
+                      MatrixFloat::iterator &end,
                       const T *ptr, const uint32_t nbytes) {
     UNUSED_VARIABLE(end);
     for (uint32_t ptr_pos=0; ptr_pos < nbytes; ptr_pos += sizeof(T), ++ptr) {
@@ -145,8 +145,8 @@ namespace Matlab {
   }
 
   template<typename T>
-  void readMatrixData(MatrixComplexF::col_major_iterator &m_it,
-                      MatrixComplexF::col_major_iterator &end,
+  void readMatrixData(MatrixComplexF::iterator &m_it,
+                      MatrixComplexF::iterator &end,
                       const T *ptr_real, const T *ptr_img,
                       const uint32_t nbytes) {
     UNUSED_VARIABLE(end);
@@ -173,8 +173,8 @@ namespace Matlab {
   }
 
   template<typename T>
-  void readMatrixData(MatrixDouble::col_major_iterator &m_it,
-                      MatrixDouble::col_major_iterator &end,
+  void readMatrixData(MatrixDouble::iterator &m_it,
+                      MatrixDouble::iterator &end,
                       const T *ptr, const uint32_t nbytes) {
     UNUSED_VARIABLE(end);
     for (uint32_t ptr_pos=0; ptr_pos < nbytes; ptr_pos += sizeof(T), ++ptr) {
@@ -186,8 +186,8 @@ namespace Matlab {
   }
 
   template<typename T>
-  void readMatrixData(MatrixChar::col_major_iterator &m_it,
-                      MatrixChar::col_major_iterator &end,
+  void readMatrixData(MatrixChar::iterator &m_it,
+                      MatrixChar::iterator &end,
                       const T *ptr, const uint32_t nbytes) {
     UNUSED_VARIABLE(end);
     for (uint32_t ptr_pos=0; ptr_pos < nbytes; ptr_pos += sizeof(T), ++ptr) {
@@ -198,8 +198,8 @@ namespace Matlab {
   }
 
   template<typename T>
-  void readMatrixData(MatrixInt32::col_major_iterator &m_it,
-                      MatrixInt32::col_major_iterator &end,
+  void readMatrixData(MatrixInt32::iterator &m_it,
+                      MatrixInt32::iterator &end,
                       const T *ptr, const uint32_t nbytes) {
     UNUSED_VARIABLE(end);
     for (uint32_t ptr_pos=0; ptr_pos < nbytes; ptr_pos += sizeof(T), ++ptr) {
@@ -365,8 +365,9 @@ namespace Matlab {
     // traversing in col_major the real/img part of the matrix will be traversed
     // last, so it is possible add all real components in a first step, and in a
     // second step to add all the imaginary components
-    MatrixChar::col_major_iterator it(m->begin());
-    MatrixChar::col_major_iterator end(m->end());
+    AprilUtils::SharedPtr< MatrixChar > mT(m->transpose());
+    MatrixChar::iterator it(mT->begin());
+    MatrixChar::iterator end(mT->end());
     // this loop traverses all the real components, and later all the imaginary
     // components (if any)
     switch(real_part->getDataType()) {
@@ -397,8 +398,7 @@ namespace Matlab {
   }
 
   MatrixFloat *MatFileReader::TaggedDataElement::getMatrix(char *name,
-                                                           size_t maxsize,
-                                                           bool col_major) {
+                                                           size_t maxsize) {
     if (getDataType() != MATRIX) {
       ERROR_PRINT1("Impossible to get a Matrix from a non "
                    "Matrix element (type %d)\n", getDataType());
@@ -438,11 +438,11 @@ namespace Matlab {
     for (int i=0; i<num_dims; ++i)
       dims[i] = static_cast<int>(const_dims[i]);
     MatrixFloat *m;
-    m = new MatrixFloat(num_dims, dims,
-                        (col_major)?CblasColMajor:CblasRowMajor);
+    m = new MatrixFloat(num_dims, dims);
     // traversing in col_major
-    MatrixFloat::col_major_iterator it(m->begin());
-    MatrixFloat::col_major_iterator end(m->end());
+    AprilUtils::SharedPtr< MatrixFloat > mT(m->transpose());
+    MatrixFloat::iterator it(mT->begin());
+    MatrixFloat::iterator end(mT->end());
     switch(real_part->getDataType()) {
     case SINGLE:
       readMatrixData(it, end, real_part->getData<const float*>(),
@@ -490,7 +490,7 @@ namespace Matlab {
   }
 
   MatrixComplexF *MatFileReader::TaggedDataElement::
-  getMatrixComplexF(char *name, size_t maxsize, bool col_major) {
+  getMatrixComplexF(char *name, size_t maxsize) {
     if (getDataType() != MATRIX) {
       ERROR_PRINT1("Impossible to get a Matrix from a non "
                    "Matrix element (type %d)\n", getDataType());
@@ -521,11 +521,11 @@ namespace Matlab {
     for (int i=0; i<num_dims; ++i)
       dims[i] = static_cast<int>(const_dims[i]);
     MatrixComplexF *m;
-    m = new MatrixComplexF(num_dims, dims,
-                           (col_major)?CblasColMajor:CblasRowMajor);
+    m = new MatrixComplexF(num_dims, dims);
     // traversing in col_major
-    MatrixComplexF::col_major_iterator it(m->begin());
-    MatrixComplexF::col_major_iterator end(m->end());
+    AprilUtils::SharedPtr< MatrixComplexF > mT(m->transpose());
+    MatrixComplexF::iterator it(mT->begin());
+    MatrixComplexF::iterator end(mT->end());
     if (real_part->getDataType() != img_part->getDataType())
       ERROR_EXIT(256, "Found different data-type for real and imaginary part\n");
     switch(real_part->getDataType()) {
@@ -633,8 +633,9 @@ namespace Matlab {
     MatrixDouble *m;
     m = new MatrixDouble(num_dims, dims);
     // traversing in col_major
-    MatrixDouble::col_major_iterator it(m->begin());
-    MatrixDouble::col_major_iterator end(m->end());
+    AprilUtils::SharedPtr< MatrixDouble > mT(m->transpose());
+    MatrixDouble::iterator it(mT->begin());
+    MatrixDouble::iterator end(mT->end());
     switch(real_part->getDataType()) {
     case INT8:
       readMatrixData(it, end, real_part->getData<const int8_t*>(),
@@ -739,8 +740,9 @@ namespace Matlab {
     MatrixInt32 *m;
     m = new MatrixInt32(num_dims, dims);
     // traversing in col_major
-    MatrixInt32::col_major_iterator it(m->begin());
-    MatrixInt32::col_major_iterator end(m->end());
+    AprilUtils::SharedPtr< MatrixInt32 > mT(m->transpose());
+    MatrixInt32::iterator it(mT->begin());
+    MatrixInt32::iterator end(mT->end());
     switch(real_part->getDataType()) {
     case INT8:
       readMatrixData(it, end, real_part->getData<const int8_t*>(),
diff --git a/packages/misc/matlab/c_src/matlab.h b/packages/misc/matlab/c_src/matlab.h
index ce3a96e67..ef2ddf5d1 100644
--- a/packages/misc/matlab/c_src/matlab.h
+++ b/packages/misc/matlab/c_src/matlab.h
@@ -142,10 +142,9 @@ namespace Matlab {
       // SUB-ELEMENTS
       TaggedDataElement *getNextSubElement();
       // FOR NUMERIC TYPES (casting)
-      Basics::MatrixFloat *getMatrix(char *name, size_t maxsize, bool col_major=false);
+      Basics::MatrixFloat *getMatrix(char *name, size_t maxsize);
       // FOR NUMERIC TYPES (casting)
-      Basics::MatrixComplexF *getMatrixComplexF(char *name, size_t maxsize,
-                                                bool col_major=false);
+      Basics::MatrixComplexF *getMatrixComplexF(char *name, size_t maxsize);
       // FOR NUMERIC TYPES (casting)
       Basics::MatrixDouble *getMatrixDouble(char *name, size_t maxsize);
       virtual uint32_t getClass();
diff --git a/packages/misc/matlab/lua_src/matlab.lua b/packages/misc/matlab/lua_src/matlab.lua
index b80b095c6..b5fc63318 100644
--- a/packages/misc/matlab/lua_src/matlab.lua
+++ b/packages/misc/matlab/lua_src/matlab.lua
@@ -14,10 +14,10 @@ end
 
 -- this function receives an element and returns its corresponding APRIL-ANN Lua
 -- object
-function matlab.tolua(element,col_major)
+function matlab.tolua(element)
   if element:get_type() == matlab.types.matrix then
     local func = class_tolua_table[element:get_class()]
-    if func then return func(element,col_major)
+    if func then return func(element)
     else error("Not recognized class: " .. matlab.classes[element:get_class()])
     end
   else
@@ -30,22 +30,22 @@ end
 -----------------------------
 -- CLASS BUILDER FUNCTIONS --
 -----------------------------
-local function tomatrix(e,col_major)
-  local elem,name = e:get_matrix(col_major)
+local function tomatrix(e)
+  local elem,name = e:get_matrix()
   if elem ~= nil then
     print("# Loading matrix float element: ", name)
   else
-    elem,name = e:get_matrix_complex(col_major)
+    elem,name = e:get_matrix_complex()
     print("# Loading matrix complex element: ", name)
   end
   return elem,name
 end
-local function tomatrixdouble(e,col_major)
+local function tomatrixdouble(e)
   local elem,name = e:get_matrix_double()
   if elem ~= nil then
     print("# Loading matrix double element: ", name)
   else
-    elem,name = e:get_matrix_complex(col_major)
+    elem,name = e:get_matrix_complex()
     print("# Loading matrix complex (casted from double) element: ", name)
   end
   return elem,name
@@ -64,24 +64,24 @@ local function tomatrixchar(e)
   print("# Loading matrix char element:  ", name)
   return elem,name
 end
-local function tocellarray(e,col_major)
+local function tocellarray(e)
   local cell_array,name = e:get_cell_array()
   local wrapper = class_wrapper(cell_array)
   wrapper = class_instance(wrapper, class.of(cell_array))
   wrapper.get = function(obj, ...)
-    return matlab.tolua(cell_array:get(...),col_major)
+    return matlab.tolua(cell_array:get(...))
   end
   wrapper.raw_get = function(obj, ...)
-    return matlab.tolua(cell_array:raw_get(...),col_major)
+    return matlab.tolua(cell_array:raw_get(...))
   end
   print("# Loading cell array element:   ", name, cell_array)
   return wrapper,name
 end
-local function tostructure(e,col_major)
+local function tostructure(e)
   local dictionary,name = e:get_structure()
   for ename,elem in pairs(dictionary) do
     print("# Loading structure element:  ", name, ename, elem)
-    dictionary[ename] = matlab.tolua(elem,col_major)
+    dictionary[ename] = matlab.tolua(elem)
   end
   return dictionary,name
 end
@@ -152,13 +152,12 @@ end
 -- reads a MAT file and returns a Lua table with all the elements, indexed by
 -- its names, and recursively containing matrix, cell_array or struct objects
 -- with all the data
-function matlab.read(path,col_major)
+function matlab.read(path)
   assert(path and type(path)=="string", "First argument must be a path string")
-  local col_major = col_major or false
   local reader    = matlab.reader(path)
   local elements  = {}
   for e in reader:elements() do
-    local lua_element,name = matlab.tolua(e,col_major)
+    local lua_element,name = matlab.tolua(e)
     elements[name] = lua_element
   end
   setmetatable(elements,
diff --git a/packages/trainable/lua_src/qlearning.lua b/packages/trainable/lua_src/qlearning.lua
index fb8504e53..18be91365 100644
--- a/packages/trainable/lua_src/qlearning.lua
+++ b/packages/trainable/lua_src/qlearning.lua
@@ -3,6 +3,8 @@ local trainable_qlearning_trainer,trainable_qlearning_trainer_methods =
 trainable = trainable or {} -- global environment
 trainable.qlearning_trainer = trainable_qlearning_trainer -- global environment
 
+local md = matrix.dict
+
 -----------------------------
 -- QLEARNING TRAINER CLASS --
 -----------------------------
@@ -13,8 +15,8 @@ function trainable_qlearning_trainer:constructor(t)
       sup_trainer = { isa_match=trainable.supervised_trainer, mandatory=true },
       discount = { type_match="number", mandatory=true, default=0.6 },
       lambda = { type_match="number", mandatory=true, default=0.6 },
-      gradients = { mandatory=false, default=matrix.dict() },
-      traces = { mandatory=false, default=matrix.dict() },
+      gradients = { mandatory=false, default={} },
+      traces = { mandatory=false, default={} },
       noise = { mandatory=false, default=ann.components.base() },
       clampQ = { mandatory=false },
       nactions = { mandatory=false, type_match="number" },
@@ -56,7 +58,7 @@ local function trainable_qlearning_trainer_train(self, prev_state, prev_action,
   local prev_state = noise:forward(prev_state, true)
   noise:reset(0)
   local state = noise:forward(state, true)
-  local error_grad = matrix.col_major(1, nactions):zeros()
+  local error_grad = matrix(1, nactions):zeros()
   local needs_gradient = optimizer:needs_property("gradient")
   local loss,Qsp,Qs
   loss,gradients,Qsp,Qs,expected_Qsa =
@@ -66,8 +68,8 @@ local function trainable_qlearning_trainer_train(self, prev_state, prev_action,
                           thenet:build{ weights = weights }
                         end
                         thenet:reset(it)
-                        local Qsp = thenet:forward(state):get_matrix()
-                        local Qs  = thenet:forward(prev_state,true):get_matrix()
+                        local Qsp = thenet:forward(state)
+                        local Qs  = thenet:forward(prev_state,true)
                         local Qsa = Qs:get(1, prev_action)
                         local delta = reward + discount * Qsp:max() - Qsa
                         local diff = delta
@@ -82,8 +84,8 @@ local function trainable_qlearning_trainer_train(self, prev_state, prev_action,
                               traces[name] = matrix.as(g):zeros()
                             end
                           end
-                          traces:scal(lambda*discount)
-                          traces:axpy(1.0, gradients)
+                          md.scal( traces, lambda*discount )
+                          md.axpy( traces, 1.0, gradients )
                           return loss,traces,Qsp,Qs,expected_Qsa
                         else
                           return loss,nil,Qsp,Qs,expected_Qsa
@@ -116,7 +118,7 @@ function trainable_qlearning_trainer_methods:one_step(action, state, reward)
   else
     self.noise:reset(0)
     local state = self.noise:forward(state,true)
-    Qsp = self.thenet:forward(state):get_matrix()
+    Qsp = self.thenet:forward(state)
   end
   self.prev_state = state
   return Qsp
@@ -209,10 +211,10 @@ function trainable_batch_builder_methods:add(prev_state, output, action, reward)
   assert(type(reward) == "number",  "Needs a matrix as 4th argument")
   table.insert(self.batch,
                {
-                 prev_state:clone("row_major"):rewrap(prev_state:size()),
+                 prev_state:clone():rewrap(prev_state:size()),
                  action,
                  reward,
-                 output:clone("row_major"):rewrap(output:size()),
+                 output:clone():rewrap(output:size()),
                })
   if self.state_size then
     assert(self.state_size == prev_state:size(), "Found different state sizes")
diff --git a/packages/trainable/lua_src/supervised.lua b/packages/trainable/lua_src/supervised.lua
index 6c5547d23..84868c5a5 100644
--- a/packages/trainable/lua_src/supervised.lua
+++ b/packages/trainable/lua_src/supervised.lua
@@ -11,15 +11,14 @@ local pairs = pairs
 local assert = assert
 --
 local type = type
+local april_assert = april_assert
 local is_a = class.is_a
 local iterator = iterator
 local get_table_fields = get_table_fields
-local april_assert = april_assert
+local md = matrix.dict
 
 -----------------------------------------
 
-local wrap_matrices = matrix.dict.wrap_matrices
-
 ------------------------------
 -- SUPERVISED_TRAINER CLASS --
 ------------------------------
@@ -84,21 +83,17 @@ trainable_supervised_trainer.constructor =
       trainable.supervised_trainer.constructor(self,
                                                model, loss, bunch_size,
                                                optimizer, smooth_gradients)
-      local weight = connections
-      if not is_a(connections, matrix.dict) then
-        weights = matrix.dict()
-        for name,wdata in pairs(connections) do
-          local m = wdata
-          if not is_a(m, matrix) then
-            m = wdata.w:rewrap(wdata.output,wdata.input)
-          end
-          if m:get_major_order() == "col_major" then
-            weights:insert(name,m)
-          else
-            weights:insert(name,m:clone("col_major"))
-          end
-        end
-      end
+      local weights = connections
+      -- if not is_a(connections, matrix.dict) then
+      --   weights = matrix.dict()
+      --   for name,wdata in pairs(connections) do
+      --     local m = wdata
+      --     if not is_a(m, matrix) then
+      --       m = wdata.w:rewrap(wdata.output,wdata.input)
+      --     end
+      --     weights:insert(name,m:clone())
+      --   end
+      -- end
       self:build{ weights = weights }
     else
       -- Constructor of a new object
@@ -118,14 +113,14 @@ trainable_supervised_trainer.constructor =
       self.loss_function    = loss_function or false
       self.optimizer        = optimizer
       self.smooth_gradients = smooth_gradients
-      self.weights_table    = matrix.dict()
+      self.weights_table    = {}
       self.components_table = {}
       self.component2weights_dict = {}
       self.weights2component_dict = {}
       self.weights_order    = {}
       self.components_order = {}
       self.bunch_size       = bunch_size or false
-      self.weight_grads     = matrix.dict()
+      self.weight_grads     = {}
     end
   end
 
@@ -321,7 +316,7 @@ trainable_supervised_trainer_methods.size =
     if not self.is_built then
       error("It is not build")
     end
-    return self.weights_table:size()
+    return md.size(self.weights_table)
   end
 
 ------------------------------------------------------------------------
@@ -335,7 +330,7 @@ function trainable_supervised_trainer_methods:to_lua_string(format)
   table.insert(t, ",\n")
   table.insert(t, "connections={")
   for _,wname in ipairs(self.weights_order) do
-    local cobj = self.weights_table(wname)
+    local cobj = self.weights_table[wname]
     local w = cobj
     table.insert(t, string.format("\n[%q] = ", wname))
     table.insert(t, w:to_lua_string(format))
@@ -534,7 +529,7 @@ trainable_supervised_trainer_methods.iterate_weights =
         end
       until self.weights_order[pos]:match(match_string)
       local name = self.weights_order[pos]
-      return name,self.weights_table(name)
+      return name,self.weights_table[name]
     end
   end
 
@@ -581,7 +576,7 @@ trainable_supervised_trainer_methods.weights =
     if not self.is_built then
       error("Needs execution of build method")
     end
-    return self.weights_table(str)
+    return self.weights_table[str]
   end
 
 ------------------------------------------------------------------------
@@ -644,7 +639,7 @@ trainable_supervised_trainer_methods.randomize_weights =
         local current_inf = params.inf
         local current_sup = params.sup
         local constant    = 0
-        local connection  = self.weights_table(wname)
+        local connection  = self.weights_table[wname]
         if params.use_fanin then
           constant = constant + ann.connections.get_input_size(connection)
         end
@@ -679,25 +674,25 @@ trainable_supervised_trainer_methods.build =
         "to provide easy acces to components and connections.",
       }, 
     params = {
-      ["weights"] = "A dictionary weights_name => ann.connections object [optional]",
+      ["weights"] = "A table weights_name=>matrix [optional]",
       ["input"]   = "The input size of the component [optional]",
       ["output"]  = "The output size of the component [optional]",
     },
     outputs = {
       "The caller object",
-      "Weights table, associates weights_name => ann.connections object",
+      "Weights table, associates weights_name=>matrix",
       "Components table, associates component_name => ann.components object",
     },
   } ..
   function(self, t)
     local params = get_table_fields(
       {
-        weights = { mandatory = false, default=nil },
+        weights = { mandatory = false, default=nil, type_match="table" },
         input   = { type_match="number", mandatory = false, default=nil },
         output  = { type_match="number", mandatory = false, default=nil },
       }, t or {})
-    self.weight_grads  = matrix.dict()
-    self.weights_table = wrap_matrices(params.weights or matrix.dict())
+    self.weight_grads  = {}
+    self.weights_table = params.weights or {}
     -- BUILD CALL
     _,
     self.weights_table,
@@ -706,7 +701,7 @@ trainable_supervised_trainer_methods.build =
       output  = params.output,
       weights = self.weights_table, }
     --
-    self.weights_order = self.weights_table:keys()
+    self.weights_order = iterator(table.keys(self.weights_table)):table()
     table.sort(self.weights_order)
     self.components_order = {}
     self.component2weights_dict = {}
@@ -735,7 +730,7 @@ trainable_supervised_trainer_methods.get_weights_of =
     outputs = { "An instance of ann.connections" },
   } ..
   function(self, name)
-    return self.weights_table(self.component2weights_dict[name])
+    return self.weights_table[self.component2weights_dict[name]]
   end
 
 trainable_supervised_trainer_methods.get_components_of =
@@ -763,13 +758,13 @@ trainable_supervised_trainer_methods.train_step =
         "the gradient computed at component inputs.",
       }, 
     params = {
-      "A table with one input pattern or a token (with one or more patterns)",
-      "The corresponding target output pattern (table or token)",
+      "A table with one input pattern or a token (with one or more patterns, usually a matrix)",
+      "The corresponding target output pattern (table or token, usually a matrix)",
       "The loss function [optional]",
       "An optimizer [optional]",
       "The bunch size [optional]",
       "A smooth gradients boolean [optional]",
-      "A mask [optional]",
+      "A mask token [optional] (usually a matrix)",
     },
     outputs = {
       "The mean of loss function at current batch",
@@ -778,22 +773,21 @@ trainable_supervised_trainer_methods.train_step =
   } ..
   function(self, input, target, loss, optimizer,
            bunch_size, smooth_gradients, mask)
-    if type(input)  == "table" then input  = matrix.col_major(input)  end
-    if type(target) == "table" then target = matrix.col_major(target) end
-    if type(mask)   == "table" then mask   = matrix.col_major(mask) end
+    if type(input)  == "table" then input  = matrix(input)  end
+    if type(target) == "table" then target = matrix(target) end
+    if type(mask)   == "table" then mask   = matrix(mask) end
     local loss       = loss or self.loss_function or error("Needs a loss object")
     local optimizer  = optimizer or self.optimizer or error("Needs an optimizer object")
     local bunch_size = bunch_size or self.bunch_size or 1
     local smooth_gradients = (smooth_gradients==nil or smooth_gradients)
     if mask then
-      if not is_a(mask,matrix) then mask = mask:get_matrix() end
-      if not is_a(target,matrix) then
-        target = target:get_matrix()
-      end
+      assert( is_a(mask, matrix) )
+      assert( is_a(target, matrix) )
       target = target:clone():cmul(mask)
     end
+    local has_average = optimizer:has_property("average")
     local needs_gradient = optimizer:needs_property("gradient")
-    local tr_loss, _, tr_loss_matrix =
+    local tr_loss, _, tr_loss_matrix, average =
       optimizer:execute(function(weights, it)
           if weights ~= self.weights_table then
             self:build{ weights = weights }
@@ -807,12 +801,8 @@ trainable_supervised_trainer_methods.train_step =
           model:reset(it)
           local output = model:forward(input, true)
           if mask then
-            if not is_a(output,matrix) then
-              output = output:get_matrix()
-            end
-            if not is_a(target,matrix) then
-              target = target:get_matrix()
-            end
+            assert( is_a(output, matrix) )
+            assert( is_a(target, matrix) )
             output = output:clone():cmul(mask)
           end
           local tr_loss,tr_loss_matrix
@@ -821,7 +811,7 @@ trainable_supervised_trainer_methods.train_step =
           if needs_gradient then
             local gradient=model:backprop(loss:gradient(output,target))
             --
-            grads:zeros()
+            md.zeros(grads)
             --
             local grads = model:compute_gradients(grads)
             self.weight_grads = grads
@@ -856,8 +846,8 @@ trainable_supervised_trainer_methods.validate_step =
         "the loss for the given pair input/target output.",
       }, 
     params = {
-      "A table with one input pattern or a token (with one or more patterns)",
-      "The corresponding target output pattern (table or token)",
+      "A table with one input pattern or a token (with one or more patterns, usually a matrix)",
+      "The corresponding target output pattern (table or token, usually a matrix)",
       "The loss function [optional]",
     },
     outputs = {
@@ -866,21 +856,17 @@ trainable_supervised_trainer_methods.validate_step =
     },
   } ..
   function(self, input, target, loss, mask)
-    if type(input)  == "table" then input  = matrix.col_major(input)  end
-    if type(target) == "table" then target = matrix.col_major(target) end
-    if type(mask)   == "table" then mask   = matrix.col_major(mask) end
+    if type(input)  == "table" then input  = matrix(input)  end
+    if type(target) == "table" then target = matrix(target) end
+    if type(mask)   == "table" then mask   = matrix(mask) end
     local model = self.ann_component
     local loss  = loss or self.loss_function
     model:reset()
     local output = model:forward(input)
     if mask then
-      if not is_a(mask,matrix) then mask = mask:get_matrix() end
-      if not is_a(output,matrix) then
-        output = output:get_matrix()
-      end
-      if not is_a(target,matrix) then
-        target = target:get_matrix()
-      end
+      assert( is_a(mask, matrix) )
+      assert( is_a(output, matrix) )
+      assert( is_a(target, matrix) )
       output = output:clone():cmul(mask)
       target = target:clone():cmul(mask)
     end
@@ -898,8 +884,8 @@ trainable_supervised_trainer_methods.compute_gradients_step =
     class = "method",
     summary = "Executes one gradients computation step",
     params = {
-      "A table with one input pattern or a token (with one or more patterns)",
-      "The corresponding target output pattern (table or token)",
+      "A table with one input pattern or a token (with one or more patterns, usually a matrix)",
+      "The corresponding target output pattern (table or token, usually a matrix)",
       "The loss function [optional].",
       "A table with matrices where to store the gradients [optional]",
     },
@@ -910,10 +896,10 @@ trainable_supervised_trainer_methods.compute_gradients_step =
     },
   } ..
   function(self, input, target, loss, weight_grads)
-    if type(input)  == "table" then input  = matrix.col_major(input)  end
-    if type(target) == "table" then target = matrix.col_major(target) end
+    if type(input)  == "table" then input  = matrix(input)  end
+    if type(target) == "table" then target = matrix(target) end
     local loss         = loss or self.loss_function
-    local weight_grads = weight_grads or matrix.dict()
+    local weight_grads = weight_grads or {}
     local tr_loss,tr_loss_matrix,gradient
     self.ann_component:reset()
     local output = self.ann_component:forward(input, true)
@@ -923,8 +909,7 @@ trainable_supervised_trainer_methods.compute_gradients_step =
       gradient = loss:gradient(output, target)
       gradient = self.ann_component:backprop(gradient)
       --
-      iterator(pairs(weight_grads)):
-      apply(function(name,mat)mat:zeros()end)
+      md.zeros(weight_grads)
       --
       weight_grads = self.ann_component:compute_gradients(weight_grads)
       return weight_grads,tr_loss,tr_loss_matrix
@@ -938,8 +923,8 @@ trainable_supervised_trainer_methods.grad_check_step =
     class = "method",
     summary = "Executes one gradients check step",
     params = {
-      "A table with one input pattern or a token (with one or more patterns)",
-      "The corresponding target output pattern (table or token)",
+      "A table with one input pattern or a token (with one or more patterns, usually a matrix)",
+      "The corresponding target output pattern (table or token, usually a matrix)",
       "A boolean, true if you want high verbosity level [optional]",
       "The loss function [optional].",
     },
@@ -948,8 +933,8 @@ trainable_supervised_trainer_methods.grad_check_step =
     },
   } ..
   function(self, input, target, verbose, loss)
-    if type(input)  == "table" then input  = matrix.col_major(input)  end
-    if type(target) == "table" then target = matrix.col_major(target) end
+    if type(input)  == "table" then input  = matrix(input)  end
+    if type(target) == "table" then target = matrix(target) end
     local loss = loss or self.loss_function
     self.ann_component:reset()
     loss:reset()
@@ -964,12 +949,13 @@ trainable_supervised_trainer_methods.grad_check_step =
     local ret      = true
     local bunch_size = tr_loss_matrix:dim(1)
     local it = 1
+    -- local counts = iterator(self:iterate_weights()):map(function(name,cnn) return name,cnn:get_shared_count() end):table()
     for wname,cnn in self:iterate_weights() do
       collectgarbage("collect")
       local w = cnn
       -- The shared parameter has no effect in gradients check, only bunch_size
       local ratio = 1/bunch_size
-      local ann_grads = self.weight_grads(wname)
+      local ann_grads = self.weight_grads[wname]
       assert(w:is_contiguous(),
              "Unable to check grads of non-contiguous matrices")
       for i=1,w:size() do
@@ -1031,16 +1017,16 @@ trainable_supervised_trainer_methods.calculate =
         "the computed output for the given input.",
       }, 
     params = {
-      "A table with one input pattern, a col-major matrix or a token (with one or more patterns)",
+      "A table with one input pattern, a matrix or a token (with one or more patterns, usually a matrix)",
     },
     outputs = {
-      "A col-major matrix with the computed output",
+      "A token with the computed output, usually a matrix",
     },
   } ..
   function(self,input)
-    if type(input) == "table" then input = matrix.col_major(input) end
+    if type(input) == "table" then input = matrix(input) end
     self.ann_component:reset()
-    return self.ann_component:forward(input):get_matrix()
+    return self.ann_component:forward(input)
   end
 
 ------------------------------------------------------------------------
@@ -1511,7 +1497,7 @@ trainable_supervised_trainer_methods.show_weights =
   } ..
   function(self)
     for _,wname in pairs(self.weights_order) do
-      local w = self.weights_table(wname):toTable()
+      local w = self.weights_table[wname]:toTable()
       print(wname, table.concat(w, " "))
     end
   end
@@ -1532,7 +1518,8 @@ trainable_supervised_trainer_methods.clone =
     local obj = trainable.supervised_trainer(self.ann_component:clone(),
                                              nil,
                                              self.bunch_size,
-                                             nil)
+                                             nil,
+                                             self.smooth_gradients)
     if self.loss_function then
       obj:set_loss_function(self.loss_function:clone())
     end
@@ -1540,7 +1527,7 @@ trainable_supervised_trainer_methods.clone =
       obj:set_optimizer(self.optimizer:clone())
     end
     if #self.weights_order > 0 then
-      obj:build{ weights = self.weights_table:clone() }
+      obj:build{ weights = md.clone(self.weights_table) }
     end
     -- add possible user functions
     for i,v in pairs(self) do
diff --git a/packages/trainable/lua_src/trainable.lua b/packages/trainable/lua_src/trainable.lua
index d5b6b88c6..f914fef3d 100644
--- a/packages/trainable/lua_src/trainable.lua
+++ b/packages/trainable/lua_src/trainable.lua
@@ -152,7 +152,7 @@ trainable.dataset_multiple_iterator =
             else nump = ds:numPatterns()
             end
             return is_a(ds,dataset) and dataset.token.wrapper(ds,
-                                                             params.bunch_major) or ds
+                                                              params.bunch_major) or ds
 	end):
         table(), nump
     end
@@ -414,11 +414,11 @@ train_holdout_methods.execute =
         "A function which trains a model and returns the trained model,",
         "the training loss and the validation loss",
       },
-      first_epoch = "The first epoch number",
+      "Variadic list of arguments for the function [optional]",
     },
     outputs = { "True or false, indicating if the training continues or not" },
   } ..
-  function(self, epoch_function)
+  function(self, epoch_function, ...)
     local params = self.params
     local state  = self.state
     -- check max epochs
@@ -432,7 +432,7 @@ train_holdout_methods.execute =
     end
     -- compute one training step by using epoch_function
     state.current_epoch = state.current_epoch + 1
-    state.last, state.train_error, state.validation_error = epoch_function()
+    state.last, state.train_error, state.validation_error = epoch_function(...)
     assert(state.last and state.train_error and state.validation_error,
            "Needs a function which returns three values: a model, training error and validation error")
     -- update with the best model
@@ -443,7 +443,7 @@ train_holdout_methods.execute =
       if state.best_val_error == math.huge or rel_error > params.tolerance then
         state.best_epoch     = state.current_epoch
         state.best_val_error = state.validation_error
-        state.best           = state.last:clone()
+        state.best           = util.clone( state.last )
       end
     end
     return true
@@ -693,11 +693,11 @@ train_wo_validation_methods.execute =
         "A function which trains a model and returns the trained model",
         "and the training loss",
       },
-      first_epoch = "The first epoch number",
+      "Variadic list of arguments for the function [optional]",
     },
     outputs = { "True or false, indicating if the training continues or not" },
   } ..
-  function(self, epoch_function)
+  function(self, epoch_function, ...)
     local params = self.params
     local state  = self.state
     -- stopping criterion
@@ -711,7 +711,7 @@ train_wo_validation_methods.execute =
     end
     -- compute one training step by using epoch_function
     state.current_epoch = state.current_epoch + 1
-    local model,tr_err = epoch_function()
+    local model,tr_err = epoch_function(...)
     assert(model and tr_err,
            "Needs a function which returns two values: a model and training error")
     --
diff --git a/packages/trainable/test/qlearning_test.lua b/packages/trainable/test/qlearning_test.lua
index 5b5b4c23a..f0cb4bd07 100644
--- a/packages/trainable/test/qlearning_test.lua
+++ b/packages/trainable/test/qlearning_test.lua
@@ -27,7 +27,7 @@ local shuffle_random = random(23824)
 
 -- two dimensions: velocity, position
 local function start_state()
-  return matrix.col_major(1,2,{0.0, -0.5})
+  return matrix(1,2,{0.0, -0.5})
 end
 
 local function stop_condition(state)
diff --git a/packages/trainable/test/test.lua b/packages/trainable/test/test.lua
index 7c9d56620..350cd44f0 100644
--- a/packages/trainable/test/test.lua
+++ b/packages/trainable/test/test.lua
@@ -89,6 +89,7 @@ tmpname = os.tmpname()
 while train_func:execute(function()
 			   local tr = trainer:train_dataset(training_data)
 			   local va = trainer:validate_dataset(validation_data)
+                           print(tr,va)
 			   return trainer,tr,va
 			 end) do
   train_func:save(tmpname, "binary", { shuffle = training_data.shuffle })
diff --git a/tools/gnuplot.lua b/tools/gnuplot.lua
index 85d2fe274..cb6c38610 100644
--- a/tools/gnuplot.lua
+++ b/tools/gnuplot.lua
@@ -107,6 +107,34 @@ function gnuplot_methods:plot(params, range)
   return self
 end
 
+-- Sends a raw gnuplot command; every #N in it is replaced by a data filename
+function gnuplot_methods:rawplot(data, line)
+  assert(type(line) == "string", "Needs a string with the gnuplot command")
+  if type(data) ~= "table" then data = { data } end
+  -- remove the temporary files written by the previous plot
+  for _,tmpname in pairs(self.tmpnames) do
+    self:writeln(string.format("!rm -f %s", tmpname))
+  end
+  -- object => temporary filename, so a repeated object is written only once
+  local tmpnames = {}
+  self.tmpnames = tmpnames
+  local dict = {} -- "#N" => temporary filename of data[N]
+  for i,m in ipairs(data) do
+    if not tmpnames[m] then
+      assert(m.toTabFilename,
+             "The matrix object needs the method toTabFilename")
+      tmpnames[m] = os.tmpname()
+      m:toTabFilename(tmpnames[m])
+    end
+    dict["#"..i] = tmpnames[m]
+  end
+  -- a #N without entry in dict is left untouched by gsub
+  local command = line:gsub("(#%d+)", dict)
+  self:writeln(command)
+  self:flush()
+  return self
+end
+
 -- Closes the gnuplot pipe (interface)
 function gnuplot_methods:close()
   -- remove previous temporal files
diff --git a/tools/statistics/pearson-correlation-coefficient.lua b/tools/statistics/pearson-correlation-coefficient.lua
deleted file mode 100644
index 1344bd86a..000000000
--- a/tools/statistics/pearson-correlation-coefficient.lua
+++ /dev/null
@@ -1,70 +0,0 @@
-if #arg ~= 5 then
-  print("Syntax error!")
-  printf("\t%s [FILENAME | -] NUMCOL1 NUMCOL2 SEED CONF\n", arg[0])
-  printf("\t\tuse - as FILENAME for stdin\n")
-  printf("\t\tNUMCOL1 and NUMCOL2 are column indexes of your data\n")
-  printf("\t\tSEED is a random number generator seed for bootstrap confidences\n")
-  printf("\t\tCONF is the confidence value (0.95 for example)\n")
-  os.exit(1)
-end
-filename = arg[1]
-col1     = tonumber(arg[2])
-col2     = tonumber(arg[3])
-seed     = tonumber(arg[4])
-conf     = tonumber(arg[5])
-reps     = 100
-
-if conf > 0.5  then reps = 1000 end
-if conf > 0.95 then reps = 10000  end
-if conf > 0.99 then reps = 100000 end
-
-local f
-if filename == "-" then f = io.stdin
-else f = io.open(filename, "r") end
-
-function zero_if_null(v)
-  if v == "None" or v == "Undefined" or v == "Unintialized" or v == "Null" then
-    v = 0
-  end
-  return v
-end
-
-local points = iterator(f:lines()):
-map(string.tokenize):
--- remove commentaries
-filter(function(t) return string.sub(t[1],1,1) ~= "#" end):
--- filter null values
-map(function(t) return zero_if_null(t[col1]),zero_if_null(t[col2]) end):
--- check numbers
-map(function(a,b)
-      local a =
-	tonumber(a) or error("Impossible to convert to number col1: " .. a)
-      local b =
-	tonumber(b) or error("Impossible to convert to number col2: " .. b)
-      return {a,b}
-    end):
--- table conversion
-table()
-
-local N   = #points
-local rnd = random(seed)
-
-fprintf(io.stderr, "%d repetitions, %d points\n", reps, N)
-
-local boot_result = stats.boot{
-  verbose         = true,
-  data            = points,
-  R               = reps,
-  statistic       = function(it)
-    local c = stats.correlation.pearson()
-    for k,v in it do c:add(table.unpack(v)) end
-    return { c:compute() }
-  end,
-}
-local rxy1,rxy2 = stats.boot.ci(data, conf)
-
-local alpha,beta = util.linear_least_squares(points)
-
-printf("rxy= % .4f +- % .4f [% .4f, % .4f]\n",
-       (rxy1 + rxy2)/2, math.abs(rxy1-rxy2)*0.5, rxy1, rxy2)
-printf("y=   % .4f + % .4f x\n", alpha, beta)
diff --git a/update_doc.sh b/update_doc.sh
new file mode 100755
index 000000000..8a6139498
--- /dev/null
+++ b/update_doc.sh
@@ -0,0 +1,11 @@
+#!/bin/bash
+# Uploads the doxygen_doc directory with rsync over ssh to the directory
+# ~/public_html/STUFF of the remote host.
+#
+# Environment overrides (the defaults reproduce the original command):
+#   DOC_USER  remote login name                 (default: pako)
+#   DOC_DEST  rsync destination host:directory  (default below)
+DOC_USER="${DOC_USER:-pako}"
+DOC_DEST="${DOC_DEST:-cafre.dsic.upv.es:~/public_html/STUFF}"
+# --rsh sets the remote shell command, here ssh with an explicit login name
+rsync -vrhz --rsh="ssh -l ${DOC_USER}" doxygen_doc "${DOC_DEST}"