[mlpack-svn] r13110 - mlpack/trunk/src/mlpack/methods/sparse_coding

Tue Jun 26 15:42:50 EDT 2012

Author: rcurtin
Date: 2012-06-26 15:42:50 -0400 (Tue, 26 Jun 2012)
New Revision: 13110

Modified:
   mlpack/trunk/src/mlpack/methods/sparse_coding/sparse_coding_main.cpp
Log:
Clean up main executable.  Avoid unnecessary copies.


Modified: mlpack/trunk/src/mlpack/methods/sparse_coding/sparse_coding_main.cpp
===================================================================

--- mlpack/trunk/src/mlpack/methods/sparse_coding/sparse_coding_main.cpp	2012-06-26 19:16:29 UTC (rev 13109)
+++ mlpack/trunk/src/mlpack/methods/sparse_coding/sparse_coding_main.cpp	2012-06-26 19:42:50 UTC (rev 13110)
@@ -7,21 +7,57 @@
 #include <mlpack/core.hpp>
 #include "sparse_coding.hpp"
 
-PROGRAM_INFO("Sparse Coding", "An implementation of l1-norm and l1+l2-norm "
-    "regularized Sparse Coding with Dictionary Learning");
+PROGRAM_INFO("Sparse Coding", "An implementation of Sparse Coding with "
+    "Dictionary Learning, which achieves sparsity via an l1-norm regularizer on"
+    " the codes (LASSO) or an (l1+l2)-norm regularizer on the codes (the "
+    "Elastic Net).  Given a dense data matrix X with n points and d dimensions,"
+    " sparse coding seeks to find a dense dictionary matrix D with k atoms in "
+    "d dimensions, and a sparse coding matrix Z with n points in k dimensions."
+    "\n\n"
+    "The original data matrix X can then be reconstructed as D * Z.  Therefore,"
+    " this program finds a representation of each point in X as a sparse linear"
+    " combination of atoms in the dictionary D."
+    "\n\n"
+    "The sparse coding is found with an algorithm which alternates between a "
+    "dictionary step, which updates the dictionary D, and a sparse coding step,"
+    " which updates the sparse coding matrix."
+    "\n\n"
+    "To run this program, the input matrix X must be specified (with -i), along"
+    " with the number of atoms in the dictionary (-k).  An initial dictionary "
+    "may also be specified with the --initial_dictionary option.  The l1 and l2"
+    " norm regularization parameters may be specified with -l and -L, "
+    "respectively.  For example, to run sparse coding on the dataset in "
+    "data.csv using 200 atoms and an l1-regularization parameter of 0.1, saving"
+    " the dictionary into dict.csv and the codes into codes.csv, use "
+    "\n\n"
+    "$ sparse_coding -i data.csv -k 200 -l 0.1 -d dict.csv -c codes.csv"
+    "\n\n"
+    "The maximum number of iterations may be specified with the -n option. "
+    "Optionally, the input data matrix X can be normalized before coding with "
+    "the -N option.");
 
-PARAM_DOUBLE_REQ("lambda1", "Sparse coding l1-norm regularization parameter.",
-    "l");
+PARAM_STRING_REQ("input_file", "Filename of the input data.", "i");
+PARAM_INT_REQ("atoms", "Number of atoms in the dictionary.", "k");
+
+PARAM_DOUBLE("lambda1", "Sparse coding l1-norm regularization parameter.", "l",
+    0);
 PARAM_DOUBLE("lambda2", "Sparse coding l2-norm regularization parameter.", "L",
     0);
 
-PARAM_INT_REQ("n_atoms", "Number of atoms in the dictionary.", "k");
+PARAM_INT("max_iterations", "Maximum number of iterations for sparse coding (0 "
+    "indicates no limit).", "n", 0);
 
-PARAM_INT_REQ("n_iterations", "Number of iterations for sparse coding.", "n");
+PARAM_STRING("initial_dictionary", "Filename for optional initial dictionary.",
+    "D", "");
 
-PARAM_STRING_REQ("input_file", "Filename of the input data.", "i");
-PARAM_STRING("initial_dictionary", "Filename for optional initial dictionary.",     "d", "");
-PARAM_STRING("results_dir", "Directory to store results in.", "r", "");
+PARAM_STRING("dictionary_file", "Filename to save the output dictionary to.",
+    "d", "dictionary.csv");
+PARAM_STRING("codes_file", "Filename to save the output sparse codes to.", "c",
+    "codes.csv");
+
+PARAM_FLAG("normalize", "If set, the input data matrix will be normalized "
+    "before coding.", "N");
+
 PARAM_INT("seed", "Random seed.  If 0, 'std::time(NULL) is used.", "s", 0);
 
 using namespace arma;
@@ -39,76 +75,67 @@
   else
     RandomSeed((size_t) std::time(NULL));
 
-  double lambda1 = CLI::GetParam<double>("lambda1");
-  double lambda2 = CLI::GetParam<double>("lambda2");
+  const double lambda1 = CLI::GetParam<double>("lambda1");
+  const double lambda2 = CLI::GetParam<double>("lambda2");
 
-  const char* resultsDir = CLI::GetParam<string>("results_dir").c_str();
-  const char* dataFullpath = CLI::GetParam<string>("input_file").c_str();
-  const char* initialDictionaryFullpath =
-      CLI::GetParam<string>("initial_dictionary").c_str();
+  const string inputFile = CLI::GetParam<string>("input_file");
+  const string dictionaryFile = CLI::GetParam<string>("dictionary_file");
+  const string codesFile = CLI::GetParam<string>("codes_file");
+  const string initialDictionaryFile =
+      CLI::GetParam<string>("initial_dictionary");
 
-  size_t nIterations = CLI::GetParam<int>("n_iterations");
+  const size_t maxIterations = CLI::GetParam<int>("max_iterations");
+  const size_t atoms = CLI::GetParam<int>("atoms");
 
-  size_t nAtoms = CLI::GetParam<int>("n_atoms");
+  const bool normalize = CLI::HasParam("normalize");
 
   mat matX;
-  data::Load(dataFullpath, matX);
+  data::Load(inputFile, matX, true);
 
-  const size_t nPoints = matX.n_cols;
-  Log::Info << "Loaded " << nPoints << " points in " << matX.n_rows <<
+  Log::Info << "Loaded " << matX.n_cols << " points in " << matX.n_rows <<
       " dimensions." << endl;
 
   // Normalize each point since these are images.
-  for (size_t i = 0; i < nPoints; ++i)
-    matX.col(i) /= norm(matX.col(i), 2);
+  if (normalize)
+  {
+    Log::Info << "Normalizing data before coding..." << std::endl;
+    for (size_t i = 0; i < matX.n_cols; ++i)
+      matX.col(i) /= norm(matX.col(i), 2);
+  }
 
   // Run the sparse coding algorithm.
-  SparseCoding<> sc(matX, nAtoms, lambda1, lambda2);
+  SparseCoding<> sc(matX, atoms, lambda1, lambda2);
 
-  if (CLI::HasParam("initial_dictionary"))
+  if (initialDictionaryFile != "")
   {
-    mat matInitialD;
-    data::Load(initialDictionaryFullpath, matInitialD);
+    // Load initial dictionary directly into sparse coding object.
+    data::Load(initialDictionaryFile, sc.Dictionary());
 
-    if (matInitialD.n_cols != nAtoms)
+    if (sc.Dictionary().n_cols != atoms)
     {
       Log::Fatal << "The specified initial dictionary to load has "
-          << matInitialD.n_cols << " atoms, but the learned dictionary "
-          << "was specified to have " << nAtoms << " atoms!" << endl;
+          << sc.Dictionary().n_cols << " atoms, but the learned dictionary "
+          << "was specified to have " << atoms << " atoms!" << endl;
     }
 
-    if (matInitialD.n_rows != matX.n_rows)
+    if (sc.Dictionary().n_rows != matX.n_rows)
     {
       Log::Fatal << "The specified initial dictionary to load has "
-          << matInitialD.n_rows << " dimensions, but the specified data "
+          << sc.Dictionary().n_rows << " dimensions, but the specified data "
           << "has " << matX.n_rows << " dimensions!" << endl;
     }
-
-    sc.Dictionary() = matInitialD;
   }
 
   Timer::Start("sparse_coding");
-  sc.Encode(nIterations);
+  sc.Encode(maxIterations);
   Timer::Stop("sparse_coding");
 
-  mat learnedD = sc.Dictionary();
-  mat learnedZ = sc.Codes();
+  // Save the results.
+  Log::Info << "Saving dictionary matrix to '" << dictionaryFile << "'.\n";
 
-  if (strlen(resultsDir) == 0)
-  {
-    data::Save("D.csv", learnedD);
-    data::Save("Z.csv", learnedZ);
-  }
-  else
-  {
-    stringstream datapath;
-    datapath << resultsDir << "/D.csv";
+  data::Save(dictionaryFile, sc.Dictionary());
 
-    data::Save(datapath.str(), learnedD);
+  Log::Info << "Saving sparse codes to '" << codesFile << "'.\n";
 
-    datapath.clear();
-    datapath << resultsDir << "/Z.csv";
-
-    data::Save(datapath.str(), learnedZ);
-  }
+  data::Save(codesFile, sc.Codes());
 }