// nnet3/nnet-test-utils.cc

// Copyright 2015  Johns Hopkins University (author: Daniel Povey)
// Copyright 2015  Vijayaditya Peddinti
// Copyright 2016  Daniel Galvez

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.
#include <cmath>
#include <iterator>
#include <sstream>

#include "nnet3/nnet-test-utils.h"
#include "nnet3/nnet-utils.h"
27 namespace kaldi {
28 namespace nnet3 {
29 
30 
31 // A super-simple case that is just a single affine component, no nonlinearity,
32 // no splicing.
34  const NnetGenerationOptions &opts,
35  std::vector<std::string> *configs) {
36  std::ostringstream os;
37 
38  int32 input_dim = 10 + Rand() % 20,
39  output_dim = (opts.output_dim > 0 ?
40  opts.output_dim :
41  100 + Rand() % 200);
42 
43 
44  os << "component name=affine1 type=AffineComponent input-dim="
45  << input_dim << " output-dim=" << output_dim << std::endl;
46 
47  os << "input-node name=input dim=" << input_dim << std::endl;
48  os << "component-node name=affine1_node component=affine1 input=input\n";
49  os << "output-node name=output input=affine1_node\n";
50  configs->push_back(os.str());
51 }
52 
53 // A setup with context and an affine component, but no nonlinearity.
55  const NnetGenerationOptions &opts,
56  std::vector<std::string> *configs) {
57  std::ostringstream os;
58 
59  std::vector<int32> splice_context;
60  for (int32 i = -5; i < 4; i++)
61  if (Rand() % 3 == 0)
62  splice_context.push_back(i);
63  if (splice_context.empty())
64  splice_context.push_back(0);
65 
66  int32 input_dim = 10 + Rand() % 20,
67  spliced_dim = input_dim * splice_context.size(),
68  output_dim = (opts.output_dim > 0 ?
69  opts.output_dim :
70  100 + Rand() % 200);
71 
72  if (RandInt(0,1) == 0) {
73  // do it the traditional way with an AffineComponent and an Append() expression.
74  os << "component name=affine1 type=AffineComponent input-dim="
75  << spliced_dim << " output-dim=" << output_dim << std::endl;
76 
77  os << "input-node name=input dim=" << input_dim << std::endl;
78 
79  os << "component-node name=affine1_node component=affine1 input=Append(";
80  for (size_t i = 0; i < splice_context.size(); i++) {
81  int32 offset = splice_context[i];
82  os << "Offset(input, " << offset << ")";
83  if (i + 1 < splice_context.size())
84  os << ", ";
85  }
86  os << ")\n";
87  os << "output-node name=output input=affine1_node\n";
88  } else {
89  os << "component name=tdnn1 type=TdnnComponent input-dim="
90  << input_dim << " output-dim=" << output_dim
91  << " time-offsets=";
92  for (size_t i = 0; i < splice_context.size(); i++) {
93  if (i>0) os << ',';
94  os << splice_context[i];
95  }
96  os << " use-bias=" << (RandInt(0,1) == 0 ? "true":"false")
97  << " use-natural-gradient=" << (RandInt(0,1) == 0 ? "true":"false")
98  << std::endl;
99  os << "input-node name=input dim=" << input_dim << std::endl;
100  os << "component-node name=tdnn1_node component=tdnn1 input=input\n";
101  os << "output-node name=output input=tdnn1_node\n";
102  }
103  configs->push_back(os.str());
104 }
105 
106 
107 
108 // A simple case, just to get started.
109 // Generate a single config with one input, splicing, and one hidden layer.
110 // Also sometimes generate a part of the config that adds a new hidden layer.
112  const NnetGenerationOptions &opts,
113  std::vector<std::string> *configs) {
114  std::ostringstream os;
115 
116  std::vector<int32> splice_context;
117  for (int32 i = -5; i < 4; i++)
118  if (Rand() % 3 == 0)
119  splice_context.push_back(i);
120  if (splice_context.empty())
121  splice_context.push_back(0);
122 
123  int32 input_dim = 10 + Rand() % 20,
124  output_dim = (opts.output_dim > 0 ?
125  opts.output_dim :
126  100 + Rand() % 200),
127  hidden_dim = 40 + Rand() % 50;
128  int32 ivector_dim = 10 + Rand() % 20;
129  if (RandInt(0, 1) == 0 || !opts.allow_ivector)
130  ivector_dim = 0;
131  int32 spliced_dim = input_dim * splice_context.size() + ivector_dim;
132 
133  bool use_final_nonlinearity = (opts.allow_final_nonlinearity &&
134  RandInt(0, 1) == 0);
135  bool use_batch_norm = (RandInt(0, 1) == 0);
136 
137  os << "component name=affine1 type=NaturalGradientAffineComponent input-dim="
138  << spliced_dim << " output-dim=" << hidden_dim << std::endl;
139  os << "component name=relu1 type=RectifiedLinearComponent dim="
140  << hidden_dim << std::endl;
141  if (use_batch_norm) {
142  int32 block_dim = (hidden_dim % 2 == 0 ? hidden_dim / 2 : hidden_dim);
143  os << "component name=batch-norm type=BatchNormComponent dim="
144  << hidden_dim << " block-dim=" << block_dim
145  << " target-rms=2.0";
146  if (RandInt(0, 1) == 0)
147  os << " epsilon=3.0";
148  os << '\n';
149  }
150  os << "component name=final_affine type=NaturalGradientAffineComponent input-dim="
151  << hidden_dim << " output-dim=" << output_dim << std::endl;
152  if (use_final_nonlinearity) {
153  if (Rand() % 2 == 0) {
154  os << "component name=logsoftmax type=SoftmaxComponent dim="
155  << output_dim << std::endl;
156  } else {
157  os << "component name=logsoftmax type=LogSoftmaxComponent dim="
158  << output_dim << std::endl;
159  }
160  }
161  os << "input-node name=input dim=" << input_dim << std::endl;
162  if (ivector_dim != 0)
163  os << "input-node name=ivector dim=" << ivector_dim << std::endl;
164 
165  os << "component-node name=affine1_node component=affine1 input=Append(";
166  if (ivector_dim != 0)
167  os << "ReplaceIndex(ivector, t, 0), ";
168  for (size_t i = 0; i < splice_context.size(); i++) {
169  int32 offset = splice_context[i];
170  if (RandInt(0, 1) == 0) {
171  os << "Offset(input, " << offset << ")";
172  } else {
173  // testing the Scale() expression.
174  os << "Scale(-1, Offset(input, " << offset << "))";
175  }
176  if (i + 1 < splice_context.size())
177  os << ", ";
178  }
179  os << ")\n";
180  if (RandInt(0, 1) == 0) {
181  os << "component-node name=nonlin1 component=relu1 input=affine1_node\n";
182  } else if (RandInt(0, 1) == 0) {
183  os << "component-node name=nonlin1 component=relu1 input=Scale(-1.0, affine1_node)\n";
184  } else {
185  os << "component-node name=nonlin1 component=relu1 input=Sum(Const(1.0, "
186  << hidden_dim << "), Scale(-1.0, affine1_node))\n";
187  }
188  if (use_batch_norm) {
189  os << "component-node name=batch-norm component=batch-norm input=nonlin1\n";
190  os << "component-node name=final_affine component=final_affine input=batch-norm\n";
191  } else {
192  os << "component-node name=final_affine component=final_affine input=nonlin1\n";
193  }
194  if (use_final_nonlinearity) {
195  os << "component-node name=output_nonlin component=logsoftmax input=final_affine\n";
196  os << "output-node name=output input=output_nonlin\n";
197  } else {
198  os << "output-node name=output input=final_affine\n";
199  }
200  configs->push_back(os.str());
201 
202  if ((Rand() % 2) == 0) {
203  std::ostringstream os2;
204  os2 << "component name=affine2 type=NaturalGradientAffineComponent input-dim="
205  << hidden_dim << " output-dim=" << hidden_dim << std::endl;
206  os2 << "component name=relu2 type=RectifiedLinearComponent dim="
207  << hidden_dim << std::endl;
208  // regenerate the final_affine component when we add the new config.
209  os2 << "component name=final_affine type=NaturalGradientAffineComponent input-dim="
210  << hidden_dim << " output-dim=" << output_dim << std::endl;
211  os2 << "component-node name=affine2 component=affine2 input=nonlin1\n";
212  os2 << "component-node name=relu2 component=relu2 input=affine2\n";
213  os2 << "component-node name=final_affine component=final_affine input=relu2\n";
214  configs->push_back(os2.str());
215  }
216 }
217 
218 
220  const NnetGenerationOptions &opts,
221  std::vector<std::string> *configs) {
222  int32 input_dim = RandInt(10, 30),
223  input_period = RandInt(1, 3),
224  stats_period = input_period * RandInt(1, 3),
225  left_context = stats_period * RandInt(1, 10),
226  right_context = stats_period * RandInt(1, 10),
227  log_count_features = RandInt(0, 3);
228  BaseFloat variance_floor = RandInt(1, 10) * 1.0e-10;
229  bool output_stddevs = (RandInt(0, 1) == 0);
230 
231  int32 raw_stats_dim = 1 + input_dim + (output_stddevs ? input_dim : 0),
232  pooled_stats_dim = log_count_features + input_dim +
233  (output_stddevs ? input_dim : 0);
234  std::ostringstream os;
235  os << "input-node name=input dim=" << input_dim << std::endl;
236  os << "component name=statistics-extraction type=StatisticsExtractionComponent "
237  << "input-dim=" << input_dim << " input-period=" << input_period
238  << " output-period=" << stats_period << " include-variance="
239  << std::boolalpha << output_stddevs << "\n";
240 
241  os << "component name=statistics-pooling type=StatisticsPoolingComponent "
242  << "input-dim=" << raw_stats_dim << " input-period=" << stats_period
243  << " left-context=" << left_context << " right-context=" << right_context
244  << " num-log-count-features=" << log_count_features << " output-stddevs="
245  << std::boolalpha << output_stddevs << " variance-floor="
246  << variance_floor << "\n";
247 
248  os << "component name=affine type=AffineComponent "
249  << "input-dim=" << input_dim << " output-dim=" << pooled_stats_dim
250  << "\n";
251 
252  os << "component-node name=statistics-extraction component=statistics-extraction "
253  << "input=input\n";
254  os << "component-node name=statistics-pooling component=statistics-pooling "
255  << "input=statistics-extraction\n";
256  os << "component-node name=affine component=affine input=input\n";
257  os << "output-node name=output input=Sum(affine, Round(statistics-pooling, "
258  << stats_period << "))\n";
259  configs->push_back(os.str());
260 }
261 
262 // This generates a single config corresponding to an RNN.
264  const NnetGenerationOptions &opts,
265  std::vector<std::string> *configs) {
266  std::ostringstream os;
267 
268  std::vector<int32> splice_context;
269  for (int32 i = -5; i < 4; i++)
270  if (Rand() % 3 == 0)
271  splice_context.push_back(i);
272  if (splice_context.empty())
273  splice_context.push_back(0);
274 
275  int32 input_dim = 10 + Rand() % 20,
276  spliced_dim = input_dim * splice_context.size(),
277  output_dim = (opts.output_dim > 0 ?
278  opts.output_dim :
279  100 + Rand() % 200),
280  hidden_dim = 40 + Rand() % 50;
281  os << "component name=affine1 type=NaturalGradientAffineComponent input-dim="
282  << spliced_dim << " output-dim=" << hidden_dim << std::endl;
283  if (RandInt(0, 1) == 0) {
284  os << "component name=nonlin1 type=RectifiedLinearComponent dim="
285  << hidden_dim << std::endl;
286  } else {
287  os << "component name=nonlin1 type=TanhComponent dim="
288  << hidden_dim << std::endl;
289  }
290  os << "component name=recurrent_affine1 type=NaturalGradientAffineComponent input-dim="
291  << hidden_dim << " output-dim=" << hidden_dim << std::endl;
292  os << "component name=affine2 type=NaturalGradientAffineComponent input-dim="
293  << hidden_dim << " output-dim=" << output_dim << std::endl;
294  os << "component name=logsoftmax type=LogSoftmaxComponent dim="
295  << output_dim << std::endl;
296  os << "input-node name=input dim=" << input_dim << std::endl;
297 
298  os << "component-node name=affine1_node component=affine1 input=Append(";
299  for (size_t i = 0; i < splice_context.size(); i++) {
300  int32 offset = splice_context[i];
301  os << "Offset(input, " << offset << ")";
302  if (i + 1 < splice_context.size())
303  os << ", ";
304  }
305  os << ")\n";
306  os << "component-node name=recurrent_affine1 component=recurrent_affine1 "
307  "input=Offset(nonlin1, -1)\n";
308  os << "component-node name=nonlin1 component=nonlin1 "
309  "input=Sum(affine1_node, IfDefined(recurrent_affine1))\n";
310  os << "component-node name=affine2 component=affine2 input=nonlin1\n";
311  os << "component-node name=output_nonlin component=logsoftmax input=affine2\n";
312  os << "output-node name=output input=output_nonlin\n";
313  configs->push_back(os.str());
314 }
315 
316 
317 
318 // This generates a config sequence for what I *think* is a clockwork RNN, in
319 // that different parts operate at different speeds. The output layer is
320 // evaluated every frame, but the internal RNN layer is evaluated every 3
321 // frames.
323  const NnetGenerationOptions &opts,
324  std::vector<std::string> *configs) {
325  std::ostringstream os;
326 
327  std::vector<int32> splice_context;
328  for (int32 i = -5; i < 4; i++)
329  if (Rand() % 3 == 0)
330  splice_context.push_back(i);
331  if (splice_context.empty())
332  splice_context.push_back(0);
333 
334  int32 input_dim = 10 + Rand() % 20,
335  spliced_dim = input_dim * splice_context.size(),
336  output_dim = (opts.output_dim > 0 ?
337  opts.output_dim :
338  100 + Rand() % 200),
339  hidden_dim = 40 + Rand() % 50;
340  os << "component name=affine1 type=NaturalGradientAffineComponent input-dim="
341  << spliced_dim << " output-dim=" << hidden_dim << std::endl;
342  os << "component name=nonlin1 type=RectifiedLinearComponent dim="
343  << hidden_dim << std::endl;
344  os << "component name=recurrent_affine1 type=NaturalGradientAffineComponent input-dim="
345  << hidden_dim << " output-dim=" << hidden_dim << std::endl;
346  // the suffix _0, _1, _2 equals the index of the output-frame modulo 3; there
347  // are 3 versions of the final affine layer. There was a paper by Vincent
348  // Vanhoucke about something like this.
349  os << "component name=final_affine_0 type=NaturalGradientAffineComponent input-dim="
350  << hidden_dim << " output-dim=" << output_dim << std::endl;
351  os << "component name=final_affine_1 type=NaturalGradientAffineComponent input-dim="
352  << hidden_dim << " output-dim=" << output_dim << std::endl;
353  os << "component name=final_affine_2 type=NaturalGradientAffineComponent input-dim="
354  << hidden_dim << " output-dim=" << output_dim << std::endl;
355  os << "component name=logsoftmax type=LogSoftmaxComponent dim="
356  << output_dim << std::endl;
357  os << "input-node name=input dim=" << input_dim << std::endl;
358 
359  os << "component-node name=affine1_node component=affine1 input=Append(";
360  for (size_t i = 0; i < splice_context.size(); i++) {
361  int32 offset = splice_context[i];
362  os << "Offset(input, " << offset << ")";
363  if (i + 1 < splice_context.size())
364  os << ", ";
365  }
366  os << ")\n";
367  os << "component-node name=recurrent_affine1 component=recurrent_affine1 "
368  "input=Offset(nonlin1, -1)\n";
369  os << "component-node name=nonlin1 component=nonlin1 "
370  "input=Sum(affine1_node, IfDefined(recurrent_affine1))\n";
371  os << "component-node name=final_affine_0 component=final_affine_0 input=nonlin1\n";
372  os << "component-node name=final_affine_1 component=final_affine_1 input=Offset(nonlin1, -1)\n";
373  os << "component-node name=final_affine_2 component=final_affine_2 input=Offset(nonlin1, 1)\n";
374  os << "component-node name=output_nonlin component=logsoftmax input=Switch(final_affine_0, final_affine_1, final_affine_2)\n";
375  os << "output-node name=output input=output_nonlin\n";
376  configs->push_back(os.str());
377 }
378 
379 
380 
381 // This generates a single config corresponding to an LSTM.
382 // based on the equations in
383 // Sak et. al. "LSTM based RNN architectures for LVCSR", 2014
384 // We name the components based on the following equations (Eqs 7-15 in paper)
385 // i(t) = S(Wix * x(t) + Wir * r(t-1) + Wic * c(t-1) + bi)
386 // f(t) = S(Wfx * x(t) + Wfr * r(t-1) + Wfc * c(t-1) + bf)
387 // c(t) = {f(t) .* c(t-1)} + {i(t) .* g(Wcx * x(t) + Wcr * r(t-1) + bc)}
388 // o(t) = S(Wox * x(t) + Wor * r(t-1) + Woc * c(t) + bo)
389 // m(t) = o(t) .* h(c(t))
390 // r(t) = Wrm * m(t)
391 // p(t) = Wpm * m(t)
392 // y(t) = Wyr * r(t) + Wyp * p(t) + by
393 // where S : sigmoid
394 // matrix with feed-forward connections
395 // from the input x(t)
396 // W*x = [Wix^T, Wfx^T, Wcx^T, Wox^T]^T
397 
398 // matrix with recurrent (feed-back) connections
399 // from the output projection
400 // W*r = [Wir^T, Wfr^T, Wcr^T, Wor^T]^T
401 
402 // matrix to generate r(t) and p(t)
403 // m(t)
404 // W*m = [Wrm^T, Wpm^T]^T
405 // matrix to generate y(t)
406 // Wy* = [Wyr^T, Wyp^T]
407 
408 // Diagonal matrices with recurrent connections and feed-forward connections
409 // from the cell output c(t) since these can be both recurrent and
410 // feed-forward we dont combine the matrices
411 // Wic, Wfc, Woc
412 
413 
415  const NnetGenerationOptions &opts,
416  std::vector<std::string> *configs) {
417  std::ostringstream os;
418 
419  std::vector<int32> splice_context;
420  for (int32 i = -5; i < 4; i++)
421  if (Rand() % 3 == 0)
422  splice_context.push_back(i);
423  if (splice_context.empty())
424  splice_context.push_back(0);
425 
426  int32 input_dim = 10 + Rand() % 20,
427  spliced_dim = input_dim * splice_context.size(),
428  output_dim = (opts.output_dim > 0 ?
429  opts.output_dim :
430  100 + Rand() % 200),
431  cell_dim = 40 + Rand() % 50,
432  projection_dim = std::ceil(cell_dim / (Rand() % 10 + 1));
433 
434  os << "input-node name=input dim=" << input_dim << std::endl;
435 
436  // trainable cell value for start/end of file.
437  os << "component name=c0 type=ConstantComponent"
438  << " output-dim=" << cell_dim << std::endl;
439 
440 
441  // Parameter Definitions W*(* replaced by - to have valid names)
442  // Input gate control : Wi* matrices
443  os << "component name=Wi-xr type=NaturalGradientAffineComponent"
444  << " input-dim=" << spliced_dim + projection_dim
445  << " output-dim=" << cell_dim << std::endl;
446  os << "component name=Wic type=PerElementScaleComponent "
447  << " dim=" << cell_dim << std::endl;
448 
449  // Forget gate control : Wf* matrices
450  os << "component name=Wf-xr type=NaturalGradientAffineComponent"
451  << " input-dim=" << spliced_dim + projection_dim
452  << " output-dim=" << cell_dim << std::endl;
453  os << "component name=Wfc type=PerElementScaleComponent "
454  << " dim=" << cell_dim << std::endl;
455 
456  // Output gate control : Wo* matrices
457  os << "component name=Wo-xr type=NaturalGradientAffineComponent"
458  << " input-dim=" << spliced_dim + projection_dim
459  << " output-dim=" << cell_dim << std::endl;
460  os << "component name=Woc type=PerElementScaleComponent "
461  << " dim=" << cell_dim << std::endl;
462 
463  // Cell input matrices : Wc* matrices
464  os << "component name=Wc-xr type=NaturalGradientAffineComponent"
465  << " input-dim=" << spliced_dim + projection_dim
466  << " output-dim=" << cell_dim << std::endl;
467 
468 
469 
470  // projection matrices : Wrm and Wpm
471  os << "component name=W-m type=NaturalGradientAffineComponent "
472  << " input-dim=" << cell_dim
473  << " output-dim=" << 2 * projection_dim << std::endl;
474 
475  // Output : Wyr and Wyp
476  os << "component name=Wy- type=NaturalGradientAffineComponent "
477  << " input-dim=" << 2 * projection_dim
478  << " output-dim=" << cell_dim << std::endl;
479 
480  // Defining the diagonal matrices
481  // Defining the final affine transform
482  os << "component name=final_affine type=NaturalGradientAffineComponent "
483  << "input-dim=" << cell_dim << " output-dim=" << output_dim << std::endl;
484  os << "component name=logsoftmax type=LogSoftmaxComponent dim="
485  << output_dim << std::endl;
486 
487  // Defining the non-linearities
488  // declare a no-op component so that we can use a sum descriptor's output
489  // multiple times, and to make the config more readable given the equations
490  os << "component name=i type=SigmoidComponent dim="
491  << cell_dim << std::endl;
492  os << "component name=f type=SigmoidComponent dim="
493  << cell_dim << std::endl;
494  os << "component name=o type=SigmoidComponent dim="
495  << cell_dim << std::endl;
496  os << "component name=g type=TanhComponent dim="
497  << cell_dim << std::endl;
498  os << "component name=h type=TanhComponent dim="
499  << cell_dim << std::endl;
500  os << "component name=c1 type=ElementwiseProductComponent "
501  << " input-dim=" << 2 * cell_dim
502  << " output-dim=" << cell_dim << std::endl;
503  os << "component name=c2 type=ElementwiseProductComponent "
504  << " input-dim=" << 2 * cell_dim
505  << " output-dim=" << cell_dim << std::endl;
506  os << "component name=m type=ElementwiseProductComponent "
507  << " input-dim=" << 2 * cell_dim
508  << " output-dim=" << cell_dim << std::endl;
509 
510  // Defining the computations
511  std::ostringstream temp_string_stream;
512  for (size_t i = 0; i < splice_context.size(); i++) {
513  int32 offset = splice_context[i];
514  temp_string_stream << "Offset(input, " << offset << ")";
515  if (i + 1 < splice_context.size())
516  temp_string_stream << ", ";
517  }
518  std::string spliced_input = temp_string_stream.str();
519 
520  std::string c_tminus1 = "Sum(Failover(Offset(c1_t, -1), c0), IfDefined(Offset( c2_t, -1)))";
521 
522 
523  // c0. note: the input is never used as the component requires
524  // no input indexes; we just write itself as input to keep the
525  // structures happy.
526  os << "component-node name=c0 component=c0 input=c0\n";
527 
528  // i_t
529  os << "component-node name=i1 component=Wi-xr input=Append("
530  << spliced_input << ", IfDefined(Offset(r_t, -1)))\n";
531  os << "component-node name=i2 component=Wic "
532  << " input=" << c_tminus1 << std::endl;
533  os << "component-node name=i_t component=i input=Sum(i1, i2)\n";
534 
535  // f_t
536  os << "component-node name=f1 component=Wf-xr input=Append("
537  << spliced_input << ", IfDefined(Offset(r_t, -1)))\n";
538  os << "component-node name=f2 component=Wfc "
539  << " input=" << c_tminus1 << std::endl;
540  os << "component-node name=f_t component=f input=Sum(f1, f2)\n";
541 
542  // o_t
543  os << "component-node name=o1 component=Wo-xr input=Append("
544  << spliced_input << ", IfDefined(Offset(r_t, -1)))\n";
545  os << "component-node name=o2 component=Woc input=Sum(c1_t, c2_t)\n";
546  os << "component-node name=o_t component=o input=Sum(o1, o2)\n";
547 
548  // h_t
549  os << "component-node name=h_t component=h input=Sum(c1_t, c2_t)\n";
550 
551  // g_t
552  os << "component-node name=g1 component=Wc-xr input=Append("
553  << spliced_input << ", IfDefined(Offset(r_t, -1)))\n";
554  os << "component-node name=g_t component=g input=g1\n";
555 
556  // parts of c_t
557  os << "component-node name=c1_t component=c1 "
558  << " input=Append(f_t, " << c_tminus1 << ")\n";
559  os << "component-node name=c2_t component=c2 input=Append(i_t, g_t)\n";
560 
561  // m_t
562  os << "component-node name=m_t component=m input=Append(o_t, h_t)\n";
563 
564  // r_t and p_t
565  os << "component-node name=rp_t component=W-m input=m_t\n";
566  // Splitting outputs of Wy- node
567  os << "dim-range-node name=r_t input-node=rp_t dim-offset=0 "
568  << "dim=" << projection_dim << std::endl;
569 
570  // y_t
571  os << "component-node name=y_t component=Wy- input=rp_t\n";
572 
573  // Final affine transform
574  os << "component-node name=final_affine component=final_affine input=y_t\n";
575  os << "component-node name=posteriors component=logsoftmax input=final_affine\n";
576  os << "output-node name=output input=posteriors\n";
577  configs->push_back(os.str());
578 }
579 
581  const NnetGenerationOptions &opts,
582  std::vector<std::string> *configs) {
583  std::ostringstream os;
584 
585  std::vector<int32> splice_context;
586  for (int32 i = -5; i < 4; i++)
587  if (Rand() % 3 == 0)
588  splice_context.push_back(i);
589  if (splice_context.empty())
590  splice_context.push_back(0);
591 
592  int32 input_dim = 10 + Rand() % 20,
593  spliced_dim = input_dim * splice_context.size(),
594  output_dim = (opts.output_dim > 0 ?
595  opts.output_dim :
596  100 + Rand() % 200),
597  cell_dim = 40 + Rand() % 50,
598  projection_dim = std::ceil(cell_dim / (Rand() % 10 + 1));
599  int32 clipping_threshold = RandInt(6, 50),
600  zeroing_threshold = RandInt(1, 5),
601  zeroing_interval = RandInt(1, 5) * 10;
602  BaseFloat scale = 0.8 + 0.1*RandInt(0,3);
603 
604  os << "input-node name=input dim=" << input_dim << std::endl;
605 
606  // Parameter Definitions W*(* replaced by - to have valid names)
607  // Input gate control : Wi* matrices
608  os << "component name=Wi-xr type=NaturalGradientAffineComponent"
609  << " input-dim=" << spliced_dim + projection_dim
610  << " output-dim=" << cell_dim << std::endl;
611  os << "component name=Wic type=PerElementScaleComponent "
612  << " dim=" << cell_dim << std::endl;
613 
614  // Forget gate control : Wf* matrices
615  os << "component name=Wf-xr type=NaturalGradientAffineComponent"
616  << " input-dim=" << spliced_dim + projection_dim
617  << " output-dim=" << cell_dim << std::endl;
618  os << "component name=Wfc type=PerElementScaleComponent "
619  << " dim=" << cell_dim << std::endl;
620 
621  // Output gate control : Wo* matrices
622  os << "component name=Wo-xr type=NaturalGradientAffineComponent"
623  << " input-dim=" << spliced_dim + projection_dim
624  << " output-dim=" << cell_dim << std::endl;
625  os << "component name=Woc type=PerElementScaleComponent "
626  << " dim=" << cell_dim << std::endl;
627 
628  // Cell input matrices : Wc* matrices
629  os << "component name=Wc-xr type=NaturalGradientAffineComponent"
630  << " input-dim=" << spliced_dim + projection_dim
631  << " output-dim=" << cell_dim << std::endl;
632 
633 
634 
635  // projection matrices : Wrm and Wpm
636  os << "component name=W-m type=NaturalGradientAffineComponent "
637  << " input-dim=" << cell_dim
638  << " output-dim=" << 2 * projection_dim << std::endl;
639 
640  // Output : Wyr and Wyp
641  os << "component name=Wy- type=NaturalGradientAffineComponent "
642  << " input-dim=" << 2 * projection_dim
643  << " output-dim=" << cell_dim << std::endl;
644 
645  // Defining the diagonal matrices
646  // Defining the final affine transform
647  os << "component name=final_affine type=NaturalGradientAffineComponent "
648  << "input-dim=" << cell_dim << " output-dim=" << output_dim << std::endl;
649  os << "component name=logsoftmax type=LogSoftmaxComponent dim="
650  << output_dim << std::endl;
651 
652  // Defining the non-linearities
653  // declare a no-op component so that we can use a sum descriptor's output
654  // multiple times, and to make the config more readable given the equations
655  os << "component name=i type=SigmoidComponent dim="
656  << cell_dim << std::endl;
657  os << "component name=f type=SigmoidComponent dim="
658  << cell_dim << std::endl;
659  os << "component name=o type=SigmoidComponent dim="
660  << cell_dim << std::endl;
661  os << "component name=g type=TanhComponent dim="
662  << cell_dim << std::endl;
663  os << "component name=h type=TanhComponent dim="
664  << cell_dim << std::endl;
665  os << "component name=c1 type=ElementwiseProductComponent "
666  << " input-dim=" << 2 * cell_dim
667  << " output-dim=" << cell_dim << std::endl;
668  os << "component name=c2 type=ElementwiseProductComponent "
669  << " input-dim=" << 2 * cell_dim
670  << " output-dim=" << cell_dim << std::endl;
671  os << "component name=m type=ElementwiseProductComponent "
672  << " input-dim=" << 2 * cell_dim
673  << " output-dim=" << cell_dim << std::endl;
674  os << "component name=c type=BackpropTruncationComponent dim="
675  << cell_dim
676  << " scale=" << scale
677  << " clipping-threshold=" << clipping_threshold
678  << " zeroing-threshold=" << zeroing_threshold
679  << " zeroing-interval=" << zeroing_interval
680  << " recurrence-interval=1" << std::endl;
681  os << "component name=r type=BackpropTruncationComponent dim="
682  << projection_dim
683  << " scale=" << scale
684  << " clipping-threshold=" << clipping_threshold
685  << " zeroing-threshold=" << zeroing_threshold
686  << " zeroing-interval=" << zeroing_interval
687  << " recurrence-interval=1" << std::endl;
688 
689  // Defining the computations
690  std::ostringstream temp_string_stream;
691  for (size_t i = 0; i < splice_context.size(); i++) {
692  int32 offset = splice_context[i];
693  temp_string_stream << "Offset(input, " << offset << ")";
694  if (i + 1 < splice_context.size())
695  temp_string_stream << ", ";
696  }
697  std::string spliced_input = temp_string_stream.str();
698 
699  int32 offset = RandInt(-3, 3);
700  if (offset == 0)
701  offset = -1;
702 
703 
704  std::string c_tminus1;
705  {
706  std::ostringstream os_temp;
707  os_temp << "IfDefined(Offset(c_t, " << offset << "))";
708  c_tminus1 = os_temp.str();
709  }
710  os << "component-node name=c_t component=c input=Sum(c1_t, c2_t)\n";
711 
712  // i_t
713  os << "component-node name=i1 component=Wi-xr input=Append("
714  << spliced_input << ", IfDefined(Offset(r_t, " << offset << ")))\n";
715  os << "component-node name=i2 component=Wic "
716  << " input=" << c_tminus1 << std::endl;
717  os << "component-node name=i_t component=i input=Sum(i1, i2)\n";
718 
719  // f_t
720  os << "component-node name=f1 component=Wf-xr input=Append("
721  << spliced_input << ", IfDefined(Offset(r_t, " << offset << ")))\n";
722  os << "component-node name=f2 component=Wfc "
723  << " input=" << c_tminus1 << std::endl;
724  os << "component-node name=f_t component=f input=Sum(f1, f2)\n";
725 
726  // o_t
727  os << "component-node name=o1 component=Wo-xr input=Append("
728  << spliced_input << ", IfDefined(Offset(r_t, " << offset << ")))\n";
729  os << "component-node name=o2 component=Woc input=Sum(c1_t, c2_t)\n";
730  os << "component-node name=o_t component=o input=Sum(o1, o2)\n";
731 
732  // h_t
733  os << "component-node name=h_t component=h input=Sum(c1_t, c2_t)\n";
734 
735  // g_t
736  os << "component-node name=g1 component=Wc-xr input=Append("
737  << spliced_input << ", IfDefined(Offset(r_t, " << offset << ")))\n";
738  os << "component-node name=g_t component=g input=g1\n";
739 
740  // parts of c_t
741  os << "component-node name=c1_t component=c1 "
742  << " input=Append(f_t, " << c_tminus1 << ")\n";
743  os << "component-node name=c2_t component=c2 input=Append(i_t, g_t)\n";
744 
745  // m_t
746  os << "component-node name=m_t component=m input=Append(o_t, h_t)\n";
747 
748  // r_t and p_t
749  os << "component-node name=rp_t component=W-m input=m_t\n";
750  // Splitting outputs of Wy- node
751  os << "dim-range-node name=r_t_pretrunc input-node=rp_t dim-offset=0 "
752  << "dim=" << projection_dim << std::endl;
753  os << "component-node name=r_t component=r input=r_t_pretrunc\n";
754 
755  // y_t
756  os << "component-node name=y_t component=Wy- input=rp_t\n";
757 
758  // Final affine transform
759  os << "component-node name=final_affine component=final_affine input=y_t\n";
760  os << "component-node name=posteriors component=logsoftmax input=final_affine\n";
761  os << "output-node name=output input=posteriors\n";
762  configs->push_back(os.str());
763 }
764 
765 // This is a different LSTM config where computation is bunched according
766 // to inputs this is not complete, it is left here for future comparisons
768  const NnetGenerationOptions &opts,
769  std::vector<std::string> *configs) {
770  KALDI_ERR << "Not Implemented";
771  std::ostringstream os;
772 
773  std::vector<int32> splice_context;
774  for (int32 i = -5; i < 4; i++)
775  if (Rand() % 3 == 0)
776  splice_context.push_back(i);
777  if (splice_context.empty())
778  splice_context.push_back(0);
779 
780  int32 input_dim = 10 + Rand() % 20,
781  spliced_dim = input_dim * splice_context.size(),
782  output_dim = (opts.output_dim > 0 ?
783  opts.output_dim :
784  100 + Rand() % 200),
785  cell_dim = 40 + Rand() % 50,
786  projection_dim = std::ceil(cell_dim / (Rand() % 10 + 2));
787 
788  int32 offset = RandInt(-3, 3);
789  if (offset == 0)
790  offset = -1;
791 
792  os << "input-node name=input dim=" << input_dim << std::endl;
793  // Parameter Definitions W*(* replaced by - to have valid names)
794  os << "component name=W-x type=NaturalGradientAffineComponent input-dim="
795  << spliced_dim << " output-dim=" << 4 * cell_dim << std::endl;
796  os << "component name=W-r type=NaturalGradientAffineComponent input-dim="
797  << projection_dim << " output-dim=" << 4 * cell_dim << std::endl;
798  os << "component name=W-m type=NaturalGradientAffineComponent input-dim="
799  << cell_dim << " output-dim=" << 2 * projection_dim << std::endl;
800  os << "component name=Wyr type=NaturalGradientAffineComponent input-dim="
801  << projection_dim << " output-dim=" << cell_dim << std::endl;
802  os << "component name=Wyp type=NaturalGradientAffineComponent input-dim="
803  << projection_dim << " output-dim=" << cell_dim << std::endl;
804  // Defining the diagonal matrices
805  os << "component name=Wic type=PerElementScaleComponent "
806  << " dim=" << cell_dim << std::endl;
807  os << "component name=Wfc type=PerElementScaleComponent "
808  << " dim=" << cell_dim << std::endl;
809  os << "component name=Woc type=PerElementScaleComponent "
810  << " dim=" << cell_dim << std::endl;
811  // Defining the final affine transform
812  os << "component name=final_affine type=NaturalGradientAffineComponent "
813  << "input-dim=" << cell_dim << " output-dim=" << output_dim << std::endl;
814  os << "component name=logsoftmax type=LogSoftmaxComponent dim="
815  << output_dim << std::endl;
816 
817  // Defining the non-linearities
818  // declare a no-op component so that we can use a sum descriptor's output
819  // multiple times, and to make the config more readable given the equations
820  os << "component name=c_t type=NoOpComponent dim="
821  << cell_dim << std::endl;
822  os << "component name=i_t type=SigmoidComponent dim="
823  << cell_dim << std::endl;
824  os << "component name=f_t type=SigmoidComponent dim="
825  << cell_dim << std::endl;
826  os << "component name=o_t type=SigmoidComponent dim="
827  << cell_dim << std::endl;
828  os << "component name=g type=TanhComponent dim="
829  << cell_dim << std::endl;
830  os << "component name=h type=TanhComponent dim="
831  << cell_dim << std::endl;
832  os << "component name=f_t-c_tminus1 type=ElementwiseProductComponent "
833  << " input-dim=" << 2 * cell_dim
834  << " output-dim=" << cell_dim << std::endl;
835  os << "component name=i_t-g type=ElementwiseProductComponent "
836  << " input-dim=" << 2 * cell_dim
837  << " output-dim=" << cell_dim << std::endl;
838  os << "component name=m_t type=ElementwiseProductComponent "
839  << " input-dim=" << 2 * cell_dim
840  << " output-dim=" << cell_dim << std::endl;
841 
842 
843  // Defining the computations
844  os << "component-node name=W-x component=W-x input=Append(";
845  for (size_t i = 0; i < splice_context.size(); i++) {
846  int32 offset = splice_context[i];
847  os << "Offset(input, " << offset << ")";
848  if (i + 1 < splice_context.size())
849  os << ", ";
850  }
851  os << ")\n";
852 
853  os << "component-node name=W-r component=W-r input=IfDefined(Offset(r_t"
854  << offset << "))\n";
855  os << "component-node name=W-m component=W-m input=m_t \n";
856  os << "component-node name=Wic component=Wic input=IfDefined(Offset(c_t"
857  << offset << "))\n";
858  os << "component-node name=Wfc component=Wfc input=IfDefined(Offset(c_t"
859  << offset << "))\n";
860  os << "component-node name=Woc component=Woc input=c_t\n";
861 
862  // Splitting the outputs of W*m node
863  os << "dim-range-node name=r_t input-node=W-m dim-offset=0 "
864  << "dim=" << projection_dim << std::endl;
865  os << "dim-range-node name=p_t input-node=W-m dim-offset=" << projection_dim
866  << " dim=" << projection_dim << std::endl;
867 
868  // Splitting outputs of W*x node
869  os << "dim-range-node name=W_ix-x_t input-node=W-x dim-offset=0 "
870  << "dim=" << cell_dim << std::endl;
871  os << "dim-range-node name=W_fx-x_t input-node=W-x "
872  << "dim-offset=" << cell_dim << " dim="<<cell_dim << std::endl;
873  os << "dim-range-node name=W_cx-x_t input-node=W-x "
874  << "dim-offset=" << 2 * cell_dim << " dim="<<cell_dim << std::endl;
875  os << "dim-range-node name=W_ox-x_t input-node=W-x "
876  << "dim-offset=" << 3 * cell_dim << " dim="<<cell_dim << std::endl;
877 
878  // Splitting outputs of W*r node
879  os << "dim-range-node name=W_ir-r_tminus1 input-node=W-r dim-offset=0 "
880  << "dim=" << cell_dim << std::endl;
881  os << "dim-range-node name=W_fr-r_tminus1 input-node=W-r "
882  << "dim-offset=" << cell_dim << " dim="<<cell_dim << std::endl;
883  os << "dim-range-node name=W_cr-r_tminus1 input-node=W-r "
884  << "dim-offset=" << 2 * cell_dim << " dim="<<cell_dim << std::endl;
885  os << "dim-range-node name=W_or-r_tminus1 input-node=W-r "
886  << "dim-offset=" << 3 * cell_dim << " dim="<<cell_dim << std::endl;
887 
888  // Non-linear operations
889  os << "component-node name=c_t component=c_t input=Sum(f_t-c_tminus1, i_t-g)\n";
890  os << "component-node name=h component=h input=c_t\n";
891  os << "component-node name=i_t component=i_t input=Sum(W_ix-x_t, Sum(W_ir-r_tminus1, Wic))\n";
892  os << "component-node name=f_t component=f_t input=Sum(W_fx-x_t, Sum(W_fr-r_tminus1, Wfc))\n";
893  os << "component-node name=o_t component=o_t input=Sum(W_ox-x_t, Sum(W_or-r_tminus1, Woc))\n";
894  os << "component-node name=f_t-c_tminus1 component=f_t-c_tminus1 input=Append(f_t, Offset(c_t"
895  << offset << "))\n";
896  os << "component-node name=i_t-g component=i_t-g input=Append(i_t, g)\n";
897  os << "component-node name=m_t component=m_t input=Append(o_t, h)\n";
898 
899  os << "component-node name=g component=g input=Sum(W_cx-x_t, W_cr-r_tminus1)\n";
900 
901  // Final affine transform
902  os << "component-node name=Wyr component=Wyr input=r_t\n";
903  os << "component-node name=Wyp component=Wyp input=p_t\n";
904 
905  os << "component-node name=final_affine component=final_affine input=Sum(Wyr, Wyp)\n";
906 
907  os << "component-node name=posteriors component=logsoftmax input=final_affine\n";
908  os << "output-node name=output input=posteriors\n";
909 
910  configs->push_back(os.str());
911 }
912 
914  const NnetGenerationOptions &opts,
915  std::vector<std::string> *configs) {
916  std::ostringstream os;
917 
918 
919  int32 input_x_dim = 10 + Rand() % 20,
920  input_y_dim = 10 + Rand() % 20,
921  input_z_dim = 3 + Rand() % 10,
922  filt_x_dim = 1 + Rand() % input_x_dim,
923  filt_y_dim = 1 + Rand() % input_y_dim,
924  num_filters = 10 + Rand() % 20,
925  filt_x_step = (1 + Rand() % filt_x_dim),
926  filt_y_step = (1 + Rand() % filt_y_dim);
927  int32 remainder = (input_x_dim - filt_x_dim) % filt_x_step;
928  // adjusting input_x_dim to ensure divisibility
929  input_x_dim = input_x_dim - remainder;
930  remainder = (input_y_dim - filt_y_dim) % filt_y_step;
931  // adjusting input_x_dim to ensure divisibility
932  input_y_dim = input_y_dim - remainder;
933 
934  int32 input_vectorization = Rand() % 2;
935  std::string vectorization;
936  if (input_vectorization == 0) {
937  vectorization = "yzx";
938  } else {
939  vectorization = "zyx";
940  }
941 
942  os << "component name=conv type=ConvolutionComponent "
943  << " input-x-dim=" << input_x_dim
944  << " input-y-dim=" << input_y_dim
945  << " input-z-dim=" << input_z_dim
946  << " filt-x-dim=" << filt_x_dim
947  << " filt-y-dim=" << filt_y_dim
948  << " filt-x-step=" << filt_x_step
949  << " filt-y-step=" << filt_y_step
950  << " num-filters=" << num_filters
951  << " input-vectorization-order=" << vectorization
952  << std::endl;
953 
954  int32 conv_output_x_dim = (1 + (input_x_dim - filt_x_dim) / filt_x_step);
955  int32 conv_output_y_dim = (1 + (input_y_dim - filt_y_dim) / filt_y_step);
956  int32 conv_output_z_dim = num_filters;
957  int32 pool_x_size = 1 + Rand() % conv_output_x_dim;
958  int32 pool_y_size = 1 + Rand() % conv_output_y_dim;
959  int32 pool_z_size = 1 + Rand() % conv_output_z_dim;
960  int32 pool_x_step = 1;
961  int32 pool_y_step = 1;
962  int32 pool_z_step = 1;
963  do {
964  pool_x_step = (1 + Rand() % pool_x_size);
965  } while((conv_output_x_dim - pool_x_size) % pool_x_step);
966  do {
967  pool_y_step = (1 + Rand() % pool_y_size);
968  } while((conv_output_y_dim - pool_y_size) % pool_y_step);
969  do {
970  pool_z_step = (1 + Rand() % pool_z_size);
971  } while((conv_output_z_dim - pool_z_size) % pool_z_step);
972 
973  os << "component name=maxpooling type=MaxpoolingComponent "
974  << " input-x-dim=" << conv_output_x_dim
975  << " input-y-dim=" << conv_output_y_dim
976  << " input-z-dim=" << conv_output_z_dim
977  << " pool-x-size=" << pool_x_size
978  << " pool-y-size=" << pool_y_size
979  << " pool-z-size=" << pool_z_size
980  << " pool-x-step=" << pool_x_step
981  << " pool-y-step=" << pool_y_step
982  << " pool-z-step=" << pool_z_step
983  << std::endl;
984 
985  os << "input-node name=input dim=" << (input_x_dim * input_y_dim * input_z_dim) << std::endl;
986  os << "component-node name=conv_node component=conv input=input\n";
987  os << "component-node name=maxpooling_node component=maxpooling input=conv_node\n";
988  os << "output-node name=output input=conv_node\n";
989  configs->push_back(os.str());
990 }
991 
992 
993 
995  const NnetGenerationOptions &opts,
996  std::vector<std::string> *configs) {
997  std::ostringstream ss;
998 
999 
1000  int32 cur_height = RandInt(5, 15),
1001  cur_num_filt = RandInt(1, 3),
1002  num_layers = RandInt(0, 3);
1003  // note: generating zero layers is a bit odd but it exercises some code that
1004  // we otherwise wouldn't exercise.
1005 
1006 
1007  std::string cur_layer_descriptor = "input";
1008 
1009  { // input layer.
1010  ss << "input-node name=input dim=" << (cur_height * cur_num_filt)
1011  << std::endl;
1012  }
1013 
1014 
1015  for (int32 l = 0; l < num_layers; l++) {
1016  int32 next_num_filt = RandInt(1, 10);
1017 
1018  bool height_padding = (cur_height < 5 || RandInt(0, 1) == 0);
1019  int32 height_subsampling_factor = RandInt(1, 2);
1020  if (cur_height < 4) {
1021  // output height of 1 causes a problem with unused height-offsets,
1022  // so don't subsample in that case.
1023  height_subsampling_factor = 1;
1024  }
1025 
1026  int32 next_height = cur_height;
1027  if (!height_padding) {
1028  next_height -= 2; // the kernel will have height 3.
1029  }
1030  next_height = (next_height + height_subsampling_factor - 1) /
1031  height_subsampling_factor;
1032 
1033  if (next_height == cur_height && RandInt(0, 1) == 0) {
1034  // ensure that with sufficient frequency, we have the
1035  // same height and num-filt out; this enables ResNet-style
1036  // addition.
1037  next_num_filt = cur_num_filt;
1038  }
1039 
1040  std::string time_offsets, required_time_offsets;
1041  if (RandInt(0, 3) == 0) {
1042  time_offsets = "0";
1043  required_time_offsets = (RandInt(0, 1) == 0 ? "" : "0");
1044  } else if (RandInt(0, 1) == 0) {
1045  time_offsets = "-1,0,1";
1046  required_time_offsets = (RandInt(0, 1) == 0 ? "" : "-1");
1047  } else {
1048  time_offsets = "-2,0,2";
1049  required_time_offsets = (RandInt(0, 1) == 0 ? "" : "0");
1050  }
1051 
1052  ss << "component type=TimeHeightConvolutionComponent name=layer" << l << "-conv "
1053  << "num-filters-in=" << cur_num_filt
1054  << " num-filters-out=" << next_num_filt
1055  << " height-in=" << cur_height
1056  << " height-out=" << next_height
1057  << " height-offsets=" << (height_padding ? "-1,0,1" : "0,1,2")
1058  << " time-offsets=" << time_offsets;
1059 
1060  if (RandInt(0, 1) == 0) {
1061  // this limits the 'temp memory' usage to 100
1062  // bytes, which will test another code path where
1063  // it breaks up the temporary matrix into pieces
1064  ss << " max-memory-mb=1.0e-04";
1065  }
1066 
1067  if (height_subsampling_factor != 1 || RandInt(0, 1) == 0)
1068  ss << " height-subsample-out=" << height_subsampling_factor;
1069  if (required_time_offsets == "" && RandInt(0, 1) == 0) {
1070  required_time_offsets = time_offsets;
1071  // it should default to this, but we're exercising more of the config
1072  // parsing code this way.
1073  }
1074  if (required_time_offsets != "")
1075  ss << " required-time-offsets=" << required_time_offsets;
1076  if (RandInt(0, 1) == 0)
1077  ss << " param-stddev=0.1 bias-stddev=1";
1078  if (RandInt(0, 1) == 0)
1079  ss << " use-natural-gradient=false";
1080  if (RandInt(0, 1) == 0)
1081  ss << " rank-in=4";
1082  if (RandInt(0, 1) == 0)
1083  ss << " rank-out=4";
1084  if (RandInt(0, 1) == 0)
1085  ss << " alpha-in=2.0";
1086  if (RandInt(0, 1) == 0)
1087  ss << " alpha-out=2.0";
1088  ss << std::endl;
1089 
1090  ss << "component-node name=layer" << l << "-conv component=layer"
1091  << l << "-conv input=" << cur_layer_descriptor << std::endl;
1092 
1093  bool use_relu = false;
1094  if (use_relu) {
1095  ss << "component type=RectifiedLinearComponent name=layer" << l
1096  << "-relu dim=" << (next_height * next_num_filt) << std::endl;
1097  ss << "component-node name=layer" << l << "-relu component=layer"
1098  << l << "-relu input=layer" << l << "-conv" << std::endl;
1099  }
1100 
1101  std::ostringstream desc_ss;
1102  if (next_height == cur_height && next_num_filt == cur_num_filt
1103  && RandInt(0, 1) == 0) {
1104  desc_ss << "Sum(" << cur_layer_descriptor << ", layer" << l
1105  << (use_relu ? "-relu)" : "-conv)");
1106  } else {
1107  desc_ss << "layer" << l << (use_relu ? "-relu" : "-conv");
1108  }
1109 
1110  if (RandInt(0, 3) == 0) {
1111  std::ostringstream round_desc_ss;
1112  int32 modulus = RandInt(2, 3);
1113  round_desc_ss << "Round(" << desc_ss.str() << ", " << modulus << ")";
1114  cur_layer_descriptor = round_desc_ss.str();
1115  } else {
1116  cur_layer_descriptor = desc_ss.str();
1117  }
1118  cur_height = next_height;
1119  cur_num_filt = next_num_filt;
1120  }
1121 
1122  ss << "output-node name=output input=" << cur_layer_descriptor << std::endl;
1123 
1124 
1125  configs->push_back(ss.str());
1126 }
1127 
1128 
1129 
1131  const NnetGenerationOptions &opts,
1132  std::vector<std::string> *configs) {
1133  std::ostringstream ss;
1134 
1135 
1136  int32 input_dim = RandInt(100, 150),
1137  num_heads = RandInt(1, 2),
1138  key_dim = RandInt(20, 40),
1139  value_dim = RandInt(20, 40),
1140  time_stride = RandInt(1, 3),
1141  num_left_inputs = RandInt(1, 4),
1142  num_right_inputs = RandInt(0, 2),
1143  num_left_inputs_required = RandInt(0, num_left_inputs),
1144  num_right_inputs_required = RandInt(0, num_right_inputs);
1145  bool output_context = (RandInt(0, 1) == 0);
1146  int32 context_dim = (num_left_inputs + 1 + num_right_inputs),
1147  query_dim = key_dim + context_dim;
1148  int32 attention_input_dim = num_heads * (key_dim + value_dim + query_dim);
1149 
1150  std::string cur_layer_descriptor = "input";
1151 
1152  { // input layer.
1153  ss << "input-node name=input dim=" << input_dim
1154  << std::endl;
1155  }
1156 
1157  { // affine component
1158  ss << "component name=affine type=NaturalGradientAffineComponent input-dim="
1159  << input_dim << " output-dim=" << attention_input_dim << std::endl;
1160  ss << "component-node name=affine component=affine input=input"
1161  << std::endl;
1162  }
1163 
1164  { // attention component
1165  ss << "component-node name=attention component=attention input=affine"
1166  << std::endl;
1167  ss << "component name=attention type=RestrictedAttentionComponent"
1168  << " num-heads=" << num_heads << " key-dim=" << key_dim
1169  << " value-dim=" << value_dim << " time-stride=" << time_stride
1170  << " num-left-inputs=" << num_left_inputs << " num-right-inputs="
1171  << num_right_inputs << " num-left-inputs-required="
1172  << num_left_inputs_required << " num-right-inputs-required="
1173  << num_right_inputs_required
1174  << " output-context=" << (output_context ? "true" : "false")
1175  << (RandInt(0, 1) == 0 ? " key-scale=1.0" : "")
1176  << std::endl;
1177  }
1178 
1179  { // output
1180  ss << "output-node name=output input=attention" << std::endl;
1181  }
1182  configs->push_back(ss.str());
1183 }
1184 
1185 
1186 // generates a config sequence involving DistributeComponent.
1188  const NnetGenerationOptions &opts,
1189  std::vector<std::string> *configs) {
1190  int32 output_dim = (opts.output_dim > 0 ? opts.output_dim : 100);
1191  int32 x_expand = RandInt(1, 5), after_expand_dim = RandInt(10, 20),
1192  input_dim = x_expand * after_expand_dim;
1193  std::ostringstream os;
1194  os << "input-node name=input dim=" << input_dim << std::endl;
1195  os << "component name=distribute type=DistributeComponent input-dim="
1196  << input_dim << " output-dim=" << after_expand_dim << std::endl;
1197  os << "component-node name=distribute component=distribute input=input\n";
1198  os << "component name=affine type=AffineComponent input-dim="
1199  << after_expand_dim << " output-dim=" << output_dim << std::endl;
1200  os << "component-node name=affine component=affine input=distribute\n";
1201  os << "output-node name=output input=Sum(";
1202  for (int32 i = 0; i < x_expand; i++) {
1203  if (i > 0) os << ", ";
1204  os << "ReplaceIndex(affine, x, " << i << ")";
1205  }
1206  os << ")\n";
1207  configs->push_back(os.str());
1208 }
1209 
1214  std::vector<std::string> *configs) {
1215  int32 num_components = RandInt(1,5);
1216  int32 input_dim = 10 * RandInt(1,10);
1217  if (opts.output_dim > 0) {
1218  KALDI_WARN << "This function doesn't take a requested output_dim due to "
1219  "implementation complications.";
1220  }
1221  int32 max_rows_process = 512 + 512 * RandInt(1,3);
1222  std::ostringstream os;
1223  os << "component name=composite1 type=CompositeComponent max-rows-process="
1224  << max_rows_process << " num-components=" << num_components;
1225 
1226  int32 types_length = 3;
1227  std::string types[] = {"BlockAffineComponent",
1228  "RepeatedAffineComponent",
1229  "NaturalGradientRepeatedAffineComponent"};
1230  int32 last_output_dim = input_dim;
1231  // components within a composite component are indexed from 1.
1232  for(int32 i = 1; i <= num_components; i++) {
1233  os << " component" << i << "=";
1234  int32 rand_index = RandInt(0, types_length - 1);
1235  std::string rand_type = types[rand_index];
1236  os << "'type=" << rand_type << " input-dim=" << last_output_dim;
1237  int32 current_output_dim = 10 * RandInt(1,10);
1238  // must be a divisor or current_output_dim and last_output_dim
1239  int32 num_repeats = 10;
1240  os << " output-dim=" << current_output_dim;
1241  std::string repeats_string = (rand_type == "BlockAffineComponent") ? "num-blocks": "num-repeats";
1242  os << " " << repeats_string << "=" << num_repeats << "'";
1243  last_output_dim = current_output_dim;
1244  }
1245  os << std::endl << std::endl;
1246  os << "input-node name=input dim=" << input_dim << std::endl;
1247  os << "component-node name=composite1 component=composite1 input=input\n";
1248  os << "output-node name=output input=composite1\n";
1249  configs->push_back(os.str());
1250 }
1251 
1253  const NnetGenerationOptions &opts,
1254  std::vector<std::string> *configs) {
1255 start:
1256  int32 network_type = RandInt(0, 14);
1257  switch(network_type) {
1258  case 0:
1259  GenerateConfigSequenceSimplest(opts, configs);
1260  break;
1261  case 1:
1262  if (!opts.allow_context)
1263  goto start;
1264  GenerateConfigSequenceSimpleContext(opts, configs);
1265  break;
1266  case 2:
1267  if (!opts.allow_context || !opts.allow_nonlinearity)
1268  goto start;
1269  GenerateConfigSequenceSimple(opts, configs);
1270  break;
1271  case 3:
1272  if (!opts.allow_recursion || !opts.allow_context ||
1273  !opts.allow_nonlinearity)
1274  goto start;
1275  GenerateConfigSequenceRnn(opts, configs);
1276  break;
1277  case 4:
1278  if (!opts.allow_recursion || !opts.allow_context ||
1279  !opts.allow_nonlinearity)
1280  goto start;
1281  GenerateConfigSequenceRnnClockwork(opts, configs);
1282  break;
1283  case 5:
1284  if (!opts.allow_recursion || !opts.allow_context ||
1285  !opts.allow_nonlinearity)
1286  goto start;
1287  GenerateConfigSequenceLstm(opts, configs);
1288  break;
1289  case 6:
1290  if (!opts.allow_recursion || !opts.allow_context ||
1291  !opts.allow_nonlinearity)
1292  goto start;
1293  GenerateConfigSequenceLstm(opts, configs);
1294  break;
1295  case 7:
1296  if (!opts.allow_nonlinearity)
1297  goto start;
1298  GenerateConfigSequenceCnn(opts, configs);
1299  break;
1300  case 8:
1301  if (!opts.allow_use_of_x_dim)
1302  goto start;
1303  GenerateConfigSequenceDistribute(opts, configs);
1304  break;
1305  case 9:
1306  GenerateConfigSequenceCompositeBlock(opts, configs);
1307  break;
1308  case 10:
1309  if (!opts.allow_statistics_pooling)
1310  goto start;
1311  GenerateConfigSequenceStatistics(opts, configs);
1312  break;
1313  case 11:
1314  if (!opts.allow_recursion || !opts.allow_context ||
1315  !opts.allow_nonlinearity)
1316  goto start;
1318  break;
1319  // We're allocating more case statements to the most recently
1320  // added type of model, to give more thorough testing where
1321  // it's needed most.
1322  case 12:
1323  if (!opts.allow_nonlinearity || !opts.allow_context)
1324  goto start;
1325  GenerateConfigSequenceCnnNew(opts, configs);
1326  break;
1327  case 13: case 14:
1328  if (!opts.allow_nonlinearity || !opts.allow_context)
1329  goto start;
1331  break;
1332  default:
1333  KALDI_ERR << "Error generating config sequence.";
1334  }
1335  KALDI_ASSERT(!configs->empty());
1336 }
1337 
1339  const Nnet &nnet,
1340  ComputationRequest *request,
1341  std::vector<Matrix<BaseFloat> > *inputs) {
1342  KALDI_ASSERT(IsSimpleNnet(nnet));
1343 
1344  int32 left_context, right_context;
1345  ComputeSimpleNnetContext(nnet, &left_context, &right_context);
1346 
1347  int32 num_output_frames = 1 + Rand() % 10,
1348  output_start_frame = Rand() % 10,
1349  num_examples = 1 + Rand() % 4,
1350  output_end_frame = output_start_frame + num_output_frames,
1351  input_start_frame = output_start_frame - left_context - (Rand() % 3),
1352  input_end_frame = output_end_frame + right_context + (Rand() % 3),
1353  n_offset = Rand() % 2;
1354  bool need_deriv = (Rand() % 2 == 0);
1355  // make sure there are at least 3 frames of input available. this makes a
1356  // difference for our tests of statistics-pooling and statistics-extraction
1357  // component.
1358  if (input_end_frame < input_start_frame + 3)
1359  input_end_frame = input_start_frame + 3;
1360 
1361  request->inputs.clear();
1362  request->outputs.clear();
1363  inputs->clear();
1364 
1365  std::vector<Index> input_indexes, ivector_indexes, output_indexes;
1366  for (int32 n = n_offset; n < n_offset + num_examples; n++) {
1367  for (int32 t = input_start_frame; t < input_end_frame; t++)
1368  input_indexes.push_back(Index(n, t, 0));
1369  for (int32 t = output_start_frame; t < output_end_frame; t++)
1370  output_indexes.push_back(Index(n, t, 0));
1371  ivector_indexes.push_back(Index(n, 0, 0));
1372  }
1373  request->outputs.push_back(IoSpecification("output", output_indexes));
1374  if (need_deriv || (Rand() % 3 == 0))
1375  request->outputs.back().has_deriv = true;
1376  request->inputs.push_back(IoSpecification("input", input_indexes));
1377  if (need_deriv && (Rand() % 2 == 0))
1378  request->inputs.back().has_deriv = true;
1379  int32 input_dim = nnet.InputDim("input");
1380  KALDI_ASSERT(input_dim > 0);
1381  inputs->push_back(
1382  Matrix<BaseFloat>((input_end_frame - input_start_frame) * num_examples,
1383  input_dim));
1384  inputs->back().SetRandn();
1385  int32 ivector_dim = nnet.InputDim("ivector"); // may not exist.
1386  if (ivector_dim != -1) {
1387  request->inputs.push_back(IoSpecification("ivector", ivector_indexes));
1388  inputs->push_back(Matrix<BaseFloat>(num_examples, ivector_dim));
1389  inputs->back().SetRandn();
1390  if (need_deriv && (Rand() % 2 == 0))
1391  request->inputs.back().has_deriv = true;
1392  }
1393  if (Rand() % 2 == 0)
1394  request->need_model_derivative = need_deriv;
1395  if (Rand() % 2 == 0)
1396  request->store_component_stats = true;
1397 }
1398 
1399 
1400 static void GenerateRandomComponentConfig(std::string *component_type,
1401  std::string *config) {
1402 
1403  int32 n = RandInt(0, 37);
1404  BaseFloat learning_rate = 0.001 * RandInt(1, 100);
1405 
1406  std::ostringstream os;
1407  switch(n) {
1408  case 0: {
1409  *component_type = "PnormComponent";
1410  int32 output_dim = RandInt(1, 50), group_size = RandInt(1, 15),
1411  input_dim = output_dim * group_size;
1412  os << "input-dim=" << input_dim << " output-dim=" << output_dim;
1413  break;
1414  }
1415  case 1: {
1416  BaseFloat target_rms = (RandInt(1, 200) / 100.0);
1417  std::string add_log_stddev = (Rand() % 2 == 0 ? "True" : "False");
1418  *component_type = "NormalizeComponent";
1419 
1420  int32 block_dim = RandInt(2, 50), num_blocks = RandInt(1, 3),
1421  dim = block_dim * num_blocks;
1422  // avoid dim=1 because the derivatives would be zero, which
1423  // makes them hard to test.
1424  os << "dim=" << dim << " block-dim=" << block_dim
1425  << " target-rms=" << target_rms
1426  << " add-log-stddev=" << add_log_stddev;
1427  break;
1428  }
1429  case 2: {
1430  *component_type = "SigmoidComponent";
1431  os << "dim=" << RandInt(1, 50);
1432  break;
1433  }
1434  case 3: {
1435  *component_type = "TanhComponent";
1436  os << "dim=" << RandInt(1, 50);
1437  break;
1438  }
1439  case 4: {
1440  *component_type = "RectifiedLinearComponent";
1441  os << "dim=" << RandInt(1, 50);
1442  break;
1443  }
1444  case 5: {
1445  *component_type = "SoftmaxComponent";
1446  os << "dim=" << RandInt(1, 50);
1447  break;
1448  }
1449  case 6: {
1450  *component_type = "LogSoftmaxComponent";
1451  os << "dim=" << RandInt(1, 50);
1452  break;
1453  }
1454  case 7: {
1455  *component_type = "NoOpComponent";
1456  os << "dim=" << RandInt(1, 50);
1457  break;
1458  }
1459  case 8: {
1460  *component_type = "FixedAffineComponent";
1461  int32 input_dim = RandInt(1, 50), output_dim = RandInt(1, 50);
1462  os << "input-dim=" << input_dim << " output-dim=" << output_dim;
1463  break;
1464  }
1465  case 9: {
1466  *component_type = "AffineComponent";
1467  int32 input_dim = RandInt(1, 50), output_dim = RandInt(1, 50);
1468  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1469  << " learning-rate=" << learning_rate;
1470  break;
1471  }
1472  case 10: {
1473  *component_type = "NaturalGradientAffineComponent";
1474  int32 input_dim = RandInt(1, 50), output_dim = RandInt(1, 50);
1475  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1476  << " learning-rate=" << learning_rate;
1477  break;
1478  }
1479  case 11: {
1480  *component_type = "SumGroupComponent";
1481  std::vector<int32> sizes;
1482  int32 num_groups = RandInt(1, 50);
1483  os << "sizes=";
1484  for (int32 i = 0; i < num_groups; i++) {
1485  os << RandInt(1, 5);
1486  if (i + 1 < num_groups)
1487  os << ',';
1488  }
1489  break;
1490  }
1491  case 12: {
1492  *component_type = "FixedScaleComponent";
1493  os << "dim=" << RandInt(1, 100);
1494  break;
1495  }
1496  case 13: {
1497  *component_type = "FixedBiasComponent";
1498  os << "dim=" << RandInt(1, 100);
1499  break;
1500  }
1501  case 14: {
1502  *component_type = "NaturalGradientPerElementScaleComponent";
1503  os << "dim=" << RandInt(1, 100)
1504  << " learning-rate=" << learning_rate;
1505  break;
1506  }
1507  case 15: {
1508  *component_type = "PerElementScaleComponent";
1509  os << "dim=" << RandInt(1, 100)
1510  << " learning-rate=" << learning_rate;
1511  break;
1512  }
1513  case 16: {
1514  *component_type = "ElementwiseProductComponent";
1515  int32 output_dim = RandInt(1, 100), multiple = RandInt(2, 4),
1516  input_dim = output_dim * multiple;
1517  os << "input-dim=" << input_dim << " output-dim=" << output_dim;
1518  break;
1519  }
1520  case 17: {
1521  int32 input_vectorization = Rand() % 2;
1522  std::string vectorization;
1523  if (input_vectorization == 0) {
1524  vectorization = "yzx";
1525  } else {
1526  vectorization = "zyx";
1527  }
1528  *component_type = "ConvolutionComponent";
1529  int32 input_x_dim = 10 + Rand() % 20,
1530  input_y_dim = 10 + Rand() % 20,
1531  input_z_dim = 3 + Rand() % 10,
1532  filt_x_dim = 1 + Rand() % input_x_dim,
1533  filt_y_dim = 1 + Rand() % input_y_dim,
1534  num_filters = 1 + Rand() % 10,
1535  filt_x_step = (1 + Rand() % filt_x_dim),
1536  filt_y_step = (1 + Rand() % filt_y_dim);
1537  int32 remainder = (input_x_dim - filt_x_dim) % filt_x_step;
1538  // adjusting input_x_dim to ensure divisibility
1539  input_x_dim = input_x_dim - remainder;
1540  remainder = (input_y_dim - filt_y_dim) % filt_y_step;
1541  // adjusting input_x_dim to ensure divisibility
1542  input_y_dim = input_y_dim - remainder;
1543 
1544  os << "input-x-dim=" << input_x_dim
1545  << " input-y-dim=" << input_y_dim
1546  << " input-z-dim=" << input_z_dim
1547  << " filt-x-dim=" << filt_x_dim
1548  << " filt-y-dim=" << filt_y_dim
1549  << " filt-x-step=" << filt_x_step
1550  << " filt-y-step=" << filt_y_step
1551  << " num-filters=" << num_filters
1552  << " input-vectorization-order=" << vectorization
1553  << " learning-rate=" << learning_rate;
1554  break;
1555  // TODO : add test for file based initialization. But confirm how to write
1556  // a file which is not going to be overwritten by other components
1557  }
1558  case 18: {
1559  *component_type = "PermuteComponent";
1560  int32 input_dim = 10 + Rand() % 100;
1561  std::vector<int32> column_map(input_dim);
1562  for (int32 i = 0; i < input_dim; i++)
1563  column_map[i] = i;
1564  std::random_shuffle(column_map.begin(), column_map.end());
1565  std::ostringstream buffer;
1566  for (int32 i = 0; i < input_dim-1; i++)
1567  buffer << column_map[i] << ",";
1568  buffer << column_map.back();
1569  os << "column-map=" << buffer.str();
1570  break;
1571  }
1572  case 19: {
1573  *component_type = "PerElementOffsetComponent";
1574  std::string param_config = RandInt(0, 1)?
1575  " param-mean=0.0 param-stddev=0.0":
1576  " param-mean=1.0 param-stddev=1.0";
1577  int32 block_dim = RandInt(10, 20), dim = block_dim * RandInt(1, 2);
1578  os << "dim=" << dim << " block-dim=" << block_dim
1579  << " use-natural-gradient=" << (RandInt(0, 1) == 0 ? "true" : "false")
1580  << " learning-rate=" << learning_rate << param_config;
1581  break;
1582  }
1583  case 20: case 21: {
1584  *component_type = "CompositeComponent";
1585  int32 cur_dim = RandInt(20, 30), num_components = RandInt(1, 3),
1586  max_rows_process = RandInt(1, 30);
1587  os << "num-components=" << num_components
1588  << " max-rows-process=" << max_rows_process;
1589  std::vector<std::string> sub_configs;
1590  for (int32 i = 1; i <= num_components; i++) {
1591  if (RandInt(1, 3) == 1) {
1592  os << " component" << i << "='type=RectifiedLinearComponent dim="
1593  << cur_dim << "'";
1594  } else if (RandInt(1, 2) == 1) {
1595  os << " component" << i << "='type=TanhComponent dim="
1596  << cur_dim << "'";
1597  } else {
1598  int32 next_dim = RandInt(20, 30);
1599  os << " component" << i << "='type=AffineComponent input-dim="
1600  << cur_dim << " output-dim=" << next_dim << "'";
1601  cur_dim = next_dim;
1602  }
1603  }
1604  break;
1605  }
1606  case 22: {
1607  *component_type = "SumGroupComponent";
1608  int32 num_groups = RandInt(1, 50),
1609  input_dim = num_groups * RandInt(1, 15);
1610  os << "input-dim=" << input_dim << " output-dim=" << num_groups;
1611  break;
1612  }
1613  case 23: {
1614  *component_type = "RepeatedAffineComponent";
1615  int32 num_repeats = RandInt(1, 50),
1616  input_dim = num_repeats * RandInt(1, 15),
1617  output_dim = num_repeats * RandInt(1, 15);
1618  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1619  << " num-repeats=" << num_repeats;
1620  break;
1621  }
1622  case 24: {
1623  *component_type = "BlockAffineComponent";
1624  int32 num_blocks = RandInt(1, 50),
1625  input_dim = num_blocks * RandInt(1, 15),
1626  output_dim = num_blocks * RandInt(1, 15);
1627  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1628  << " num-blocks=" << num_blocks;
1629  break;
1630  }
1631  case 25: {
1632  *component_type = "NaturalGradientRepeatedAffineComponent";
1633  int32 num_repeats = RandInt(1, 50),
1634  input_dim = num_repeats * RandInt(1, 15),
1635  output_dim = num_repeats * RandInt(1, 15);
1636  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1637  << " num-repeats=" << num_repeats;
1638  break;
1639  }
1640  case 26: {
1641  *component_type = "MaxpoolingComponent";
1642  int32 input_x_dim = 5 + Rand() % 10,
1643  input_y_dim = 5 + Rand() % 10,
1644  input_z_dim = 5 + Rand() % 10;
1645  int32 pool_x_size = 1 + Rand() % input_x_dim,
1646  pool_y_size = 1 + Rand() % input_y_dim,
1647  pool_z_size = 1 + Rand() % input_z_dim;
1648  int32 pool_x_step = (1 + Rand() % pool_x_size),
1649  pool_y_step = (1 + Rand() % pool_y_size),
1650  pool_z_step = (1 + Rand() % pool_z_size);
1651  // adjusting input dim to ensure divisibility
1652  int32 remainder = (input_x_dim - pool_x_size) % pool_x_step;
1653  input_x_dim = input_x_dim - remainder;
1654  remainder = (input_y_dim - pool_y_size) % pool_y_step;
1655  input_y_dim = input_y_dim - remainder;
1656  remainder = (input_z_dim - pool_z_size) % pool_z_step;
1657  input_z_dim = input_z_dim - remainder;
1658  os << " input-x-dim=" << input_x_dim
1659  << " input-y-dim=" << input_y_dim
1660  << " input-z-dim=" << input_z_dim
1661  << " pool-x-size=" << pool_x_size
1662  << " pool-y-size=" << pool_y_size
1663  << " pool-z-size=" << pool_z_size
1664  << " pool-x-step=" << pool_x_step
1665  << " pool-y-step=" << pool_y_step
1666  << " pool-z-step=" << pool_z_step;
1667  break;
1668  }
1669  case 27: {
1670  *component_type = "ConstantFunctionComponent";
1671  int32 input_dim = RandInt(1, 50), output_dim = RandInt(1, 50);
1672  bool is_updatable = (RandInt(0, 1) == 0),
1673  use_natural_gradient = (RandInt(0, 1) == 0);
1674  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1675  << " learning-rate=" << learning_rate
1676  << " is-updatable=" << std::boolalpha << is_updatable
1677  << " use-natural-gradient=" << std::boolalpha << use_natural_gradient;
1678  break;
1679  }
1680  case 28: {
1681  *component_type = "ClipGradientComponent";
1682  os << "dim=" << RandInt(1, 50);
1683  os << " clipping-threshold=" << RandInt(1, 50)
1684  << " norm-based-clipping=" << (RandInt(0, 1) == 0 ? "false" : "true");
1685  if (RandInt(0, 1) == 1)
1686  os << " self-repair-scale="
1687  << (RandInt(0, 1) == 0 ? 0 : RandInt(1, 50));
1688  if (RandInt(0, 1) == 1)
1689  os << " self-repair-clipped-proportion-threshold=" << RandUniform();
1690  if (RandInt(0, 1) == 1)
1691  os << " self-repair-target=" << RandUniform();
1692  break;
1693  }
1694  case 29: {
1695  *component_type = "DropoutComponent";
1696  bool test_mode = (RandInt(0, 1) == 0);
1697  os << "dim=" << RandInt(1, 200)
1698  << " dropout-proportion=" << RandUniform() << " test-mode="
1699  << (test_mode ? "true" : "false");
1700  break;
1701  }
1702  case 30: {
1703  *component_type = "LstmNonlinearityComponent";
1704  // set self-repair scale to zero so the derivative tests will pass.
1705  os << "cell-dim=" << RandInt(1, 200)
1706  << " self-repair-scale=0.0";
1707  break;
1708  }
1709  // I think we'll get in the habit of allocating a larger number of case
1710  // labels to the most recently added component, so it gets tested more
1711  case 31: {
1712  *component_type = "BatchNormComponent";
1713  int32 block_dim = RandInt(1, 20), dim = block_dim * RandInt(1, 2);
1714  bool test_mode = (RandInt(0, 1) == 0);
1715  os << " dim=" << dim
1716  << " block-dim=" << block_dim << " target-rms="
1717  << RandInt(1, 4) << " test-mode="
1718  << (test_mode ? "true" : "false")
1719  << " epsilon=" << (RandInt(0, 1) == 0 ? "0.1" : "1.0");
1720  break;
1721  }
1722  case 32: {
1723  *component_type = "SumBlockComponent";
1724  BaseFloat scale = 0.5 * RandInt(1, 3);
1725  BaseFloat output_dim = RandInt(1, 10),
1726  input_dim = output_dim * RandInt(1, 3);
1727  os << "input-dim=" << input_dim
1728  << " output-dim=" << output_dim
1729  << " scale=" << scale;
1730  break;
1731  }
1732  case 33: {
1733  *component_type = "ScaleAndOffsetComponent";
1734  int32 block_dim = RandInt(10, 20),
1735  num_blocks = RandInt(1, 3),
1736  dim = block_dim * num_blocks;
1737  os << "dim=" << dim << " block-dim=" << block_dim
1738  << " use-natural-gradient="
1739  << (RandInt(0,1) == 0 ? "true" : "false");
1740  break;
1741  }
1742  case 34: {
1743  *component_type = "LinearComponent";
1744  int32 input_dim = RandInt(1, 50), output_dim = RandInt(1, 50);
1745  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1746  << " learning-rate=" << learning_rate;
1747  break;
1748  }
1749  case 35: {
1750  // This is not technically a SimpleComponent, but it behaves as one
1751  // if time-offsets=0.
1752  *component_type = "TdnnComponent";
1753  int32 input_dim = RandInt(1, 50), output_dim = RandInt(1, 50);
1754  os << "input-dim=" << input_dim << " output-dim=" << output_dim
1755  << " learning-rate=" << learning_rate << " time-offsets=0"
1756  << " use-natural-gradient=" << (RandInt(0,1) == 0 ? "true":"false")
1757  << " use-bias=" << (RandInt(0,1) == 0 ? "true":"false");
1758  break;
1759  }
1760  case 36: {
1761  *component_type = "GruNonlinearityComponent";
1762  int32 cell_dim = RandInt(10, 20);
1763  int32 recurrent_dim = (RandInt(0, 1) == 0 ?
1764  RandInt(5, cell_dim - 1) : cell_dim);
1765  os << "cell-dim=" << cell_dim
1766  << " recurrent-dim=" << recurrent_dim;
1767  break;
1768  }
1769  case 37: {
1770  *component_type = "OutputGruNonlinearityComponent";
1771  os << "cell-dim=" << RandInt(10, 20)
1772  << " learning-rate=" << learning_rate;
1773 
1774  break;
1775  }
1776  default:
1777  KALDI_ERR << "Error generating random component";
1778  }
1779  *config = os.str();
1780 }
1781 
1784  std::string component_type, config;
1785  GenerateRandomComponentConfig(&component_type, &config);
1786  ConfigLine config_line;
1787  if (!config_line.ParseLine(config))
1788  KALDI_ERR << "Bad config line " << config;
1789 
1790  Component *c = Component::NewComponentOfType(component_type);
1791  if (c == NULL)
1792  KALDI_ERR << "Invalid component type " << component_type;
1793  c->InitFromConfig(&config_line);
1794  if (config_line.HasUnusedValues()) {
1795  KALDI_ERR << "Config line " << config_line.WholeLine()
1796  << " has unused values: "
1797  << config_line.UnusedValues();
1798  }
1799  return c;
1800 }
1801 
1803  const Nnet &nnet2,
1804  BaseFloat threshold = 1.0e-05) {
1805  KALDI_ASSERT(nnet1.NumComponents() == nnet2.NumComponents());
1806  int32 num_components = nnet1.NumComponents();
1807  for (int32 c = 0; c < num_components; c++) {
1808  const Component *c1 = nnet1.GetComponent(c),
1809  *c2 = nnet2.GetComponent(c);
1810  KALDI_ASSERT(c1->Type() == c2->Type());
1811  if (c1->Properties() & kUpdatableComponent) {
1812  const UpdatableComponent *u1 = dynamic_cast<const UpdatableComponent*>(c1),
1813  *u2 = dynamic_cast<const UpdatableComponent*>(c2);
1814  KALDI_ASSERT(u1 != NULL && u2 != NULL);
1815  BaseFloat prod11 = u1->DotProduct(*u1), prod12 = u1->DotProduct(*u2),
1816  prod21 = u2->DotProduct(*u1), prod22 = u2->DotProduct(*u2);
1817  BaseFloat max_prod = std::max(std::max(prod11, prod12),
1818  std::max(prod21, prod22)),
1819  min_prod = std::min(std::min(prod11, prod12),
1820  std::min(prod21, prod22));
1821  if (max_prod - min_prod > threshold * max_prod) {
1822  KALDI_WARN << "Component '" << nnet1.GetComponentName(c)
1823  << "' differs in nnet1 versus nnet2: prod(11,12,21,22) = "
1824  << prod11 << ',' << prod12 << ',' << prod21 << ',' << prod22;
1825  return false;
1826  }
1827  }
1828  }
1829  return true;
1830 }
1831 
1833  int32 num_supervised_frames,
1834  int32 left_context,
1835  int32 right_context,
1836  int32 output_dim,
1837  int32 input_dim,
1838  int32 ivector_dim,
1839  NnetExample *example) {
1840  KALDI_ASSERT(num_supervised_frames > 0 && left_context >= 0 &&
1841  right_context >= 0 && output_dim > 0 && input_dim > 0
1842  && example != NULL);
1843  example->io.clear();
1844 
1845  int32 feature_t_begin = RandInt(0, 2);
1846  int32 num_feat_frames = left_context + right_context + num_supervised_frames;
1847  Matrix<BaseFloat> input_mat(num_feat_frames, input_dim);
1848  input_mat.SetRandn();
1849  NnetIo input_feat("input", feature_t_begin, input_mat);
1850  if (RandInt(0, 1) == 0)
1851  input_feat.features.Compress();
1852  example->io.push_back(input_feat);
1853 
1854  if (ivector_dim > 0) {
1855  // Create a feature for the iVectors. iVectors always have t=0 in the
1856  // current framework.
1857  Matrix<BaseFloat> ivector_mat(1, ivector_dim);
1858  ivector_mat.SetRandn();
1859  NnetIo ivector_feat("ivector", 0, ivector_mat);
1860  if (RandInt(0, 1) == 0)
1861  ivector_feat.features.Compress();
1862  example->io.push_back(ivector_feat);
1863  }
1864 
1865  { // set up the output supervision.
1866  Posterior labels(num_supervised_frames);
1867  for (int32 t = 0; t < num_supervised_frames; t++) {
1868  int32 num_labels = RandInt(1, 3);
1869  BaseFloat remaining_prob_mass = 1.0;
1870  for (int32 i = 0; i < num_labels; i++) {
1871  BaseFloat this_prob = (i+1 == num_labels ? 1.0 : RandUniform()) *
1872  remaining_prob_mass;
1873  remaining_prob_mass -= this_prob;
1874  labels[t].push_back(std::pair<int32, BaseFloat>(RandInt(0, output_dim-1),
1875  this_prob));
1876  }
1877  }
1878  int32 supervision_t_begin = feature_t_begin + left_context;
1879  NnetIo output_sup("output", output_dim, supervision_t_begin,
1880  labels);
1881  example->io.push_back(output_sup);
1882  }
1883 }
1884 
1886  const NnetExample &eg2,
1887  BaseFloat delta) {
1888  if (eg1.io.size() != eg2.io.size())
1889  return false;
1890  for (size_t i = 0; i < eg1.io.size(); i++) {
1891  NnetIo io1 = eg1.io[i], io2 = eg2.io[i];
1892  if (io1.name != io2.name || io1.indexes != io2.indexes)
1893  return false;
1894  Matrix<BaseFloat> feat1, feat2;
1895  io1.features.GetMatrix(&feat1);
1896  io2.features.GetMatrix(&feat2);
1897  if (!ApproxEqual(feat1, feat2, delta))
1898  return false;
1899  }
1900  return true;
1901 }
1902 
1903 
1904 } // namespace nnet3
1905 } // namespace kaldi
NnetExample is the input data and corresponding label (or labels) for one or more frames of input...
Definition: nnet-example.h:111
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
Definition: chain.dox:20
int32 InputDim(const std::string &input_name) const
Definition: nnet-nnet.cc:669
void GenerateSimpleNnetTrainingExample(int32 num_supervised_frames, int32 left_context, int32 right_context, int32 output_dim, int32 input_dim, int32 ivector_dim, NnetExample *example)
Low-level function that generates an nnet training example.
const std::string WholeLine()
Definition: text-utils.h:230
bool ParseLine(const std::string &line)
Definition: text-utils.cc:343
bool store_component_stats
you should set need_component_stats to true if you need the average-activation and average-derivative...
void GenerateConfigSequenceLstm(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
float RandUniform(struct RandomState *state=NULL)
Returns a random number strictly between 0 and 1.
Definition: kaldi-math.h:151
bool NnetParametersAreIdentical(const Nnet &nnet1, const Nnet &nnet2, BaseFloat threshold=1.0e-05)
Used for testing that the updatable parameters in two networks are the same.
bool need_model_derivative
if need_model_derivative is true, then we'll be doing either model training or model-derivative compu...
void GetMatrix(Matrix< BaseFloat > *mat) const
Outputs the contents as a matrix.
Abstract base-class for neural-net components.
void GenerateConfigSequenceRnnClockwork(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
void GenerateConfigSequenceLstmType2(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
This file contains various routines that are useful in test code.
void GenerateConfigSequenceLstmWithTruncation(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
void GenerateConfigSequenceSimpleContext(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
kaldi::int32 int32
GeneralMatrix features
The features or labels.
Definition: nnet-example.h:46
std::vector< IoSpecification > inputs
std::vector< Index > indexes
"indexes" is a vector the same length as features.NumRows(), explaining the meaning of each row of th...
Definition: nnet-example.h:42
static void GenerateRandomComponentConfig(std::string *component_type, std::string *config)
struct Index is intended to represent the various indexes by which we number the rows of the matrices...
Definition: nnet-common.h:44
This file contains some miscellaneous functions dealing with class Nnet.
void GenerateConfigSequenceDistribute(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
std::string UnusedValues() const
returns e.g.
Definition: text-utils.cc:518
void ComputeExampleComputationRequestSimple(const Nnet &nnet, ComputationRequest *request, std::vector< Matrix< BaseFloat > > *inputs)
This function computes an example computation request, for testing purposes.
float BaseFloat
Definition: kaldi-types.h:29
std::vector< std::vector< std::pair< int32, BaseFloat > > > Posterior
Posterior is a typedef for storing acoustic-state (actually, transition-id) posteriors over an uttera...
Definition: posterior.h:42
void GenerateConfigSequenceRnn(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
void ComputeSimpleNnetContext(const Nnet &nnet, int32 *left_context, int32 *right_context)
ComputeSimpleNnetContext computes the left-context and right-context of a nnet.
Definition: nnet-utils.cc:146
virtual BaseFloat DotProduct(const UpdatableComponent &other) const =0
Computes dot-product between parameters of two instances of a Component.
virtual int32 Properties() const =0
Return bitmask of the component's properties.
struct rnnlm::@11::@12 n
void GenerateConfigSequenceCnn(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
void GenerateConfigSequenceCnnNew(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
void SetRandn()
Sets to random values of a normal distribution.
#define KALDI_ERR
Definition: kaldi-error.h:147
bool ExampleApproxEqual(const NnetExample &eg1, const NnetExample &eg2, BaseFloat delta)
Returns true if the examples are approximately equal (only intended to be used in testing)...
#define KALDI_WARN
Definition: kaldi-error.h:150
void GenerateConfigSequenceStatistics(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
const std::string & GetComponentName(int32 component_index) const
returns individual component name.
Definition: nnet-nnet.cc:689
int Rand(struct RandomState *state)
Definition: kaldi-math.cc:45
Component * GetComponent(int32 c)
Return component indexed c. Not a copy; not owned by caller.
Definition: nnet-nnet.cc:150
Class UpdatableComponent is a Component which has trainable parameters; it extends the interface of C...
void GenerateConfigSequenceSimplest(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
virtual std::string Type() const =0
Returns a string such as "SigmoidComponent", describing the type of the object.
void GenerateConfigSequenceRestrictedAttention(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
bool IsSimpleNnet(const Nnet &nnet)
This function returns true if the nnet has the following properties: It has an output called "output"...
Definition: nnet-utils.cc:52
int32 NumComponents() const
Definition: nnet-nnet.h:124
This class is responsible for parsing input like hi-there xx=yyy a=b c empty= f-oo=Append(bar, sss) ba_z=123 bing='a b c' baz="a b c d='a b' e" and giving you access to the fields, in this case.
Definition: text-utils.h:205
#define KALDI_ASSERT(cond)
Definition: kaldi-error.h:185
std::vector< IoSpecification > outputs
bool HasUnusedValues() const
Definition: text-utils.cc:510
std::string name
the name of the input in the neural net; in simple setups it will just be "input".
Definition: nnet-example.h:36
void GenerateConfigSequenceSimple(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
void GenerateConfigSequence(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
Generates a sequence of at least one config files, output as strings, where the first in the sequence...
std::vector< NnetIo > io
"io" contains the input and output.
Definition: nnet-example.h:116
static Component * NewComponentOfType(const std::string &type)
Returns a new Component of the given type e.g.
static bool ApproxEqual(float a, float b, float relative_tolerance=0.001)
return abs(a - b) <= relative_tolerance * (abs(a)+abs(b)).
Definition: kaldi-math.h:265
void GenerateConfigSequenceCompositeBlock(const NnetGenerationOptions &opts, std::vector< std::string > *configs)
Generate a config string with a composite component composed only of block affine, repeated affine, and natural gradient repeated affine components.
virtual void InitFromConfig(ConfigLine *cfl)=0
Initialize, from a ConfigLine object.
int32 RandInt(int32 min_val, int32 max_val, struct RandomState *state)
Definition: kaldi-math.cc:95
Component * GenerateRandomSimpleComponent()
Generates random simple component for testing.