29 using namespace kaldi;
32 typedef kaldi::int64 int64;
35 "Does the neural net computation, taking as input the nnet-training examples\n" 36 "(typically an archive with the extension .egs), ignoring the labels; it\n" 37 "outputs as a matrix the result. Used mostly for debugging.\n" 39 "Usage: nnet-compute-from-egs [options] <raw-nnet-in> <egs-rspecifier> " 40 "<feature-wspecifier>\n" 41 "e.g.: nnet-compute-from-egs 'nnet-to-raw-nnet final.mdl -|' egs.10.1.ark ark:-\n";
47 if (po.NumArgs() != 3) {
52 std::string raw_nnet_rxfilename = po.GetArg(1),
53 examples_rspecifier = po.GetArg(2),
54 features_or_loglikes_wspecifier = po.GetArg(3);
67 for (; !example_reader.Done(); example_reader.Next()) {
71 spk_dim = eg.
spk_info.Dim(), dim = basic_dim + spk_dim;
73 input_block(context, dim);
74 input_block.Range(0, context, 0, basic_dim).CopyFromMat(
75 input_frames.Range(start_offset, context, 0, basic_dim));
77 input_block.Range(0, context, basic_dim, spk_dim).CopyRowsFromVec(
81 gpu_input_block.
Swap(&input_block);
84 bool pad_input =
false;
90 KALDI_LOG <<
"Processed " << num_egs <<
" examples.";
92 return (num_egs == 0 ? 1 : 0);
93 }
catch(
const std::exception &e) {
94 std::cerr << e.what() <<
'\n';
CompressedMatrix input_frames
The input data, with NumRows() >= labels.size() + left_context; it includes features to the left and ...
This code computes Goodness of Pronunciation (GOP) and extracts phone-level pronunciation feature for...
int32 LeftContext() const
Returns the left-context summed over all the Components...
NnetExample is the input data and corresponding label (or labels) for one or more frames of input...
int32 left_context
The number of frames of left context (we can work out the #frames of right context from input_frames...
int32 OutputDim() const
The output dimension of the network – typically the number of pdfs.
A templated class for writing objects to an archive or script file; see The Table concept...
This class represents a matrix that's stored on the GPU if we have one, and in memory if not...
void NnetComputation(const Nnet &nnet, const CuMatrixBase< BaseFloat > &input, bool pad_input, CuMatrixBase< BaseFloat > *output)
Does the basic neural net computation, on a sequence of data (e.g.
void ReadKaldiObject(const std::string &filename, Matrix< float > *m)
The class ParseOptions is for parsing command-line options; see Parsing command-line options for more...
void Swap(Matrix< Real > *mat)
int32 RightContext() const
Returns the right-context summed over all the Components...
A templated class for reading objects sequentially from an archive or script file; see The Table conc...
MatrixIndexT NumCols() const
Returns number of columns (or zero for emtpy matrix).
Vector< BaseFloat > spk_info
The speaker-specific input, if any, or an empty vector if we're not using this features.