#include <nnet-simple-component.h>
Public Member Functions | |
virtual std::string | Type () const |
Returns a string such as "SigmoidComponent", describing the type of the object. More... | |
virtual void | Read (std::istream &is, bool binary) |
Read function (used after we know the type of the Component); accepts input that is missing the token that describes the component type, in case it has already been consumed. More... | |
virtual void | Write (std::ostream &os, bool binary) const |
Write component to stream. More... | |
NaturalGradientAffineComponent () | |
void | InitFromConfig (ConfigLine *cfl) |
Initialize, from a ConfigLine object. More... | |
virtual std::string | Info () const |
Returns some text-form information about this component, for diagnostics. More... | |
virtual Component * | Copy () const |
Copies component (deep copy). More... | |
virtual void | Scale (BaseFloat scale) |
This virtual function, when called on an UpdatableComponent, scales the parameters by "scale". More... | |
virtual void | Add (BaseFloat alpha, const Component &other) |
This virtual function, when called on an UpdatableComponent, adds the parameters of another updatable component, times some constant, to the current parameters. More... | |
virtual void | FreezeNaturalGradient (bool freeze) |
freezes/unfreezes NaturalGradient updates, if applicable (to be overridden by components that use Natural Gradient). More... | |
virtual void | ConsolidateMemory () |
This virtual function relates to memory management, and avoiding fragmentation. More... | |
NaturalGradientAffineComponent (const NaturalGradientAffineComponent &other) | |
NaturalGradientAffineComponent (const CuMatrixBase< BaseFloat > &linear_params, const CuVectorBase< BaseFloat > &bias_params) | |
Public Member Functions inherited from AffineComponent | |
virtual int32 | InputDim () const |
Returns input-dimension of this component. More... | |
virtual int32 | OutputDim () const |
Returns output-dimension of this component. More... | |
BaseFloat | OrthonormalConstraint () const |
AffineComponent () | |
virtual int32 | Properties () const |
Return bitmask of the component's properties. More... | |
virtual void * | Propagate (const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in, CuMatrixBase< BaseFloat > *out) const |
Propagate function. More... | |
virtual void | Backprop (const std::string &debug_info, const ComponentPrecomputedIndexes *indexes, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &, const CuMatrixBase< BaseFloat > &out_deriv, void *memo, Component *to_update, CuMatrixBase< BaseFloat > *in_deriv) const |
Backprop function; depending on which of the arguments 'to_update' and 'in_deriv' are non-NULL, this can compute input-data derivatives and/or perform model update. More... | |
virtual void | PerturbParams (BaseFloat stddev) |
This function is to be used in testing. More... | |
virtual BaseFloat | DotProduct (const UpdatableComponent &other) const |
Computes dot-product between parameters of two instances of a Component. More... | |
virtual int32 | NumParameters () const |
The following new virtual function returns the total dimension of the parameters in this class. More... | |
virtual void | Vectorize (VectorBase< BaseFloat > *params) const |
Turns the parameters into vector form. More... | |
virtual void | UnVectorize (const VectorBase< BaseFloat > &params) |
Converts the parameters from vector form. More... | |
virtual void | SetParams (const CuVectorBase< BaseFloat > &bias, const CuMatrixBase< BaseFloat > &linear) |
const CuVector< BaseFloat > & | BiasParams () const |
CuVector< BaseFloat > & | BiasParams () |
const CuMatrix< BaseFloat > & | LinearParams () const |
CuMatrix< BaseFloat > & | LinearParams () |
AffineComponent (const AffineComponent &other) | |
AffineComponent (const CuMatrixBase< BaseFloat > &linear_params, const CuVectorBase< BaseFloat > &bias_params, BaseFloat learning_rate) | |
virtual void | Resize (int32 input_dim, int32 output_dim) |
void | Init (int32 input_dim, int32 output_dim, BaseFloat param_stddev, BaseFloat bias_stddev) |
Public Member Functions inherited from UpdatableComponent | |
UpdatableComponent (const UpdatableComponent &other) | |
UpdatableComponent () | |
virtual | ~UpdatableComponent () |
virtual void | SetUnderlyingLearningRate (BaseFloat lrate) |
Sets the learning rate of gradient descent; gets multiplied by learning_rate_factor_. More... | |
virtual void | SetActualLearningRate (BaseFloat lrate) |
Sets the learning rate directly, bypassing learning_rate_factor_. More... | |
virtual void | SetAsGradient () |
Sets is_gradient_ to true and sets learning_rate_ to 1, ignoring learning_rate_factor_. More... | |
virtual BaseFloat | LearningRateFactor () |
virtual void | SetLearningRateFactor (BaseFloat lrate_factor) |
void | SetUpdatableConfigs (const UpdatableComponent &other) |
BaseFloat | LearningRate () const |
Gets the learning rate to be used in gradient descent. More... | |
BaseFloat | MaxChange () const |
Returns the per-component max-change value, which is interpreted as the maximum change (in l2 norm) in parameters that is allowed per minibatch for this component. More... | |
void | SetMaxChange (BaseFloat max_change) |
BaseFloat | L2Regularization () const |
Returns the l2 regularization constant, which may be set in any updatable component (usually from the config file). More... | |
void | SetL2Regularization (BaseFloat a) |
Public Member Functions inherited from Component | |
virtual void | StoreStats (const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_value, void *memo) |
This function may store stats on average activation values, and for some component types, the average value of the derivative of the nonlinearity. More... | |
virtual void | ZeroStats () |
Components that provide an implementation of StoreStats should also provide an implementation of ZeroStats(), to set those stats to zero. More... | |
virtual void | GetInputIndexes (const MiscComputationInfo &misc_info, const Index &output_index, std::vector< Index > *desired_indexes) const |
This function only does something interesting for non-simple Components. More... | |
virtual bool | IsComputable (const MiscComputationInfo &misc_info, const Index &output_index, const IndexSet &input_index_set, std::vector< Index > *used_inputs) const |
This function only does something interesting for non-simple Components, and it exists to make it possible to manage optionally-required inputs. More... | |
virtual void | ReorderIndexes (std::vector< Index > *input_indexes, std::vector< Index > *output_indexes) const |
This function only does something interesting for non-simple Components. More... | |
virtual ComponentPrecomputedIndexes * | PrecomputeIndexes (const MiscComputationInfo &misc_info, const std::vector< Index > &input_indexes, const std::vector< Index > &output_indexes, bool need_backprop) const |
This function must return NULL for simple Components. More... | |
virtual void | DeleteMemo (void *memo) const |
This virtual function only needs to be overwritten by Components that return a non-NULL memo from their Propagate() function. More... | |
Component () | |
virtual | ~Component () |
Private Member Functions | |
NaturalGradientAffineComponent & | operator= (const NaturalGradientAffineComponent &) |
virtual void | Update (const std::string &debug_info, const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_deriv) |
Private Attributes | |
OnlineNaturalGradient | preconditioner_in_ |
OnlineNaturalGradient | preconditioner_out_ |
Additional Inherited Members | |
Static Public Member Functions inherited from Component | |
static Component * | ReadNew (std::istream &is, bool binary) |
Read component from stream (works out its type). Dies on error. More... | |
static Component * | NewComponentOfType (const std::string &type) |
Returns a new Component of the given type e.g. More... | |
Protected Member Functions inherited from AffineComponent | |
void | Init (std::string matrix_filename) |
virtual void | UpdateSimple (const CuMatrixBase< BaseFloat > &in_value, const CuMatrixBase< BaseFloat > &out_deriv) |
const AffineComponent & | operator= (const AffineComponent &other) |
Protected Member Functions inherited from UpdatableComponent | |
void | InitLearningRatesFromConfig (ConfigLine *cfl) |
std::string | ReadUpdatableCommon (std::istream &is, bool binary) |
void | WriteUpdatableCommon (std::ostream &is, bool binary) const |
Protected Attributes inherited from AffineComponent | |
CuMatrix< BaseFloat > | linear_params_ |
CuVector< BaseFloat > | bias_params_ |
BaseFloat | orthonormal_constraint_ |
Protected Attributes inherited from UpdatableComponent | |
BaseFloat | learning_rate_ |
learning rate (typically 0.0..0.01) More... | |
BaseFloat | learning_rate_factor_ |
learning rate factor (normally 1.0, but can be set to another value so that when you call SetLearningRate(), that value will be scaled by this factor). More... | |
BaseFloat | l2_regularize_ |
L2 regularization constant. More... | |
bool | is_gradient_ |
True if this component is to be treated as a gradient rather than as parameters. More... | |
BaseFloat | max_change_ |
configuration value for imposing max-change More... | |
Definition at line 825 of file nnet-simple-component.h.
|
inline |
Definition at line 831 of file nnet-simple-component.h.
References Component::Add(), Component::ConsolidateMemory(), PnormComponent::Copy(), kaldi::nnet3::FreezeNaturalGradient(), Component::Info(), PnormComponent::InitFromConfig(), and Component::Scale().
Referenced by NaturalGradientAffineComponent::Copy().
|
explicit |
Definition at line 2987 of file nnet-simple-component.cc.
NaturalGradientAffineComponent | ( | const CuMatrixBase< BaseFloat > & | linear_params, |
const CuVectorBase< BaseFloat > & | bias_params | ||
) |
Definition at line 2853 of file nnet-simple-component.cc.
References CuVectorBase< Real >::Dim(), KALDI_ASSERT, CuMatrixBase< Real >::NumRows(), NaturalGradientAffineComponent::preconditioner_in_, NaturalGradientAffineComponent::preconditioner_out_, OnlineNaturalGradient::SetRank(), and OnlineNaturalGradient::SetUpdatePeriod().
This virtual function, when called on: – an UpdatableComponent, adds the parameters of another updatable component, times some constant, to the current parameters;
– a NonlinearComponent (or another component that stores stats, like BatchNormComponent), relates to adding stats. Otherwise it will normally do nothing.
Reimplemented from AffineComponent.
Definition at line 3049 of file nnet-simple-component.cc.
References AffineComponent::bias_params_, KALDI_ASSERT, and AffineComponent::linear_params_.
|
virtual |
This virtual function relates to memory management, and avoiding fragmentation.
It is called only once per model, after we do the first minibatch of training. The default implementation does nothing, but it can be overridden by child classes, where it may re-initialize certain quantities that may possibly have been allocated during the forward pass (e.g. certain statistics; OnlineNaturalGradient objects). We use our own CPU-based allocator (see cu-allocator.h) and, because it can't do paging (we're not in control of the GPU page table), fragmentation can be a problem. The allocator always tries to put things in 'low-address memory' (i.e. at smaller memory addresses) near the beginning of the block it allocated, to avoid fragmentation; but if permanent things (belonging to the model) are allocated in the forward pass, they can permanently stay in high memory. This function helps to prevent that, by re-allocating those things into low-address memory. (It's important that it's called after all the temporary buffers for the forward-backward have been freed, so that there is low-address memory available.)
Reimplemented from Component.
Definition at line 3062 of file nnet-simple-component.cc.
References NaturalGradientAffineComponent::preconditioner_in_, NaturalGradientAffineComponent::preconditioner_out_, and OnlineNaturalGradient::Swap().
|
virtual |
Copies component (deep copy).
Reimplemented from AffineComponent.
Definition at line 2983 of file nnet-simple-component.cc.
References NaturalGradientAffineComponent::NaturalGradientAffineComponent().
|
virtual |
freezes/unfreezes NaturalGradient updates, if applicable (to be overridden by components that use Natural Gradient).
Reimplemented from UpdatableComponent.
Definition at line 3057 of file nnet-simple-component.cc.
References OnlineNaturalGradient::Freeze(), NaturalGradientAffineComponent::preconditioner_in_, and NaturalGradientAffineComponent::preconditioner_out_.
|
virtual |
Returns some text-form information about this component, for diagnostics.
Starts with the type of the component. E.g. "SigmoidComponent dim=900", although most components will have much more info.
Reimplemented from AffineComponent.
Definition at line 2972 of file nnet-simple-component.cc.
References OnlineNaturalGradient::GetAlpha(), OnlineNaturalGradient::GetNumSamplesHistory(), OnlineNaturalGradient::GetRank(), OnlineNaturalGradient::GetUpdatePeriod(), AffineComponent::Info(), NaturalGradientAffineComponent::preconditioner_in_, and NaturalGradientAffineComponent::preconditioner_out_.
|
virtual |
Initialize, from a ConfigLine object.
[in] | cfl | A ConfigLine containing any parameters that are needed for initialization. For example: "dim=100 param-stddev=0.1" |
Reimplemented from AffineComponent.
Definition at line 2867 of file nnet-simple-component.cc.
References AffineComponent::bias_params_, ConfigLine::GetValue(), ConfigLine::HasUnusedValues(), UpdatableComponent::InitLearningRatesFromConfig(), AffineComponent::InputDim(), UpdatableComponent::is_gradient_, KALDI_ASSERT, KALDI_ERR, AffineComponent::linear_params_, CuMatrixBase< Real >::NumCols(), CuMatrixBase< Real >::NumRows(), AffineComponent::orthonormal_constraint_, AffineComponent::OutputDim(), NaturalGradientAffineComponent::preconditioner_in_, NaturalGradientAffineComponent::preconditioner_out_, CuMatrixBase< Real >::Range(), kaldi::ReadKaldiObject(), OnlineNaturalGradient::SetAlpha(), OnlineNaturalGradient::SetNumSamplesHistory(), OnlineNaturalGradient::SetRank(), OnlineNaturalGradient::SetUpdatePeriod(), ConfigLine::UnusedValues(), and ConfigLine::WholeLine().
|
private |
|
virtual |
Read function (used after we know the type of the Component); accepts input that is missing the token that describes the component type, in case it has already been consumed.
Reimplemented from AffineComponent.
Definition at line 2786 of file nnet-simple-component.cc.
References kaldi::nnet3::ExpectToken(), UpdatableComponent::is_gradient_, KALDI_ERR, kaldi::PeekToken(), kaldi::ReadBasicType(), kaldi::ReadToken(), and UpdatableComponent::ReadUpdatableCommon().
|
virtual |
This virtual function, when called on: – an UpdatableComponent, scales the parameters by "scale";
– a Nonlinear component (or another component that stores stats, like BatchNormComponent), relates to scaling activation stats, not parameters. Otherwise it will normally do nothing.
Reimplemented from AffineComponent.
Definition at line 3039 of file nnet-simple-component.cc.
References AffineComponent::bias_params_, and AffineComponent::linear_params_.
|
inlinevirtual |
Returns a string such as "SigmoidComponent", describing the type of the object.
Reimplemented from AffineComponent.
Definition at line 827 of file nnet-simple-component.h.
References PnormComponent::Read(), and PnormComponent::Write().
|
privatevirtual |
Reimplemented from AffineComponent.
Definition at line 2993 of file nnet-simple-component.cc.
References AffineComponent::bias_params_, CuVectorBase< Real >::CopyColFromMat(), kaldi::kNoTrans, kaldi::kTrans, kaldi::kUndefined, UpdatableComponent::learning_rate_, AffineComponent::linear_params_, CuMatrixBase< Real >::NumCols(), CuMatrixBase< Real >::NumRows(), OnlineNaturalGradient::PreconditionDirections(), NaturalGradientAffineComponent::preconditioner_in_, NaturalGradientAffineComponent::preconditioner_out_, CuMatrixBase< Real >::Range(), and CuMatrix< Real >::Resize().
|
virtual |
Write component to stream.
Reimplemented from AffineComponent.
Definition at line 2948 of file nnet-simple-component.cc.
References AffineComponent::bias_params_, OnlineNaturalGradient::GetAlpha(), OnlineNaturalGradient::GetNumSamplesHistory(), OnlineNaturalGradient::GetRank(), OnlineNaturalGradient::GetUpdatePeriod(), AffineComponent::linear_params_, AffineComponent::orthonormal_constraint_, NaturalGradientAffineComponent::preconditioner_in_, NaturalGradientAffineComponent::preconditioner_out_, kaldi::WriteBasicType(), kaldi::WriteToken(), and UpdatableComponent::WriteUpdatableCommon().
|
private |
Definition at line 852 of file nnet-simple-component.h.
Referenced by NaturalGradientAffineComponent::ConsolidateMemory(), NaturalGradientAffineComponent::FreezeNaturalGradient(), NaturalGradientAffineComponent::Info(), LinearComponent::Info(), NaturalGradientAffineComponent::InitFromConfig(), LinearComponent::InitFromConfig(), NaturalGradientAffineComponent::NaturalGradientAffineComponent(), LinearComponent::Read(), NaturalGradientAffineComponent::Update(), NaturalGradientAffineComponent::Write(), and LinearComponent::Write().
|
private |
Definition at line 854 of file nnet-simple-component.h.
Referenced by NaturalGradientAffineComponent::ConsolidateMemory(), NaturalGradientAffineComponent::FreezeNaturalGradient(), NaturalGradientAffineComponent::Info(), LinearComponent::Info(), NaturalGradientAffineComponent::InitFromConfig(), LinearComponent::InitFromConfig(), NaturalGradientAffineComponent::NaturalGradientAffineComponent(), LinearComponent::Read(), NaturalGradientAffineComponent::Update(), NaturalGradientAffineComponent::Write(), and LinearComponent::Write().