// File:        fullyconnected.cpp
// Description: Simple feed-forward layer with various non-linearities.
// Author:      Ray Smith
// Created:     Wed Feb 26 14:49:15 PST 2014
//
// (C) Copyright 2014, Google Inc.
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "fullyconnected.h"

#ifdef _OPENMP
#include <omp.h>
#endif
#include <stdio.h>
#include <stdlib.h>

#include "functions.h"
#include "networkscratch.h"

// Number of threads to use for parallel calculation of Forward and Backward.
const int kNumThreads = 4;

namespace tesseract {

FullyConnected::FullyConnected(const STRING& name, int ni, int no,
                               NetworkType type)
    : Network(type, name, ni, no), external_source_(NULL), int_mode_(false) {
}

FullyConnected::~FullyConnected() {
}

// Returns the shape output from the network given an input shape (which may
// be partially unknown, i.e. zero).
StaticShape FullyConnected::OutputShape(const StaticShape& input_shape) const {
  LossType loss_type = LT_NONE;
  if (type_ == NT_SOFTMAX)
    loss_type = LT_CTC;
  else if (type_ == NT_SOFTMAX_NO_CTC)
    loss_type = LT_SOFTMAX;
  else if (type_ == NT_LOGISTIC)
    loss_type = LT_LOGISTIC;
  StaticShape result(input_shape);
  result.set_depth(no_);
  result.set_loss_type(loss_type);
  return result;
}
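
// Worked example (illustrative, not in the original file): an NT_SOFTMAX
// layer with no_ = 100 maps an input shape of [batch, height, width, depth]
// = [1, 1, W, ni] to [1, 1, W, 100] with loss type LT_CTC; only the depth
// and the loss type change, and the spatial dimensions pass through.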

// Suspends/Enables training by setting the training_ flag.
void FullyConnected::SetEnableTraining(TrainingState state) {
  if (state == TS_RE_ENABLE) {
    // Enable only from temp disabled.
    if (training_ == TS_TEMP_DISABLE) training_ = TS_ENABLED;
  } else if (state == TS_TEMP_DISABLE) {
    // Temp disable only from enabled.
    if (training_ == TS_ENABLED) training_ = state;
  } else {
    if (state == TS_ENABLED && training_ != TS_ENABLED)
      weights_.InitBackward(TestFlag(NF_ADA_GRAD));
    training_ = state;
  }
}

// Sets up the network for training. Initializes weights using weights of
// scale `range` picked according to the random number generator `randomizer`.
int FullyConnected::InitWeights(float range, TRand* randomizer) {
  Network::SetRandomizer(randomizer);
  num_weights_ = weights_.InitWeightsFloat(no_, ni_ + 1, TestFlag(NF_ADA_GRAD),
                                           range, randomizer);
  return num_weights_;
}
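
// Note the ni_ + 1 above: the weight matrix carries one extra input column
// holding the bias, so each forward step effectively computes W * [x; 1].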

// Converts a float network to an int network.
void FullyConnected::ConvertToInt() {
  weights_.ConvertToInt();
}

// Provides debug output on the weights.
void FullyConnected::DebugWeights() {
  weights_.Debug2D(name_.string());
}

// Writes to the given file. Returns false in case of error.
bool FullyConnected::Serialize(TFile* fp) const {
  if (!Network::Serialize(fp)) return false;
  if (!weights_.Serialize(IsTraining(), fp)) return false;
  return true;
}

// Reads from the given file. Returns false in case of error.
bool FullyConnected::DeSerialize(TFile* fp) {
  return weights_.DeSerialize(IsTraining(), fp);
}

// Runs forward propagation of activations on the input line.
// See NetworkCpp for a detailed discussion of the arguments.
void FullyConnected::Forward(bool debug, const NetworkIO& input,
                             const TransposedArray* input_transpose,
                             NetworkScratch* scratch, NetworkIO* output) {
  int width = input.Width();
  if (type_ == NT_SOFTMAX)
    output->ResizeFloat(input, no_);
  else
    output->Resize(input, no_);
  SetupForward(input, input_transpose);
  GenericVector<NetworkScratch::FloatVec> temp_lines;
  temp_lines.init_to_size(kNumThreads, NetworkScratch::FloatVec());
  GenericVector<NetworkScratch::FloatVec> curr_input;
  curr_input.init_to_size(kNumThreads, NetworkScratch::FloatVec());
  for (int i = 0; i < temp_lines.size(); ++i) {
    temp_lines[i].Init(no_, scratch);
    curr_input[i].Init(ni_, scratch);
  }
#ifdef _OPENMP
#pragma omp parallel for num_threads(kNumThreads)
  for (int t = 0; t < width; ++t) {
    // Thread-local pointer to temporary storage.
    int thread_id = omp_get_thread_num();
#else
  for (int t = 0; t < width; ++t) {
    // Thread-local pointer to temporary storage.
    int thread_id = 0;
#endif
    double* temp_line = temp_lines[thread_id];
    const double* d_input = NULL;
    const inT8* i_input = NULL;
    if (input.int_mode()) {
      i_input = input.i(t);
    } else {
      input.ReadTimeStep(t, curr_input[thread_id]);
      d_input = curr_input[thread_id];
    }
    ForwardTimeStep(d_input, i_input, t, temp_line);
    output->WriteTimeStep(t, temp_line);
    if (IsTraining() && type_ != NT_SOFTMAX) {
      acts_.CopyTimeStepFrom(t, *output, t);
    }
  }
  // Zero all the elements that are in the padding around images that allows
  // multiple different-sized images to exist in a single array.
  // acts_ is only used if this is not a softmax op.
  if (IsTraining() && type_ != NT_SOFTMAX) {
    acts_.ZeroInvalidElements();
  }
  output->ZeroInvalidElements();
#if DEBUG_DETAIL > 0
  tprintf("F Output:%s\n", name_.string());
  output->Print(10);
#endif
  if (debug) DisplayForward(*output);
}
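
// Parallelization note: timesteps are independent in a fully-connected
// layer, so the loop over t above is split across kNumThreads OpenMP threads
// when available, each thread writing through its own scratch vectors
// (temp_lines/curr_input); without OpenMP the same body runs serially with
// thread_id fixed at 0.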

// Components of Forward so FullyConnected can be reused inside LSTM.
void FullyConnected::SetupForward(const NetworkIO& input,
                                  const TransposedArray* input_transpose) {
  // Softmax output is always float, so save the input type.
  int_mode_ = input.int_mode();
  if (IsTraining()) {
    acts_.Resize(input, no_);
    // Source_ is a transposed copy of input. It isn't needed if provided.
    external_source_ = input_transpose;
    if (external_source_ == NULL) source_t_.ResizeNoInit(ni_, input.Width());
  }
}
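
// Keeping a transposed copy of the input (or borrowing the caller's via
// external_source_) lets FinishBackward form the weight gradient as a single
// outer product over all timesteps instead of re-transposing every pass.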

void FullyConnected::ForwardTimeStep(const double* d_input, const inT8* i_input,
                                     int t, double* output_line) {
  // input is copied to source_ line-by-line for cache coherency.
  if (IsTraining() && external_source_ == NULL && d_input != NULL)
    source_t_.WriteStrided(t, d_input);
  if (d_input != NULL)
    weights_.MatrixDotVector(d_input, output_line);
  else
    weights_.MatrixDotVector(i_input, output_line);
  if (type_ == NT_TANH) {
    FuncInplace<GFunc>(no_, output_line);
  } else if (type_ == NT_LOGISTIC) {
    FuncInplace<FFunc>(no_, output_line);
  } else if (type_ == NT_POSCLIP) {
    FuncInplace<ClipFFunc>(no_, output_line);
  } else if (type_ == NT_SYMCLIP) {
    FuncInplace<ClipGFunc>(no_, output_line);
  } else if (type_ == NT_RELU) {
    FuncInplace<Relu>(no_, output_line);
  } else if (type_ == NT_SOFTMAX || type_ == NT_SOFTMAX_NO_CTC) {
    SoftmaxInPlace(no_, output_line);
  } else if (type_ != NT_LINEAR) {
    ASSERT_HOST("Invalid fully-connected type!" == NULL);
  }
}
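
// In equations, for input x of length ni_ at one timestep this computes
//   a = W * [x; 1]   (MatrixDotVector, bias folded into the last column)
//   y = f(a)         (f selected by type_: tanh, logistic, clip, relu, ...)
// with the softmax types instead producing y_i = exp(a_i) / sum_j exp(a_j).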

// Runs backward propagation of errors on the deltas line.
// See NetworkCpp for a detailed discussion of the arguments.
bool FullyConnected::Backward(bool debug, const NetworkIO& fwd_deltas,
                              NetworkScratch* scratch,
                              NetworkIO* back_deltas) {
  if (debug) DisplayBackward(fwd_deltas);
  back_deltas->Resize(fwd_deltas, ni_);
  GenericVector<NetworkScratch::FloatVec> errors;
  errors.init_to_size(kNumThreads, NetworkScratch::FloatVec());
  for (int i = 0; i < errors.size(); ++i) errors[i].Init(no_, scratch);
  GenericVector<NetworkScratch::FloatVec> temp_backprops;
  if (needs_to_backprop_) {
    temp_backprops.init_to_size(kNumThreads, NetworkScratch::FloatVec());
    for (int i = 0; i < kNumThreads; ++i) temp_backprops[i].Init(ni_, scratch);
  }
  int width = fwd_deltas.Width();
  NetworkScratch::GradientStore errors_t;
  errors_t.Init(no_, width, scratch);
#ifdef _OPENMP
#pragma omp parallel for num_threads(kNumThreads)
  for (int t = 0; t < width; ++t) {
    int thread_id = omp_get_thread_num();
#else
  for (int t = 0; t < width; ++t) {
    int thread_id = 0;
#endif
    double* backprop = NULL;
    if (needs_to_backprop_) backprop = temp_backprops[thread_id];
    double* curr_errors = errors[thread_id];
    BackwardTimeStep(fwd_deltas, t, curr_errors, errors_t.get(), backprop);
    if (backprop != NULL) {
      back_deltas->WriteTimeStep(t, backprop);
    }
  }
  FinishBackward(*errors_t.get());
  if (needs_to_backprop_) {
    back_deltas->ZeroInvalidElements();
    back_deltas->CopyWithNormalization(*back_deltas, fwd_deltas);
#if DEBUG_DETAIL > 0
    tprintf("F Backprop:%s\n", name_.string());
    back_deltas->Print(10);
#endif
    return true;
  }
  return false;  // No point going further back.
}

void FullyConnected::BackwardTimeStep(const NetworkIO& fwd_deltas, int t,
                                      double* curr_errors,
                                      TransposedArray* errors_t,
                                      double* backprop) {
  if (type_ == NT_TANH)
    acts_.FuncMultiply<GPrime>(fwd_deltas, t, curr_errors);
  else if (type_ == NT_LOGISTIC)
    acts_.FuncMultiply<FPrime>(fwd_deltas, t, curr_errors);
  else if (type_ == NT_POSCLIP)
    acts_.FuncMultiply<ClipFPrime>(fwd_deltas, t, curr_errors);
  else if (type_ == NT_SYMCLIP)
    acts_.FuncMultiply<ClipGPrime>(fwd_deltas, t, curr_errors);
  else if (type_ == NT_RELU)
    acts_.FuncMultiply<ReluPrime>(fwd_deltas, t, curr_errors);
  else if (type_ == NT_SOFTMAX || type_ == NT_SOFTMAX_NO_CTC ||
           type_ == NT_LINEAR)
    fwd_deltas.ReadTimeStep(t, curr_errors);  // fwd_deltas are the errors.
  else
    ASSERT_HOST("Invalid fully-connected type!" == NULL);
  // Generate backprop only if needed by the lower layer.
  if (backprop != NULL) weights_.VectorDotMatrix(curr_errors, backprop);
  errors_t->WriteStrided(t, curr_errors);
}
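
// In equations, with incoming deltas d at timestep t and saved activations
// y = acts_:
//   e = f'(y) .* d      (elementwise; softmax/linear types take d directly)
//   backprop = W^T * e  (VectorDotMatrix; the bias column has no input line
//                        to receive a delta)
// e is also written transposed into errors_t for the weight gradient.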

void FullyConnected::FinishBackward(const TransposedArray& errors_t) {
  if (external_source_ == NULL)
    weights_.SumOuterTransposed(errors_t, source_t_, true);
  else
    weights_.SumOuterTransposed(errors_t, *external_source_, true);
}
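
// The weight gradient accumulated here is dW = sum over t of
// e_t * [x_t; 1]^T, formed in one SumOuterTransposed call over the
// transposed stores; the trailing `true` requests the parallel path.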

// Updates the weights using the given learning rate and momentum.
// num_samples is the quotient to be used in the adagrad computation iff
// use_ada_grad_ is true.
void FullyConnected::Update(float learning_rate, float momentum,
                            int num_samples) {
  weights_.Update(learning_rate, momentum, num_samples);
}

// Sums the products of weight updates in *this and other, splitting into
// positive (same direction) in *same and negative (different direction) in
// *changed.
void FullyConnected::CountAlternators(const Network& other, double* same,
                                      double* changed) const {
  ASSERT_HOST(other.type() == type_);
  const FullyConnected* fc = static_cast<const FullyConnected*>(&other);
  weights_.CountAlternators(fc->weights_, same, changed);
}

}  // namespace tesseract.
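
// Illustrative usage sketch (an assumption-laden outline, not part of the
// original file). The FullyConnected calls match the signatures above; the
// TRand/NetworkIO setup is plausible but unverified for this revision:
//
//   FullyConnected fc("fc1", /*ni=*/32, /*no=*/100, NT_SOFTMAX);
//   TRand randomizer;
//   randomizer.set_seed(42);
//   fc.InitWeights(0.1f, &randomizer);  // weights drawn with scale 0.1.
//   NetworkScratch scratch;
//   NetworkIO input, output;
//   input.Resize2d(false, /*width=*/20, /*num_features=*/32);
//   fc.Forward(/*debug=*/false, input, NULL, &scratch, &output);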