All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
neural_net.cpp
Go to the documentation of this file.
1 // Copyright 2008 Google Inc.
2 // All Rights Reserved.
3 // Author: ahmadab@google.com (Ahmad Abdulkader)
4 //
5 // neural_net.cpp: Declarations of a class for an object that
6 // represents an arbitrary network of neurons
7 //
8 #include <vector>
9 #include <string>
10 #include "neural_net.h"
11 #include "input_file_buffer.h"
12 
13 namespace tesseract {
14 
16  Init();
17 }
18 
20  // clean up the wts chunks vector
21  for (int vec = 0; vec < static_cast<int>(wts_vec_.size()); vec++) {
22  delete wts_vec_[vec];
23  }
24  // clean up neurons
25  delete []neurons_;
26  // clean up nodes
27  for (int node_idx = 0; node_idx < neuron_cnt_; node_idx++) {
28  delete []fast_nodes_[node_idx].inputs;
29  }
30 
31 }
32 
33 // Initialization function
35  read_only_ = true;
36  auto_encoder_ = false;
37  alloc_wgt_cnt_ = 0;
38  wts_cnt_ = 0;
39  neuron_cnt_ = 0;
40  in_cnt_ = 0;
41  out_cnt_ = 0;
42  wts_vec_.clear();
43  neurons_ = NULL;
44  inputs_mean_.clear();
45  inputs_std_dev_.clear();
46  inputs_min_.clear();
47  inputs_max_.clear();
48 }
49 
50 // Does a fast feedforward for read_only nets
51 // Templatized for float and double Types
52 template <typename Type> bool NeuralNet::FastFeedForward(const Type *inputs,
53  Type *outputs) {
54  int node_idx = 0;
55  Node *node = &fast_nodes_[0];
56  // feed inputs in and offset them by the pre-computed bias
57  for (node_idx = 0; node_idx < in_cnt_; node_idx++, node++) {
58  node->out = inputs[node_idx] - node->bias;
59  }
60  // compute nodes activations and outputs
61  for (;node_idx < neuron_cnt_; node_idx++, node++) {
62  double activation = -node->bias;
63  for (int fan_in_idx = 0; fan_in_idx < node->fan_in_cnt; fan_in_idx++) {
64  activation += (node->inputs[fan_in_idx].input_weight *
65  node->inputs[fan_in_idx].input_node->out);
66  }
67  node->out = Neuron::Sigmoid(activation);
68  }
69  // copy the outputs to the output buffers
70  node = &fast_nodes_[neuron_cnt_ - out_cnt_];
71  for (node_idx = 0; node_idx < out_cnt_; node_idx++, node++) {
72  outputs[node_idx] = node->out;
73  }
74  return true;
75 }
76 
77 // Performs a feedforward for general nets. Used mainly in training mode
78 // Templatized for float and double Types
79 template <typename Type> bool NeuralNet::FeedForward(const Type *inputs,
80  Type *outputs) {
81  // call the fast version in case of readonly nets
82  if (read_only_) {
83  return FastFeedForward(inputs, outputs);
84  }
85  // clear all neurons
86  Clear();
87  // for auto encoders, apply no input normalization
88  if (auto_encoder_) {
89  for (int in = 0; in < in_cnt_; in++) {
90  neurons_[in].set_output(inputs[in]);
91  }
92  } else {
93  // Input normalization : subtract mean and divide by stddev
94  for (int in = 0; in < in_cnt_; in++) {
95  neurons_[in].set_output((inputs[in] - inputs_min_[in]) /
96  (inputs_max_[in] - inputs_min_[in]));
97  neurons_[in].set_output((neurons_[in].output() - inputs_mean_[in]) /
98  inputs_std_dev_[in]);
99  }
100  }
101  // compute the net outputs: follow a pull model each output pulls the
102  // outputs of its input nodes and so on
103  for (int out = neuron_cnt_ - out_cnt_; out < neuron_cnt_; out++) {
104  neurons_[out].FeedForward();
105  // copy the values to the output buffer
106  outputs[out] = neurons_[out].output();
107  }
108  return true;
109 }
110 
111 // Sets a connection between two neurons
112 bool NeuralNet::SetConnection(int from, int to) {
113  // allocate the wgt
114  float *wts = AllocWgt(1);
115  if (wts == NULL) {
116  return false;
117  }
118  // register the connection
119  neurons_[to].AddFromConnection(neurons_ + from, wts, 1);
120  return true;
121 }
122 
123 // Create a fast readonly version of the net
125  fast_nodes_.resize(neuron_cnt_);
126  // build the node structures
127  int wts_cnt = 0;
128  for (int node_idx = 0; node_idx < neuron_cnt_; node_idx++) {
129  Node *node = &fast_nodes_[node_idx];
130  if (neurons_[node_idx].node_type() == Neuron::Input) {
131  // Input neurons have no fan-in
132  node->fan_in_cnt = 0;
133  node->inputs = NULL;
134  // Input bias is the normalization offset computed from
135  // training input stats
136  if (fabs(inputs_max_[node_idx] - inputs_min_[node_idx]) <
137  kMinInputRange) {
138  // if the range approaches zero, the stdev is not defined,
139  // this indicates that this input does not change.
140  // Set the bias to zero
141  node->bias = 0.0f;
142  } else {
143  node->bias = inputs_min_[node_idx] + (inputs_mean_[node_idx] *
144  (inputs_max_[node_idx] - inputs_min_[node_idx]));
145  }
146  } else {
147  node->bias = neurons_[node_idx].bias();
148  node->fan_in_cnt = neurons_[node_idx].fan_in_cnt();
149  // allocate memory for fan-in nodes
150  node->inputs = new WeightedNode[node->fan_in_cnt];
151  if (node->inputs == NULL) {
152  return false;
153  }
154  for (int fan_in = 0; fan_in < node->fan_in_cnt; fan_in++) {
155  // identify fan-in neuron
156  const int id = neurons_[node_idx].fan_in(fan_in)->id();
157  // Feedback connections are not allowed and should never happen
158  if (id >= node_idx) {
159  return false;
160  }
 161  // add the fan-in neuron and its wgt
162  node->inputs[fan_in].input_node = &fast_nodes_[id];
163  float wgt_val = neurons_[node_idx].fan_in_wts(fan_in);
164  // for input neurons normalize the wgt by the input scaling
165  // values to save time during feedforward
166  if (neurons_[node_idx].fan_in(fan_in)->node_type() == Neuron::Input) {
167  // if the range approaches zero, the stdev is not defined,
168  // this indicates that this input does not change.
169  // Set the weight to zero
170  if (fabs(inputs_max_[id] - inputs_min_[id]) < kMinInputRange) {
171  wgt_val = 0.0f;
172  } else {
173  wgt_val /= ((inputs_max_[id] - inputs_min_[id]) *
174  inputs_std_dev_[id]);
175  }
176  }
177  node->inputs[fan_in].input_weight = wgt_val;
178  }
179  // incr wgt count to validate against at the end
180  wts_cnt += node->fan_in_cnt;
181  }
182  }
183  // sanity check
184  return wts_cnt_ == wts_cnt;
185 }
186 
187 // returns a pointer to the requested set of weights
188 // Allocates in chunks
189 float * NeuralNet::AllocWgt(int wgt_cnt) {
190  // see if need to allocate a new chunk of wts
191  if (wts_vec_.size() == 0 || (alloc_wgt_cnt_ + wgt_cnt) > kWgtChunkSize) {
192  // add the new chunck to the wts_chunks vector
193  wts_vec_.push_back(new vector<float> (kWgtChunkSize));
194  alloc_wgt_cnt_ = 0;
195  }
196  float *ret_ptr = &((*wts_vec_.back())[alloc_wgt_cnt_]);
197  // incr usage counts
198  alloc_wgt_cnt_ += wgt_cnt;
199  wts_cnt_ += wgt_cnt;
200  return ret_ptr;
201 }
202 
203 // create a new net object using an input file as a source
204 NeuralNet *NeuralNet::FromFile(const string file_name) {
205  // open the file
206  InputFileBuffer input_buff(file_name);
207  // create a new net object using input buffer
208  NeuralNet *net_obj = FromInputBuffer(&input_buff);
209  return net_obj;
210 }
211 
212 // create a net object from an input buffer
214  // create a new net object
215  NeuralNet *net_obj = new NeuralNet();
216  if (net_obj == NULL) {
217  return NULL;
218  }
219  // load the net
220  if (!net_obj->ReadBinary(ib)) {
221  delete net_obj;
222  net_obj = NULL;
223  }
224  return net_obj;
225 }
226 
227 // Compute the output of a specific output node.
228 // This function is useful for application that are interested in a single
229 // output of the net and do not want to waste time on the rest
230 // This is the fast-read-only version of this function
231 template <typename Type> bool NeuralNet::FastGetNetOutput(const Type *inputs,
232  int output_id,
233  Type *output) {
234  // feed inputs in and offset them by the pre-computed bias
235  int node_idx = 0;
236  Node *node = &fast_nodes_[0];
237  for (node_idx = 0; node_idx < in_cnt_; node_idx++, node++) {
238  node->out = inputs[node_idx] - node->bias;
239  }
240 
241  // compute nodes' activations and outputs for hidden nodes if any
242  int hidden_node_cnt = neuron_cnt_ - out_cnt_;
243  for (;node_idx < hidden_node_cnt; node_idx++, node++) {
244  double activation = -node->bias;
245  for (int fan_in_idx = 0; fan_in_idx < node->fan_in_cnt; fan_in_idx++) {
246  activation += (node->inputs[fan_in_idx].input_weight *
247  node->inputs[fan_in_idx].input_node->out);
248  }
249  node->out = Neuron::Sigmoid(activation);
250  }
251 
252  // compute the output of the required output node
253  node += output_id;
254  double activation = -node->bias;
255  for (int fan_in_idx = 0; fan_in_idx < node->fan_in_cnt; fan_in_idx++) {
256  activation += (node->inputs[fan_in_idx].input_weight *
257  node->inputs[fan_in_idx].input_node->out);
258  }
259  (*output) = Neuron::Sigmoid(activation);
260  return true;
261 }
262 
263 // Performs a feedforward for general nets. Used mainly in training mode
264 // Templatized for float and double Types
265 template <typename Type> bool NeuralNet::GetNetOutput(const Type *inputs,
266  int output_id,
267  Type *output) {
268  // validate output id
269  if (output_id < 0 || output_id >= out_cnt_) {
270  return false;
271  }
272 
273  // call the fast version in case of readonly nets
274  if (read_only_) {
275  return FastGetNetOutput(inputs, output_id, output);
276  }
277 
278  // For the slow version, we'll just call FeedForward and return the
279  // appropriate output
280  vector<Type> outputs(out_cnt_);
281  if (!FeedForward(inputs, &outputs[0])) {
282  return false;
283  }
284  (*output) = outputs[output_id];
285 
286  return true;
287 }
288 
289 // Instantiate all supported templates now that the functions have been defined.
// Explicit instantiation keeps the template definitions inside this .cpp
// file while still letting other translation units link against the
// float and double variants.
290 template bool NeuralNet::FeedForward(const float *inputs, float *outputs);
291 template bool NeuralNet::FeedForward(const double *inputs, double *outputs);
292 template bool NeuralNet::FastFeedForward(const float *inputs, float *outputs);
293 template bool NeuralNet::FastFeedForward(const double *inputs,
294  double *outputs);
295 template bool NeuralNet::GetNetOutput(const float *inputs, int output_id,
296  float *output);
297 template bool NeuralNet::GetNetOutput(const double *inputs, int output_id,
298  double *output);
299 template bool NeuralNet::FastGetNetOutput(const float *inputs, int output_id,
300  float *output);
301 template bool NeuralNet::FastGetNetOutput(const double *inputs, int output_id,
302  double *output);
303 template bool NeuralNet::ReadBinary(InputFileBuffer *input_buffer);
304 
305 }
void AddFromConnection(Neuron *neuron_vec, float *wts_offset, int from_cnt)
Definition: neuron.cpp:74
static NeuralNet * FromInputBuffer(InputFileBuffer *ib)
Definition: neural_net.cpp:213
static const int kWgtChunkSize
Definition: neural_net.h:76
vector< float > inputs_min_
Definition: neural_net.h:89
float * AllocWgt(int wgt_cnt)
Definition: neural_net.cpp:189
float fan_in_wts(int idx) const
Definition: neuron.h:108
void set_output(float out_val)
Definition: neuron.h:96
bool ReadBinary(ReadBuffType *input_buff)
Definition: neural_net.h:106
int id() const
Definition: neuron.h:99
bool FastFeedForward(const Type *inputs, Type *outputs)
Definition: neural_net.cpp:52
bool FastGetNetOutput(const Type *inputs, int output_id, Type *output)
Definition: neural_net.cpp:231
bool GetNetOutput(const Type *inputs, int output_id, Type *output)
Definition: neural_net.cpp:265
vector< float > inputs_mean_
Definition: neural_net.h:91
bool FeedForward(const Type *inputs, Type *outputs)
Definition: neural_net.cpp:79
vector< float > inputs_std_dev_
Definition: neural_net.h:93
Neuron * fan_in(int idx) const
Definition: neuron.h:105
float bias() const
Definition: neuron.h:114
vector< Node > fast_nodes_
Definition: neural_net.h:96
float output() const
Definition: neuron.h:93
vector< float > inputs_max_
Definition: neural_net.h:87
static float Sigmoid(float activation)
Definition: neuron.cpp:85
int fan_in_cnt() const
Definition: neuron.h:102
#define NULL
Definition: host.h:144
void FeedForward()
Definition: neuron.cpp:39
vector< vector< float > * > wts_vec_
Definition: neural_net.h:83
bool SetConnection(int from, int to)
Definition: neural_net.cpp:112
WeightedNode * inputs
Definition: neural_net.h:56
static NeuralNet * FromFile(const string file_name)
Definition: neural_net.cpp:204