tesseract-ocr.github.io/3.x/a01088_source.html

 // Copyright 2008 Google Inc.

 // All Rights Reserved.

 // Author: ahmadab@google.com (Ahmad Abdulkader)

 //

 // neural_net.h: Declarations of a class for an object that

 // represents an arbitrary network of neurons

 //


 #ifndef NEURAL_NET_H

 #define NEURAL_NET_H


 #include <string>

 #include <vector>

 #include "neuron.h"

 #include "input_file_buffer.h"


 namespace tesseract {


 // Smallest input range treated as meaningful: when an input's range is
 // below this value, its input weight is set to zero.
 // (A namespace-scope const object already has internal linkage, so every
 // translation unit including this header gets its own private copy.)
 const float kMinInputRange = 1.0e-6f;


 class NeuralNet {

   public:

     NeuralNet();

     virtual ~NeuralNet();

     // create a net object from a file. Uses stdio

     static NeuralNet *FromFile(const string file_name);

     // create a net object from an input buffer

     static NeuralNet *FromInputBuffer(InputFileBuffer *ib);

     // Different flavors of feed forward function

     template <typename Type> bool FeedForward(const Type *inputs,

                                               Type *outputs);

     // Compute the output of a specific output node.

     // This function is useful for application that are interested in a single

     // output of the net and do not want to waste time on the rest

     template <typename Type> bool GetNetOutput(const Type *inputs,

                                                int output_id,

                                                Type *output);

     // Accessor functions

     int in_cnt() const { return in_cnt_; }

     int out_cnt() const { return out_cnt_; }


   protected:

     struct Node;

     // A node-weight pair

     struct WeightedNode {

       Node *input_node;

       float input_weight;

     };

     // node struct used for fast feedforward in

     // Read only nets

     struct Node {

       float out;

       float bias;

       int fan_in_cnt;

       WeightedNode *inputs;

     };

     // Read-Only flag (no training: On by default)

     // will presumeably be set to false by

     // the inherting TrainableNeuralNet class

     bool read_only_;

     // input count

     int in_cnt_;

     // output count

     int out_cnt_;

     // Total neuron count (including inputs)

     int neuron_cnt_;

     // count of unique weights

     int  wts_cnt_;

     // Neuron vector

     Neuron *neurons_;

     // size of allocated weight chunk (in weights)

     // This is basically the size of the biggest network

     // that I have trained. However, the class will allow

     // a bigger sized net if desired

     static const int kWgtChunkSize = 0x10000;

     // Magic number expected at the beginning of the NN

     // binary file

     static const unsigned int kNetSignature = 0xFEFEABD0;

     // count of allocated wgts in the last chunk

     int alloc_wgt_cnt_;

     // vector of weights buffers

     vector<vector<float> *>wts_vec_;

     // Is the net an auto-encoder type

     bool auto_encoder_;

     // vector of input max values

     vector<float> inputs_max_;

     // vector of input min values

     vector<float> inputs_min_;

     // vector of input mean values

     vector<float> inputs_mean_;

     // vector of input standard deviation values

     vector<float> inputs_std_dev_;

     // vector of input offsets used by fast read-only

     // feedforward function

     vector<Node> fast_nodes_;

     // Network Initialization function

     void Init();

     // Clears all neurons

     void Clear() {

       for (int node = 0; node < neuron_cnt_; node++) {

         neurons_[node].Clear();

       }

     }

     // Reads the net from an input buffer

     template<class ReadBuffType> bool ReadBinary(ReadBuffType *input_buff) {

       // Init vars

       Init();

       // is this an autoencoder

       unsigned int read_val;

       unsigned int auto_encode;

       // read and verify signature

       if (input_buff->Read(&read_val, sizeof(read_val)) != sizeof(read_val)) {

         return false;

       }

       if (read_val != kNetSignature) {

         return false;

       }

       if (input_buff->Read(&auto_encode, sizeof(auto_encode)) !=

           sizeof(auto_encode)) {

         return false;

       }

       auto_encoder_ = auto_encode;

       // read and validate total # of nodes

       if (input_buff->Read(&read_val, sizeof(read_val)) != sizeof(read_val)) {

         return false;

       }

       neuron_cnt_ = read_val;

       if (neuron_cnt_ <= 0) {

         return false;

       }

       // set the size of the neurons vector

       neurons_ = new Neuron[neuron_cnt_];

       if (neurons_ == NULL) {

         return false;

       }

       // read & validate inputs

       if (input_buff->Read(&read_val, sizeof(read_val)) != sizeof(read_val)) {

         return false;

       }

       in_cnt_ = read_val;

       if (in_cnt_ <= 0) {

         return false;

       }

       // read outputs

       if (input_buff->Read(&read_val, sizeof(read_val)) != sizeof(read_val)) {

         return false;

       }

       out_cnt_ = read_val;

       if (out_cnt_ <= 0) {

         return false;

       }

       // set neuron ids and types

       for (int idx = 0; idx < neuron_cnt_; idx++) {

         neurons_[idx].set_id(idx);

         // input type

         if (idx < in_cnt_) {

           neurons_[idx].set_node_type(Neuron::Input);

         } else if (idx >= (neuron_cnt_ - out_cnt_)) {

           neurons_[idx].set_node_type(Neuron::Output);

         } else {

           neurons_[idx].set_node_type(Neuron::Hidden);

         }

       }

       // read the connections

       for (int node_idx = 0; node_idx < neuron_cnt_; node_idx++) {

         // read fanout

         if (input_buff->Read(&read_val, sizeof(read_val)) != sizeof(read_val)) {

           return false;

         }

         // read the neuron's info

         int fan_out_cnt = read_val;

         for (int fan_out_idx = 0; fan_out_idx < fan_out_cnt; fan_out_idx++) {

           // read the neuron id

           if (input_buff->Read(&read_val, sizeof(read_val)) != sizeof(read_val)) {

             return false;

           }

           // create the connection

           if (!SetConnection(node_idx, read_val)) {

             return false;

           }

         }

       }

       // read all the neurons' fan-in connections

       for (int node_idx = 0; node_idx < neuron_cnt_; node_idx++) {

         // read

         if (!neurons_[node_idx].ReadBinary(input_buff)) {

           return false;

         }

       }

       // size input stats vector to expected input size

       inputs_mean_.resize(in_cnt_);

       inputs_std_dev_.resize(in_cnt_);

       inputs_min_.resize(in_cnt_);

       inputs_max_.resize(in_cnt_);

       // read stats

       if (input_buff->Read(&(inputs_mean_.front()),

           sizeof(inputs_mean_[0]) * in_cnt_) !=

           sizeof(inputs_mean_[0]) * in_cnt_) {

         return false;

       }

       if (input_buff->Read(&(inputs_std_dev_.front()),

           sizeof(inputs_std_dev_[0]) * in_cnt_) !=

           sizeof(inputs_std_dev_[0]) * in_cnt_) {

         return false;

       }

       if (input_buff->Read(&(inputs_min_.front()),

           sizeof(inputs_min_[0]) * in_cnt_) !=

           sizeof(inputs_min_[0]) * in_cnt_) {

         return false;

       }

       if (input_buff->Read(&(inputs_max_.front()),

           sizeof(inputs_max_[0]) * in_cnt_) !=

           sizeof(inputs_max_[0]) * in_cnt_) {

         return false;

       }

       // create a readonly version for fast feedforward

       if (read_only_) {

         return CreateFastNet();

       }

       return true;

     }


     // creates a connection between two nodes

     bool SetConnection(int from, int to);

     // Create a read only version of the net that

     // has faster feedforward performance

     bool CreateFastNet();

     // internal function to allocate a new set of weights

     // Centralized weight allocation attempts to increase

     // weights locality of reference making it more cache friendly

     float *AllocWgt(int wgt_cnt);

     // different flavors read-only feedforward function

     template <typename Type> bool FastFeedForward(const Type *inputs,

                                                   Type *outputs);

     // Compute the output of a specific output node.

     // This function is useful for application that are interested in a single

     // output of the net and do not want to waste time on the rest

     // This is the fast-read-only version of this function

     template <typename Type> bool FastGetNetOutput(const Type *inputs,

                                                    int output_id,

                                                    Type *output);

 };

 }


 #endif  // NEURAL_NET_H

tesseract::NeuralNet::FromInputBuffer
static NeuralNet * FromInputBuffer(InputFileBuffer *ib)
Definition: neural_net.cpp:213

tesseract::NeuralNet::kWgtChunkSize
static const int kWgtChunkSize
Definition: neural_net.h:76

tesseract::NeuralNet::WeightedNode::input_node
Node * input_node
Definition: neural_net.h:47

tesseract::NeuralNet::in_cnt
int in_cnt() const
Definition: neural_net.h:40

tesseract::NeuralNet::inputs_min_
vector< float > inputs_min_
Definition: neural_net.h:89

tesseract::NeuralNet::AllocWgt
float * AllocWgt(int wgt_cnt)
Definition: neural_net.cpp:189

tesseract::Neuron
Definition: neuron.h:24

tesseract::NeuralNet::Clear
void Clear()
Definition: neural_net.h:100

tesseract::NeuralNet::out_cnt_
int out_cnt_
Definition: neural_net.h:65

tesseract::NeuralNet::ReadBinary
bool ReadBinary(ReadBuffType *input_buff)
Definition: neural_net.h:106

tesseract::NeuralNet::Node::fan_in_cnt
int fan_in_cnt
Definition: neural_net.h:55

tesseract::NeuralNet::read_only_
bool read_only_
Definition: neural_net.h:61

tesseract::NeuralNet::FastFeedForward
bool FastFeedForward(const Type *inputs, Type *outputs)
Definition: neural_net.cpp:52

tesseract::NeuralNet::FastGetNetOutput
bool FastGetNetOutput(const Type *inputs, int output_id, Type *output)
Definition: neural_net.cpp:231

tesseract::NeuralNet
Definition: neural_net.h:22

tesseract::NeuralNet::GetNetOutput
bool GetNetOutput(const Type *inputs, int output_id, Type *output)
Definition: neural_net.cpp:265

tesseract::NeuralNet::Node::bias
float bias
Definition: neural_net.h:54

tesseract::NeuralNet::inputs_mean_
vector< float > inputs_mean_
Definition: neural_net.h:91

tesseract::NeuralNet::in_cnt_
int in_cnt_
Definition: neural_net.h:63

tesseract::NeuralNet::FeedForward
bool FeedForward(const Type *inputs, Type *outputs)
Definition: neural_net.cpp:79

tesseract::NeuralNet::inputs_std_dev_
vector< float > inputs_std_dev_
Definition: neural_net.h:93

tesseract::NeuralNet::WeightedNode::input_weight
float input_weight
Definition: neural_net.h:48

tesseract::NeuralNet::fast_nodes_
vector< Node > fast_nodes_
Definition: neural_net.h:96

tesseract::NeuralNet::Node::out
float out
Definition: neural_net.h:53

tesseract::NeuralNet::~NeuralNet
virtual ~NeuralNet()
Definition: neural_net.cpp:19

neuron.h

tesseract::NeuralNet::CreateFastNet
bool CreateFastNet()
Definition: neural_net.cpp:124

tesseract::NeuralNet::wts_cnt_
int wts_cnt_
Definition: neural_net.h:69

tesseract::NeuralNet::out_cnt
int out_cnt() const
Definition: neural_net.h:41

tesseract::NeuralNet::Init
void Init()
Definition: neural_net.cpp:34

tesseract::NeuralNet::alloc_wgt_cnt_
int alloc_wgt_cnt_
Definition: neural_net.h:81

tesseract::NeuralNet::kNetSignature
static const unsigned int kNetSignature
Definition: neural_net.h:79

tesseract::NeuralNet::auto_encoder_
bool auto_encoder_
Definition: neural_net.h:85

tesseract::NeuralNet::inputs_max_
vector< float > inputs_max_
Definition: neural_net.h:87

tesseract::NeuralNet::NeuralNet
NeuralNet()
Definition: neural_net.cpp:15

tesseract::Neuron::Clear
void Clear()
Definition: neuron.h:37

tesseract::Neuron::Hidden
Definition: neuron.h:30

tesseract::NeuralNet::neurons_
Neuron * neurons_
Definition: neural_net.h:71

tesseract::Neuron::Input
Definition: neuron.h:29

tesseract
Definition: baseapi.cpp:83

tesseract::Neuron::Output
Definition: neuron.h:31

tesseract::Neuron::set_id
void set_id(int id)
Definition: neuron.h:111

tesseract::NeuralNet::Node
Definition: neural_net.h:52

tesseract::Neuron::set_node_type
void set_node_type(NeuronTypes type)
Definition: neuron.cpp:62

input_file_buffer.h

NULL
#define NULL
Definition: host.h:144

tesseract::NeuralNet::WeightedNode
Definition: neural_net.h:46

tesseract::NeuralNet::wts_vec_
vector< vector< float > * > wts_vec_
Definition: neural_net.h:83

tesseract::NeuralNet::SetConnection
bool SetConnection(int from, int to)
Definition: neural_net.cpp:112

tesseract::NeuralNet::neuron_cnt_
int neuron_cnt_
Definition: neural_net.h:67

tesseract::NeuralNet::Node::inputs
WeightedNode * inputs
Definition: neural_net.h:56

tesseract::InputFileBuffer
Definition: input_file_buffer.h:19

tesseract::NeuralNet::FromFile
static NeuralNet * FromFile(const string file_name)
Definition: neural_net.cpp:204