FunASR/runtime/onnxruntime/third_party/kaldi/lm/mikolov-rnnlm-lib.h

// lm/mikolov-rnnlm-lib.h

// Copyright       2015  Guoguo Chen  Hainan Xu
//            2010-2012  Tomas Mikolov

// See ../../COPYING for clarification regarding multiple authors
//
// This file is based on version 0.3e of the RNNLM language modeling
// toolkit by Tomas Mikolov.  Changes made by authors other than
// Tomas Mikolov are licensed under the Apache License, the short form
// of which is below.  The original code by Tomas Mikolov is licensed
// under the BSD 3-clause license, whose text is further below.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.
//
//
// Original BSD 3-clause license text:
// Copyright (c) 2010-2012 Tomas Mikolov
//
// All rights reserved. Redistribution and use in source and binary forms, with
// or without modification, are permitted provided that the following conditions
// are met: 1. Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following
// disclaimer. 2. Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the
// distribution. 3. Neither name of copyright holders nor the names of its
// contributors may be used to endorse or promote products derived from this
// software without specific prior written permission. THIS SOFTWARE IS PROVIDED
// BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR
// IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
// EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
// INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,
// OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
// EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

#ifndef KALDI_LM_MIKOLOV_RNNLM_LIB_H_
#define KALDI_LM_MIKOLOV_RNNLM_LIB_H_

#include <cstdio>
#include <string>
#include <vector>
#include "util/stl-utils.h"

namespace rnnlm {

// Size of the fixed character buffer that holds a word in vocab_word.
#define MAX_STRING 100
// Size of each fixed file-name buffer stored in CRnnLM.
#define MAX_FILENAME_STRING 300

// Scalar type used for neuron values/errors and synapse weights.
typedef double real;      //  doubles for NN weights
// Scalar type of the direct (Maximum-Entropy-like) parameters, see syn_d.
typedef double direct_t;  //  doubles for ME weights;

// One unit of a network layer: a stored value plus the error term the
// learning algorithm associates with it.  CRnnLM refers to each of its
// layers through a neuron pointer.
struct neuron {
  real ac;    // actual value stored in neuron
  real er;    // error value in neuron, used by learning algorithm
};

// A single connection weight.  CRnnLM refers to its weight matrices through
// synapse pointers (syn0, syn1, sync and their backups).
struct synapse {
  real weight;  // weight of synapse
};

// One vocabulary entry; CRnnLM points to these through its vocab member.
struct vocab_word {
  // NOTE(review): presumably the occurrence count of the word -- confirm
  // against the implementation file.
  int cn;
  // Word text, stored inline in a fixed buffer of MAX_STRING chars.
  char word[MAX_STRING];

  // NOTE(review): looks like a per-word probability -- confirm.
  real prob;
  // NOTE(review): presumably the index of the class this word belongs to
  // (cf. the class_* members of CRnnLM) -- confirm.
  int class_index;
};

// Fixed table of 36 large integer constants, kept in its original order.
// NOTE(review): the table's consumers are not visible in this header; see the
// implementation file for how it is indexed.
const unsigned int PRIMES[] = {
  108641969, 116049371, 125925907, 133333309, 145678979, 175308587,
  197530793, 234567803, 251851741, 264197411, 330864029, 399999781,
  407407183, 459258997, 479012069, 545678687, 560493491, 607407037,
  629629243, 656789717, 716048933, 718518067, 725925469, 733332871,
  753085943, 755555077, 782715551, 790122953, 812345159, 814814293,
  893826581, 923456189, 940740127, 953085797, 985184539, 990122807
};
// Element count of PRIMES, computed from the array itself so the two can
// never get out of step.
const unsigned int PRIMES_SIZE = sizeof(PRIMES) / sizeof(*PRIMES);

// Length of the fixed-size CRnnLM::history array.
const int MAX_NGRAM_ORDER = 20;

// File format selector.  NOTE(review): presumably the values stored in
// CRnnLM::filetype -- confirm in the implementation file.
enum FileTypeEnum {
  TEXT = 0,
  BINARY = 1,
  COMPRESSED = 2  // COMPRESSED not yet implemented
};

class CRnnLM {
 protected:
  char train_file[MAX_FILENAME_STRING];
  char valid_file[MAX_FILENAME_STRING];
  char test_file[MAX_FILENAME_STRING];
  char rnnlm_file[MAX_FILENAME_STRING];
  char lmprob_file[MAX_FILENAME_STRING];

  int rand_seed;
  int version;
  int filetype;

  int use_lmprob;
  real gradient_cutoff;

  real dynamic;

  real alpha;
  real starting_alpha;
  int alpha_divide;
  double logp, llogp;
  float min_improvement;
  int iter;
  int vocab_max_size;
  int vocab_size;
  int train_words;
  int train_cur_pos;
  int counter;

  int anti_k;

  real beta;

  int class_size;
  int **class_words;
  int *class_cn;
  int *class_max_cn;
  int old_classes;

  struct vocab_word *vocab;
  void sortVocab();
  int *vocab_hash;
  int vocab_hash_size;

  int layer0_size;
  int layer1_size;
  int layerc_size;
  int layer2_size;

  long long direct_size;
  int direct_order;
  int history[MAX_NGRAM_ORDER];

  int bptt;
  int bptt_block;
  int *bptt_history;
  neuron *bptt_hidden;
  struct synapse *bptt_syn0;

  int gen;

  int independent;

  struct neuron *neu0;    // neurons in input layer
  struct neuron *neu1;    // neurons in hidden layer
  struct neuron *neuc;    // neurons in hidden layer
  struct neuron *neu2;    // neurons in output layer

  struct synapse *syn0;   // weights between input and hidden layer
  struct synapse *syn1;   // weights between hidden and output layer
                          // (or hidden and compression if compression>0)
  struct synapse *sync;   // weights between hidden and compression layer
  direct_t *syn_d;        // direct parameters between input and output layer
                          // (similar to Maximum Entropy model parameters)

  // backup used in training:
  struct neuron *neu0b;
  struct neuron *neu1b;
  struct neuron *neucb;
  struct neuron *neu2b;

  struct synapse *syn0b;
  struct synapse *syn1b;
  struct synapse *syncb;
  direct_t *syn_db;

  // backup used in n-bset rescoring:
  struct neuron *neu1b2;

  unordered_map<std::string, float> unk_penalty;
  std::string unk_sym;

 public:

  int alpha_set, train_file_set;

  CRnnLM();

  ~CRnnLM();

  real random(real min, real max);

  void setRnnLMFile(const std::string &str);
  int getHiddenLayerSize() const { return layer1_size; }
  void setRandSeed(int newSeed);

  int getWordHash(const char *word);
  void readWord(char *word, FILE *fin);
  int searchVocab(const char *word);

  void saveWeights();      // saves current weights and unit activations
  void initNet();
  void goToDelimiter(int delim, FILE *fi);
  void restoreNet();
  void netReset();         // will erase just hidden layer state + bptt history
                           // + maxent history (called at end of sentences in
                           // the independent mode)

  void computeNet(int last_word, int word);
  void copyHiddenLayerToInput();

  void matrixXvector(struct neuron *dest, struct neuron *srcvec,
                     struct synapse *srcmatrix, int matrix_width,
                     int from, int to, int from2, int to2, int type);

  void restoreContextFromVector(const std::vector<float> &context_in);
  void saveContextToVector(std::vector<float> *context_out);

  float computeConditionalLogprob(
      std::string current_word,
      const std::vector<std::string> &history_words,
      const std::vector<float> &context_in,
      std::vector<float> *context_out);

  void setUnkSym(const std::string &unk);
  void setUnkPenalty(const std::string &filename);
  float getUnkPenalty(const std::string &word);
  bool isUnk(const std::string &word);
};

}  // namespace rnnlm

#endif  // KALDI_LM_MIKOLOV_RNNLM_LIB_H_
first commit for takway.ai 2024-05-18 15:50:56 +08:00			`// lm/mikolov-rnnlm-lib.h`

			`// Copyright 2015 Guoguo Chen Hainan Xu`
			`// 2010-2012 Tomas Mikolov`

			`// See ../../COPYING for clarification regarding multiple authors`
			`//`
			`// This file is based on version 0.3e of the RNNLM language modeling`
			`// toolkit by Tomas Mikolov. Changes made by authors other than`
			`// Tomas Mikolov are licensed under the Apache License, the short form`
			`// of which is below. The original code by Tomas Mikolov is licensed`
			`// under the BSD 3-clause license, whose text is further below.`
			`//`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY`
			`// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED`
			`// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,`
			`// MERCHANTABLITY OR NON-INFRINGEMENT.`
			`// See the Apache 2 License for the specific language governing permissions and`
			`// limitations under the License.`
			`//`
			`//`
			`// Original BSD 3-clause license text:`
			`// Copyright (c) 2010-2012 Tomas Mikolov`
			`//`
			`// All rights reserved. Redistribution and use in source and binary forms, with`
			`// or without modification, are permitted provided that the following conditions`
			`// are met: 1. Redistributions of source code must retain the above copyright`
			`// notice, this list of conditions and the following`
			`// disclaimer. 2. Redistributions in binary form must reproduce the above`
			`// copyright notice, this list of conditions and the following disclaimer in the`
			`// documentation and/or other materials provided with the`
			`// distribution. 3. Neither name of copyright holders nor the names of its`
			`// contributors may be used to endorse or promote products derived from this`
			`// software without specific prior written permission. THIS SOFTWARE IS PROVIDED`
			// BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR
			`// IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF`
			`// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO`
			`// EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,`
			`// INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT`
			`// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,`
			`// OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF`
			`// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING`
			`// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,`
			`// EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.`

			`#ifndef KALDI_LM_MIKOLOV_RNNLM_LIB_H_`
			`#define KALDI_LM_MIKOLOV_RNNLM_LIB_H_`

			`#include <string>`
			`#include <vector>`
			`#include "util/stl-utils.h"`

			`namespace rnnlm {`

			`#define MAX_STRING 100`
			`#define MAX_FILENAME_STRING 300`

			`typedef double real; // doubles for NN weights`
			`typedef double direct_t; // doubles for ME weights;`

			`struct neuron {`
			`real ac; // actual value stored in neuron`
			`real er; // error value in neuron, used by learning algorithm`
			`};`

			`struct synapse {`
			`real weight; // weight of synapse`
			`};`

			`struct vocab_word {`
			`int cn;`
			`char word[MAX_STRING];`

			`real prob;`
			`int class_index;`
			`};`

			`const unsigned int PRIMES[] = {108641969, 116049371, 125925907, 133333309,`
			`145678979, 175308587, 197530793, 234567803, 251851741, 264197411,`
			`330864029, 399999781,`
			`407407183, 459258997, 479012069, 545678687, 560493491, 607407037, 629629243,`
			`656789717, 716048933, 718518067, 725925469, 733332871, 753085943, 755555077,`
			`782715551, 790122953, 812345159, 814814293, 893826581, 923456189, 940740127,`
			`953085797, 985184539, 990122807};`
			`const unsigned int PRIMES_SIZE = sizeof(PRIMES) / sizeof(PRIMES[0]);`

			`const int MAX_NGRAM_ORDER = 20;`

			`enum FileTypeEnum {TEXT, BINARY, COMPRESSED}; // COMPRESSED not yet implemented`

			`class CRnnLM {`
			`protected:`
			`char train_file[MAX_FILENAME_STRING];`
			`char valid_file[MAX_FILENAME_STRING];`
			`char test_file[MAX_FILENAME_STRING];`
			`char rnnlm_file[MAX_FILENAME_STRING];`
			`char lmprob_file[MAX_FILENAME_STRING];`

			`int rand_seed;`
			`int version;`
			`int filetype;`

			`int use_lmprob;`
			`real gradient_cutoff;`

			`real dynamic;`

			`real alpha;`
			`real starting_alpha;`
			`int alpha_divide;`
			`double logp, llogp;`
			`float min_improvement;`
			`int iter;`
			`int vocab_max_size;`
			`int vocab_size;`
			`int train_words;`
			`int train_cur_pos;`
			`int counter;`

			`int anti_k;`

			`real beta;`

			`int class_size;`
			`int **class_words;`
			`int *class_cn;`
			`int *class_max_cn;`
			`int old_classes;`

			`struct vocab_word *vocab;`
			`void sortVocab();`
			`int *vocab_hash;`
			`int vocab_hash_size;`

			`int layer0_size;`
			`int layer1_size;`
			`int layerc_size;`
			`int layer2_size;`

			`long long direct_size;`
			`int direct_order;`
			`int history[MAX_NGRAM_ORDER];`

			`int bptt;`
			`int bptt_block;`
			`int *bptt_history;`
			`neuron *bptt_hidden;`
			`struct synapse *bptt_syn0;`

			`int gen;`

			`int independent;`

			`struct neuron *neu0; // neurons in input layer`
			`struct neuron *neu1; // neurons in hidden layer`
			`struct neuron *neuc; // neurons in hidden layer`
			`struct neuron *neu2; // neurons in output layer`

			`struct synapse *syn0; // weights between input and hidden layer`
			`struct synapse *syn1; // weights between hidden and output layer`
			`// (or hidden and compression if compression>0)`
			`struct synapse *sync; // weights between hidden and compression layer`
			`direct_t *syn_d; // direct parameters between input and output layer`
			`// (similar to Maximum Entropy model parameters)`

			`// backup used in training:`
			`struct neuron *neu0b;`
			`struct neuron *neu1b;`
			`struct neuron *neucb;`
			`struct neuron *neu2b;`

			`struct synapse *syn0b;`
			`struct synapse *syn1b;`
			`struct synapse *syncb;`
			`direct_t *syn_db;`

			`// backup used in n-bset rescoring:`
			`struct neuron *neu1b2;`

			`unordered_map<std::string, float> unk_penalty;`
			`std::string unk_sym;`

			`public:`

			`int alpha_set, train_file_set;`

			`CRnnLM();`

			`~CRnnLM();`

			`real random(real min, real max);`

			`void setRnnLMFile(const std::string &str);`
			`int getHiddenLayerSize() const { return layer1_size; }`
			`void setRandSeed(int newSeed);`

			`int getWordHash(const char *word);`
			`void readWord(char *word, FILE *fin);`
			`int searchVocab(const char *word);`

			`void saveWeights(); // saves current weights and unit activations`
			`void initNet();`
			`void goToDelimiter(int delim, FILE *fi);`
			`void restoreNet();`
			`void netReset(); // will erase just hidden layer state + bptt history`
			`// + maxent history (called at end of sentences in`
			`// the independent mode)`

			`void computeNet(int last_word, int word);`
			`void copyHiddenLayerToInput();`

			`void matrixXvector(struct neuron *dest, struct neuron *srcvec,`
			`struct synapse *srcmatrix, int matrix_width,`
			`int from, int to, int from2, int to2, int type);`

			`void restoreContextFromVector(const std::vector<float> &context_in);`
			`void saveContextToVector(std::vector<float> *context_out);`

			`float computeConditionalLogprob(`
			`std::string current_word,`
			`const std::vector<std::string> &history_words,`
			`const std::vector<float> &context_in,`
			`std::vector<float> *context_out);`

			`void setUnkSym(const std::string &unk);`
			`void setUnkPenalty(const std::string &filename);`
			`float getUnkPenalty(const std::string &word);`
			`bool isUnk(const std::string &word);`
			`};`

			`} // namespace rnnlm`

			`#endif // KALDI_LM_MIKOLOV_RNNLM_LIB_H_`