#include <cstdarg>
#include <cstdlib>
#include "EST_String.h"
#include "EST_Val.h"
#include "EST_rw_status.h"
#include "EST_types.h"
#include "EST_FMatrix.h"
#include "EST_TList.h"
#include "EST_StringTrie.h"
#include "EST_simplestats.h"
#include "EST_PST.h"
#include "EST_string_aux.h"
#include "EST_math.h"
Go to the source code of this file.
Classes
class EST_NgrammarState
class EST_BackoffNgrammarState
class EST_Ngrammar
Macros
#define SENTENCE_START_MARKER "!ENTER"
#define SENTENCE_END_MARKER "!EXIT"
#define OOV_MARKER "!OOV"
#define EST_NGRAMBIN_MAGIC 1315402337
#define GZIP_FILENAME_EXTENSION "gz"
#define COMPRESS_FILENAME_EXTENSION "Z"
#define TINY_FREQ 1.0e-10
Functions
EST_write_status save_ngram_htk_ascii (const EST_String filename, EST_Ngrammar &n, double floor=0.0)
EST_write_status save_ngram_cstr_ascii (const EST_String filename, EST_Ngrammar &n, const bool trace=false, double floor=0.0)
EST_write_status save_ngram_cstr_bin (const EST_String filename, EST_Ngrammar &n, const bool trace=false, double floor=0.0)
void frequency_of_frequencies (EST_DVector &ff, EST_Ngrammar &n, int this_order=0)
void map_frequencies (EST_Ngrammar &n, const EST_DVector &map, const int this_order=0)
bool Good_Turing_smooth (EST_Ngrammar &n, int maxcount, int mincount=0)
void Good_Turing_discount (EST_Ngrammar &ngrammar, const int maxcount, const double default_discount=0.5)
void Ngram_freqsmooth (EST_Ngrammar &ngram, int smooth_thresh1, int smooth_thresh2)
void slide (EST_IVector &i, const int l)
void slide (EST_StrVector &i, const int l)
bool test_stats (EST_Ngrammar &ngram, const EST_String &filename, double &raw_entropy, double &count, double &entropy, double &perplexity, const EST_String &input_format, const EST_String &prev=SENTENCE_START_MARKER, const EST_String &prev_prev=SENTENCE_END_MARKER, const EST_String &last=SENTENCE_END_MARKER)
#define SENTENCE_START_MARKER "!ENTER"
Definition at line 59 of file EST_Ngrammar.h.
#define SENTENCE_END_MARKER "!EXIT"
Definition at line 60 of file EST_Ngrammar.h.
#define OOV_MARKER "!OOV"
Definition at line 61 of file EST_Ngrammar.h.
#define EST_NGRAMBIN_MAGIC 1315402337
Definition at line 63 of file EST_Ngrammar.h.
#define GZIP_FILENAME_EXTENSION "gz"
Definition at line 66 of file EST_Ngrammar.h.
#define COMPRESS_FILENAME_EXTENSION "Z"
Definition at line 67 of file EST_Ngrammar.h.
#define TINY_FREQ 1.0e-10
Definition at line 70 of file EST_Ngrammar.h.
EST_write_status save_ngram_htk_ascii(const EST_String filename,
                                      EST_Ngrammar &n,
                                      double floor = 0.0)
Definition at line 565 of file ngrammar_io.cc.
EST_write_status save_ngram_cstr_ascii(const EST_String filename,
                                       EST_Ngrammar &n,
                                       const bool trace = false,
                                       double floor = 0.0)
Definition at line 747 of file ngrammar_io.cc.
EST_write_status save_ngram_cstr_bin(const EST_String filename,
                                     EST_Ngrammar &n,
                                     const bool trace = false,
                                     double floor = 0.0)
Definition at line 844 of file ngrammar_io.cc.
void frequency_of_frequencies(EST_DVector &ff,
                              EST_Ngrammar &n,
                              int this_order = 0)
Definition at line 207 of file ngrammar_aux.cc.
void map_frequencies(EST_Ngrammar &n,
                     const EST_DVector &map,
                     const int this_order = 0)
Definition at line 306 of file ngrammar_aux.cc.
bool Good_Turing_smooth(EST_Ngrammar &n,
                        int maxcount,
                        int mincount = 0)
Definition at line 410 of file ngrammar_aux.cc.
void Good_Turing_discount(EST_Ngrammar &ngrammar,
                          const int maxcount,
                          const double default_discount = 0.5)
Definition at line 540 of file ngrammar_aux.cc.
void Ngram_freqsmooth(EST_Ngrammar &ngram,
                      int smooth_thresh1,
                      int smooth_thresh2)
Definition at line 58 of file freqsmooth.cc.
void slide(EST_IVector &i,
           const int l)
Definition at line 2614 of file EST_Ngrammar.cc.
void slide(EST_StrVector &i,
           const int l)
Definition at line 2735 of file EST_Ngrammar.cc.
bool test_stats(EST_Ngrammar &ngram,
                const EST_String &filename,
                double &raw_entropy,
                double &count,
                double &entropy,
                double &perplexity,
                const EST_String &input_format,
                const EST_String &prev = SENTENCE_START_MARKER,
                const EST_String &prev_prev = SENTENCE_END_MARKER,
                const EST_String &last = SENTENCE_END_MARKER)
Definition at line 89 of file ngrammar_utils.cc.