.\" DO NOT MODIFY THIS FILE! It was generated by help2man 1.47.4.
.TH NGRAMCOUNT "1" "August 2017" "OpenGrm NGram library 1.3.2" "User Commands"
.SH NAME
ngramcount \- Count n-grams from an input file.
.SH DESCRIPTION
Count n-grams from an input file.
.IP
.SH SYNOPSIS
ngramcount [\-\-options] [in.far [out.fst]]
.SH OPTIONS
.PP
.HP
\fB\-\-alpha\fR: type = double, default = 1
.IP
Weight for first FST
.HP
\fB\-\-backoff_label\fR: type = int64, default = 0
.IP
Backoff label
.HP
\fB\-\-beta\fR: type = double, default = 1
.IP
Weight for second (and subsequent) FST(s)
.HP
\fB\-\-check_consistency\fR: type = bool, default = false
.IP
Check model consistency
.HP
\fB\-\-context_pattern\fR: type = string, default = ""
.IP
Pattern of contexts to count
.HP
\fB\-\-epsilon_as_backoff\fR: type = bool, default = false
.IP
Treat epsilon in the input FSTs as backoff
.HP
\fB\-\-method\fR: type = string, default = "counts"
.IP
One of: "counts", "histograms", "count_of_counts", "count_of_histograms"
.HP
\fB\-\-norm_eps\fR: type = double, default = 0.001
.IP
Normalization check epsilon
.HP
\fB\-\-normalize\fR: type = bool, default = false
.IP
Normalize resulting model
.HP
\fB\-\-order\fR: type = int64, default = 3
.IP
Set maximal order of n-grams to be counted
.HP
\fB\-\-output_fst\fR: type = bool, default = true
.IP
Output counts as FST (otherwise strings)
.HP
\fB\-\-require_symbols\fR: type = bool, default = true
.IP
Require symbol tables?
(default: yes)
.HP
\fB\-\-round_to_int\fR: type = bool, default = false
.IP
Round all counts to integers
.PP
.HP
\fB\-\-help\fR: type = bool, default = false
.IP
show usage information
.HP
\fB\-\-helpshort\fR: type = bool, default = false
.IP
show brief usage information
.HP
\fB\-\-tmpdir\fR: type = string, default = "/tmp"
.IP
temporary directory
.HP
\fB\-\-v\fR: type = int32, default = 0
.IP
verbosity level
.PP
.HP
\fB\-\-fst_align\fR: type = bool, default = false
.IP
Write FST data aligned where appropriate
.HP
\fB\-\-fst_default_cache_gc\fR: type = bool, default = true
.IP
Enable garbage collection of cache
.HP
\fB\-\-fst_default_cache_gc_limit\fR: type = int64, default = 1048576
.IP
Cache byte size that triggers garbage collection
.HP
\fB\-\-fst_read_mode\fR: type = string, default = "read"
.IP
Default file reading mode for mappable files
.HP
\fB\-\-fst_verify_properties\fR: type = bool, default = false
.IP
Verify FST properties queried by TestProperties
.HP
\fB\-\-save_relabel_ipairs\fR: type = string, default = ""
.IP
Save input relabel pairs to file
.HP
\fB\-\-save_relabel_opairs\fR: type = string, default = ""
.IP
Save output relabel pairs to file
.PP
.HP
\fB\-\-end_symbol\fR: type = string, default = ""
.IP
Class label for sentence end
.HP
\fB\-\-start_symbol\fR: type = string, default = ""
.IP
Class label for sentence start
.PP
.HP
\fB\-\-fst_compat_symbols\fR: type = bool, default = true
.IP
Require symbol tables to match when appropriate
.HP
\fB\-\-fst_field_separator\fR: type = string, default = " "
.IP
Set of characters used as a separator between printed fields
.PP
.HP
\fB\-\-fst_error_fatal\fR: type = bool, default = true
.IP
FST errors are fatal; otherwise return objects flagged as bad: e.g., FSTs: kError property set, FST weights: not a Member()
.HP
\fB\-\-ngram_error_fatal\fR: type = bool, default = true
.IP
NGram errors are fatal; otherwise return objects flagged as bad: e.g., NGramModel::Error() returns true.
.PP
.HP
\fB\-\-fst_weight_parentheses\fR: type = string, default = ""
.IP
Characters enclosing the first weight of a printed composite weight (e.g., pair weight, tuple weight and derived classes) to ensure proper I/O of nested composite weights; must have size 0 (none) or 2 (open and close parenthesis)
.HP
\fB\-\-fst_weight_separator\fR: type = string, default = ","
.IP
Character separator between printed composite weights; must be a single character