Provided by: libngram-tools_1.3.2-3_amd64 bug

NAME

       ngramcount - Count n-grams from an input file.

DESCRIPTION

       Count n-grams from an input file.

SYNOPSIS

       ngramcount [--options] [in.far [out.fst]]

OPTIONS

       --alpha: type = double, default = 1

              Weight for first FST

       --backoff_label: type = int64, default = 0

              Backoff label

       --beta: type = double, default = 1

              Weight for second (and subsequent) FST(s)

       --check_consistency: type = bool, default = false

              Check model consistency

       --context_pattern: type = string, default = ""

              Pattern of contexts to count

       --epsilon_as_backoff: type = bool, default = false

              Treat epsilon in the input Fsts as backoff

       --method: type = string, default = "counts"

              One of: "counts", "histograms", "count_of_counts", "count_of_histograms"

       --norm_eps: type = double, default = 0.001

              Normalization check epsilon

       --normalize: type = bool, default = false

              Normalize resulting model

       --order: type = int64, default = 3

              Set maximal order of ngrams to be counted

       --output_fst: type = bool, default = true

              Output counts as fst (otherwise strings)

       --require_symbols: type = bool, default = true

              Require symbol tables? (default: yes)

       --round_to_int: type = bool, default = false

              Round all counts to integers

       --help: type = bool, default = false

              show usage information

       --helpshort: type = bool, default = false

              show brief usage information

       --tmpdir: type = string, default = "/tmp"

              temporary directory

       --v: type = int32, default = 0

              verbosity level

       --fst_align: type = bool, default = false

              Write FST data aligned where appropriate

       --fst_default_cache_gc: type = bool, default = true

              Enable garbage collection of cache

       --fst_default_cache_gc_limit: type = int64, default = 1048576

              Cache byte size that triggers garbage collection

       --fst_read_mode: type = string, default = "read"

              Default file reading mode for mappable files

       --fst_verify_properties: type = bool, default = false

              Verify FST properties queried by TestProperties

       --save_relabel_ipairs: type = string, default = ""

              Save input relabel pairs to file

       --save_relabel_opairs: type = string, default = ""

              Save output relabel pairs to file

       --end_symbol: type = string, default = "</s>"

              Class label for sentence end

       --start_symbol: type = string, default = "<s>"

              Class label for sentence start

       --fst_compat_symbols: type = bool, default = true

              Require symbol tables to match when appropriate

       --fst_field_separator: type = string, default = "      "

              Set of characters used as a separator between printed fields

       --fst_error_fatal: type = bool, default = true

              FST errors are fatal; otherwise, return objects flagged as bad: e.g., FSTs: kError
              property set, FST weights: not a Member()

       --ngram_error_fatal: type = bool, default = true

              NGram errors are fatal; otherwise, return objects flagged as bad: e.g.,
              NGramModel::Error() returns true.

       --fst_weight_parentheses: type = string, default = ""

              Characters  enclosing  the  first  weight of a printed composite weight (e.g., pair
              weight, tuple weight and derived classes) to ensure proper I/O of nested  composite
              weights; must have size 0 (none) or 2 (open and close parenthesis)

       --fst_weight_separator: type = string, default = ","

              Character separator between printed composite weights; must be a single character