https://github.com/vsiivola/variKN
Raw File
Tip revision: c525568ed62fddfb0351946efe049c4e9ead9ddf authored by Vesa Siivola on 16 January 2014, 08:27:59 UTC
Implement leave-one-out estimates for the discounts. If optimization corpus is not set, use these estimates. Also, initialize numerical search for the parameters with these values. In the latter case, preliminary tests seem to indicate that better accuracy is reached than with the original heuristic search start point.
Tip revision: c525568
arpa2bin.cc
#include "conf.hh"
#include "io.hh"
#include "TreeGramArpaReader.hh"

int main (int argc, char **argv) {
  conf::Config config;
  config("Usage: arpa2bin arpa_in bin_out\nConverts arpa LMs to binary.\n");
  config.parse(argc,argv,2);
  
  io::Stream::verbose=true;
  io::Stream in(config.arguments[0], "r");
  io::Stream out(config.arguments[1], "w");

  TreeGramArpaReader areader;
  TreeGram ng;
  
  fprintf(stderr,"Reading\n");
  areader.read(in.file,&ng);
  in.close();

  if (ng.get_type() == NGram::INTERPOLATED) {
    fprintf(stderr, "Converting to backoff\n");
    ng.convert_to_backoff();
  }

  fprintf(stderr,"Writing\n");
  ng.write(out.file, true);
  out.close();
}
back to top