1 // fstcompile.cc 2 3 // Licensed under the Apache License, Version 2.0 (the "License"); 4 // you may not use this file except in compliance with the License. 5 // You may obtain a copy of the License at 6 // 7 // http://www.apache.org/licenses/LICENSE-2.0 8 // 9 // Unless required by applicable law or agreed to in writing, software 10 // distributed under the License is distributed on an "AS IS" BASIS, 11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 // See the License for the specific language governing permissions and 13 // limitations under the License. 14 // 15 // Copyright 2005-2010 Google, Inc. 16 // Author: riley (at) google.com (Michael Riley) 17 // Modified: jpr (at) google.com (Jake Ratkiewicz) to use FstClass 18 // 19 // \file 20 // Creates binary FSTs from simple text format used by AT&T 21 // (see http://www.research.att.com/projects/mohri/fsm/doc4/fsm.5.html). 22 23 #include <fst/script/compile.h> 24 25 DEFINE_bool(acceptor, false, "Input in acceptor format"); 26 DEFINE_string(arc_type, "standard", "Output arc type"); 27 DEFINE_string(fst_type, "vector", "Output FST type"); 28 DEFINE_string(isymbols, "", "Input label symbol table"); 29 DEFINE_string(osymbols, "", "Output label symbol table"); 30 DEFINE_string(ssymbols, "", "State label symbol table"); 31 DEFINE_bool(keep_isymbols, false, "Store input label symbol table with FST"); 32 DEFINE_bool(keep_osymbols, false, "Store output label symbol table with FST"); 33 DEFINE_bool(keep_state_numbering, false, "Do not renumber input states"); 34 DEFINE_bool(allow_negative_labels, false, 35 "Allow negative labels (not recommended; may cause conflicts)"); 36 37 int main(int argc, char **argv) { 38 namespace s = fst::script; 39 using fst::istream; 40 using fst::ifstream; 41 using fst::SymbolTable; 42 43 string usage = "Creates binary FSTs from simple text format.\n\n Usage: "; 44 usage += argv[0]; 45 usage += " [text.fst [binary.fst]]\n"; 46 47 std::set_new_handler(FailedNewHandler); 48 SetFlags(usage.c_str(), &argc, &argv, true); 49 if (argc > 3) { 50 ShowUsage(); 51 return 1; 52 } 53 54 const char *source = "standard input"; 55 istream *istrm = &std::cin; 56 if (argc > 1 && strcmp(argv[1], "-") != 0) { 57 source = argv[1]; 58 istrm = new fst::ifstream(argv[1]); 59 if (!*istrm) { 60 LOG(ERROR) << argv[0] << ": Open failed, file = " << argv[1]; 61 return 1; 62 } 63 } 64 const SymbolTable *isyms = 0, *osyms = 0, *ssyms = 0; 65 66 if (!FLAGS_isymbols.empty()) { 67 isyms = SymbolTable::ReadText(FLAGS_isymbols, FLAGS_allow_negative_labels); 68 if (!isyms) exit(1); 69 } 70 71 if (!FLAGS_osymbols.empty()) { 72 osyms = SymbolTable::ReadText(FLAGS_osymbols, FLAGS_allow_negative_labels); 73 if (!osyms) exit(1); 74 } 75 76 if (!FLAGS_ssymbols.empty()) { 77 ssyms = SymbolTable::ReadText(FLAGS_ssymbols); 78 if (!ssyms) exit(1); 79 } 80 81 string dest = argc > 2 ? argv[2] : ""; 82 83 s::CompileFst(*istrm, source, dest, FLAGS_fst_type, FLAGS_arc_type, 84 isyms, osyms, ssyms, 85 FLAGS_acceptor, FLAGS_keep_isymbols, FLAGS_keep_osymbols, 86 FLAGS_keep_state_numbering, FLAGS_allow_negative_labels); 87 88 if (istrm != &std::cin) 89 delete istrm; 90 91 return 0; 92 } 93