1f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
2f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// Licensed under the Apache License, Version 2.0 (the "License");
3f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// you may not use this file except in compliance with the License.
4f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// You may obtain a copy of the License at
5f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson//
6f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson//     http://www.apache.org/licenses/LICENSE-2.0
7f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson//
8f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// Unless required by applicable law or agreed to in writing, software
9f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// distributed under the License is distributed on an "AS IS" BASIS,
10f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
11f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// See the License for the specific language governing permissions and
12f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// limitations under the License.
13f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson//
14f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// Copyright 2005-2010 Google, Inc.
15f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// Author: jpr@google.com (Jake Ratkiewicz)
16f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
17f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson#include <fst/script/text-io.h>
18f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
19f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson#include <cstring>
20f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson#include <sstream>
21f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson#include <utility>
22f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodsonusing std::pair; using std::make_pair;
23f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
24f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson#include <fst/types.h>
25f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson#include <fst/util.h>
26f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
27f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodsonnamespace fst {
28f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodsonnamespace script {
29f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
30f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// Reads vector of weights; returns true on success.
31f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodsonbool ReadPotentials(const string &weight_type,
32f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson                    const string& filename,
33f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson                    vector<WeightClass>* potential) {
34f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  ifstream strm(filename.c_str());
35f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  if (!strm) {
36f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    LOG(ERROR) << "ReadPotentials: Can't open file: " << filename;
37f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    return false;
38f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  }
39f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
40f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  const int kLineLen = 8096;
41f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  char line[kLineLen];
42f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  size_t nline = 0;
43f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
44f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  potential->clear();
45f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  while (strm.getline(line, kLineLen)) {
46f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    ++nline;
47f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    vector<char *> col;
48f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    SplitToVector(line, "\n\t ", &col, true);
49f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    if (col.size() == 0 || col[0][0] == '\0')  // empty line
50f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson      continue;
51f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    if (col.size() != 2) {
52f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson      LOG(ERROR) << "ReadPotentials: Bad number of columns, "
53f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson                 << "file = " << filename << ", line = " << nline;
54f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson      return false;
55f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    }
56f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
57f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    ssize_t s = StrToInt64(col[0], filename, nline, false);
58f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    WeightClass weight(weight_type, col[1]);
59f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
60f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    while (potential->size() <= s)
61f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson      potential->push_back(WeightClass::Zero());
62f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    (*potential)[s] = weight;
63f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  }
64f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  return true;
65f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson}
66f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
67f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson// Writes vector of weights; returns true on success.
68f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodsonbool WritePotentials(const string& filename,
69f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson                     const vector<WeightClass>& potential) {
70dfd8b8327b93660601d016cdc6f29f433b45a8d8Alexander Gutkin  ostream *strm = &cout;
71f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  if (!filename.empty()) {
72f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    strm = new ofstream(filename.c_str());
73f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    if (!*strm) {
74f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson      LOG(ERROR) << "WritePotentials: Can't open file: " << filename;
75f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson      delete strm;
76f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson      return false;
77f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    }
78f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  }
79f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
80f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  strm->precision(9);
81f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  for (ssize_t s = 0; s < potential.size(); ++s)
82f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    *strm << s << "\t" << potential[s] << "\n";
83f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
84f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  if (!*strm)
85f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    LOG(ERROR) << "WritePotentials: Write failed: "
86f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson               << (filename.empty() ? "standard output" : filename);
87f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  bool ret = *strm;
88dfd8b8327b93660601d016cdc6f29f433b45a8d8Alexander Gutkin  if (strm != &cout)
89f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson    delete strm;
90f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson  return ret;
91f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson}
92f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
93f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson
94f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson}  // namespace script
95f4c12fce1ee58e670f9c3fce46c40296ba9ee8a2Ian Hodson}  // namespace fst
96