forked from hschwenk/cslm-toolkit
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconv_wl_sort.cpp
60 lines (53 loc) · 2.01 KB
/
conv_wl_sort.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
/*
* This file is part of the continuous space language and translation model toolkit
* for statistical machine translation and large vocabulary speech recognition.
*
* Copyright 2015, Holger Schwenk, LIUM, University of Le Mans, France
*
* The CSLM toolkit is free software; you can redistribute it and/or modify it
* under the terms of the GNU Lesser General Public License version 3 as
* published by the Free Software Foundation
*
* This library is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License
* for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this library; if not, write to the Free Software Foundation,
* Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
*
*
*/
#include "WordList.h"
#include <iostream>
#include <string>
using namespace std;
int main (int argc, char *argv[])
{
if (3 != argc) {
string sProgName(argv[0]);
size_t stEndPath = sProgName.find_last_of("/\\");
cout << "Usage: " << ((stEndPath != string::npos) ? sProgName.substr(stEndPath + 1) : sProgName)
<< " input_word_list output_word_list\n"
<< " Creates a new word list file compatible with stable and unstable sort." << endl;
return 2;
}
WordList wl;
/* open word list file with unstable sort */
cout << "Reading " << argv[1] << flush;
wl.SetSortBehavior(false);
WordList::WordIndex n_words = wl.Read(argv[1]);
cout << ", done." << endl;
/* modify word counts to keep order with stable sort */
cout << "Modifying word counts" << flush;
WordList::const_iterator end = wl.End();
for (WordList::const_iterator ci = wl.Begin() ; ci != end ; ci++)
wl.GetWordInfo(ci->id).n = n_words--;
cout << ", done." << endl;
/* save new word list file */
cout << "Writing " << argv[2] << flush;
wl.Write(argv[2], 3);
cout << ", done." << endl;
return 0;
}