/
dictcompress.cpp
executable file
·54 lines (40 loc) · 1.24 KB
/
dictcompress.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#include <algorithm>
#include <fstream>
#include <iostream>
#include <set>
#include <sstream>
#include <string>
#include <utility>
#include <vector>
using namespace std;
/**
 * Condenses a dictionary file into one "<word1> <word2> <pinyin>" record per entry.
 *
 * Reads "cedict_tsbackup.u8" line by line and writes "cedict_ts.u8". For every
 * non-comment line the first two whitespace-separated tokens and the text
 * between the first '[' and the following ']' are written, separated by single
 * spaces; everything else on the line is dropped.
 *
 * Lines starting with '#', blank lines, and lines without a "[...]" section are
 * skipped (the latter with a warning on stderr).
 *
 * NOTE(review): the original code named the first token "simp" and the second
 * "trad"; the CC-CEDICT format presumably lists traditional first, so neutral
 * names are used here. Output order is unchanged (first token, then second).
 *
 * Returns 0 on success, 1 if either file cannot be opened.
 */
int main(){
    const std::string finname("cedict_tsbackup.u8");
    const std::string foutname = "cedict_ts.u8";

    // Open (and verify) the input before touching the output, so that a missing
    // input file does not truncate an existing output file.
    std::ifstream fin(finname.c_str());
    if (!fin) {
        std::cerr << "error: cannot open input file " << finname << '\n';
        return 1;
    }
    std::ofstream fout(foutname.c_str());
    if (!fout) {
        std::cerr << "error: cannot open output file " << foutname << '\n';
        return 1;
    }

    // Holds, for every emitted entry whose two words differ, the pair in
    // REVERSED order (second, first). A later line is dropped when its own
    // (first, second) pair is found here, i.e. when it mirrors an earlier entry.
    // NOTE(review): this asymmetry is carried over unchanged from the original
    // code; an exact repeat of a line is NOT filtered. Confirm this is intended.
    std::set< std::pair<std::string, std::string> > mirroredPairs;

    // Testing the result of getline itself avoids processing a phantom empty
    // line after the last real one (the old `while (fin.good())` loop did).
    std::string line;
    while (std::getline(fin, line)) {
        // Skip blank lines and comments.
        if (line.empty() || line[0] == '#')
            continue;

        // The first two whitespace-separated tokens are the two word forms.
        std::istringstream linestream(line);
        std::string first, second;
        linestream >> first >> second;

        // Locate the bracketed pinyin section. Without both brackets the
        // substr arithmetic below would wrap around, so reject such lines.
        const std::string::size_type obracket = line.find('[');
        const std::string::size_type cbracket =
            (obracket == std::string::npos) ? std::string::npos
                                            : line.find(']', obracket + 1);
        if (cbracket == std::string::npos) {
            std::cerr << "warning: skipping line without [pinyin]: " << line << '\n';
            continue;
        }

        if (first != second) {
            if (mirroredPairs.count(std::make_pair(first, second)) != 0)
                continue;
            mirroredPairs.insert(std::make_pair(second, first));
        }

        // Write both word forms followed by the pinyin (brackets stripped).
        fout << first << " " << second << " "
             << line.substr(obracket + 1, cbracket - obracket - 1) << '\n';
    }
    return 0;
}