-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathstat.js
56 lines (53 loc) · 1.28 KB
/
stat.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
var fs = require('fs')
// Input data, read synchronously at start-up.
// Line-oriented files are split on /\r?\n/ rather than '\n' so that a file
// saved with CRLF line endings does not leave a stray '\r' glued to the last
// field of every line.
const LINE_BREAK = /\r?\n/
// Kept as one raw string; it is consumed character by character.
const dutizi = fs.readFileSync('dutizi.txt', 'utf8')
const chailines = fs.readFileSync('chaizi/chaizi-jt.txt', 'utf-8').split(LINE_BREAK)
const tophz = fs.readFileSync('tophz.txt', 'utf8').split(LINE_BREAK)
// dutizi
// Lookup table: every character that occurs in `dutizi` is mapped to 1.
// NOTE(review): "dutizi" presumably means characters that are not decomposed
// further — confirm against the data file.
const dtz = {}
// Iterate by code point (for...of) instead of by UTF-16 index, so that a
// character outside the Basic Multilingual Plane is stored whole rather than
// as two lone surrogate halves that no lookup could ever match.
for (const ch of dutizi) {
  dtz[ch] = 1
}
/**
 * Looks a character up in the `dtz` table.
 *
 * @param {string} ch - Key to look up.
 * @returns {*} The value stored under `ch` in `dtz`, or `undefined` when the
 *   table has no such entry. Callers rely on its truthiness.
 */
function isDtz(ch) {
  const entry = dtz[ch]
  return entry
}
// chaizi
// Decomposition table built from `chailines`. Each usable line is
// tab-separated: the first field becomes the key and the second field, split
// on single spaces, becomes the list of components. Any further fields are
// ignored, and lines with fewer than two fields are skipped.
const chaizi = {}
chailines
  .map(row => row.split('\t'))
  .filter(fields => fields.length >= 2)
  .forEach(([hanzi, pieces]) => {
    chaizi[hanzi] = pieces.split(' ')
  })
// top hanzi
// Running totals, keyed by component.
const partCount = {}

/**
 * Adds `c` to the running total kept for `z` in `partCount`.
 * When the current total is missing or falsy, it is replaced by `c`.
 *
 * @param {string} z - Key whose total is updated.
 * @param {number} c - Amount to add.
 */
function addCount(z, c) {
  const current = partCount[z]
  partCount[z] = current ? current + c : c
}
// Tally component counts over the leading lines of `tophz`.
// At most the first 2000 lines are read; the bound is clamped to the real
// line count so a shorter file no longer throws on an undefined line.
const lineLimit = Math.min(2000, tophz.length)
for (let i = 0; i < lineLimit; i++) {
  const line = tophz[i]
  // Lines starting with '//' are skipped as comments.
  if (line.startsWith('//')) continue
  const fields = line.split('\t')
  // The second field is the character and the third its count. Blank or
  // truncated lines (such as the empty string after a trailing newline) have
  // neither, and would otherwise add an "undefined" key with a NaN total.
  if (fields.length < 3 || !fields[1]) continue
  const z = fields[1]
  const count = Number(fields[2])
  // A non-numeric count would poison the running total with NaN.
  if (!Number.isFinite(count)) continue
  // A character flagged by isDtz, or one with no chaizi entry, is counted as
  // itself; otherwise its count is credited to each of its listed components.
  const pieces = !isDtz(z) && chaizi[z] ? chaizi[z] : [z]
  for (const piece of pieces) {
    addCount(piece, count)
  }
}
// sort
// Flatten the totals into [part, count] pairs and order them by count,
// highest first. The array is sorted once after all pairs are collected,
// instead of being re-sorted after every single insertion.
const parts = Object.entries(partCount)
parts.sort((a, b) => b[1] - a[1])
// Output: one "part<TAB>count" row per line, with no trailing newline.
fs.writeFileSync('top_parts.txt', parts.map(([part, count]) => `${part}\t${count}`).join('\n'))