-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrussify.js
80 lines (58 loc) · 1.36 KB
/
russify.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
const Az = require('az');
const forms = require('./forms');
function getAdjective(tag, adjective = null) {
let form = [];
form.push(tag.NMbr);
if (tag.NMbr === 'sing') {
form.push(tag.GNdr);
}
form.push(tag.CAse);
let key = form.join(':');
// Find key in forms
if (forms.hasOwnProperty(key)) {
adjective = forms[key];
}
return adjective;
}
function getMorph(token, pos) {
let morph = Az.Morph(token.toString());
if (morph[0] && morph[0].tag.POS === pos) {
return morph[0];
}
return false;
}
function updateWord(tokens, i) {
// Get token morph
let morph = getMorph(tokens[i], 'NOUN');
// Get token
let token = tokens[i].toString();
// Check if current word is noun first
if (!morph || tokens[i].firstUpper) {
return token;
}
// Get adjective
let adjective = getAdjective(morph.tag, null);
if (adjective === null) {
return token;
}
// Check prev tokens
for (let k = i - 1; k >= 0; k--) {
// Break on word
if (tokens[k].type === Az.Tokens.WORD) {
// Check if prev word is adjective
if (getMorph(tokens[k], 'ADJF')) {
adjective = null;
}
break;
}
// Break on new sentence
if (tokens[k].toString() === '.') {
break;
}
}
if (adjective) {
token = `<ins>${adjective} </ins>${token}`;
}
return token;
}
module.exports = updateWord;