forked from aojiaotage/text-censor
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathindex.js
More file actions
81 lines (67 loc) · 1.61 KB
/
index.js
File metadata and controls
81 lines (67 loc) · 1.61 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
const fs = require('fs')
// Location of the keyword list: a file named "keywords" in this module's directory.
const path = `${__dirname}/keywords`;
// Root node of the keyword trie; addWord() fills it and filter() walks it.
let map = new Map();
// Stream the keyword file as text so it can be consumed line by line.
const keywordStream = fs.createReadStream(path, { encoding: 'UTF-8' });
let lineReader = require('readline').createInterface({ input: keywordStream });
// Every non-empty line of the file is registered as one sensitive word.
lineReader.on('line', (line) => {
  if (line) {
    addWord(line);
  }
});
/**
 * Registers a sensitive word in the shared keyword trie (`map`).
 *
 * Each UTF-16 code unit of `word` becomes one level of nested Maps. The node
 * reached after the last unit is flagged with the 'isEnd' key so that lookups
 * can tell a complete word apart from a mere prefix of a longer word.
 *
 * Empty strings and non-string values are ignored.
 *
 * @param {string} word - Keyword to add.
 * @returns {void}
 */
let addWord = word => {
  // Without this guard an empty word would flag the trie root itself as a
  // terminal node, leaving a stray 'isEnd' entry among the first-character keys.
  if (typeof word !== 'string' || word.length === 0) {
    return;
  }
  let node = map;
  // Index-based on purpose: filter() walks its input one code unit at a time,
  // so the trie has to be keyed the same way.
  for (let i = 0; i < word.length; i++) {
    const unit = word[i];
    let child = node.get(unit);
    if (child === undefined) {
      child = new Map();
      node.set(unit, child);
    }
    node = child;
  }
  node.set('isEnd', true);
};
/**
 * Resolves with the keyword trie once the line reader has emitted 'close',
 * i.e. after the keywords file has been consumed.
 *
 * The 'close' listener is attached exactly once, while this module is being
 * evaluated, and every call shares the same promise. Attaching it lazily per
 * call had two problems: a call made after the reader had already closed would
 * wait for an event that never comes again, and every pending call added one
 * more listener to the reader.
 *
 * @param {*} [s] - Unused; accepted only so existing call sites keep working.
 * @returns {Promise<Map>} Promise for the shared trie (`map`).
 */
let getMap = (() => {
  // Created at module load, before the reader has had a chance to finish,
  // so the single 'close' event cannot be missed.
  const loaded = new Promise((resolve) => {
    lineReader.once('close', () => resolve(map));
  });
  return async s => loaded;
})();
/**
 * Replaces every sensitive word found in `s` with asterisks, one '*' per
 * UTF-16 code unit of the match.
 *
 * At each start position the keyword trie is walked from its root and the
 * longest keyword beginning there is masked. Masking is done by position, so:
 *  - a keyword that ends exactly at the end of the input is censored too;
 *  - overlapping keywords are masked in full;
 *  - keywords are matched literally, never interpreted as regular expressions.
 *
 * If the trie already holds entries it is used as it is; otherwise the call
 * waits for getMap().
 *
 * @param {string} s - Text to censor.
 * @returns {Promise<string>} The censored text. Non-string or empty input is
 *   returned unchanged.
 */
let filter = async s => {
  if (typeof s !== 'string' || s.length === 0) {
    return s;
  }
  const root = map.size > 0 ? map : await getMap();
  // Exclusive end index of the furthest-reaching match found so far; every
  // position below it belongs to at least one sensitive word.
  let maskEnd = 0;
  const out = [];
  for (let start = 0; start < s.length; start++) {
    // Each start position gets a fresh walk from the trie root.
    let node = root;
    for (let j = start; j < s.length; j++) {
      node = node.get(s[j]);
      if (node === undefined) {
        break;
      }
      // Keep walking after a hit so the longest keyword at this start wins.
      if (node.get('isEnd') && j + 1 > maskEnd) {
        maskEnd = j + 1;
      }
    }
    out.push(start < maskEnd ? '*' : s[start]);
  }
  return out.join('');
};
module.exports = {
addWord,
filter
}