-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathslang.go
More file actions
64 lines (61 loc) · 1 KB
/
slang.go
File metadata and controls
64 lines (61 loc) · 1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
package chopstick
import "regexp"
// slangs lists the Korean slang/profanity fragments that SlangSimilarity
// compares the preprocessed input against. Each entry appears exactly once;
// a repeated entry would only cost an extra comparison without changing the
// maximum score.
var slangs = []string{
	"개",
	"걸레",
	"년",
	"놈",
	"느금마",
	"닥쳐",
	"등신",
	"또라이",
	"미친",
	"멍청",
	"병신",
	"새끼",
	"썅",
	"시발",
	"씨발",
	"씨팔",
	"썖",
	"씹",
	"에미",
	"애미",
	"애비",
	"에비",
	"염병",
	"옘병",
	"좆",
	"좃",
	"좇",
	"지랄",
	"창",
	"호로",
	"후레",
	"호구",
	"후장",
}
// nonHangulPattern matches every character outside the precomposed Hangul
// syllable range 가-힣. It is compiled once at package scope so that
// SlangSimilarity does not pay the compilation cost on every call.
var nonHangulPattern = regexp.MustCompile("[^가-힣]")

// SlangSimilarity returns similarity of string with slang.
//
// The input is first reduced to its Hangul syllables (everything else is
// removed). If the reduced text scores above 0.4 against any entry of
// exceptions, the function returns 0. Otherwise it returns the highest
// Similarity score between the reduced text and the entries of slangs.
//
// The result is documented as a float number between 0 and 1; the actual
// range is determined by Similarity, which is defined elsewhere.
func SlangSimilarity(str string, exceptions []string) float64 {
	// NOTE(review): the rune slice is shared across all Similarity calls;
	// this assumes Similarity does not modify its arguments — confirm.
	cleaned := []rune(nonHangulPattern.ReplaceAllString(str, ""))

	// An allow-listed phrase short-circuits the whole check.
	for _, e := range exceptions {
		if Similarity(cleaned, []rune(e)) > 0.4 {
			return 0
		}
	}

	// Track the running maximum instead of collecting every score first.
	var best float64
	for _, s := range slangs {
		if score := Similarity([]rune(s), cleaned); score >= best {
			best = score
		}
	}
	return best
}