-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathemoticons.py
83 lines (79 loc) · 1.03 KB
/
emoticons.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Created on Mon Jul 24 21:02:22 2017
@author: duc
"""
# A list of emoticons that contain letters or digits and that the
# TweetTokenizer may not recognize.
# Reason: emoticons made up only of punctuation can be removed easily
# without any tokenization, so they are not listed here.
# Emoticon strings, grouped loosely by family (faces with glasses, surprise,
# halo/devil, grins, tongues, misc, hearts). Order and contents are kept
# exactly as before so that any index- or iteration-based caller is unaffected.
#
# NOTE(review): nearly every entry is lowercase (e.g. "xd", ":d", ":p"),
# which suggests the list is matched against lowercased text -- confirm
# against the caller. If that is the case, the two mixed-case entries
# "X-p" and ":S" can never match and should probably be lowercased.
emoticons = [
    # noses / cat faces
    ":-3",
    ":3",
    # glasses
    "8:o)",
    "8=o)",
    "8-)",
    "8)",
    "8=)",
    "b)",
    "b|",
    # surprise
    ":o)",
    ":o",
    ";o",
    "=o",
    ":-o",
    ">:o",
    # halo / devil
    "o:-)",
    "o:)",
    "0:-)",
    "0:)",
    "3:-)",
    "3:)",
    # "c" mouths
    ":c)",
    ":-c",
    ":c",
    # grins
    ":-d",
    ":'d",
    ":d",
    ":dd",
    ":ddd",
    "xd",
    "xdd",
    "xddd",
    "xdddd",
    "xddddd",
    "xdddddd",
    "d-':",
    "d:<",
    "d;",
    "d=",
    "8-d",
    "x-d",
    "=d",
    "=dd",
    "=3",
    "b^d",
    ";d",
    # tongues
    ":p",
    ";p",
    "X-p",
    ":-p",
    ":b",
    ":-b",
    "=b",
    "=p",
    ">:p",
    # misc
    ":l",
    "=l",
    ":S",
    # The backslash is escaped explicitly: a bare "\o" is an invalid escape
    # sequence (a warning today, an error in a future Python version).
    # The runtime value is still the three characters: backslash, "o", "/".
    "\\o/",
    "v.v",
    "o_o",
    "o-o",
    # hearts
    "<3",
    "<33",
    "<333",
    "<3333",
    "</3",
]