-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathshrink_my_tweet.py
103 lines (95 loc) · 2.48 KB
/
shrink_my_tweet.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
""" A simple tweet text shrinker """
import re
num_subs = {
'1': r"(one|\bwon)\b",
'2': r"\b(to+|two)\b",
'3': r"(three)",
'4': r"((ph|f)oa?u?re?)",
'5': r"(five)\b",
'6': r"(six)\b",
'7': r"(seven)\b",
'8': r"(eight\b|ate(?:ly)\b|ait\b)",
'9': r"(nine)\b",
'0': r"(zero)"
}
general = {
'&': r'(and)',
'@': r'\b(at)\b',
'yw': r'((you(\')?re?|ur) welcome)',
'wtf': r'(what the fuck)',
'wth': r'(what the he(ll|ck))',
'wo': r'(with out)',
'w': r'(with)',
'we': r'(what(\s)?ever)',
'gtg': r'(got to go)',
'bbl': r'(be back later)',
'til': r'(today I learned)',
'thx': r'(thanks)',
'ty': r'(thank you)',
'tbh': r'(to be honest)',
'x': r'(cks)',
'sup': r'(wh?at(\')?s?(\s)?up)',
'rl': r'(real+)',
'srs': r'(serious)',
'ppl': r'(people)',
'plz': r'(please)',
'pov': r'(point of view)',
'oyo': r'(on your own)',
'omg': r'(oh my go(d|sh))',
'nm': r'(not(hing)? much)',
'ne': r'(any)',
'mgmt': r'(management)',
'ez': r'(easy)',
'cu': r'(see you)',
'ba': r'(bad(\s)+ass)',
'bc': r'(because)',
'dis': r'(this)',
'lyk': r'(like)',
'wat': r'(what)',
'b': r'(be)',
'c': r'(see)',
'g': r'(gee)',
'k': r'\b(o?k+(ay)?)',
'o': r'(oh+)',
'p': r'(pee+)',
'x': r'(ex)',
'y': r'(why)',
'z': r'(the+)',
'u': r'(you)',
'r': r'(are)',
'tho': r'(though)',
'n': r'(in)',
'ya': r'(ye?ah?)',
# '�': r'(cc)',
# '㎳': r'(ms)',
# '㎱': r'(ns)',
# '㎰': r'(ps)',
# '�': r'(in)',
# 'ʪ': r'(ls)',
# '�': r'(fi)',
# 'ѹ': r'(oy)',
# 'â…±': r'(ii)',
# 'â…º': r'(xi)',
# 'nj': r'(nj)',
# '.': r'(\. )',
}
def init():
""" Initialize and compile regex patterns """
global num_subs, general
for k, v in general.items():
general[k] = re.compile(v, re.IGNORECASE)
for k, v in num_subs.items():
num_subs[k] = re.compile(v, re.IGNORECASE)
def fix(tweet):
""" Fix the tweet to be smaller """
old_len = len(tweet)
for k, v in num_subs.items():
tweet = v.sub(k, tweet)
for k, v in general.items():
tweet = v.sub(k, tweet)
return tweet, old_len-len(tweet)
init()
while True:
tweet = input('Tweet: ')
tweet, saved = fix(tweet)
print("\nSaved "+str(saved)+":", tweet, "\n")