Skip to content

Commit 28d7680

Browse files
authored
Merge pull request #204 from Cerberus98/new_domains_list
Updates the corrector email list
2 parents 27f3d56 + ad65343 commit 28d7680

File tree

1 file changed

+82
-78
lines changed

1 file changed

+82
-78
lines changed

flanker/addresslib/corrector.py

Lines changed: 82 additions & 78 deletions
Original file line number | Diff line number | Diff line change
@@ -30,177 +30,191 @@ def suggest(word, cutoff=0.77):
3030
return guess[0]
3131
return word
3232

33-
3433
MOST_COMMON_DOMAINS = [
3534
# mailgun :)
3635
'mailgun.net',
37-
# big esps
36+
# The Top 200 domains from 30mm open events gathered during the
37+
# last 30 days prior to 8/22/2018
38+
'126.com',
3839
'163.com',
40+
'account.tradeshift.com',
3941
'aim.com',
42+
'airwallex.com',
4043
'alice.it',
41-
'aol.co.uk',
44+
'ameritech.net',
45+
'anz.com',
4246
'aol.com',
47+
'apple.com',
48+
'asu.edu',
4349
'att.net',
44-
'azet.sk',
50+
'bain.com',
4551
'bell.net',
4652
'bellsouth.net',
53+
'berkeley.edu',
4754
'bigpond.com',
4855
'bigpond.com.au',
4956
'bigpond.net.au',
57+
'bk.ru',
5058
'bluewin.ch',
51-
'blueyonder.co.uk',
5259
'bol.com.br',
5360
'btinternet.com',
54-
'btopenworld.com',
55-
'cableone.net',
56-
'centrum.sk',
5761
'centurylink.net',
58-
'centurytel.net',
62+
'cfl.rr.com',
63+
'charter.com',
5964
'charter.net',
65+
'citi.com',
66+
'colemanrg.com',
67+
'columbia.edu',
6068
'comcast.net',
69+
'compass.com',
70+
'cornell.edu',
6171
'cox.net',
62-
'cs.com',
72+
'cpp.edu',
73+
'cytonn.com',
74+
'deloitte.com',
75+
'det.nsw.edu.au',
76+
'docomo.ne.jp',
6377
'earthlink.net',
64-
'email.com',
65-
'email.cz',
66-
'email.it',
78+
'edumail.vic.gov.au',
79+
'eim.ae',
80+
'email.arizona.edu',
6781
'embarqmail.com',
82+
'emirates.net.ae',
6883
'excite.com',
69-
'fastwebnet.it',
84+
'exploretrip.com',
85+
'ext.uber.com',
86+
'ezweb.ne.jp',
7087
'free.fr',
71-
'freemail.hu',
7288
'freenet.de',
7389
'frontier.com',
7490
'frontiernet.net',
7591
'fuse.net',
92+
'g.austincc.edu',
93+
'ge.com',
7694
'gmail.com',
7795
'gmx.at',
78-
'gmx.ch',
7996
'gmx.com',
8097
'gmx.de',
8198
'gmx.net',
8299
'google.com',
83100
'googlemail.com',
101+
'gs.com',
102+
'guest.booking.com',
84103
'hanmail.net',
85-
'home.nl',
86-
'hotmail.be',
87104
'hotmail.ca',
88105
'hotmail.co.jp',
89106
'hotmail.co.nz',
90107
'hotmail.co.uk',
91108
'hotmail.com',
92-
'hotmail.com.ar',
93109
'hotmail.com.au',
94110
'hotmail.de',
95111
'hotmail.es',
96112
'hotmail.fr',
97-
'hotmail.gr',
98113
'hotmail.it',
99-
'hotmail.nl',
100-
'hotmail.no',
101-
'hotmail.se',
102-
'hughes.net',
114+
'i.softbank.jp',
103115
'icloud.com',
104116
'iinet.net.au',
105-
'inbox.lv',
106117
'inbox.ru',
107-
'interia.pl',
118+
'indeedemail.com',
119+
'internationalsos.com',
120+
'internode.on.net',
121+
'iprimus.com.au',
122+
'jhu.edu',
123+
'jtbap.com',
108124
'juno.com',
125+
'kw.com',
109126
'laposte.net',
110127
'libero.it',
128+
'limetray.com',
111129
'list.ru',
112-
'live.be',
113130
'live.ca',
114131
'live.co.uk',
115132
'live.com',
116-
'live.com.ar',
117133
'live.com.au',
118-
'live.com.mx',
119-
'live.de',
120-
'live.dk',
121134
'live.fr',
122-
'live.it',
123135
'live.nl',
124-
'live.no',
125-
'live.se',
136+
'lynk.co.in',
126137
'mac.com',
127138
'mail.com',
128139
'mail.ru',
140+
'marketplace.amazon.com',
141+
'marriott.com',
142+
'mavs.uta.edu',
143+
'mchsi.com',
144+
'mckinsey.com',
129145
'me.com',
130-
'microsoft.com',
146+
'mergermarket.com',
131147
'mindspring.com',
148+
'montaportal.nl',
132149
'msn.com',
150+
'msu.edu',
133151
'naver.com',
152+
'nc.rr.com',
134153
'netscape.net',
135-
'netspace.net.au',
136-
'netzero.com',
137-
'netzero.net',
138-
'neuf.fr',
139-
'nhs.net',
140154
'ntlworld.com',
141-
'o2.pl',
142-
'online.no',
143-
'optimum.net',
144155
'optonline.net',
145156
'optusnet.com.au',
146157
'orange.fr',
147-
'ostrovok.ru',
158+
'ou.edu',
148159
'outlook.com',
149160
'outlook.com.au',
150-
'outlook.de',
151-
'outlook.es',
152-
'outlook.fr',
153-
'outlook.it',
161+
'ozemail.com.au',
154162
'pacbell.net',
155-
'planet.nl',
163+
'paisabazaar.com',
164+
'pegipegi.com',
156165
'prodigy.net',
157-
'prodigy.net.mx',
158-
'protonmail.com',
166+
'ptd.net',
167+
'pwc.com',
159168
'q.com',
169+
'qiniu.com',
160170
'qq.com',
161171
'rambler.ru',
162-
'reagan.com',
163-
'rediffmail.com',
172+
'rev.com',
164173
'roadrunner.com',
165174
'rocketmail.com',
166175
'rogers.com',
176+
'rothschild.com',
177+
'royallepage.ca',
178+
'sasktel.net',
179+
'savaari.com',
167180
'sbcglobal.net',
168181
'seznam.cz',
169182
'sfr.fr',
170183
'shaw.ca',
171184
'sky.com',
172185
'skynet.be',
186+
'springspa.com',
187+
'stanford.edu',
188+
'student.sbccd.edu',
173189
'suddenlink.net',
174190
'swbell.net',
175191
'sympatico.ca',
176192
't-online.de',
177-
'talktalk.net',
178-
'telefonica.net',
193+
'tampabay.rr.com',
179194
'telenet.be',
180-
'telfort.nl',
181195
'telia.com',
182196
'telus.net',
183-
'telusplanet.net',
184-
'tiscali.co.uk',
185-
'tiscali.it',
186-
'ukr.net',
197+
'terra.com.br',
198+
'tpg.com.au',
199+
'twc.com',
200+
'umich.edu',
201+
'umn.edu',
187202
'uol.com.br',
188-
'usa.net',
203+
'usc.edu',
204+
'utexas.edu',
205+
'uw.edu',
189206
'vepl.com',
190207
'verizon.net',
191208
'videotron.ca',
192-
'virgilio.it',
193-
'virgin.net',
194-
'virginmedia.com',
209+
'vt.edu',
195210
'wanadoo.fr',
196211
'web.de',
197-
'windowslive.com',
212+
'westnet.com.au',
213+
'wi.rr.com',
198214
'windstream.net',
199215
'wp.pl',
200-
'xs4all.nl',
201216
'xtra.co.nz',
202217
'y7mail.com',
203-
'ya.ru',
204218
'yahoo.ca',
205219
'yahoo.co.id',
206220
'yahoo.co.in',
@@ -213,24 +227,14 @@ def suggest(word, cutoff=0.77):
213227
'yahoo.com.br',
214228
'yahoo.com.hk',
215229
'yahoo.com.mx',
216-
'yahoo.com.my',
217-
'yahoo.com.ph',
218230
'yahoo.com.sg',
219231
'yahoo.com.tw',
220232
'yahoo.de',
221233
'yahoo.es',
222234
'yahoo.fr',
223-
'yahoo.gr',
224-
'yahoo.ie',
225-
'yahoo.in',
226235
'yahoo.it',
227-
'yahoo.no',
228-
'yahoo.se',
229-
'yandex.com',
230236
'yandex.ru',
231-
'ymail.com',
232-
'ziggo.nl',
233-
'zoominternet.net'
237+
'ymail.com'
234238
]
235239

236240
# domains that the corrector doesn't fix that we should fix

0 commit comments

Comments
 (0)