diff --git a/factory/resultant/top500_direct.list b/factory/resultant/top500_direct.list index 8dd2b70..48e26b4 100644 --- a/factory/resultant/top500_direct.list +++ b/factory/resultant/top500_direct.list @@ -1,4 +1,4 @@ -# top500 direct list update time: 2018-07-21 10:47:06 +# top500 direct list update time: 2018-11-06 10:09:53 163.com 1688.com 1905.com @@ -23,12 +23,8 @@ aliexpress.com alipay.com allegro.pl amazon.ca -amazon.co.jp -amazon.co.uk -amazon.com -amazon.fr +amazon.es amazon.in -amazon.it amazonaws.com ameblo.jp americanexpress.com @@ -82,6 +78,7 @@ dcinside.com dell.com detail.tmall.com detik.com +deviantart.com dictionary.com digikala.com diply.com @@ -109,18 +106,18 @@ fedex.com feedly.com fiverr.com fivethirtyeight.com -flickr.com flipkart.com +forbes.com force.com foxnews.com free.fr freepik.com gearbest.com -gfycat.com giphy.com github.com github.io gizmodo.com +globaloffers.link globo.com gmx.net go.com @@ -135,7 +132,6 @@ hatena.ne.jp hatenablog.com hdfcbank.com hespress.com -hola.com homedepot.com hotstar.com hp.com @@ -155,6 +151,7 @@ infusionsoft.com instructure.com intuit.com iqiyi.com +irctc.co.in isanalyze.com iwanttodeliver.com jd.com @@ -214,8 +211,6 @@ pandora.com paypal.com paytm.com php.net -pinimg.com -pixabay.com popads.net popcash.net poptm.com @@ -223,7 +218,6 @@ putlocker.is qiita.com qq.com quizlet.com -quora.com rakuten.co.jp rambler.ru rarbg.to @@ -233,6 +227,7 @@ researchgate.net roblox.com rt.com rutracker.org +sabah.com.tr salesforce.com samsung.com savefrom.net @@ -284,9 +279,9 @@ tudou.com tutorialspoint.com twitch.tv udemy.com +uol.com.br uploaded.net ups.com -uptodown.com upwork.com usatoday.com usps.com @@ -301,7 +296,6 @@ weather.com web.de weblio.jp webmd.com -webtretho.com weebly.com weibo.com wellsfargo.com diff --git a/factory/resultant/top500_proxy.list b/factory/resultant/top500_proxy.list index 4a6d1ca..8242d6e 100644 --- a/factory/resultant/top500_proxy.list +++ b/factory/resultant/top500_proxy.list @@ -1,9 +1,13 @@ -# top500 proxy list update time: 2018-07-21 10:47:06 +# top500 proxy list update time: 2018-11-06 10:09:53 123movies.to 4shared.com adnetworkperformance.com +amazon.co.jp +amazon.co.uk +amazon.com amazon.de -amazon.es +amazon.fr +amazon.it archive.org ask.com bbc.co.uk @@ -22,7 +26,6 @@ bp.blogspot.com chaturbate.com cloudfront.net dailymotion.com -deviantart.com disqus.com doubleclick.net dropbox.com @@ -33,14 +36,14 @@ facebook.com fbcdn.net fc2.com files.wordpress.com -forbes.com -globaloffers.link +flickr.com +gfycat.com goo.gl hclips.com +hola.com hootsuite.com hurriyet.com.tr instagram.com -irctc.co.in livedoor.jp ltn.com.tw media.tumblr.com @@ -52,14 +55,16 @@ microsoftonline.com nyaa.se nytimes.com ozock.com +pinimg.com pinterest.com +pixabay.com pixnet.net pornhub.com +quora.com reddituploads.com redtube.com reuters.com ruten.com.tw -sabah.com.tr scribd.com shutterstock.com slack.com @@ -76,9 +81,10 @@ tumblr.com twimg.com twitter.com txxx.com -uol.com.br upornia.com +uptodown.com vimeo.com +webtretho.com whatsapp.com wordpress.com wsj.com diff --git a/factory/top500.py b/factory/top500.py index b1ce8b7..25de071 100644 --- a/factory/top500.py +++ b/factory/top500.py @@ -99,10 +99,10 @@ class DomainScaner(threading.Thread): is_proxy = False try: - requests.get('http://' + domain, timeout=10, headers=requests_header) + requests.get('http://www.' + domain, timeout=10, headers=requests_header) except BaseException: try: - requests.get('http://www.' + domain, timeout=10, headers=requests_header) + requests.get('http://' + domain, timeout=10, headers=requests_header) except BaseException: is_proxy = True