From 7571165f54ac45e850d0103fa6a85bcac6d2cbcf Mon Sep 17 00:00:00 2001 From: Denis Thiessen Date: Wed, 8 May 2024 21:21:17 +0200 Subject: [PATCH] feat: added filtered Top100 SemRush sites as scraper --- websites.json | 102 ++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 102 insertions(+) create mode 100644 websites.json diff --git a/websites.json b/websites.json new file mode 100644 index 0000000..02a869a --- /dev/null +++ b/websites.json @@ -0,0 +1,102 @@ +[ +"google.com", +"youtube.com", +"facebook.com", +"wikipedia.org", +"twitter.com", +"instagram.com", +"reddit.com", +"duckduckgo.com", +"amazon.com", +"yahoo.com", +"tiktok.com", +"weather.com", +"yahoo.co.jp", +"bing.com", +"fandom.com", +"whatsapp.com", +"yandex.ru", +"openai.com", +"archiveofourown.org", +"microsoftonline.com", +"twitch.tv", +"microsoft.com", +"linkedin.com", +"live.com", +"netflix.com", +"quora.com", +"t.me", +"pixiv.net", +"office.com", +"vk.com", +"livedoor.jp", +"bit.ly", +"globo.com", +"webpkgcache.com", +"imdb.com", +"animeflv.net", +"youtu.be", +"aliexpress.com", +"cnn.com", +"nytimes.com", +"pinterest.com", +"github.com", +"uol.com.br", +"ebay.com", +"amazon.co.jp", +"discord.com", +"marca.com", +"apple.com", +"spotify.com", +"msn.com", +"sharepoint.com", +"espn.com", +"dailymail.co.uk", +"bbc.com", +"canva.com", +"indeed.com", +"syosetu.com", +"zoom.us", +"mail.ru", +"bbc.co.uk", +"paypal.com", +"naver.com", +"amazon.in", +"x.com", +"accuweather.com", +"noodlemagazine.com", +"foxnews.com", +"hanime.tv", +"samsung.com", +"dzen.ru", +"mangadex.org", +"mediafire.com", +"goo.gl", +"9gag.com", +"wordpress.com", +"rakuten.co.jp", +"mangago.me", +"amazon.de", +"dailymotion.com", +"theguardian.com", +"booking.com", +"sxyprn.com", +"roblox.com", +"etsy.com", +"appsflyer.com", +"as.com", +"mangakakalot.com", +"adjust.com", +"fanfiction.net", +"amazon.co.uk", +"steampowered.com", +"4chan.org", +"imgur.com", +"page.link", +"adobe.com", +"temu.com", +"fmoviesz.to", +"app.link", +"ign.com", +"animesuge.to" +] \ No newline at end of file