Browse Source

feat: added filtered Top100 SemRush sites as scraper

master
Denis Thiessen 6 months ago
parent
commit
7571165f54
  1. 102
      websites.json

102
websites.json

@ -0,0 +1,102 @@
[
"google.com",
"youtube.com",
"facebook.com",
"wikipedia.org",
"twitter.com",
"instagram.com",
"reddit.com",
"duckduckgo.com",
"amazon.com",
"yahoo.com",
"tiktok.com",
"weather.com",
"yahoo.co.jp",
"bing.com",
"fandom.com",
"whatsapp.com",
"yandex.ru",
"openai.com",
"archiveofourown.org",
"microsoftonline.com",
"twitch.tv",
"microsoft.com",
"linkedin.com",
"live.com",
"netflix.com",
"quora.com",
"t.me",
"pixiv.net",
"office.com",
"vk.com",
"livedoor.jp",
"bit.ly",
"globo.com",
"webpkgcache.com",
"imdb.com",
"animeflv.net",
"youtu.be",
"aliexpress.com",
"cnn.com",
"nytimes.com",
"pinterest.com",
"github.com",
"uol.com.br",
"ebay.com",
"amazon.co.jp",
"discord.com",
"marca.com",
"apple.com",
"spotify.com",
"msn.com",
"sharepoint.com",
"espn.com",
"dailymail.co.uk",
"bbc.com",
"canva.com",
"indeed.com",
"syosetu.com",
"zoom.us",
"mail.ru",
"bbc.co.uk",
"paypal.com",
"naver.com",
"amazon.in",
"x.com",
"accuweather.com",
"noodlemagazine.com",
"foxnews.com",
"hanime.tv",
"samsung.com",
"dzen.ru",
"mangadex.org",
"mediafire.com",
"goo.gl",
"9gag.com",
"wordpress.com",
"rakuten.co.jp",
"mangago.me",
"amazon.de",
"dailymotion.com",
"theguardian.com",
"booking.com",
"sxyprn.com",
"roblox.com",
"etsy.com",
"appsflyer.com",
"as.com",
"mangakakalot.com",
"adjust.com",
"fanfiction.net",
"amazon.co.uk",
"steampowered.com",
"4chan.org",
"imgur.com",
"page.link",
"adobe.com",
"temu.com",
"fmoviesz.to",
"app.link",
"ign.com",
"animesuge.to"
]
Loading…
Cancel
Save