diff --git a/config/source_log.csv b/config/source_log.csv index 13806510d..b8bbc2ae9 100644 --- a/config/source_log.csv +++ b/config/source_log.csv @@ -2333,4 +2333,3 @@ Timestamp,Source,Item,Raw Count,Final Count,Whitelisted,Dead,Parked,Toplist,Quer 09:58:31 09-12-24,dnstwist,,11,11,0,0,0,0,,saved 09:58:31 09-12-24,Regex,,4103,4080,21,0,0,1,,saved 10:07:47 09-12-24,Regex,,1,1,0,0,0,0,,saved -16:36:16 09-12-24,Internet Storm Center,,41,18,1,0,0,12,,saved diff --git a/data/pending/domains_isc.tmp b/data/pending/domains_isc.tmp deleted file mode 100644 index a6fb1a9d9..000000000 --- a/data/pending/domains_isc.tmp +++ /dev/null @@ -1,22 +0,0 @@ -171.107 -178.159.43.149 -193.222 -193.222.99.121 -85.217 -85.217.171.107 -99.121 -botman.pro -bottap.ru -btcbot.cc -duda.com.ua -eth0.me -gift-bnb -gogetsms -gogetsms.com -jambler.io -sambot.ru -stk-ms.ru -tbiz -tbiz.pro -tgmaster.xyz -token-mining.org diff --git a/data/raw.txt b/data/raw.txt index f9ca24b26..2d8384f2a 100644 --- a/data/raw.txt +++ b/data/raw.txt @@ -19267,8 +19267,6 @@ babgmxnets-mail86f9365fd400845787e836ba90b7746a09612f95d678975.square.site babieskleidung.com babolatfr.top babolattennisgearhub48.shop -baboon-tg-web-app-v2.onrender -baboon-tg-web-app-v2.onrender.com babooundefinedzfyvdi.blogspot.com babxcqvn.shop baby-seat-store.anneise.com @@ -46209,7 +46207,6 @@ ducksinarowct.com duckybabe.com ducoduckgo.com ductamyoutube.com -duda.com dudjemamsnejdkwsi.weebly.com duduba.ba duecancelacionorcraftsmanship.weebly.com @@ -50554,7 +50551,6 @@ exchange-coinbase.com exchange-crypto.ru exchange-crypto.us exchange-owa-mail-reathenticate.vercel.app -exchange-pool.com exchange-smoky-tau.vercel.app exchange.add-solution.de exchange.choicecorp.net @@ -50964,7 +50960,6 @@ express-partners.com express-sporing.net express-upsdelivery.eu express.courierserv.com -express12.com express247delivery.net expressbaselogistics.com expressbtdsgr.top @@ -55618,8 +55613,6 @@ freeacymall.shop freealo.com freeantivirusprotection.com freeantivirusprotection.pro -freeapi.bot-t -freeapi.bot-t.com freebiefrenzy-amazon.com freebitcoin.auction freebitcoin.shop @@ -58849,7 +58842,6 @@ gifnest.com gifonmzao.shop gift-99.top gift-binance.com -gift-bnb.org gift-box-shop.com gift-box-shop.onshopbase.com gift-card-arbitragea-apple.today @@ -81102,7 +81094,6 @@ juzihongle.pages.dev juzzsupport.web.app jv9p75-8080.csb.app jvamatak.com -jvault.xyz jvgpb1unt.top jvh211.duckdns.org jvhggyhuhhj.weebly.com @@ -82129,7 +82120,6 @@ keyholder.live keyiflendiren-yenilikler-hizmetinizde-daima-yaninda.com keynesdigitalmarketing.com keyrecon.kolotas.top -keys.neovpn keyste-one.top keystone-armorystore.com keystonerealestateinvestments.com @@ -101411,8 +101401,6 @@ myspotifymusic.freewebhostmost.com myspotifysongs.vip mysql.home.elasticsearch-production.yovip.net mysql.yadustudio.highclassacademia.com -mystars-hk.syllix -mystars-hk.syllix.io mystarstoreusa.top mystart-crypto.com mystart-crypto.icu @@ -104812,7 +104800,6 @@ ninng-moilerdate-sdesstk.glitch.me ninorleo.lol nintendoswitchgame.com ninw.asia -niolic.com nionalat-onven.dsmtp.com niotchvote.vercel.app nipponkodostorestore.shop @@ -126703,7 +126690,6 @@ santanderpayment.com santanderpod.globalizeme-dublin2.co.uk santanderprivate.co.uk santanmac.com -santasol.fun sante-assurance-ameli.com sante-assurance-maladie.org sante-gestion-info.fr @@ -137215,8 +137201,6 @@ static-selfies-407469.framer.app static.binance-taxs.com static.eusstore.com static.onpsummer.com -static.tgcube -static.tgcube.store staticpopdiscountshop.com statics2024.freewebhostmost.com statintinx.shop @@ -137283,7 +137267,6 @@ stealthymarketingmama.com steam-crypto.com steam-store.xiaohuanya.top steam-store.yusheng433.com -steam-up.ru steam.aus-iget.com steam.communitysharedfile.com steam.communityworkshopfiles.com @@ -154394,7 +154377,6 @@ umber-lark-kb2rrx.mystrikingly.com umber-peach-kdws36.mystrikingly.com umbertoravelli.fr umbrella.2efyvrzn.publicvm.com -umbrella.day umbrella.k7bprksw.publicvm.com umbrellacockatooforsale.com umbrosoldes.fr diff --git a/data/raw_light.txt b/data/raw_light.txt index 9452e20a2..6781e4a22 100644 --- a/data/raw_light.txt +++ b/data/raw_light.txt @@ -1265,8 +1265,6 @@ b2kmjunit.com b2secops.co.uk b8yxmetpg0uns.pages.dev b9inance.com -baboon-tg-web-app-v2.onrender -baboon-tg-web-app-v2.onrender.com babybeans.shop babyclothstore.xyz babys-toys.com @@ -3872,7 +3870,6 @@ duckdzckgo.com duckruckgo.com duckybabe.com ducoduckgo.com -duda.com duduba.ba duetschecredit.com dukesfishingsupply.com @@ -4407,7 +4404,6 @@ excelttsv.top exceltwlg.top exchagestels.info exchagestels.top -exchange-pool.com exchangtels.today exchangtels.top exchtestcheckingapi.azurewebsites.net @@ -4444,7 +4440,6 @@ expreshipment.top expreshsipment.top expresipment.top express-fuhrerschein.com -express12.com expressbtdsgr.top expressdeliveryairservice.com expressdriverslicense.ca @@ -4874,8 +4869,6 @@ freaky-fitness.com fredsalezx.shop freeactbat.com freeacymall.shop -freeapi.bot-t -freeapi.bot-t.com freedailyanalysis.com freedomammoco.com freedomyields.com @@ -5157,7 +5150,6 @@ gianniandsantaniellolaw.com giantsmainecoons.wixsite.com giaseva.com gidredy.com -gift-bnb.org gift-box-shop.com gift-box-shop.onshopbase.com gift-te-shop.com @@ -7604,7 +7596,6 @@ juvkahrhwaii.shop juxincai.top juyuantiancheng.shop juzfiity.shop -jvault.xyz jwilliamsattorneys.com jwskuw.biz jwskuw.love @@ -7691,7 +7682,6 @@ kexcet.com keyesden.com keyholder.live keyrecon.kolotas.top -keys.neovpn kfyuuspsnx.com kgbdq.ltd kght3n.shop @@ -9153,8 +9143,6 @@ myrepairunder100.com myreservation.top myriama.com myspostjv.cyou -mystars-hk.syllix -mystars-hk.syllix.io mysteryboxprojss.on.fleek.co mysterymint81.vercel.app mysterymint89.vercel.app @@ -9391,7 +9379,6 @@ nilibili.com nilkrgwegniture.shop nimberous.com nimbleglib.com -niolic.com niscey.com niteconfgnights.shop nitroways.com @@ -11583,7 +11570,6 @@ sanjinshop.com sanjinyneksa.com sanmatrade.com sanmsung.net -santasol.fun santhisukham.com sapuppyheaven.co.za saqueindeniza.com @@ -12448,8 +12434,6 @@ startdis.shop startransitlogistics.com starxpresslogs.com statealliantbank.com -static.tgcube -static.tgcube.store stayible.com stayyoung01.com stb-trustsave.com @@ -12457,7 +12441,6 @@ stciasa.ink stcseasa.ink steaanncommunity.ru steady-salmiakki-2bf1ce.netlify.app -steam-up.ru steam.tappalm.com steamcammunity.com steamcommmunity.ru @@ -14258,7 +14241,6 @@ ultimatestakers.org ultra-connect.co.za ultracleanmasters.com ultragolfcarts-sa.co.za -umbrella.day umbrellacockatooforsale.com umvct.ancientan.buzz unboxingmega.com diff --git a/data/root_domains.txt b/data/root_domains.txt index ec3dd6b38..0ad9dee70 100644 --- a/data/root_domains.txt +++ b/data/root_domains.txt @@ -3437,7 +3437,6 @@ giantztool.com gidawm.majesticbank.de gidredy.com giencoe.com -gift-bnb.org gift-te-shop.com gift10800cpfree.com giftcard-mania.org diff --git a/data/subdomains.txt b/data/subdomains.txt index 158b31f06..70040ce54 100644 --- a/data/subdomains.txt +++ b/data/subdomains.txt @@ -4082,7 +4082,6 @@ www.ghtcfz.blogspot.md www.giantztool.com www.gidawm.majesticbank.de www.gidredy.com -www.gift-bnb.org www.gift-te-shop.com www.gift10800cpfree.com www.giftozoom.com diff --git a/scripts/retrieve_domains.sh b/scripts/retrieve_domains.sh index f75770bf3..9c3a94e42 100644 --- a/scripts/retrieve_domains.sh +++ b/scripts/retrieve_domains.sh @@ -31,9 +31,21 @@ readonly DOMAIN_DASH_REGEX='[[:alnum:].-]+-[[:alnum:]-]+' readonly STRICT_DOMAIN_REGEX='[[:alnum:]][[:alnum:].-]+\.[[:alnum:]-]*[a-z]{2,}[[:alnum:]-]*' readonly -a SOURCES=( - - source_isc - + source_aa419 + source_dnstwist + source_emerging_threats + source_fakewebshoplisthun + source_guntab + source_jeroengui_phishing + source_jeroengui_scam + source_manual + source_phishstats + source_phishstats_nrd + source_regex + source_scamadviser + source_scamdirectory + source_stopgunscams + source_google_search ) # Function 'source' calls on the respective functions of each source to @@ -646,15 +658,6 @@ source_guntab() { # Note results are not sorted by time added } -source_isc() { - source='Internet Storm Center' - results_file='data/pending/domains_isc.tmp' - - url='https://isc.sans.edu/diaryarchive.html' - curl -sSZ --retry 2 --retry-all-errors "${url}" \ - | grep -oE "$DOMAIN_REGEX" | grep '\[\.\]' > "$results_file" -} - source_jeroengui_phishing() { source='Jeroengui phishing' ignore_from_light=true