Browse Source

Update CDN & Reject Hosts

SukkaW 1 year ago
parent
commit
f61804ff51

+ 1 - 0
Build/lib/get-phishing-domains.test.ts

@@ -4,6 +4,7 @@ import { calcDomainAbuseScore } from './get-phishing-domains';
 
 
 describe('sortDomains', () => {
 describe('sortDomains', () => {
   it('nmdj.pl', () => {
   it('nmdj.pl', () => {
+    console.log(calcDomainAbuseScore('.booking-com'));
     console.log(calcDomainAbuseScore('plikgier'));
     console.log(calcDomainAbuseScore('plikgier'));
     console.log(calcDomainAbuseScore('www.addgumtree'));
     console.log(calcDomainAbuseScore('www.addgumtree'));
     console.log(calcDomainAbuseScore('zrz'));
     console.log(calcDomainAbuseScore('zrz'));

+ 21 - 5
Build/lib/get-phishing-domains.ts

@@ -1,7 +1,7 @@
 import { processDomainLists } from './parse-filter';
 import { processDomainLists } from './parse-filter';
 import * as tldts from 'tldts-experimental';
 import * as tldts from 'tldts-experimental';
 
 
-import type { Span } from '../trace';
+import { dummySpan, type Span } from '../trace';
 import { appendArrayInPlaceCurried } from './append-array-in-place';
 import { appendArrayInPlaceCurried } from './append-array-in-place';
 import { PHISHING_DOMAIN_LISTS_EXTRA } from '../constants/reject-data-source';
 import { PHISHING_DOMAIN_LISTS_EXTRA } from '../constants/reject-data-source';
 import { loosTldOptWithPrivateDomains } from '../constants/loose-tldts-opt';
 import { loosTldOptWithPrivateDomains } from '../constants/loose-tldts-opt';
@@ -13,6 +13,7 @@ const BLACK_TLD = new Set([
   'accountant',
   'accountant',
   'autos',
   'autos',
   'bar',
   'bar',
+  'beauty',
   'bid',
   'bid',
   'biz',
   'biz',
   'bond',
   'bond',
@@ -55,10 +56,13 @@ const BLACK_TLD = new Set([
   'live',
   'live',
   'link',
   'link',
   'loan',
   'loan',
+  'lol',
   'ltd',
   'ltd',
+  'me',
   'men',
   'men',
   'ml',
   'ml',
   'mobi',
   'mobi',
+  'mom',
   'net.pl',
   'net.pl',
   'one',
   'one',
   'online',
   'online',
@@ -122,18 +126,24 @@ const sensitiveKeywords = createKeywordFilter([
   'virus-',
   'virus-',
   'icloud-',
   'icloud-',
   'apple-',
   'apple-',
-  'www.apple.',
+  'www.apple',
   '-coinbase',
   '-coinbase',
   'coinbase-',
   'coinbase-',
   'lcloud.',
   'lcloud.',
-  'lcloud-'
+  'lcloud-',
+  'booking-com',
+  'booking.com-',
+  'booking-eu',
+  'vinted-cz',
+  'inpost-pl'
 ]);
 ]);
 const lowKeywords = createKeywordFilter([
 const lowKeywords = createKeywordFilter([
   '-co-jp',
   '-co-jp',
   'customer.',
   'customer.',
   'customer-',
   'customer-',
   '.www-',
   '.www-',
-  'instagram'
+  'instagram',
+  'microsoft'
 ]);
 ]);
 
 
 const cacheKey = createCacheKey(__filename);
 const cacheKey = createCacheKey(__filename);
@@ -198,11 +208,12 @@ export const getPhishingDomains = (parentSpan: Span) => parentSpan.traceChild('g
         || (domainScoreMap[domain] >= 5 && domainCountMap[domain] >= 4)
         || (domainScoreMap[domain] >= 5 && domainCountMap[domain] >= 4)
       )
       )
     ) {
     ) {
-      console.log({ domain });
       domainArr.push(`.${domain}`);
       domainArr.push(`.${domain}`);
     }
     }
   }
   }
 
 
+  // console.log(domainScoreMap['']);
+
   return domainArr;
   return domainArr;
 });
 });
 
 
@@ -252,3 +263,8 @@ export function calcDomainAbuseScore(subdomain: string | null) {
 
 
   return weight;
   return weight;
 }
 }
+
+if (require.main === module) {
+  getPhishingDomains(dummySpan)
+    .catch(console.error);
+}

+ 5 - 0
Source/domainset/cdn.conf

@@ -2156,6 +2156,11 @@ runkit-packages-static-executables.com
 runkit-packages-static.com
 runkit-packages-static.com
 # bilibili.tv
 # bilibili.tv
 pic-bstarstatic.akamaized.net
 pic-bstarstatic.akamaized.net
+# Vinted
+static.vinted.com
+static-assets.vinted.com
+marketplace-web-assets.vinted.com
+images1.vinted.net
 # Others
 # Others
 .ziffstatic.com
 .ziffstatic.com
 .muscache.com
 .muscache.com

+ 9 - 0
Source/domainset/reject_sukka.conf

@@ -322,6 +322,11 @@ inst.360safe.com
 .jdie.pl
 .jdie.pl
 .lumindigitalhosting.com
 .lumindigitalhosting.com
 
 
+.mdy8.skin
+.sfmc-marketing.com
+.sfmc-contentqa.com
+
+
 # --- AD Block ---
 # --- AD Block ---
 
 
 # >> General
 # >> General
@@ -929,6 +934,10 @@ analytics.bytegiftia.top
 .5clo0xmbf.com
 .5clo0xmbf.com
 .k3718qw08.com
 .k3718qw08.com
 .j6t91e89q.com
 .j6t91e89q.com
+.marketingcloudqaops.com
+.marketingcloudqaapis.com
+.cfolks.pl
+.deeplinking.sfmctest.com
 
 
 # >> Alexa
 # >> Alexa
 data.alexa.com
 data.alexa.com