build-microsoft-cdn.ts 3.3 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071
  1. import { task } from './trace';
  2. import { SHARED_DESCRIPTION } from './constants/description';
  3. import { once } from 'foxts/once';
  4. import { RulesetOutput } from './lib/rules/ruleset';
  5. import Worktank from 'worktank';
  6. const pool = new Worktank({
  7. name: 'build-internal-reverse-chn-cidr',
  8. size: 1,
  9. timeout: 10000, // The maximum number of milliseconds to wait for the result from the worker, if exceeded the worker is terminated and the execution promise rejects
  10. warmup: true,
  11. autoterminate: 30000, // The interval of milliseconds at which to check if the pool can be automatically terminated, to free up resources, workers will be spawned up again if needed
  12. env: {},
  13. methods: {
  14. // eslint-disable-next-line object-shorthand -- workertank
  15. getMicrosoftCdnRuleset: async function (importMetaUrl: string): Promise<[domains: string[], domainSuffixes: string[]]> {
  16. // TODO: createRequire is a temporary workaround for https://github.com/nodejs/node/issues/51956
  17. const { default: module } = await import('node:module');
  18. const __require = module.createRequire(importMetaUrl);
  19. const { HostnameSmolTrie } = __require('./lib/trie');
  20. const { PROBE_DOMAINS, DOMAINS, DOMAIN_SUFFIXES, BLACKLIST } = __require('./constants/microsoft-cdn') as typeof import('./constants/microsoft-cdn');
  21. const { fetchRemoteTextByLine } = __require('./lib/fetch-text-by-line') as typeof import('./lib/fetch-text-by-line');
  22. const { appendArrayInPlace } = __require('foxts/append-array-in-place') as typeof import('foxts/append-array-in-place');
  23. const { extractDomainsFromFelixDnsmasq } = __require('./lib/parse-dnsmasq') as typeof import('./lib/parse-dnsmasq');
  24. const trie = new HostnameSmolTrie();
  25. for await (const line of await fetchRemoteTextByLine('https://raw.githubusercontent.com/felixonmars/dnsmasq-china-list/master/accelerated-domains.china.conf')) {
  26. const domain = extractDomainsFromFelixDnsmasq(line);
  27. if (domain) {
  28. trie.add(domain);
  29. }
  30. }
  31. // remove blacklist domain from trie, to prevent them from being included in the later dump
  32. BLACKLIST.forEach(black => trie.whitelist(black));
  33. const domains: string[] = DOMAINS;
  34. const domainSuffixes = appendArrayInPlace(PROBE_DOMAINS.flatMap(domain => trie.find(domain)), DOMAIN_SUFFIXES);
  35. return [domains, domainSuffixes] as const;
  36. }
  37. }
  38. });
  39. export const getMicrosoftCdnRulesetPromise = once<Promise<[domains: string[], domainSuffixes: string[]]>>(async () => {
  40. const res = await pool.exec(
  41. 'getMicrosoftCdnRuleset',
  42. [import.meta.url]
  43. );
  44. pool.terminate();
  45. return res;
  46. });
  47. export const buildMicrosoftCdn = task(require.main === module, __filename)(async (span) => {
  48. const [domains, domainSuffixes] = await span.traceChildPromise('get microsoft cdn domains', getMicrosoftCdnRulesetPromise());
  49. return new RulesetOutput(span, 'microsoft_cdn', 'non_ip')
  50. .withTitle('Sukka\'s Ruleset - Microsoft CDN')
  51. .appendDescription(SHARED_DESCRIPTION)
  52. .appendDescription(
  53. '',
  54. 'This file contains Microsoft\'s domains using their China mainland CDN servers.'
  55. )
  56. .appendDataSource('https://github.com/felixonmars/dnsmasq-china-list')
  57. .bulkAddDomain(domains)
  58. .bulkAddDomainSuffix(domainSuffixes)
  59. .write();
  60. });