build-microsoft-cdn.ts 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475
  1. import { task } from './trace';
  2. import { SHARED_DESCRIPTION } from './constants/description';
  3. import { createMemoizedPromise } from './lib/memo-promise';
  4. import { RulesetOutput } from './lib/rules/ruleset';
  5. import Worktank from 'worktank';
  6. const pool = new Worktank({
  7. name: 'build-internal-reverse-chn-cidr',
  8. size: 1,
  9. timeout: 10000, // The maximum number of milliseconds to wait for the result from the worker, if exceeded the worker is terminated and the execution promise rejects
  10. warmup: true,
  11. autoterminate: 30000, // The interval of milliseconds at which to check if the pool can be automatically terminated, to free up resources, workers will be spawned up again if needed
  12. env: {},
  13. methods: {
  14. // eslint-disable-next-line object-shorthand -- workertank
  15. getMicrosoftCdnRuleset: async function (importMetaUrl: string): Promise<[domains: string[], domainSuffixes: string[]]> {
  16. // TODO: createRequire is a temporary workaround for https://github.com/nodejs/node/issues/51956
  17. const { default: module } = await import('node:module');
  18. const __require = module.createRequire(importMetaUrl);
  19. const { HostnameSmolTrie } = __require('./lib/trie');
  20. const { PROBE_DOMAINS, DOMAINS, DOMAIN_SUFFIXES, BLACKLIST } = __require('./constants/microsoft-cdn') as typeof import('./constants/microsoft-cdn');
  21. const { fetchRemoteTextByLine } = __require('./lib/fetch-text-by-line') as typeof import('./lib/fetch-text-by-line');
  22. const { appendArrayInPlace } = __require('foxts/append-array-in-place') as typeof import('foxts/append-array-in-place');
  23. const { extractDomainsFromFelixDnsmasq } = __require('./lib/parse-dnsmasq') as typeof import('./lib/parse-dnsmasq');
  24. const trie = new HostnameSmolTrie();
  25. for await (const line of await fetchRemoteTextByLine('https://raw.githubusercontent.com/felixonmars/dnsmasq-china-list/master/accelerated-domains.china.conf')) {
  26. const domain = extractDomainsFromFelixDnsmasq(line);
  27. if (domain) {
  28. trie.add(domain);
  29. }
  30. }
  31. // remove blacklist domain from trie, to prevent them from being included in the later dump
  32. BLACKLIST.forEach(black => trie.whitelist(black));
  33. const domains: string[] = DOMAINS;
  34. const domainSuffixes = appendArrayInPlace(PROBE_DOMAINS.flatMap(domain => trie.find(domain)), DOMAIN_SUFFIXES);
  35. return [domains, domainSuffixes] as const;
  36. }
  37. }
  38. });
  39. export const getMicrosoftCdnRulesetPromise = createMemoizedPromise<[domains: string[], domainSuffixes: string[]]>(async () => {
  40. const res = await pool.exec(
  41. 'getMicrosoftCdnRuleset',
  42. [import.meta.url]
  43. );
  44. pool.terminate();
  45. return res;
  46. });
  47. export const buildMicrosoftCdn = task(require.main === module, __filename)(async (span) => {
  48. const description = [
  49. ...SHARED_DESCRIPTION,
  50. '',
  51. 'This file contains Microsoft\'s domains using their China mainland CDN servers.',
  52. '',
  53. 'Data from:',
  54. ' - https://github.com/felixonmars/dnsmasq-china-list'
  55. ];
  56. const [domains, domainSuffixes] = await span.traceChildPromise('get microsoft cdn domains', getMicrosoftCdnRulesetPromise());
  57. return new RulesetOutput(span, 'microsoft_cdn', 'non_ip')
  58. .withTitle('Sukka\'s Ruleset - Microsoft CDN')
  59. .withDescription(description)
  60. .bulkAddDomain(domains)
  61. .bulkAddDomainSuffix(domainSuffixes)
  62. .write();
  63. });