build-microsoft-cdn.ts 3.2 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970
  1. import { task } from './trace';
  2. import { SHARED_DESCRIPTION } from './constants/description';
  3. import { RulesetOutput } from './lib/rules/ruleset';
  4. import Worktank from 'worktank';
  5. import { RULES } from './constants/microsoft-cdn';
  6. const pool = new Worktank({
  7. pool: {
  8. name: 'get-microsoft-cdn',
  9. size: 1 // The number of workers to keep in the pool, if more workers are needed they will be spawned up to this limit
  10. },
  11. worker: {
  12. autoAbort: 10000,
  13. autoTerminate: 30000, // The interval of milliseconds at which to check if the pool can be automatically terminated, to free up resources, workers will be spawned up again if needed
  14. autoInstantiate: true,
  15. methods: {
  16. // eslint-disable-next-line object-shorthand -- workertank
  17. getMicrosoftCdnRuleset: async function (__filename: string): Promise<[domains: string[], domainSuffixes: string[]]> {
  18. // TODO: createRequire is a temporary workaround for https://github.com/nodejs/node/issues/51956
  19. const { default: module } = await import('node:module');
  20. const __require = module.createRequire(__filename);
  21. const { HostnameSmolTrie } = __require('./lib/trie');
  22. const { PROBE_DOMAINS, DOMAINS, DOMAIN_SUFFIXES, BLACKLIST } = __require('./constants/microsoft-cdn') as typeof import('./constants/microsoft-cdn');
  23. const { fetchRemoteTextByLine } = __require('./lib/fetch-text-by-line') as typeof import('./lib/fetch-text-by-line');
  24. const { appendArrayInPlace } = __require('foxts/append-array-in-place') as typeof import('foxts/append-array-in-place');
  25. const { extractDomainsFromFelixDnsmasq } = __require('./lib/parse-dnsmasq') as typeof import('./lib/parse-dnsmasq');
  26. const trie = new HostnameSmolTrie();
  27. for await (const line of await fetchRemoteTextByLine('https://raw.githubusercontent.com/felixonmars/dnsmasq-china-list/master/accelerated-domains.china.conf')) {
  28. const domain = extractDomainsFromFelixDnsmasq(line);
  29. if (domain) {
  30. trie.add(domain);
  31. }
  32. }
  33. // remove blacklist domain from trie, to prevent them from being included in the later dump
  34. BLACKLIST.forEach(black => trie.whitelist(black));
  35. const domains: string[] = DOMAINS;
  36. const domainSuffixes = appendArrayInPlace(PROBE_DOMAINS.flatMap(domain => trie.find(domain)), DOMAIN_SUFFIXES);
  37. return [domains, domainSuffixes] as const;
  38. }
  39. }
  40. }
  41. });
  42. export const getMicrosoftCdnRulesetPromise = pool.exec(
  43. 'getMicrosoftCdnRuleset',
  44. [__filename]
  45. ).finally(() => pool.terminate());
  46. export const buildMicrosoftCdn = task(require.main === module, __filename)(async (span) => {
  47. const [domains, domainSuffixes] = await span.traceChildPromise('get microsoft cdn domains', getMicrosoftCdnRulesetPromise);
  48. return new RulesetOutput(span, 'microsoft_cdn', 'non_ip')
  49. .withTitle('Sukka\'s Ruleset - Microsoft CDN')
  50. .appendDescription(SHARED_DESCRIPTION)
  51. .appendDescription(
  52. '',
  53. 'This file contains Microsoft\'s domains using their China mainland CDN servers.'
  54. )
  55. .addFromRuleset(RULES)
  56. .appendDataSource('https://github.com/felixonmars/dnsmasq-china-list')
  57. .bulkAddDomain(domains)
  58. .bulkAddDomainSuffix(domainSuffixes)
  59. .write();
  60. });