build-cdn-download-conf.ts 3.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293
  1. import path from 'node:path';
  2. import { fetchRemoteTextByLine, readFileIntoProcessedArray } from './lib/fetch-text-by-line';
  3. import { HostnameTrie } from './lib/trie';
  4. import { task } from './trace';
  5. import { SHARED_DESCRIPTION } from './constants/description';
  6. import { appendArrayInPlace } from './lib/append-array-in-place';
  7. import { SOURCE_DIR } from './constants/dir';
  8. import { DomainsetOutput } from './lib/create-file';
  9. import { CRASHLYTICS_WHITELIST } from './constants/reject-data-source';
  10. import { appendSetElementsToArray } from 'foxts/append-set-elements-to-array';
  11. const getS3OSSDomainsPromise = (async (): Promise<Set<string>> => {
  12. const trie = new HostnameTrie();
  13. for await (const line of await fetchRemoteTextByLine('https://publicsuffix.org/list/public_suffix_list.dat', true)) {
  14. trie.add(line);
  15. }
  16. /**
  17. * Extract OSS domain from publicsuffix list
  18. */
  19. const S3OSSDomains = new Set<string>();
  20. trie.find('.amazonaws.com').forEach((line: string) => {
  21. if (
  22. (line.startsWith('s3-') || line.startsWith('s3.'))
  23. && !line.includes('cn-')
  24. ) {
  25. S3OSSDomains.add('.' + line);
  26. }
  27. });
  28. trie.find('.scw.cloud').forEach((line: string) => {
  29. if (
  30. (line.startsWith('s3-') || line.startsWith('s3.'))
  31. && !line.includes('cn-')
  32. ) {
  33. S3OSSDomains.add('.' + line);
  34. }
  35. });
  36. trie.find('sakurastorage.jp').forEach((line: string) => {
  37. if (
  38. (line.startsWith('s3-') || line.startsWith('s3.'))
  39. ) {
  40. S3OSSDomains.add('.' + line);
  41. }
  42. });
  43. return S3OSSDomains;
  44. })();
  45. export const buildCdnDownloadConf = task(require.main === module, __filename)(async (span) => {
  46. const [
  47. S3OSSDomains,
  48. cdnDomainsList,
  49. downloadDomainSet,
  50. steamDomainSet
  51. ] = await Promise.all([
  52. getS3OSSDomainsPromise,
  53. readFileIntoProcessedArray(path.join(SOURCE_DIR, 'domainset/cdn.conf')),
  54. readFileIntoProcessedArray(path.join(SOURCE_DIR, 'domainset/download.conf')),
  55. readFileIntoProcessedArray(path.join(SOURCE_DIR, 'domainset/game-download.conf'))
  56. ]);
  57. // Move S3 domains to download domain set, since S3 files may be large
  58. appendSetElementsToArray(downloadDomainSet, S3OSSDomains);
  59. appendArrayInPlace(downloadDomainSet, steamDomainSet);
  60. // we have whitelisted the crashlytics domain, and we also want to put it in CDN policy
  61. appendArrayInPlace(cdnDomainsList, CRASHLYTICS_WHITELIST);
  62. return Promise.all([
  63. new DomainsetOutput(span, 'cdn')
  64. .withTitle('Sukka\'s Ruleset - CDN Domains')
  65. .withDescription([
  66. ...SHARED_DESCRIPTION,
  67. '',
  68. 'This file contains object storage and static assets CDN domains.'
  69. ])
  70. .addFromDomainset(cdnDomainsList)
  71. .write(),
  72. new DomainsetOutput(span, 'download')
  73. .withTitle('Sukka\'s Ruleset - Large Files Hosting Domains')
  74. .withDescription([
  75. ...SHARED_DESCRIPTION,
  76. '',
  77. 'This file contains domains for software updating & large file hosting.'
  78. ])
  79. .addFromDomainset(downloadDomainSet)
  80. .write()
  81. ]);
  82. });