build-speedtest-domainset.ts 7.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272
  1. import { domainDeduper } from './lib/domain-deduper';
  2. import path from 'path';
  3. import { createRuleset } from './lib/create-file';
  4. import { sortDomains } from './lib/stable-sort-domain';
  5. import { Sema } from 'async-sema';
  6. import { getHostname } from 'tldts';
  7. import { task } from './trace';
  8. import { fetchWithRetry } from './lib/fetch-retry';
  9. import { SHARED_DESCRIPTION } from './lib/constants';
  10. import picocolors from 'picocolors';
  11. import { readFileIntoProcessedArray } from './lib/fetch-text-by-line';
  12. import { TTL, deserializeArray, fsFetchCache, serializeArray } from './lib/cache-filesystem';
  13. import { createTrie } from './lib/trie';
  14. const s = new Sema(2);
  15. const latestTopUserAgentsPromise = fsFetchCache.apply(
  16. 'https://cdn.jsdelivr.net/npm/top-user-agents@latest/src/desktop.json',
  17. () => fetchWithRetry('https://cdn.jsdelivr.net/npm/top-user-agents@latest/src/desktop.json')
  18. .then(res => res.json() as Promise<string[]>)
  19. .then((userAgents) => userAgents.filter(ua => ua.startsWith('Mozilla/5.0 '))),
  20. {
  21. serializer: serializeArray,
  22. deserializer: deserializeArray,
  23. ttl: TTL.THREE_DAYS()
  24. }
  25. );
  26. const querySpeedtestApi = async (keyword: string): Promise<Array<string | null>> => {
  27. const topUserAgents = await latestTopUserAgentsPromise;
  28. const url = `https://www.speedtest.net/api/js/servers?engine=js&search=${keyword}&limit=100`;
  29. try {
  30. const randomUserAgent = topUserAgents[Math.floor(Math.random() * topUserAgents.length)];
  31. return await fsFetchCache.apply(
  32. url,
  33. () => s.acquire().then(() => fetchWithRetry(url, {
  34. headers: {
  35. dnt: '1',
  36. Referer: 'https://www.speedtest.net/',
  37. accept: 'application/json, text/plain, */*',
  38. 'User-Agent': randomUserAgent,
  39. 'Accept-Language': 'en-US,en;q=0.9',
  40. ...(randomUserAgent.includes('Chrome')
  41. ? {
  42. 'Sec-Ch-Ua-Mobile': '?0',
  43. 'Sec-Fetch-Dest': 'empty',
  44. 'Sec-Fetch-Mode': 'cors',
  45. 'Sec-Fetch-Site': 'same-origin',
  46. 'Sec-Gpc': '1'
  47. }
  48. : {})
  49. },
  50. signal: AbortSignal.timeout(1000 * 4),
  51. retry: {
  52. retries: 2
  53. }
  54. })).then(r => r.json() as any).then((data: Array<{ url: string, host: string }>) => data.reduce<string[]>(
  55. (prev, cur) => {
  56. const line = cur.host || cur.url;
  57. const hn = getHostname(line, { detectIp: false, validateHostname: true });
  58. if (hn) {
  59. prev.push(hn);
  60. }
  61. return prev;
  62. }, []
  63. )).finally(() => s.release()),
  64. {
  65. ttl: TTL.ONE_WEEK(),
  66. serializer: serializeArray,
  67. deserializer: deserializeArray
  68. }
  69. );
  70. } catch (e) {
  71. console.error(e);
  72. return [];
  73. }
  74. };
  75. export const buildSpeedtestDomainSet = task(import.meta.main, import.meta.path)(async (span) => {
  76. const domainTrie = createTrie(
  77. [
  78. // speedtest.net
  79. '.speedtest.net',
  80. '.speedtestcustom.com',
  81. '.ooklaserver.net',
  82. '.speed.misaka.one',
  83. '.speedtest.rt.ru',
  84. '.speedtest.aptg.com.tw',
  85. '.speedtest.gslnetworks.com',
  86. '.speedtest.jsinfo.net',
  87. '.speedtest.i3d.net',
  88. '.speedtestkorea.com',
  89. '.speedtest.telus.com',
  90. '.speedtest.telstra.net',
  91. '.speedtest.clouvider.net',
  92. '.speedtest.idv.tw',
  93. '.speedtest.frontier.com',
  94. '.speedtest.orange.fr',
  95. '.speedtest.centurylink.net',
  96. '.srvr.bell.ca',
  97. '.speedtest.contabo.net',
  98. 'speedtest.hk.chinamobile.com',
  99. 'speedtestbb.hk.chinamobile.com',
  100. '.hizinitestet.com',
  101. '.linknetspeedtest.net.br',
  102. 'speedtest.rit.edu',
  103. 'speedtest.ropa.de',
  104. 'speedtest.sits.su',
  105. 'speedtest.tigo.cr',
  106. 'speedtest.upp.com',
  107. '.speedtest.pni.tw',
  108. '.speed.pfm.gg',
  109. '.speedtest.faelix.net',
  110. '.speedtest.labixe.net',
  111. '.speedtest.warian.net',
  112. '.speedtest.starhub.com',
  113. '.speedtest.gibir.net.tr',
  114. '.speedtest.ozarksgo.net',
  115. '.speedtest.exetel.com.au',
  116. '.speedtest.sbcglobal.net',
  117. '.speedtest.leaptel.com.au',
  118. '.speedtest.windstream.net',
  119. '.speedtest.vodafone.com.au',
  120. '.speedtest.rascom.ru',
  121. '.speedtest.dchost.com',
  122. '.speedtest.highnet.com',
  123. '.speedtest.seattle.wa.limewave.net',
  124. '.speedtest.optitel.com.au',
  125. '.speednet.net.tr',
  126. '.speedtest.angolacables.co.ao',
  127. '.ookla-speedtest.fsr.com',
  128. '.speedtest.comnet.com.tr',
  129. '.speedtest.gslnetworks.com.au',
  130. '.test.gslnetworks.com.au',
  131. '.speedtest.gslnetworks.com',
  132. '.speedtestunonet.com.br',
  133. '.speedtest.alagas.net',
  134. 'speedtest.surfshark.com',
  135. '.speedtest.aarnet.net.au',
  136. '.ookla.rcp.net',
  137. '.ookla-speedtests.e2ro.com',
  138. '.speedtest.com.sg',
  139. '.ookla.ddnsgeek.com',
  140. '.speedtest.pni.tw',
  141. '.speedtest.cmcnetworks.net',
  142. '.speedtestwnet.com.br',
  143. // Cloudflare
  144. '.speed.cloudflare.com',
  145. // Wi-Fi Man
  146. '.wifiman.com',
  147. '.wifiman.me',
  148. '.wifiman.ubncloud.com',
  149. // Fast.com
  150. '.fast.com',
  151. // MacPaw
  152. 'speedtest.macpaw.com',
  153. // speedtestmaster
  154. '.netspeedtestmaster.com',
  155. // Google Search Result of "speedtest", powered by this
  156. '.measurement-lab.org',
  157. '.measurementlab.net',
  158. // Google Fiber legacy speedtest site (new fiber speedtest use speedtestcustom.com)
  159. '.speed.googlefiber.net',
  160. // librespeed
  161. '.backend.librespeed.org',
  162. // Apple,
  163. 'mensura.cdn-apple.com', // From netQuality command
  164. // OpenSpeedtest
  165. 'open.cachefly.net'
  166. ],
  167. true,
  168. true
  169. );
  170. await span.traceChildAsync(
  171. 'fetch previous speedtest domainset',
  172. async () => {
  173. try {
  174. (
  175. await readFileIntoProcessedArray(path.resolve(import.meta.dir, '../List/domainset/speedtest.conf'))
  176. ) .forEach(line => {
  177. const hn = getHostname(line, { detectIp: false, validateHostname: true });
  178. if (hn) {
  179. domainTrie.add(hn);
  180. }
  181. });
  182. } catch { }
  183. }
  184. );
  185. await new Promise<void>((resolve, reject) => {
  186. const pMap = ([
  187. 'Hong Kong',
  188. 'Taiwan',
  189. 'China Telecom',
  190. 'China Mobile',
  191. 'China Unicom',
  192. 'Japan',
  193. 'Tokyo',
  194. 'Singapore',
  195. 'Korea',
  196. 'Seoul',
  197. 'Canada',
  198. 'Toronto',
  199. 'Montreal',
  200. 'Los Ang',
  201. 'San Jos',
  202. 'Seattle',
  203. 'New York',
  204. 'Dallas',
  205. 'Miami',
  206. 'Berlin',
  207. 'Frankfurt',
  208. 'London',
  209. 'Paris',
  210. 'Amsterdam',
  211. 'Moscow',
  212. 'Australia',
  213. 'Sydney',
  214. 'Brazil',
  215. 'Turkey'
  216. ]).reduce<Record<string, Promise<void>>>((pMap, keyword) => {
  217. pMap[keyword] = span.traceChildAsync(`fetch speedtest endpoints: ${keyword}`, () => querySpeedtestApi(keyword)).then(hostnameGroup => {
  218. return hostnameGroup.forEach(hostname => {
  219. if (hostname) {
  220. domainTrie.add(hostname);
  221. }
  222. });
  223. });
  224. return pMap;
  225. }, {});
  226. const timer = setTimeout(() => {
  227. console.error(picocolors.red('Task timeout!'));
  228. Object.entries(pMap).forEach(([name, p]) => {
  229. console.log(`[${name}]`, Bun.peek.status(p));
  230. });
  231. resolve();
  232. }, 1000 * 60 * 1.5);
  233. Promise.all(Object.values(pMap)).then(() => {
  234. clearTimeout(timer);
  235. return resolve();
  236. }).catch(() => reject);
  237. });
  238. const deduped = span.traceChildSync('sort result', () => sortDomains(domainDeduper(domainTrie)));
  239. const description = [
  240. ...SHARED_DESCRIPTION,
  241. '',
  242. 'This file contains common speedtest endpoints.'
  243. ];
  244. return createRuleset(
  245. span,
  246. 'Sukka\'s Ruleset - Speedtest Domains',
  247. description,
  248. new Date(),
  249. deduped,
  250. 'domainset',
  251. path.resolve(import.meta.dir, '../List/domainset/speedtest.conf'),
  252. path.resolve(import.meta.dir, '../Clash/domainset/speedtest.txt')
  253. );
  254. });