Any Hackernews Link Utils

Utility functions for Any Hackernews Link

此脚本不应直接安装,它是一个供其他脚本使用的外部库。如果您需要使用该库,请在脚本元属性加入:// @require https://update.gf.qytechs.cn/scripts/524693/1525919/Any%20Hackernews%20Link%20Utils.js

  1. // ==UserScript==
  2. // @name Any Hackernews Link Utils
  3. // @namespace http://tampermonkey.net/
  4. // @version 0.1.0
  5. // @description Utility functions for Any Hackernews Link
  6. // @author RoCry
  7. // @grant GM_xmlhttpRequest
  8. // @connect hn.algolia.com
  9. // @license MIT
  10. // ==/UserScript==
  11.  
  12. /**
  13. * Configuration
  14. */
  15. const CONFIG = {
  16. // Additional domains to ignore that couldn't be handled by @exclude
  17. IGNORED_DOMAINS: [
  18. 'gmail.com',
  19. 'accounts.google.com',
  20. 'accounts.youtube.com',
  21. 'signin.',
  22. 'login.',
  23. 'auth.',
  24. 'oauth.',
  25. ],
  26.  
  27. // Patterns that indicate a search page
  28. SEARCH_PATTERNS: [
  29. '/search',
  30. '/webhp',
  31. '/results',
  32. '?q=',
  33. '?query=',
  34. '?search=',
  35. '?s='
  36. ],
  37.  
  38. // URL parameters to remove during normalization
  39. TRACKING_PARAMS: [
  40. 'utm_source',
  41. 'utm_medium',
  42. 'utm_campaign',
  43. 'utm_term',
  44. 'utm_content',
  45. 'fbclid',
  46. 'gclid',
  47. '_ga',
  48. 'ref',
  49. 'source'
  50. ],
  51.  
  52. // Minimum ratio of ASCII characters to consider content as English
  53. MIN_ASCII_RATIO: 0.9,
  54. // Number of characters to check for language detection
  55. CHARS_TO_CHECK: 300
  56. };
  57.  
  58. /**
  59. * URL Utilities
  60. */
  61. const URLUtils = {
  62. /**
  63. * Check if a URL should be ignored based on domain or search patterns
  64. * @param {string} url - URL to check
  65. * @returns {boolean} - True if URL should be ignored
  66. */
  67. shouldIgnoreUrl(url) {
  68. try {
  69. const urlObj = new URL(url);
  70. // Check remaining ignored domains
  71. if (CONFIG.IGNORED_DOMAINS.some(domain => urlObj.hostname.includes(domain))) {
  72. return true;
  73. }
  74.  
  75. // Check if it's a search page
  76. if (CONFIG.SEARCH_PATTERNS.some(pattern =>
  77. urlObj.pathname.includes(pattern) || urlObj.search.includes(pattern))) {
  78. return true;
  79. }
  80.  
  81. return false;
  82. } catch (e) {
  83. console.error('Error checking URL:', e);
  84. return false;
  85. }
  86. },
  87.  
  88. /**
  89. * Normalize URL by removing tracking parameters and standardizing format
  90. * @param {string} url - URL to normalize
  91. * @returns {string} - Normalized URL
  92. */
  93. normalizeUrl(url) {
  94. try {
  95. const urlObj = new URL(url);
  96. // Remove tracking parameters
  97. CONFIG.TRACKING_PARAMS.forEach(param => urlObj.searchParams.delete(param));
  98. // Remove sepecial parameter for all hosts
  99. // https://github.com/HackerNews/API?tab=readme-ov-file -> https://github.com/HackerNews/API
  100. urlObj.searchParams.delete('tab');
  101.  
  102. // Handle GitHub repository paths
  103. if (urlObj.hostname === 'github.com') {
  104. // Split path into segments
  105. const pathSegments = urlObj.pathname.split('/').filter(Boolean);
  106. // Only process if we have at least username/repo
  107. if (pathSegments.length >= 2) {
  108. const [username, repo, ...rest] = pathSegments;
  109. // If path contains tree/master, blob/master, or similar, remove them
  110. if (rest.length > 0 && (rest[0] === 'tree' || rest[0] === 'blob')) {
  111. urlObj.pathname = `/${username}/${repo}`;
  112. }
  113. }
  114. }
  115. // for arxiv
  116. // https://arxiv.org/pdf/1706.03762 -> https://arxiv.org/abs/1706.03762
  117. if (urlObj.hostname === 'arxiv.org') {
  118. urlObj.pathname = urlObj.pathname.replace('/pdf/', '/abs/');
  119. }
  120.  
  121. // Remove hash
  122. urlObj.hash = '';
  123. // Remove trailing slash for consistency
  124. let normalizedUrl = urlObj.toString();
  125. if (normalizedUrl.endsWith('/')) {
  126. normalizedUrl = normalizedUrl.slice(0, -1);
  127. }
  128. return normalizedUrl;
  129. } catch (e) {
  130. console.error('Error normalizing URL:', e);
  131. return url;
  132. }
  133. },
  134.  
  135. /**
  136. * Compare two URLs for equality after normalization
  137. * @param {string} url1 - First URL
  138. * @param {string} url2 - Second URL
  139. * @returns {boolean} - True if URLs match
  140. */
  141. urlsMatch(url1, url2) {
  142. try {
  143. const u1 = new URL(this.normalizeUrl(url1));
  144. const u2 = new URL(this.normalizeUrl(url2));
  145. return u1.hostname.toLowerCase() === u2.hostname.toLowerCase() &&
  146. u1.pathname.toLowerCase() === u2.pathname.toLowerCase() &&
  147. u1.search === u2.search;
  148. } catch (e) {
  149. console.error('Error comparing URLs:', e);
  150. return false;
  151. }
  152. }
  153. };
  154.  
  155. /**
  156. * Content Utilities
  157. */
  158. const ContentUtils = {
  159. /**
  160. * Check if text is primarily English by checking ASCII ratio
  161. * @param {string} text - Text to analyze
  162. * @returns {boolean} - True if content is likely English
  163. */
  164. isEnglishContent() {
  165. try {
  166. // Get text from title and first paragraph or relevant content
  167. const title = document.title || '';
  168. const firstParagraphs = Array.from(document.getElementsByTagName('p'))
  169. .slice(0, 3)
  170. .map(p => p.textContent)
  171. .join(' ');
  172. const textToAnalyze = (title + ' ' + firstParagraphs)
  173. .slice(0, CONFIG.CHARS_TO_CHECK)
  174. .replace(/\s+/g, ' ')
  175. .trim();
  176.  
  177. if (!textToAnalyze) return true; // If no text found, assume English
  178.  
  179. // Count ASCII characters (excluding spaces and common punctuation)
  180. const asciiChars = textToAnalyze.replace(/[\s\.,\-_'"!?()]/g, '')
  181. .split('')
  182. .filter(char => char.charCodeAt(0) <= 127).length;
  183. const totalChars = textToAnalyze.replace(/[\s\.,\-_'"!?()]/g, '').length;
  184. if (totalChars === 0) return true;
  185. const asciiRatio = asciiChars / totalChars;
  186. console.log('🈂️ ASCII Ratio:', asciiRatio.toFixed(2));
  187. return asciiRatio >= CONFIG.MIN_ASCII_RATIO;
  188. } catch (e) {
  189. console.error('Error checking content language:', e);
  190. return true; // Default to allowing English in case of error
  191. }
  192. }
  193. };
  194.  
  195. /**
  196. * HackerNews API Handler
  197. */
  198. const HNApi = {
  199. /**
  200. * Search for a URL on HackerNews
  201. * @param {string} normalizedUrl - URL to search for
  202. * @param {Function} updateUI - Callback function to update UI with results
  203. */
  204. checkHackerNews(normalizedUrl, updateUI) {
  205. const apiUrl = `https://hn.algolia.com/api/v1/search?query=${encodeURIComponent(normalizedUrl)}&restrictSearchableAttributes=url`;
  206. GM_xmlhttpRequest({
  207. method: 'GET',
  208. url: apiUrl,
  209. onload: (response) => this.handleApiResponse(response, normalizedUrl, updateUI),
  210. onerror: (error) => {
  211. console.error('Error fetching from HN API:', error);
  212. updateUI(null);
  213. }
  214. });
  215. },
  216.  
  217. /**
  218. * Handle the API response
  219. * @param {Object} response - API response
  220. * @param {string} normalizedUrl - Original normalized URL
  221. * @param {Function} updateUI - Callback function to update UI with results
  222. */
  223. handleApiResponse(response, normalizedUrl, updateUI) {
  224. try {
  225. const data = JSON.parse(response.responseText);
  226. const matchingHits = data.hits.filter(hit => URLUtils.urlsMatch(hit.url, normalizedUrl));
  227. if (matchingHits.length === 0) {
  228. console.log('🔍 URL not found on Hacker News');
  229. updateUI(null);
  230. return;
  231. }
  232.  
  233. const topHit = matchingHits.sort((a, b) => (b.points || 0) - (a.points || 0))[0];
  234. const result = {
  235. title: topHit.title,
  236. points: topHit.points || 0,
  237. comments: topHit.num_comments || 0,
  238. link: `https://news.ycombinator.com/item?id=${topHit.objectID}`,
  239. posted: new Date(topHit.created_at).toLocaleDateString()
  240. };
  241.  
  242. console.log('📰 Found on Hacker News:', result);
  243. updateUI(result);
  244. } catch (e) {
  245. console.error('Error parsing HN API response:', e);
  246. updateUI(null);
  247. }
  248. }
  249. };

QingJ © 2025

镜像随时可能失效,请加Q群300939539或关注我们的公众号极客氢云获取最新地址