Back

Version 77

11/10/2024
import { Hono } from "https://esm.sh/hono@3.10.2";
import { encode } from "https://esm.sh/js-base64@3.7.5";
import { parse } from "https://esm.sh/node-html-parser@6.1.5";

// Hono application instance for this module.
// NOTE(review): no routes or middleware are attached in the visible part of
// the file — presumably handlers are registered on `app` further down; confirm.
const app = new Hono();

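// Expanded stopwords list: common English function words, followed by
// navigation-related and web-specific terms (grouped under the comments below).
// NOTE(review): several entries are multi-word phrases (e.g. 'getty images',
// 'all rights reserved'); these can only match if lookups are done on whole
// phrases rather than single tokens — confirm against the code that reads this set.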
const stopwords = new Set([
'a', 'about', 'above', 'after', 'again', 'against', 'all', 'am', 'an', 'and', 'any', 'are', 'as', 'at', 'be', 'because',
'been', 'before', 'being', 'below', 'between', 'both', 'but', 'by', 'could', 'did', 'do', 'does', 'doing', 'down',
'during', 'each', 'few', 'for', 'from', 'further', 'had', 'has', 'have', 'having', 'he', 'her', 'here', 'hers',
'herself', 'him', 'himself', 'his', 'how', 'i', 'if', 'in', 'into', 'is', 'it', 'its', 'itself', 'just', 'me',
'more', 'most', 'my', 'myself', 'no', 'nor', 'not', 'now', 'of', 'off', 'on', 'once', 'only', 'or', 'other',
'ought', 'our', 'ours', 'ourselves', 'out', 'over', 'own', 'same', 'she', 'should', 'so', 'some', 'such', 'than',
'that', 'the', 'their', 'theirs', 'them', 'themselves', 'then', 'there', 'these', 'they', 'this', 'those', 'through',
'to', 'too', 'under', 'until', 'up', 'very', 'was', 'we', 'were', 'what', 'when', 'where', 'which', 'while', 'who',
'whom', 'why', 'with', 'would', 'you', 'your', 'yours', 'yourself', 'yourselves',
// Additional navigation-related terms
'back', 'contents', 'menu', 'home', 'next', 'previous', 'top', 'bottom', 'navigation', 'nav', 'sidebar', 'footer',
'header', 'main', 'article', 'section', 'page', 'skip', 'jump', 'return',
// Web-specific terms
'image', 'photo', 'photograph', 'picture', 'fullscreen', 'share', 'reuse', 'features', 'topics', 'observer',
'getty', 'rex', 'shutterstock', 'ap', 'afp', 'reuters', 'epa', 'pa', 'alamy', 'getty images', 'associated press',
'agence france-presse', 'press association', 'copyright', 'rights reserved', 'all rights reserved',
'click', 'tap', 'swipe', 'scroll', 'zoom', 'enlarge', 'expand', 'collapse', 'hide', 'show',
'login', 'sign in', 'register', 'subscribe', 'newsletter', 'email', 'follow', 'like', 'comment', 'share',
'twitter', 'facebook', 'instagram', 'linkedin', 'pinterest', 'youtube', 'google',
'advertisement', 'sponsored', 'promoted', 'partner content', 'paid content',
'cookie', 'privacy', 'terms', 'conditions', 'policy', 'agreement',
'mobile', 'desktop', 'tablet', 'app', 'website', 'browser',
'search', 'find', 'results', 'query', 'keyword',
'loading', 'please wait', 'error', 'not found', '404', 'server error', '500',
'menu', 'navigation', 'sitemap', 'archive', 'category', 'tag', 'related', 'popular', 'trending',
'breaking news', 'latest', 'update', 'live', 'developing story',
'read more', 'continue reading', 'full article', 'paywall', 'subscribe now',
'comments', 'discussion', 'forum', 'community', 'join the conversation',
mikehiggins-sanguinecyanmastodon.web.val.run
Updated: November 16, 2024