npm - @rmdes/indiekit-endpoint-microsub - Versions diffs - 1.0.56 → 1.0.58 - Mend

@rmdes/indiekit-endpoint-microsub 1.0.56 → 1.0.58

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (51)

package/assets/reader.js +408 -0
package/index.js +37 -36
package/lib/cache/redis.js +12 -3
package/lib/controllers/reader/actor.js +142 -0
package/lib/controllers/reader/channel.js +301 -0
package/lib/controllers/reader/compose.js +242 -0
package/lib/controllers/reader/deck.js +129 -0
package/lib/controllers/reader/feed-repair.js +117 -0
package/lib/controllers/reader/feed.js +246 -0
package/lib/controllers/reader/index.js +126 -0
package/lib/controllers/reader/search.js +157 -0
package/lib/controllers/reader/timeline.js +251 -0
package/lib/controllers/timeline.js +4 -2
package/lib/feeds/atom.js +1 -1
package/lib/feeds/fetcher.js +1 -30
package/lib/feeds/hfeed.js +1 -1
package/lib/feeds/jsonfeed.js +1 -1
package/lib/feeds/normalizer-hfeed.js +209 -0
package/lib/feeds/normalizer-jsonfeed.js +171 -0
package/lib/feeds/normalizer-rss.js +178 -0
package/lib/feeds/normalizer.js +20 -560
package/lib/feeds/rss.js +1 -1
package/lib/polling/processor.js +3 -17
package/lib/storage/items-read-state.js +287 -0
package/lib/storage/items-retention.js +174 -0
package/lib/storage/items-search.js +34 -0
package/lib/storage/items.js +99 -590
package/lib/storage/read-state.js +1 -1
package/lib/utils/async-handler.js +7 -0
package/lib/utils/html.js +25 -0
package/lib/utils/source-type.js +28 -0
package/lib/webmention/processor.js +1 -1
package/locales/de.json +3 -0
package/locales/en.json +2 -0
package/locales/es-419.json +3 -0
package/locales/es.json +3 -0
package/locales/fr.json +3 -0
package/locales/hi.json +3 -0
package/locales/id.json +3 -0
package/locales/it.json +3 -0
package/locales/nl.json +3 -0
package/locales/pl.json +3 -0
package/locales/pt-BR.json +3 -0
package/locales/pt.json +3 -0
package/locales/sr.json +3 -0
package/locales/sv.json +3 -0
package/locales/zh-Hans-CN.json +3 -0
package/package.json +1 -1
package/views/channel.njk +1 -348
package/views/timeline.njk +3 -274
package/lib/controllers/reader.js +0 -1562

package/lib/feeds/normalizer.js CHANGED Viewed

@@ -1,5 +1,5 @@
 /**
- * Feed normalizer - converts all feed formats to jf2
+ * Feed normalizer — shared helpers
  * @module feeds/normalizer
  */
@@ -8,27 +8,21 @@ import crypto from "node:crypto";
 import sanitizeHtml from "sanitize-html";
 import { SANITIZE_OPTIONS } from "../utils/sanitize.js";
+import { extractImagesFromHtml } from "../utils/html.js";
+// Re-export for use by format-specific normalizers
+export { SANITIZE_OPTIONS, sanitizeHtml, extractImagesFromHtml };
 /**
- * Extract image URLs from HTML content.
- * Used as a fallback when no explicit photo/enclosure is provided.
- * @param {string} html - HTML content (already sanitized)
- * @returns {string[]} Array of image URLs
+ * Generate unique ID for an item
+ * @param {string} feedUrl - Feed URL
+ * @param {string} itemId - Item identifier (URL or ID)
+ * @returns {string} Unique ID hash
  */
-function extractImagesFromHtml(html) {
-  if (!html) {
-    return [];
-  }
-  const urls = [];
-  const imgRegex = /<img[^>]+src=["']([^"']+)["'][^>]*>/gi;
-  let match;
-  while ((match = imgRegex.exec(html)) !== null) {
-    const src = match[1];
-    if (src && !urls.includes(src)) {
-      urls.push(src);
-    }
-  }
-  return urls;
+export function generateItemUid(feedUrl, itemId) {
+  const hash = crypto.createHash("sha256");
+  hash.update(`${feedUrl}::${itemId}`);
+  return hash.digest("hex").slice(0, 24);
 }
 /**
@@ -36,7 +30,7 @@ function extractImagesFromHtml(html) {
  * @param {string|Date} dateInput - Date string or Date object
  * @returns {Date|undefined} Parsed Date or undefined if invalid
  */
-function parseDate(dateInput) {
+export function parseDate(dateInput) {
   if (!dateInput) {
     return;
   }
@@ -86,527 +80,17 @@ function parseDate(dateInput) {
  * @param {string|Date} dateInput - Date input
  * @returns {string|undefined} ISO string or undefined
  */
-function toISOStringSafe(dateInput) {
+export function toISOStringSafe(dateInput) {
   const date = parseDate(dateInput);
   return date ? date.toISOString() : undefined;
 }
-// SANITIZE_OPTIONS imported from ../utils/sanitize.js (shared with AP outbox fetcher)
-/**
- * Generate unique ID for an item
- * @param {string} feedUrl - Feed URL
- * @param {string} itemId - Item identifier (URL or ID)
- * @returns {string} Unique ID hash
- */
-export function generateItemUid(feedUrl, itemId) {
-  const hash = crypto.createHash("sha256");
-  hash.update(`${feedUrl}::${itemId}`);
-  return hash.digest("hex").slice(0, 24);
-}
-/**
- * Normalize RSS/Atom item from feedparser
- * @param {object} item - Feedparser item
- * @param {string} feedUrl - Feed URL
- * @param {string} feedType - 'rss' or 'atom'
- * @returns {object} Normalized jf2 item
- */
-export function normalizeItem(item, feedUrl, feedType) {
-  const url = item.link || item.origlink || item.guid;
-  const uid = generateItemUid(feedUrl, item.guid || url || item.title);
-  const normalized = {
-    type: "entry",
-    uid,
-    url,
-    name: item.title
-      ? sanitizeHtml(item.title, { allowedTags: [] }).trim()
-      : undefined,
-    published: toISOStringSafe(item.pubdate),
-    updated: toISOStringSafe(item.date),
-    _source: {
-      url: feedUrl,
-      feedUrl,
-      feedType,
-      originalId: item.guid,
-    },
-  };
-  // Content
-  if (item.description || item.summary) {
-    const html = item.description || item.summary;
-    normalized.content = {
-      html: sanitizeHtml(html, SANITIZE_OPTIONS),
-      text: sanitizeHtml(html, { allowedTags: [] }).trim(),
-    };
-  }
-  // Summary (prefer explicit summary over truncated content)
-  if (item.summary && item.description && item.summary !== item.description) {
-    normalized.summary = sanitizeHtml(item.summary, { allowedTags: [] }).trim();
-  }
-  // Author
-  if (item.author || item["dc:creator"]) {
-    const authorName = item.author || item["dc:creator"];
-    normalized.author = {
-      type: "card",
-      name: authorName,
-    };
-  }
-  // Categories/tags
-  if (item.categories && item.categories.length > 0) {
-    normalized.category = item.categories;
-  }
-  // Enclosures (media)
-  if (item.enclosures && item.enclosures.length > 0) {
-    for (const enclosure of item.enclosures) {
-      const mediaUrl = enclosure.url;
-      const mediaType = enclosure.type || "";
-      if (mediaType.startsWith("image/")) {
-        normalized.photo = normalized.photo || [];
-        normalized.photo.push(mediaUrl);
-      } else if (mediaType.startsWith("video/")) {
-        normalized.video = normalized.video || [];
-        normalized.video.push(mediaUrl);
-      } else if (mediaType.startsWith("audio/")) {
-        normalized.audio = normalized.audio || [];
-        normalized.audio.push(mediaUrl);
-      }
-    }
-  }
-  // Featured image from media content
-  if (item["media:content"] && item["media:content"].url) {
-    const mediaType = item["media:content"].type || "";
-    if (
-      mediaType.startsWith("image/") ||
-      item["media:content"].medium === "image"
-    ) {
-      normalized.photo = normalized.photo || [];
-      if (!normalized.photo.includes(item["media:content"].url)) {
-        normalized.photo.push(item["media:content"].url);
-      }
-    }
-  }
-  // Image from item.image
-  if (item.image && item.image.url) {
-    normalized.photo = normalized.photo || [];
-    if (!normalized.photo.includes(item.image.url)) {
-      normalized.photo.push(item.image.url);
-    }
-  }
-  // Extract images from HTML content as fallback
-  if (!normalized.photo && normalized.content?.html) {
-    const extracted = extractImagesFromHtml(normalized.content.html);
-    if (extracted.length > 0) {
-      normalized.photo = extracted;
-    }
-  }
-  return normalized;
-}
-/**
- * Normalize feed metadata from feedparser
- * @param {object} meta - Feedparser meta object
- * @param {string} feedUrl - Feed URL
- * @returns {object} Normalized feed metadata
- */
-export function normalizeFeedMeta(meta, feedUrl) {
-  const normalized = {
-    name: meta.title
-      ? sanitizeHtml(meta.title, { allowedTags: [] }).trim()
-      : feedUrl,
-  };
-  if (meta.description) {
-    normalized.summary = meta.description;
-  }
-  if (meta.link) {
-    normalized.url = meta.link;
-  }
-  if (meta.image && meta.image.url) {
-    normalized.photo = meta.image.url;
-  }
-  if (meta.favicon) {
-    normalized.photo = normalized.photo || meta.favicon;
-  }
-  // Author/publisher
-  if (meta.author) {
-    normalized.author = {
-      type: "card",
-      name: meta.author,
-    };
-  }
-  // Hub for WebSub
-  if (meta.cloud && meta.cloud.href) {
-    normalized._hub = meta.cloud.href;
-  }
-  // Look for hub in links
-  if (meta.link && meta["atom:link"]) {
-    const links = Array.isArray(meta["atom:link"])
-      ? meta["atom:link"]
-      : [meta["atom:link"]];
-    for (const link of links) {
-      if (link["@"] && link["@"].rel === "hub") {
-        normalized._hub = link["@"].href;
-        break;
-      }
-    }
-  }
-  return normalized;
-}
-/**
- * Normalize JSON Feed item
- * @param {object} item - JSON Feed item
- * @param {string} feedUrl - Feed URL
- * @returns {object} Normalized jf2 item
- */
-export function normalizeJsonFeedItem(item, feedUrl) {
-  const url = item.url || item.external_url;
-  const uid = generateItemUid(feedUrl, item.id || url);
-  const normalized = {
-    type: "entry",
-    uid,
-    url,
-    name: item.title
-      ? sanitizeHtml(item.title, { allowedTags: [] }).trim()
-      : undefined,
-    published: item.date_published
-      ? new Date(item.date_published).toISOString()
-      : undefined,
-    updated: item.date_modified
-      ? new Date(item.date_modified).toISOString()
-      : undefined,
-    _source: {
-      url: feedUrl,
-      feedUrl,
-      feedType: "jsonfeed",
-      originalId: item.id,
-    },
-  };
-  // Content
-  if (item.content_html || item.content_text) {
-    normalized.content = {};
-    if (item.content_html) {
-      normalized.content.html = sanitizeHtml(
-        item.content_html,
-        SANITIZE_OPTIONS,
-      );
-      normalized.content.text = sanitizeHtml(item.content_html, {
-        allowedTags: [],
-      }).trim();
-    } else if (item.content_text) {
-      normalized.content.text = item.content_text;
-    }
-  }
-  // Summary
-  if (item.summary) {
-    normalized.summary = item.summary;
-  }
-  // Author
-  if (item.author || item.authors) {
-    const author = item.author || (item.authors && item.authors[0]);
-    if (author) {
-      normalized.author = {
-        type: "card",
-        name: author.name,
-        url: author.url,
-        photo: author.avatar,
-      };
-    }
-  }
-  // Tags
-  if (item.tags && item.tags.length > 0) {
-    normalized.category = item.tags;
-  }
-  // Featured image
-  if (item.image) {
-    normalized.photo = [item.image];
-  }
-  if (item.banner_image && !normalized.photo) {
-    normalized.photo = [item.banner_image];
-  }
-  // Attachments
-  if (item.attachments && item.attachments.length > 0) {
-    for (const attachment of item.attachments) {
-      const mediaType = attachment.mime_type || "";
-      if (mediaType.startsWith("image/")) {
-        normalized.photo = normalized.photo || [];
-        normalized.photo.push(attachment.url);
-      } else if (mediaType.startsWith("video/")) {
-        normalized.video = normalized.video || [];
-        normalized.video.push(attachment.url);
-      } else if (mediaType.startsWith("audio/")) {
-        normalized.audio = normalized.audio || [];
-        normalized.audio.push(attachment.url);
-      }
-    }
-  }
-  // External URL
-  if (item.external_url && item.url !== item.external_url) {
-    normalized["bookmark-of"] = [item.external_url];
-  }
-  // Extract images from HTML content as fallback
-  if (!normalized.photo && normalized.content?.html) {
-    const extracted = extractImagesFromHtml(normalized.content.html);
-    if (extracted.length > 0) {
-      normalized.photo = extracted;
-    }
-  }
-  return normalized;
-}
-/**
- * Normalize JSON Feed metadata
- * @param {object} feed - JSON Feed object
- * @param {string} feedUrl - Feed URL
- * @returns {object} Normalized feed metadata
- */
-export function normalizeJsonFeedMeta(feed, feedUrl) {
-  const normalized = {
-    name: feed.title
-      ? sanitizeHtml(feed.title, { allowedTags: [] }).trim()
-      : feedUrl,
-  };
-  if (feed.description) {
-    normalized.summary = feed.description;
-  }
-  if (feed.home_page_url) {
-    normalized.url = feed.home_page_url;
-  }
-  if (feed.icon) {
-    normalized.photo = feed.icon;
-  } else if (feed.favicon) {
-    normalized.photo = feed.favicon;
-  }
-  if (feed.author || feed.authors) {
-    const author = feed.author || (feed.authors && feed.authors[0]);
-    if (author) {
-      normalized.author = {
-        type: "card",
-        name: author.name,
-        url: author.url,
-        photo: author.avatar,
-      };
-    }
-  }
-  // Hub for WebSub
-  if (feed.hubs && feed.hubs.length > 0) {
-    normalized._hub = feed.hubs[0].url;
-  }
-  return normalized;
-}
-/**
- * Normalize h-feed entry
- * @param {object} entry - Microformats h-entry
- * @param {string} feedUrl - Feed URL
- * @returns {object} Normalized jf2 item
- */
-export function normalizeHfeedItem(entry, feedUrl) {
-  const properties = entry.properties || {};
-  const url = getFirst(properties.url) || getFirst(properties.uid);
-  const uid = generateItemUid(feedUrl, getFirst(properties.uid) || url);
-  const normalized = {
-    type: "entry",
-    uid,
-    url,
-    _source: {
-      url: feedUrl,
-      feedUrl,
-      feedType: "hfeed",
-      originalId: getFirst(properties.uid),
-    },
-  };
-  // Name/title
-  if (properties.name) {
-    const name = getFirst(properties.name);
-    // Only include name if it's not just the content
-    if (
-      name &&
-      (!properties.content || name !== getContentText(properties.content))
-    ) {
-      normalized.name = name;
-    }
-  }
-  // Published
-  if (properties.published) {
-    const published = getFirst(properties.published);
-    normalized.published = new Date(published).toISOString();
-  }
-  // Updated
-  if (properties.updated) {
-    const updated = getFirst(properties.updated);
-    normalized.updated = new Date(updated).toISOString();
-  }
-  // Content
-  if (properties.content) {
-    const content = getFirst(properties.content);
-    if (typeof content === "object") {
-      normalized.content = {
-        html: content.html
-          ? sanitizeHtml(content.html, SANITIZE_OPTIONS)
-          : undefined,
-        text: content.value || undefined,
-      };
-    } else if (typeof content === "string") {
-      normalized.content = { text: content };
-    }
-  }
-  // Summary
-  if (properties.summary) {
-    normalized.summary = getFirst(properties.summary);
-  }
-  // Author
-  if (properties.author) {
-    const author = getFirst(properties.author);
-    normalized.author = normalizeHcard(author);
-  }
-  // Categories
-  if (properties.category) {
-    normalized.category = properties.category;
-  }
-  // Photos
-  if (properties.photo) {
-    normalized.photo = properties.photo.map((p) =>
-      typeof p === "object" ? p.value || p.url : p,
-    );
-  }
-  // Videos
-  if (properties.video) {
-    normalized.video = properties.video.map((v) =>
-      typeof v === "object" ? v.value || v.url : v,
-    );
-  }
-  // Audio
-  if (properties.audio) {
-    normalized.audio = properties.audio.map((a) =>
-      typeof a === "object" ? a.value || a.url : a,
-    );
-  }
-  // Interaction types - normalize to string URLs
-  if (properties["like-of"]) {
-    normalized["like-of"] = normalizeUrlArray(properties["like-of"]);
-  }
-  if (properties["repost-of"]) {
-    normalized["repost-of"] = normalizeUrlArray(properties["repost-of"]);
-  }
-  if (properties["bookmark-of"]) {
-    normalized["bookmark-of"] = normalizeUrlArray(properties["bookmark-of"]);
-  }
-  if (properties["in-reply-to"]) {
-    normalized["in-reply-to"] = normalizeUrlArray(properties["in-reply-to"]);
-  }
-  // RSVP
-  if (properties.rsvp) {
-    normalized.rsvp = getFirst(properties.rsvp);
-  }
-  // Syndication
-  if (properties.syndication) {
-    normalized.syndication = properties.syndication;
-  }
-  // Extract images from HTML content as fallback
-  if (!normalized.photo && normalized.content?.html) {
-    const extracted = extractImagesFromHtml(normalized.content.html);
-    if (extracted.length > 0) {
-      normalized.photo = extracted;
-    }
-  }
-  return normalized;
-}
-/**
- * Normalize h-feed metadata
- * @param {object} hfeed - h-feed microformat object
- * @param {string} feedUrl - Feed URL
- * @returns {object} Normalized feed metadata
- */
-export function normalizeHfeedMeta(hfeed, feedUrl) {
-  const properties = hfeed.properties || {};
-  const normalized = {
-    name: getFirst(properties.name) || feedUrl,
-  };
-  if (properties.summary) {
-    normalized.summary = getFirst(properties.summary);
-  }
-  if (properties.url) {
-    normalized.url = getFirst(properties.url);
-  }
-  if (properties.photo) {
-    normalized.photo = getFirst(properties.photo);
-    if (typeof normalized.photo === "object") {
-      normalized.photo = normalized.photo.value || normalized.photo.url;
-    }
-  }
-  if (properties.author) {
-    const author = getFirst(properties.author);
-    normalized.author = normalizeHcard(author);
-  }
-  return normalized;
-}
 /**
  * Extract URL string from a photo value
  * @param {object|string} photo - Photo value (can be string URL or object with value/url)
  * @returns {string|undefined} Photo URL string
  */
-function extractPhotoUrl(photo) {
+export function extractPhotoUrl(photo) {
   if (!photo) {
     return;
   }
@@ -624,7 +108,7 @@ function extractPhotoUrl(photo) {
  * @param {object|string} value - URL string or object with url/value property
  * @returns {string|undefined} URL string
  */
-function extractUrl(value) {
+export function extractUrl(value) {
   if (!value) {
     return;
   }
@@ -642,43 +126,19 @@ function extractUrl(value) {
  * @param {Array} urls - Array of URL strings or objects
  * @returns {Array<string>} Array of URL strings
  */
-function normalizeUrlArray(urls) {
+export function normalizeUrlArray(urls) {
   if (!urls || !Array.isArray(urls)) {
     return [];
   }
   return urls.map((u) => extractUrl(u)).filter(Boolean);
 }
-/**
- * Normalize h-card author
- * @param {object|string} hcard - h-card or author name string
- * @returns {object} Normalized author object
- */
-function normalizeHcard(hcard) {
-  if (typeof hcard === "string") {
-    return { type: "card", name: hcard };
-  }
-  if (!hcard || !hcard.properties) {
-    return;
-  }
-  const properties = hcard.properties;
-  return {
-    type: "card",
-    name: getFirst(properties.name),
-    url: getFirst(properties.url),
-    photo: extractPhotoUrl(getFirst(properties.photo)),
-  };
-}
 /**
  * Get first item from array or return the value itself
  * @param {Array|*} value - Value or array of values
  * @returns {*} First value or the value itself
  */
-function getFirst(value) {
+export function getFirst(value) {
   if (Array.isArray(value)) {
     return value[0];
   }
@@ -690,7 +150,7 @@ function getFirst(value) {
  * @param {Array} content - Content property array
  * @returns {string} Text content
  */
-function getContentText(content) {
+export function getContentText(content) {
   const first = getFirst(content);
   if (typeof first === "object") {
     return first.value || first.text || "";

package/lib/feeds/rss.js CHANGED Viewed

@@ -7,7 +7,7 @@ import { Readable } from "node:stream";
 import FeedParser from "feedparser";
-import { normalizeItem, normalizeFeedMeta } from "./normalizer.js";
+import { normalizeItem, normalizeFeedMeta } from "./normalizer-rss.js";
 /**
  * Parse RSS feed content

package/lib/polling/processor.js CHANGED Viewed

@@ -18,6 +18,7 @@ import {
 } from "../storage/feeds.js";
 import { passesRegexFilter, passesTypeFilter } from "../storage/filters.js";
 import { addItem } from "../storage/items.js";
+import { classifyUrl } from "../utils/source-type.js";
 import {
   subscribe as websubSubscribe,
   getCallbackUrl,
@@ -43,7 +44,7 @@ export async function processFeed(application, feed) {
   try {
     // Get Redis client for caching
-    const redis = getRedisClient(application);
+    const redis = await getRedisClient(application);
     // Fetch and parse the feed
     const parsed = await fetchAndParseFeed(feed.url, {
@@ -96,7 +97,7 @@ export async function processFeed(application, feed) {
       if (feed.capabilities?.source_type) {
         item._source.source_type = feed.capabilities.source_type;
       } else {
-        item._source.source_type = inferSourceType(feed.url);
+        item._source.source_type = classifyUrl(feed.url).type;
       }
       // Store the item
@@ -242,21 +243,6 @@ export async function processFeed(application, feed) {
   return result;
 }
-/**
- * Infer source type from feed URL when capabilities haven't been detected yet
- * @param {string} url - Feed URL
- * @returns {string} Source type
- */
-function inferSourceType(url) {
-  if (!url) return "web";
-  const lower = url.toLowerCase();
-  if (lower.includes("bsky.app") || lower.includes("bluesky")) return "bluesky";
-  if (lower.includes("mastodon.") || lower.includes("mstdn.") ||
-      lower.includes("fosstodon.") || lower.includes("pleroma.") ||
-      lower.includes("misskey.") || lower.includes("pixelfed.")) return "mastodon";
-  return "web";
-}
 /**
  * Check if an item passes channel filters
  * @param {object} item - Feed item