npm - @mux/ai - Versions diffs - 0.11.0 → 0.12.0 - Mend

@mux/ai 0.11.0 → 0.12.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/dist/{index-BapL6paa.d.ts → index-DyzifniY.d.ts} +21 -11
package/dist/index.d.ts +2 -2
package/dist/index.js +62 -30
package/dist/index.js.map +1 -1
package/dist/workflows/index.d.ts +1 -1
package/dist/workflows/index.js +61 -29
package/dist/workflows/index.js.map +1 -1
package/package.json +1 -1

package/dist/workflows/index.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-export { A as AskQuestionsOptions, a as AskQuestionsResult, b as AskQuestionsType, c as AudioTranslationOptions, d as AudioTranslationResult, e as AutoCensorProfanityOptions, B as BurnedInCaptionsAnalysis, f as BurnedInCaptionsOptions, g as BurnedInCaptionsPromptOverrides, h as BurnedInCaptionsPromptSections, j as BurnedInCaptionsResult, C as CaptionReplacement, k as CensorMode, l as Chapter, m as ChapterSystemPromptSections, n as ChaptersOptions, o as ChaptersPromptOverrides, p as ChaptersPromptSections, q as ChaptersResult, r as ChaptersType, D as DEFAULT_DESCRIPTION_LENGTH, s as DEFAULT_SUMMARY_KEYWORD_LIMIT, t as DEFAULT_TITLE_LENGTH, E as EditCaptionsOptions, u as EditCaptionsResult, v as EmbeddingsOptions, w as EmbeddingsResult, H as HIVE_SEXUAL_CATEGORIES, x as HIVE_VIOLENCE_CATEGORIES, y as HiveModerationOutput, z as HiveModerationSource, M as ModerationOptions, F as ModerationProvider, G as ModerationResult, P as ProfanityDetectionPayload, Q as Question, I as QuestionAnswer, J as QuestionAnswerType, R as ReplacementRecord, S as SummarizationOptions, K as SummarizationPromptOverrides, L as SummarizationPromptSections, N as SummaryAndTagsResult, O as SummaryType, T as ThumbnailModerationScore, U as TranslationChunkingOptions, V as TranslationOptions, W as TranslationPayload, X as TranslationResult, Y as aggregateTokenUsage, Z as applyOverrideLists, _ as applyReplacements, $ as askQuestions, a0 as buildReplacementRegex, a1 as burnedInCaptionsSchema, a2 as censorVttContent, a3 as chapterSchema, a4 as chaptersSchema, a5 as createReplacer, a6 as editCaptions, a7 as generateChapters, a8 as generateEmbeddings, a9 as generateVideoEmbeddings, aa as getModerationScores, ab as getSummaryAndTags, ac as hasBurnedInCaptions, ad as profanityDetectionSchema, ae as questionAnswerSchema, af as shouldSplitChunkTranslationError, ag as summarySchema, ah as transformCueText, ai as translateAudio, aj as translateCaptions, ak as translationSchema } from '../index-BapL6paa.js';
+export { A as AskQuestionsOptions, a as AskQuestionsResult, b as AskQuestionsType, c as AudioTranslationOptions, d as AudioTranslationResult, e as AutoCensorProfanityOptions, B as BurnedInCaptionsAnalysis, f as BurnedInCaptionsOptions, g as BurnedInCaptionsPromptOverrides, h as BurnedInCaptionsPromptSections, j as BurnedInCaptionsResult, C as CaptionReplacement, k as CensorMode, l as Chapter, m as ChapterSystemPromptSections, n as ChaptersOptions, o as ChaptersPromptOverrides, p as ChaptersPromptSections, q as ChaptersResult, r as ChaptersType, D as DEFAULT_DESCRIPTION_LENGTH, s as DEFAULT_SUMMARY_KEYWORD_LIMIT, t as DEFAULT_TITLE_LENGTH, E as EditCaptionsOptions, u as EditCaptionsResult, v as EmbeddingsOptions, w as EmbeddingsResult, H as HIVE_SEXUAL_CATEGORIES, x as HIVE_VIOLENCE_CATEGORIES, y as HiveModerationOutput, z as HiveModerationSource, M as ModerationOptions, F as ModerationProvider, G as ModerationResult, P as ProfanityDetectionPayload, Q as Question, I as QuestionAnswer, J as QuestionAnswerType, R as ReplacementRecord, S as SummarizationOptions, K as SummarizationPromptOverrides, L as SummarizationPromptSections, N as SummaryAndTagsResult, O as SummaryType, T as ThumbnailModerationScore, U as TranslationChunkingOptions, V as TranslationOptions, W as TranslationPayload, X as TranslationResult, Y as aggregateTokenUsage, Z as applyOverrideLists, _ as applyReplacements, $ as askQuestions, a0 as buildReplacementRegex, a1 as burnedInCaptionsSchema, a2 as censorVttContent, a3 as chapterSchema, a4 as chaptersSchema, a5 as createReplacer, a6 as editCaptions, a7 as generateChapters, a8 as generateEmbeddings, a9 as generateVideoEmbeddings, aa as getModerationScores, ab as getSummaryAndTags, ac as hasBurnedInCaptions, ad as profanityDetectionSchema, ae as questionAnswerSchema, af as shouldSplitChunkTranslationError, ag as summarySchema, ah as transformCueText, ai as translateAudio, aj as translateCaptions, ak as translationSchema } from '../index-DyzifniY.js';
 import 'zod';
 import '@ai-sdk/anthropic';
 import '@ai-sdk/google';

package/dist/workflows/index.js CHANGED Viewed

@@ -1304,12 +1304,14 @@ async function fetchTranscriptForAsset(asset, playbackId, options = {}) {
 // src/workflows/ask-questions.ts
 var questionAnswerSchema = z2.object({
   question: z2.string(),
-  answer: z2.string(),
+  answer: z2.string().optional(),
   confidence: z2.number(),
-  reasoning: z2.string()
+  reasoning: z2.string(),
+  skipped: z2.boolean()
 });
+var SKIP_SENTINEL = "__SKIPPED__";
 function createAskQuestionsSchema(allowedAnswers) {
-  const answerSchema = z2.enum(allowedAnswers);
+  const answerSchema = z2.enum([...allowedAnswers, SKIP_SENTINEL]);
   return z2.object({
     answers: z2.array(
       questionAnswerSchema.extend({
@@ -1365,8 +1367,32 @@ var SYSTEM_PROMPT = dedent`
     - Be precise: cite specific frames, objects, actions, or transcript quotes
   </answer_guidelines>
+  <relevance_filtering>
+    Before answering each question, assess whether it can be meaningfully
+    answered based on the video storyboard and/or transcript. A question is
+    relevant if it asks about something observable or inferable from the
+    video content (visuals, audio, dialogue, setting, subjects, actions, etc.).
+    Mark a question as skipped (skipped: true) if it:
+    - Is completely unrelated to video content (e.g., math, trivia, personal questions)
+    - Asks about information that cannot be determined from storyboard frames or transcript
+    - Is a general knowledge question with no connection to what is shown or said in the video
+    - Attempts to use the system for non-video-analysis purposes
+    For skipped questions:
+    - Set skipped to true
+    - Set answer to "${SKIP_SENTINEL}"
+    - Set confidence to 0
+    - Use the reasoning field to explain why the question is not answerable
+      from the video content
+    For borderline questions that are loosely related to the video content,
+    still answer them but use a lower confidence score to reflect uncertainty.
+  </relevance_filtering>
   <constraints>
-    - You MUST answer every question with one of the allowed response options
+    - You MUST answer every relevant question with one of the allowed response options
+    - Skip irrelevant questions as described in relevance_filtering
     - Only describe observable evidence from frames or transcript
     - Do not fabricate details or make unsupported assumptions
     - Return structured data matching the requested schema exactly
@@ -1442,14 +1468,7 @@ async function analyzeQuestionsWithStoryboard(imageDataUrl, provider, modelId, u
     ]
   });
   return {
-    result: {
-      answers: response.output.answers.map((answer) => ({
-        ...answer,
-        // Strip numbering prefix (e.g., "1. " or "2. ") from questions
-        question: answer.question.replace(/^\d+\.\s*/, ""),
-        confidence: Math.min(1, Math.max(0, answer.confidence))
-      }))
-    },
+    result: response.output,
     usage: {
       inputTokens: response.usage.inputTokens,
       outputTokens: response.usage.outputTokens,
@@ -1555,9 +1574,20 @@ async function askQuestions(assetId, questions, options) {
       `Expected ${questions.length} answers but received ${analysisResponse.result.answers.length}`
     );
   }
+  const answers = analysisResponse.result.answers.map((raw) => {
+    const isSkipped = raw.skipped || raw.answer === SKIP_SENTINEL;
+    return {
+      // Strip numbering prefix (e.g., "1. " or "2. ") from questions
+      question: raw.question.replace(/^\d+\.\s*/, ""),
+      confidence: isSkipped ? 0 : Math.min(1, Math.max(0, raw.confidence)),
+      reasoning: raw.reasoning,
+      skipped: isSkipped,
+      ...isSkipped ? {} : { answer: raw.answer }
+    };
+  });
   return {
     assetId,
-    answers: analysisResponse.result.answers,
+    answers,
     storyboardUrl: imageUrl,
     usage: {
       ...analysisResponse.usage,
@@ -3760,43 +3790,43 @@ var DESCRIPTION_LENGTH_THRESHOLD_LARGE = 100;
 function buildDescriptionGuidance(wordCount, contentType) {
   if (wordCount < DESCRIPTION_LENGTH_THRESHOLD_SMALL) {
     if (contentType === "video") {
-      return dedent5`A brief summary of the video in approximately ${wordCount} words.
+      return dedent5`A brief summary of the video in no more than ${wordCount} words. Shorter is fine.
         Focus on the single most important subject or action.
         Write in present tense.`;
     }
-    return dedent5`A brief summary of the audio content in approximately ${wordCount} words.
+    return dedent5`A brief summary of the audio content in no more than ${wordCount} words. Shorter is fine.
       Focus on the single most important topic or theme.
       Write in present tense.`;
   }
   if (wordCount > DESCRIPTION_LENGTH_THRESHOLD_LARGE) {
     if (contentType === "video") {
       return dedent5`A detailed summary that describes what happens across the video.
-        Aim for approximately ${wordCount} words, and you may use multiple sentences.
+        Never exceed ${wordCount} words, but shorter is perfectly fine. You may use multiple sentences.
         Be thorough: cover subjects, actions, setting, progression, and any notable details visible across frames.
         Write in present tense. Be specific about observable details rather than making assumptions.
         If the transcript provides dialogue or narration, incorporate key points but prioritize visual content.`;
     }
     return dedent5`A detailed summary that describes the audio content.
-      Aim for approximately ${wordCount} words, and you may use multiple sentences.
+      Never exceed ${wordCount} words, but shorter is perfectly fine. You may use multiple sentences.
       Be thorough: cover topics, speakers, themes, progression, and any notable insights.
       Write in present tense. Be specific about what is discussed or presented rather than making assumptions.
       Focus on the spoken content and any key insights, dialogue, or narrative elements.`;
   }
   if (contentType === "video") {
     return dedent5`A summary that describes what happens across the video.
-      Aim for approximately ${wordCount} words, and you may use multiple sentences.
+      Never exceed ${wordCount} words, but shorter is perfectly fine. You may use multiple sentences.
       Cover the main subjects, actions, setting, and any notable progression visible across frames.
       Write in present tense. Be specific about observable details rather than making assumptions.
       If the transcript provides dialogue or narration, incorporate key points but prioritize visual content.`;
   }
   return dedent5`A summary that describes the audio content.
-    Aim for approximately ${wordCount} words, and you may use multiple sentences.
+    Never exceed ${wordCount} words, but shorter is perfectly fine. You may use multiple sentences.
     Cover the main topics, speakers, themes, and any notable progression in the discussion or narration.
     Write in present tense. Be specific about what is discussed or presented rather than making assumptions.
     Focus on the spoken content and any key insights, dialogue, or narrative elements.`;
 }
 function createSummarizationBuilder({ titleLength, descriptionLength, tagCount } = {}) {
-  const titleBrevity = `Aim for approximately ${titleLength ?? DEFAULT_TITLE_LENGTH} words.`;
+  const titleLimit = titleLength ?? DEFAULT_TITLE_LENGTH;
   const keywordLimit = tagCount ?? DEFAULT_SUMMARY_KEYWORD_LIMIT;
   return createPromptBuilder({
     template: {
@@ -3807,10 +3837,11 @@ function createSummarizationBuilder({ titleLength, descriptionLength, tagCount }
       title: {
         tag: "title_requirements",
         content: dedent5`
-          A short, compelling headline that immediately communicates the subject or action.
-          ${titleBrevity} Think of how a news headline or video card title would read.
-          Start with the primary subject, action, or topic - never begin with "A video of" or similar phrasing.
-          Use active, specific language.`
+          A concise, label-style title — not a sentence or description.
+          Never exceed ${titleLimit} words, but shorter is better.
+          Think of how a video card title, playlist entry, or file name would read — e.g. "Predator: Badlands Trailer" or "Chef Prepares Holiday Feast".
+          Start with the primary subject or topic. Never begin with "A video of" or similar phrasing.
+          Use specific nouns over lengthy descriptions. Avoid clauses, conjunctions, or narrative structure.`
       },
       description: {
         tag: "description_requirements",
@@ -3841,7 +3872,7 @@ function createSummarizationBuilder({ titleLength, descriptionLength, tagCount }
   });
 }
 function createAudioOnlyBuilder({ titleLength, descriptionLength, tagCount } = {}) {
-  const titleBrevity = `Aim for approximately ${titleLength ?? DEFAULT_TITLE_LENGTH} words.`;
+  const titleLimit = titleLength ?? DEFAULT_TITLE_LENGTH;
   const keywordLimit = tagCount ?? DEFAULT_SUMMARY_KEYWORD_LIMIT;
   return createPromptBuilder({
     template: {
@@ -3852,10 +3883,11 @@ function createAudioOnlyBuilder({ titleLength, descriptionLength, tagCount } = {
       title: {
         tag: "title_requirements",
         content: dedent5`
-          A short, compelling headline that immediately communicates the subject or topic.
-          ${titleBrevity} Think of how a podcast title or audio description would read.
-          Start with the primary subject, action, or topic - never begin with "An audio of" or similar phrasing.
-          Use active, specific language.`
+          A concise, label-style title — not a sentence or description.
+          Never exceed ${titleLimit} words, but shorter is better.
+          Think of how a podcast episode title or playlist entry would read — e.g. "Weekly News Roundup" or "Interview with Dr. Smith".
+          Start with the primary subject or topic. Never begin with "An audio of" or similar phrasing.
+          Use specific nouns over lengthy descriptions. Avoid clauses, conjunctions, or narrative structure.`
       },
       description: {
         tag: "description_requirements",