npm - @paroicms/site-generator-plugin - Versions diffs - 0.8.0 → 0.8.1 - Mend

@paroicms/site-generator-plugin 0.8.0 → 0.8.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

package/gen-backend/dist/db/db.queries.js CHANGED Viewed

@@ -1,8 +1,8 @@
-import { strVal } from "@paroi/data-formatters-lib";
+import { strVal, strValOrUndef } from "@paroi/data-formatters-lib";
 export async function readSession(ctx, sessionId) {
     const { cn } = ctx;
     const row = await cn("PaGenSession")
-        .select("id", "status", "guardCount", "promptCount", "nodeTypeCount", "contentCount", "errorMessage")
+        .select("id", "createdAt", "status", "guardCount", "promptCount", "nodeTypeCount", "contentCount", "errorMessage")
         .where({ id: sessionId })
         .first();
     if (!row)
@@ -15,7 +15,7 @@ export async function readSession(ctx, sessionId) {
         promptCount: Number(row.promptCount),
         nodeTypeCount: Number(row.nodeTypeCount),
         contentCount: Number(row.contentCount),
-        errorMessage: strVal(row.errorMessage),
+        errorMessage: strValOrUndef(row.errorMessage),
     };
 }
 export async function insertSession(ctx, { sessionId }) {

package/gen-backend/dist/generator/fake-content-generator.ts/content-helpers.js ADDED Viewed

@@ -0,0 +1,17 @@
/**
 * Collapses repeated messages into a single entry each.
 *
 * Entries keep the order in which each distinct message first appears.
 * A message seen more than once is suffixed with its number of
 * occurrences, e.g. `"boom (×3)"`; a message seen once is returned as is.
 *
 * @param {Iterable<string>} messages - Messages, possibly with duplicates.
 * @returns {string[]} One entry per distinct message.
 */
export function dedupMessages(messages) {
    // A Map iterates in insertion order, so first-seen order is preserved
    // without keeping a separate list of distinct messages.
    const occurrences = new Map();
    for (const message of messages) {
        occurrences.set(message, (occurrences.get(message) ?? 0) + 1);
    }
    return Array.from(occurrences, ([message, count]) => {
        if (count > 1) {
            return `${message} (×${count})`;
        }
        return message;
    });
}

package/gen-backend/dist/generator/fake-content-generator.ts/create-database-with-fake-content.js CHANGED Viewed

@@ -2,6 +2,7 @@ import { getPartTypeByName, getRegularDocumentTypeByName, getRoutingDocumentType
 import { createSimpleTranslator, } from "@paroicms/public-server-lib";
 import { getRandomImagePath } from "../lib/images-lib.js";
 import { createTaskCollector } from "../lib/tasks.js";
+import { dedupMessages } from "./content-helpers.js";
 import { createGeneratedContentReport } from "./content-report.js";
 import { generateLocalizedFooterMention } from "./create-node-contents.js";
 import { generateFieldSetContent, generateMultipleFieldSetContents, } from "./generate-fake-content.js";
@@ -161,8 +162,9 @@ async function addRegularDocuments(ctx, report, siteOptions, nodeOptions) {
         tolerateErrors,
         debugName: nodeType.kebabName,
     });
-    if (tolerateErrors.errorMessages.length > 0) {
-        ctx.logger.warn(`Error generating content for ${nodeType.typeName}:\n  - ${tolerateErrors.errorMessages.join("\n  - ")}`);
+    const errorMessages = dedupMessages(tolerateErrors.errorMessages);
+    if (errorMessages.length > 0) {
+        ctx.logger.warn(`Error generating content for ${nodeType.typeName}:\n  - ${errorMessages.join("\n  - ")}`);
     }
     await ctx.service.connector.addMultipleDocumentContents(fqdn, {
         parentNodeId,
@@ -187,8 +189,9 @@ async function addParts(ctx, report, siteOptions, nodeOptions) {
         tolerateErrors,
         debugName: nodeType.kebabName,
     });
-    if (tolerateErrors.errorMessages.length > 0) {
-        ctx.logger.warn(`Error generating content for ${nodeType.typeName}:\n  - ${tolerateErrors.errorMessages.join("\n  - ")}`);
+    const errorMessages = dedupMessages(tolerateErrors.errorMessages);
+    if (errorMessages.length > 0) {
+        ctx.logger.warn(`Error generating content for ${nodeType.typeName}:\n  - ${errorMessages.join("\n  - ")}`);
     }
     await ctx.service.connector.addMultiplePartContents(fqdn, {
         parentNodeId,

package/gen-backend/dist/generator/lib/parse-llm-response.js CHANGED Viewed

@@ -106,9 +106,9 @@ export function parseLlmRawTags(llmResponse, tagNames, options = {}) {
         const current = matches[i];
         if (current.isOpening) {
             // Find the next corresponding closing tag
-            let j = i + 1;
+            const j = i + 1;
             let foundClosing = false;
-            while (j < matches.length) {
+            if (j < matches.length) {
                 const next = matches[j];
                 // If we encounter another opening tag of any type before finding our closing tag,
                 // it's an error if not tolerating errors
@@ -119,9 +119,15 @@ export function parseLlmRawTags(llmResponse, tagNames, options = {}) {
                     tolerateErrors.errorMessages.push(message);
                     foundClosing = undefined;
                     // If we are tolerating errors, we skip this opening tag entirely
-                    break;
                 }
-                if (!next.isOpening && next.tagName === current.tagName) {
+                else {
+                    if (next.tagName !== current.tagName) {
+                        // Found a non-matching closing tag
+                        const message = `Mismatched tags: opening <${current.tagName}>, closing </${next.tagName}>`;
+                        if (!tolerateErrors)
+                            throw new Error(message);
+                        tolerateErrors.errorMessages.push(message);
+                    }
                     // Found a matching closing tag
                     const contentStart = current.position + `<${current.tagName}>`.length;
                     const contentEnd = next.position;
@@ -133,19 +139,7 @@ export function parseLlmRawTags(llmResponse, tagNames, options = {}) {
                     // Skip to after this closing tag
                     i = j;
                     foundClosing = true;
-                    break;
                 }
-                if (!next.isOpening && next.tagName !== current.tagName) {
-                    // Found a non-matching closing tag
-                    const message = `Mismatched tags: opening <${current.tagName}>, closing </${next.tagName}>`;
-                    if (!tolerateErrors)
-                        throw new Error(message);
-                    tolerateErrors.errorMessages.push(message);
-                    foundClosing = undefined;
-                    // If we are tolerating errors, we skip this current opening tag entirely
-                    break;
-                }
-                ++j;
             }
             // Handle case where no matching closing tag was found
             if (foundClosing === false) {

package/gen-backend/dist/generator/llm-queries/invoke-new-site-analysis.js CHANGED Viewed

@@ -18,13 +18,13 @@ const fieldsPrompt = await createPromptTemplate({
 export async function invokeNewSiteAnalysis(ctx, input) {
     const { analysis, explanation, unusedInformation } = await invokeAnalysisStep1(ctx, input);
     const siteSchema = createSiteSchemaFromAnalysis(analysis);
-    await invokeAnalysisStep2(ctx, { prompt: unusedInformation ?? "" }, siteSchema);
+    const { unusedInformation: unusedInformation2 } = await invokeAnalysisStep2(ctx, { prompt: createUnusedInformationPrompt(unusedInformation, analysis) ?? "" }, siteSchema);
     reorderSiteSchemaNodeTypes(siteSchema);
     const l10n = createL10n(analysis, siteSchema);
     const siteTitle = {
         [analysis.siteProperties.language]: analysis.siteProperties.title,
     };
-    if (!unusedInformation) {
+    if (!unusedInformation2) {
         await updateSession(ctx, { status: "analyzed", promptCountInc: 1 });
         return {
             siteTitle,
@@ -34,9 +34,9 @@ export async function invokeNewSiteAnalysis(ctx, input) {
             explanation,
         };
     }
-    ctx.logger.debug("Unused information:", unusedInformation);
+    ctx.logger.debug("Unused information:", unusedInformation2);
     const updated = await invokeUpdateSiteSchema(ctx, {
-        prompt: unusedInformation,
+        prompt: unusedInformation2,
         generatedSchema: {
             siteTitle,
             siteSchema,
@@ -125,16 +125,23 @@ siteSchema) {
         const llmMessage = await fieldsPrompt.pipe(ctx.goodModel).invoke(llmInput);
         llmMessageContent = await debug.getMessageContent(llmMessage);
     }
-    const { assignedFields } = parseLlmResponseAsProperties(llmMessageContent, [
+    const { assignedFields, unusedInformation } = parseLlmResponseAsProperties(llmMessageContent, [
         {
             tagName: "yaml_result",
             key: "assignedFields",
             format: "yaml",
         },
+        {
+            tagName: "unused_information_md",
+            key: "unusedInformation",
+            format: "markdown",
+            optional: true,
+        },
     ]);
     if (siteSchema.nodeTypes) {
         assignFieldsToNodeTypes(ctx, assignedFields, siteSchema.nodeTypes);
     }
+    return { unusedInformation };
 }
 function assignFieldsToNodeTypes(ctx, assignedFields, nodeTypes) {
     const remainingTypeNames = new Set(Object.keys(assignedFields));
@@ -172,3 +179,15 @@ function reorderSiteSchemaNodeTypes(siteSchema) {
         "orderChildrenBy",
     ]));
 }
/**
 * Builds the prompt text made of the per-node-type prompts found in the
 * analysis dictionary, followed by the unused information (if any).
 *
 * Each dictionary entry that has a truthy `prompt` property contributes one
 * bullet of the form `- <typeName>: <prompt>` under a `To do:` heading.
 *
 * @param {string | undefined} unusedInformation - Free text to append after
 *   the to-do list; may be empty or undefined.
 * @param {{ dictionary: Record<string, { prompt?: string }> }} analysis -
 *   Analysis result whose `dictionary` maps type names to entries.
 * @returns {string | undefined} The combined prompt, or `unusedInformation`
 *   unchanged when no dictionary entry carries a prompt.
 */
function createUnusedInformationPrompt(unusedInformation, analysis) {
    const prompts = Object.entries(analysis.dictionary)
        .filter(([, entry]) => Boolean(entry.prompt))
        .map(([typeName, entry]) => `${typeName}: ${entry.prompt}`);
    if (prompts.length === 0) {
        return unusedInformation;
    }
    // The separator must start each following item on its own line with a
    // bullet marker; the first bullet is written explicitly before the join.
    const nodeTypePrompts = `To do:\n\n- ${prompts.join("\n- ")}`;
    return unusedInformation ? `${nodeTypePrompts}\n\n${unusedInformation}` : nodeTypePrompts;
}

package/gen-backend/dist/generator/site-schema-generator/create-site-schema.js CHANGED Viewed

@@ -9,6 +9,7 @@ export function createSiteSchemaFromAnalysis(analysis) {
             "@paroicms/content-loading-plugin",
             "@paroicms/public-menu-plugin",
             "@paroicms/contact-form-plugin",
+            "@paroicms/video-plugin",
         ],
         nodeTypes: [
             {

package/gen-backend/dist/plugin.js CHANGED Viewed

@@ -31,7 +31,7 @@ const plugin = {
             modelName: "claude-3-7-sonnet-20250219",
             anthropicApiKey: pluginConf.anthropicApiKey,
             temperature: 0.1,
-            maxTokens: 4096,
+            maxTokens: 6500,
             clientOptions: {
                 timeout: 60_000,
             },
@@ -40,7 +40,7 @@ const plugin = {
             modelName: "claude-3-7-sonnet-20250219",
             anthropicApiKey: pluginConf.anthropicApiKey,
             temperature: 0.1,
-            maxTokens: 4096,
+            maxTokens: 3000,
             clientOptions: {
                 timeout: 20_000,
             },

package/gen-backend/prompts/0-context.md CHANGED Viewed

@@ -1,4 +1,4 @@
-We use **ParoiCMS** technology. With this technology, a web page is called a **document**. A website is a tree of documents. The home page is a document, the site section with news posts is a document, each post is a document. Each document has its own path in the URL.
+We use **ParoiCMS** for creating a website. With this technology, a web page is called a **document**. A website is a tree of documents. The home page is a document, the site section with news posts is a document, each post is a document. Each document has its own path in the URL.
 There is a special kind of document that we want to detect: **routing documents** are the site sections. They can't be duplicated. They are never items of a list. For example, the homepage document, the search-page document, the "about us" document, and the parent page of blog posts are _routing documents_. Other documents are **regular documents**, and they are always items of a list.
@@ -6,4 +6,4 @@ A document always has the following base attributes: a localized _title_, a _pub
 A document can contain lists of **parts**. A _part_ is a sub-section of a document, or of another _part_. A part always has a _publish date_ and a _draft_ flag. It may contain a sequence of fields and/or a sequence of child parts. A part is always an item of a list.
-Important: In the current version, we don't support any taxonomy. No categories, no tags etc.
+Any routing document that is the parent of regular documents can be used as a **taxonomy**; its terms are the regular child documents. A taxonomy can then be used in any document or part by declaring a **labeling field**.

package/gen-backend/prompts/new-site-1-analysis.md CHANGED Viewed

@@ -100,7 +100,9 @@ Here's an example of correct output using parts, and with the default contact an
 * `home` (routing document)
   * list of `homeSection` (parts), list name: `homeSections`
   * `news` (routing document)
-    * list of `article` (regular documents)
+    * list of `post` (regular documents)
+    * `tags` (routing document)
+      * list of `tag` (regular documents)
   * `pages` (routing document)
     * list of `page` (regular documents)
       * list of `pageSection` (parts), list name: `pageSections`
@@ -125,6 +127,7 @@ Guidelines for creating the dictionnary YAML:
   - ogType: (optional, and document only) If you think of a particular Open-Graph type for this document, give it here.
   - label: A label of the node type, in the _website language_.
   - description: A description (5-40 words) for describing the purpose and theme of the node type. Write it in the _website language_.
+  - prompt: This is an optional property. If there is information to process later about this node type (a description of fields), then write it here. Keep it short.
 - For a list type (only for part list, never for document list), provide the following properties:
   - confidence: Your confidence level for the accuracy of this node type (0.0-1.0).
   - kind: Must be `partList`.
@@ -155,14 +158,26 @@ news:
   kind: routingDocument
   entryPage: true
   label: News
-  description: This is the blog section of the website. The news document contains all the topical articles.
-article:
+  description: This is the blog section of the website. The news document contains all the topical posts.
+post:
   confidence: 0.8
   kind: regularDocument
   temporal: true
   ogType: article
-  label: Article
-  description: A topical article about the subject of the website whatever it is.
+  label: Post
+  description: A topical post about the subject of the website whatever it is.
+  prompt: Add a labeling field using the tags taxonomy
+tags:
+  confidence: 0.9
+  kind: routingDocument
+  label: Tags
+  description: Tags taxonomy for post documents.
+tag:
+  confidence: 0.9
+  kind: regularDocument
+  temporal: true
+  label: Tag
+  description: A tag is a term in the tags taxonomy.
 pages:
   confidence: 0.9
   kind: routingDocument

package/gen-backend/prompts/new-site-2-fields.md CHANGED Viewed

@@ -33,6 +33,7 @@ Guidelines for creating the dictionnary YAML:
   - By default, for most of node types, if you are not sure about what could be the best fields, then remember that a document is a webpage and just use a `[htmlContent]`.
   - Except if there are specific instructions in the website description, here is the default value for the `_site` node type: `["logo", "footerMention"]`.
 - Gallery of medias: there is a predefined field named `"gallery"`. It contains a list of medias. The theme can render it as a carousel, a slider, an image gallery, a slideshow, etc.
+- This task is about predefined fields only. Custom fields will be added in a later step.
 Here is an example of expected output:

package/gen-backend/prompts/update-site-schema-2-execute.md CHANGED Viewed

@@ -73,7 +73,23 @@ Important:
 - Never add an unknown predefined field.
 - The type name of the "site" node type is omitted from the JSON but its value is always `_site`.
-# 3. Examine the current JSON data, which conforms to the `JtSiteSchema` type:
+# 3. Labeling fields (using a taxonomy)
+A labeling field lets the user assign taxonomy terms to a document (or part).
+<field_type_example>
+{{
+  "name": "tags",
+  "localized": false,
+  "storedAs": "labeling",
+  "taxonomy": "tags",
+  "multiple": true
+}},
+</field_type_example>
+Most of the time, the field name will be the same as the taxonomy type name.
+# 4. Examine the current JSON data, which conforms to the `JtSiteSchema` type:
 <site_schema_json>
 {siteSchemaJson}
@@ -85,19 +101,19 @@ Also, the attached locales:
 {l10nJson}
 </l10n_json>
-# 4. Now, here is what to do:
+# 5. Now, here is what to do:
 <user_request>
 {taskDetailsMd}
 </user_request>
-# 5. Guidelines
+# 6. Guidelines
 - Don't assume how the CMS works. If you are not sure how to do something, don't do it.
 - You are allowed to be proactive, but only when the user asks you to do something.
 - Remember to adhere strictly to the TypeScript typing when making changes. If the update message requests changes that would violate the typing, then prioritize maintaining the correct structure over making those specific changes.
-# 6. Output
+# 7. Output
 If there is a change in the site schema, then provide the updated site schema in JSON within <updated_site_schema_json> tags. Otherwise, leave this tag empty.