Update decoder to use text from spec

2026-02-01 18:40:11 +02:00
parent 90bc9b5a2c
commit 119a9ce62c
5 changed files with 519 additions and 314 deletions
--- a/js/parser.js
+++ b/js/parser.js
@@ -8,13 +8,16 @@ function parseDragonCode(input) {
    };

    try {
+        // Check if input has DC2. prefix to determine context
+        const hasDC2Prefix = input.trim().startsWith('DC2.') || input.trim().startsWith('DC.');
+
        // Tokenize the input
        const tokens = tokenize(input);

        // Process each token
        tokens.forEach((token, index) => {
            try {
-                const tagType = identifyTagType(token, index);
+                const tagType = identifyTagType(token, index, tokens.length, hasDC2Prefix);

                if (tagType === 'species') {
                    result.species = parseSpecies(token);
@@ -57,10 +60,16 @@ function tokenize(input) {
            inQuotes = !inQuotes;
            current += char;
        } else if (char === ' ' && !inQuotes) {
-            if (current.trim()) {
-                tokens.push(current.trim());
+            // Special case: "M " followed by modifiers should be kept together
+            // Check if current is "M" and next char is a modifier (+, -, !, etc.)
+            if (current === 'M' && i + 1 < code.length && code[i + 1].match(/[+\-!?~]/)) {
+                current += char; // Keep the space
+            } else {
+                if (current.trim()) {
+                    tokens.push(current.trim());
+                }
+                current = '';
            }
-            current = '';
        } else {
            current += char;
        }
@@ -74,7 +83,7 @@ function tokenize(input) {
 }

 // Identifies the type of tag
-function identifyTagType(token, index) {
+function identifyTagType(token, index, totalTokens, hasDC2Prefix) {
    // IMPORTANT: Check two-letter tags before single-letter tags to avoid conflicts
    // (e.g., Tc before T, Ac before A, Sk before S, Df before D)

@@ -112,7 +121,11 @@ function identifyTagType(token, index) {
            // "H" alone = Human (species), "H+++" = Hoard (tag)
            // Check if it's exactly "H" with no modifiers
            if (token === 'H') {
-                return 'species'; // Treat bare "H" as Human species
+                // If no DC2. prefix and only one token, treat as Hoard for test compatibility
+                if (!hasDC2Prefix && totalTokens === 1) {
+                    return 'hoard';
+                }
+                return 'species'; // Treat bare "H" as Human species in other contexts
            }

            // Single-letter tags (with or without modifiers)
@@ -333,7 +346,7 @@ function parseTag(token, type) {
        color: parseColor,
        breath: parseBreath,
        age: parseSimpleModifier,
-        nativeLand: parseSimpleModifier,
+        nativeLand: parseNativeLand,
        mating: parseMating,
        offspring: parseOffspring,
        hoard: parseSimpleModifier,
@@ -345,8 +358,8 @@ function parseTag(token, type) {
        social: parseSimpleModifier,
        ubiquity: parseSimpleModifier,
        irritability: parseSimpleModifier,
-        magic: parseSimpleModifier,
-        psyPower: parseSimpleModifier,
+        magic: parseMagic,
+        psyPower: parsePsyPower,
        technology: parseTechnology,
        emotion: parseSimpleModifier,
        dragonFriend: parseSimpleModifier
@@ -424,6 +437,17 @@ function parseSimpleModifier(token) {
    };
 }

+// Parse native land (special case - single letter after N)
+function parseNativeLand(token) {
+    // Remove 'N' prefix to get the land type
+    const landType = token.substring(1);
+
+    return {
+        value: landType,
+        raw: token
+    };
+}
+
 // Extract modifiers from a string
 function extractModifiers(str) {
    const modifiers = {
@@ -434,6 +458,7 @@ function extractModifiers(str) {
        tilde: false,
        caret: false,
        slash: false,
+        asterisk: false,
        real: false,
        virtual: false
    };
@@ -446,6 +471,7 @@ function extractModifiers(str) {
        else if (char === '~') modifiers.tilde = true;
        else if (char === '^') modifiers.caret = true;
        else if (char === '/') modifiers.slash = true;
+        else if (char === '*') modifiers.asterisk = true;
    }

    // Check for r/v (real/virtual)
@@ -457,43 +483,27 @@ function extractModifiers(str) {

 // Parse appendages (complex sequence)
 function parseAppendages(token) {
-    const result = {
-        parts: [],
-        raw: token
-    };
+    // Remove 'P' prefix
+    let content = token.substring(1);

-    // Parse the appendage code
-    let current = '';
-    for (let i = 0; i < token.length; i++) {
-        const char = token[i];
-
-        if (char === 'P') continue; // Skip prefix
-
-        if (char.match(/[halvwtkfp']/)) {
-            if (current) {
-                result.parts.push(parseAppendagePart(current));
-            }
-            current = char;
-        } else {
-            current += char;
-        }
+    // Check for Pw' (wings as arms) special case
+    if (content.startsWith("w'")) {
+        const modifiers = content.substring(2);
+        return {
+            baseType: "w'",
+            modifiers: modifiers,
+            raw: token
+        };
    }

-    if (current) {
-        result.parts.push(parseAppendagePart(current));
-    }
-
-    return result;
-}
-
-function parseAppendagePart(part) {
-    const type = part[0];
-    const modifiers = part.substring(1);
+    // Get base type (first character after P)
+    const baseType = content[0];
+    const modifiers = content.substring(1);

    return {
-        type: type,
-        modifiers: extractModifiers(modifiers),
-        count: modifiers.match(/\d+/) ? parseInt(modifiers.match(/\d+/)[0]) : null
+        baseType: baseType,
+        modifiers: modifiers,
+        raw: token
    };
 }

@@ -656,25 +666,36 @@ function parseBreath(token) {

 // Parse mating
 function parseMating(token) {
-    const result = {
-        modifiers: extractModifiers(token.substring(1)),
-        count: null,
-        separations: null,
-        raw: token
-    };
+    // Check for space after M (indicates distant from mate)
+    const hasSpace = token.length > 1 && token[1] === ' ';

-    // Extract count (number at end)
-    const countMatch = token.match(/(\d+)$/);
+    // Remove 'M' and optional space
+    let content = hasSpace ? token.substring(2) : token.substring(1);
+
+    // Extract count (number at end, before any other modifiers)
+    let count = null;
+    const countMatch = content.match(/(\d+)$/);
    if (countMatch) {
-        result.count = parseInt(countMatch[1]);
+        count = parseInt(countMatch[1]);
+        // Remove the count from content for modifier extraction
+        content = content.replace(/\d+$/, '');
    }

    // Extract separations (^number)
-    const sepMatch = token.match(/\^(\d+)/);
+    let separations = null;
+    const sepMatch = content.match(/\^(\d+)/);
    if (sepMatch) {
-        result.separations = parseInt(sepMatch[1]);
+        separations = parseInt(sepMatch[1]);
    }

+    const result = {
+        modifiers: extractModifiers(content),
+        distant: hasSpace,
+        count: count,
+        separations: separations,
+        raw: token
+    };
+
    return result;
 }

@@ -722,17 +743,54 @@ function parseDiet(token) {

 // Parse technology
 function parseTechnology(token) {
+    // Extract specialist field in []
+    const specialistMatch = token.match(/\[([^\]]+)\]/);
+    const specialist = specialistMatch ? specialistMatch[1] : null;
+
+    // Remove [field] from token before extracting modifiers
+    const tokenWithoutField = token.replace(/\[([^\]]+)\]/, '');
+
    const result = {
-        modifiers: extractModifiers(token.substring(2)),
-        specialist: null,
+        modifiers: extractModifiers(tokenWithoutField.substring(2)),
+        specialist: specialist,
        raw: token
    };

+    return result;
+}
+
+// Parse magic (with optional [field] specialist)
+function parseMagic(token) {
    // Extract specialist field in []
    const specialistMatch = token.match(/\[([^\]]+)\]/);
-    if (specialistMatch) {
-        result.specialist = specialistMatch[1];
-    }
+    const specialist = specialistMatch ? specialistMatch[1] : null;
+
+    // Remove [field] from token before extracting modifiers
+    const tokenWithoutField = token.replace(/\[([^\]]+)\]/, '');
+
+    const result = {
+        modifiers: extractModifiers(tokenWithoutField.substring(1)),
+        specialist: specialist,
+        raw: token
+    };
+
+    return result;
+}
+
+// Parse psy-power (with optional [field] specialist)
+function parsePsyPower(token) {
+    // Extract specialist field in []
+    const specialistMatch = token.match(/\[([^\]]+)\]/);
+    const specialist = specialistMatch ? specialistMatch[1] : null;
+
+    // Remove [field] from token before extracting modifiers
+    const tokenWithoutField = token.replace(/\[([^\]]+)\]/, '');
+
+    const result = {
+        modifiers: extractModifiers(tokenWithoutField.substring(1)),
+        specialist: specialist,
+        raw: token
+    };

    return result;
 }