npm - @shd101wyy/yo - Versions diffs - 0.1.5 → 0.1.7 - Mend

@shd101wyy/yo 0.1.5 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50) hide show

package/README.md +8 -6
package/out/cjs/index.cjs +691 -636
package/out/cjs/yo-cli.cjs +710 -653
package/out/esm/index.mjs +649 -594
package/out/types/src/build-runner.d.ts +1 -1
package/out/types/src/codegen/async/runtime-io-common.d.ts +2 -1
package/out/types/src/codegen/async/runtime.d.ts +5 -1
package/out/types/src/codegen/codegen-c.d.ts +2 -0
package/out/types/src/codegen/functions/collection.d.ts +1 -1
package/out/types/src/codegen/functions/context.d.ts +1 -0
package/out/types/src/codegen/functions/generation.d.ts +10 -0
package/out/types/src/codegen/utils/index.d.ts +4 -0
package/out/types/src/env.d.ts +1 -0
package/out/types/src/evaluator/builtins/build.d.ts +1 -0
package/out/types/src/evaluator/builtins/comptime-index-fns.d.ts +17 -0
package/out/types/src/evaluator/calls/index-trait.d.ts +17 -0
package/out/types/src/evaluator/context.d.ts +19 -14
package/out/types/src/evaluator/index.d.ts +3 -1
package/out/types/src/evaluator/trait-checking.d.ts +1 -0
package/out/types/src/evaluator/values/anonymous-module.d.ts +3 -2
package/out/types/src/expr.d.ts +22 -1
package/out/types/src/module-manager.d.ts +1 -0
package/out/types/src/target.d.ts +1 -0
package/out/types/src/value.d.ts +4 -1
package/out/types/tsconfig.tsbuildinfo +1 -1
package/package.json +1 -1
package/std/build.yo +2 -1
package/std/collections/array_list.yo +114 -26
package/std/collections/btree_map.yo +13 -3
package/std/collections/deque.yo +10 -0
package/std/collections/hash_map.yo +15 -0
package/std/collections/priority_queue.yo +5 -5
package/std/encoding/html.yo +283 -0
package/std/encoding/html_char_utils.yo +36 -0
package/std/encoding/html_entities.yo +2262 -0
package/std/encoding/punycode.yo +366 -0
package/std/encoding/toml.yo +1 -1
package/std/fmt/to_string.yo +5 -4
package/std/glob/index.yo +2 -2
package/std/libc/wctype.yo +55 -0
package/std/path.yo +6 -6
package/std/prelude.yo +826 -205
package/std/process.yo +1 -1
package/std/regex/compiler.yo +11 -11
package/std/regex/index.yo +2 -4
package/std/regex/parser.yo +69 -4
package/std/regex/vm.yo +53 -46
package/std/string/string.yo +1424 -1339
package/std/string/unicode.yo +242 -0
package/out/types/src/evaluator/calls/array.d.ts +0 -14

package/std/encoding/punycode.yo ADDED Viewed

@@ -0,0 +1,366 @@
+// Punycode codec (RFC 3492)
+//
+// Provides punycode encoding/decoding and IDN hostname conversion.
+//
+// Example:
+//   { punycode_decode, punycode_encode, to_unicode, to_ascii } :: import "std/encoding/punycode";
+//
+//   encoded := punycode_encode(`München`);
+//   decoded := punycode_decode(encoded);
+//   ascii_domain := to_ascii(`münchen.de`);  // "xn--mnchen-3ya.de"
+//   unicode_domain := to_unicode(ascii_domain);  // "münchen.de"
+open import "../string";
+{ ArrayList } :: import "../collections/array_list";
+// Punycode constants (RFC 3492 section 5)
+// These are the parameter values the RFC fixes for Punycode; the encoder and
+// decoder below must agree on all of them.
+// Number of distinct digit values: letters map to 0..25, '0'..'9' to 26..35.
+_BASE :: i32(36);
+// Lower clamp of the per-digit threshold t in the encode/decode loops.
+_TMIN :: i32(1);
+// Upper clamp of the per-digit threshold t in the encode/decode loops.
+_TMAX :: i32(26);
+// Added to the scaled delta in the denominator of _adapt's final formula.
+_SKEW :: i32(38);
+// Divisor _adapt applies to the delta on the first adaptation only.
+_DAMP :: i32(700);
+// Bias both punycode_encode and punycode_decode start from.
+_INITIAL_BIAS :: i32(72);
+// Starting value of n (0x80): the first code point that is not basic ASCII.
+_INITIAL_N :: i32(128);
+// Map one punycode digit character (passed as its code point) to its value.
+// Letters of either case give 0..25 and '0'..'9' give 26..35; any other code
+// point gives -1 so the caller can reject the input.
+_decode_digit :: (fn(cp: i32) -> i32)({
+  (is_lower : bool) = ((cp >= i32(0x61)) && (cp <= i32(0x7A)));
+  (is_upper : bool) = ((cp >= i32(0x41)) && (cp <= i32(0x5A)));
+  (is_number : bool) = ((cp >= i32(0x30)) && (cp <= i32(0x39)));
+  // The three ranges are disjoint, so the order of the tests does not matter.
+  // Digits sit after the 26 letters: '0' (0x30) maps to 26.
+  cond(
+    is_lower => (cp - i32(0x61)),
+    is_upper => (cp - i32(0x41)),
+    is_number => ((cp - i32(0x30)) + i32(26)),
+    true => i32(-1)
+  )
+});
+// Turn a digit value into its punycode character byte.
+// Values below 26 become lowercase 'a'..'z'; values from 26 up are mapped
+// onto '0' onwards (26 -> '0'). Callers pass values in 0..35.
+_encode_digit :: (fn(d: i32) -> u8)({
+  // Distance from the digit value to its ASCII code: 'a' for the letter
+  // range, '0' minus 26 for the numeric range.
+  (offset : i32) = cond(
+    (d >= i32(26)) => (i32(0x30) - i32(26)),
+    true => i32(0x61)
+  );
+  u8((d + offset))
+});
+// Bias adaptation (RFC 3492 section 3.4).
+//   delta_val:  the delta just encoded or decoded
+//   num_points: number of code points handled so far, including the current
+//               one (used as a divisor, so callers pass at least 1)
+//   first_time: true for the first adaptation, which damps by _DAMP instead
+//               of halving
+// Returns the bias to use for the next delta.
+_adapt :: (fn(delta_val: i32, num_points: i32, first_time: bool) -> i32)({
+  (span : i32) = (_BASE - _TMIN);
+  // Above this value the delta is divided down again by span.
+  (limit : i32) = ((span * _TMAX) / i32(2));
+  (divisor : i32) = cond(
+    first_time => _DAMP,
+    true => i32(2)
+  );
+  (scaled : i32) = (delta_val / divisor);
+  scaled = (scaled + (scaled / num_points));
+  (steps : i32) = i32(0);
+  while (scaled > limit), {
+    scaled = (scaled / span);
+    steps = (steps + _BASE);
+  };
+  (steps + (((span + i32(1)) * scaled) / (scaled + _SKEW)))
+});
+// Append the UTF-8 encoding of one code point to `out`.
+// Values below 0x80 are pushed as a single byte; larger values use a 2-, 3-
+// or 4-byte sequence chosen by magnitude. No range validation is done here.
+_encode_codepoint :: (fn(cp: i32, out: *(ArrayList(u8))) -> unit)({
+  // Continuation bytes (10xxxxxx) for the three lowest 6-bit groups; each
+  // branch below pushes only the ones its sequence length needs.
+  (tail_low : u8) = u8((i32(0x80) | (cp & i32(0x3F))));
+  (tail_mid : u8) = u8((i32(0x80) | ((cp >> i32(6)) & i32(0x3F))));
+  (tail_high : u8) = u8((i32(0x80) | ((cp >> i32(12)) & i32(0x3F))));
+  cond(
+    (cp >= i32(0x10000)) => {
+      out.*.push(u8((i32(0xF0) | (cp >> i32(18)))));
+      out.*.push(tail_high);
+      out.*.push(tail_mid);
+      out.*.push(tail_low);
+    },
+    (cp >= i32(0x800)) => {
+      out.*.push(u8((i32(0xE0) | (cp >> i32(12)))));
+      out.*.push(tail_mid);
+      out.*.push(tail_low);
+    },
+    (cp >= i32(0x80)) => {
+      out.*.push(u8((i32(0xC0) | (cp >> i32(6)))));
+      out.*.push(tail_low);
+    },
+    true => {
+      out.*.push(u8(cp));
+    }
+  );
+});
+// Decode the UTF-8 bytes of `s` into a list of code points.
+// Decoding is lenient: a byte that cannot start a sequence (0x80..0xBF or
+// 0xF8 and above) becomes U+FFFD, continuation bytes are not validated, and
+// a sequence cut off by the end of the input keeps only the bits read so far.
+_string_to_codepoints :: (fn(s: String) -> ArrayList(i32))({
+  (raw : ArrayList(u8)) = s.as_bytes();
+  (total : usize) = raw.len();
+  (points : ArrayList(i32)) = ArrayList(i32).new();
+  (pos : usize) = usize(0);
+  while (pos < total), {
+    (lead : i32) = i32(raw.get(pos).unwrap());
+    // Sequence length implied by the lead byte; anything unrecognised is
+    // consumed as a single byte.
+    (width : usize) = cond(
+      ((lead >= i32(0xF0)) && (lead < i32(0xF8))) => usize(4),
+      ((lead >= i32(0xE0)) && (lead < i32(0xF0))) => usize(3),
+      ((lead >= i32(0xC0)) && (lead < i32(0xE0))) => usize(2),
+      true => usize(1)
+    );
+    // Payload bits carried by the lead byte itself.
+    (value : i32) = cond(
+      (lead < i32(0x80)) => lead,
+      (width == usize(2)) => (lead & i32(0x1F)),
+      (width == usize(3)) => (lead & i32(0x0F)),
+      (width == usize(4)) => (lead & i32(0x07)),
+      true => i32(0xFFFD)
+    );
+    // Fold in six bits from each following byte that actually exists.
+    (offset : usize) = usize(1);
+    while (offset < width), (offset = (offset + usize(1))), {
+      if(((pos + offset) < total), {
+        value = ((value << i32(6)) | (i32(raw.get((pos + offset)).unwrap()) & i32(0x3F)));
+      });
+    };
+    points.push(value);
+    pos = (pos + width);
+  };
+  points
+});
+// Decode a punycode-encoded string (without the xn-- prefix).
+//
+// input: the punycode label body. Everything before the last '-' is copied
+//        as literal basic (ASCII) code points; everything after it is read
+//        as a sequence of variable-length integers (RFC 3492 section 6.2).
+// Returns .Some(decoded) on success, .None on error. Errors are: a non-ASCII
+// byte in the basic part, a character that is not a punycode digit, input
+// that ends in the middle of an integer, arithmetic overflow (RFC 3492
+// section 6.4), or a decoded value that is not a Unicode scalar value
+// (above 0x10FFFF or inside the surrogate range 0xD800..0xDFFF).
+punycode_decode :: (fn(input: String) -> Option(String))({
+  // Bounds for the overflow and range checks below. Every checked quantity
+  // (i_val, w, n) stays non-negative, so the subtractions cannot underflow.
+  (max_int : i32) = i32(0x7FFFFFFF);
+  (max_code_point : i32) = i32(0x10FFFF);
+  (bytes : ArrayList(u8)) = input.as_bytes();
+  (input_len : i32) = i32(bytes.len());
+  // Find the last '-' separator
+  (basic_end : i32) = i32(-1);
+  (j : i32) = (input_len - i32(1));
+  while ((j >= i32(0)) && (basic_end < i32(0))), {
+    if((i32(bytes.get(usize(j)).unwrap()) == i32(0x2D)), {
+      basic_end = j;
+    });
+    j = (j - i32(1));
+  };
+  // Copy the basic code points that precede the separator
+  (output : ArrayList(i32)) = ArrayList(i32).new();
+  (basic_length : i32) = cond(
+    (basic_end >= i32(0)) => basic_end,
+    true => i32(0)
+  );
+  (bi : i32) = i32(0);
+  while (bi < basic_length), {
+    (cp : i32) = i32(bytes.get(usize(bi)).unwrap());
+    if((cp >= i32(0x80)), {
+      return .None;
+    });
+    output.push(cp);
+    bi = (bi + i32(1));
+  };
+  // Start reading digits just after the separator, or at 0 if there is none
+  (idx : i32) = cond(
+    (basic_end >= i32(0)) => (basic_end + i32(1)),
+    true => i32(0)
+  );
+  (n : i32) = _INITIAL_N;
+  (bias : i32) = _INITIAL_BIAS;
+  (i_val : i32) = i32(0);
+  while (idx < input_len), {
+    // Decode one variable-length integer into i_val
+    (old_i : i32) = i_val;
+    (w : i32) = i32(1);
+    (k : i32) = _BASE;
+    (decode_done : bool) = false;
+    while (!(decode_done)), {
+      if((idx >= input_len), {
+        return .None;
+      });
+      (digit : i32) = _decode_digit(i32(bytes.get(usize(idx)).unwrap()));
+      idx = (idx + i32(1));
+      if((digit < i32(0)), {
+        return .None;
+      });
+      // Fail before i_val + digit * w can exceed max_int
+      if((digit > ((max_int - i_val) / w)), {
+        return .None;
+      });
+      i_val = (i_val + (digit * w));
+      (t : i32) = cond(
+        (k <= bias) => _TMIN,
+        (k >= (bias + _TMAX)) => _TMAX,
+        true => (k - bias)
+      );
+      if((digit < t), {
+        decode_done = true;
+      }, {
+        // Fail before w * (_BASE - t) can exceed max_int
+        if((w > (max_int / (_BASE - t))), {
+          return .None;
+        });
+        w = (w * (_BASE - t));
+        k = (k + _BASE);
+      });
+    };
+    (out_len : i32) = (i32(output.len()) + i32(1));
+    bias = _adapt((i_val - old_i), out_len, (old_i == i32(0)));
+    // i_val / out_len is how far n advances. Refuse to step past the last
+    // Unicode code point, which also rules out i32 overflow of n.
+    (n_step : i32) = (i_val / out_len);
+    if((n_step > (max_code_point - n)), {
+      return .None;
+    });
+    n = (n + n_step);
+    // Surrogates cannot be represented in well-formed UTF-8
+    if(((n >= i32(0xD800)) && (n <= i32(0xDFFF))), {
+      return .None;
+    });
+    i_val = (i_val % out_len);
+    // Insert code point at position i_val
+    output.push(i32(0));
+    (shift_idx : i32) = (i32(output.len()) - i32(1));
+    while (shift_idx > i_val), {
+      &(output(usize(shift_idx))).* = output(usize((shift_idx - i32(1))));
+      shift_idx = (shift_idx - i32(1));
+    };
+    &(output(usize(i_val))).* = n;
+    i_val = (i_val + i32(1));
+  };
+  // Convert code points to UTF-8
+  (result_bytes : ArrayList(u8)) = ArrayList(u8).new();
+  (ri : usize) = usize(0);
+  while (ri < output.len()), {
+    _encode_codepoint(output.get(ri).unwrap(), (&result_bytes));
+    ri = (ri + usize(1));
+  };
+  .Some(String.from_bytes(result_bytes))
+});
+// Encode a Unicode string to punycode (without the xn-- prefix).
+//
+// Basic (ASCII) code points are copied first, followed by a '-' separator if
+// there was at least one. The remaining code points are then emitted in
+// increasing code point order as variable-length integers (RFC 3492
+// section 6.3). No overflow detection is performed.
+punycode_encode :: (fn(input: String) -> String)({
+  (points : ArrayList(i32)) = _string_to_codepoints(input);
+  (total : i32) = i32(points.len());
+  (encoded : ArrayList(u8)) = ArrayList(u8).new();
+  // Copy the basic code points in their original order
+  (num_basic : i32) = i32(0);
+  (scan : i32) = i32(0);
+  while (scan < total), (scan = (scan + i32(1))), {
+    (c : i32) = points.get(usize(scan)).unwrap();
+    if((c < i32(0x80)), {
+      encoded.push(u8(c));
+      num_basic = (num_basic + i32(1));
+    });
+  };
+  // 0x2D is '-', the separator between the basic part and the digits
+  if((num_basic > i32(0)), {
+    encoded.push(u8(0x2D));
+  });
+  (emitted : i32) = num_basic;
+  (current : i32) = _INITIAL_N;
+  (pending : i32) = i32(0);
+  (bias : i32) = _INITIAL_BIAS;
+  while (emitted < total), {
+    // Smallest code point not yet handled, i.e. the minimum that is >= current
+    (lowest : i32) = i32(0x7FFFFFFF);
+    (probe : i32) = i32(0);
+    while (probe < total), (probe = (probe + i32(1))), {
+      (c : i32) = points.get(usize(probe)).unwrap();
+      if(((c >= current) && (c < lowest)), {
+        lowest = c;
+      });
+    };
+    pending = (pending + ((lowest - current) * (emitted + i32(1))));
+    current = lowest;
+    (pos : i32) = i32(0);
+    while (pos < total), (pos = (pos + i32(1))), {
+      (c : i32) = points.get(usize(pos)).unwrap();
+      if((c < current), {
+        pending = (pending + i32(1));
+      });
+      if((c == current), {
+        // Write `pending` as a variable-length integer
+        (q : i32) = pending;
+        (k : i32) = _BASE;
+        (finished : bool) = false;
+        while (!(finished)), {
+          (t : i32) = cond(
+            (k <= bias) => _TMIN,
+            (k >= (bias + _TMAX)) => _TMAX,
+            true => (k - bias)
+          );
+          if((q < t), {
+            // Final digit of this integer
+            encoded.push(_encode_digit(q));
+            finished = true;
+          }, {
+            (radix : i32) = (_BASE - t);
+            (rest : i32) = (q - t);
+            encoded.push(_encode_digit((t + (rest % radix))));
+            q = (rest / radix);
+            k = (k + _BASE);
+          });
+        };
+        bias = _adapt(pending, (emitted + i32(1)), (emitted == num_basic));
+        pending = i32(0);
+        emitted = (emitted + i32(1));
+      });
+    };
+    pending = (pending + i32(1));
+    current = (current + i32(1));
+  };
+  String.from_bytes(encoded)
+});
+// Convert an IDN hostname to Unicode display form.
+// The hostname is split on '.', every label whose lowercased form starts
+// with `xn--` is punycode-decoded, and the labels are joined with '.' again.
+// A label that fails to decode is kept exactly as it was, prefix included.
+to_unicode :: (fn(hostname: String) -> String)({
+  (labels : ArrayList(String)) = hostname.split(`.`);
+  (joined : String) = ``;
+  (li : usize) = usize(0);
+  while (li < labels.len()), (li = (li + usize(1))), {
+    (label : String) = labels.get(li).unwrap();
+    // The prefix test ignores case; the payload is taken from the original label
+    (is_ace : bool) = label.to_lowercase().starts_with(`xn--`);
+    (shown : String) = cond(
+      is_ace => {
+        (payload : String) = label.substring(usize(4), label.len());
+        match(punycode_decode(payload),
+          .Some(decoded) => decoded,
+          .None => label
+        )
+      },
+      true => label
+    );
+    // Every label after the first is preceded by a dot
+    (sep : String) = cond(
+      (li > usize(0)) => `.`,
+      true => ``
+    );
+    joined = `${joined}${sep}${shown}`;
+  };
+  joined
+});
+// Convert a Unicode hostname to ASCII punycode form.
+// The hostname is split on '.'; a label containing any byte >= 0x80 is
+// replaced by `xn--` followed by its punycode encoding, all other labels are
+// copied unchanged, and the labels are joined with '.' again.
+to_ascii :: (fn(hostname: String) -> String)({
+  (labels : ArrayList(String)) = hostname.split(`.`);
+  (joined : String) = ``;
+  (li : usize) = usize(0);
+  while (li < labels.len()), (li = (li + usize(1))), {
+    (label : String) = labels.get(li).unwrap();
+    // Scan the label's bytes; one non-ASCII byte is enough to decide
+    (raw : ArrayList(u8)) = label.as_bytes();
+    (needs_encoding : bool) = false;
+    (bi : usize) = usize(0);
+    while ((bi < raw.len()) && (!(needs_encoding))), {
+      needs_encoding = (i32(raw.get(bi).unwrap()) >= i32(0x80));
+      bi = (bi + usize(1));
+    };
+    (converted : String) = cond(
+      needs_encoding => {
+        (encoded : String) = punycode_encode(label);
+        `xn--${encoded}`
+      },
+      true => label
+    );
+    // Every label after the first is preceded by a dot
+    (sep : String) = cond(
+      (li > usize(0)) => `.`,
+      true => ``
+    );
+    joined = `${joined}${sep}${converted}`;
+  };
+  joined
+});
+export punycode_decode, punycode_encode, to_unicode, to_ascii;

package/std/encoding/toml.yo CHANGED Viewed

@@ -54,7 +54,7 @@ impl(TomlValue,
         while (i < len), (i = (i + usize(1))), {
           cond(
             (keys.get(i).unwrap() == key) => {
-              values.set(i, value);
+              &(values(i)).* = value;
               found = true;
             },
             true => ()

package/std/fmt/to_string.yo CHANGED Viewed

@@ -203,24 +203,25 @@ impl(rune, ToString(
     // 0x80-0x7FF: 2 bytes
     // 0x800-0xFFFF: 3 bytes (excluding surrogates 0xD800-0xDFFF)
     // 0x10000-0x10FFFF: 4 bytes
+    // Use 5-byte buffer to always have space for null terminator
     buffer := cond(
       (code <= 0x7F) => {
         // 1-byte encoding: 0xxxxxxx
-        arr := Array(u8, usize(4)).fill(0);
+        arr := Array(u8, usize(5)).fill(0);
         arr(0) = u8(code);
         arr
       },
       (code <= 0x7FF) => {
         // 2-byte encoding: 110xxxxx 10xxxxxx
-        arr := Array(u8, usize(4)).fill(0);
+        arr := Array(u8, usize(5)).fill(0);
         arr(0) = u8(u32(0xC0) | ((code >> 6) & 0x1F));
         arr(1) = u8(u32(0x80) | (code & 0x3F));
         arr
       },
       (code <= 0xFFFF) => {
         // 3-byte encoding: 1110xxxx 10xxxxxx 10xxxxxx
-        arr := Array(u8, usize(4)).fill(0);
+        arr := Array(u8, usize(5)).fill(0);
         arr(0) = u8(u32(0xE0) | ((code >> 12) & 0x0F));
         arr(1) = u8(u32(0x80) | ((code >> 6) & 0x3F));
         arr(2) = u8(u32(0x80) | (code & 0x3F));
@@ -228,7 +229,7 @@ impl(rune, ToString(
       },
       true => {
         // 4-byte encoding: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
-        arr := Array(u8, usize(4)).fill(0);
+        arr := Array(u8, usize(5)).fill(0);
         arr(0) = u8(u32(0xF0) | ((code >> 18) & 0x07));
         arr(1) = u8(u32(0x80) | ((code >> 12) & 0x3F));
         arr(2) = u8(u32(0x80) | ((code >> 6) & 0x3F));

package/std/glob/index.yo CHANGED Viewed

@@ -187,7 +187,7 @@ _glob_match_impl :: (fn(pb: ArrayList(u8), pi: usize, tb: ArrayList(u8), ti: usi
 });
 glob_match :: (fn(pattern: String, text: String) -> bool)(
-  _glob_match_impl(pattern._bytes, usize(0), text._bytes, usize(0))
+  _glob_match_impl(pattern.as_bytes(), usize(0), text.as_bytes(), usize(0))
 );
 GlobPattern :: object(
@@ -199,7 +199,7 @@ impl(GlobPattern,
     Self(_pattern: pattern)
   ),
   matches : (fn(self: Self, text: String) -> bool)(
-    _glob_match_impl(self._pattern._bytes, usize(0), text._bytes, usize(0))
+    _glob_match_impl(self._pattern.as_bytes(), usize(0), text.as_bytes(), usize(0))
   )
 );

package/std/libc/wctype.yo ADDED Viewed

@@ -0,0 +1,55 @@
+// C11 wctype.h - Wide character classification and conversion functions
+// Provides functions to test and convert wide character types
+{ wint_t } :: import "./stdint";
+// Bindings for the functions declared in the C header <wctype.h>.
+// Each entry gives the Yo-side signature of the C function of the same name.
+// Per the C standard, the isw* predicates return nonzero when the wide
+// character belongs to the named class in the current locale and zero
+// otherwise; the tow* functions return the converted character, or the
+// argument unchanged when no conversion applies.
+c_include "<wctype.h>",
+  // Wide character classification functions
+  // Alphabetic or decimal digit
+  iswalnum :
+    fn(wc : wint_t) -> int,
+  // Alphabetic
+  iswalpha :
+    fn(wc : wint_t) -> int,
+  // Blank (word-separating whitespace such as space and tab)
+  iswblank :
+    fn(wc : wint_t) -> int,
+  // Control character
+  iswcntrl :
+    fn(wc : wint_t) -> int,
+  // Decimal digit
+  iswdigit :
+    fn(wc : wint_t) -> int,
+  // Has a graphical representation (printable and not whitespace)
+  iswgraph :
+    fn(wc : wint_t) -> int,
+  // Lowercase letter
+  iswlower :
+    fn(wc : wint_t) -> int,
+  // Printable, including space
+  iswprint :
+    fn(wc : wint_t) -> int,
+  // Punctuation
+  iswpunct :
+    fn(wc : wint_t) -> int,
+  // Whitespace
+  iswspace :
+    fn(wc : wint_t) -> int,
+  // Uppercase letter
+  iswupper :
+    fn(wc : wint_t) -> int,
+  // Hexadecimal digit
+  iswxdigit :
+    fn(wc : wint_t) -> int,
+  // Wide character conversion functions
+  // Lowercase counterpart of wc
+  towlower :
+    fn(wc : wint_t) -> wint_t,
+  // Uppercase counterpart of wc
+  towupper :
+    fn(wc : wint_t) -> wint_t
+;
+export
+  iswalnum,
+  iswalpha,
+  iswblank,
+  iswcntrl,
+  iswdigit,
+  iswgraph,
+  iswlower,
+  iswprint,
+  iswpunct,
+  iswspace,
+  iswupper,
+  iswxdigit,
+  towlower,
+  towupper
+;

package/std/path.yo CHANGED Viewed

@@ -67,7 +67,7 @@ impl(Path,
     // Check if path is absolute
     // Unix: starts with '/'
     // Windows: starts with drive letter like 'C:' or UNC path '\\'
-    bytes := normalized._bytes;
+    bytes := normalized.as_bytes();
     cond(
       (bytes.len() > usize(0)) => {
         first_byte := bytes.get(usize(0));
@@ -128,7 +128,7 @@ impl(Path,
             true => {
               // Check if it's "." (current directory)
               is_dot := ((part.len() == usize(1)) && {
-                byte_opt := part._bytes.get(usize(0));
+                byte_opt := part.as_bytes().get(usize(0));
                 match(byte_opt,
                   .Some(b) => (b == u8(46)),
                   .None => false
@@ -137,8 +137,8 @@ impl(Path,
               // Check if it's ".." (parent directory)
               is_dotdot := ((part.len() == usize(2)) && {
-                b0_opt := part._bytes.get(usize(0));
-                b1_opt := part._bytes.get(usize(1));
+                b0_opt := part.as_bytes().get(usize(0));
+                b1_opt := part.as_bytes().get(usize(1));
                 match(b0_opt,
                   .Some(b0) => match(b1_opt,
                     .Some(b1) => ((b0 == u8(46)) && (b1 == u8(46))),
@@ -605,8 +605,8 @@ impl(Path, ToString(
             // Check if it's a drive letter like "C:"
             cond(
               (first_seg.len() == usize(2)) => {
-                b0_opt := first_seg._bytes.get(usize(0));
-                b1_opt := first_seg._bytes.get(usize(1));
+                b0_opt := first_seg.as_bytes().get(usize(0));
+                b1_opt := first_seg.as_bytes().get(usize(1));
                 match(b0_opt,
                   .Some(b0) => match(b1_opt,
                     .Some(b1) => {