porffor 0.2.0-eaee2da → 0.2.0-ef043de

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52)
  1. package/LICENSE +20 -20
  2. package/README.md +159 -88
  3. package/asur/README.md +2 -0
  4. package/asur/index.js +1262 -0
  5. package/byg/index.js +237 -0
  6. package/compiler/2c.js +317 -72
  7. package/compiler/{sections.js → assemble.js} +63 -15
  8. package/compiler/builtins/annexb_string.js +72 -0
  9. package/compiler/builtins/annexb_string.ts +19 -0
  10. package/compiler/builtins/array.ts +145 -0
  11. package/compiler/builtins/base64.ts +151 -0
  12. package/compiler/builtins/crypto.ts +120 -0
  13. package/compiler/builtins/date.ts +1370 -0
  14. package/compiler/builtins/escape.ts +141 -0
  15. package/compiler/builtins/int.ts +147 -0
  16. package/compiler/builtins/number.ts +527 -0
  17. package/compiler/builtins/porffor.d.ts +42 -0
  18. package/compiler/builtins/string.ts +1055 -0
  19. package/compiler/builtins/tostring.ts +45 -0
  20. package/compiler/builtins.js +470 -269
  21. package/compiler/{codeGen.js → codegen.js} +999 -378
  22. package/compiler/embedding.js +22 -22
  23. package/compiler/encoding.js +108 -10
  24. package/compiler/generated_builtins.js +1262 -0
  25. package/compiler/index.js +36 -34
  26. package/compiler/log.js +6 -3
  27. package/compiler/opt.js +51 -36
  28. package/compiler/parse.js +35 -27
  29. package/compiler/precompile.js +123 -0
  30. package/compiler/prefs.js +26 -0
  31. package/compiler/prototype.js +13 -28
  32. package/compiler/types.js +37 -0
  33. package/compiler/wasmSpec.js +28 -8
  34. package/compiler/wrap.js +54 -46
  35. package/fib.js +7 -0
  36. package/package.json +9 -5
  37. package/porf +4 -0
  38. package/rhemyn/compile.js +5 -3
  39. package/rhemyn/parse.js +323 -320
  40. package/rhemyn/test/parse.js +58 -58
  41. package/runner/compare.js +34 -34
  42. package/runner/debug.js +122 -0
  43. package/runner/index.js +62 -10
  44. package/runner/profiler.js +102 -0
  45. package/runner/repl.js +40 -7
  46. package/runner/sizes.js +37 -37
  47. package/compiler/builtins/base64.js +0 -92
  48. package/runner/info.js +0 -89
  49. package/runner/profile.js +0 -46
  50. package/runner/results.json +0 -1
  51. package/runner/transform.js +0 -15
  52. package/util/enum.js +0 -20
package/compiler/prototype.js CHANGED
@@ -2,30 +2,16 @@ import { Opcodes, Blocktype, Valtype, ValtypeSize, PageSize } from "./wasmSpec.j
2
2
  import { number } from "./embedding.js";
3
3
  import { unsignedLEB128 } from "./encoding.js";
4
4
  import { UNDEFINED } from "./builtins.js";
5
-
6
- // todo: do not duplicate this
7
- const TYPES = {
8
- number: 0x00,
9
- boolean: 0x01,
10
- string: 0x02,
11
- undefined: 0x03,
12
- object: 0x04,
13
- function: 0x05,
14
- symbol: 0x06,
15
- bigint: 0x07,
16
-
17
- // these are not "typeof" types but tracked internally
18
- _array: 0x10,
19
- _regexp: 0x11,
20
- _bytestring: 0x12
21
- };
5
+ import Prefs from './prefs.js';
6
+ import { TYPES } from './types.js';
22
7
 
23
8
  // todo: turn these into built-ins once arrays and these become less hacky
24
9
 
25
10
  export const PrototypeFuncs = function() {
26
- const noUnlikelyChecks = process.argv.includes('-funsafe-no-unlikely-proto-checks');
27
- let zeroChecks = process.argv.find(x => x.startsWith('-funsafe-zero-proto-checks='));
28
- if (zeroChecks) zeroChecks = zeroChecks.split('=')[1].split(',').reduce((acc, x) => { acc[x.toLowerCase()] = true; return acc; }, {});
11
+ const noUnlikelyChecks = Prefs.funsafeNoUnlikelyProtoChecks;
12
+
13
+ let zeroChecks;
14
+ if (Prefs.zeroChecks) zeroChecks = Prefs.zeroChecks.split('=')[1].split(',').reduce((acc, x) => { acc[x.toLowerCase()] = true; return acc; }, {});
29
15
  else zeroChecks = {};
30
16
 
31
17
  this[TYPES._array] = {
@@ -148,7 +134,7 @@ export const PrototypeFuncs = function() {
148
134
  shift: (pointer, length) => [
149
135
  // if length == 0, noop
150
136
  ...length.getCachedI32(),
151
- Opcodes.i32_eqz,
137
+ [ Opcodes.i32_eqz ],
152
138
  [ Opcodes.if, Blocktype.void ],
153
139
  ...number(UNDEFINED),
154
140
  [ Opcodes.br, 1 ],
@@ -342,8 +328,8 @@ export const PrototypeFuncs = function() {
342
328
  ...number(0, Valtype.i32), // base 0 for store later
343
329
 
344
330
  ...wIndex,
345
-
346
331
  Opcodes.i32_to,
332
+
347
333
  ...number(ValtypeSize.i16, Valtype.i32),
348
334
  [ Opcodes.i32_mul ],
349
335
 
@@ -383,7 +369,7 @@ export const PrototypeFuncs = function() {
383
369
 
384
370
  ...(noUnlikelyChecks ? [] : [ [ Opcodes.i32_or ] ]),
385
371
  [ Opcodes.if, Blocktype.void ],
386
- ...number(NaN),
372
+ ...number(valtype === 'i32' ? -1 : NaN),
387
373
  [ Opcodes.br, 1 ],
388
374
  [ Opcodes.end ],
389
375
 
@@ -489,10 +475,10 @@ export const PrototypeFuncs = function() {
489
475
  this[TYPES.string].isWellFormed.local2 = Valtype.i32;
490
476
  this[TYPES.string].isWellFormed.returnType = TYPES.boolean;
491
477
 
492
- if (process.argv.includes('-bytestring')) {
478
+ if (Prefs.bytestring) {
493
479
  this[TYPES._bytestring] = {
494
480
  at: (pointer, length, wIndex, iTmp, _, arrayShell) => {
495
- const [ newOut, newPointer ] = arrayShell(1, 'i16');
481
+ const [ newOut, newPointer ] = arrayShell(1, 'i8');
496
482
 
497
483
  return [
498
484
  // setup new/out array
@@ -548,7 +534,7 @@ export const PrototypeFuncs = function() {
548
534
 
549
535
  // todo: out of bounds properly
550
536
  charAt: (pointer, length, wIndex, _1, _2, arrayShell) => {
551
- const [ newOut, newPointer ] = arrayShell(1, 'i16');
537
+ const [ newOut, newPointer ] = arrayShell(1, 'i8');
552
538
 
553
539
  return [
554
540
  // setup new/out array
@@ -558,7 +544,6 @@ export const PrototypeFuncs = function() {
558
544
  ...number(0, Valtype.i32), // base 0 for store later
559
545
 
560
546
  ...wIndex,
561
-
562
547
  Opcodes.i32_to,
563
548
 
564
549
  ...pointer,
@@ -597,7 +582,7 @@ export const PrototypeFuncs = function() {
597
582
 
598
583
  ...(noUnlikelyChecks ? [] : [ [ Opcodes.i32_or ] ]),
599
584
  [ Opcodes.if, Blocktype.void ],
600
- ...number(NaN),
585
+ ...number(valtype === 'i32' ? -1 : NaN),
601
586
  [ Opcodes.br, 1 ],
602
587
  [ Opcodes.end ],
603
588
 
package/compiler/types.js ADDED
@@ -0,0 +1,37 @@
1
+ export const TYPES = {
2
+ number: 0x00,
3
+ boolean: 0x01,
4
+ string: 0x02,
5
+ undefined: 0x03,
6
+ object: 0x04,
7
+ function: 0x05,
8
+ symbol: 0x06,
9
+ bigint: 0x07
10
+ };
11
+
12
+ export const TYPE_NAMES = {
13
+ [TYPES.number]: 'Number',
14
+ [TYPES.boolean]: 'Boolean',
15
+ [TYPES.string]: 'String',
16
+ [TYPES.undefined]: 'undefined',
17
+ [TYPES.object]: 'Object',
18
+ [TYPES.function]: 'Function',
19
+ [TYPES.symbol]: 'Symbol',
20
+ [TYPES.bigint]: 'BigInt'
21
+ };
22
+
23
+ export const INTERNAL_TYPE_BASE = 0x10;
24
+ let internalTypeIndex = INTERNAL_TYPE_BASE;
25
+ const registerInternalType = name => {
26
+ const n = internalTypeIndex++;
27
+ TYPES['_' + name.toLowerCase()] = n;
28
+ TYPE_NAMES[n] = name;
29
+ };
30
+
31
+ // note: when adding a new internal type, please also add a deserializer to wrap.js
32
+ // (it is okay to add a throw todo deserializer for wips)
33
+
34
+ registerInternalType('Array');
35
+ registerInternalType('RegExp');
36
+ registerInternalType('ByteString');
37
+ registerInternalType('Date');
package/compiler/wasmSpec.js CHANGED
@@ -1,4 +1,13 @@
1
- import { enumify } from "../util/enum.js";
1
+ const enumify = (...args) => {
2
+ const obj = {};
3
+
4
+ for (let i = 0; i < args.length; i++) {
5
+ obj[i] = args[i];
6
+ obj[args[i]] = i;
7
+ }
8
+
9
+ return obj;
10
+ };
2
11
 
3
12
  export const Section = enumify('custom', 'type', 'import', 'func', 'table', 'memory', 'global', 'export', 'start', 'element', 'code', 'data', 'data_count', 'tag');
4
13
  export const ExportDesc = enumify('func', 'table', 'mem', 'global', 'tag');
@@ -32,17 +41,16 @@ export const Opcodes = {
32
41
  throw: 0x08,
33
42
  rethrow: 0x09,
34
43
 
35
- call: 0x10,
36
- call_indirect: 0x11,
37
- return_call: 0x12,
38
- return_call_indirect: 0x13,
39
-
40
44
  end: 0x0b,
41
45
  br: 0x0c,
42
46
  br_if: 0x0d,
43
47
  br_table: 0x0e,
44
48
  return: 0x0f,
49
+
45
50
  call: 0x10,
51
+ call_indirect: 0x11,
52
+ return_call: 0x12,
53
+ return_call_indirect: 0x13,
46
54
 
47
55
  drop: 0x1a,
48
56
 
@@ -62,13 +70,22 @@ export const Opcodes = {
62
70
  i32_load16_s: 0x2e,
63
71
  i32_load16_u: 0x2f,
64
72
 
65
- i32_store8: 0x3a,
66
- i32_store16: 0x3b,
73
+ i64_load8_s: 0x30,
74
+ i64_load8_u: 0x31,
75
+ i64_load16_s: 0x32,
76
+ i64_load16_u: 0x33,
67
77
 
68
78
  i32_store: 0x36,
69
79
  i64_store: 0x37,
70
80
  f64_store: 0x39,
71
81
 
82
+ i32_store8: 0x3a,
83
+ i32_store16: 0x3b,
84
+
85
+ i64_store8: 0x3c,
86
+ i64_store16: 0x3d,
87
+
88
+ memory_size: 0x3f,
72
89
  memory_grow: 0x40,
73
90
 
74
91
  i32_const: 0x41,
@@ -100,6 +117,8 @@ export const Opcodes = {
100
117
  i32_shl: 0x74,
101
118
  i32_shr_s: 0x75,
102
119
  i32_shr_u: 0x76,
120
+ i32_rotl: 0x77,
121
+ i32_rotr: 0x78,
103
122
 
104
123
  i64_eqz: 0x50,
105
124
  i64_eq: 0x51,
@@ -123,6 +142,7 @@ export const Opcodes = {
123
142
  i64_shr_s: 0x87,
124
143
  i64_shr_u: 0x88,
125
144
  i64_rotl: 0x89,
145
+ i64_rotr: 0x8a,
126
146
 
127
147
  f64_eq: 0x61,
128
148
  f64_ne: 0x62,
package/compiler/wrap.js CHANGED
@@ -1,56 +1,56 @@
1
1
  import compile from './index.js';
2
2
  import decompile from './decompile.js';
3
3
  import { encodeVector, encodeLocal } from './encoding.js';
4
- // import fs from 'node:fs';
4
+ import Prefs from './prefs.js';
5
+ import { log } from './log.js';
6
+ import { TYPES } from './types.js';
5
7
 
6
8
  const bold = x => `\u001b[1m${x}\u001b[0m`;
7
9
 
8
- const typeBase = 0x00;
9
- const internalTypeBase = 0x10;
10
- const TYPES = {
11
- [typeBase]: 'number',
12
- [typeBase + 1]: 'boolean',
13
- [typeBase + 2]: 'string',
14
- [typeBase + 3]: 'undefined',
15
- [typeBase + 4]: 'object',
16
- [typeBase + 5]: 'function',
17
- [typeBase + 6]: 'symbol',
18
- [typeBase + 7]: 'bigint',
19
-
20
- // internal
21
- [internalTypeBase]: '_array',
22
- [internalTypeBase + 1]: '_regexp',
23
- [internalTypeBase + 2]: '_bytestring'
24
- };
25
-
26
10
  export default async (source, flags = [ 'module' ], customImports = {}, print = str => process.stdout.write(str)) => {
27
11
  const times = [];
28
12
 
29
13
  const t1 = performance.now();
30
14
  const { wasm, funcs, globals, tags, exceptions, pages, c } = compile(source, flags);
31
15
 
16
+ globalThis.porfDebugInfo = { funcs, globals };
17
+
32
18
  if (source.includes('export function')) flags.push('module');
33
19
 
34
- // fs.writeFileSync('out.wasm', Buffer.from(wasm));
20
+ // (await import('node:fs')).writeFileSync('out.wasm', Buffer.from(wasm));
35
21
 
36
22
  times.push(performance.now() - t1);
37
- if (flags.includes('info')) console.log(bold(`compiled in ${times[0].toFixed(2)}ms`));
23
+ if (Prefs.profileCompiler) console.log(bold(`compiled in ${times[0].toFixed(2)}ms`));
38
24
 
39
25
  const t2 = performance.now();
40
26
 
41
27
  let instance;
42
28
  try {
43
- 0, { instance } = await WebAssembly.instantiate(wasm, {
29
+ let wasmEngine = WebAssembly;
30
+ if (Prefs.asur) {
31
+ log.warning('wrap', 'using our !experimental! asur wasm engine instead of host to run');
32
+ wasmEngine = await import('../asur/index.js');
33
+ }
34
+
35
+ 0, { instance } = await wasmEngine.instantiate(wasm, {
44
36
  '': {
45
37
  p: valtype === 'i64' ? i => print(Number(i).toString()) : i => print(i.toString()),
46
38
  c: valtype === 'i64' ? i => print(String.fromCharCode(Number(i))) : i => print(String.fromCharCode(i)),
47
- t: _ => performance.now(),
39
+ t: () => performance.now(),
40
+ u: () => performance.timeOrigin,
41
+ y: () => {},
42
+ z: () => {},
48
43
  ...customImports
49
44
  }
50
45
  });
51
46
  } catch (e) {
52
- const funcInd = parseInt(e.message.match(/function #([0-9]+) /)[1]);
53
- const blobOffset = parseInt(e.message.split('@')[1]);
47
+ // only backtrace for runner, not test262/etc
48
+ if (!process.argv[1].includes('/runner')) throw e;
49
+
50
+ const funcInd = parseInt(e.message.match(/function #([0-9]+) /)?.[1]);
51
+ const blobOffset = parseInt(e.message.split('@')?.[1]);
52
+
53
+ if (!funcInd) throw e;
54
54
 
55
55
  // convert blob offset -> function wasm offset.
56
56
  // this is not good code and is somewhat duplicated
@@ -128,7 +128,7 @@ export default async (source, flags = [ 'module' ], customImports = {}, print =
128
128
  }
129
129
 
130
130
  times.push(performance.now() - t2);
131
- if (flags.includes('info')) console.log(`instantiated in ${times[1].toFixed(2)}ms`);
131
+ if (Prefs.profileCompiler) console.log(`instantiated in ${times[1].toFixed(2)}ms`);
132
132
 
133
133
  const exports = {};
134
134
 
@@ -156,42 +156,50 @@ export default async (source, flags = [ 'module' ], customImports = {}, print =
156
156
 
157
157
  // if (ret >= typeBase && ret <= typeBase + 8) return ret > (typeBase + 7) ? 'object' : TYPES[ret];
158
158
 
159
- switch (TYPES[type]) {
160
- case 'boolean': return Boolean(ret);
161
- case 'undefined': return undefined;
162
- case 'object': return ret === 0 ? null : {};
159
+ switch (type) {
160
+ case TYPES.boolean: return Boolean(ret);
161
+ case TYPES.undefined: return undefined;
162
+ case TYPES.object: return ret === 0 ? null : {};
163
163
 
164
- case '_array': {
164
+ case TYPES.string: {
165
165
  const pointer = ret;
166
- const length = new Int32Array(memory.buffer, pointer, 1);
166
+ const length = (new Int32Array(memory.buffer, pointer, 1))[0];
167
167
 
168
- // have to slice because of memory alignment
169
- const buf = memory.buffer.slice(pointer + 4, pointer + 4 + 8 * length);
168
+ return Array.from(new Uint16Array(memory.buffer, pointer + 4, length)).map(x => String.fromCharCode(x)).join('');
169
+ }
170
170
 
171
- return Array.from(new Float64Array(buf));
171
+ case TYPES.function: {
172
+ // wasm func index, including all imports
173
+ const func = funcs.find(x => (x.originalIndex ?? x.index) === ret);
174
+ // if (!func) return ret;
175
+ if (!func) return function () {};
176
+
177
+ // make fake empty func for repl/etc
178
+ return {[func.name]() {}}[func.name];
172
179
  }
173
180
 
174
- case 'string': {
181
+ case TYPES._array: {
175
182
  const pointer = ret;
176
- const length = new Int32Array(memory.buffer, pointer, 1);
183
+ const length = (new Int32Array(memory.buffer, pointer, 1))[0];
177
184
 
178
- return Array.from(new Uint16Array(memory.buffer, pointer + 4, length)).map(x => String.fromCharCode(x)).join('');
185
+ // have to slice because of memory alignment
186
+ const buf = memory.buffer.slice(pointer + 4, pointer + 4 + 8 * length);
187
+
188
+ return Array.from(new Float64Array(buf));
179
189
  }
180
190
 
181
- case '_bytestring': {
191
+ case TYPES._bytestring: {
182
192
  const pointer = ret;
183
- const length = new Int32Array(memory.buffer, pointer, 1);
193
+ const length = (new Int32Array(memory.buffer, pointer, 1))[0];
184
194
 
185
195
  return Array.from(new Uint8Array(memory.buffer, pointer + 4, length)).map(x => String.fromCharCode(x)).join('');
186
196
  }
187
197
 
188
- case 'function': {
189
- // wasm func index, including all imports
190
- const func = funcs.find(x => (x.originalIndex ?? x.index) === ret);
191
- if (!func) return ret;
198
+ case TYPES._date: {
199
+ const pointer = ret;
200
+ const value = (new Float64Array(memory.buffer, pointer, 1))[0];
192
201
 
193
- // make fake empty func for repl/etc
194
- return {[func.name]() {}}[func.name];
202
+ return new Date(value);
195
203
  }
196
204
 
197
205
  default: return ret;
package/fib.js ADDED
@@ -0,0 +1,7 @@
1
+ export const fib = n => {
2
+ if (n < 2) {
3
+ return n;
4
+ } else {
5
+ return fib(n - 1) + fib(n - 2);
6
+ }
7
+ };
package/package.json CHANGED
@@ -1,21 +1,25 @@
1
1
  {
2
2
  "name": "porffor",
3
3
  "description": "a basic experimental wip aot optimizing js -> wasm engine/compiler/runtime in js",
4
- "version": "0.2.0-eaee2da",
4
+ "version": "0.2.0-ef043de",
5
5
  "author": "CanadaHonk",
6
6
  "license": "MIT",
7
+ "scripts": {
8
+ "precompile": "node ./compiler/precompile.js"
9
+ },
7
10
  "dependencies": {
8
- "acorn": "^8.9.0"
11
+ "acorn": "^8.11.3",
12
+ "node-repl-polyfill": "^0.1.1"
9
13
  },
10
14
  "optionalDependencies": {
11
- "@babel/parser": "^7.23.6",
15
+ "@babel/parser": "^7.24.4",
12
16
  "hermes-parser": "^0.18.2",
13
17
  "meriyah": "^4.3.9"
14
18
  },
15
19
  "bin": {
16
20
  "porf": "./runner/index.js"
17
21
  },
18
- "main": "./runner/index.js",
22
+ "main": "./compiler/wrap.js",
19
23
  "type": "module",
20
24
  "repository": {
21
25
  "type": "git",
@@ -25,4 +29,4 @@
25
29
  "url": "https://github.com/CanadaHonk/porffor/issues"
26
30
  },
27
31
  "homepage": "https://porffor.goose.icu"
28
- }
32
+ }
package/porf ADDED
@@ -0,0 +1,4 @@
1
+ #!/bin/sh
2
+ node runner/index.js "$@"
3
+ # deno run -A runner/index.js "$@"
4
+ # bun runner/index.js "$@"
package/rhemyn/compile.js CHANGED
@@ -2,6 +2,7 @@ import { Blocktype, Opcodes, Valtype, PageSize, ValtypeSize } from '../compiler/
2
2
  import { number } from '../compiler/embedding.js';
3
3
  import { signedLEB128, unsignedLEB128 } from '../compiler/encoding.js';
4
4
  import parse from './parse.js';
5
+ import Prefs from '../compiler/prefs.js';
5
6
 
6
7
  // local indexes
7
8
  const BasePointer = 0; // base string pointer
@@ -80,7 +81,7 @@ const generate = (node, negated = false, get = true, func = 'test') => {
80
81
  })[func], Valtype.i32)
81
82
  ];
82
83
 
83
- if (globalThis.regexLog) {
84
+ if (Prefs.regexLog) {
84
85
  const underline = x => `\u001b[4m\u001b[1m${x}\u001b[0m`;
85
86
  console.log(`\n${underline('ast')}`);
86
87
  console.log(node);
@@ -159,7 +160,7 @@ const generateSet = (node, negated, get) => {
159
160
  ];
160
161
  }
161
162
 
162
- out = out.concat(new Array(node.body.length - 1).fill(negated ? [ Opcodes.i32_or ] : [ Opcodes.i32_and ]));
163
+ if (node.body.length > 0) out = out.concat(new Array(node.body.length - 1).fill(negated ? [ Opcodes.i32_or ] : [ Opcodes.i32_and ]));
163
164
 
164
165
  return [
165
166
  ...out,
@@ -187,7 +188,8 @@ const generateRange = (node, negated, get) => {
187
188
  };
188
189
 
189
190
  const generateGroup = (node, negated, get) => {
190
-
191
+ // todo
192
+ return [];
191
193
  };
192
194
 
193
195
  export const test = (regex, index = 0, name = 'regex_test_' + regex) => outputFunc(generate(parse(regex), false, true, 'test'), name, index);