AsmIntGen: Support [pb, pc, field] three-operand memory access

Teach the DSL and both arch backends to handle memory operands of
the form [pb, pc, field_ref], meaning base + index + field_offset.

On aarch64, since x21 already caches pb + pc (the instruction
pointer), this emits a single `ldr dst, [x21, #offset]` instead of
the previous `mov t0, x21` + `ldr dst, [t0, #offset]` two-instruction
sequence.

On x86_64, this emits `[r14 + r13 + offset]`, which is natively
supported by x86 addressing modes.

Convert all `lea t0, [pb, pc]` + `loadNN tX, [t0, field]` pairs in
the DSL to the new single-instruction form, saving one instruction
per IC access and per other field load in the GetById, PutById,
GetLength, GetGlobal, SetGlobal, and CallBuiltin handlers.
This commit is contained in:
Andreas Kling
2026-03-07 23:01:21 +01:00
committed by Andreas Kling
parent 54a1a66112
commit 368efef620
Notes: github-actions[bot] 2026-03-08 09:28:09 +00:00
3 changed files with 107 additions and 33 deletions

View File

@@ -316,8 +316,7 @@ end
# Dispatch using the instruction's m_length field (for variable-length instructions).
macro dispatch_callbuiltin_size()
lea t0, [pb, pc]
load32 t0, [t0, m_length]
load32 t0, [pb, pc, m_length]
dispatch_variable t0
end
@@ -1422,8 +1421,7 @@ handler GetById
# Load Object.m_shape
load64 t4, [t3, OBJECT_SHAPE]
# Get PropertyLookupCache* (direct pointer from instruction stream)
lea t0, [pb, pc]
load64 t5, [t0, m_cache]
load64 t5, [pb, pc, m_cache]
# Check entry[0].shape matches Object's shape (direct pointer compare)
load64 t0, [t5, PROPERTY_LOOKUP_CACHE_ENTRY0_SHAPE]
branch_ne t0, t4, .try_cache
@@ -1484,8 +1482,7 @@ handler PutById
# Load Object.m_shape
load64 t4, [t3, OBJECT_SHAPE]
# Get PropertyLookupCache* (direct pointer from instruction stream)
lea t0, [pb, pc]
load64 t5, [t0, m_cache]
load64 t5, [pb, pc, m_cache]
# Check entry[0].shape matches Object's shape (direct pointer compare)
load64 t0, [t5, PROPERTY_LOOKUP_CACHE_ENTRY0_SHAPE]
branch_ne t0, t4, .try_cache
@@ -1679,8 +1676,7 @@ handler GetLength
branch_bits_set t0, OBJECT_FLAG_HAS_MAGICAL_LENGTH, .magical_length
# Non-magical length: IC fast path (same as GetById)
load64 t4, [t3, OBJECT_SHAPE]
lea t0, [pb, pc]
load64 t5, [t0, m_cache]
load64 t5, [pb, pc, m_cache]
# Check entry[0].shape matches (direct pointer compare)
load64 t0, [t5, PROPERTY_LOOKUP_CACHE_ENTRY0_SHAPE]
branch_ne t0, t4, .slow
@@ -1733,8 +1729,7 @@ handler GetGlobal
load64 t1, [exec_ctx, EXECUTION_CONTEXT_GLOBAL_DECLARATIVE_ENVIRONMENT]
load64 t2, [exec_ctx, EXECUTION_CONTEXT_GLOBAL_OBJECT]
# Get GlobalVariableCache* (direct pointer from instruction stream)
lea t0, [pb, pc]
load64 t3, [t0, m_cache]
load64 t3, [pb, pc, m_cache]
# Check environment_serial_number matches
load64 t0, [t3, GLOBAL_VARIABLE_CACHE_ENVIRONMENT_SERIAL]
load64 t4, [t1, DECLARATIVE_ENVIRONMENT_SERIAL]
@@ -1791,8 +1786,7 @@ handler SetGlobal
load64 t1, [exec_ctx, EXECUTION_CONTEXT_GLOBAL_DECLARATIVE_ENVIRONMENT]
load64 t2, [exec_ctx, EXECUTION_CONTEXT_GLOBAL_OBJECT]
# Get GlobalVariableCache* (direct pointer from instruction stream)
lea t0, [pb, pc]
load64 t3, [t0, m_cache]
load64 t3, [pb, pc, m_cache]
# Check environment_serial_number matches
load64 t0, [t3, GLOBAL_VARIABLE_CACHE_ENVIRONMENT_SERIAL]
load64 t4, [t1, DECLARATIVE_ENVIRONMENT_SERIAL]
@@ -1879,8 +1873,7 @@ handler CallBuiltin
branch_zero t3, .slow
# Compare FunctionObject::m_builtin value with instruction's m_builtin
load8 t3, [t2, FUNCTION_OBJECT_BUILTIN_VALUE]
lea t0, [pb, pc]
load8 t4, [t0, m_builtin]
load8 t4, [pb, pc, m_builtin]
branch_ne t3, t4, .slow
# Callee validated. Now dispatch on the builtin enum (already in t4).
branch_eq t4, BUILTIN_MATH_ABS, .math_abs