dotnet · kg · Dec 8, 2025 · Dec 8, 2025 · Dec 8, 2025 · Dec 8, 2025
diff --git a/src/coreclr/jit/codegenwasm.cpp b/src/coreclr/jit/codegenwasm.cpp
@@ -275,6 +275,10 @@ void CodeGen::genCodeForTreeNode(GenTree* treeNode)
             genCodeForConstant(treeNode);
             break;
 
+        case GT_CAST:
+            genCodeForCast(treeNode->AsOp());
+            break;
+
         default:
 #ifdef DEBUG
             NYIRAW(GenTree::OpName(treeNode->OperGet()));
@@ -373,22 +377,82 @@ static constexpr uint32_t PackOperAndType(genTreeOps oper, var_types type)
     {
         type = TYP_I_IMPL;
     }
-    static_assert((ssize_t)GT_COUNT > (ssize_t)TYP_COUNT);
-    return ((uint32_t)oper << (ConstLog2<GT_COUNT>::value + 1)) | ((uint32_t)type);
+    const int shift1 = ConstLog2<TYP_COUNT>::value + 1;
+    return ((uint32_t)oper << shift1) | ((uint32_t)type);
 }
 
 //------------------------------------------------------------------------
-// PackOperAndType: Pack a GenTreeOp* into a uint32_t
+// PackOperAndType: Pack a genTreeOps and two var_types into a uint32_t
 //
 // Arguments:
-//    treeNode - a GenTreeOp to extract oper and type from
+//    oper - a genTreeOps to pack
+//    toType - a var_types to pack
+//    fromType - a var_types to pack
 //
 // Return Value:
-//    the node's oper and type packed into an integer that can be used as a switch value
+//    oper and the types packed into an integer that can be used as a switch value/case
 //
-static uint32_t PackOperAndType(GenTreeOp* treeNode)
+static constexpr uint32_t PackOperAndType(genTreeOps oper, var_types toType, var_types fromType)
 {
-    return PackOperAndType(treeNode->OperGet(), treeNode->TypeGet());
+    if (fromType == TYP_BYREF)
+    {
+        fromType = TYP_I_IMPL;
+    }
+    if (toType == TYP_BYREF)
+    {
+        toType = TYP_I_IMPL;
+    }
+    const int shift1 = ConstLog2<TYP_COUNT>::value + 1;
+    const int shift2 = shift1 + ConstLog2<GT_COUNT>::value + 1;
+    return ((uint32_t)oper << shift1) | ((uint32_t)fromType) | ((uint32_t)toType << shift2);
+}
+
+//------------------------------------------------------------------------
+// genCodeForCast: Generate code for a cast (GT_CAST) node
+//
+// Arguments:
+//    tree - The cast node for which we are generating code.
+//
+void CodeGen::genCodeForCast(GenTreeOp* tree)
+{
+    genConsumeOperands(tree);
+
+    instruction ins;
+    switch (PackOperAndType(tree->OperGet(), /* toType */ tree->TypeGet(), /* fromType */ tree->gtOp1->TypeGet()))
+    {
+        // NOTE: For this, RyuJIT seems to just generate an i32 load of the i64 operand instead of a GT_CAST.
+        // I suspect once we implement use of wasm locals instead of the linear stack, GT_CAST will appear.
+        case PackOperAndType(GT_CAST, TYP_INT, TYP_LONG):
+            if (tree->gtOverflow())
+                NYI_WASM("Overflow checks");
+            ins = INS_i32_wrap_i64;
+            break;
+
+        case PackOperAndType(GT_CAST, TYP_LONG, TYP_INT):
+            // FIXME: Use extend8/extend16 as appropriate
+            ins = tree->IsUnsigned() ? INS_i64_extend_u_i32 : INS_i64_extend_s_i32;
+            break;
+
+        case PackOperAndType(GT_CAST, TYP_DOUBLE, TYP_FLOAT):
+            // NOTE: This name is wrong in the spec.
+            ins = INS_f64_promote_f32;
+            break;
+
+        case PackOperAndType(GT_CAST, TYP_FLOAT, TYP_DOUBLE):
+            ins = INS_f32_demote_f64;
+            break;
+
+            // TODO: Floating point conversions - we need to figure out where semantics require a helper and where they
+            // don't.
+
+        default:
+            ins = INS_none;
+            NYI_WASM("genCodeForCast");
+            break;
+    }
+
+    GetEmitter()->emitIns(ins);
+    genProduceReg(tree);
 }
 
 //------------------------------------------------------------------------
@@ -402,7 +466,7 @@ void CodeGen::genCodeForBinary(GenTreeOp* treeNode)
     genConsumeOperands(treeNode);
 
     instruction ins;
-    switch (PackOperAndType(treeNode))
+    switch (PackOperAndType(treeNode->OperGet(), treeNode->TypeGet()))
     {
         case PackOperAndType(GT_ADD, TYP_INT):
             if (treeNode->gtOverflow())
@@ -497,7 +561,7 @@ void CodeGen::genCodeForDivMod(GenTreeOp* treeNode)
     genConsumeOperands(treeNode);
 
     instruction ins;
-    switch (PackOperAndType(treeNode))
+    switch (PackOperAndType(treeNode->OperGet(), treeNode->TypeGet()))
     {
         case PackOperAndType(GT_DIV, TYP_INT):
             ins = INS_i32_div_s;
@@ -615,7 +679,7 @@ void CodeGen::genCodeForShift(GenTree* tree)
     // for both the shift and shiftee. So the shift may need to be extended (zero-extended) for TYP_LONG.
 
     instruction ins;
-    switch (PackOperAndType(treeNode))
+    switch (PackOperAndType(treeNode->OperGet(), treeNode->TypeGet()))
     {
         case PackOperAndType(GT_LSH, TYP_INT):
             ins = INS_i32_shl;

diff --git a/src/coreclr/jit/gentree.cpp b/src/coreclr/jit/gentree.cpp
@@ -5445,10 +5445,11 @@ unsigned Compiler::gtSetEvalOrder(GenTree* tree)
                     costEx = 1;
                     costSz = 4;
 #elif defined(TARGET_WASM)
+                    // TODO-WASM: Better estimate of costs for these opcodes. Most of them are one op on x64 but may be
+                    // multiple uops.
+                    costEx = 2;
-                    // TODO-WASM: Better estimate of costs for these opcodes. Most of them are one op on x64 but may be
-                    // multiple uops.
-                    costEx = 2;
+                    costEx = 1;
-                    // TODO-WASM: Better estimate of costs for these opcodes. Most of them are one op on x64 but may be
-                    // multiple uops.
-                    costEx = 2;
+                    costEx = 1;
                     // TODO-WASM: 1 byte opcodes except for the int->fp saturating casts which are 2 bytes.
-                    // TODO-WASM: 1 byte opcodes except for the int->fp saturating casts which are 2 bytes.
-                    // TODO-WASM: 1 byte opcodes except for the int->fp saturating casts which are 2 bytes.
-                    NYI_WASM("Cast costing");
-                    costEx = 0;
-                    costSz = 0;
+                    costSz = 1;
-                    costSz = 1;
+                    costSz = varTypeIsFloating(op1) && !varTypeIsFloating(tree) ? 2 : 1;
-                    costSz = 1;
+                    costSz = varTypeIsFloating(op1) && !varTypeIsFloating(tree) ? 2 : 1;
 #else
 #error "Unknown TARGET"
 #endif

diff --git a/src/coreclr/jit/instrswasm.h b/src/coreclr/jit/instrswasm.h
@@ -151,6 +151,39 @@ INST(f64_div,     "f64.div",     0, IF_OPCODE,  0xA3)
 INST(f64_min,     "f64.min",     0, IF_OPCODE,  0xA4)
 INST(f64_max,     "f64.max",     0, IF_OPCODE,  0xA5)
 INST(f64_copysign,"f64.copysign",0, IF_OPCODE,  0xA6)
+// Unary operations
+INST(i32_wrap_i64,   "i32.wrap_i64",   0, IF_OPCODE,  0xA7)
+INST(i32_trunc_s_f32,"i32.trunc_s_f32",0, IF_OPCODE,  0xA8)
+INST(i32_trunc_u_f32,"i32.trunc_u_f32",0, IF_OPCODE,  0xA9)
+INST(i32_trunc_s_f64,"i32.trunc_s_f64",0, IF_OPCODE,  0xAA)
+INST(i32_trunc_u_f64,"i32.trunc_u_f64",0, IF_OPCODE,  0xAB)
+INST(i64_extend_s_i32,"i64.extend_s_i32",0, IF_OPCODE,  0xAC)
+INST(i64_extend_u_i32,"i64.extend_u_i32",0, IF_OPCODE,  0xAD)
+INST(i64_trunc_s_f32,"i64.trunc_s_f32",0, IF_OPCODE,  0xAE)
+INST(i64_trunc_u_f32,"i64.trunc_u_f32",0, IF_OPCODE,  0xAF)
+INST(i64_trunc_s_f64,"i64.trunc_s_f64",0, IF_OPCODE,  0xB0)
+INST(i64_trunc_u_f64,"i64.trunc_u_f64",0, IF_OPCODE,  0xB1)
+INST(f32_convert_s_i32,"f32.convert_s_i32",0, IF_OPCODE,  0xB2)
+INST(f32_convert_u_i32,"f32.convert_u_i32",0, IF_OPCODE,  0xB3)
+INST(f32_convert_s_i64,"f32.convert_s_i64",0, IF_OPCODE,  0xB4)
+INST(f32_convert_u_i64,"f32.convert_u_i64",0, IF_OPCODE,  0xB5)
+INST(f32_demote_f64,"f32.demote_f64",0, IF_OPCODE,  0xB6)
+INST(f64_convert_s_i32,"f64.convert_s_i32",0, IF_OPCODE,  0xB7)
+INST(f64_convert_u_i32,"f64.convert_u_i32",0, IF_OPCODE,  0xB8)
+INST(f64_convert_s_i64,"f64.convert_s_i64",0, IF_OPCODE,  0xB9)
+INST(f64_convert_u_i64,"f64.convert_u_i64",0, IF_OPCODE,  0xBA)
+// NOTE: This is named f32_promote_f64 in the spec, which is wrong.
+INST(f64_promote_f32,"f64.promote_f32",0, IF_OPCODE,  0xBB)
+INST(i32_reinterpret_f32,"i32.reinterpret_f32",0, IF_OPCODE,  0xBC)
+INST(i64_reinterpret_f64,"i64.reinterpret_f64",0, IF_OPCODE,  0xBD)
+INST(f32_reinterpret_i32,"f32.reinterpret_i32",0, IF_OPCODE,  0xBE)
+INST(f64_reinterpret_i64,"f64.reinterpret_i64",0, IF_OPCODE,  0xBF)
+INST(i32_extend8_s,"i32.extend8_s",0, IF_OPCODE,  0xC0)
+INST(i32_extend16_s,"i32.extend16_s",0, IF_OPCODE,  0xC1)
+INST(i64_extend8_s,"i64.extend8_s",0, IF_OPCODE,  0xC2)
+INST(i64_extend16_s,"i64.extend16_s",0, IF_OPCODE,  0xC3)
+INST(i64_extend32_s,"i64.extend32_s",0, IF_OPCODE,  0xC4)
+
 // clang-format on
 
 #undef INST
diff --git a/src/coreclr/jit/lower.cpp b/src/coreclr/jit/lower.cpp
@@ -9680,7 +9680,7 @@ void Lowering::ContainCheckRet(GenTreeUnOp* ret)
 {
     assert(ret->OperIs(GT_RETURN, GT_SWIFT_ERROR_RET));
 
-#if !defined(TARGET_64BIT)
+#if !defined(TARGET_64BIT) && !defined(TARGET_WASM)
     if (ret->TypeIs(TYP_LONG))
     {
         GenTree* op1 = ret->AsOp()->GetReturnValue();