dotnet · kg · May 22, 2025 · May 29, 2025 · May 29, 2025 · jkotas
@@ -3026,36 +3026,53 @@ int InterpCompiler::GenerateCode(CORINFO_METHOD_INFO* methodInfo)
                 m_compHnd->getMethodSig(ctorMethod, &ctorSignature);
                 ctorClass = m_compHnd->getMethodClass(ctorMethod);
                 int32_t numArgs = ctorSignature.numArgs;
+                bool isStringOrArray = m_compHnd->getClassAttribs(ctorClass) & CORINFO_FLG_VAROBJSIZE;
+                int32_t numExtraArgs = isStringOrArray ? 1 : 2;
+                int32_t callArgOffset = isStringOrArray ? 0 : 1;
 
-                // TODO Special case array ctor / string ctor
                 m_pStackPointer -= numArgs;
 
                 // Allocate callArgs for the call: `this` (omitted for string/array ctors) + numArgs + terminator
-                int32_t *callArgs = (int32_t*) AllocMemPool((numArgs + 2) * sizeof(int32_t));
+                int32_t *callArgs = (int32_t*) AllocMemPool((numArgs + numExtraArgs) * sizeof(int32_t));
                 for (int i = 0; i < numArgs; i++)
-                    callArgs[i + 1] = m_pStackPointer[i].var;
-                callArgs[numArgs + 1] = -1;
+                    callArgs[i + callArgOffset] = m_pStackPointer[i].var;
+                callArgs[numArgs + callArgOffset] = -1;
 
                 // Push the return value and, unless this is a string/array ctor, the `this` argument to the ctor
                 InterpType retType = GetInterpType(m_compHnd->asCorInfoType(ctorClass));
-                int32_t vtsize = 0;
-                if (retType == InterpTypeVT)
+                int32_t vtsize = 0, dVar, thisVar;
+                if (isStringOrArray)
+                {
+                    // result
+                    PushInterpType(retType, ctorClass);
+                    dVar = m_pStackPointer[-1].var;
+                    thisVar = -1;
+                }
+                else if (retType == InterpTypeVT)
                 {
                     vtsize = m_compHnd->getClassSize(ctorClass);
                     PushTypeVT(ctorClass, vtsize);
                     PushInterpType(InterpTypeByRef, NULL);
+                    dVar = m_pStackPointer[-2].var;
+                    thisVar = m_pStackPointer[-1].var;
                 }
                 else
                 {
+                    // result
                     PushInterpType(retType, ctorClass);
+                    // this-ref
                     PushInterpType(retType, ctorClass);
+                    dVar = m_pStackPointer[-2].var;
+                    thisVar = m_pStackPointer[-1].var;
+                }
+
+                if (!isStringOrArray)
+                {
+                    // Consider this arg as being defined, although newobj defines it
+                    AddIns(INTOP_DEF);
+                    m_pLastNewIns->SetDVar(thisVar);
+                    callArgs[0] = thisVar;
                 }
-                int32_t dVar = m_pStackPointer[-2].var;
-                int32_t thisVar = m_pStackPointer[-1].var;
-                // Consider this arg as being defined, although newobj defines it
-                AddIns(INTOP_DEF);
-                m_pLastNewIns->SetDVar(thisVar);
-                callArgs[0] = thisVar;
 
                 if (retType == InterpTypeVT)
                 {
@@ -3064,9 +3081,10 @@ int InterpCompiler::GenerateCode(CORINFO_METHOD_INFO* methodInfo)
                 }
                 else
                 {
-                    AddIns(INTOP_NEWOBJ);
+                    AddIns(isStringOrArray ? INTOP_NEWOBJ_VAROBJSIZE : INTOP_NEWOBJ);
                     m_pLastNewIns->data[1] = GetDataItemIndex(ctorClass);
                 }
+
                 m_pLastNewIns->data[0] = GetMethodDataItemIndex(ctorMethod);
                 m_pLastNewIns->SetSVar(CALL_ARGS_SVAR);
                 m_pLastNewIns->SetDVar(dVar);
@@ -3076,7 +3094,8 @@ int InterpCompiler::GenerateCode(CORINFO_METHOD_INFO* methodInfo)
                 m_pLastNewIns->info.pCallInfo->pCallArgs = callArgs;
 
                 // Pop `this` if it was pushed; the result of the newobj still remains on the stack
-                m_pStackPointer--;
+                if (!isStringOrArray)
+                    m_pStackPointer--;
                 break;
             }
             case CEE_DUP:

@@ -281,6 +281,7 @@ OPDEF(INTOP_CALL, "call", 4, 1, 1, InterpOpMethodHandle)
 OPDEF(INTOP_CALLVIRT, "callvirt", 4, 1, 1, InterpOpMethodHandle)
 OPDEF(INTOP_NEWOBJ, "newobj", 5, 1, 1, InterpOpMethodHandle)
 OPDEF(INTOP_NEWOBJ_VT, "newobj.vt", 5, 1, 1, InterpOpMethodHandle)
+OPDEF(INTOP_NEWOBJ_VAROBJSIZE, "newobj.varobjsize", 5, 1, 1, InterpOpMethodHandle)
 
 OPDEF(INTOP_CALL_HELPER_PP, "call.helper.pp", 5, 1, 0, InterpOpThreeInts)
 

diff --git a/src/coreclr/vm/callstubgenerator.cpp b/src/coreclr/vm/callstubgenerator.cpp
@@ -548,6 +548,14 @@ CallStubHeader *CallStubGenerator::GenerateCallStub(MethodDesc *pMD, AllocMemTra
     _ASSERTE(pMD != NULL);
 
     MetaSig sig(pMD);
+
+    // Classes like System.String have special constructors that are fcalls. When invoking these, we need to override
+    //  HasThis (there's no thisref) and the return type (the return value is the new instance, not void).
+    bool isSpecialConstructor = sig.HasThis() && (pMD->GetMethodTable() == g_pStringClass) && pMD->IsCtor();
+
+    if (isSpecialConstructor)
+        sig.ClearHasThis();
+
     ArgIterator argIt(&sig);
 
     m_r1 = NoRange; // indicates that there is no active range of general purpose registers
@@ -679,6 +687,12 @@ CallStubHeader *CallStubGenerator::GenerateCallStub(MethodDesc *pMD, AllocMemTra
     {
         TypeHandle thReturnValueType;
         CorElementType thReturnType = sig.GetReturnTypeNormalized(&thReturnValueType);
+        if (isSpecialConstructor)
+        {
+            assert(thReturnType == ELEMENT_TYPE_VOID);
+            // FIXME: String?
+            thReturnType = ELEMENT_TYPE_CLASS;
+        }
 
         switch (thReturnType)
         {

@@ -8,7 +8,7 @@
 #include "interpexec.h"
 #include "callstubgenerator.h"
 
-void InvokeCompiledMethod(MethodDesc *pMD, int8_t *pArgs, int8_t *pRet)
+void InvokeCompiledMethod(MethodDesc *pMD, int8_t *pArgs, int8_t *pRet, PCODE pCode)
 {
     CONTRACTL
     {
@@ -41,7 +41,7 @@ void InvokeCompiledMethod(MethodDesc *pMD, int8_t *pArgs, int8_t *pRet)
         }
     }
 
-    pHeader->SetTarget(pMD->GetNativeCode()); // The method to call
+    pHeader->SetTarget(pCode); // The method to call
 
     pHeader->Invoke(pHeader->Routines, pArgs, pRet, pHeader->TotalStackSize);
 }
@@ -1151,7 +1151,7 @@ void InterpExecMethod(InterpreterFrame *pInterpreterFrame, InterpMethodContextFr
                     else if (codeInfo.GetCodeManager() != ExecutionManager::GetInterpreterCodeManager())
                     {
                         MethodDesc *pMD = codeInfo.GetMethodDesc();
-                        InvokeCompiledMethod(pMD, stack + callArgsOffset, stack + returnOffset);
+                        InvokeCompiledMethod(pMD, stack + callArgsOffset, stack + returnOffset, pMD->GetNativeCode());
                         break;
                     }
 
@@ -1213,6 +1213,28 @@ void InterpExecMethod(InterpreterFrame *pInterpreterFrame, InterpMethodContextFr
                     ip += 5;
                     goto CALL_INTERP_SLOT;
                 }
+                case INTOP_NEWOBJ_VAROBJSIZE:
 public extern String(char c, int count); 
+                {
+                    returnOffset = ip[1];
+                    callArgsOffset = ip[2];
+                    methodSlot = ip[3];
+
+                    size_t targetMethod = (size_t)pMethod->pDataItems[methodSlot];
+                    assert(targetMethod & INTERP_METHOD_HANDLE_TAG);
+                    MethodDesc *pMD = (MethodDesc*)(targetMethod & ~INTERP_METHOD_HANDLE_TAG);
+
+                    // If we are constructing a type with a component size (i.e. a string) its constructor is a special
+                    //  fcall that is basically a static method that returns the new instance.
+                    // Get the address of the fcall that implements the ctor
+                    PCODE code = pMD->TryGetMultiCallableAddrOfCode(CORINFO_ACCESS_ANY);
+                    assert(code);
+
+                    // callArgsOffset points to the ctor arguments, which are what the fcall expects.
+                    // returnOffset points to where the new instance goes, and the fcall will write it there.
+                    InvokeCompiledMethod(pMD, stack + callArgsOffset, stack + returnOffset, code);
+                    ip += 5;
+                    break;
+                }
                 case INTOP_ZEROBLK_IMM:
                     memset(LOCAL_VAR(ip[1], void*), 0, ip[2]);
                     ip += 3;

diff --git a/src/tests/JIT/interpreter/Interpreter.cs b/src/tests/JIT/interpreter/Interpreter.cs
@@ -413,6 +413,9 @@ public static void RunInterpreterTests()
         if (!TestBoxing())
             Environment.FailFast(null);
 
+        if (!TestStringCtor())
+            Environment.FailFast(null);
+
         if (!TestArray())
             Environment.FailFast(null);
 
@@ -708,6 +711,18 @@ public static bool TestBoxing()
         return result == 3;
     }
 
+    // Constructs a string through the String(char, int) constructor and verifies the result.
+    // Returns true only if the length, the first character, and the full contents all match
+    // the expected value "aaaa"; returns false on the first mismatch.
+    public static bool TestStringCtor()
+    {
+        string s = new string('a', 4);
+        // The length must equal the requested repeat count.
+        if (s.Length != 4)
+            return false;
+        // The first character must be the requested fill character.
+        if (s[0] != 'a')
+            return false;
+        // The whole string must compare equal to the expected literal.
+        if (s != "aaaa")
+            return false;
+        return true;
+    }
+
     [MethodImpl(MethodImplOptions.NoInlining | MethodImplOptions.NoOptimization)]
     static object BoxedSubtraction (object lhs, object rhs) {
         return (int)lhs - (int)rhs;