RPCS3 · AniLeo · Jul 30, 2020 · Jul 29, 2020 · Jul 29, 2020 · Jul 30, 2020
diff --git a/rpcs3/Emu/CPU/CPUTranslator.cpp b/rpcs3/Emu/CPU/CPUTranslator.cpp
@@ -83,12 +83,31 @@ llvm::Value* cpu_translator::bitcast(llvm::Value* val, llvm::Type* type)
 }
 
 template <>
-v128 cpu_translator::get_const_vector<v128>(llvm::Constant* c, u32 a, u32 b)
+std::pair<bool, v128> cpu_translator::get_const_vector<v128>(llvm::Value* c, u32 a, u32 b)
 {
+	v128 result{};
+
+	if (!llvm::isa<llvm::Constant>(c))
+	{
+		return {false, result};
+	}
+
 	const auto t = c->getType();
 
 	if (!t->isVectorTy())
 	{
+		if (const auto ci = llvm::dyn_cast<llvm::ConstantInt>(c); ci && ci->getBitWidth() == 128)
+		{
+			auto cv = ci->getValue();
+
+			for (int i = 0; i < 128; i++)
+			{
+				result._bit[i] = cv[i];
+			}
+
+			return {true, result};
+		}
+
 		fmt::throw_exception("[0x%x, %u] Not a vector" HERE, a, b);
 	}
 
@@ -106,13 +125,17 @@ v128 cpu_translator::get_const_vector<v128>(llvm::Constant* c, u32 a, u32 b)
 			return {};
 		}
 
+		if (llvm::isa<llvm::ConstantExpr>(c))
+		{
+			// Sorry, if we cannot evaluate it we cannot use it
+			fmt::throw_exception("[0x%x, %u] Constant Expression!" HERE, a, b);
+		}
+
 		fmt::throw_exception("[0x%x, %u] Unexpected constant type" HERE, a, b);
 	}
 
 	const auto sct = t->getScalarType();
 
-	v128 result;
-
 	if (sct->isIntegerTy(8))
 	{
 		for (u32 i = 0; i < 16; i++)
@@ -160,12 +183,17 @@ v128 cpu_translator::get_const_vector<v128>(llvm::Constant* c, u32 a, u32 b)
 		fmt::throw_exception("[0x%x, %u] Unexpected vector element type" HERE, a, b);
 	}
 
-	return result;
+	return {true, result};
 }
 
 template <>
 llvm::Constant* cpu_translator::make_const_vector<v128>(v128 v, llvm::Type* t)
 {
+	if (const auto ct = llvm::dyn_cast<llvm::IntegerType>(t); ct && ct->getBitWidth() == 128)
+	{
+		return llvm::ConstantInt::get(t, llvm::APInt(128, llvm::makeArrayRef(reinterpret_cast<const u64*>(v._bytes), 2)));
+	}
+
 	verify(HERE), t->isVectorTy() && llvm::cast<llvm::VectorType>(t)->getBitWidth() == 128;
 
 	const auto sct = t->getScalarType();

diff --git a/rpcs3/Emu/CPU/CPUTranslator.h b/rpcs3/Emu/CPU/CPUTranslator.h
@@ -2837,7 +2837,7 @@ class cpu_translator
 	}
 
 	template <typename R = v128>
-	R get_const_vector(llvm::Constant*, u32 a, u32 b);
+	std::pair<bool, R> get_const_vector(llvm::Value*, u32 a, u32 b);
 
 	template <typename T = v128>
 	llvm::Constant* make_const_vector(T, llvm::Type*);

diff --git a/rpcs3/Emu/Cell/PPUTranslator.cpp b/rpcs3/Emu/Cell/PPUTranslator.cpp
@@ -129,9 +129,8 @@ PPUTranslator::PPUTranslator(LLVMContext& context, Module* _module, const ppu_mo
 		m_reloc = &m_info.segs[0];
 	}
 
-	const auto nan_u32 = ConstantInt::get(get_type<u32>(), 0x7FC00000u);
-	const auto nan_f32 = ConstantExpr::getBitCast(nan_u32, get_type<f32>());
-	nan_vec4 = ConstantVector::getSplat(4, nan_f32);
+	const auto nan_v = v128::from32p(0x7FC00000u);
+	nan_vec4 = make_const_vector(nan_v, get_type<f32[4]>());
 }
 
 PPUTranslator::~PPUTranslator()
@@ -236,13 +235,13 @@ Value* PPUTranslator::VecHandleNan(Value* val)
 Value* PPUTranslator::VecHandleDenormal(Value* val)
 {
 	const auto type = val->getType();
-	const auto value = type == GetType<u32[4]>() ? val : m_ir->CreateBitCast(val, GetType<u32[4]>());
+	const auto value = bitcast(val, GetType<u32[4]>());
 
 	const auto mask = SExt(m_ir->CreateICmpEQ(m_ir->CreateAnd(value, Broadcast(RegLoad(m_jm_mask), 4)), ConstantVector::getSplat(4, m_ir->getInt32(0))), GetType<s32[4]>());
 	const auto nz = m_ir->CreateLShr(mask, 1);
 	const auto result = m_ir->CreateAnd(m_ir->CreateNot(nz), value);
 
-	return type == GetType<u32[4]>() ? result : m_ir->CreateBitCast(result, type);
+	return bitcast(result, type);
 }
 
 Value* PPUTranslator::VecHandleResult(Value* val)
@@ -398,7 +397,7 @@ void PPUTranslator::FlushRegisters()
 				m_ir->SetInsertPoint(block);
 			}
 
-			m_ir->CreateStore(local, m_ir->CreateBitCast(m_globals[index], local->getType()->getPointerTo()));
+			m_ir->CreateStore(local, bitcast(m_globals[index], local->getType()->getPointerTo()));
 			m_globals[index] = nullptr;
 		}
 	}
@@ -414,20 +413,20 @@ Value* PPUTranslator::Solid(Value* value)
 
 	if (value->getType() == GetType<bool[4]>())
 	{
-		return m_ir->CreateBitCast(SExt(value, GetType<u32[4]>()), m_ir->getIntNTy(128));
+		return bitcast(SExt(value, GetType<u32[4]>()), m_ir->getIntNTy(128));
 	}
 
 	if (value->getType() == GetType<bool[8]>())
 	{
-		return m_ir->CreateBitCast(SExt(value, GetType<u16[8]>()), m_ir->getIntNTy(128));
+		return bitcast(SExt(value, GetType<u16[8]>()), m_ir->getIntNTy(128));
 	}
 
 	if (value->getType() == GetType<bool[16]>())
 	{
-		return m_ir->CreateBitCast(SExt(value, GetType<u8[16]>()), m_ir->getIntNTy(128));
+		return bitcast(SExt(value, GetType<u8[16]>()), m_ir->getIntNTy(128));
 	}
 
-	return m_ir->CreateBitCast(value, m_ir->getIntNTy(size));
+	return bitcast(value, m_ir->getIntNTy(size));
 }
 
 Value* PPUTranslator::IsZero(Value* value)
@@ -580,7 +579,7 @@ void PPUTranslator::UseCondition(MDNode* hint, Value* cond)
 
 llvm::Value* PPUTranslator::GetMemory(llvm::Value* addr, llvm::Type* type)
 {
-	return m_ir->CreateBitCast(m_ir->CreateGEP(m_base_loaded, {m_ir->getInt64(0), addr}), type->getPointerTo());
+	return bitcast(m_ir->CreateGEP(m_base_loaded, {m_ir->getInt64(0), addr}), type->getPointerTo());
 }
 
 Value* PPUTranslator::ReadMemory(Value* addr, Type* type, bool is_be, u32 align)
@@ -592,7 +591,7 @@ Value* PPUTranslator::ReadMemory(Value* addr, Type* type, bool is_be, u32 align)
 		// Read, byteswap, bitcast
 		const auto int_type = m_ir->getIntNTy(size);
 		const auto value = m_ir->CreateAlignedLoad(GetMemory(addr, int_type), llvm::MaybeAlign{align}, true);
-		return m_ir->CreateBitCast(Call(int_type, fmt::format("llvm.bswap.i%u", size), value), type);
+		return bitcast(Call(int_type, fmt::format("llvm.bswap.i%u", size), value), type);
 	}
 
 	// Read normally
@@ -608,7 +607,7 @@ void PPUTranslator::WriteMemory(Value* addr, Value* value, bool is_be, u32 align
 	{
 		// Bitcast, byteswap
 		const auto int_type = m_ir->getIntNTy(size);
-		value = Call(int_type, fmt::format("llvm.bswap.i%u", size), m_ir->CreateBitCast(value, int_type));
+		value = Call(int_type, fmt::format("llvm.bswap.i%u", size), bitcast(value, int_type));
 	}
 
 	// Write
@@ -947,10 +946,8 @@ void PPUTranslator::VMADDFP(ppu_opcode_t op)
 	auto [a, b, c] = get_vrs<f32[4]>(op.va, op.vb, op.vc);
 
 	// Optimization: Emit only a floating multiply if the addend is zero
-	if (auto cv = llvm::dyn_cast<llvm::Constant>(b.value))
+	if (auto [ok, data] = get_const_vector(b.value, m_addr, 2000); ok)
 	{
-		v128 data = get_const_vector(cv, m_addr, 2000);
-
 		if (data == v128{})
 		{
 			set_vr(op.vd, vec_handle_result(a * c));
@@ -1253,10 +1250,8 @@ void PPUTranslator::VNMSUBFP(ppu_opcode_t op)
 	auto [a, b, c] = get_vrs<f32[4]>(op.va, op.vb, op.vc);
 
 	// Optimization: Emit only a floating multiply if the addend is zero
-	if (const auto cv = llvm::dyn_cast<llvm::Constant>(b.value))
+	if (const auto [ok, data] = get_const_vector(b.value, m_addr, 2004); ok)
 	{
-		const v128 data = get_const_vector(cv, m_addr, 2004);
-
 		if (data == v128{})
 		{
 			set_vr(op.vd, vec_handle_result(-a * c));
@@ -1438,10 +1433,8 @@ void PPUTranslator::VSEL(ppu_opcode_t op)
 	const auto c = get_vr<u32[4]>(op.vc);
 
 	// Check if the constant mask doesn't require bit granularity
-	if (auto ci = llvm::dyn_cast<llvm::Constant>(c.value))
+	if (auto [ok, mask] = get_const_vector(c.value, m_addr, 9000); ok)
 	{
-		v128 mask = get_const_vector(ci, m_addr, 9000);
-
 		bool sel_32 = true;
 		for (u32 i = 0; i < 4; i++)
 		{
@@ -2777,7 +2770,7 @@ void PPUTranslator::MTOCRF(ppu_opcode_t op)
 
 			const auto index = m_ir->CreateAnd(m_ir->CreateLShr(value, 28 - i * 4), 15);
 			const auto src = m_ir->CreateGEP(m_mtocr_table, {m_ir->getInt32(0), m_ir->CreateShl(index, 2)});
-			const auto dst = m_ir->CreateBitCast(m_ir->CreateStructGEP(nullptr, m_thread, static_cast<uint>(m_cr - m_locals) + i * 4), GetType<u8*>());
+			const auto dst = bitcast(m_ir->CreateStructGEP(nullptr, m_thread, static_cast<uint>(m_cr - m_locals) + i * 4), GetType<u8*>());
 			Call(GetType<void>(), "llvm.memcpy.p0i8.p0i8.i32", dst, src, m_ir->getInt32(4), m_ir->getFalse());
 		}
 	}
@@ -4559,15 +4552,15 @@ Value* PPUTranslator::GetFpr(u32 r, u32 bits, bool as_int)
 	}
 	else
 	{
-		return Trunc(m_ir->CreateBitCast(value, GetType<u64>()), m_ir->getIntNTy(bits));
+		return Trunc(bitcast(value, GetType<u64>()), m_ir->getIntNTy(bits));
 	}
 }
 
 void PPUTranslator::SetFpr(u32 r, Value* val)
 {
 	const auto f64_val =
-		val->getType() == GetType<s32>() ? m_ir->CreateBitCast(SExt(val), GetType<f64>()) :
-		val->getType() == GetType<s64>() ? m_ir->CreateBitCast(val, GetType<f64>()) :
+		val->getType() == GetType<s32>() ? bitcast(SExt(val), GetType<f64>()) :
+		val->getType() == GetType<s64>() ? bitcast(val, GetType<f64>()) :
 		val->getType() == GetType<f32>() ? m_ir->CreateFPExt(val, GetType<f64>()) : val;
 
 	RegStore(f64_val, m_fpr[r]);
@@ -4577,16 +4570,19 @@ Value* PPUTranslator::GetVr(u32 vr, VrType type)
 {
 	const auto value = RegLoad(m_vr[vr]);
 
+	llvm::Type* _type{};
+
 	switch (type)
 	{
-	case VrType::vi32: return m_ir->CreateBitCast(value, GetType<u32[4]>());
-	case VrType::vi8: return m_ir->CreateBitCast(value, GetType<u8[16]>());
-	case VrType::vi16: return m_ir->CreateBitCast(value, GetType<u16[8]>());
-	case VrType::vf: return m_ir->CreateBitCast(value, GetType<f32[4]>());
-	case VrType::i128: return m_ir->CreateBitCast(value, GetType<u128>());
+	case VrType::vi32: _type = GetType<u32[4]>(); break;
+	case VrType::vi8 : _type = GetType<u8[16]>(); break;
+	case VrType::vi16: _type = GetType<u16[8]>(); break;
+	case VrType::vf  : _type = GetType<f32[4]>(); break;
+	case VrType::i128: _type = GetType<u128>(); break;
+	default: report_fatal_error("GetVr(): invalid type");
 	}
 
-	report_fatal_error("GetVr(): invalid type");
+	return bitcast(value, _type);
 }
 
 void PPUTranslator::SetVr(u32 vr, Value* value)