Add support for long-to-double in the optimizing compiler.

- Add support for the long-to-double Dex instruction in the optimizing compiler. - Enable requests of temporary FPU (double) registers during code generation. - Fix art::x86::X86Assembler::LoadLongConstant and extend it to int64_t values. - Have art::x86_64::X86_64Assembler::cvtsi2sd work with 64-bit operands. - Generate x86, x86-64 and ARM (but not ARM64) code for long to double HTypeConversion nodes. - Add related tests to test/422-type-conversion. Change-Id: Ie73d9e5e25bd2e15f585c371e8fc2dcb83438ccd
author: Roland Levillain <rpl@google.com> 2014-11-27 12:06:00 +0000
committer: Roland Levillain <rpl@google.com> 2014-11-27 12:06:00 +0000
commit: 647b9ed41cdb7cf302fd356627a3ba372419b78c (patch)
tree: f1ca054aa20ae4c489f208982e7a6cba5d5ee21e /compiler/optimizing/code_generator_arm.cc
parent: 35ecc8ca8fba713728b8fc60e9e2a275da2028aa (diff)
download: art-647b9ed41cdb7cf302fd356627a3ba372419b78c.tar.gz
art-647b9ed41cdb7cf302fd356627a3ba372419b78c.tar.bz2
art-647b9ed41cdb7cf302fd356627a3ba372419b78c.zip
1 files changed, 43 insertions, 1 deletions
diff --git a/compiler/optimizing/code_generator_arm.cc b/compiler/optimizing/code_generator_arm.cc
index 890cfdd0e6..22a859071b 100644
--- a/compiler/optimizing/code_generator_arm.cc
+++ b/compiler/optimizing/code_generator_arm.cc
@@ -1481,6 +1481,14 @@ void LocationsBuilderARM::VisitTypeConversion(HTypeConversion* conversion) {
           break;
 
         case Primitive::kPrimLong:
+          // Processing a Dex `long-to-double' instruction.
+          locations->SetInAt(0, Location::RequiresRegister());
+          locations->SetOut(Location::RequiresFpuRegister());
+          locations->AddTemp(Location::RequiresRegister());
+          locations->AddTemp(Location::RequiresRegister());
+          locations->AddTemp(Location::RequiresFpuRegister());
+          break;
+
         case Primitive::kPrimFloat:
           LOG(FATAL) << "Type conversion from " << input_type
                      << " to " << result_type << " not yet implemented";
@@ -1645,7 +1653,41 @@ void InstructionCodeGeneratorARM::VisitTypeConversion(HTypeConversion* conversio
           break;
         }
 
-        case Primitive::kPrimLong:
+        case Primitive::kPrimLong: {
+          // Processing a Dex `long-to-double' instruction.
+          Register low = in.AsRegisterPairLow<Register>();
+          Register high = in.AsRegisterPairHigh<Register>();
+          SRegister out_s = out.AsFpuRegisterPairLow<SRegister>();
+          DRegister out_d = FromLowSToD(out_s);
+          Register constant_low = locations->GetTemp(0).As<Register>();
+          Register constant_high = locations->GetTemp(1).As<Register>();
+          SRegister temp_s = locations->GetTemp(2).AsFpuRegisterPairLow<SRegister>();
+          DRegister temp_d = FromLowSToD(temp_s);
+
+          // Binary encoding of 2^32 for type double.
+          const uint64_t c = UINT64_C(0x41F0000000000000);
+
+          // out_d = int-to-double(high)
+          __ vmovsr(out_s, high);
+          __ vcvtdi(out_d, out_s);
+          // Using vmovd to load the `c` constant as an immediate
+          // value into `temp_d` does not work, as this instruction
+          // only transfers 8 significant bits of its immediate
+          // operand.  Instead, use two 32-bit core registers to
+          // load `c` into `temp_d`.
+          __ LoadImmediate(constant_low, Low32Bits(c));
+          __ LoadImmediate(constant_high, High32Bits(c));
+          __ vmovdrr(temp_d, constant_low, constant_high);
+          // out_d = out_d * 2^32
+          __ vmuld(out_d, out_d, temp_d);
+          // temp_d = unsigned-to-double(low)
+          __ vmovsr(temp_s, low);
+          __ vcvtdu(temp_d, temp_s);
+          // out_d = out_d + temp_d
+          __ vaddd(out_d, out_d, temp_d);
+          break;
+        }
+
         case Primitive::kPrimFloat:
           LOG(FATAL) << "Type conversion from " << input_type
                      << " to " << result_type << " not yet implemented";
author	Roland Levillain <rpl@google.com>	2014-11-27 12:06:00 +0000
committer	Roland Levillain <rpl@google.com>	2014-11-27 12:06:00 +0000
commit	647b9ed41cdb7cf302fd356627a3ba372419b78c (patch)
tree	f1ca054aa20ae4c489f208982e7a6cba5d5ee21e /compiler/optimizing/code_generator_arm.cc
parent	35ecc8ca8fba713728b8fc60e9e2a275da2028aa (diff)
download	art-647b9ed41cdb7cf302fd356627a3ba372419b78c.tar.gz art-647b9ed41cdb7cf302fd356627a3ba372419b78c.tar.bz2 art-647b9ed41cdb7cf302fd356627a3ba372419b78c.zip