Commit 0d94d7c7 authored by erik.corry@gmail.com

Add vfp support on ARM. Patch from John Jozwiak.

Review URL: http://codereview.chromium.org/348019

git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@3292 ce2b1a6d-e550-0410-aec6-3dcde31c8c00
parent 3773f96e
...@@ -19,3 +19,4 @@ Rafal Krypa <rafal@krypa.net> ...@@ -19,3 +19,4 @@ Rafal Krypa <rafal@krypa.net>
Rene Rebe <rene@exactcode.de> Rene Rebe <rene@exactcode.de>
Ryan Dahl <coldredlemur@gmail.com> Ryan Dahl <coldredlemur@gmail.com>
Patrick Gansterer <paroga@paroga.com> Patrick Gansterer <paroga@paroga.com>
John Jozwiak <jjozwiak@codeaurora.org>
This diff is collapsed.
...@@ -102,6 +102,57 @@ extern Register sp; ...@@ -102,6 +102,57 @@ extern Register sp;
extern Register lr; extern Register lr;
extern Register pc; extern Register pc;
// Support for VFP registers s0 to s31 (d0 to d15).
// Note that the pair "sN:sM" (N even, M = N + 1) is the same as "dN/2".
extern Register s0;
extern Register s1;
extern Register s2;
extern Register s3;
extern Register s4;
extern Register s5;
extern Register s6;
extern Register s7;
extern Register s8;
extern Register s9;
extern Register s10;
extern Register s11;
extern Register s12;
extern Register s13;
extern Register s14;
extern Register s15;
extern Register s16;
extern Register s17;
extern Register s18;
extern Register s19;
extern Register s20;
extern Register s21;
extern Register s22;
extern Register s23;
extern Register s24;
extern Register s25;
extern Register s26;
extern Register s27;
extern Register s28;
extern Register s29;
extern Register s30;
extern Register s31;
extern Register d0;
extern Register d1;
extern Register d2;
extern Register d3;
extern Register d4;
extern Register d5;
extern Register d6;
extern Register d7;
extern Register d8;
extern Register d9;
extern Register d10;
extern Register d11;
extern Register d12;
extern Register d13;
extern Register d14;
extern Register d15;
// Coprocessor register // Coprocessor register
struct CRegister { struct CRegister {
...@@ -372,6 +423,30 @@ class MemOperand BASE_EMBEDDED { ...@@ -372,6 +423,30 @@ class MemOperand BASE_EMBEDDED {
friend class Assembler; friend class Assembler;
}; };
// CpuFeatures records which optional features the target CPU offers and which
// of them are currently switched on. Each Feature value is used as a bit
// position inside the 64-bit supported_/enabled_ sets.
// Supported features must be enabled by a Scope before use.
class CpuFeatures : public AllStatic {
 public:
  enum Feature { VFP3 = 1 };

  // Detect features of the target CPU. Set safe defaults if the serializer
  // is enabled (snapshots must be portable).
  static void Probe();

  // True when the target CPU supports |f|. VFP3 is additionally reported as
  // unsupported whenever FLAG_enable_vfp3 is off.
  static bool IsSupported(Feature f) {
    const bool disabled_by_flag = (f == VFP3) && !FLAG_enable_vfp3;
    if (disabled_by_flag) return false;
    return (supported_ & BitFor(f)) != 0;
  }

  // True when |f| is currently enabled.
  static bool IsEnabled(Feature f) {
    return (enabled_ & BitFor(f)) != 0;
  }

 private:
  // Single-bit mask selecting |f| within supported_ / enabled_.
  static uint64_t BitFor(Feature f) {
    return static_cast<uint64_t>(1) << f;
  }

  static uint64_t supported_;
  static uint64_t enabled_;
};
typedef int32_t Instr; typedef int32_t Instr;
...@@ -655,6 +730,66 @@ class Assembler : public Malloced { ...@@ -655,6 +730,66 @@ class Assembler : public Malloced {
void stc2(Coprocessor coproc, CRegister crd, Register base, int option, void stc2(Coprocessor coproc, CRegister crd, Register base, int option,
LFlag l = Short); // v5 and above LFlag l = Short); // v5 and above
// Support for VFP.
// All these APIs support S0 to S31 and D0 to D15.
// Currently these APIs do not support extended D registers, i.e., D16 to D31.
// However, some simple modifications can allow
// these APIs to support D16 to D31.
// NOTE(review): every operand is typed as a plain Register, so these
// signatures do not distinguish core, S and D registers; callers must pass the
// right kind. What the |s| argument does for VFP instructions is not visible
// from these declarations -- confirm against the definitions.
// fmdrr: Dm = <Rt, Rt2>. Moves two core registers into a double register;
// call sites pass the low word as src1 and the high word as src2.
void fmdrr(const Register dst,
const Register src1,
const Register src2,
const SBit s = LeaveCC,
const Condition cond = al);
// fmrrd: <Rt, Rt2> = Dm. Moves a double register into two core registers;
// call sites receive the low word in dst1 and the high word in dst2.
void fmrrd(const Register dst1,
const Register dst2,
const Register src,
const SBit s = LeaveCC,
const Condition cond = al);
// fmsr: Sn = Rt. Moves a core register into a single-precision register.
void fmsr(const Register dst,
const Register src,
const SBit s = LeaveCC,
const Condition cond = al);
// fmrs: Rt = Sn. Moves a single-precision register into a core register.
void fmrs(const Register dst,
const Register src,
const SBit s = LeaveCC,
const Condition cond = al);
// fsitod: Dd = Sm. Signed integer to double conversion.
void fsitod(const Register dst,
const Register src,
const SBit s = LeaveCC,
const Condition cond = al);
// ftosid: Sd = Dm. Double to signed integer conversion.
void ftosid(const Register dst,
const Register src,
const SBit s = LeaveCC,
const Condition cond = al);
// faddd: Dd = Dn + Dm.
void faddd(const Register dst,
const Register src1,
const Register src2,
const SBit s = LeaveCC,
const Condition cond = al);
// fsubd: Dd = Dn - Dm.
void fsubd(const Register dst,
const Register src1,
const Register src2,
const SBit s = LeaveCC,
const Condition cond = al);
// fmuld: Dd = Dn * Dm.
void fmuld(const Register dst,
const Register src1,
const Register src2,
const SBit s = LeaveCC,
const Condition cond = al);
// fdivd: Dd = Dn / Dm.
void fdivd(const Register dst,
const Register src1,
const Register src2,
const SBit s = LeaveCC,
const Condition cond = al);
// fcmp: compares two double registers (disassembled as vcmp.f64).
void fcmp(const Register src1,
const Register src2,
const SBit s = LeaveCC,
const Condition cond = al);
// vmrs: the code generator calls this with pc after fcmp and then uses
// eq/lt/gt conditional instructions; the disassembler prints that encoding as
// "vmrs APSR, FPSCR".
void vmrs(const Register dst,
const Condition cond = al);
// Pseudo instructions // Pseudo instructions
void nop() { mov(r0, Operand(r0)); } void nop() { mov(r0, Operand(r0)); }
......
...@@ -4599,6 +4599,21 @@ static void EmitIdenticalObjectComparison(MacroAssembler* masm, ...@@ -4599,6 +4599,21 @@ static void EmitIdenticalObjectComparison(MacroAssembler* masm,
} }
// Emits VFP3 code that converts the Smi held in inReg to a double and leaves
// the result in two core registers: the low word in outLowReg and the high
// word in outHighReg.
// The emitted code overwrites r7, s15 and d7. inReg is read before either
// output register is written, so an output may be the same register as inReg.
static void IntegerToDoubleConversionWithVFP3(MacroAssembler* masm,
Register inReg,
Register outHighReg,
Register outLowReg) {
// ARMv7 VFP3 instructions to implement integer to double conversion.
// This VFP3 implementation is known to work
// on ARMv7-VFP3 Snapdragon processor.
// Shift the Smi tag out arithmetically so r7 holds the plain integer.
__ mov(r7, Operand(inReg, ASR, kSmiTagSize));
// Move the integer into the VFP register file.
__ fmsr(s15, r7);
// Signed integer -> double.
__ fsitod(d7, s15);
// Copy the 64-bit result back out to the two core registers.
__ fmrrd(outLowReg, outHighReg, d7);
}
// See comment at call site. // See comment at call site.
static void EmitSmiNonsmiComparison(MacroAssembler* masm, static void EmitSmiNonsmiComparison(MacroAssembler* masm,
Label* rhs_not_nan, Label* rhs_not_nan,
...@@ -4622,9 +4637,16 @@ static void EmitSmiNonsmiComparison(MacroAssembler* masm, ...@@ -4622,9 +4637,16 @@ static void EmitSmiNonsmiComparison(MacroAssembler* masm,
// Rhs is a smi, lhs is a number. // Rhs is a smi, lhs is a number.
__ push(lr); __ push(lr);
if (CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
IntegerToDoubleConversionWithVFP3(masm, r1, r3, r2);
} else {
__ mov(r7, Operand(r1)); __ mov(r7, Operand(r1));
ConvertToDoubleStub stub1(r3, r2, r7, r6); ConvertToDoubleStub stub1(r3, r2, r7, r6);
__ Call(stub1.GetCode(), RelocInfo::CODE_TARGET); __ Call(stub1.GetCode(), RelocInfo::CODE_TARGET);
}
// r3 and r2 are rhs as double. // r3 and r2 are rhs as double.
__ ldr(r1, FieldMemOperand(r0, HeapNumber::kValueOffset + kPointerSize)); __ ldr(r1, FieldMemOperand(r0, HeapNumber::kValueOffset + kPointerSize));
__ ldr(r0, FieldMemOperand(r0, HeapNumber::kValueOffset)); __ ldr(r0, FieldMemOperand(r0, HeapNumber::kValueOffset));
...@@ -4652,9 +4674,15 @@ static void EmitSmiNonsmiComparison(MacroAssembler* masm, ...@@ -4652,9 +4674,15 @@ static void EmitSmiNonsmiComparison(MacroAssembler* masm,
__ push(lr); __ push(lr);
__ ldr(r2, FieldMemOperand(r1, HeapNumber::kValueOffset)); __ ldr(r2, FieldMemOperand(r1, HeapNumber::kValueOffset));
__ ldr(r3, FieldMemOperand(r1, HeapNumber::kValueOffset + kPointerSize)); __ ldr(r3, FieldMemOperand(r1, HeapNumber::kValueOffset + kPointerSize));
if (CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
IntegerToDoubleConversionWithVFP3(masm, r0, r1, r0);
} else {
__ mov(r7, Operand(r0)); __ mov(r7, Operand(r0));
ConvertToDoubleStub stub2(r1, r0, r7, r6); ConvertToDoubleStub stub2(r1, r0, r7, r6);
__ Call(stub2.GetCode(), RelocInfo::CODE_TARGET); __ Call(stub2.GetCode(), RelocInfo::CODE_TARGET);
}
__ pop(lr); __ pop(lr);
// Fall through to both_loaded_as_doubles. // Fall through to both_loaded_as_doubles.
} }
...@@ -4857,9 +4885,25 @@ void CompareStub::Generate(MacroAssembler* masm) { ...@@ -4857,9 +4885,25 @@ void CompareStub::Generate(MacroAssembler* masm) {
// fall through if neither is a NaN. Also binds rhs_not_nan. // fall through if neither is a NaN. Also binds rhs_not_nan.
EmitNanCheck(masm, &rhs_not_nan, cc_); EmitNanCheck(masm, &rhs_not_nan, cc_);
if (CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
// ARMv7 VFP3 instructions to implement double precision comparison.
// This VFP3 implementation is known to work on
// ARMv7-VFP3 Snapdragon processor.
__ fmdrr(d6, r0, r1);
__ fmdrr(d7, r2, r3);
__ fcmp(d6, d7);
__ vmrs(pc);
__ mov(r0, Operand(0), LeaveCC, eq);
__ mov(r0, Operand(1), LeaveCC, lt);
__ mvn(r0, Operand(0), LeaveCC, gt);
__ mov(pc, Operand(lr));
} else {
// Compares two doubles in r0, r1, r2, r3 that are not NaNs. Returns the // Compares two doubles in r0, r1, r2, r3 that are not NaNs. Returns the
// answer. Never falls through. // answer. Never falls through.
EmitTwoNonNanDoubleComparison(masm, cc_); EmitTwoNonNanDoubleComparison(masm, cc_);
}
__ bind(&not_smis); __ bind(&not_smis);
// At this point we know we are dealing with two different objects, // At this point we know we are dealing with two different objects,
...@@ -4959,6 +5003,11 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm, ...@@ -4959,6 +5003,11 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm,
// Since both are Smis there is no heap number to overwrite, so allocate. // Since both are Smis there is no heap number to overwrite, so allocate.
// The new heap number is in r5. r6 and r7 are scratch. // The new heap number is in r5. r6 and r7 are scratch.
AllocateHeapNumber(masm, &slow, r5, r6, r7); AllocateHeapNumber(masm, &slow, r5, r6, r7);
if (CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
IntegerToDoubleConversionWithVFP3(masm, r0, r3, r2);
IntegerToDoubleConversionWithVFP3(masm, r1, r1, r0);
} else {
// Write Smi from r0 to r3 and r2 in double format. r6 is scratch. // Write Smi from r0 to r3 and r2 in double format. r6 is scratch.
__ mov(r7, Operand(r0)); __ mov(r7, Operand(r0));
ConvertToDoubleStub stub1(r3, r2, r7, r6); ConvertToDoubleStub stub1(r3, r2, r7, r6);
...@@ -4969,6 +5018,8 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm, ...@@ -4969,6 +5018,8 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm,
ConvertToDoubleStub stub2(r1, r0, r7, r6); ConvertToDoubleStub stub2(r1, r0, r7, r6);
__ Call(stub2.GetCode(), RelocInfo::CODE_TARGET); __ Call(stub2.GetCode(), RelocInfo::CODE_TARGET);
__ pop(lr); __ pop(lr);
}
__ jmp(&do_the_call); // Tail call. No return. __ jmp(&do_the_call); // Tail call. No return.
// We jump to here if something goes wrong (one param is not a number of any // We jump to here if something goes wrong (one param is not a number of any
...@@ -5004,12 +5055,19 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm, ...@@ -5004,12 +5055,19 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm,
// We can't overwrite a Smi so get address of new heap number into r5. // We can't overwrite a Smi so get address of new heap number into r5.
AllocateHeapNumber(masm, &slow, r5, r6, r7); AllocateHeapNumber(masm, &slow, r5, r6, r7);
} }
if (CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
IntegerToDoubleConversionWithVFP3(masm, r0, r3, r2);
} else {
// Write Smi from r0 to r3 and r2 in double format. // Write Smi from r0 to r3 and r2 in double format.
__ mov(r7, Operand(r0)); __ mov(r7, Operand(r0));
ConvertToDoubleStub stub3(r3, r2, r7, r6); ConvertToDoubleStub stub3(r3, r2, r7, r6);
__ push(lr); __ push(lr);
__ Call(stub3.GetCode(), RelocInfo::CODE_TARGET); __ Call(stub3.GetCode(), RelocInfo::CODE_TARGET);
__ pop(lr); __ pop(lr);
}
__ bind(&finished_loading_r0); __ bind(&finished_loading_r0);
// Move r1 to a double in r0-r1. // Move r1 to a double in r0-r1.
...@@ -5029,12 +5087,18 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm, ...@@ -5029,12 +5087,18 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm,
// We can't overwrite a Smi so get address of new heap number into r5. // We can't overwrite a Smi so get address of new heap number into r5.
AllocateHeapNumber(masm, &slow, r5, r6, r7); AllocateHeapNumber(masm, &slow, r5, r6, r7);
} }
if (CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
IntegerToDoubleConversionWithVFP3(masm, r1, r1, r0);
} else {
// Write Smi from r1 to r1 and r0 in double format. // Write Smi from r1 to r1 and r0 in double format.
__ mov(r7, Operand(r1)); __ mov(r7, Operand(r1));
ConvertToDoubleStub stub4(r1, r0, r7, r6); ConvertToDoubleStub stub4(r1, r0, r7, r6);
__ push(lr); __ push(lr);
__ Call(stub4.GetCode(), RelocInfo::CODE_TARGET); __ Call(stub4.GetCode(), RelocInfo::CODE_TARGET);
__ pop(lr); __ pop(lr);
}
__ bind(&finished_loading_r1); __ bind(&finished_loading_r1);
__ bind(&do_the_call); __ bind(&do_the_call);
...@@ -5043,6 +5107,33 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm, ...@@ -5043,6 +5107,33 @@ static void HandleBinaryOpSlowCases(MacroAssembler* masm,
// r2: Right value (least significant part of mantissa). // r2: Right value (least significant part of mantissa).
// r3: Right value (sign, exponent, top of mantissa). // r3: Right value (sign, exponent, top of mantissa).
// r5: Address of heap number for result. // r5: Address of heap number for result.
if (CpuFeatures::IsSupported(CpuFeatures::VFP3) &&
((Token::MUL == operation) ||
(Token::DIV == operation) ||
(Token::ADD == operation) ||
(Token::SUB == operation))) {
// ARMv7 VFP3 instructions to implement
// double precision, add, subtract, multiply, divide.
// This VFP3 implementation is known to work on
// ARMv7-VFP3 Snapdragon processor
__ fmdrr(d6, r0, r1);
__ fmdrr(d7, r2, r3);
if (Token::MUL == operation) __ fmuld(d5, d6, d7);
else if (Token::DIV == operation) __ fdivd(d5, d6, d7);
else if (Token::ADD == operation) __ faddd(d5, d6, d7);
else if (Token::SUB == operation) __ fsubd(d5, d6, d7);
__ fmrrd(r0, r1, d5);
__ str(r0, FieldMemOperand(r5, HeapNumber::kValueOffset));
__ str(r1, FieldMemOperand(r5, HeapNumber::kValueOffset + 4));
__ mov(r0, Operand(r5));
__ mov(pc, lr);
return;
}
__ push(lr); // For later. __ push(lr); // For later.
__ push(r5); // Address of heap number that is answer. __ push(r5); // Address of heap number that is answer.
__ AlignStack(0); __ AlignStack(0);
...@@ -5111,27 +5202,39 @@ static void GetInt32(MacroAssembler* masm, ...@@ -5111,27 +5202,39 @@ static void GetInt32(MacroAssembler* masm,
__ sub(scratch2, scratch2, Operand(zero_exponent), SetCC); __ sub(scratch2, scratch2, Operand(zero_exponent), SetCC);
// Dest already has a Smi zero. // Dest already has a Smi zero.
__ b(lt, &done); __ b(lt, &done);
if (!CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
// We have a shifted exponent between 0 and 30 in scratch2. // We have a shifted exponent between 0 and 30 in scratch2.
__ mov(dest, Operand(scratch2, LSR, HeapNumber::kExponentShift)); __ mov(dest, Operand(scratch2, LSR, HeapNumber::kExponentShift));
// We now have the exponent in dest. Subtract from 30 to get // We now have the exponent in dest. Subtract from 30 to get
// how much to shift down. // how much to shift down.
__ rsb(dest, dest, Operand(30)); __ rsb(dest, dest, Operand(30));
}
__ bind(&right_exponent); __ bind(&right_exponent);
if (CpuFeatures::IsSupported(CpuFeatures::VFP3)) {
// ARMv7 VFP3 instructions implementing double precision to integer
// conversion using round to zero.
// This VFP3 implementation is known to work on
// ARMv7-VFP3 Snapdragon processor.
__ ldr(scratch2, FieldMemOperand(source, HeapNumber::kMantissaOffset));
__ fmdrr(d7, scratch2, scratch);
__ ftosid(s15, d7);
__ fmrs(dest, s15);
} else {
// Get the top bits of the mantissa. // Get the top bits of the mantissa.
__ and_(scratch2, scratch, Operand(HeapNumber::kMantissaMask)); __ and_(scratch2, scratch, Operand(HeapNumber::kMantissaMask));
// Put back the implicit 1. // Put back the implicit 1.
__ orr(scratch2, scratch2, Operand(1 << HeapNumber::kExponentShift)); __ orr(scratch2, scratch2, Operand(1 << HeapNumber::kExponentShift));
// Shift up the mantissa bits to take up the space the exponent used to take. // Shift up the mantissa bits to take up the space the exponent used to
// We just orred in the implicit bit so that took care of one and we want to // take. We just orred in the implicit bit so that took care of one and
// leave the sign bit 0 so we subtract 2 bits from the shift distance. // we want to leave the sign bit 0 so we subtract 2 bits from the shift
// distance.
const int shift_distance = HeapNumber::kNonMantissaBitsInTopWord - 2; const int shift_distance = HeapNumber::kNonMantissaBitsInTopWord - 2;
__ mov(scratch2, Operand(scratch2, LSL, shift_distance)); __ mov(scratch2, Operand(scratch2, LSL, shift_distance));
// Put sign in zero flag. // Put sign in zero flag.
__ tst(scratch, Operand(HeapNumber::kSignMask)); __ tst(scratch, Operand(HeapNumber::kSignMask));
// Get the second half of the double. For some exponents we don't actually // Get the second half of the double. For some exponents we don't
// need this because the bits get shifted out again, but it's probably slower // actually need this because the bits get shifted out again, but
// to test than just to do it. // it's probably slower to test than just to do it.
__ ldr(scratch, FieldMemOperand(source, HeapNumber::kMantissaOffset)); __ ldr(scratch, FieldMemOperand(source, HeapNumber::kMantissaOffset));
// Shift down 22 bits to get the last 10 bits. // Shift down 22 bits to get the last 10 bits.
__ orr(scratch, scratch2, Operand(scratch, LSR, 32 - shift_distance)); __ orr(scratch, scratch2, Operand(scratch, LSR, 32 - shift_distance));
...@@ -5139,10 +5242,10 @@ static void GetInt32(MacroAssembler* masm, ...@@ -5139,10 +5242,10 @@ static void GetInt32(MacroAssembler* masm,
__ mov(dest, Operand(scratch, LSR, dest)); __ mov(dest, Operand(scratch, LSR, dest));
// Fix sign if sign bit was set. // Fix sign if sign bit was set.
__ rsb(dest, dest, Operand(0), LeaveCC, ne); __ rsb(dest, dest, Operand(0), LeaveCC, ne);
}
__ bind(&done); __ bind(&done);
} }
// For bitwise ops where the inputs are not both Smis we here try to determine // For bitwise ops where the inputs are not both Smis we here try to determine
// whether both inputs are either Smis or at least heap numbers that can be // whether both inputs are either Smis or at least heap numbers that can be
// represented by a 32 bit signed value. We truncate towards zero as required // represented by a 32 bit signed value. We truncate towards zero as required
...@@ -5159,7 +5262,7 @@ void GenericBinaryOpStub::HandleNonSmiBitwiseOp(MacroAssembler* masm) { ...@@ -5159,7 +5262,7 @@ void GenericBinaryOpStub::HandleNonSmiBitwiseOp(MacroAssembler* masm) {
__ b(eq, &r1_is_smi); // It's a Smi so don't check it's a heap number. __ b(eq, &r1_is_smi); // It's a Smi so don't check it's a heap number.
__ CompareObjectType(r1, r4, r4, HEAP_NUMBER_TYPE); __ CompareObjectType(r1, r4, r4, HEAP_NUMBER_TYPE);
__ b(ne, &slow); __ b(ne, &slow);
GetInt32(masm, r1, r3, r4, r5, &slow); GetInt32(masm, r1, r3, r5, r4, &slow);
__ jmp(&done_checking_r1); __ jmp(&done_checking_r1);
__ bind(&r1_is_smi); __ bind(&r1_is_smi);
__ mov(r3, Operand(r1, ASR, 1)); __ mov(r3, Operand(r1, ASR, 1));
...@@ -5169,7 +5272,7 @@ void GenericBinaryOpStub::HandleNonSmiBitwiseOp(MacroAssembler* masm) { ...@@ -5169,7 +5272,7 @@ void GenericBinaryOpStub::HandleNonSmiBitwiseOp(MacroAssembler* masm) {
__ b(eq, &r0_is_smi); // It's a Smi so don't check it's a heap number. __ b(eq, &r0_is_smi); // It's a Smi so don't check it's a heap number.
__ CompareObjectType(r0, r4, r4, HEAP_NUMBER_TYPE); __ CompareObjectType(r0, r4, r4, HEAP_NUMBER_TYPE);
__ b(ne, &slow); __ b(ne, &slow);
GetInt32(masm, r0, r2, r4, r5, &slow); GetInt32(masm, r0, r2, r5, r4, &slow);
__ jmp(&done_checking_r0); __ jmp(&done_checking_r0);
__ bind(&r0_is_smi); __ bind(&r0_is_smi);
__ mov(r2, Operand(r0, ASR, 1)); __ mov(r2, Operand(r0, ASR, 1));
......
...@@ -66,6 +66,28 @@ const char* Registers::Name(int reg) { ...@@ -66,6 +66,28 @@ const char* Registers::Name(int reg) {
return result; return result;
} }
// Support for VFP registers s0 to s31 (d0 to d15).
// Note that the pair "sN:sM" (N even, M = N + 1) is the same as "dN/2".
// These register names are defined in a way to match the native disassembler
// formatting. See for example the command "objdump -d <binary file>".
// Layout: entries 0-31 are the single-precision names s0-s31 and entries
// 32-47 are the double-precision names d0-d15, so a D register number must be
// offset by 32 before indexing this table.
const char* VFPRegisters::names_[kNumVFPRegisters] = {
"s0", "s1", "s2", "s3", "s4", "s5", "s6", "s7",
"s8", "s9", "s10", "s11", "s12", "s13", "s14", "s15",
"s16", "s17", "s18", "s19", "s20", "s21", "s22", "s23",
"s24", "s25", "s26", "s27", "s28", "s29", "s30", "s31",
"d0", "d1", "d2", "d3", "d4", "d5", "d6", "d7",
"d8", "d9", "d10", "d11", "d12", "d13", "d14", "d15",
};
// Returns the printable name stored in names_ for VFP register index |reg|,
// or "no_vfp_reg" when the index lies outside [0, kNumVFPRegisters).
const char* VFPRegisters::Name(int reg) {
  if (reg < 0 || reg >= kNumVFPRegisters) {
    return "no_vfp_reg";
  }
  return names_[reg];
}
int Registers::Number(const char* name) { int Registers::Number(const char* name) {
// Look through the canonical names. // Look through the canonical names.
......
...@@ -75,6 +75,9 @@ namespace arm { ...@@ -75,6 +75,9 @@ namespace arm {
// Number of registers in normal ARM mode. // Number of registers in normal ARM mode.
static const int kNumRegisters = 16; static const int kNumRegisters = 16;
// VFP support.
static const int kNumVFPRegisters = 48;
// PC is register 15. // PC is register 15.
static const int kPCRegister = 15; static const int kPCRegister = 15;
static const int kNoRegister = -1; static const int kNoRegister = -1;
...@@ -231,6 +234,16 @@ class Instr { ...@@ -231,6 +234,16 @@ class Instr {
inline int RnField() const { return Bits(19, 16); } inline int RnField() const { return Bits(19, 16); }
inline int RdField() const { return Bits(15, 12); } inline int RdField() const { return Bits(15, 12); }
// Support for VFP.
// Vn(19-16) | Vd(15-12) | Vm(3-0)
// Four-bit register number fields of a VFP instruction.
inline int VnField() const { return Bits(19, 16); }
inline int VmField() const { return Bits(3, 0); }
inline int VdField() const { return Bits(15, 12); }
// Single bits N(7), M(5) and D(22). When naming an S register the
// disassembler uses them as the lowest bit below Vn, Vm and Vd respectively.
inline int NField() const { return Bit(7); }
inline int MField() const { return Bit(5); }
inline int DField() const { return Bit(22); }
// Rt operand field; occupies the same bits (15-12) as Vd.
inline int RtField() const { return Bits(15, 12); }
// Fields used in Data processing instructions // Fields used in Data processing instructions
inline Opcode OpcodeField() const { inline Opcode OpcodeField() const {
return static_cast<Opcode>(Bits(24, 21)); return static_cast<Opcode>(Bits(24, 21));
...@@ -315,6 +328,15 @@ class Registers { ...@@ -315,6 +328,15 @@ class Registers {
static const RegisterAlias aliases_[]; static const RegisterAlias aliases_[];
}; };
// Helper for converting VFP register numbers to names.
class VFPRegisters {
public:
// Return the name of the register. |reg| indexes a combined table of
// kNumVFPRegisters entries.
static const char* Name(int reg);
private:
// Name table, one entry per VFP register index.
static const char* names_[kNumVFPRegisters];
};
} } // namespace assembler::arm } } // namespace assembler::arm
......
...@@ -33,12 +33,13 @@ ...@@ -33,12 +33,13 @@
#include "v8.h" #include "v8.h"
#include "cpu.h" #include "cpu.h"
#include "macro-assembler.h"
namespace v8 { namespace v8 {
namespace internal { namespace internal {
void CPU::Setup() { void CPU::Setup() {
// Nothing to do. CpuFeatures::Probe();
} }
......
...@@ -97,6 +97,10 @@ class Decoder { ...@@ -97,6 +97,10 @@ class Decoder {
// Printing of common values. // Printing of common values.
void PrintRegister(int reg); void PrintRegister(int reg);
void PrintSRegister(int reg);
void PrintDRegister(int reg);
int FormatVFPRegister(Instr* instr, const char* format);
int FormatVFPinstruction(Instr* instr, const char* format);
void PrintCondition(Instr* instr); void PrintCondition(Instr* instr);
void PrintShiftRm(Instr* instr); void PrintShiftRm(Instr* instr);
void PrintShiftImm(Instr* instr); void PrintShiftImm(Instr* instr);
...@@ -121,6 +125,10 @@ class Decoder { ...@@ -121,6 +125,10 @@ class Decoder {
void DecodeType6(Instr* instr); void DecodeType6(Instr* instr);
void DecodeType7(Instr* instr); void DecodeType7(Instr* instr);
void DecodeUnconditional(Instr* instr); void DecodeUnconditional(Instr* instr);
// For VFP support.
void DecodeTypeVFP(Instr* instr);
void DecodeType6CoprocessorIns(Instr* instr);
const disasm::NameConverter& converter_; const disasm::NameConverter& converter_;
v8::internal::Vector<char> out_buffer_; v8::internal::Vector<char> out_buffer_;
...@@ -171,6 +179,16 @@ void Decoder::PrintRegister(int reg) { ...@@ -171,6 +179,16 @@ void Decoder::PrintRegister(int reg) {
Print(converter_.NameOfCPURegister(reg)); Print(converter_.NameOfCPURegister(reg));
} }
// Print the name of VFP S register |reg|. The name comes straight from
// VFPRegisters::Name; the active name converter is not consulted.
void Decoder::PrintSRegister(int reg) {
Print(assembler::arm::VFPRegisters::Name(reg));
}
// Print the name of VFP D register |reg|. The name comes straight from
// VFPRegisters::Name; the active name converter is not consulted.
void Decoder::PrintDRegister(int reg) {
// Offset by 32 before the lookup: the 32 S-register names occupy the first
// entries of the name table.
Print(assembler::arm::VFPRegisters::Name(reg + 32));
}
// These shift names are defined in a way to match the native disassembler // These shift names are defined in a way to match the native disassembler
// formatting. See for example the command "objdump -d <binary file>". // formatting. See for example the command "objdump -d <binary file>".
...@@ -290,6 +308,10 @@ int Decoder::FormatRegister(Instr* instr, const char* format) { ...@@ -290,6 +308,10 @@ int Decoder::FormatRegister(Instr* instr, const char* format) {
int reg = instr->RmField(); int reg = instr->RmField();
PrintRegister(reg); PrintRegister(reg);
return 2; return 2;
} else if (format[1] == 't') { // 'rt: Rt register
int reg = instr->RtField();
PrintRegister(reg);
return 2;
} else if (format[1] == 'l') { } else if (format[1] == 'l') {
// 'rlist: register list for load and store multiple instructions // 'rlist: register list for load and store multiple instructions
ASSERT(STRING_STARTS_WITH(format, "rlist")); ASSERT(STRING_STARTS_WITH(format, "rlist"));
...@@ -314,6 +336,39 @@ int Decoder::FormatRegister(Instr* instr, const char* format) { ...@@ -314,6 +336,39 @@ int Decoder::FormatRegister(Instr* instr, const char* format) {
return -1; return -1;
} }
// All VFP register formatting lives here so FormatOption stays simple.
// |format| points at a two-character specifier: the first character selects
// the register bank ('S' or 'D'), the second selects the instruction field
// ('n', 'm' or 'd'). For S registers the field's companion bit (N, M or D) is
// used as the lowest bit of the register number. Returns the number of format
// characters consumed (2).
int Decoder::FormatVFPRegister(Instr* instr, const char* format) {
  ASSERT((format[0] == 'S') || (format[0] == 'D'));
  int field_value;
  int extra_bit;
  switch (format[1]) {
    case 'n':
      field_value = instr->VnField();
      extra_bit = instr->NField();
      break;
    case 'm':
      field_value = instr->VmField();
      extra_bit = instr->MField();
      break;
    case 'd':
      field_value = instr->VdField();
      extra_bit = instr->DField();
      break;
    default:
      UNREACHABLE();
      return -1;
  }
  const char bank = format[0];
  if (bank == 'S') {
    PrintSRegister((field_value << 1) | extra_bit);
  } else if (bank == 'D') {
    PrintDRegister(field_value);
  }
  return 2;
}
// Handler for the 'v' format option: prints |format| verbatim and reports
// zero characters consumed. |instr| is not used.
// NOTE(review): FormatOption returns this value to its caller, while
// FormatVFPRegister returns 2 for a two-character specifier. Returning 0
// after printing the whole string looks like it could make the caller emit
// the same text again -- confirm against Decoder::Format. None of the visible
// VFP format strings contain a 'v option.
int Decoder::FormatVFPinstruction(Instr* instr, const char* format) {
Print(format);
return 0;
}
// FormatOption takes a formatting string and interprets it based on // FormatOption takes a formatting string and interprets it based on
// the current instructions. The format string points to the first // the current instructions. The format string points to the first
...@@ -459,6 +514,13 @@ int Decoder::FormatOption(Instr* instr, const char* format) { ...@@ -459,6 +514,13 @@ int Decoder::FormatOption(Instr* instr, const char* format) {
} }
return 1; return 1;
} }
case 'v': {
return FormatVFPinstruction(instr, format);
}
case 'S':
case 'D': {
return FormatVFPRegister(instr, format);
}
case 'w': { // 'w: W field of load and store instructions case 'w': { // 'w: W field of load and store instructions
if (instr->HasW()) { if (instr->HasW()) {
Print("!"); Print("!");
...@@ -761,8 +823,7 @@ void Decoder::DecodeType5(Instr* instr) { ...@@ -761,8 +823,7 @@ void Decoder::DecodeType5(Instr* instr) {
void Decoder::DecodeType6(Instr* instr) { void Decoder::DecodeType6(Instr* instr) {
// Coprocessor instructions currently not supported. DecodeType6CoprocessorIns(instr);
Unknown(instr);
} }
...@@ -770,12 +831,10 @@ void Decoder::DecodeType7(Instr* instr) { ...@@ -770,12 +831,10 @@ void Decoder::DecodeType7(Instr* instr) {
if (instr->Bit(24) == 1) { if (instr->Bit(24) == 1) {
Format(instr, "swi'cond 'swi"); Format(instr, "swi'cond 'swi");
} else { } else {
// Coprocessor instructions currently not supported. DecodeTypeVFP(instr);
Unknown(instr);
} }
} }
void Decoder::DecodeUnconditional(Instr* instr) { void Decoder::DecodeUnconditional(Instr* instr) {
if (instr->Bits(7, 4) == 0xB && instr->Bits(27, 25) == 0 && instr->HasL()) { if (instr->Bits(7, 4) == 0xB && instr->Bits(27, 25) == 0 && instr->HasL()) {
Format(instr, "'memop'h'pu 'rd, "); Format(instr, "'memop'h'pu 'rd, ");
...@@ -837,6 +896,138 @@ void Decoder::DecodeUnconditional(Instr* instr) { ...@@ -837,6 +896,138 @@ void Decoder::DecodeUnconditional(Instr* instr) {
} }
// void Decoder::DecodeTypeVFP(Instr* instr)
// Disassembles type 7 instructions that have bit 24 clear. Any encoding that
// is not one of the instructions below is reported through Unknown().
// Implements the following
// VFP instructions
// fmsr :Sn = Rt
// fmrs :Rt = Sn
// fsitod: Dd = Sm
// ftosid: Sd = Dm
// Dd = faddd(Dn, Dm)
// Dd = fsubd(Dn, Dm)
// Dd = fmuld(Dn, Dm)
// Dd = fdivd(Dn, Dm)
// vcmp(Dd, Dm)
// VMRS
void Decoder::DecodeTypeVFP(Instr* instr) {
ASSERT((instr->TypeField() == 7) && (instr->Bit(24) == 0x0) );
// Bit 23 set: conversions, divide, compare and vmrs.
if (instr->Bit(23) == 1) {
// ftosid: double to signed integer.
if ((instr->Bits(21, 19) == 0x7) &&
(instr->Bits(18, 16) == 0x5) &&
(instr->Bits(11, 9) == 0x5) &&
(instr->Bit(8) == 1) &&
(instr->Bit(6) == 1) &&
(instr->Bit(4) == 0)) {
Format(instr, "vcvt.s32.f64'cond 'Sd, 'Dm");
// fsitod: signed integer to double.
} else if ((instr->Bits(21, 19) == 0x7) &&
(instr->Bits(18, 16) == 0x0) &&
(instr->Bits(11, 9) == 0x5) &&
(instr->Bit(8) == 1) &&
(instr->Bit(7) == 1) &&
(instr->Bit(6) == 1) &&
(instr->Bit(4) == 0)) {
Format(instr, "vcvt.f64.s32'cond 'Dd, 'Sm");
// fdivd.
} else if ((instr->Bit(21) == 0x0) &&
(instr->Bit(20) == 0x0) &&
(instr->Bits(11, 9) == 0x5) &&
(instr->Bit(8) == 1) &&
(instr->Bit(6) == 0) &&
(instr->Bit(4) == 0)) {
Format(instr, "vdiv.f64'cond 'Dd, 'Dn, 'Dm");
// fcmp.
} else if ((instr->Bits(21, 20) == 0x3) &&
(instr->Bits(19, 16) == 0x4) &&
(instr->Bits(11, 9) == 0x5) &&
(instr->Bit(8) == 0x1) &&
(instr->Bit(6) == 0x1) &&
(instr->Bit(4) == 0x0)) {
Format(instr, "vcmp.f64'cond 'Dd, 'Dm");
// vmrs: only the form whose Rt field (bits 15-12) is 0xF is printed.
} else if ((instr->Bits(23, 20) == 0xF) &&
(instr->Bits(19, 16) == 0x1) &&
(instr->Bits(11, 8) == 0xA) &&
(instr->Bits(7, 5) == 0x0) &&
(instr->Bit(4) == 0x1) &&
(instr->Bits(3, 0) == 0x0)) {
if (instr->Bits(15, 12) == 0xF)
Format(instr, "vmrs'cond APSR, FPSCR");
else
Unknown(instr); // not used by V8
} else {
Unknown(instr); // not used by V8
}
// Bit 23 clear, bit 21 set: add, subtract and multiply. Bit 20 separates
// add/sub from mul; bit 6 separates add from sub.
} else if (instr->Bit(21) == 1) {
if ((instr->Bit(20) == 0x1) &&
(instr->Bits(11, 9) == 0x5) &&
(instr->Bit(8) == 0x1) &&
(instr->Bit(6) == 0) &&
(instr->Bit(4) == 0)) {
Format(instr, "vadd.f64'cond 'Dd, 'Dn, 'Dm");
} else if ((instr->Bit(20) == 0x1) &&
(instr->Bits(11, 9) == 0x5) &&
(instr->Bit(8) == 0x1) &&
(instr->Bit(6) == 1) &&
(instr->Bit(4) == 0)) {
Format(instr, "vsub.f64'cond 'Dd, 'Dn, 'Dm");
} else if ((instr->Bit(20) == 0x0) &&
(instr->Bits(11, 9) == 0x5) &&
(instr->Bit(8) == 0x1) &&
(instr->Bit(6) == 0) &&
(instr->Bit(4) == 0)) {
Format(instr, "vmul.f64'cond 'Dd, 'Dn, 'Dm");
} else {
Unknown(instr); // not used by V8
}
// Bits 23 and 21 clear: moves between a core register and an S register.
// Bit 20 selects the direction.
} else {
// fmsr: Sn = Rt.
if ((instr->Bit(20) == 0x0) &&
(instr->Bits(11, 8) == 0xA) &&
(instr->Bits(6, 5) == 0x0) &&
(instr->Bit(4) == 1) &&
(instr->Bits(3, 0) == 0x0)) {
Format(instr, "vmov'cond 'Sn, 'rt");
// fmrs: Rt = Sn.
} else if ((instr->Bit(20) == 0x1) &&
(instr->Bits(11, 8) == 0xA) &&
(instr->Bits(6, 5) == 0x0) &&
(instr->Bit(4) == 1) &&
(instr->Bits(3, 0) == 0x0)) {
Format(instr, "vmov'cond 'rt, 'Sn");
} else {
Unknown(instr); // not used by V8
}
}
}
// Disassembles type 6 coprocessor instructions. Only the two-register
// transfers between a core register pair and a double register are printed:
// Dm = fmdrr(Rt, Rt2)
// <Rt, Rt2> = fmrrd(Dm)
// Everything else is reported through Unknown().
void Decoder::DecodeType6CoprocessorIns(Instr* instr) {
  ASSERT((instr->TypeField() == 6));

  // Bit 23 must not be set, bit 22 must be set, and the remaining fixed
  // fields must match the transfer encoding.
  const bool is_pair_transfer =
      (instr->Bit(23) != 1) &&
      (instr->Bit(22) == 1) &&
      (instr->Bits(27, 24) == 0xC) &&
      (instr->Bits(11, 8) == 0xB) &&
      (instr->Bits(7, 6) == 0x0) &&
      (instr->Bit(4) == 1);

  if (!is_pair_transfer) {
    Unknown(instr);  // not used by V8
    return;
  }

  // Bit 20 gives the direction of the transfer.
  const int direction = instr->Bit(20);
  if (direction == 0) {
    Format(instr, "vmov'cond 'Dm, 'rt, 'rn");
  } else if (direction == 1) {
    Format(instr, "vmov'cond 'rt, 'rn, 'Dm");
  }
}
// Disassemble the instruction at *instr_ptr into the output buffer. // Disassemble the instruction at *instr_ptr into the output buffer.
int Decoder::InstructionDecode(byte* instr_ptr) { int Decoder::InstructionDecode(byte* instr_ptr) {
Instr* instr = Instr::At(instr_ptr); Instr* instr = Instr::At(instr_ptr);
......
This diff is collapsed.
...@@ -97,7 +97,6 @@ namespace arm { ...@@ -97,7 +97,6 @@ namespace arm {
class Simulator { class Simulator {
public: public:
friend class Debugger; friend class Debugger;
enum Register { enum Register {
no_reg = -1, no_reg = -1,
r0 = 0, r1, r2, r3, r4, r5, r6, r7, r0 = 0, r1, r2, r3, r4, r5, r6, r7,
...@@ -105,7 +104,15 @@ class Simulator { ...@@ -105,7 +104,15 @@ class Simulator {
num_registers, num_registers,
sp = 13, sp = 13,
lr = 14, lr = 14,
pc = 15 pc = 15,
s0 = 0, s1, s2, s3, s4, s5, s6, s7,
s8, s9, s10, s11, s12, s13, s14, s15,
s16, s17, s18, s19, s20, s21, s22, s23,
s24, s25, s26, s27, s28, s29, s30, s31,
num_s_registers = 32,
d0 = 0, d1, d2, d3, d4, d5, d6, d7,
d8, d9, d10, d11, d12, d13, d14, d15,
num_d_registers = 16
}; };
Simulator(); Simulator();
...@@ -121,6 +128,16 @@ class Simulator { ...@@ -121,6 +128,16 @@ class Simulator {
void set_register(int reg, int32_t value); void set_register(int reg, int32_t value);
int32_t get_register(int reg) const; int32_t get_register(int reg) const;
// Support for VFP.
// Accessors for the simulated VFP registers. The Register enum above names
// 32 single-precision registers (s0-s31) and 16 double-precision registers
// (d0-d15).
//
// Raw access to single-precision register |reg| as an unsigned 32-bit value.
void set_s_register(int reg, unsigned int value);
unsigned int get_s_register(int reg) const;
// Typed access, as indicated by the names: a double in a d register, a float
// in an s register, and a signed integer in an s register.
// NOTE(review): the definitions are not visible here - confirm whether these
// copy the bit pattern or perform a numeric conversion.
// NOTE(review): unlike get_s_register, the typed getters below are not
// declared const.
void set_d_register_from_double(int dreg, const double& dbl);
double get_double_from_d_register(int dreg);
// NOTE(review): the float parameter is named |dbl|, which looks like a
// leftover from the double variant above.
void set_s_register_from_float(int sreg, const float dbl);
float get_float_from_s_register(int sreg);
void set_s_register_from_sinteger(int reg, const int value);
int get_sinteger_from_s_register(int reg);
// Special case of set_register and get_register to access the raw PC value. // Special case of set_register and get_register to access the raw PC value.
void set_pc(int32_t value); void set_pc(int32_t value);
int32_t get_pc() const; int32_t get_pc() const;
...@@ -175,6 +192,10 @@ class Simulator { ...@@ -175,6 +192,10 @@ class Simulator {
int32_t right, int32_t right,
bool addition); bool addition);
// Support for VFP.
// Helpers for the simulated VFP status flags.
// NOTE(review): definitions are not visible here. Presumably
// Compute_FPSCR_Flags derives the FPSCR condition flags from comparing val1
// with val2, and Copy_FPSCR_to_APSR transfers them to the regular condition
// flags (the "vmrs APSR, FPSCR" instruction) - confirm against the
// implementation.
void Compute_FPSCR_Flags(double val1, double val2);
void Copy_FPSCR_to_APSR();
// Helper functions to decode common "addressing" modes // Helper functions to decode common "addressing" modes
int32_t GetShiftRm(Instr* instr, bool* carry_out); int32_t GetShiftRm(Instr* instr, bool* carry_out);
int32_t GetImm(Instr* instr, bool* carry_out); int32_t GetImm(Instr* instr, bool* carry_out);
...@@ -206,6 +227,10 @@ class Simulator { ...@@ -206,6 +227,10 @@ class Simulator {
void DecodeType7(Instr* instr); void DecodeType7(Instr* instr);
void DecodeUnconditional(Instr* instr); void DecodeUnconditional(Instr* instr);
// Support for VFP.
// Additional decode entry points for VFP instructions, alongside the
// DecodeType*/DecodeUnconditional methods declared above.
// NOTE(review): which instruction types are routed to each of these is
// decided in code not visible here.
void DecodeTypeVFP(Instr* instr);
void DecodeType6CoprocessorIns(Instr* instr);
// Executes one instruction. // Executes one instruction.
void InstructionDecode(Instr* instr); void InstructionDecode(Instr* instr);
...@@ -226,6 +251,20 @@ class Simulator { ...@@ -226,6 +251,20 @@ class Simulator {
bool c_flag_; bool c_flag_;
bool v_flag_; bool v_flag_;
// VFP architecture state.
// Storage for the VFP registers: 32 unsigned words. The literal 32 mirrors
// num_s_registers from the Register enum, as the inline comment notes.
// NOTE(review): presumably each d register is stored in two consecutive
// words of this array - confirm against the d register accessors.
unsigned int vfp_register[32/*num_s_registers*/];
// FPSCR condition flags (N, Z, C, V). These are separate members from the
// condition flags declared above (e.g. c_flag_ and v_flag_).
bool n_flag_FPSCR_;
bool z_flag_FPSCR_;
bool c_flag_FPSCR_;
bool v_flag_FPSCR_;
// VFP FP exception flags architecture state.
// One flag per exception kind named in the identifier: invalid operation,
// division by zero, overflow, underflow and inexact result.
// NOTE(review): where these are set and cleared is not visible here.
bool inv_op_vfp_flag_;
bool div_zero_vfp_flag_;
bool overflow_vfp_flag_;
bool underflow_vfp_flag_;
bool inexact_vfp_flag_;
// Simulator support. // Simulator support.
char* stack_; char* stack_;
bool pc_modified_; bool pc_modified_;
......
...@@ -114,6 +114,8 @@ DEFINE_bool(enable_rdtsc, true, ...@@ -114,6 +114,8 @@ DEFINE_bool(enable_rdtsc, true,
"enable use of RDTSC instruction if available") "enable use of RDTSC instruction if available")
DEFINE_bool(enable_sahf, true, DEFINE_bool(enable_sahf, true,
"enable use of SAHF instruction if available (X64 only)") "enable use of SAHF instruction if available (X64 only)")
// Flag controlling the use of VFP3 instructions; defaults to true.
// NOTE(review): per the description the instructions are only used "if
// available" - the availability check itself lives outside this definition.
DEFINE_bool(enable_vfp3, true,
"enable use of VFP3 instructions if available")
// bootstrapper.cc // bootstrapper.cc
DEFINE_string(expose_natives_as, NULL, "expose natives in global object") DEFINE_string(expose_natives_as, NULL, "expose natives in global object")
......
...@@ -89,6 +89,46 @@ double OS::nan_value() { ...@@ -89,6 +89,46 @@ double OS::nan_value() {
} }
// Helper for OS::fgrep_vfp. The last |matched| characters read from the file
// were equal to pattern[0..matched), and the character |next| (a value
// returned by fgetc) did not continue that match. Returns the length of the
// longest prefix of |pattern| that is a suffix of the text read so far, i.e.
// the number of pattern characters that are still matched once |next| has
// been consumed. This is computed by brute force instead of a precomputed
// table because the patterns searched for are only a few characters long.
static int FgrepVfpRestartLength(const char* pattern, int matched, int next) {
  for (int len = matched; len > 0; --len) {
    // The candidate prefix has to end with the character just read ...
    if (static_cast<unsigned char>(pattern[len - 1]) != next) continue;
    // ... and its first len - 1 characters have to equal the tail of the
    // previously matched text.
    const int shift = matched + 1 - len;
    int i = 0;
    while ((i < len - 1) && (pattern[i] == pattern[shift + i])) {
      ++i;
    }
    if (i == len - 1) return len;
  }
  return 0;
}


// Returns true if the file |file_name| can be opened and contains |string|.
// Returns false if the file cannot be opened, if |string| does not occur in
// it, or if |string| is NULL or empty (there is nothing to look for).
bool OS::fgrep_vfp(const char* file_name, const char* string) {
  // Simple detection of VFP at runtime for Linux.
  // It is based on /proc/cpuinfo, which reveals hardware configuration
  // to user-space applications.  According to ARM (mid 2009), no similar
  // facility is universally available on the ARM architectures,
  // so it's up to individual OSes to provide such.
  //
  // This is written as a straight shot one pass parser
  // and not using STL string and ifstream because,
  // on Linux, it's reading from a (non-mmap-able)
  // character special device.
  if (string == NULL || *string == '\0') return false;

  FILE* f = fopen(file_name, "r");
  if (f == NULL) return false;

  bool found = false;
  int matched = 0;  // Number of leading characters of |string| matched so far.
  int c;
  while (!found && (c = fgetc(f)) != EOF) {
    // fgetc returns the character as an unsigned char converted to int, so
    // the pattern character has to be converted the same way.
    if (c == static_cast<unsigned char>(string[matched])) {
      ++matched;
    } else {
      // Do not throw the partial match away: the character that broke it may
      // itself belong to an occurrence of |string| (e.g. "vfp" in "vvfp").
      matched = FgrepVfpRestartLength(string, matched, c);
    }
    found = (string[matched] == '\0');
  }

  fclose(f);
  return found;
}
int OS::ActivationFrameAlignment() { int OS::ActivationFrameAlignment() {
#ifdef V8_TARGET_ARCH_ARM #ifdef V8_TARGET_ARCH_ARM
// On EABI ARM targets this is required for fp correctness in the // On EABI ARM targets this is required for fp correctness in the
......
...@@ -250,6 +250,9 @@ class OS { ...@@ -250,6 +250,9 @@ class OS {
// Returns the double constant NAN // Returns the double constant NAN
static double nan_value(); static double nan_value();
// Support runtime detection of VFP3 on Linux platforms.
// Searches the file |file_name| for the text |string|. Returns true if the
// text is found, and false if it is not found or the file cannot be opened.
static bool fgrep_vfp(const char * file_name, const char * string);
// Returns the activation frame alignment constraint or zero if // Returns the activation frame alignment constraint or zero if
// the platform doesn't care. Guaranteed to be a power of two. // the platform doesn't care. Guaranteed to be a power of two.
static int ActivationFrameAlignment(); static int ActivationFrameAlignment();
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment