NEON use vmov.i32 to splat some f32 values into vectors.

author Jim Grosbach <grosbach@apple.com>

Fri, 20 Jan 2012 18:09:51 +0000 (18:09 +0000)

committer Jim Grosbach <grosbach@apple.com>

Fri, 20 Jan 2012 18:09:51 +0000 (18:09 +0000)
author Jim Grosbach <grosbach@apple.com>
Fri, 20 Jan 2012 18:09:51 +0000 (18:09 +0000)
committer Jim Grosbach <grosbach@apple.com>
Fri, 20 Jan 2012 18:09:51 +0000 (18:09 +0000)
diff --git a/lib/Target/ARM/ARMInstrNEON.td b/lib/Target/ARM/ARMInstrNEON.td

index 1e3410221e1f83081da3574f23b2756551fc15a9..d940255378336afe0ff95a249a9719391063ac78 100644 (file)
--- a/lib/Target/ARM/ARMInstrNEON.td
+++ b/lib/Target/ARM/ARMInstrNEON.td
@@ -6088,3 +6088,12 @@ def : NEONMnemonicAlias<"vswpq", "vswp">;
  
  def : NEONMnemonicAlias<"vrecpeq.f32", "vrecpe.f32">;
  def : NEONMnemonicAlias<"vrecpeq.u32", "vrecpe.u32">;
+
+
+// Alias for loading floating point immediates that aren't representable
+// using the vmov.f32 encoding but the bitpattern is representable using
+// the .i32 encoding.
+def : NEONInstAlias<"vmov${p}.f32 $Vd, $imm",
+                     (VMOVv4i32 QPR:$Vd, nImmVMOVI32:$imm, pred:$p)>;
+def : NEONInstAlias<"vmov${p}.f32 $Vd, $imm",
+                     (VMOVv2i32 DPR:$Vd, nImmVMOVI32:$imm, pred:$p)>;
diff --git a/lib/Target/ARM/AsmParser/ARMAsmParser.cpp b/lib/Target/ARM/AsmParser/ARMAsmParser.cpp

index c8e733df2d2f17443fe8ec627fb2c62a1b8322b5..0c6098b5bc2033bfb2b92be82aedf8487b3de056 100644 (file)
--- a/lib/Target/ARM/AsmParser/ARMAsmParser.cpp
+++ b/lib/Target/ARM/AsmParser/ARMAsmParser.cpp
@@ -270,7 +270,6 @@ class ARMOperand : public MCParsedAsmOperand {
      k_CoprocReg,
      k_CoprocOption,
      k_Immediate,
-    k_FPImmediate,
      k_MemBarrierOpt,
      k_Memory,
      k_PostIndexRegister,
@@ -349,10 +348,6 @@ class ARMOperand : public MCParsedAsmOperand {
        const MCExpr *Val;
      } Imm;
  
-    struct {
-      unsigned Val;       // encoded 8-bit representation
-    } FPImm;
-
      /// Combined record for all forms of ARM address expressions.
      struct {
        unsigned BaseRegNum;
@@ -438,9 +433,6 @@ public:
      case k_Immediate:
        Imm = o.Imm;
        break;
-    case k_FPImmediate:
-      FPImm = o.FPImm;
-      break;
      case k_MemBarrierOpt:
        MBOpt = o.MBOpt;
        break;
@@ -513,11 +505,6 @@ public:
      return Imm.Val;
    }
  
-  unsigned getFPImm() const {
-    assert(Kind == k_FPImmediate && "Invalid access!");
-    return FPImm.Val;
-  }
-
    unsigned getVectorIndex() const {
      assert(Kind == k_VectorIndex && "Invalid access!");
      return VectorIndex.Val;
@@ -546,7 +533,13 @@ public:
    bool isITMask() const { return Kind == k_ITCondMask; }
    bool isITCondCode() const { return Kind == k_CondCode; }
    bool isImm() const { return Kind == k_Immediate; }
-  bool isFPImm() const { return Kind == k_FPImmediate; }
+  bool isFPImm() const {
+    if (!isImm()) return false;
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    if (!CE) return false;
+    int Val = ARM_AM::getFP32Imm(APInt(32, CE->getValue()));
+    return Val != -1;
+  }
    bool isFBits16() const {
      if (!isImm()) return false;
      const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
@@ -1394,7 +1387,9 @@ public:
  
    void addFPImmOperands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
-    Inst.addOperand(MCOperand::CreateImm(getFPImm()));
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    int Val = ARM_AM::getFP32Imm(APInt(32, CE->getValue()));
+    Inst.addOperand(MCOperand::CreateImm(Val));
    }
  
    void addImm8s4Operands(MCInst &Inst, unsigned N) const {
@@ -2098,14 +2093,6 @@ public:
      return Op;
    }
  
-  static ARMOperand *CreateFPImm(unsigned Val, SMLoc S, MCContext &Ctx) {
-    ARMOperand *Op = new ARMOperand(k_FPImmediate);
-    Op->FPImm.Val = Val;
-    Op->StartLoc = S;
-    Op->EndLoc = S;
-    return Op;
-  }
-
    static ARMOperand *CreateMem(unsigned BaseRegNum,
                                 const MCConstantExpr *OffsetImm,
                                 unsigned OffsetRegNum,
@@ -2170,10 +2157,6 @@ public:
  
  void ARMOperand::print(raw_ostream &OS) const {
    switch (Kind) {
-  case k_FPImmediate:
-    OS << "<fpimm " << getFPImm() << "(" << ARM_AM::getFPImmFloat(getFPImm())
-       << ") >";
-    break;
    case k_CondCode:
      OS << "<ARMCC::" << ARMCondCodeToString(getCondCode()) << ">";
      break;
@@ -4247,6 +4230,15 @@ bool ARMAsmParser::parseMemRegOffsetShift(ARM_AM::ShiftOpc &St,
  /// parseFPImm - A floating point immediate expression operand.
  ARMAsmParser::OperandMatchResultTy ARMAsmParser::
  parseFPImm(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
+  // Anything that can accept a floating point constant as an operand
+  // needs to go through here, as the regular ParseExpression is
+  // integer only.
+  //
+  // This routine still creates a generic Immediate operand, containing
+  // a bitcast of the 64-bit floating point value. The various operands
+  // that accept floats can check whether the value is valid for them
+  // via the standard is*() predicates.
+
    SMLoc S = Parser.getTok().getLoc();
  
    if (Parser.getTok().isNot(AsmToken::Hash) &&
@@ -4279,19 +4271,18 @@ parseFPImm(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    const AsmToken &Tok = Parser.getTok();
    SMLoc Loc = Tok.getLoc();
    if (Tok.is(AsmToken::Real)) {
-    APFloat RealVal(APFloat::IEEEdouble, Tok.getString());
+    APFloat RealVal(APFloat::IEEEsingle, Tok.getString());
      uint64_t IntVal = RealVal.bitcastToAPInt().getZExtValue();
      // If we had a '-' in front, toggle the sign bit.
-    IntVal ^= (uint64_t)isNegative << 63;
-    int Val = ARM_AM::getFP64Imm(APInt(64, IntVal));
+    IntVal ^= (uint64_t)isNegative << 31;
      Parser.Lex(); // Eat the token.
-    if (Val == -1) {
-      Error(Loc, "floating point value out of range");
-      return MatchOperand_ParseFail;
-    }
-    Operands.push_back(ARMOperand::CreateFPImm(Val, S, getContext()));
+    Operands.push_back(ARMOperand::CreateImm(
+          MCConstantExpr::Create(IntVal, getContext()),
+          S, Parser.getTok().getLoc()));
      return MatchOperand_Success;
    }
+  // Also handle plain integers. Instructions which allow floating point
+  // immediates also allow a raw encoded 8-bit value.
    if (Tok.is(AsmToken::Integer)) {
      int64_t Val = Tok.getIntVal();
      Parser.Lex(); // Eat the token.
@@ -4299,13 +4290,18 @@ parseFPImm(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
        Error(Loc, "encoded floating point value out of range");
        return MatchOperand_ParseFail;
      }
-    Operands.push_back(ARMOperand::CreateFPImm(Val, S, getContext()));
+    double RealVal = ARM_AM::getFPImmFloat(Val);
+    Val = APFloat(APFloat::IEEEdouble, RealVal).bitcastToAPInt().getZExtValue();
+    Operands.push_back(ARMOperand::CreateImm(
+        MCConstantExpr::Create(Val, getContext()), S,
+        Parser.getTok().getLoc()));
      return MatchOperand_Success;
    }
  
    Error(Loc, "invalid floating point immediate");
    return MatchOperand_ParseFail;
  }
+
  /// Parse a arm instruction operand.  For now this parses the operand regardless
  /// of the mnemonic.
  bool ARMAsmParser::parseOperand(SmallVectorImpl<MCParsedAsmOperand*> &Operands,
diff --git a/test/MC/ARM/simple-fp-encoding.s b/test/MC/ARM/simple-fp-encoding.s

index a008d9b170dd66be85146e2fff1c653fe1bbfad1..a40e02bcaaed1ca74a412325b9524c6f71a269bf 100644 (file)
--- a/test/MC/ARM/simple-fp-encoding.s
+++ b/test/MC/ARM/simple-fp-encoding.s
@@ -311,3 +311,11 @@
  @ CHECK: vcvt.f64.s32  d0, d0, #32     @ encoding: [0xc0,0x0b,0xba,0xee]
  @ CHECK: vcvt.f32.u16  s0, s0, #1      @ encoding: [0x67,0x0a,0xbb,0xee]
  @ CHECK: vcvt.f64.s16  d0, d0, #16     @ encoding: [0x40,0x0b,0xba,0xee]
+
+
+@ Use NEON to load some f32 immediates that don't fit the f8 representation.
+        vmov.f32 d4, #0.0
+        vmov.f32 d4, #32.0
+
+@ CHECK: vmov.i32      d4, #0x0        @ encoding: [0x10,0x40,0x80,0xf2]
+@ CHECK: vmov.i32      d4, #0x42000000 @ encoding: [0x12,0x46,0x84,0xf2]
author	Jim Grosbach <grosbach@apple.com>
	Fri, 20 Jan 2012 18:09:51 +0000 (18:09 +0000)
committer	Jim Grosbach <grosbach@apple.com>
	Fri, 20 Jan 2012 18:09:51 +0000 (18:09 +0000)
lib/Target/ARM/ARMInstrNEON.td		patch \| blob \| history
lib/Target/ARM/AsmParser/ARMAsmParser.cpp		patch \| blob \| history
test/MC/ARM/simple-fp-encoding.s		patch \| blob \| history