MC/AsmParser: Report .stabs directive as unsupported.

[oota-llvm.git] / lib / MC / MCParser / AsmLexer.cpp
diff --git a/lib/MC/MCParser/AsmLexer.cpp b/lib/MC/MCParser/AsmLexer.cpp

index 1cbe09aa6c7fa191ef34746dbd649a1791865cd9..7ca1cccc98c21fd4c870e08fbe3cfa79dc5f9b84 100644 (file)
--- a/lib/MC/MCParser/AsmLexer.cpp
+++ b/lib/MC/MCParser/AsmLexer.cpp
@@ -23,7 +23,6 @@ using namespace llvm;
  AsmLexer::AsmLexer(const MCAsmInfo &_MAI) : MAI(_MAI)  {
    CurBuf = NULL;
    CurPtr = NULL;
-  TokStart = 0;
  }
  
  AsmLexer::~AsmLexer() {
@@ -40,10 +39,6 @@ void AsmLexer::setBuffer(const MemoryBuffer *buf, const char *ptr) {
    TokStart = 0;
  }
  
-SMLoc AsmLexer::getLoc() const {
-  return SMLoc::getFromPointer(TokStart);
-}
-
  /// ReturnError - Set the error to the specified string at the specified
  /// location.  This is defined to always return AsmToken::Error.
  AsmToken AsmLexer::ReturnError(const char *Loc, const std::string &Msg) {
@@ -69,10 +64,46 @@ int AsmLexer::getNextChar() {
    }
  }
  
+/// LexFloatLiteral: [0-9]*[.][0-9]*([eE][+-]?[0-9]*)?
+///
+/// The leading integral digit sequence and dot should have already been
+/// consumed, some or all of the fractional digit sequence *can* have been
+/// consumed.
+AsmToken AsmLexer::LexFloatLiteral() {
+  // Skip the fractional digit sequence.
+  while (isdigit(*CurPtr))
+    ++CurPtr;
+
+  // Check for exponent; we intentionally accept a slighlty wider set of
+  // literals here and rely on the upstream client to reject invalid ones (e.g.,
+  // "1e+").
+  if (*CurPtr == 'e' || *CurPtr == 'E') {
+    ++CurPtr;
+    if (*CurPtr == '-' || *CurPtr == '+')
+      ++CurPtr;
+    while (isdigit(*CurPtr))
+      ++CurPtr;
+  }
+
+  return AsmToken(AsmToken::Real,
+                  StringRef(TokStart, CurPtr - TokStart));
+}
+
  /// LexIdentifier: [a-zA-Z_.][a-zA-Z0-9_$.@]*
+static bool IsIdentifierChar(char c) {
+  return isalnum(c) || c == '_' || c == '$' || c == '.' || c == '@';
+}
  AsmToken AsmLexer::LexIdentifier() {
-  while (isalnum(*CurPtr) || *CurPtr == '_' || *CurPtr == '$' ||
-         *CurPtr == '.' || *CurPtr == '@')
+  // Check for floating point literals.
+  if (CurPtr[-1] == '.' && isdigit(*CurPtr)) {
+    // Disambiguate a .1243foo identifier from a floating literal.
+    while (isdigit(*CurPtr))
+      ++CurPtr;
+    if (*CurPtr == 'e' || *CurPtr == 'E' || !IsIdentifierChar(*CurPtr))
+      return LexFloatLiteral();
+  }
+
+  while (IsIdentifierChar(*CurPtr))
      ++CurPtr;
    
    // Handle . as a special case.
@@ -122,6 +153,12 @@ AsmToken AsmLexer::LexLineComment() {
    return AsmToken(AsmToken::EndOfStatement, StringRef(CurPtr, 0));
  }
  
+static void SkipIgnoredIntegerSuffix(const char *&CurPtr) {
+  if (CurPtr[0] == 'L' && CurPtr[1] == 'L')
+    CurPtr += 2;
+  if (CurPtr[0] == 'U' && CurPtr[1] == 'L' && CurPtr[2] == 'L')
+    CurPtr += 3;
+}
  
  /// LexDigit: First character is [0-9].
  ///   Local Label: [0-9][:]
@@ -130,15 +167,20 @@ AsmToken AsmLexer::LexLineComment() {
  ///   Octal integer: 0[0-7]+
  ///   Hex integer: 0x[0-9a-fA-F]+
  ///   Decimal integer: [1-9][0-9]*
-/// TODO: FP literal.
  AsmToken AsmLexer::LexDigit() {
    // Decimal integer: [1-9][0-9]*
-  if (CurPtr[-1] != '0') {
+  if (CurPtr[-1] != '0' || CurPtr[0] == '.') {
      while (isdigit(*CurPtr))
        ++CurPtr;
-    
+
+    // Check for floating point literals.
+    if (*CurPtr == '.' || *CurPtr == 'e') {
+      ++CurPtr;
+      return LexFloatLiteral();
+    }
+
      StringRef Result(TokStart, CurPtr - TokStart);
-    
+
      long long Value;
      if (Result.getAsInteger(10, Value)) {
        // We have to handle minint_as_a_positive_value specially, because
@@ -148,6 +190,11 @@ AsmToken AsmLexer::LexDigit() {
        else
          return ReturnError(TokStart, "Invalid decimal number");
      }
+    
+    // The darwin/x86 (and x86-64) assembler accepts and ignores ULL and LL
+    // suffixes on integer literals.
+    SkipIgnoredIntegerSuffix(CurPtr);
+    
      return AsmToken(AsmToken::Integer, Result, Value);
    }
    
@@ -170,9 +217,13 @@ AsmToken AsmLexer::LexDigit() {
      StringRef Result(TokStart, CurPtr - TokStart);
      
      long long Value;
-    if (Result.getAsInteger(2, Value))
+    if (Result.substr(2).getAsInteger(2, Value))
        return ReturnError(TokStart, "Invalid binary number");
      
+    // The darwin/x86 (and x86-64) assembler accepts and ignores ULL and LL
+    // suffixes on integer literals.
+    SkipIgnoredIntegerSuffix(CurPtr);
+    
      return AsmToken(AsmToken::Integer, Result, Value);
    }
   
@@ -190,6 +241,10 @@ AsmToken AsmLexer::LexDigit() {
      if (StringRef(TokStart, CurPtr - TokStart).getAsInteger(0, Result))
        return ReturnError(TokStart, "Invalid hexadecimal number");
        
+    // The darwin/x86 (and x86-64) assembler accepts and ignores ULL and LL
+    // suffixes on integer literals.
+    SkipIgnoredIntegerSuffix(CurPtr);
+    
      return AsmToken(AsmToken::Integer, StringRef(TokStart, CurPtr - TokStart),
                      (int64_t)Result);
    }
@@ -203,6 +258,10 @@ AsmToken AsmLexer::LexDigit() {
    if (Result.getAsInteger(8, Value))
      return ReturnError(TokStart, "Invalid octal number");
    
+  // The darwin/x86 (and x86-64) assembler accepts and ignores ULL and LL
+  // suffixes on integer literals.
+  SkipIgnoredIntegerSuffix(CurPtr);
+  
    return AsmToken(AsmToken::Integer, Result, Value);
  }
  
@@ -229,7 +288,7 @@ StringRef AsmLexer::LexUntilEndOfStatement() {
    TokStart = CurPtr;
  
    while (!isAtStartOfComment(*CurPtr) && // Start of line comment.
-         *CurPtr != ';' &&  // End of statement marker.
+          *CurPtr != ';' &&  // End of statement marker.
           *CurPtr != '\n' &&
           *CurPtr != '\r' &&
           (*CurPtr != 0 || CurPtr != CurBuf->getBufferEnd())) {