bool isEOF() const { return Ptr == End; }
- char peek() const { return isEOF() ? 0 : *Ptr; }
+ /// Return the character \p I positions past the cursor, or 0 when that
+ /// position lies at or beyond End.
+ char peek(unsigned I = 0) const {
+   if (End - Ptr <= I)
+     return 0;
+   return Ptr[I];
+ }
void advance() { ++Ptr; }
return C;
}
+/// Lex an integer literal beginning at \p C and store the result in \p Token.
+///
+/// The first character is consumed without being inspected; the dispatcher
+/// only calls this when that character is a digit, or a '-' that is followed
+/// by a digit. Every subsequent decimal digit is then consumed. The resulting
+/// token has kind MIToken::IntegerLiteral, carries the lexed text, and holds
+/// the APSInt built from that text.
+///
+/// \returns the cursor as advanced past the consumed characters.
+static Cursor lexIntegerLiteral(Cursor C, MIToken &Token) {
+  auto Range = C;
+  // Skip the leading digit or minus sign.
+  C.advance();
+  // isdigit() has undefined behaviour for negative arguments other than EOF,
+  // and plain char may be signed, so convert to unsigned char first.
+  while (isdigit(static_cast<unsigned char>(C.peek())))
+    C.advance();
+  StringRef StrVal = Range.upto(C);
+  Token = MIToken(MIToken::IntegerLiteral, StrVal, APSInt(StrVal));
+  return C;
+}
+
static MIToken::TokenKind symbolToken(char C) {
switch (C) {
case ',':
return lexIdentifier(C, Token).remaining();
if (Char == '%')
return lexPercent(C, Token).remaining();
+ if (isdigit(Char) || (Char == '-' && isdigit(C.peek(1))))
+ return lexIntegerLiteral(C, Token).remaining();
MIToken::TokenKind Kind = symbolToken(Char);
if (Kind != MIToken::Error)
return lexSymbol(C, Kind, Token).remaining();
#ifndef LLVM_LIB_CODEGEN_MIRPARSER_MILEXER_H
#define LLVM_LIB_CODEGEN_MIRPARSER_MILEXER_H
+#include "llvm/ADT/APSInt.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/STLExtras.h"
#include <functional>
// Identifier tokens
Identifier,
- NamedRegister
+ NamedRegister,
+
+ // Other tokens
+ IntegerLiteral
};
private:
TokenKind Kind;
StringRef Range;
+ APSInt IntVal;
public:
MIToken(TokenKind Kind, StringRef Range) : Kind(Kind), Range(Range) {}
+ /// Construct a token of kind \p Kind covering \p Range that also carries the
+ /// integer value \p IntVal.
+ MIToken(TokenKind Kind, StringRef Range, const APSInt &IntVal)
+     : Kind(Kind), Range(Range), IntVal(IntVal) {}
+
TokenKind kind() const { return Kind; }
bool isError() const { return Kind == Error; }
StringRef::iterator location() const { return Range.begin(); }
StringRef stringValue() const { return Range; }
+
+ /// Return the integer value stored in this token. Tokens built by the
+ /// two-argument constructor hold a default-constructed APSInt.
+ const APSInt &integerValue() const {
+   return IntVal;
+ }
};
/// Consume a single machine instruction token in the given source and return
bool parseRegister(unsigned &Reg);
bool parseRegisterOperand(MachineOperand &Dest, bool IsDef = false);
+ bool parseImmediateOperand(MachineOperand &Dest);
bool parseMachineOperand(MachineOperand &Dest);
private:
return false;
}
+/// Parse the current integer literal token as an immediate machine operand.
+///
+/// The token's value is written to \p Dest through MachineOperand::CreateImm,
+/// after which the parser advances to the next token.
+///
+/// \returns false on every path that returns; a literal needing more than 64
+/// signed bits terminates with a fatal error instead.
+bool MIParser::parseImmediateOperand(MachineOperand &Dest) {
+  assert(Token.is(MIToken::IntegerLiteral));
+  const APSInt &Int = Token.integerValue();
+  // The literal comes straight from the input text, so an oversized value is
+  // reachable; fail deterministically in every build mode rather than marking
+  // the path unreachable.
+  // TODO: Replace this with an error when we can parse CIMM Machine Operands.
+  if (Int.getMinSignedBits() > 64)
+    report_fatal_error("Can't parse large integer literals yet!");
+  Dest = MachineOperand::CreateImm(Int.getExtValue());
+  lex();
+  return false;
+}
+
bool MIParser::parseMachineOperand(MachineOperand &Dest) {
switch (Token.kind()) {
case MIToken::NamedRegister:
return parseRegisterOperand(Dest);
+ case MIToken::IntegerLiteral:
+ return parseImmediateOperand(Dest);
case MIToken::Error:
return true;
default:
printReg(Op.getReg(), OS, TRI);
// TODO: Print sub register.
break;
+ case MachineOperand::MO_Immediate:
+ OS << Op.getImm();
+ break;
default:
// TODO: Print the other machine operands.
llvm_unreachable("Can't print this machine operand at the moment");
--- /dev/null
+# RUN: llc -march=x86-64 -start-after branch-folder -stop-after branch-folder -o /dev/null %s | FileCheck %s
+# This test ensures that the MIR parser parses immediate machine operands.
+
+--- |
+
+ define i32 @foo() {
+ entry:
+ ret i32 42
+ }
+
+ define i32 @bar() {
+ entry:
+ ret i32 -11
+ }
+
+...
+---
+# CHECK: name: foo
+name: foo
+body:
+ - name: entry
+ instructions:
+ # CHECK: - '%eax = MOV32ri 42'
+ # CHECK-NEXT: - 'RETQ %eax'
+ - '%eax = MOV32ri 42'
+ - 'RETQ %eax'
+...
+---
+# CHECK: name: bar
+name: bar
+body:
+ - name: entry
+ instructions:
+ # CHECK: - '%eax = MOV32ri -11'
+ # CHECK-NEXT: - 'RETQ %eax'
+ - '%eax = MOV32ri -11'
+ - 'RETQ %eax'
+...