1 #include "../include/KaleidoscopeJIT.h"
2 #include "llvm/ADT/APFloat.h"
3 #include "llvm/ADT/STLExtras.h"
4 #include "llvm/IR/BasicBlock.h"
5 #include "llvm/IR/Constants.h"
6 #include "llvm/IR/DerivedTypes.h"
7 #include "llvm/IR/Function.h"
8 #include "llvm/IR/IRBuilder.h"
9 #include "llvm/IR/LLVMContext.h"
10 #include "llvm/IR/LegacyPassManager.h"
11 #include "llvm/IR/Module.h"
12 #include "llvm/IR/Type.h"
13 #include "llvm/IR/Verifier.h"
14 #include "llvm/Support/TargetSelect.h"
15 #include "llvm/Target/TargetMachine.h"
16 #include "llvm/Transforms/InstCombine/InstCombine.h"
17 #include "llvm/Transforms/Scalar.h"
18 #include "llvm/Transforms/Scalar/GVN.h"
31 using namespace llvm::orc
;
33 //===----------------------------------------------------------------------===//
35 //===----------------------------------------------------------------------===//
37 // The lexer returns tokens [0-255] if it is an unknown character, otherwise one
38 // of these for known things.
51 static std::string IdentifierStr
; // Filled in if tok_identifier
52 static double NumVal
; // Filled in if tok_number
54 /// gettok - Return the next token from standard input.
56 static int LastChar
= ' ';
58 // Skip any whitespace.
59 while (isspace(LastChar
))
62 if (isalpha(LastChar
)) { // identifier: [a-zA-Z][a-zA-Z0-9]*
63 IdentifierStr
= LastChar
;
64 while (isalnum((LastChar
= getchar())))
65 IdentifierStr
+= LastChar
;
67 if (IdentifierStr
== "def")
69 if (IdentifierStr
== "extern")
71 return tok_identifier
;
74 if (isdigit(LastChar
) || LastChar
== '.') { // Number: [0-9.]+
79 } while (isdigit(LastChar
) || LastChar
== '.');
81 NumVal
= strtod(NumStr
.c_str(), nullptr);
85 if (LastChar
== '#') {
86 // Comment until end of line.
89 while (LastChar
!= EOF
&& LastChar
!= '\n' && LastChar
!= '\r');
95 // Check for end of file. Don't eat the EOF.
99 // Otherwise, just return the character as its ascii value.
100 int ThisChar
= LastChar
;
101 LastChar
= getchar();
105 //===----------------------------------------------------------------------===//
106 // Abstract Syntax Tree (aka Parse Tree)
107 //===----------------------------------------------------------------------===//
111 /// ExprAST - Base class for all expression nodes.
114 virtual ~ExprAST() = default;
116 virtual Value
*codegen() = 0;
119 /// NumberExprAST - Expression class for numeric literals like "1.0".
120 class NumberExprAST
: public ExprAST
{
124 NumberExprAST(double Val
) : Val(Val
) {}
126 Value
*codegen() override
;
129 /// VariableExprAST - Expression class for referencing a variable, like "a".
130 class VariableExprAST
: public ExprAST
{
134 VariableExprAST(const std::string
&Name
) : Name(Name
) {}
136 Value
*codegen() override
;
139 /// BinaryExprAST - Expression class for a binary operator.
140 class BinaryExprAST
: public ExprAST
{
142 std::unique_ptr
<ExprAST
> LHS
, RHS
;
145 BinaryExprAST(char Op
, std::unique_ptr
<ExprAST
> LHS
,
146 std::unique_ptr
<ExprAST
> RHS
)
147 : Op(Op
), LHS(std::move(LHS
)), RHS(std::move(RHS
)) {}
149 Value
*codegen() override
;
152 /// CallExprAST - Expression class for function calls.
153 class CallExprAST
: public ExprAST
{
155 std::vector
<std::unique_ptr
<ExprAST
>> Args
;
158 CallExprAST(const std::string
&Callee
,
159 std::vector
<std::unique_ptr
<ExprAST
>> Args
)
160 : Callee(Callee
), Args(std::move(Args
)) {}
162 Value
*codegen() override
;
165 /// PrototypeAST - This class represents the "prototype" for a function,
166 /// which captures its name, and its argument names (thus implicitly the number
167 /// of arguments the function takes).
170 std::vector
<std::string
> Args
;
173 PrototypeAST(const std::string
&Name
, std::vector
<std::string
> Args
)
174 : Name(Name
), Args(std::move(Args
)) {}
177 const std::string
&getName() const { return Name
; }
180 /// FunctionAST - This class represents a function definition itself.
182 std::unique_ptr
<PrototypeAST
> Proto
;
183 std::unique_ptr
<ExprAST
> Body
;
186 FunctionAST(std::unique_ptr
<PrototypeAST
> Proto
,
187 std::unique_ptr
<ExprAST
> Body
)
188 : Proto(std::move(Proto
)), Body(std::move(Body
)) {}
193 } // end anonymous namespace
195 //===----------------------------------------------------------------------===//
197 //===----------------------------------------------------------------------===//
199 /// CurTok/getNextToken - Provide a simple token buffer. CurTok is the current
200 /// token the parser is looking at. getNextToken reads another token from the
201 /// lexer and updates CurTok with its results.
203 static int getNextToken() { return CurTok
= gettok(); }
205 /// BinopPrecedence - This holds the precedence for each binary operator that is
207 static std::map
<char, int> BinopPrecedence
;
209 /// GetTokPrecedence - Get the precedence of the pending binary operator token.
210 static int GetTokPrecedence() {
211 if (!isascii(CurTok
))
214 // Make sure it's a declared binop.
215 int TokPrec
= BinopPrecedence
[CurTok
];
221 /// LogError* - These are little helper functions for error handling.
222 std::unique_ptr
<ExprAST
> LogError(const char *Str
) {
223 fprintf(stderr
, "Error: %s\n", Str
);
227 std::unique_ptr
<PrototypeAST
> LogErrorP(const char *Str
) {
232 static std::unique_ptr
<ExprAST
> ParseExpression();
234 /// numberexpr ::= number
235 static std::unique_ptr
<ExprAST
> ParseNumberExpr() {
236 auto Result
= std::make_unique
<NumberExprAST
>(NumVal
);
237 getNextToken(); // consume the number
238 return std::move(Result
);
241 /// parenexpr ::= '(' expression ')'
242 static std::unique_ptr
<ExprAST
> ParseParenExpr() {
243 getNextToken(); // eat (.
244 auto V
= ParseExpression();
249 return LogError("expected ')'");
250 getNextToken(); // eat ).
256 /// ::= identifier '(' expression* ')'
257 static std::unique_ptr
<ExprAST
> ParseIdentifierExpr() {
258 std::string IdName
= IdentifierStr
;
260 getNextToken(); // eat identifier.
262 if (CurTok
!= '(') // Simple variable ref.
263 return std::make_unique
<VariableExprAST
>(IdName
);
266 getNextToken(); // eat (
267 std::vector
<std::unique_ptr
<ExprAST
>> Args
;
270 if (auto Arg
= ParseExpression())
271 Args
.push_back(std::move(Arg
));
279 return LogError("Expected ')' or ',' in argument list");
287 return std::make_unique
<CallExprAST
>(IdName
, std::move(Args
));
291 /// ::= identifierexpr
294 static std::unique_ptr
<ExprAST
> ParsePrimary() {
297 return LogError("unknown token when expecting an expression");
299 return ParseIdentifierExpr();
301 return ParseNumberExpr();
303 return ParseParenExpr();
308 /// ::= ('+' primary)*
309 static std::unique_ptr
<ExprAST
> ParseBinOpRHS(int ExprPrec
,
310 std::unique_ptr
<ExprAST
> LHS
) {
311 // If this is a binop, find its precedence.
313 int TokPrec
= GetTokPrecedence();
315 // If this is a binop that binds at least as tightly as the current binop,
316 // consume it, otherwise we are done.
317 if (TokPrec
< ExprPrec
)
320 // Okay, we know this is a binop.
322 getNextToken(); // eat binop
324 // Parse the primary expression after the binary operator.
325 auto RHS
= ParsePrimary();
329 // If BinOp binds less tightly with RHS than the operator after RHS, let
330 // the pending operator take RHS as its LHS.
331 int NextPrec
= GetTokPrecedence();
332 if (TokPrec
< NextPrec
) {
333 RHS
= ParseBinOpRHS(TokPrec
+ 1, std::move(RHS
));
340 std::make_unique
<BinaryExprAST
>(BinOp
, std::move(LHS
), std::move(RHS
));
345 /// ::= primary binoprhs
347 static std::unique_ptr
<ExprAST
> ParseExpression() {
348 auto LHS
= ParsePrimary();
352 return ParseBinOpRHS(0, std::move(LHS
));
356 /// ::= id '(' id* ')'
357 static std::unique_ptr
<PrototypeAST
> ParsePrototype() {
358 if (CurTok
!= tok_identifier
)
359 return LogErrorP("Expected function name in prototype");
361 std::string FnName
= IdentifierStr
;
365 return LogErrorP("Expected '(' in prototype");
367 std::vector
<std::string
> ArgNames
;
368 while (getNextToken() == tok_identifier
)
369 ArgNames
.push_back(IdentifierStr
);
371 return LogErrorP("Expected ')' in prototype");
374 getNextToken(); // eat ')'.
376 return std::make_unique
<PrototypeAST
>(FnName
, std::move(ArgNames
));
379 /// definition ::= 'def' prototype expression
380 static std::unique_ptr
<FunctionAST
> ParseDefinition() {
381 getNextToken(); // eat def.
382 auto Proto
= ParsePrototype();
386 if (auto E
= ParseExpression())
387 return std::make_unique
<FunctionAST
>(std::move(Proto
), std::move(E
));
391 /// toplevelexpr ::= expression
392 static std::unique_ptr
<FunctionAST
> ParseTopLevelExpr() {
393 if (auto E
= ParseExpression()) {
394 // Make an anonymous proto.
395 auto Proto
= std::make_unique
<PrototypeAST
>("__anon_expr",
396 std::vector
<std::string
>());
397 return std::make_unique
<FunctionAST
>(std::move(Proto
), std::move(E
));
402 /// external ::= 'extern' prototype
403 static std::unique_ptr
<PrototypeAST
> ParseExtern() {
404 getNextToken(); // eat extern.
405 return ParsePrototype();
408 //===----------------------------------------------------------------------===//
410 //===----------------------------------------------------------------------===//
412 static std::unique_ptr
<LLVMContext
> TheContext
;
413 static std::unique_ptr
<Module
> TheModule
;
414 static std::unique_ptr
<IRBuilder
<>> Builder
;
415 static std::map
<std::string
, Value
*> NamedValues
;
416 static std::unique_ptr
<legacy::FunctionPassManager
> TheFPM
;
417 static std::unique_ptr
<KaleidoscopeJIT
> TheJIT
;
418 static std::map
<std::string
, std::unique_ptr
<PrototypeAST
>> FunctionProtos
;
419 static ExitOnError ExitOnErr
;
421 Value
*LogErrorV(const char *Str
) {
426 Function
*getFunction(std::string Name
) {
427 // First, see if the function has already been added to the current module.
428 if (auto *F
= TheModule
->getFunction(Name
))
431 // If not, check whether we can codegen the declaration from some existing
433 auto FI
= FunctionProtos
.find(Name
);
434 if (FI
!= FunctionProtos
.end())
435 return FI
->second
->codegen();
437 // If no existing prototype exists, return null.
441 Value
*NumberExprAST::codegen() {
442 return ConstantFP::get(*TheContext
, APFloat(Val
));
445 Value
*VariableExprAST::codegen() {
446 // Look this variable up in the function.
447 Value
*V
= NamedValues
[Name
];
449 return LogErrorV("Unknown variable name");
453 Value
*BinaryExprAST::codegen() {
454 Value
*L
= LHS
->codegen();
455 Value
*R
= RHS
->codegen();
461 return Builder
->CreateFAdd(L
, R
, "addtmp");
463 return Builder
->CreateFSub(L
, R
, "subtmp");
465 return Builder
->CreateFMul(L
, R
, "multmp");
467 L
= Builder
->CreateFCmpULT(L
, R
, "cmptmp");
468 // Convert bool 0/1 to double 0.0 or 1.0
469 return Builder
->CreateUIToFP(L
, Type::getDoubleTy(*TheContext
), "booltmp");
471 return LogErrorV("invalid binary operator");
475 Value
*CallExprAST::codegen() {
476 // Look up the name in the global module table.
477 Function
*CalleeF
= getFunction(Callee
);
479 return LogErrorV("Unknown function referenced");
481 // If argument mismatch error.
482 if (CalleeF
->arg_size() != Args
.size())
483 return LogErrorV("Incorrect # arguments passed");
485 std::vector
<Value
*> ArgsV
;
486 for (unsigned i
= 0, e
= Args
.size(); i
!= e
; ++i
) {
487 ArgsV
.push_back(Args
[i
]->codegen());
492 return Builder
->CreateCall(CalleeF
, ArgsV
, "calltmp");
495 Function
*PrototypeAST::codegen() {
496 // Make the function type: double(double,double) etc.
497 std::vector
<Type
*> Doubles(Args
.size(), Type::getDoubleTy(*TheContext
));
499 FunctionType::get(Type::getDoubleTy(*TheContext
), Doubles
, false);
502 Function::Create(FT
, Function::ExternalLinkage
, Name
, TheModule
.get());
504 // Set names for all arguments.
506 for (auto &Arg
: F
->args())
507 Arg
.setName(Args
[Idx
++]);
512 Function
*FunctionAST::codegen() {
513 // Transfer ownership of the prototype to the FunctionProtos map, but keep a
514 // reference to it for use below.
516 FunctionProtos
[Proto
->getName()] = std::move(Proto
);
517 Function
*TheFunction
= getFunction(P
.getName());
521 // Create a new basic block to start insertion into.
522 BasicBlock
*BB
= BasicBlock::Create(*TheContext
, "entry", TheFunction
);
523 Builder
->SetInsertPoint(BB
);
525 // Record the function arguments in the NamedValues map.
527 for (auto &Arg
: TheFunction
->args())
528 NamedValues
[std::string(Arg
.getName())] = &Arg
;
530 if (Value
*RetVal
= Body
->codegen()) {
531 // Finish off the function.
532 Builder
->CreateRet(RetVal
);
534 // Validate the generated code, checking for consistency.
535 verifyFunction(*TheFunction
);
537 // Run the optimizer on the function.
538 TheFPM
->run(*TheFunction
);
543 // Error reading body, remove function.
544 TheFunction
->eraseFromParent();
548 //===----------------------------------------------------------------------===//
549 // Top-Level parsing and JIT Driver
550 //===----------------------------------------------------------------------===//
552 static void InitializeModuleAndPassManager() {
553 // Open a new context and module.
554 TheContext
= std::make_unique
<LLVMContext
>();
555 TheModule
= std::make_unique
<Module
>("my cool jit", *TheContext
);
556 TheModule
->setDataLayout(TheJIT
->getDataLayout());
558 // Create a new builder for the module.
559 Builder
= std::make_unique
<IRBuilder
<>>(*TheContext
);
561 // Create a new pass manager attached to it.
562 TheFPM
= std::make_unique
<legacy::FunctionPassManager
>(TheModule
.get());
564 // Do simple "peephole" optimizations and bit-twiddling optzns.
565 TheFPM
->add(createInstructionCombiningPass());
566 // Reassociate expressions.
567 TheFPM
->add(createReassociatePass());
568 // Eliminate Common SubExpressions.
569 TheFPM
->add(createGVNPass());
570 // Simplify the control flow graph (deleting unreachable blocks, etc).
571 TheFPM
->add(createCFGSimplificationPass());
573 TheFPM
->doInitialization();
576 static void HandleDefinition() {
577 if (auto FnAST
= ParseDefinition()) {
578 if (auto *FnIR
= FnAST
->codegen()) {
579 fprintf(stderr
, "Read function definition:");
581 fprintf(stderr
, "\n");
582 ExitOnErr(TheJIT
->addModule(
583 ThreadSafeModule(std::move(TheModule
), std::move(TheContext
))));
584 InitializeModuleAndPassManager();
587 // Skip token for error recovery.
592 static void HandleExtern() {
593 if (auto ProtoAST
= ParseExtern()) {
594 if (auto *FnIR
= ProtoAST
->codegen()) {
595 fprintf(stderr
, "Read extern: ");
597 fprintf(stderr
, "\n");
598 FunctionProtos
[ProtoAST
->getName()] = std::move(ProtoAST
);
601 // Skip token for error recovery.
606 static void HandleTopLevelExpression() {
607 // Evaluate a top-level expression into an anonymous function.
608 if (auto FnAST
= ParseTopLevelExpr()) {
609 if (FnAST
->codegen()) {
610 // Create a ResourceTracker to track JIT'd memory allocated to our
611 // anonymous expression -- that way we can free it after executing.
612 auto RT
= TheJIT
->getMainJITDylib().createResourceTracker();
614 auto TSM
= ThreadSafeModule(std::move(TheModule
), std::move(TheContext
));
615 ExitOnErr(TheJIT
->addModule(std::move(TSM
), RT
));
616 InitializeModuleAndPassManager();
618 // Search the JIT for the __anon_expr symbol.
619 auto ExprSymbol
= ExitOnErr(TheJIT
->lookup("__anon_expr"));
621 // Get the symbol's address and cast it to the right type (takes no
622 // arguments, returns a double) so we can call it as a native function.
623 double (*FP
)() = (double (*)())(intptr_t)ExprSymbol
.getAddress();
624 fprintf(stderr
, "Evaluated to %f\n", FP());
626 // Delete the anonymous expression module from the JIT.
627 ExitOnErr(RT
->remove());
630 // Skip token for error recovery.
635 /// top ::= definition | external | expression | ';'
636 static void MainLoop() {
638 fprintf(stderr
, "ready> ");
642 case ';': // ignore top-level semicolons.
652 HandleTopLevelExpression();
658 //===----------------------------------------------------------------------===//
659 // "Library" functions that can be "extern'd" from user code.
660 //===----------------------------------------------------------------------===//
663 #define DLLEXPORT __declspec(dllexport)
668 /// putchard - putchar that takes a double and returns 0.
669 extern "C" DLLEXPORT
double putchard(double X
) {
670 fputc((char)X
, stderr
);
674 /// printd - printf that takes a double prints it as "%f\n", returning 0.
675 extern "C" DLLEXPORT
double printd(double X
) {
676 fprintf(stderr
, "%f\n", X
);
680 //===----------------------------------------------------------------------===//
682 //===----------------------------------------------------------------------===//
685 InitializeNativeTarget();
686 InitializeNativeTargetAsmPrinter();
687 InitializeNativeTargetAsmParser();
689 // Install standard binary operators.
690 // 1 is lowest precedence.
691 BinopPrecedence
['<'] = 10;
692 BinopPrecedence
['+'] = 20;
693 BinopPrecedence
['-'] = 20;
694 BinopPrecedence
['*'] = 40; // highest.
696 // Prime the first token.
697 fprintf(stderr
, "ready> ");
700 TheJIT
= ExitOnErr(KaleidoscopeJIT::Create());
702 InitializeModuleAndPassManager();
704 // Run the main "interpreter loop" now.