#include "llvm/ADT/APFloat.h"
#include "llvm/ADT/Optional.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/IR/BasicBlock.h"
#include "llvm/IR/Constants.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/Function.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/LLVMContext.h"
#include "llvm/IR/LegacyPassManager.h"
#include "llvm/IR/Module.h"
#include "llvm/IR/Type.h"
#include "llvm/IR/Verifier.h"
#include "llvm/Support/FileSystem.h"
#include "llvm/Support/Host.h"
#include "llvm/Support/raw_ostream.h"
#include "llvm/Support/TargetRegistry.h"
#include "llvm/Support/TargetSelect.h"
#include "llvm/Target/TargetMachine.h"
#include "llvm/Target/TargetOptions.h"
#include <cassert>
#include <cctype>
#include <cstdio>
#include <cstdlib>
#include <map>
#include <memory>
#include <string>
#include <system_error>
#include <utility>
#include <vector>

using namespace llvm;
using namespace llvm::sys;
//===----------------------------------------------------------------------===//
// Lexer
//===----------------------------------------------------------------------===//

// The lexer returns tokens [0-255] if it is an unknown character, otherwise one
// of these for known things.
// NOTE(review): the enumerator list was missing from this listing. The names
// follow the uses in the rest of the file; the numeric values are assumed
// (any distinct negative values work) -- confirm against the upstream source.
enum Token {
  tok_eof = -1,

  // commands
  tok_def = -2,
  tok_extern = -3,

  // primary
  tok_identifier = -4,
  tok_number = -5,

  // control
  tok_if = -6,
  tok_then = -7,
  tok_else = -8,
  tok_for = -9,
  tok_in = -10,

  // operators
  tok_binary = -11,
  tok_unary = -12,

  // var definition
  tok_var = -13
};

static std::string IdentifierStr; // Filled in if tok_identifier
static double NumVal;             // Filled in if tok_number

/// gettok - Return the next token from standard input.
///
/// Returns one of the Token enumerators for keywords, identifiers, numbers and
/// end of file, or the raw character value for anything else. One character of
/// lookahead is kept in a function-local static between calls.
static int gettok() {
  static int LastChar = ' ';

  // Skip any whitespace.
  while (isspace(LastChar))
    LastChar = getchar();

  if (isalpha(LastChar)) { // identifier: [a-zA-Z][a-zA-Z0-9]*
    IdentifierStr = static_cast<char>(LastChar);
    while (isalnum((LastChar = getchar())))
      IdentifierStr += static_cast<char>(LastChar);

    // Reserved words map to their own tokens; everything else is a plain
    // identifier.
    static const struct {
      const char *Spelling;
      int Tok;
    } Keywords[] = {
        {"def", tok_def},       {"extern", tok_extern}, {"if", tok_if},
        {"then", tok_then},     {"else", tok_else},     {"for", tok_for},
        {"in", tok_in},         {"binary", tok_binary}, {"unary", tok_unary},
        {"var", tok_var},
    };
    for (const auto &KW : Keywords)
      if (IdentifierStr == KW.Spelling)
        return KW.Tok;
    return tok_identifier;
  }

  if (isdigit(LastChar) || LastChar == '.') { // Number: [0-9.]+
    std::string NumStr;
    do {
      NumStr += static_cast<char>(LastChar);
      LastChar = getchar();
    } while (isdigit(LastChar) || LastChar == '.');

    // strtod converts the longest valid prefix; trailing characters such as a
    // second '.' are silently ignored.
    NumVal = strtod(NumStr.c_str(), nullptr);
    return tok_number;
  }

  if (LastChar == '#') {
    // Comment until end of line.
    do
      LastChar = getchar();
    while (LastChar != EOF && LastChar != '\n' && LastChar != '\r');

    if (LastChar != EOF)
      return gettok();
  }

  // Check for end of file.  Don't eat the EOF.
  if (LastChar == EOF)
    return tok_eof;

  // Otherwise, just return the character as its ascii value.
  int ThisChar = LastChar;
  LastChar = getchar();
  return ThisChar;
}
139 //===----------------------------------------------------------------------===//
140 // Abstract Syntax Tree (aka Parse Tree)
141 //===----------------------------------------------------------------------===//
145 /// ExprAST - Base class for all expression nodes.
148 virtual ~ExprAST() = default;
150 virtual Value
*codegen() = 0;
153 /// NumberExprAST - Expression class for numeric literals like "1.0".
154 class NumberExprAST
: public ExprAST
{
158 NumberExprAST(double Val
) : Val(Val
) {}
160 Value
*codegen() override
;
163 /// VariableExprAST - Expression class for referencing a variable, like "a".
164 class VariableExprAST
: public ExprAST
{
168 VariableExprAST(const std::string
&Name
) : Name(Name
) {}
170 Value
*codegen() override
;
171 const std::string
&getName() const { return Name
; }
174 /// UnaryExprAST - Expression class for a unary operator.
175 class UnaryExprAST
: public ExprAST
{
177 std::unique_ptr
<ExprAST
> Operand
;
180 UnaryExprAST(char Opcode
, std::unique_ptr
<ExprAST
> Operand
)
181 : Opcode(Opcode
), Operand(std::move(Operand
)) {}
183 Value
*codegen() override
;
186 /// BinaryExprAST - Expression class for a binary operator.
187 class BinaryExprAST
: public ExprAST
{
189 std::unique_ptr
<ExprAST
> LHS
, RHS
;
192 BinaryExprAST(char Op
, std::unique_ptr
<ExprAST
> LHS
,
193 std::unique_ptr
<ExprAST
> RHS
)
194 : Op(Op
), LHS(std::move(LHS
)), RHS(std::move(RHS
)) {}
196 Value
*codegen() override
;
199 /// CallExprAST - Expression class for function calls.
200 class CallExprAST
: public ExprAST
{
202 std::vector
<std::unique_ptr
<ExprAST
>> Args
;
205 CallExprAST(const std::string
&Callee
,
206 std::vector
<std::unique_ptr
<ExprAST
>> Args
)
207 : Callee(Callee
), Args(std::move(Args
)) {}
209 Value
*codegen() override
;
212 /// IfExprAST - Expression class for if/then/else.
213 class IfExprAST
: public ExprAST
{
214 std::unique_ptr
<ExprAST
> Cond
, Then
, Else
;
217 IfExprAST(std::unique_ptr
<ExprAST
> Cond
, std::unique_ptr
<ExprAST
> Then
,
218 std::unique_ptr
<ExprAST
> Else
)
219 : Cond(std::move(Cond
)), Then(std::move(Then
)), Else(std::move(Else
)) {}
221 Value
*codegen() override
;
224 /// ForExprAST - Expression class for for/in.
225 class ForExprAST
: public ExprAST
{
227 std::unique_ptr
<ExprAST
> Start
, End
, Step
, Body
;
230 ForExprAST(const std::string
&VarName
, std::unique_ptr
<ExprAST
> Start
,
231 std::unique_ptr
<ExprAST
> End
, std::unique_ptr
<ExprAST
> Step
,
232 std::unique_ptr
<ExprAST
> Body
)
233 : VarName(VarName
), Start(std::move(Start
)), End(std::move(End
)),
234 Step(std::move(Step
)), Body(std::move(Body
)) {}
236 Value
*codegen() override
;
239 /// VarExprAST - Expression class for var/in
240 class VarExprAST
: public ExprAST
{
241 std::vector
<std::pair
<std::string
, std::unique_ptr
<ExprAST
>>> VarNames
;
242 std::unique_ptr
<ExprAST
> Body
;
246 std::vector
<std::pair
<std::string
, std::unique_ptr
<ExprAST
>>> VarNames
,
247 std::unique_ptr
<ExprAST
> Body
)
248 : VarNames(std::move(VarNames
)), Body(std::move(Body
)) {}
250 Value
*codegen() override
;
253 /// PrototypeAST - This class represents the "prototype" for a function,
254 /// which captures its name, and its argument names (thus implicitly the number
255 /// of arguments the function takes), as well as if it is an operator.
258 std::vector
<std::string
> Args
;
260 unsigned Precedence
; // Precedence if a binary op.
263 PrototypeAST(const std::string
&Name
, std::vector
<std::string
> Args
,
264 bool IsOperator
= false, unsigned Prec
= 0)
265 : Name(Name
), Args(std::move(Args
)), IsOperator(IsOperator
),
269 const std::string
&getName() const { return Name
; }
271 bool isUnaryOp() const { return IsOperator
&& Args
.size() == 1; }
272 bool isBinaryOp() const { return IsOperator
&& Args
.size() == 2; }
274 char getOperatorName() const {
275 assert(isUnaryOp() || isBinaryOp());
276 return Name
[Name
.size() - 1];
279 unsigned getBinaryPrecedence() const { return Precedence
; }
282 /// FunctionAST - This class represents a function definition itself.
284 std::unique_ptr
<PrototypeAST
> Proto
;
285 std::unique_ptr
<ExprAST
> Body
;
288 FunctionAST(std::unique_ptr
<PrototypeAST
> Proto
,
289 std::unique_ptr
<ExprAST
> Body
)
290 : Proto(std::move(Proto
)), Body(std::move(Body
)) {}
295 } // end anonymous namespace
297 //===----------------------------------------------------------------------===//
299 //===----------------------------------------------------------------------===//
301 /// CurTok/getNextToken - Provide a simple token buffer. CurTok is the current
302 /// token the parser is looking at. getNextToken reads another token from the
303 /// lexer and updates CurTok with its results.
305 static int getNextToken() { return CurTok
= gettok(); }
307 /// BinopPrecedence - This holds the precedence for each binary operator that is
309 static std::map
<char, int> BinopPrecedence
;
311 /// GetTokPrecedence - Get the precedence of the pending binary operator token.
312 static int GetTokPrecedence() {
313 if (!isascii(CurTok
))
316 // Make sure it's a declared binop.
317 int TokPrec
= BinopPrecedence
[CurTok
];
323 /// LogError* - These are little helper functions for error handling.
324 std::unique_ptr
<ExprAST
> LogError(const char *Str
) {
325 fprintf(stderr
, "Error: %s\n", Str
);
329 std::unique_ptr
<PrototypeAST
> LogErrorP(const char *Str
) {
334 static std::unique_ptr
<ExprAST
> ParseExpression();
336 /// numberexpr ::= number
337 static std::unique_ptr
<ExprAST
> ParseNumberExpr() {
338 auto Result
= std::make_unique
<NumberExprAST
>(NumVal
);
339 getNextToken(); // consume the number
340 return std::move(Result
);
343 /// parenexpr ::= '(' expression ')'
344 static std::unique_ptr
<ExprAST
> ParseParenExpr() {
345 getNextToken(); // eat (.
346 auto V
= ParseExpression();
351 return LogError("expected ')'");
352 getNextToken(); // eat ).
358 /// ::= identifier '(' expression* ')'
359 static std::unique_ptr
<ExprAST
> ParseIdentifierExpr() {
360 std::string IdName
= IdentifierStr
;
362 getNextToken(); // eat identifier.
364 if (CurTok
!= '(') // Simple variable ref.
365 return std::make_unique
<VariableExprAST
>(IdName
);
368 getNextToken(); // eat (
369 std::vector
<std::unique_ptr
<ExprAST
>> Args
;
372 if (auto Arg
= ParseExpression())
373 Args
.push_back(std::move(Arg
));
381 return LogError("Expected ')' or ',' in argument list");
389 return std::make_unique
<CallExprAST
>(IdName
, std::move(Args
));
392 /// ifexpr ::= 'if' expression 'then' expression 'else' expression
393 static std::unique_ptr
<ExprAST
> ParseIfExpr() {
394 getNextToken(); // eat the if.
397 auto Cond
= ParseExpression();
401 if (CurTok
!= tok_then
)
402 return LogError("expected then");
403 getNextToken(); // eat the then
405 auto Then
= ParseExpression();
409 if (CurTok
!= tok_else
)
410 return LogError("expected else");
414 auto Else
= ParseExpression();
418 return std::make_unique
<IfExprAST
>(std::move(Cond
), std::move(Then
),
422 /// forexpr ::= 'for' identifier '=' expr ',' expr (',' expr)? 'in' expression
423 static std::unique_ptr
<ExprAST
> ParseForExpr() {
424 getNextToken(); // eat the for.
426 if (CurTok
!= tok_identifier
)
427 return LogError("expected identifier after for");
429 std::string IdName
= IdentifierStr
;
430 getNextToken(); // eat identifier.
433 return LogError("expected '=' after for");
434 getNextToken(); // eat '='.
436 auto Start
= ParseExpression();
440 return LogError("expected ',' after for start value");
443 auto End
= ParseExpression();
447 // The step value is optional.
448 std::unique_ptr
<ExprAST
> Step
;
451 Step
= ParseExpression();
456 if (CurTok
!= tok_in
)
457 return LogError("expected 'in' after for");
458 getNextToken(); // eat 'in'.
460 auto Body
= ParseExpression();
464 return std::make_unique
<ForExprAST
>(IdName
, std::move(Start
), std::move(End
),
465 std::move(Step
), std::move(Body
));
468 /// varexpr ::= 'var' identifier ('=' expression)?
469 // (',' identifier ('=' expression)?)* 'in' expression
470 static std::unique_ptr
<ExprAST
> ParseVarExpr() {
471 getNextToken(); // eat the var.
473 std::vector
<std::pair
<std::string
, std::unique_ptr
<ExprAST
>>> VarNames
;
475 // At least one variable name is required.
476 if (CurTok
!= tok_identifier
)
477 return LogError("expected identifier after var");
480 std::string Name
= IdentifierStr
;
481 getNextToken(); // eat identifier.
483 // Read the optional initializer.
484 std::unique_ptr
<ExprAST
> Init
= nullptr;
486 getNextToken(); // eat the '='.
488 Init
= ParseExpression();
493 VarNames
.push_back(std::make_pair(Name
, std::move(Init
)));
495 // End of var list, exit loop.
498 getNextToken(); // eat the ','.
500 if (CurTok
!= tok_identifier
)
501 return LogError("expected identifier list after var");
504 // At this point, we have to have 'in'.
505 if (CurTok
!= tok_in
)
506 return LogError("expected 'in' keyword after 'var'");
507 getNextToken(); // eat 'in'.
509 auto Body
= ParseExpression();
513 return std::make_unique
<VarExprAST
>(std::move(VarNames
), std::move(Body
));
517 /// ::= identifierexpr
523 static std::unique_ptr
<ExprAST
> ParsePrimary() {
526 return LogError("unknown token when expecting an expression");
528 return ParseIdentifierExpr();
530 return ParseNumberExpr();
532 return ParseParenExpr();
534 return ParseIfExpr();
536 return ParseForExpr();
538 return ParseVarExpr();
545 static std::unique_ptr
<ExprAST
> ParseUnary() {
546 // If the current token is not an operator, it must be a primary expr.
547 if (!isascii(CurTok
) || CurTok
== '(' || CurTok
== ',')
548 return ParsePrimary();
550 // If this is a unary operator, read it.
553 if (auto Operand
= ParseUnary())
554 return std::make_unique
<UnaryExprAST
>(Opc
, std::move(Operand
));
560 static std::unique_ptr
<ExprAST
> ParseBinOpRHS(int ExprPrec
,
561 std::unique_ptr
<ExprAST
> LHS
) {
562 // If this is a binop, find its precedence.
564 int TokPrec
= GetTokPrecedence();
566 // If this is a binop that binds at least as tightly as the current binop,
567 // consume it, otherwise we are done.
568 if (TokPrec
< ExprPrec
)
571 // Okay, we know this is a binop.
573 getNextToken(); // eat binop
575 // Parse the unary expression after the binary operator.
576 auto RHS
= ParseUnary();
580 // If BinOp binds less tightly with RHS than the operator after RHS, let
581 // the pending operator take RHS as its LHS.
582 int NextPrec
= GetTokPrecedence();
583 if (TokPrec
< NextPrec
) {
584 RHS
= ParseBinOpRHS(TokPrec
+ 1, std::move(RHS
));
591 std::make_unique
<BinaryExprAST
>(BinOp
, std::move(LHS
), std::move(RHS
));
596 /// ::= unary binoprhs
598 static std::unique_ptr
<ExprAST
> ParseExpression() {
599 auto LHS
= ParseUnary();
603 return ParseBinOpRHS(0, std::move(LHS
));
607 /// ::= id '(' id* ')'
608 /// ::= binary LETTER number? (id, id)
609 /// ::= unary LETTER (id)
610 static std::unique_ptr
<PrototypeAST
> ParsePrototype() {
613 unsigned Kind
= 0; // 0 = identifier, 1 = unary, 2 = binary.
614 unsigned BinaryPrecedence
= 30;
618 return LogErrorP("Expected function name in prototype");
620 FnName
= IdentifierStr
;
626 if (!isascii(CurTok
))
627 return LogErrorP("Expected unary operator");
629 FnName
+= (char)CurTok
;
635 if (!isascii(CurTok
))
636 return LogErrorP("Expected binary operator");
638 FnName
+= (char)CurTok
;
642 // Read the precedence if present.
643 if (CurTok
== tok_number
) {
644 if (NumVal
< 1 || NumVal
> 100)
645 return LogErrorP("Invalid precedence: must be 1..100");
646 BinaryPrecedence
= (unsigned)NumVal
;
653 return LogErrorP("Expected '(' in prototype");
655 std::vector
<std::string
> ArgNames
;
656 while (getNextToken() == tok_identifier
)
657 ArgNames
.push_back(IdentifierStr
);
659 return LogErrorP("Expected ')' in prototype");
662 getNextToken(); // eat ')'.
664 // Verify right number of names for operator.
665 if (Kind
&& ArgNames
.size() != Kind
)
666 return LogErrorP("Invalid number of operands for operator");
668 return std::make_unique
<PrototypeAST
>(FnName
, ArgNames
, Kind
!= 0,
672 /// definition ::= 'def' prototype expression
673 static std::unique_ptr
<FunctionAST
> ParseDefinition() {
674 getNextToken(); // eat def.
675 auto Proto
= ParsePrototype();
679 if (auto E
= ParseExpression())
680 return std::make_unique
<FunctionAST
>(std::move(Proto
), std::move(E
));
684 /// toplevelexpr ::= expression
685 static std::unique_ptr
<FunctionAST
> ParseTopLevelExpr() {
686 if (auto E
= ParseExpression()) {
687 // Make an anonymous proto.
688 auto Proto
= std::make_unique
<PrototypeAST
>("__anon_expr",
689 std::vector
<std::string
>());
690 return std::make_unique
<FunctionAST
>(std::move(Proto
), std::move(E
));
695 /// external ::= 'extern' prototype
696 static std::unique_ptr
<PrototypeAST
> ParseExtern() {
697 getNextToken(); // eat extern.
698 return ParsePrototype();
701 //===----------------------------------------------------------------------===//
703 //===----------------------------------------------------------------------===//
705 static LLVMContext TheContext
;
706 static IRBuilder
<> Builder(TheContext
);
707 static std::unique_ptr
<Module
> TheModule
;
708 static std::map
<std::string
, AllocaInst
*> NamedValues
;
709 static std::map
<std::string
, std::unique_ptr
<PrototypeAST
>> FunctionProtos
;
711 Value
*LogErrorV(const char *Str
) {
716 Function
*getFunction(std::string Name
) {
717 // First, see if the function has already been added to the current module.
718 if (auto *F
= TheModule
->getFunction(Name
))
721 // If not, check whether we can codegen the declaration from some existing
723 auto FI
= FunctionProtos
.find(Name
);
724 if (FI
!= FunctionProtos
.end())
725 return FI
->second
->codegen();
727 // If no existing prototype exists, return null.
731 /// CreateEntryBlockAlloca - Create an alloca instruction in the entry block of
732 /// the function. This is used for mutable variables etc.
733 static AllocaInst
*CreateEntryBlockAlloca(Function
*TheFunction
,
734 const std::string
&VarName
) {
735 IRBuilder
<> TmpB(&TheFunction
->getEntryBlock(),
736 TheFunction
->getEntryBlock().begin());
737 return TmpB
.CreateAlloca(Type::getDoubleTy(TheContext
), nullptr, VarName
);
740 Value
*NumberExprAST::codegen() {
741 return ConstantFP::get(TheContext
, APFloat(Val
));
744 Value
*VariableExprAST::codegen() {
745 // Look this variable up in the function.
746 Value
*V
= NamedValues
[Name
];
748 return LogErrorV("Unknown variable name");
751 return Builder
.CreateLoad(V
, Name
.c_str());
754 Value
*UnaryExprAST::codegen() {
755 Value
*OperandV
= Operand
->codegen();
759 Function
*F
= getFunction(std::string("unary") + Opcode
);
761 return LogErrorV("Unknown unary operator");
763 return Builder
.CreateCall(F
, OperandV
, "unop");
766 Value
*BinaryExprAST::codegen() {
767 // Special case '=' because we don't want to emit the LHS as an expression.
769 // Assignment requires the LHS to be an identifier.
770 // This assume we're building without RTTI because LLVM builds that way by
771 // default. If you build LLVM with RTTI this can be changed to a
772 // dynamic_cast for automatic error checking.
773 VariableExprAST
*LHSE
= static_cast<VariableExprAST
*>(LHS
.get());
775 return LogErrorV("destination of '=' must be a variable");
777 Value
*Val
= RHS
->codegen();
782 Value
*Variable
= NamedValues
[LHSE
->getName()];
784 return LogErrorV("Unknown variable name");
786 Builder
.CreateStore(Val
, Variable
);
790 Value
*L
= LHS
->codegen();
791 Value
*R
= RHS
->codegen();
797 return Builder
.CreateFAdd(L
, R
, "addtmp");
799 return Builder
.CreateFSub(L
, R
, "subtmp");
801 return Builder
.CreateFMul(L
, R
, "multmp");
803 L
= Builder
.CreateFCmpULT(L
, R
, "cmptmp");
804 // Convert bool 0/1 to double 0.0 or 1.0
805 return Builder
.CreateUIToFP(L
, Type::getDoubleTy(TheContext
), "booltmp");
810 // If it wasn't a builtin binary operator, it must be a user defined one. Emit
812 Function
*F
= getFunction(std::string("binary") + Op
);
813 assert(F
&& "binary operator not found!");
815 Value
*Ops
[] = {L
, R
};
816 return Builder
.CreateCall(F
, Ops
, "binop");
819 Value
*CallExprAST::codegen() {
820 // Look up the name in the global module table.
821 Function
*CalleeF
= getFunction(Callee
);
823 return LogErrorV("Unknown function referenced");
825 // If argument mismatch error.
826 if (CalleeF
->arg_size() != Args
.size())
827 return LogErrorV("Incorrect # arguments passed");
829 std::vector
<Value
*> ArgsV
;
830 for (unsigned i
= 0, e
= Args
.size(); i
!= e
; ++i
) {
831 ArgsV
.push_back(Args
[i
]->codegen());
836 return Builder
.CreateCall(CalleeF
, ArgsV
, "calltmp");
839 Value
*IfExprAST::codegen() {
840 Value
*CondV
= Cond
->codegen();
844 // Convert condition to a bool by comparing non-equal to 0.0.
845 CondV
= Builder
.CreateFCmpONE(
846 CondV
, ConstantFP::get(TheContext
, APFloat(0.0)), "ifcond");
848 Function
*TheFunction
= Builder
.GetInsertBlock()->getParent();
850 // Create blocks for the then and else cases. Insert the 'then' block at the
851 // end of the function.
852 BasicBlock
*ThenBB
= BasicBlock::Create(TheContext
, "then", TheFunction
);
853 BasicBlock
*ElseBB
= BasicBlock::Create(TheContext
, "else");
854 BasicBlock
*MergeBB
= BasicBlock::Create(TheContext
, "ifcont");
856 Builder
.CreateCondBr(CondV
, ThenBB
, ElseBB
);
859 Builder
.SetInsertPoint(ThenBB
);
861 Value
*ThenV
= Then
->codegen();
865 Builder
.CreateBr(MergeBB
);
866 // Codegen of 'Then' can change the current block, update ThenBB for the PHI.
867 ThenBB
= Builder
.GetInsertBlock();
870 TheFunction
->getBasicBlockList().push_back(ElseBB
);
871 Builder
.SetInsertPoint(ElseBB
);
873 Value
*ElseV
= Else
->codegen();
877 Builder
.CreateBr(MergeBB
);
878 // Codegen of 'Else' can change the current block, update ElseBB for the PHI.
879 ElseBB
= Builder
.GetInsertBlock();
882 TheFunction
->getBasicBlockList().push_back(MergeBB
);
883 Builder
.SetInsertPoint(MergeBB
);
884 PHINode
*PN
= Builder
.CreatePHI(Type::getDoubleTy(TheContext
), 2, "iftmp");
886 PN
->addIncoming(ThenV
, ThenBB
);
887 PN
->addIncoming(ElseV
, ElseBB
);
891 // Output for-loop as:
892 // var = alloca double
895 // store start -> var
906 // nextvar = curvar + step
907 // store nextvar -> var
908 // br endcond, loop, endloop
910 Value
*ForExprAST::codegen() {
911 Function
*TheFunction
= Builder
.GetInsertBlock()->getParent();
913 // Create an alloca for the variable in the entry block.
914 AllocaInst
*Alloca
= CreateEntryBlockAlloca(TheFunction
, VarName
);
916 // Emit the start code first, without 'variable' in scope.
917 Value
*StartVal
= Start
->codegen();
921 // Store the value into the alloca.
922 Builder
.CreateStore(StartVal
, Alloca
);
924 // Make the new basic block for the loop header, inserting after current
926 BasicBlock
*LoopBB
= BasicBlock::Create(TheContext
, "loop", TheFunction
);
928 // Insert an explicit fall through from the current block to the LoopBB.
929 Builder
.CreateBr(LoopBB
);
931 // Start insertion in LoopBB.
932 Builder
.SetInsertPoint(LoopBB
);
934 // Within the loop, the variable is defined equal to the PHI node. If it
935 // shadows an existing variable, we have to restore it, so save it now.
936 AllocaInst
*OldVal
= NamedValues
[VarName
];
937 NamedValues
[VarName
] = Alloca
;
939 // Emit the body of the loop. This, like any other expr, can change the
940 // current BB. Note that we ignore the value computed by the body, but don't
942 if (!Body
->codegen())
945 // Emit the step value.
946 Value
*StepVal
= nullptr;
948 StepVal
= Step
->codegen();
952 // If not specified, use 1.0.
953 StepVal
= ConstantFP::get(TheContext
, APFloat(1.0));
956 // Compute the end condition.
957 Value
*EndCond
= End
->codegen();
961 // Reload, increment, and restore the alloca. This handles the case where
962 // the body of the loop mutates the variable.
963 Value
*CurVar
= Builder
.CreateLoad(Alloca
, VarName
.c_str());
964 Value
*NextVar
= Builder
.CreateFAdd(CurVar
, StepVal
, "nextvar");
965 Builder
.CreateStore(NextVar
, Alloca
);
967 // Convert condition to a bool by comparing non-equal to 0.0.
968 EndCond
= Builder
.CreateFCmpONE(
969 EndCond
, ConstantFP::get(TheContext
, APFloat(0.0)), "loopcond");
971 // Create the "after loop" block and insert it.
972 BasicBlock
*AfterBB
=
973 BasicBlock::Create(TheContext
, "afterloop", TheFunction
);
975 // Insert the conditional branch into the end of LoopEndBB.
976 Builder
.CreateCondBr(EndCond
, LoopBB
, AfterBB
);
978 // Any new code will be inserted in AfterBB.
979 Builder
.SetInsertPoint(AfterBB
);
981 // Restore the unshadowed variable.
983 NamedValues
[VarName
] = OldVal
;
985 NamedValues
.erase(VarName
);
987 // for expr always returns 0.0.
988 return Constant::getNullValue(Type::getDoubleTy(TheContext
));
991 Value
*VarExprAST::codegen() {
992 std::vector
<AllocaInst
*> OldBindings
;
994 Function
*TheFunction
= Builder
.GetInsertBlock()->getParent();
996 // Register all variables and emit their initializer.
997 for (unsigned i
= 0, e
= VarNames
.size(); i
!= e
; ++i
) {
998 const std::string
&VarName
= VarNames
[i
].first
;
999 ExprAST
*Init
= VarNames
[i
].second
.get();
1001 // Emit the initializer before adding the variable to scope, this prevents
1002 // the initializer from referencing the variable itself, and permits stuff
1005 // var a = a in ... # refers to outer 'a'.
1008 InitVal
= Init
->codegen();
1011 } else { // If not specified, use 0.0.
1012 InitVal
= ConstantFP::get(TheContext
, APFloat(0.0));
1015 AllocaInst
*Alloca
= CreateEntryBlockAlloca(TheFunction
, VarName
);
1016 Builder
.CreateStore(InitVal
, Alloca
);
1018 // Remember the old variable binding so that we can restore the binding when
1020 OldBindings
.push_back(NamedValues
[VarName
]);
1022 // Remember this binding.
1023 NamedValues
[VarName
] = Alloca
;
1026 // Codegen the body, now that all vars are in scope.
1027 Value
*BodyVal
= Body
->codegen();
1031 // Pop all our variables from scope.
1032 for (unsigned i
= 0, e
= VarNames
.size(); i
!= e
; ++i
)
1033 NamedValues
[VarNames
[i
].first
] = OldBindings
[i
];
1035 // Return the body computation.
1039 Function
*PrototypeAST::codegen() {
1040 // Make the function type: double(double,double) etc.
1041 std::vector
<Type
*> Doubles(Args
.size(), Type::getDoubleTy(TheContext
));
1043 FunctionType::get(Type::getDoubleTy(TheContext
), Doubles
, false);
1046 Function::Create(FT
, Function::ExternalLinkage
, Name
, TheModule
.get());
1048 // Set names for all arguments.
1050 for (auto &Arg
: F
->args())
1051 Arg
.setName(Args
[Idx
++]);
1056 Function
*FunctionAST::codegen() {
1057 // Transfer ownership of the prototype to the FunctionProtos map, but keep a
1058 // reference to it for use below.
1060 FunctionProtos
[Proto
->getName()] = std::move(Proto
);
1061 Function
*TheFunction
= getFunction(P
.getName());
1065 // If this is an operator, install it.
1067 BinopPrecedence
[P
.getOperatorName()] = P
.getBinaryPrecedence();
1069 // Create a new basic block to start insertion into.
1070 BasicBlock
*BB
= BasicBlock::Create(TheContext
, "entry", TheFunction
);
1071 Builder
.SetInsertPoint(BB
);
1073 // Record the function arguments in the NamedValues map.
1074 NamedValues
.clear();
1075 for (auto &Arg
: TheFunction
->args()) {
1076 // Create an alloca for this variable.
1077 AllocaInst
*Alloca
= CreateEntryBlockAlloca(TheFunction
, Arg
.getName());
1079 // Store the initial value into the alloca.
1080 Builder
.CreateStore(&Arg
, Alloca
);
1082 // Add arguments to variable symbol table.
1083 NamedValues
[Arg
.getName()] = Alloca
;
1086 if (Value
*RetVal
= Body
->codegen()) {
1087 // Finish off the function.
1088 Builder
.CreateRet(RetVal
);
1090 // Validate the generated code, checking for consistency.
1091 verifyFunction(*TheFunction
);
1096 // Error reading body, remove function.
1097 TheFunction
->eraseFromParent();
1100 BinopPrecedence
.erase(P
.getOperatorName());
1104 //===----------------------------------------------------------------------===//
1105 // Top-Level parsing and JIT Driver
1106 //===----------------------------------------------------------------------===//
1108 static void InitializeModuleAndPassManager() {
1109 // Open a new module.
1110 TheModule
= std::make_unique
<Module
>("my cool jit", TheContext
);
1113 static void HandleDefinition() {
1114 if (auto FnAST
= ParseDefinition()) {
1115 if (auto *FnIR
= FnAST
->codegen()) {
1116 fprintf(stderr
, "Read function definition:");
1117 FnIR
->print(errs());
1118 fprintf(stderr
, "\n");
1121 // Skip token for error recovery.
1126 static void HandleExtern() {
1127 if (auto ProtoAST
= ParseExtern()) {
1128 if (auto *FnIR
= ProtoAST
->codegen()) {
1129 fprintf(stderr
, "Read extern: ");
1130 FnIR
->print(errs());
1131 fprintf(stderr
, "\n");
1132 FunctionProtos
[ProtoAST
->getName()] = std::move(ProtoAST
);
1135 // Skip token for error recovery.
1140 static void HandleTopLevelExpression() {
1141 // Evaluate a top-level expression into an anonymous function.
1142 if (auto FnAST
= ParseTopLevelExpr()) {
1145 // Skip token for error recovery.
1150 /// top ::= definition | external | expression | ';'
1151 static void MainLoop() {
1156 case ';': // ignore top-level semicolons.
1166 HandleTopLevelExpression();
1172 //===----------------------------------------------------------------------===//
1173 // "Library" functions that can be "extern'd" from user code.
1174 //===----------------------------------------------------------------------===//
#ifdef _WIN32
#define DLLEXPORT __declspec(dllexport)
#else
#define DLLEXPORT
#endif

/// putchard - putchar that takes a double and returns 0.
extern "C" DLLEXPORT double putchard(double X) {
  fputc(static_cast<char>(X), stderr);
  return 0;
}

/// printd - printf that takes a double prints it as "%f\n", returning 0.
extern "C" DLLEXPORT double printd(double X) {
  fprintf(stderr, "%f\n", X);
  return 0;
}
1194 //===----------------------------------------------------------------------===//
1195 // Main driver code.
1196 //===----------------------------------------------------------------------===//
1199 // Install standard binary operators.
1200 // 1 is lowest precedence.
1201 BinopPrecedence
['<'] = 10;
1202 BinopPrecedence
['+'] = 20;
1203 BinopPrecedence
['-'] = 20;
1204 BinopPrecedence
['*'] = 40; // highest.
1206 // Prime the first token.
1207 fprintf(stderr
, "ready> ");
1210 InitializeModuleAndPassManager();
1212 // Run the main "interpreter loop" now.
1215 // Initialize the target registry etc.
1216 InitializeAllTargetInfos();
1217 InitializeAllTargets();
1218 InitializeAllTargetMCs();
1219 InitializeAllAsmParsers();
1220 InitializeAllAsmPrinters();
1222 auto TargetTriple
= sys::getDefaultTargetTriple();
1223 TheModule
->setTargetTriple(TargetTriple
);
1226 auto Target
= TargetRegistry::lookupTarget(TargetTriple
, Error
);
1228 // Print an error and exit if we couldn't find the requested target.
1229 // This generally occurs if we've forgotten to initialise the
1230 // TargetRegistry or we have a bogus target triple.
1236 auto CPU
= "generic";
1240 auto RM
= Optional
<Reloc::Model
>();
1241 auto TheTargetMachine
=
1242 Target
->createTargetMachine(TargetTriple
, CPU
, Features
, opt
, RM
);
1244 TheModule
->setDataLayout(TheTargetMachine
->createDataLayout());
1246 auto Filename
= "output.o";
1248 raw_fd_ostream
dest(Filename
, EC
, sys::fs::OF_None
);
1251 errs() << "Could not open file: " << EC
.message();
1255 legacy::PassManager pass
;
1256 auto FileType
= TargetMachine::CGFT_ObjectFile
;
1258 if (TheTargetMachine
->addPassesToEmitFile(pass
, dest
, nullptr, FileType
)) {
1259 errs() << "TheTargetMachine can't emit a file of this type";
1263 pass
.run(*TheModule
);
1266 outs() << "Wrote " << Filename
<< "\n";