-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathlang_2-2-llvm.cxx
275 lines (227 loc) · 11.1 KB
/
lang_2-2-llvm.cxx
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
// (C) Bernard Hugueney, licence GPL v3
#include <string>
#include <iostream>
#include <boost/spirit/include/qi.hpp>
#include <boost/spirit/include/phoenix_operator.hpp>
#include <boost/spirit/include/phoenix_function.hpp>
#include <llvm/LLVMContext.h>
#include <llvm/Module.h>
#include <llvm/Function.h>
#include <llvm/PassManager.h>
#include <llvm/Analysis/Verifier.h>
#include <llvm/Assembly/PrintModulePass.h>
#include <llvm/Support/IRBuilder.h>
#include <llvm/Support/raw_ostream.h>
//#include "IRBuilderNoFold.h" //
using namespace llvm;
/*
lang_2 : variables declarations and assignments with infix arithmetic expressions, ends with a return statement.
Default llvm Internal Representation Builder does constant folding.
Variables mapping name->adress is handled directly by spirit::symbols<>
Much of the code is there only to enable support for all numeric types (short, int, long, float, double) as valid value_t.
diff from lang_2 : member function ptr dispatch of IRBuilder is done with the ptr encoded as template of a type instead of a ptr args.
*/
// time g++ -std=c++0x -o lang_2-llvm lang_2-llvm.cxx `llvm-config-2.8 --cppflags --ldflags --libs core` -lstdc++ -O4
using namespace boost::spirit;
using namespace boost::spirit::qi;
using namespace boost::spirit::standard;
// template function to map C++ type -> llvm::Type
template<typename T> static const Type* type(){ return "unkown type!";}// error
template<> const Type* type<void>() { return Type::getVoidTy(getGlobalContext());}
template<> const Type* type<int>() { return Type::getInt32Ty(getGlobalContext());}
template<> const Type* type<long>() { return Type::getInt64Ty(getGlobalContext());}
template<> const Type* type<float>() { return Type::getFloatTy(getGlobalContext());}
template<> const Type* type<double>(){ return Type::getDoubleTy(getGlobalContext());}
// template structs to map C++ type -> Spirit2 numeric parser
template<typename T> struct numeric_parser{};
template<> struct numeric_parser<short>{
typedef const short__type type;
static type parser;
};
numeric_parser<short>::type numeric_parser<short>::parser=short_;
template<> struct numeric_parser<int>{
typedef const int__type type;
static type parser;
};
numeric_parser<int>::type numeric_parser<int>::parser=int_;
template<> struct numeric_parser<long>{
typedef const long__type type;
static type parser;
};
numeric_parser<long>::type numeric_parser<long>::parser=long_;
template<> struct numeric_parser<float>{
typedef const float__type type;
static type parser;
};
numeric_parser<float>::type numeric_parser<float>::parser=float_;
template<> struct numeric_parser<double>{
typedef const double__type type;
static type parser;
};
numeric_parser<double>::type numeric_parser<double>::parser=double_;
template<> struct numeric_parser<long double>{
typedef const long_double_type type;
static type parser;
};
// now the real deal, at last ! :-)
// arithmetic expression grammar, using semantic actions to create llvm internal representation
template <typename value_t, typename Iterator>
struct language_2_grammar : grammar<Iterator, space_type> {
// symbols map use to store varables names and map them to the relevant llvm node
typedef symbols<char,AllocaInst*> vars_t;
// functor strucuture used to create llvm internal representation
// (ab)using a lot boost::phoenix::function<> ability to overload operator() !
template<Value* (IRBuilder<>::*)(Value*, Value*, const Twine&)> struct binary_op{};
template<Value* (IRBuilder<>::*)(Value*, const Twine&)> struct unary_op{};
typedef binary_op<&IRBuilder<>::CreateAdd> add_t;//
typedef binary_op<&IRBuilder<>::CreateSub> sub_t;
typedef binary_op<&IRBuilder<>::CreateMul> mul_t;//
typedef binary_op<&IRBuilder<>::CreateSDiv> div_t;
typedef unary_op<&IRBuilder<>::CreateNeg> neg_t; //
struct builder_helper{
// typedef to ease to use of pointers to member function
#if 0
typedef Value* (IRBuilder<>::*binary_op_t)(Value*, Value*, const Twine&);
typedef Value* (IRBuilder<>::*unary_op_t)(Value*, const Twine&);
#endif
// template structs to have different result type according to the argument types
// template structs to have different result type according to the argument types
//def -> Value*
//(AllocaInst*, Value*) ->StoreInst*
//(std::string const) -> AllocaInst*
//(Value*) -> ReturnInst*
template<typename T1, typename T2=void, typename T3=void, typename T4=void>
struct result : boost::mpl::if_<
boost::mpl::and_<boost::is_same<T1, AllocaInst*>
,boost::is_same<T2, Value*> >
, StoreInst*
, typename boost::mpl::if_<boost::is_same<T1, std::string>
, AllocaInst*
, typename boost::mpl::if_<boost::is_same<T1, Value*>
, ReturnInst*
, Value*>::type >::type > {};
builder_helper(vars_t &v, IRBuilder<>& b):vars(v), builder(b){}
// binary operations
template< Value*(IRBuilder<>::* const mem_fun)(Value*, Value*, const Twine&)>
Value* operator()(binary_op<mem_fun> /*unused*/,Value* a1, Value* a2, const char * name) const
{ return (builder.*mem_fun)(a1, a2, name); }
// unary operation
template< Value*(IRBuilder<>::* const mem_fun)( Value*, const Twine&)>
Value* operator()(unary_op<mem_fun> /*unused*/,Value* a, const char * name) const
{ return (builder.*mem_fun)(a, name); }
// return instruction
ReturnInst* operator()(Value* a) const { return builder.CreateRet(a); }
// variable assignment
StoreInst* operator()(AllocaInst* variable, Value* value ) const
{ return builder.CreateStore(value, variable, false); }
// reading a variable value
Value* operator()(AllocaInst* variable) const {return builder.CreateLoad(variable);}
// variable declaration
AllocaInst* operator()(std::string const& name) const{
AllocaInst* res(builder.CreateAlloca(type<value_t>(),0, name.c_str()));
vars.add(name.begin(), name.end(), res);
return res;
}
// constant values
Value* operator()(short v) const { return ConstantInt::get(getGlobalContext(), APInt(sizeof(short)*8, v)); }
Value* operator()(int v) const { return ConstantInt::get(getGlobalContext(), APInt(sizeof(int)*8, v)); }
Value* operator()(long v) const { return ConstantInt::get(getGlobalContext(), APInt(sizeof(long)*8, v)); }
Value* operator()(float v) const { return ConstantFP::get(getGlobalContext(), APFloat(v)); }// APFloat()
Value* operator()(double v)const { return ConstantFP::get(getGlobalContext(), APFloat(v)); }// is overloaded
vars_t& vars;
IRBuilder<>& builder;
};
language_2_grammar( IRBuilder<>& ir)
: language_2_grammar::base_type(program), build(builder_helper(vars, ir)) {
reserved_keywords = "var", "return";
program = *(variable_declaration | assignment) >> return_statement;
// we want to enforce the space after "return" so we must disable skipper with lexeme[]
return_statement = lexeme["return" >> space] >> additive_expression[_val=build(_1)]>>';' ;
additive_expression =
multiplicative_expression [_val=_1]
>> *(
('+' >> multiplicative_expression
[_val= build(add_t(), _val, _1,"addtmp")])
|('-' >> multiplicative_expression
[_val=build(sub_t(), _val, _1,"subtmp")])
)
;
multiplicative_expression =
unary_expression [_val=_1]
>> *(
('*' >> unary_expression[_val= build(mul_t(), _val, _1, "multmp")])
|('/' >> unary_expression [_val = build(div_t(),_val, _1, "divtmp")])
)
;
unary_expression =
primary_expression[_val = _1]
| ('-' >> primary_expression[_val= build(neg_t(), _1,"negtmp")])
| ('+' >> primary_expression[_val= _1])
;
primary_expression =
numeric_to_val [_val=_1]
| id_declared_var [_val=build(_1)]
| '(' >> additive_expression [_val=_1] >> ')'
;
numeric_to_val = numeric_parser<value_t>::parser[_val=build(_1)];
variable = id_declared_var[_val=build(_1)];
id_declaration %= raw[lexeme[alpha >> *(alnum | '_')]] ;//lexeme disables skipping for >>
id_declared_var = lexeme[ vars [_val = _1] // ditto for lexeme, id must be in vars
>> !(alnum | '_')]; // prevents partial match with only a prefix
variable_declaration = "var" >> !id_declared_var // disallow redeclaration of variables
>> !reserved_keywords
>> id_declaration [_a = build(_1)]
>> (';' | '=' >> assignment_rhs(_a));
// id_declared_var returns the AllocaInst* of the variable
assignment = id_declared_var [_a = _1] >> '=' >> assignment_rhs(_a);
assignment_rhs = additive_expression[_a=_1] >> char_(';')[build(_r1, _a)];
}
symbols<char, unused_type> reserved_keywords;
vars_t vars;
boost::phoenix::function<builder_helper> build;
rule<Iterator, Value*(), space_type> additive_expression, multiplicative_expression
, unary_expression, primary_expression, numeric_to_val, variable;
rule<Iterator, locals<AllocaInst*>, space_type> variable_declaration, assignment;
rule<Iterator, AllocaInst*(), space_type> id_declared_var;
rule<Iterator, std::string(), space_type> id_declaration;
rule<Iterator, space_type> program, return_statement;
rule<Iterator, void(AllocaInst*), locals<Value*>, space_type> assignment_rhs;
};
int main(int argc, char* argv[]){
typedef int value_t; // type used in arithmetic computations
std::cin.unsetf(std::ios::skipws); // Turn off white space skipping on the stream
typedef std::string buffer_t;
buffer_t buffer(std::istream_iterator<char>(std::cin), (std::istream_iterator<char>()));
typedef buffer_t::const_iterator iter_t;
iter_t iter(buffer.begin()), end(buffer.end());
typedef language_2_grammar<value_t, iter_t> grammar_t;
Module module("lang2", getGlobalContext());
IRBuilder<> ir(BasicBlock::Create(getGlobalContext(), "entry",
cast<Function>(module.getOrInsertFunction("main", type<value_t>(), NULL))));
grammar_t grammar(ir);
bool r = phrase_parse(iter, end, grammar, space);
if (r && iter == end) {
std::cout<<"parsing succeded !\n";
verifyModule(module, PrintMessageAction);
PassManager PM;
std::string out_data;
llvm::raw_string_ostream output(out_data);
PM.add(createPrintModulePass(&output));
PM.run(module);
std::cout<<output.str()<<std::endl;
} else {
std::string rest(iter, end);
std::cerr << "parsing failed\n" << "stopped at: \"" << rest << "\"\n";
}
return r ? 0 : 1 ;
}
template
Value* llvm::IRBuilder<true, llvm::ConstantFolder, llvm::IRBuilderDefaultInserter<true> >::CreateNeg(llvm::Value*, llvm::Twine const&);
template
Value* llvm::IRBuilder<true, llvm::ConstantFolder, llvm::IRBuilderDefaultInserter<true> >::CreateAdd(llvm::Value*, llvm::Value*, llvm::Twine const&);
template
Value* llvm::IRBuilder<true, llvm::ConstantFolder, llvm::IRBuilderDefaultInserter<true> >::CreateMul(llvm::Value*, llvm::Value*, llvm::Twine const&);
template
Value* llvm::IRBuilder<true, llvm::ConstantFolder, llvm::IRBuilderDefaultInserter<true> >::CreateSub(llvm::Value*, llvm::Value*, llvm::Twine const&);
template
Value* llvm::IRBuilder<true, llvm::ConstantFolder, llvm::IRBuilderDefaultInserter<true> >::CreateSDiv(llvm::Value*, llvm::Value*, llvm::Twine const&);