1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
|
#ifndef __LUASL_TREE_H__
#define __LUASL_TREE_H__
#define LUASL_DEBUG 0
#define COMPILE_THREADED 1
#define COMPILE_OUTPUT 0
#define LUASL_DIFF_CHECK 0
#define LUASL_BAD_CHECK 0
#include <stddef.h> // So we can have NULL defined.
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include "assert.h"
#include <unistd.h>
#include <stdlib.h>
#include <stdio.h>
#include <limits.h> // For PATH_MAX.
#include "LuaSL_lemon_yaccer.h"
#define YYERRCODE 256
#define YYDEBUG 1
// http://w-hat.com/stackdepth is a useful discussion about some aspects of the LL parser.
typedef struct _allowedTypes allowedTypes;
typedef struct _LSL_Token LSL_Token;
typedef struct _LSL_Text LSL_Text;
typedef struct _LSL_Leaf LSL_Leaf;
typedef struct _LSL_Numby LSL_Numby;
typedef struct _LSL_Parenthesis LSL_Parenthesis;
typedef struct _LSL_Identifier LSL_Identifier;
typedef struct _LSL_Statement LSL_Statement;
typedef struct _LSL_Block LSL_Block;
typedef struct _LSL_Function LSL_Function;
typedef struct _LSL_FunctionCall LSL_FunctionCall;
typedef struct _LSL_State LSL_State;
typedef struct _LSL_Script LSL_Script;
extern LSL_Token **tokens;
extern int lowestToken;
extern int logDom; // Our logging domain.
typedef int LSL_Type;
typedef enum
{
OM_LSL,
OM_LUA
} outputMode;
typedef void (*outputToken) (FILE *file, outputMode mode, LSL_Leaf *content);
typedef enum
{
LSL_NONE = 0,
LSL_LEFT2RIGHT = 1,
LSL_RIGHT2LEFT = 2,
LSL_INNER2OUTER = 4,
LSL_UNARY = 8,
LSL_ASSIGNMENT = 16,
LSL_CREATION = 32,
LSL_NOIGNORE = 64,
LSL_TYPE = 128
} LSL_Flags;
// VERY IMPORTANT to keep this in sync with allowedTypes allowed[] from LuaSL_compile.c!
typedef enum
{
OT_nothing,
OT_bool,
OT_integer,
OT_float,
OT_key,
OT_list,
OT_rotation,
OT_string,
OT_vector,
OT_other,
OT_boolBool,
OT_intBool,
OT_intInt,
OT_intFloat,
OT_floatInt,
OT_floatFloat,
OT_keyKey,
OT_keyString,
OT_stringKey,
OT_stringString,
OT_listList,
OT_listBool,
OT_listInt,
OT_listFloat,
OT_listString,
OT_intList,
OT_floatList,
OT_listOther,
OT_vectorVector,
OT_vectorFloat,
OT_vectorRotation,
OT_rotationRotation,
OT_otherOther,
OT_undeclared,
OT_invalid
} opType;
typedef enum
{
ST_NONE = 0,
ST_ASSIGNMENT = 1, // -= *= /=
ST_BIT_NOT = 2, // ~
ST_BOOL_NOT = 4, // !
ST_BITWISE = 8, // & | ^ << >>
ST_BOOLEAN = 16, // && !!
ST_COMPARISON = 32, // < > <= >=
ST_CONCATENATION = 64, // = +=
ST_EQUALITY = 128, // == !=
ST_ADD = 512, // +
ST_SUBTRACT = 1024, // -
ST_NEGATE = 2048, // -
ST_MULTIPLY = 4096, // * /
ST_MODULO = 8192 // % %=
} opSubType;
typedef enum
{
MF_NONE = 0,
MF_LOCAL = 1,
MF_NOASSIGN = 2, // These two are for completely different purposes. This one is for variable definitions with no assignment.
MF_ASSIGNEXP = 4, // These two are for completely different purposes. This one is for assignments being used as expressions.
MF_WRAPFUNC = 8,
MF_PREDEC = 16,
MF_PREINC = 32,
MF_POSTDEC = 64,
MF_POSTINC = 128,
MF_LSLCONST = 256,
MF_TYPECAST = 512,
MF_MSTRING = 1024
} miscFlags;
struct _allowedTypes
{
opType result;
const char *name;
int subTypes;
};
struct _LSL_Token
{
LSL_Type type;
opSubType subType;
const char *toKen;
LSL_Flags flags;
outputToken output;
};
struct _LSL_Text
{
const char *text;
#if LUASL_DIFF_CHECK
Eina_Strbuf *ignorable;
#endif
};
struct _LSL_Leaf
{
LSL_Leaf *left;
LSL_Leaf *right;
LSL_Token *toKen;
#if LUASL_DIFF_CHECK
Eina_Strbuf *ignorable;
#endif
int line, column, len;
opType basicType;
miscFlags flags;
union
{
float floatValue;
float vectorValue[3];
float rotationValue[4];
int integerValue;
LSL_Numby *numbyValue;
LSL_Leaf *listValue;
const char *stringValue;
opType operationValue;
LSL_Parenthesis *parenthesis;
LSL_Identifier *identifierValue;
LSL_Statement *statementValue;
LSL_Block *blockValue;
LSL_Function *functionValue;
LSL_FunctionCall *functionCallValue;
LSL_State *stateValue;
LSL_Script *scriptValue;
} value;
};
struct _LSL_Numby
{
LSL_Text text;
LSL_Type type;
union
{
float floatValue;
int integerValue;
} value;
};
struct _LSL_Parenthesis
{
LSL_Leaf *contents;
#if LUASL_DIFF_CHECK
Eina_Strbuf *rightIgnorable;
#endif
LSL_Type type;
miscFlags flags;
};
struct _LSL_Identifier // For variables and function parameters.
{
LSL_Text name;
LSL_Statement *definition;
Eina_Strbuf *ignorable;
const char *sub;
LSL_Leaf value;
miscFlags flags;
};
struct _LSL_DanglingVar
{
Eina_Clist dangler; // Entry for variables used before they are defined.
LSL_Leaf *identifier;
LSL_Leaf *dot;
LSL_Leaf *sub;
};
struct _LSL_Statement
{
Eina_Clist statement; // For block statement lists, this is the entry.
LSL_Text identifier;
LSL_Parenthesis *parenthesis;
LSL_Leaf *expressions; // A for statement will have three expressions, and two semicolons, everything else has zero or one.
LSL_Block *block;
LSL_Statement *single; // For single statement "blocks".
LSL_Statement *elseBlock;
LSL_Type type; // Expression type.
#if LUASL_DIFF_CHECK
Eina_Strbuf **ignorable; // Can be up to five of these I think.
#endif
miscFlags flags;
};
struct _LSL_Block
{
LSL_Block *outerBlock;
Eina_Clist statements; // For statement lists, this is the HEAD.
Eina_Hash *variables; // Those variables in this scope.
LSL_Function *function; // A pointer to the function if this block is a function.
#if LUASL_DIFF_CHECK
Eina_Strbuf *openIgnorable;
Eina_Strbuf *closeIgnorable;
#endif
};
struct _LSL_Function
{
LSL_Text name;
LSL_Text type;
const char *state;
#if LUASL_DIFF_CHECK
// LSL_Leaf *params; // So we store the parenthesis, and their ignorables.
// This points to the params leaf, which is a function, pointing to this structure. The actual params are in vars.
#endif
Eina_Inarray vars;
LSL_Block *block;
miscFlags flags;
};
struct _LSL_FunctionCall
{
LSL_Function *function;
Eina_Inarray params;
Eina_Clist dangler; // Entry for function calls used before the function is defined.
LSL_Leaf *call; // This is to stash the details for dangling ones, to search later.
// The line and column details are needed for bitching, so we need the leaf.
// Also need the stringValue for the search.
// On top of all that, the leaf is still used in expressions, so need to keep it around and update it when resolving danglers.
};
struct _LSL_State
{
LSL_Text name;
LSL_Text state;
LSL_Block *block;
Eina_Hash *handlers;
};
struct _LSL_Script
{
const char *name;
Eina_Hash *functions;
Eina_Hash *states;
Eina_Hash *variables;
int warningCount;
};
/* Tracking variables.
There are global variables, block local variables, and function parameters.
For outputting Lua, which is the ultimate goal -
track order, name, and type.
For looking them up during the compile -
quick access from name.
For validating them during compile -
track type.
For outputting LSL to double check -
track order, name, type, and white space.
For executing directly from the AST -
track order, name, type, and value.
In this case, order is only important for functions.
We can assume that names are stringshared. This means we only have to
compare pointers. It also means the same name stored at diffferent
scopes, must be stored in separate structures, coz the pointers are the
same.
Order is taken care of by the AST anyway, but for somethings we want to
condense the AST down to something more efficient.
On the other hand, no need to micro optimise it just yet, we should be
able to try out other data structures at a later date, then benchmark
them with typical scripts.
Right now I see nothing wrong with the current use of hash for script
and block variables. The same for script states and functions, as well
as state functions. Though in the near future, they will have similar
problems to functions I think - the need to track order and white
space.
Function params got unwieldy. Cleaned that up now.
*/
/* General design.
NOTE We can remove the white space tracking at compile time, as it's
only a debugging aid. Will be a performance and memory gain for
productidon use. Tracking values on the other hand will still be useful
for constants.
The compile process starts with turning tokens into AST nodes connected
in a tree. During that process the parser wants to condense nodes down
to more efficient data structures. This is a good idea, as we will
spend a fair amount of time looking up names, no matter which part of
the process is important at the time.
Once the parser has condensed things down, it only deals with the
condensed nodes. So we can get rid of some of the AST parts at this
time, so long as we keep the relevant information. This is what the
other data structures above are for. Lemon tries to free the no longer
needed AST nodes itself, even if we are still using them internally.
Need to do something about that.
*/
// Define the type for flex and lemon.
#define YYSTYPE LSL_Leaf
typedef struct
{
LuaCompiler *compiler;
void *scanner; // This should be of type yyscan_t, which is typedef to void * anyway, but that does not get defined until LuaSL_lexer.h, which depends on this struct being defined first.
LSL_Leaf *ast;
LSL_Script script;
LSL_State state;
#if LUASL_DIFF_CHECK
Eina_Strbuf *ignorable;
#endif
LSL_Leaf *lval;
LSL_Block *currentBlock;
LSL_Function *currentFunction;
Eina_Clist danglingCalls; // HEAD for function calls used before the function is defined.
Eina_Clist danglingVars; // HEAD for variable refs used before the variable is defined.
int column, line, pass;
boolean undeclared;
boolean inState;
boolean isLSL;
boolean isLua;
} LuaSL_compiler;
#ifndef excludeLexer
#include "LuaSL_lexer.h"
#endif
void finishMessage(LuaCompile *compiler, compileMessage *message, int type, int column, int line);
boolean compilerSetup(gameGlobals *ourGlobals);
void compileLSL(LuaCompiler *compiler);
void burnLeaf(void *data);
LSL_Leaf *addBlock(LuaSL_compiler *compiler, LSL_Leaf *left, LSL_Leaf *lval, LSL_Leaf *right);
LSL_Leaf *addCrement(LuaSL_compiler *compiler, LSL_Leaf *variable, LSL_Leaf *crement, LSL_Type type);
LSL_Leaf *addFor(LuaSL_compiler *compiler, LSL_Leaf *lval, LSL_Leaf *flow, LSL_Leaf *left, LSL_Leaf *expr0, LSL_Leaf *stat0, LSL_Leaf *expr1, LSL_Leaf *stat1, LSL_Leaf *expr2, LSL_Leaf *right, LSL_Leaf *block);
LSL_Leaf *addFunction(LuaSL_compiler *compiler, LSL_Leaf *type, LSL_Leaf *identifier, LSL_Leaf *open, LSL_Leaf *params, LSL_Leaf *close);
LSL_Leaf *addFunctionBody(LuaSL_compiler *compiler, LSL_Leaf *function, LSL_Leaf *block);
LSL_Leaf *addFunctionCall(LuaSL_compiler *compiler, LSL_Leaf *identifier, LSL_Leaf *open, LSL_Leaf *params, LSL_Leaf *close);
LSL_Leaf *addIfElse(LuaSL_compiler *compiler, LSL_Leaf *ifBlock, LSL_Leaf *elseBlock);
LSL_Leaf *addList(LSL_Leaf *left, LSL_Leaf *list, LSL_Leaf *right);
LSL_Leaf *addNumby(LSL_Leaf *numby);
LSL_Leaf *addOperation(LuaSL_compiler *compiler, LSL_Leaf *left, LSL_Leaf *lval, LSL_Leaf *right);
LSL_Leaf *addParameter(LuaSL_compiler *compiler, LSL_Leaf *type, LSL_Leaf *newParam);
LSL_Leaf *addParenthesis(LSL_Leaf *lval, LSL_Leaf *expr, LSL_Type type, LSL_Leaf *rval);
LSL_Leaf *addRotVec(LSL_Leaf *left, LSL_Leaf *list, LSL_Leaf *right);
LSL_Leaf *addState(LuaSL_compiler *compiler, LSL_Leaf *state, LSL_Leaf *identifier, LSL_Leaf *block);
LSL_Leaf *addStatement(LuaSL_compiler *compiler, LSL_Leaf *lval, LSL_Leaf *flow, LSL_Leaf *left, LSL_Leaf *expr, LSL_Leaf *right, LSL_Leaf *block, LSL_Leaf *identifier);
LSL_Leaf *addTypecast(LSL_Leaf *lval, LSL_Leaf *type, LSL_Leaf *rval, LSL_Leaf *expr);
LSL_Leaf *addVariable(LuaSL_compiler *compiler, LSL_Leaf *type, LSL_Leaf *identifier, LSL_Leaf *assignment, LSL_Leaf *expr);
LSL_Leaf *beginBlock(LuaSL_compiler *compiler, LSL_Leaf *block);
LSL_Leaf *checkVariable(LuaSL_compiler *compiler, LSL_Leaf *identifier, LSL_Leaf *dot, LSL_Leaf *sub);
LSL_Leaf *collectArguments(LuaSL_compiler *compiler, LSL_Leaf *list, LSL_Leaf *comma, LSL_Leaf *arg);
LSL_Leaf *collectParameters(LuaSL_compiler *compiler, LSL_Leaf *list, LSL_Leaf *comma, LSL_Leaf *newParam);
LSL_Leaf *collectStatements(LuaSL_compiler *compiler, LSL_Leaf *list, LSL_Leaf *newStatement);
void *ParseAlloc(void *(*mallocProc)(size_t));
void ParseTrace(FILE *TraceFILE, char *zTracePrompt);
void Parse(void *yyp, int yymajor, LSL_Leaf *yyminor, LuaSL_compiler *compiler);
void ParseFree(void *p, void (*freeProc)(void*));
#endif // __LUASL_LSL_TREE_H__
|