aboutsummaryrefslogtreecommitdiff
path: root/src
diff options
context:
space:
mode:
Diffstat (limited to 'src')
-rw-r--r--src/enzymatic.js160
-rw-r--r--src/parser.js574
-rw-r--r--src/utility.js14
3 files changed, 364 insertions, 384 deletions
diff --git a/src/enzymatic.js b/src/enzymatic.js
index c2c7979e..bb4458fe 100644
--- a/src/enzymatic.js
+++ b/src/enzymatic.js
@@ -7,29 +7,40 @@ DEBUG = false;
Substrate = function(name_) {
this.name_ = name_;
- this.items = [];
- this.zymes = [];
+ this.zymes = {};
this.currUid = 1;
};
Substrate.prototype = {
- addItem: function(item) {
- if (!item.__uid__) {
- item.__uid__ = this.currUid;
- this.currUid ++;
- }
- this.items.push(item);
+ addItem: function(item, targetZyme) {
+ this.addItems([item], targetZyme);
},
- addZyme: function(zyme) {
- var name_ = '?';
- if (typeof zyme == 'string') {
- name_ = zyme;
- zyme = arguments[1];
+ addItems: function(items, targetZyme) {
+ assert(targetZyme);
+ if (targetZyme == '/dev/null') return;
+ if (targetZyme == '/dev/stdout') {
+ this.results = this.results.concat(items);
+ return;
+ }
+ assert(this.zymes[targetZyme]);
+ for (var i = 0; i < items.length; i++) {
+ var item = items[i];
+ if (!item.__uid__) {
+ item.__uid__ = this.currUid;
+ this.currUid ++;
+ }
}
+ this.zymes[targetZyme].items = this.zymes[targetZyme].items.concat(items);
+ },
+
+ addZyme: function(name_, zyme) {
+ assert(name_ && zyme);
zyme.name_ = name_;
- this.zymes.push(zyme);
- if (!zyme.select) zyme.select = Zyme.prototype.select;
+ zyme.items = [];
+ zyme.forwardItem = bind(this, this.addItem);
+ zyme.forwardItems = bind(this, this.addItems);
+ this.zymes[name_] = zyme;
if (!zyme.process) zyme.process = Zyme.prototype.process;
},
@@ -42,7 +53,7 @@ Substrate.prototype = {
function midComment(force) {
var curr = Date.now();
if (curr - midTime > 1000 || force) {
- print('// Working on ' + that.name_ + ', so far ' + ((curr-startTime)/1000).toString().substr(0,10) + ' seconds. Have ' + that.items.length + ' items.');
+ print('// Working on ' + that.name_ + ', so far ' + ((curr-startTime)/1000).toString().substr(0,10) + ' seconds.');
midTime = curr;
}
}
@@ -50,111 +61,74 @@ Substrate.prototype = {
print('// Completed ' + that.name_ + ' in ' + ((Date.now() - startTime)/1000).toString().substr(0,10) + ' seconds.');
}
- // Naive solver - sheer brute force.
- // Assumes list of Zymes is non-changing.
- var results = [];
- while (true) {
- dprint('enzymatic', "Cycle start, " + this.items.length + " items.");
+ var finalResult = null;
+ this.results = [];
+ var finished = false;
+ var that = this;
+ while (!finished) {
+ dprint('enzymatic', "Cycle start, items: ");// + values(this.zymes).map(function(zyme) zyme.items).reduce(function(x,y) x+y, 0));
var hadProcessing = false;
- for (var z = 0; z < this.zymes.length; z++) {
+ values(this.zymes).forEach(function(zyme) {
midComment();
- var zyme = this.zymes[z];
- var selected = zyme.select(this.items);
- if (selected.length > 0) {
- if (DEBUG) print("Calling: " + (zyme.processItem ? zyme.processItem : zyme.process));
- if (DEBUG) {
- try {
- print("Inputs: \n---\n\n" + outputs.map(JSON.stringify).join('\n\n') + '\n\n---');
- } catch(e) {
- print("Inputs: \n---\n\n" + outputs + '\n\n---');
- }
- }
- hadProcessing = true;
- var outputs;
- try {
- dprint('Processing using ' + zyme.name_ + ': ' + selected.length + ' items out of ' + this.items.length);
- //PROF(true);
- outputs = zyme.process(selected);
- //PROF();
- } catch (e) {
- print("Exception, current selected are: " + selected.map(dump).join('\n\n'));
- print("Stack: " + dump(new Error().stack));
- throw e;
- }
- if (DEBUG) {
- try {
- print("Outputs: \n---\n\n" + outputs.map(JSON.stringify).join('\n\n') + '\n\n---');
- } catch(e) {
- print("Outputs: \n---\n\n" + outputs + '\n\n---');
- }
- }
+
+ if (zyme.items.length == 0) return;
+
+ var inputs = zyme.items.slice(0);
+ var outputs;
+ var currResultCount = that.results.length;
+ try {
+ dprint('Processing using ' + zyme.name_ + ': ' + inputs.length);
+ zyme.items = []; // More may be added in process(); we'll get to them next time
+ outputs = zyme.process(inputs);
+ dprint('New results: ' + (outputs.length + that.results.length - currResultCount) + ' out of ' + (that.results.length + outputs.length));
+ } catch (e) {
+ print("Exception, current selected are: " + inputs.map(dump).join('\n\n'));
+ print("Stack: " + dump(new Error().stack));
+ throw e;
+ }
+ hadProcessing = true;
+
+ if (outputs) {
if (outputs.length === 1 && outputs[0].__finalResult__) {
if (DEBUG) print("Solving complete: __finalResult__");
delete outputs[0].__finalResult__; // Might recycle this
delete outputs[0].__uid__;
finalComment();
- return outputs[0];
- }
- results = results.concat(outputs.filter(function(output) { return !!output.__result__; }))
- var nonResults = outputs.filter(function(output) { return !output.__result__; });
-
- var keptUids = {};
- for (var i = 0; i < nonResults.length; i++) {
- var s = nonResults[i];
- if (s.__uid__) {
- keptUids[s.__uid__] = true;
- } else {
- this.addItem(s);
- }
- }
- var droppedUids = {};
- for (var i = 0; i < selected.length; i++) {
- var s = selected[i];
- if (!keptUids[s.__uid__]) droppedUids[s.__uid__] = true;
+ finished = true;
+ finalResult = outputs[0];
+ } else {
+ that.results = that.results.concat(outputs);
}
- this.items = this.items.filter(function(item) {
- if (!droppedUids[item.__uid__]) {
- return true;
- } else {
- delete item.__uid__;
- }
- });
- //midComment(true);
}
- }
- if (this.items.length === 0) {
+ });
+ if (!hadProcessing) {
if (DEBUG) print("Solving complete: no remaining items");
finalComment();
- results.forEach(function(output) {
+ this.results.forEach(function(output) {
delete output.__result__; // Might recycle these
delete output.__uid__;
});
- return results;
+ return this.results;
}
- if (!hadProcessing) {
- print("Reached a dead end.");
- this.items.forEach(function(item) {
- print("remaining item:" + dump(item));
- });
- throw "failure";
+ if (finalResult) {
+ return finalResult;
}
midComment();
- this.items = this.items.filter(function(item) { return item !== null; });
}
},
};
Zyme = function() { };
Zyme.prototype = {
- select: function(items) {
- return items.filter(this.selectItem, this);
- },
process: function(items) {
var ret = [];
for (var i = 0; i < items.length; i++) {
var item = items[i];
try {
- ret = ret.concat(this.processItem(item));
+ var outputs = this.processItem(item);
+ if (outputs) {
+ ret = ret.concat(outputs);
+ }
} catch (e) {
print("Exception in process(), current item is: " + dump(item));
throw e;
diff --git a/src/parser.js b/src/parser.js
index f3ce9a68..0db8460a 100644
--- a/src/parser.js
+++ b/src/parser.js
@@ -156,6 +156,13 @@ function getTokenIndexByText(tokens, text) {
return i;
}
+function findTokenText(item, text) {
+ for (var i = 0; i < item.tokens.length; i++) {
+ if (item.tokens[i].text == text) return i;
+ }
+ return -1;
+}
+
// Splits a list of tokens separated by commas. For example, a list of arguments in a function call
function splitTokenList(tokens) {
if (tokens.length == 0) return [];
@@ -173,50 +180,51 @@ function splitTokenList(tokens) {
return ret;
}
-function makeSplitter(parentSlot, parentSlotValue, parentUnrequiredSlot, childSlot, copySlots) {
+// Splits an item, with the intent of later reintegration
+function splitItem(parent, childSlot, copySlots) {
+ if (!copySlots) copySlots = [];
+ if (!parent[childSlot]) parent[childSlot] = {};
+ var child = parent[childSlot];
+ parent[childSlot] = null;
+ child.parentUid = parent.__uid__;
+ child.parentSlot = childSlot;
+ child.parentLineNum = child.lineNum = parent.lineNum;
+ copySlots.forEach(function(slot) { child[slot] = parent[slot] });
return {
- selectItem: function(item) { return item[parentSlot] == parentSlotValue && !item[parentUnrequiredSlot] && item[childSlot] !== null },
- process: function(parents) {
- if (!copySlots) copySlots = [];
- var ret = parents.slice(0);
- for (var i = 0; i < parents.length; i++) {
- var parent = parents[i];
- var child = parent[childSlot];
- parent[childSlot] = null;
- child.parentUid = parent.__uid__;
- child.parentSlot = childSlot;
- child.lineNum = parent.lineNum; // Debugging
- copySlots.forEach(function(slot) { child[slot] = parent[slot] });
- ret.push(child);
- }
- return ret;
- },
+ parent: parent,
+ child: child,
};
}
-function makeCombiner(parentSlot, parentSlotValue, parentUnrequiredSlot, childRequiredSlot, finalizeFunc) {
+function makeReintegrator(afterFunc) {
+ // reintegration - find intermediate representation-parsed items and
+ // place back in parents TODO: Optimize this code to optimal O(..)
return {
- select: function(items) {
+ process: function(items) {
var ret = [];
- var parents = items.filter(function(item) { return item[parentSlot] == parentSlotValue && !item[parentUnrequiredSlot] });
- for (var i = 0; i < parents.length; i++) {
- var parent = parents[i];
- var child = items.filter(function(item) { return item[childRequiredSlot] && item.parentUid === parent.__uid__ })[0];
- if (child) {
- ret = ret.concat([parent, child]);
+ for (var i = 0; i < items.length; i++) {
+ var found = false;
+ if (items[i] && items[i].parentSlot) {
+ var child = items[i];
+ for (var j = 0; j < items.length; j++) {
+ if (items[j] && items[j].lineNum == items[i].parentLineNum) {
+ var parent = items[j];
+ // process the pair
+ parent[child.parentSlot] = child;
+ delete child.parentLineNum;
+ afterFunc.call(this, parent, child);
+
+ items[i] = null;
+ items[j] = null;
+ found = true;
+ break;
+ }
+ }
}
}
+ this.forwardItems(items.filter(function(item) { return !!item }), this.name_); // next time hopefully
return ret;
- },
- process: function(items) {
- return Zyme.prototype.processPairs(items, function(parent, child) {
- parent[child.parentSlot] = child;
- delete child.parentUid;
- delete child.parentSlot;
- finalizeFunc(parent);
- return [parent];
- });
- },
+ }
};
}
@@ -273,6 +281,7 @@ function cleanSegment(segment) {
// Expects one of the several LVM getelementptr formats:
// a qualifier, a type, a null, then an () item with tokens
function parseGetElementPtr(segment) {
+//print("Parse GTP: " + dump(segment));
segment = segment.slice(0);
segment = cleanSegment(segment);
assertTrue(['inreg', 'byval'].indexOf(segment[1].text) == -1);
@@ -371,24 +380,8 @@ function intertyper(data) {
substrate = new Substrate('Intertyper');
- // Input
-
- substrate.addItem({
- llvmText: data,
- });
-
- // Tools
-
- function findTokenText(item, text) {
- for (var i = 0; i < item.tokens.length; i++) {
- if (item.tokens[i].text == text) return i;
- }
- return -1;
- }
-
// Line splitter.
substrate.addZyme('LineSplitter', {
- selectItem: function(item) { return !!item.llvmText; },
processItem: function(item) {
var lines = item.llvmText.split('\n');
var ret = [];
@@ -412,15 +405,13 @@ function intertyper(data) {
}
}
}
- return ret.filter(function(item) { return item.lineText; });
+ this.forwardItems(ret.filter(function(item) { return item.lineText; }), 'Tokenizer');
},
});
// Line tokenizer
substrate.addZyme('Tokenizer', {
- selectItem: function(item) { return item.lineText; },
- processItem: function(item) {
- //print("line: " + item.lineText);
+ processItem: function(item, inner) {
var lineText = item.lineText + " ";
var tokens = [];
var tokenStart = -1;
@@ -458,7 +449,7 @@ function intertyper(data) {
if (token.text[0] in enclosers) {
token.item = that.processItem({
lineText: token.text.substr(1, token.text.length-2)
- });
+ }, true);
token.type = token.text[0];
}
if (indent == -1) {
@@ -520,29 +511,86 @@ function intertyper(data) {
}
}
}
- return [{
+ var item = {
tokens: tokens,
indent: indent,
lineNum: item.lineNum,
- }];
+ };
+ if (inner) {
+ return [item];
+ } else {
+ this.forwardItem(item, 'Triager');
+ }
+ },
+ });
+
+ substrate.addZyme('Triager', {
+ processItem: function(item) {
+ function triage() {
+ if (!item.intertype) {
+ if (item.tokens[0].text in searchable(';', 'target'))
+ return '/dev/null';
+ if (item.tokens.length >= 3 && item.indent === 0 && item.tokens[1].text == '=')
+ return 'Global';
+ if (item.tokens.length >= 4 && item.indent === 0 && item.tokens[0].text == 'define' &&
+ item.tokens.slice(-1)[0].text == '{')
+ return 'FuncHeader';
+ if (item.tokens.length >= 1 && item.indent === 0 && item.tokens[0].text.substr(-1) == ':')
+ return 'Label';
+ if (item.indent === 2 && item.tokens && item.tokens.length >= 3 && findTokenText(item, '=') >= 0 &&
+ !item.intertype)
+ return 'Assign';
+ if (!item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'load')
+ return 'Load';
+ if (!item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'bitcast')
+ return 'Bitcast';
+ if (!item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'getelementptr')
+ return 'GEP';
+ if (item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'call' && !item.intertype)
+ return 'Call';
+ if (item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'invoke' && !item.intertype)
+ return 'Invoke';
+ if (!item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'alloca')
+ return 'Alloca';
+ if (item.indent === -1 && item.tokens && item.tokens.length >= 3 &&
+ ['add', 'sub', 'sdiv', 'mul', 'icmp', 'zext', 'urem', 'srem', 'fadd', 'fsub', 'fmul', 'fdiv', 'fcmp', 'uitofp', 'sitofp', 'fpext', 'fptrunc', 'fptoui', 'fptosi', 'trunc', 'sext', 'select', 'shl', 'shr', 'ashl', 'ashr', 'lshr', 'lshl', 'xor', 'or', 'and', 'ptrtoint', 'inttoptr'].indexOf(item.tokens[0].text) != -1 && !item.intertype)
+ return 'Mathops';
+ if (item.indent === 2 && item.tokens && item.tokens.length >= 5 && item.tokens[0].text == 'store' &&
+ !item.intertype)
+ return 'Store';
+ if (item.indent === 2 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'br' &&
+ !item.intertype)
+ return 'Branch';
+ if (item.indent === 2 && item.tokens && item.tokens.length >= 2 && item.tokens[0].text == 'ret' &&
+ !item.intertype)
+ return 'Return';
+ if (item.indent === 2 && item.tokens && item.tokens.length >= 2 && item.tokens[0].text == 'switch' &&
+ !item.intertype)
+ return 'Switch';
+ if (item.indent === 0 && item.tokens && item.tokens.length >= 1 && item.tokens[0].text == '}' && !item.intertype)
+ return 'FuncEnd';
+ if (item.indent === 0 && item.tokens && item.tokens.length >= 4 && item.tokens[0].text == 'declare' &&
+ !item.intertype)
+ return 'External';
+ if (item.indent === 2 && item.tokens && item.tokens[0].text == 'unreachable' &&
+ !item.intertype)
+ return 'Unreachable';
+ } else {
+ // Already intertyped
+ if (item.parentSlot)
+ return 'Reintegrator';
+ }
+ print("Item: " + JSON.stringify(item));
+ assert(false);
+ }
+ this.forwardItem(item, triage(item));
},
});
// Line parsers to intermediate form
- // Comment
- substrate.addZyme('Comment', {
- selectItem: function(item) { return item.tokens && item.tokens[0].text == ';' },
- processItem: function(item) { return [] },
- });
- // target
- substrate.addZyme('Target', {
- selectItem: function(item) { return item.tokens && item.tokens[0].text == 'target' },
- processItem: function(item) { return [] },
- });
// globals: type or variable
substrate.addZyme('Global', {
- selectItem: function(item) { return item.tokens && item.tokens.length >= 3 && item.indent === 0 && item.tokens[1].text == '=' },
processItem: function(item) {
if (item.tokens[2].text == 'type') {
//dprint('type/const linenum: ' + item.lineNum + ':' + dump(item));
@@ -560,7 +608,7 @@ function intertyper(data) {
}
}
return [{
- __result__: true,
+ __result__: true, // XXX can remove these
intertype: 'type',
name_: item.tokens[0].text,
fields: fields,
@@ -595,8 +643,6 @@ function intertyper(data) {
});
// function header
substrate.addZyme('FuncHeader', {
- selectItem: function(item) { return item.tokens && item.tokens.length >= 4 && item.indent === 0 && item.tokens[0].text == 'define' &&
- item.tokens.slice(-1)[0].text == '{' },
processItem: function(item) {
item.tokens = item.tokens.filter(function(token) {
return ['internal', 'signext', 'zeroext', 'nounwind', 'define', 'linkonce_odr', 'inlinehint', '{'].indexOf(token.text) == -1;
@@ -613,7 +659,6 @@ function intertyper(data) {
});
// label
substrate.addZyme('Label', {
- selectItem: function(item) { return item.tokens && item.tokens.length >= 1 && item.indent === 0 && item.tokens[0].text.substr(-1) == ':' },
processItem: function(item) {
return [{
__result__: true,
@@ -623,59 +668,35 @@ function intertyper(data) {
}];
},
});
+
// assignment
substrate.addZyme('Assign', {
- selectItem: function(item) { return item.indent === 2 && item.tokens && item.tokens.length >= 3 && findTokenText(item, '=') >= 0 &&
- !item.intertype },
processItem: function(item) {
var opIndex = findTokenText(item, '=');
- return [{
+ var pair = splitItem({
intertype: 'assign',
ident: combineTokens(item.tokens.slice(0, opIndex)).text,
- value: null,
lineNum: item.lineNum,
- }, { // Additional token, to be parsed, and later re-integrated
+ }, 'value');
+ this.forwardItem(pair.parent, 'Reintegrator');
+ this.forwardItem(mergeInto(pair.child, { // Additional token, to be triaged and later re-integrated
indent: -1,
tokens: item.tokens.slice(opIndex+1),
- parentLineNum: item.lineNum,
- parentSlot: 'value',
- }];
+ }), 'Triager');
},
});
// reintegration - find intermediate representation-parsed items and
- // place back in parents
- substrate.addZyme('Reintegrator', {
- select: function(items) {
- var ret = [];
- for (var i = 0; i < items.length; i++) {
- if (items[i].parentSlot && items[i].intertype) {
- for (var j = 0; j < items.length; j++) {
- if (items[j].lineNum == items[i].parentLineNum) {
- ret = ret.concat([items[j], items[i]]);
- }
- }
- }
- }
- return ret;
- },
- process: function(items) {
- return Zyme.prototype.processPairs(items, function(parent, child) {
- parent[child.parentSlot] = child;
- parent.__result__ = true;
- delete child.parentLineNum;
-
- // Special re-integration behaviors
- if (child.intertype == 'fastgetelementptrload') {
- parent.intertype = 'fastgetelementptrload';
- }
-
- return [parent];
- });
+ // place back in parents TODO: Optimize this code to optimal O(..)
+ substrate.addZyme('Reintegrator', makeReintegrator(function(parent, child) {
+ // Special re-integration behaviors
+ if (child.intertype == 'fastgetelementptrload') {
+ parent.intertype = 'fastgetelementptrload';
}
- });
+ this.forwardItem(parent, '/dev/stdout');
+ }));
+
// 'load'
substrate.addZyme('Load', {
- selectItem: function(item) { return !item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'load' },
processItem: function(item) {
item.pointerType = item.tokens[1];
item.type = { text: removePointing(item.pointerType.text) };
@@ -692,30 +713,28 @@ function intertyper(data) {
} else {
item.intertype = 'load';
if (item.tokens[2].text == 'bitcast') {
- item.pointer = item.tokens[3].item[0].tokens[1]; // XXX item without [0], also below
+ item.pointer = item.tokens[3].item[0].tokens[1];
item.originalType = item.tokens[3].item[0].tokens[0];
} else {
item.pointer = item.tokens[2];
}
}
item.ident = item.pointer.text;
- return [item];
+ this.forwardItem(item, 'Reintegrator');
},
});
// 'bitcast'
substrate.addZyme('Bitcast', {
- selectItem: function(item) { return !item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'bitcast' },
processItem: function(item) {
item.intertype = 'bitcast';
item.type = item.tokens[1];
item.ident = item.tokens[2].text;
item.type2 = item.tokens[4];
- return [item];
+ this.forwardItem(item, 'Reintegrator');
},
});
// 'getelementptr'
substrate.addZyme('GEP', {
- selectItem: function(item) { return !item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'getelementptr' },
processItem: function(item) {
var last = getTokenIndexByText(item.tokens, ';');
var segment = [ item.tokens[1], { text: null }, null, { item: [ {
@@ -726,12 +745,11 @@ function intertyper(data) {
item.type = data.type;
item.params = data.params;
item.ident = data.ident;
- return [item];
+ this.forwardItem(item, 'Reintegrator');
},
});
// 'call'
substrate.addZyme('Call', {
- selectItem: function(item) { return item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'call' && !item.intertype },
processItem: function(item) {
item.intertype = 'call';
if (['signext', 'zeroext'].indexOf(item.tokens[1].text) != -1) {
@@ -749,13 +767,13 @@ function intertyper(data) {
// standalone call - not in assign
item.standalone = true;
item.__result__ = true;
+ return [item];
}
- return [item];
+ this.forwardItem(item, 'Reintegrator');
},
});
// 'invoke'
substrate.addZyme('Invoke', {
- selectItem: function(item) { return item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'invoke' && !item.intertype },
processItem: function(item) {
item.intertype = 'invoke';
item.type = item.tokens[1];
@@ -773,26 +791,23 @@ function intertyper(data) {
// standalone call - not in assign
item.standalone = true;
item.__result__ = true;
+ return [item];
}
- return [item];
+ this.forwardItem(item, 'Reintegrator');
},
});
// 'alloca'
substrate.addZyme('Alloca', {
- selectItem: function(item) { return !item.intertype && item.indent === -1 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'alloca' },
processItem: function(item) {
item.intertype = 'alloca';
item.allocatedType = item.tokens[1];
item.type = { text: addPointing(item.tokens[1].text) }; // type of pointer we will get
item.type2 = { text: item.tokens[1].text }; // value we will create, and get a pointer to
- return [item];
+ this.forwardItem(item, 'Reintegrator');
},
});
// mathops
substrate.addZyme('Mathops', {
- selectItem: function(item) { return item.indent === -1 && item.tokens && item.tokens.length >= 3 &&
- ['add', 'sub', 'sdiv', 'mul', 'icmp', 'zext', 'urem', 'srem', 'fadd', 'fsub', 'fmul', 'fdiv', 'fcmp', 'uitofp', 'sitofp', 'fpext', 'fptrunc', 'fptoui', 'fptosi', 'trunc', 'sext', 'select', 'shl', 'shr', 'ashl', 'ashr', 'lshr', 'lshl', 'xor', 'or', 'and', 'ptrtoint', 'inttoptr']
- .indexOf(item.tokens[0].text) != -1 && !item.intertype },
processItem: function(item) {
item.intertype = 'mathop';
item.op = item.tokens[0].text;
@@ -808,13 +823,11 @@ function intertyper(data) {
item.ident3 = item.tokens[5] ? item.tokens[5].text : null;
item.ident4 = item.tokens[8] ? item.tokens[8].text : null;
//print('// zz got maptop ' + item.op + ',' + item.variant + ',' + item.ident + ',' + item.value);
- return [item];
+ this.forwardItem(item, 'Reintegrator');
},
});
// 'store'
substrate.addZyme('Store', {
- selectItem: function(item) { return item.indent === 2 && item.tokens && item.tokens.length >= 5 && item.tokens[0].text == 'store' &&
- !item.intertype },
processItem: function(item) {
if (item.tokens[3].text != ',') {
assertEq(item.tokens[2].text, 'getelementptr');
@@ -846,8 +859,6 @@ function intertyper(data) {
});
// 'br'
substrate.addZyme('Branch', {
- selectItem: function(item) { return item.indent === 2 && item.tokens && item.tokens.length >= 3 && item.tokens[0].text == 'br' &&
- !item.intertype },
processItem: function(item) {
if (item.tokens[1].text == 'label') {
return [{
@@ -870,8 +881,6 @@ function intertyper(data) {
});
// 'ret'
substrate.addZyme('Return', {
- selectItem: function(item) { return item.indent === 2 && item.tokens && item.tokens.length >= 2 && item.tokens[0].text == 'ret' &&
- !item.intertype },
processItem: function(item) {
return [{
__result__: true,
@@ -884,8 +893,6 @@ function intertyper(data) {
});
// 'switch'
substrate.addZyme('Switch', {
- selectItem: function(item) { return item.indent === 2 && item.tokens && item.tokens.length >= 2 && item.tokens[0].text == 'switch' &&
- !item.intertype },
processItem: function(item) {
function parseSwitchLabels(item) {
var ret = [];
@@ -912,7 +919,6 @@ function intertyper(data) {
});
// function end
substrate.addZyme('FuncEnd', {
- selectItem: function(item) { return item.indent === 0 && item.tokens && item.tokens.length >= 1 && item.tokens[0].text == '}' && !item.intertype },
processItem: function(item) {
return [{
__result__: true,
@@ -923,8 +929,6 @@ function intertyper(data) {
});
// external function stub
substrate.addZyme('External', {
- selectItem: function(item) { return item.indent === 0 && item.tokens && item.tokens.length >= 4 && item.tokens[0].text == 'declare' &&
- !item.intertype },
processItem: function(item) {
return [{
__result__: true,
@@ -938,8 +942,6 @@ function intertyper(data) {
});
// 'unreachable'
substrate.addZyme('Unreachable', {
- selectItem: function(item) { return item.indent === 2 && item.tokens && item.tokens[0].text == 'unreachable' &&
- !item.intertype },
processItem: function(item) {
return [{
__result__: true,
@@ -949,6 +951,12 @@ function intertyper(data) {
},
});
+ // Input
+
+ substrate.addItem({
+ llvmText: data,
+ }, 'LineSplitter');
+
return substrate.solve();
}
@@ -969,23 +977,16 @@ function analyzer(data) {
//print('zz analaz')
substrate = new Substrate('Analyzer');
- substrate.addItem({
- items: data,
- });
-
// Sorter
substrate.addZyme('Sorter', {
- selectItem: function(item) { return !item.sorted; },
processItem: function(item) {
item.items.sort(function (a, b) { return a.lineNum - b.lineNum });
- item.sorted = true;
- return [item];
+ this.forwardItem(item, 'Gatherer');
},
});
// Gatherer
substrate.addZyme('Gatherer', {
- selectItem: function(item) { return item.sorted && !item.gathered; },
processItem: function(item) {
// Single-liners
['globalVariable', 'functionStub', 'type'].forEach(function(intertype) {
@@ -1016,14 +1017,12 @@ function analyzer(data) {
}
}
delete item.items;
- item.gathered = true;
- return [item];
+ this.forwardItem(item, 'Identinicer');
},
});
// IdentiNicer
substrate.addZyme('Identinicer', {
- selectItem: function(item) { return item.gathered && !item.identiniced; },
processItem: function(output) {
walkJSON(output, function(item) {
['', '2', '3', '4', '5'].forEach(function(ext) {
@@ -1031,8 +1030,7 @@ function analyzer(data) {
item['ident' + ext] = toNiceIdent(item['ident' + ext]);
});
});
- output.identiniced = true;
- return [output];
+ this.forwardItem(output, 'Typevestigator');
}
});
@@ -1065,7 +1063,6 @@ function analyzer(data) {
// Typevestigator
substrate.addZyme('Typevestigator', {
- selectItem: function(item) { return item.gathered && !item.typevestigated; },
processItem: function(data) {
// Convert types list to dict
var old = data.types;
@@ -1082,14 +1079,12 @@ function analyzer(data) {
addType(!item.type2.text ? item.type2 : item.type2.text, data);
}
});
- data.typevestigated = true;
- return [data];
+ this.forwardItem(data, 'Typeanalyzer');
}
});
// Type analyzer
- substrate.addZyme('Type Analyzer', {
- selectItem: function(item) { return item.typevestigated && !item.typed; },
+ substrate.addZyme('Typeanalyzer', {
processItem: function(item) {
//print('zz analaz types')
// 'fields' is the raw list of LLVM fields. However, we embed
@@ -1152,14 +1147,12 @@ function analyzer(data) {
});
}
- item.typed = true;
- return [item];
+ this.forwardItem(item, 'VariableAnalyzer');
},
});
// Variable analyzer
- substrate.addZyme('Variable Analyzer', {
- selectItem: function(item) { return item.typevestigated && !item.variablized; },
+ substrate.addZyme('VariableAnalyzer', {
processItem: function(item) {
item.functions.forEach(function(func) {
func.variables = {};
@@ -1233,18 +1226,16 @@ function analyzer(data) {
//print('// var ' + vname + ': ' + JSON.stringify(variable));
}
});
- item.variablized = true;
- return [item];
+ this.forwardItem(item, 'Relooper');
},
});
// ReLooper - reconstruct nice loops, as much as possible
substrate.addZyme('Relooper', {
- selectItem: function(item) { return item.variablized && !item.relooped },
processItem: function(item) {
+ var that = this;
function finish() {
- item.relooped = true;
- return [item];
+ that.forwardItem(item, 'Optimizer');
}
// Tools
@@ -1651,10 +1642,9 @@ print('// zz Merged away! ' + label2.ident + ' into ' + label1.ident);
// Optimizer
substrate.addZyme('Optimizer', {
- selectItem: function(item) { return item.relooped && !item.optimized; },
processItem: function(item) {
+ var that = this;
function finish() {
- item.optimized = true;
item.__finalResult__ = true;
return [item];
}
@@ -1845,6 +1835,10 @@ print('// zz Merged away! ' + label2.ident + ' into ' + label1.ident);
},
});
+ substrate.addItem({
+ items: data,
+ }, 'Sorter');
+
return substrate.solve();
}
@@ -1852,20 +1846,10 @@ print('// zz Merged away! ' + label2.ident + ' into ' + label1.ident);
function JSify(data) {
substrate = new Substrate('JSifyer');
- [].concat(values(data.types).filter(function(type) { return type.lineNum != '?' }))
- .concat(data.globalVariables)
- .concat(data.functions)
- .concat(data.functionStubs)
- .forEach(function(item) {
- item.passes = {};
- substrate.addItem(item);
- });
-
var TYPES = data.types;
// type
substrate.addZyme('Type', {
- selectItem: function(item) { return item.intertype == 'type' && !item.JS },
processItem: function(item) {
var type = TYPES[item.name_];
if (type.needsFlattening) {
@@ -1980,7 +1964,6 @@ function JSify(data) {
// globalVariablw
substrate.addZyme('GlobalVariable', {
- selectItem: function(item) { return item.intertype == 'globalVariable' && !item.JS },
processItem: function(item) {
dprint('gconst', '// zz global Cons: ' + dump(item) + ' :: ' + dump(item.value));
if (item.ident == '_llvm_global_ctors') {
@@ -2000,7 +1983,6 @@ function JSify(data) {
// functionStub
substrate.addZyme('FunctionStub', {
- selectItem: function(item) { return item.intertype == 'functionStub' && !item.JS },
processItem: function(item) {
var shortident = item.ident.substr(1);
if (shortident in Snippets) {
@@ -2015,7 +1997,6 @@ function JSify(data) {
// function splitter
substrate.addZyme('FunctionSplitter', {
- selectItem: function(item) { return item.intertype == 'function' && !item.passes.splitted },
processItem: function(item) {
var ret = [item];
item.splitItems = 0;
@@ -2029,114 +2010,102 @@ function JSify(data) {
});
});
- item.passes.splitted = true;
- return ret;
+ this.forwardItems(ret, 'FuncLineTriager');
},
});
// function reconstructor & post-JS optimizer
substrate.addZyme('FunctionReconstructor', {
- select: function(items) {
- var funcs = items.filter(function(item) { return item.intertype == 'function' && item.passes.splitted });
- return funcs.map(function(func) {
- var lines = items.filter(function(item) { return item.JS && item.func === func.ident });
- if (lines.length === 0) return [];
- return [func].concat(lines);
- }).reduce(concatenator, []);
- },
- process: function(allItems) {
- var ret = [];
- for (var i = 0; i < allItems.length;) {
- var func = allItems[i];
- var j = i+1;
- while (j < allItems.length && allItems[j].intertype != 'function') j++;
- var lines = allItems.slice(i+1, j);
- i = j;
-
- lines.forEach(function(line) {
- delete line.funcData; // clean up
-
- var label = func.labels.filter(function(label) { return la