// Source: CyberChef/src/core/operations/Code.js (originally 426 lines, 11 KiB, JavaScript)

var Utils = require("../Utils.js"),
VKbeautify = require("vkbeautify"),
dom = require("xmldom").DOMParser,
xpath = require("xpath"),
prettyPrintOne = require("exports-loader?prettyPrintOne!google-code-prettify/bin/prettify.min.js");
/**
 * Code operations.
 *
 * @author n1474335 [n1474335@gmail.com]
 * @copyright Crown Copyright 2016
 * @license Apache-2.0
 *
 * @namespace
 */
var Code = module.exports = {
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* @constant
* @default
*/
LANGUAGES: ["default-code", "default-markup", "bash", "bsh", "c", "cc", "coffee", "cpp", "cs", "csh", "cv", "cxx", "cyc", "htm", "html", "in.tag", "java", "javascript", "js", "json", "m", "mxml", "perl", "pl", "pm", "py", "python", "rb", "rc", "rs", "ruby", "rust", "sh", "uq.val", "xhtml", "xml", "xsl"],
/**
* @constant
* @default
*/
LINE_NUMS: false,
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* Syntax highlighter operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {html}
*/
runSyntaxHighlight: function(input, args) {
2016-11-28 11:42:58 +01:00
var language = args[0],
lineNums = args[1];
return "<code class='prettyprint'>" + prettyPrintOne(Utils.escapeHtml(input), language, lineNums) + "</code>";
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* @constant
* @default
*/
BEAUTIFY_INDENT: "\\t",
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* XML Beautify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runXmlBeautify: function(input, args) {
var indentStr = args[0];
return VKbeautify.xml(input, indentStr);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* JSON Beautify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runJsonBeautify: function(input, args) {
var indentStr = args[0];
if (!input) return "";
return VKbeautify.json(input, indentStr);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* CSS Beautify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runCssBeautify: function(input, args) {
var indentStr = args[0];
return VKbeautify.css(input, indentStr);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* SQL Beautify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runSqlBeautify: function(input, args) {
var indentStr = args[0];
return VKbeautify.sql(input, indentStr);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* @constant
* @default
*/
PRESERVE_COMMENTS: false,
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* XML Minify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runXmlMinify: function(input, args) {
var preserveComments = args[0];
return VKbeautify.xmlmin(input, preserveComments);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* JSON Minify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runJsonMinify: function(input, args) {
if (!input) return "";
return VKbeautify.jsonmin(input);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* CSS Minify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runCssMinify: function(input, args) {
var preserveComments = args[0];
return VKbeautify.cssmin(input, preserveComments);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* SQL Minify operation.
*
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runSqlMinify: function(input, args) {
return VKbeautify.sqlmin(input);
2016-11-28 11:42:58 +01:00
},
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
/**
* Generic Code Beautify operation.
*
* Yeeeaaah...
*
* I'm not proud of this code, but seriously, try writing a generic lexer and parser that
* correctly generates an AST for multiple different languages. I have tried, and I can tell
* you it's pretty much impossible.
2016-12-14 17:39:17 +01:00
*
2016-11-28 11:42:58 +01:00
* This basically works. That'll have to be good enough. It's not meant to produce working code,
* just slightly more readable code.
2016-12-14 17:39:17 +01:00
*
2016-11-28 11:42:58 +01:00
* Things that don't work:
* - For loop formatting
* - Do-While loop formatting
* - Switch/Case indentation
* - Bit shift operators
*
* @author n1474335 [n1474335@gmail.com]
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runGenericBeautify: function(input, args) {
2016-11-28 11:42:58 +01:00
var code = input,
t = 0,
preservedTokens = [],
2016-11-28 11:42:58 +01:00
m;
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove strings
var sstrings = /'([^'\\]|\\.)*'/g;
2016-12-14 17:39:17 +01:00
while ((m = sstrings.exec(code))) {
code = preserveToken(code, m, t++);
2016-11-28 11:42:58 +01:00
sstrings.lastIndex = m.index;
}
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
var dstrings = /"([^"\\]|\\.)*"/g;
2016-12-14 17:39:17 +01:00
while ((m = dstrings.exec(code))) {
code = preserveToken(code, m, t++);
2016-11-28 11:42:58 +01:00
dstrings.lastIndex = m.index;
}
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove comments
var scomments = /\/\/[^\n\r]*/g;
2016-12-14 17:39:17 +01:00
while ((m = scomments.exec(code))) {
code = preserveToken(code, m, t++);
2016-11-28 11:42:58 +01:00
scomments.lastIndex = m.index;
}
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
var mcomments = /\/\*[\s\S]*?\*\//gm;
2016-12-14 17:39:17 +01:00
while ((m = mcomments.exec(code))) {
code = preserveToken(code, m, t++);
2016-11-28 11:42:58 +01:00
mcomments.lastIndex = m.index;
}
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
var hcomments = /(^|\n)#[^\n\r#]+/g;
2016-12-14 17:39:17 +01:00
while ((m = hcomments.exec(code))) {
code = preserveToken(code, m, t++);
2016-11-28 11:42:58 +01:00
hcomments.lastIndex = m.index;
}
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove regexes
var regexes = /\/.*?[^\\]\/[gim]{0,3}/gi;
2016-12-14 17:39:17 +01:00
while ((m = regexes.exec(code))) {
code = preserveToken(code, m, t++);
2016-11-28 11:42:58 +01:00
regexes.lastIndex = m.index;
}
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Create newlines after ;
code = code.replace(/;/g, ";\n");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Create newlines after { and around }
code = code.replace(/{/g, "{\n");
code = code.replace(/}/g, "\n}\n");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove carriage returns
code = code.replace(/\r/g, "");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove all indentation
code = code.replace(/^\s+/g, "");
code = code.replace(/\n\s+/g, "\n");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove trailing spaces
code = code.replace(/\s*$/g, "");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove newlines before {
code = code.replace(/\n{/g, "{");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Indent
var i = 0,
level = 0;
while (i < code.length) {
2017-02-09 16:09:33 +01:00
switch (code[i]) {
2016-11-28 11:42:58 +01:00
case "{":
level++;
break;
case "\n":
if (i+1 >= code.length) break;
2016-12-14 17:39:17 +01:00
if (code[i+1] === "}") level--;
2016-11-28 11:42:58 +01:00
var indent = (level >= 0) ? Array(level*4+1).join(" ") : "";
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
code = code.substring(0, i+1) + indent + code.substring(i+1);
if (level > 0) i += level*4;
break;
}
i++;
}
// Add strategic spaces
code = code.replace(/\s*([!<>=+-/*]?)=\s*/g, " $1= ");
code = code.replace(/\s*<([=]?)\s*/g, " <$1 ");
code = code.replace(/\s*>([=]?)\s*/g, " >$1 ");
code = code.replace(/([^+])\+([^+=])/g, "$1 + $2");
code = code.replace(/([^-])-([^-=])/g, "$1 - $2");
code = code.replace(/([^*])\*([^*=])/g, "$1 * $2");
code = code.replace(/([^/])\/([^/=])/g, "$1 / $2");
code = code.replace(/\s*,\s*/g, ", ");
code = code.replace(/\s*{/g, " {");
code = code.replace(/}\n/g, "}\n\n");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Just... don't look at this
code = code.replace(/(if|for|while|with|elif|elseif)\s*\(([^\n]*)\)\s*\n([^{])/gim, "$1 ($2)\n $3");
code = code.replace(/(if|for|while|with|elif|elseif)\s*\(([^\n]*)\)([^{])/gim, "$1 ($2) $3");
code = code.replace(/else\s*\n([^{])/gim, "else\n $1");
code = code.replace(/else\s+([^{])/gim, "else $1");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Remove strategic spaces
code = code.replace(/\s+;/g, ";");
code = code.replace(/\{\s+\}/g, "{}");
code = code.replace(/\[\s+\]/g, "[]");
code = code.replace(/}\s*(else|catch|except|finally|elif|elseif|else if)/gi, "} $1");
2016-12-14 17:39:17 +01:00
2016-11-28 11:42:58 +01:00
// Replace preserved tokens
var ptokens = /###preservedToken(\d+)###/g;
2016-12-14 17:39:17 +01:00
while ((m = ptokens.exec(code))) {
var ti = parseInt(m[1], 10);
code = code.substring(0, m.index) + preservedTokens[ti] + code.substring(m.index + m[0].length);
2016-11-28 11:42:58 +01:00
ptokens.lastIndex = m.index;
}
return code;
2016-12-14 17:39:17 +01:00
/**
* Replaces a matched token with a placeholder value.
*/
function preserveToken(str, match, t) {
preservedTokens[t] = match[0];
2016-11-28 11:42:58 +01:00
return str.substring(0, match.index) +
"###preservedToken" + t + "###" +
2016-11-28 11:42:58 +01:00
str.substring(match.index + match[0].length);
}
},
/**
 * Empty string.
 * NOTE(review): presumably the initial value of the XPath query argument
 * (args[0] of runXpath) - confirm against the operation config.
 *
 * @constant
 * @default
 */
XPATH_INITIAL: "",
/**
 * The two-character string backslash + "n" (an escaped newline, not a
 * literal newline character).
 * NOTE(review): presumably the default result delimiter (args[1] of
 * runXpath), unescaped by the caller - confirm.
 *
 * @constant
 * @default
 */
XPATH_DELIMITER: "\\n",
/**
* XPath expression operation.
*
* @author Mikescher (https://github.com/Mikescher | https://mikescher.com)
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runXpath:function(input, args) {
var query = args[0],
delimiter = args[1];
var doc;
try {
doc = new dom().parseFromString(input);
} catch (err) {
return "Invalid input XML.";
}
var nodes;
try {
nodes = xpath.select(query, doc);
} catch (err) {
return "Invalid XPath. Details:\n" + err.message;
}
var nodeToString = function(node) {
return node.toString();
};
return nodes.map(nodeToString).join(delimiter);
},
/**
 * Empty string.
 * NOTE(review): presumably the initial value of the CSS selector argument
 * (args[0] of runCSSQuery) - confirm against the operation config.
 *
 * @constant
 * @default
 */
CSS_SELECTOR_INITIAL: "",
/**
 * The two-character string backslash + "n" (an escaped newline, not a
 * literal newline character).
 * NOTE(review): presumably the default result delimiter (args[1] of
 * runCSSQuery), unescaped by the caller - confirm.
 *
 * @constant
 * @default
 */
CSS_QUERY_DELIMITER: "\\n",
/**
* CSS selector operation.
*
* @author Mikescher (https://github.com/Mikescher | https://mikescher.com)
* @author n1474335 [n1474335@gmail.com]
* @param {string} input
* @param {Object[]} args
* @returns {string}
*/
runCSSQuery: function(input, args) {
var query = args[0],
delimiter = args[1],
parser = new DOMParser(),
html,
result;
if (!query.length || !input.length) {
return "";
}
try {
html = parser.parseFromString(input, "text/html");
} catch (err) {
return "Invalid input HTML.";
}
try {
result = html.querySelectorAll(query);
} catch (err) {
return "Invalid CSS Selector. Details:\n" + err.message;
}
var nodeToString = function(node) {
switch (node.nodeType) {
case Node.ELEMENT_NODE: return node.outerHTML;
case Node.ATTRIBUTE_NODE: return node.value;
case Node.COMMENT_NODE: return node.data;
case Node.TEXT_NODE: return node.wholeText;
case Node.DOCUMENT_NODE: return node.outerHTML;
default: throw new Error("Unknown Node Type: " + node.nodeType);
}
};
return Array.apply(null, Array(result.length))
.map(function(_, i) {
return result[i];
})
.map(nodeToString)
.join(delimiter);
},
2016-11-28 11:42:58 +01:00
};