import Utils from "../Utils.js";
2017-03-27 20:39:04 +02:00
import * as JsDiff from "diff";
2016-11-28 11:42:58 +01:00
/**
 * String utility operations.
 *
 * @author n1474335
 * @copyright Crown Copyright 2016
 * @license Apache-2.0
 *
 * @namespace
 */
const StrUtils = {

    /**
     * Named regular expression presets: each entry pairs a display name with the
     * source text of a pattern.
     *
     * NOTE(review): the line naming this property was missing from the reviewed
     * source; REGEX_PRE_POPULATE is an assumed name - confirm against the code
     * that consumes this list.
     *
     * @constant
     * @default
     */
    REGEX_PRE_POPULATE: [
        {
            name: "User defined",
            value: ""
        },
        {
            name: "IPv4 address",
            value: "(?:(?:\\d|[01]?\\d\\d|2[0-4]\\d|25[0-5])\\.){3}(?:25[0-5]|2[0-4]\\d|[01]?\\d\\d|\\d)(?:\\/\\d{1,2})?"
        },
        {
            name: "IPv6 address",
            value: "((?=.*::)(?!.*::.+::)(::)?([\\dA-Fa-f]{1,4}:(:|\\b)|){5}|([\\dA-Fa-f]{1,4}:){6})((([\\dA-Fa-f]{1,4}((?!\\3)::|:\\b|(?![\\dA-Fa-f])))|(?!\\2\\3)){2}|(((2[0-4]|1\\d|[1-9])?\\d|25[0-5])\\.?\\b){4})"
        },
        {
            name: "Email address",
            value: "(\\w[-.\\w]*)@([-\\w]+(?:\\.[-\\w]+)*)\\.([A-Za-z]{2,4})"
        },
        {
            name: "URL",
            value: "([A-Za-z]+://)([-\\w]+(?:\\.\\w[-\\w]*)+)(:\\d+)?(/[^.!,?;\"\\x27<>()\\[\\]{}\\s\\x7F-\\xFF]*(?:[.!,?]+[^.!,?;\"\\x27<>()\\[\\]{}\\s\\x7F-\\xFF]+)*)?"
        },
        {
            name: "Domain",
            value: "(?:(https?):\\/\\/)?([-\\w.]+)\\.(com|net|org|biz|info|co|uk|onion|int|mobi|name|edu|gov|mil|eu|ac|ae|af|de|ca|ch|cn|cy|es|gb|hk|il|in|io|tv|me|nl|no|nz|ro|ru|tr|us|az|ir|kz|uz|pk)+"
        },
        {
            name: "Windows file path",
            value: "([A-Za-z]):\\\\((?:[A-Za-z\\d][A-Za-z\\d\\- \\x27_\\(\\)]{0,61}\\\\?)*[A-Za-z\\d][A-Za-z\\d\\- \\x27_\\(\\)]{0,61})(\\.[A-Za-z\\d]{1,6})?"
        },
        {
            name: "UNIX file path",
            value: "(?:/[A-Za-z\\d.][A-Za-z\\d\\-.]{0,61})+"
        },
        {
            name: "MAC address",
            value: "[A-Fa-f\\d]{2}(?:[:-][A-Fa-f\\d]{2}){5}"
        },
        {
            name: "Date (yyyy-mm-dd)",
            value: "((?:19|20)\\d\\d)[- /.](0[1-9]|1[012])[- /.](0[1-9]|[12][0-9]|3[01])"
        },
        {
            name: "Date (dd/mm/yyyy)",
            value: "(0[1-9]|[12][0-9]|3[01])[- /.](0[1-9]|1[012])[- /.]((?:19|20)\\d\\d)"
        },
        {
            name: "Date (mm/dd/yyyy)",
            value: "(0[1-9]|1[012])[- /.](0[1-9]|[12][0-9]|3[01])[- /.]((?:19|20)\\d\\d)"
        },
        {
            name: "Strings",
            value: "[A-Za-z\\d/\\-:.,_$%\\x27\"()<>= !\\[\\]{}@]{4,}"
        },
    ],

    // NOTE(review): two further constants were documented at this point
    // (@constant / @default tags) but their definitions are absent from the
    // reviewed source - restore them from version control.

    /**
     * Output formats understood by runRegex.
     *
     * @constant
     * @default
     */
    OUTPUT_FORMAT: ["Highlight matches", "List matches", "List capture groups", "List matches with capture groups"],

    // NOTE(review): one further constant was documented at this point
    // (@constant / @default tags) but its definition is absent from the
    // reviewed source - restore it from version control.

    /**
     * Regular expression operation.
     *
     * Compiles the user-supplied pattern with the global flag (plus optional
     * "i" / "m") and renders the matches in the requested output format. An
     * empty pattern, or a bare "^" or "$", returns the escaped input unchanged.
     * Compilation and rendering errors are reported as a message string rather
     * than thrown.
     *
     * @param {string} input
     * @param {Object[]} args - [1] pattern source, [2] case-insensitive flag,
     *     [3] multiline flag, [4] display-total flag, [5] output format.
     *     args[0] is not read by this function.
     * @returns {html}
     */
    runRegex: function(input, args) {
        const userRegex = args[1],
            caseInsensitive = args[2],
            multiline = args[3],
            displayTotal = args[4],
            outputFormat = args[5];

        if (!userRegex || userRegex === "^" || userRegex === "$") {
            return Utils.escapeHtml(input);
        }

        let modifiers = "g";
        if (caseInsensitive) modifiers += "i";
        if (multiline) modifiers += "m";

        try {
            const regex = new RegExp(userRegex, modifiers);

            switch (outputFormat) {
                case "Highlight matches":
                    return StrUtils._regexHighlight(input, regex, displayTotal);
                case "List matches":
                    return Utils.escapeHtml(StrUtils._regexList(input, regex, displayTotal, true, false));
                case "List capture groups":
                    return Utils.escapeHtml(StrUtils._regexList(input, regex, displayTotal, false, true));
                case "List matches with capture groups":
                    return Utils.escapeHtml(StrUtils._regexList(input, regex, displayTotal, true, true));
                default:
                    return "Error: Invalid output format";
            }
        } catch (err) {
            return "Invalid regex. Details: " + err.message;
        }
    },


    /**
     * Scopes understood by runUpper.
     *
     * @constant
     * @default
     */
    CASE_SCOPE: ["All", "Word", "Sentence", "Paragraph"],

    /**
     * To Upper case operation.
     *
     * "Word", "Sentence" and "Paragraph" upper-case only the text matched at
     * the start of each such unit; "All" and any unrecognised scope upper-case
     * the whole input.
     *
     * @param {string} input
     * @param {Object[]} args - [0] scope.
     * @returns {string}
     */
    runUpper: function (input, args) {
        const scope = args[0];
        const toUpper = function(matched) {
            return matched.toUpperCase();
        };

        switch (scope) {
            case "Word":
                return input.replace(/(\b\w)/gi, toUpper);
            case "Sentence":
                return input.replace(/(?:\.|^)\s*(\b\w)/gi, toUpper);
            case "Paragraph":
                return input.replace(/(?:\n|^)\s*(\b\w)/gi, toUpper);
            case "All":
                /* falls through */
            default:
                return input.toUpperCase();
        }
    },


    /**
     * To Lower case operation.
     *
     * @param {string} input
     * @param {Object[]} args - not read by this function.
     * @returns {string}
     */
    runLower: function (input, args) {
        return input.toLowerCase();
    },


    /**
     * Search types understood by runFindReplace.
     *
     * @constant
     * @default
     */
    SEARCH_TYPE: ["Regex", "Extended (\\n, \\t, \\x...)", "Simple string"],

    // NOTE(review): three further constants were documented at this point
    // (@constant / @default tags) but their definitions are absent from the
    // reviewed source - restore them from version control.

    /**
     * Find / Replace operation.
     *
     * For the "Regex" type the search text is compiled as a pattern. For every
     * other type the search text is matched literally ("Extended..." types are
     * first passed through Utils.parseEscapedChars). The g / i / m options
     * apply to all types.
     *
     * @param {string} input
     * @param {Object[]} args - [0] object with `string` (search text) and
     *     `option` (search type), [1] replacement, [2] global flag,
     *     [3] case-insensitive flag, [4] multiline flag.
     * @returns {string}
     */
    runFindReplace: function(input, args) {
        const type = args[0].option,
            replace = args[1],
            g = args[2],
            i = args[3],
            m = args[4];
        let find = args[0].string,
            modifiers = "";

        if (g) modifiers += "g";
        if (i) modifiers += "i";
        if (m) modifiers += "m";

        if (type === "Regex") {
            return input.replace(new RegExp(find, modifiers), replace);
        }

        if (type.indexOf("Extended") === 0) {
            find = Utils.parseEscapedChars(find);
        }

        // String.prototype.replace has no standard flags argument, so a plain
        // string search would only ever replace the first occurrence. Escape
        // the regex metacharacters and search with a literal pattern instead,
        // so the selected flags are honoured in every engine.
        const literal = find.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
        return input.replace(new RegExp(literal, modifiers), replace);
    },


    /**
     * Fallback split delimiter used by runSplit when none is supplied.
     *
     * NOTE(review): the definition line was missing from the reviewed source;
     * the name comes from the reference in runSplit, but the value "," is an
     * assumption - confirm against version control.
     *
     * @constant
     * @default
     */
    SPLIT_DELIM: ",",

    /**
     * @constant
     * @default
     */
    DELIMITER_OPTIONS: ["Line feed", "CRLF", "Space", "Comma", "Semi-colon", "Colon", "Nothing (separate chars)"],

    /**
     * Split operation.
     *
     * Splits the input on the split delimiter and re-joins the sections with
     * the character(s) that Utils.charRep maps the join-delimiter name to.
     *
     * @param {string} input
     * @param {Object[]} args - [0] split delimiter (StrUtils.SPLIT_DELIM when
     *     falsy), [1] key into Utils.charRep naming the join delimiter.
     * @returns {string}
     */
    runSplit: function(input, args) {
        const splitDelim = args[0] || StrUtils.SPLIT_DELIM,
            joinDelim = Utils.charRep[args[1]];

        return input.split(splitDelim).join(joinDelim);
    },


    /**
     * Filter operation.
     *
     * Splits the input on the delimiter and keeps the sections that match the
     * regular expression (or, when reversed, those that do not).
     *
     * @author Mikescher
     * @param {string} input
     * @param {Object[]} args - [0] key into Utils.charRep naming the delimiter,
     *     [1] pattern source, [2] reverse flag.
     * @returns {string}
     */
    runFilter: function(input, args) {
        const delim = Utils.charRep[args[0]],
            reverse = args[2];
        let regex;

        try {
            regex = new RegExp(args[1]);
        } catch (err) {
            return "Invalid regex. Details: " + err.message;
        }

        const regexFilter = function(value) {
            // XOR: keep matches normally, keep non-matches when reversed.
            return reverse ^ regex.test(value);
        };

        return input.split(delim).filter(regexFilter).join(delim);
    },


    // NOTE(review): one further constant was documented at this point
    // (@constant / @default tags) but its definition is absent from the
    // reviewed source - restore it from version control.

    /**
     * Granularities understood by runDiff.
     *
     * @constant
     * @default
     */
    DIFF_BY: ["Character", "Word", "Line", "Sentence", "CSS", "JSON"],

    /**
     * Diff operation.
     *
     * Splits the input into exactly two samples, diffs them with the JsDiff
     * function selected by the "Diff by" option, and renders the result as
     * HTML: additions in an `hlgreen` span, removals in an `hlred` span,
     * unchanged text as-is. All text is HTML-escaped.
     *
     * @param {string} input
     * @param {Object[]} args - [0] sample delimiter, [1] diff granularity,
     *     [2] show added, [3] show removed, [4] ignore whitespace (only
     *     consulted for "Word" and "Line").
     * @returns {html}
     */
    runDiff: function(input, args) {
        const sampleDelim = args[0],
            diffBy = args[1],
            showAdded = args[2],
            showRemoved = args[3],
            ignoreWhitespace = args[4],
            samples = input.split(sampleDelim);
        let output = "",
            diff;

        if (!samples || samples.length !== 2) {
            return "Incorrect number of samples, perhaps you need to modify the sample delimiter or add more samples?";
        }

        switch (diffBy) {
            case "Character":
                diff = JsDiff.diffChars(samples[0], samples[1]);
                break;
            case "Word":
                if (ignoreWhitespace) {
                    diff = JsDiff.diffWords(samples[0], samples[1]);
                } else {
                    diff = JsDiff.diffWordsWithSpace(samples[0], samples[1]);
                }
                break;
            case "Line":
                if (ignoreWhitespace) {
                    diff = JsDiff.diffTrimmedLines(samples[0], samples[1]);
                } else {
                    diff = JsDiff.diffLines(samples[0], samples[1]);
                }
                break;
            case "Sentence":
                diff = JsDiff.diffSentences(samples[0], samples[1]);
                break;
            case "CSS":
                diff = JsDiff.diffCss(samples[0], samples[1]);
                break;
            case "JSON":
                diff = JsDiff.diffJson(samples[0], samples[1]);
                break;
            default:
                return "Invalid 'Diff by' option.";
        }

        for (let i = 0; i < diff.length; i++) {
            if (diff[i].added) {
                if (showAdded) output += "<span class='hlgreen'>" + Utils.escapeHtml(diff[i].value) + "</span>";
            } else if (diff[i].removed) {
                if (showRemoved) output += "<span class='hlred'>" + Utils.escapeHtml(diff[i].value) + "</span>";
            } else {
                output += Utils.escapeHtml(diff[i].value);
            }
        }

        return output;
    },


    // NOTE(review): one further constant was documented at this point
    // (@constant / @default tags) but its definition is absent from the
    // reviewed source - restore it from version control.

    /**
     * Offset checker operation.
     *
     * Splits the input into samples and highlights, in every sample, the
     * offsets at which all samples hold the same character as the first
     * sample. Each run of such offsets is wrapped in one `hlgreen` span; all
     * text is HTML-escaped. Text beyond the length of the first sample is
     * never highlighted.
     *
     * @param {string} input
     * @param {Object[]} args - [0] sample delimiter.
     * @returns {html}
     */
    runOffsetChecker: function(input, args) {
        const sampleDelim = args[0],
            samples = input.split(sampleDelim);

        if (samples.length < 2) {
            return "Not enough samples, perhaps you need to modify the sample delimiter or add more data?";
        }

        const first = samples[0];

        // matched[i] is true when every sample has the first sample's
        // character at offset i (a sample shorter than i never matches).
        const matched = [];
        for (let i = 0; i < first.length; i++) {
            matched[i] = samples.every(function(sample) {
                return sample[i] === first[i];
            });
        }

        // Render each sample independently so that every opened span is
        // closed exactly once, whatever the relative sample lengths.
        const outputs = samples.map(function(sample) {
            const limit = Math.min(sample.length, first.length);
            let out = "",
                inMatch = false;

            for (let i = 0; i < limit; i++) {
                if (matched[i] !== inMatch) {
                    out += matched[i] ? "<span class='hlgreen'>" : "</span>";
                    inMatch = matched[i];
                }
                out += Utils.escapeHtml(sample[i]);
            }
            if (inMatch) out += "</span>";

            return out + Utils.escapeHtml(sample.substring(limit));
        });

        return outputs.join(sampleDelim);
    },


    /**
     * Parse escaped string operation.
     *
     * @param {string} input
     * @param {Object[]} args - not read by this function.
     * @returns {string}
     */
    runParseEscapedString: function(input, args) {
        return Utils.parseEscapedChars(input);
    },


    /**
     * Adds HTML highlights to matches within a string.
     *
     * Matches are wrapped alternately in `hl1` and `hl2` spans; all text is
     * HTML-escaped.
     *
     * @private
     * @param {string} input
     * @param {RegExp} regex
     * @param {boolean} displayTotal - prefix the output with the match count.
     * @returns {string}
     */
    _regexHighlight: function(input, regex, displayTotal) {
        let output = "",
            m,
            hl = 1,
            i = 0,
            total = 0;

        while ((m = regex.exec(input))) {
            // Add up to match
            output += Utils.escapeHtml(input.slice(i, m.index));

            // Add match with highlighting
            output += "<span class='hl"+hl+"'>" + Utils.escapeHtml(m[0]) + "</span>";

            // Switch highlight
            hl = hl === 1 ? 2 : 1;

            i = m.index + m[0].length;
            total++;

            // A zero-length match leaves lastIndex where it was; step past it
            // so exec() cannot return the same match forever.
            if (m[0] === "") regex.lastIndex++;

            // Without the g (or y) flag exec() always restarts from 0.
            if (!regex.global && !regex.sticky) break;
        }

        // Add all after final match
        output += Utils.escapeHtml(input.slice(i, input.length));

        if (displayTotal)
            output = "Total found: " + total + "\n\n" + output;

        return output;
    },


    /**
     * Creates a string listing the matches within a string.
     *
     * @private
     * @param {string} input
     * @param {RegExp} regex
     * @param {boolean} displayTotal - prefix the output with the match count.
     * @param {boolean} matches - Display full match
     * @param {boolean} captureGroups - Display each of the capture groups separately
     * @returns {string}
     */
    _regexList: function(input, regex, displayTotal, matches, captureGroups) {
        let output = "",
            total = 0,
            match;

        while ((match = regex.exec(input))) {
            total++;

            if (matches) {
                output += match[0] + "\n";
            }
            if (captureGroups) {
                for (let i = 1; i < match.length; i++) {
                    if (matches) {
                        output += " Group " + i + ": ";
                    }
                    output += match[i] + "\n";
                }
            }

            // A zero-length match leaves lastIndex where it was; step past it
            // so exec() cannot return the same match forever.
            if (match[0] === "") regex.lastIndex++;

            // Without the g (or y) flag exec() always restarts from 0.
            if (!regex.global && !regex.sticky) break;
        }

        if (displayTotal)
            output = "Total found: " + total + "\n\n" + output;

        return output;
    },

};
export default StrUtils;