diff --git a/bin/build b/bin/build index e39752ccc..d856bb995 100755 --- a/bin/build +++ b/bin/build @@ -41,12 +41,14 @@ set -e sed -i "s/\"version\": \"[^\"]*\"/\"version\": \"$version\"/" src/drivers/npm/package.json # WebExtension + echo "Building WebExtension..." webextension_dir=src/drivers/webextension pushd $webextension_dir > /dev/null +sed -i "/sourceMappingURL/d" node_modules/webextension-polyfill/dist/browser-polyfill.js sed -i "s/\"version\": \"[^\"]*\"/\"version\": \"$version\"/" manifest.json zip -qr ../../../build/wappalyzer_webextension.zip . \ diff --git a/bin/validate-regex b/bin/validate-regex index 380ffdb15..f331a8945 100755 --- a/bin/validate-regex +++ b/bin/validate-regex @@ -1,97 +1,91 @@ #!/usr/bin/env node -var - app, - json = require('../src/apps.json'); - -for ( app in json.apps ) { - ['headers', 'html', 'env', 'meta', 'script'].forEach(function(type) { - var - key, - patterns = json.apps[app][type]; - - if ( patterns !== undefined ) { - patterns = typeof patterns === 'string' ? [patterns] : patterns; - - if ( !( patterns instanceof Array ) ) { - patterns = []; - - for ( key in json.apps[app][type] ) { - patterns.push(json.apps[app][type][key]); - } - } - - patterns.forEach(function(pattern) { - var - attrs = pattern.split('\\;'), - regex = '/' + attrs.shift().replace('/', '\/') + '/', - version = attrs.find( function (attr){ - return attr.indexOf('version:')===0; - } ), - amountOfCaptureGroups, - captureGroupsNeeded, - amountOfCaptureGroupsNeeded, - highestBackReference; - - //Check if the pattern is a valid RegExp - //Note: unlike when used in Wappalyzer, the modifier i isn't added here - new RegExp(regex); - - //Actual amount of capture groups - amountOfCaptureGroups = ''.match(new RegExp('(?:'+pattern+')?')).length - 1; - - //Capture groups of which the result is used - captureGroupsNeeded = version ? (version.match(/\\\d/g) || []).filter( function(value, index, self){ - return self.indexOf(value) === index; - }).map( function(value){//Because Math.max needs the integers only - return parseInt(value.charAt(1), 10);//Will only work if backreferences cannot be any longer than a single digit - }) : []; - - //Amount of capture groups needed - amountOfCaptureGroupsNeeded = captureGroupsNeeded.length; - - //Highest back reference number used - highestBackReference = Math.max.apply(null, captureGroupsNeeded); - - //Report error - if(amountOfCaptureGroups > amountOfCaptureGroupsNeeded) { - throw new Error('The pattern uses more capture groups than needed. Use non-capturing groups where appropriate.\n' + app + ': ' + type + ': ' + pattern); - }else if(amountOfCaptureGroups < amountOfCaptureGroupsNeeded){ - throw new Error('The version string references more capture groups than there are in the pattern! Remove any incorrect back references from the version string and/or add the missing capture groups to the pattern.\n' + app + ': ' + type + ': ' + pattern); - } else if(highestBackReference > amountOfCaptureGroups){ - throw new Error('The version string references one or more capture groups whose index is higher than the amount of capture groups in the pattern. Please use the correct index instead of \\\\'+highestBackReference+'.\n' + app + ': ' + type + ': ' + pattern); - } - - if ( /^\/(?:\^\$|\.\+|\.\*)\/$/.test(regex) ) { - throw new Error('Pattern should be replaced with empty string.\n' + app + ': ' + type + ': ' + pattern); - } - - if ( type === 'html' ) { - if ( /\.(?:\+|\*)/.test(regex) ) { - throw new Error('Avoid ".+" and ".*" in HTML patterns. Consider using "[^>]+" or "[^<]+" instead.\n' + app + ': ' + type + ': ' + pattern); - } - - if ( !/[<>]/.test(regex) ) { - throw new Error('HTML patterns must contain "<" or ">".\n' + app + ': ' + type + ': ' + pattern); - } - } - - //Warn about suspicious periods (".") in patterns which should probably have been escaped - // Periods inside character classes (such as [\d.]) don't count as wildcard, so we'll replace - // the character classes in the pattern with "_". (We could remove them entirely, but then - // we'd have to deal with leftover * and + characters; for example, removing the character - // class entirely from the pattern /test.[a-z]+/ would yield the pattern /test.+/, which - // would mean not detecting the un-escaped ".". Replacing the character class with an - // underscore instead gives /test._+/, which WOULD yield a warning about the unescaped ".".) - if ( /(?:^\/|[^\\])\.(?:[^*+]|\/$)/.test(regex.replace(/([^\\]|^)\[[^\]]+\]/g,'$1_') ) ) { - console.warn('Suspicious period (".") in pattern. Should this have been escaped?\n\tApp: ' + app + '\n\tPattern: ' + type + ': ' + pattern); - } - - }); - } - }); - - if ( !/^https?:\/\//i.test(json.apps[app].website) ) { - throw new Error('Invalid website URL\n' + app + ': ' + json.apps[app].website); - } +let + app, + json = require('../src/apps.json'); + +for (app in json.apps) { + ['headers', 'html', 'env', 'meta', 'script'].forEach((type) => { + let + key, + patterns = json.apps[app][type]; + + if (patterns !== undefined) { + patterns = typeof patterns === 'string' ? [patterns] : patterns; + + if (!(patterns instanceof Array)) { + patterns = []; + + for (key in json.apps[app][type]) { + patterns.push(json.apps[app][type][key]); + } + } + + patterns.forEach((pattern) => { + let + attrs = pattern.split('\\;'), + regex = `/${attrs.shift().replace('/', '\/')}/`, + version = attrs.find(attr => attr.indexOf('version:') === 0), + amountOfCaptureGroups, + captureGroupsNeeded, + amountOfCaptureGroupsNeeded, + highestBackReference; + + // Check if the pattern is a valid RegExp + // Note: unlike when used in Wappalyzer, the modifier i isn't added here + new RegExp(regex); + + // Actual amount of capture groups + amountOfCaptureGroups = ''.match(new RegExp(`(?:${pattern})?`)).length - 1; + + // Capture groups of which the result is used + captureGroupsNeeded = version ? (version.match(/\\\d/g) || []).filter((value, index, self) => self.indexOf(value) === index).map(value => parseInt(value.charAt(1), 10), // Will only work if backreferences cannot be any longer than a single digit + ) : []; + + // Amount of capture groups needed + amountOfCaptureGroupsNeeded = captureGroupsNeeded.length; + + // Highest back reference number used + highestBackReference = Math.max.apply(null, captureGroupsNeeded); + + // Report error + if (amountOfCaptureGroups > amountOfCaptureGroupsNeeded) { + throw new Error(`The pattern uses more capture groups than needed. Use non-capturing groups where appropriate.\n${app}: ${type}: ${pattern}`); + } else if (amountOfCaptureGroups < amountOfCaptureGroupsNeeded) { + throw new Error(`The version string references more capture groups than there are in the pattern! Remove any incorrect back references from the version string and/or add the missing capture groups to the pattern.\n${app}: ${type}: ${pattern}`); + } else if (highestBackReference > amountOfCaptureGroups) { + throw new Error(`The version string references one or more capture groups whose index is higher than the amount of capture groups in the pattern. Please use the correct index instead of \\\\${highestBackReference}.\n${app}: ${type}: ${pattern}`); + } + + if (/^\/(?:\^\$|\.\+|\.\*)\/$/.test(regex)) { + throw new Error(`Pattern should be replaced with empty string.\n${app}: ${type}: ${pattern}`); + } + + if (type === 'html') { + if (/\.(?:\+|\*)/.test(regex)) { + throw new Error(`Avoid ".+" and ".*" in HTML patterns. Consider using "[^>]+" or "[^<]+" instead.\n${app}: ${type}: ${pattern}`); + } + + if (!/[<>]/.test(regex)) { + throw new Error(`HTML patterns must contain "<" or ">".\n${app}: ${type}: ${pattern}`); + } + } + + // Warn about suspicious periods (".") in patterns which should probably have been escaped + // Periods inside character classes (such as [\d.]) don't count as wildcard, so we'll replace + // the character classes in the pattern with "_". (We could remove them entirely, but then + // we'd have to deal with leftover * and + characters; for example, removing the character + // class entirely from the pattern /test.[a-z]+/ would yield the pattern /test.+/, which + // would mean not detecting the un-escaped ".". Replacing the character class with an + // underscore instead gives /test._+/, which WOULD yield a warning about the unescaped ".".) + if (/(?:^\/|[^\\])\.(?:[^*+]|\/$)/.test(regex.replace(/([^\\]|^)\[[^\]]+\]/g, '$1_'))) { + console.warn(`Suspicious period (".") in pattern. Should this have been escaped?\n\tApp: ${app}\n\tPattern: ${type}: ${pattern}`); + } + }); + } + }); + + if (!/^https?:\/\//i.test(json.apps[app].website)) { + throw new Error(`Invalid website URL\n${app}: ${json.apps[app].website}`); + } } diff --git a/src/apps.json b/src/apps.json index 42e45f7f6..9f3d156a1 100644 --- a/src/apps.json +++ b/src/apps.json @@ -1180,7 +1180,7 @@ 62 ], "headers": { - "X-Hacker": "(automattic.com/jobs|wpvip.com/careers)" + "X-Hacker": "(?:automattic.com/jobs|wpvip.com/careers)" }, "icon": "automattic.png", "implies": "WordPress", @@ -4055,7 +4055,7 @@ ], "icon": "GeneXus.png", "js": { - "gx":"", + "gx": "", "gx.gxVersion": "^(.+)-.*$\\;version:\\1" }, "script": [ @@ -4173,7 +4173,10 @@ "
" ], "icon": "GitLab.svg", - "implies": ["Ruby on Rails", "Vue.js"], + "implies": [ + "Ruby on Rails", + "Vue.js" + ], "js": { "GitLab": "", "gl.dashboardOptions": "" @@ -14006,16 +14009,6 @@ "script": "/media/conv/js/jquery\\.js", "website": "https://uknowva.com" }, - "Pytonik": { - "cats": [ - 18, - 22 - ], - "html": "Pytonik ([0-9.]+);version:\\1", - "icon": "pytonik.png", - "implies": "Python", - "website": "https://pytonik.com" - }, "vBulletin": { "cats": [ 2 @@ -14050,7 +14043,7 @@ }, "website": "http://vibecommerce.com.br" }, - "Vikaon": { + "Vikaon": { "cats": [ 6 ], @@ -14318,9 +14311,6 @@ "meta": { "generator": "Varbase" }, - "html": [ - "varbase_" - ], "cpe": "cpe:/a:vardot:varbase", "icon": "varbase.png", "implies": "Drupal", diff --git a/src/drivers/npm/npm-shrinkwrap.json b/src/drivers/npm/npm-shrinkwrap.json index ef47e40cd..f4bde316a 100644 --- a/src/drivers/npm/npm-shrinkwrap.json +++ b/src/drivers/npm/npm-shrinkwrap.json @@ -1,6 +1,6 @@ { "name": "wappalyzer", - "version": "5.9.1", + "version": "5.9.18", "lockfileVersion": 1, "requires": true, "dependencies": { diff --git a/src/drivers/npm/package.json b/src/drivers/npm/package.json index d10044af2..371ee27da 100644 --- a/src/drivers/npm/package.json +++ b/src/drivers/npm/package.json @@ -2,7 +2,7 @@ "name": "wappalyzer", "description": "Uncovers the technologies used on websites", "homepage": "https://github.com/AliasIO/Wappalyzer", - "version": "5.9.18", + "version": "5.9.4", "author": "Elbert Alias", "license": "GPL-3.0", "repository": { diff --git a/src/drivers/webextension/manifest.json b/src/drivers/webextension/manifest.json index ba422fd0f..f1e4c3f7d 100644 --- a/src/drivers/webextension/manifest.json +++ b/src/drivers/webextension/manifest.json @@ -4,7 +4,7 @@ "author": "Elbert Alias", "homepage_url": "https://www.wappalyzer.com", "description": "Identify web technologies", - "version": "5.9.3", + "version": "5.9.4", "default_locale": "en", "manifest_version": 2, "icons": { diff --git a/src/icons/pytonik.png b/src/icons/pytonik.png deleted file mode 100644 index 1bb6c9e02..000000000 Binary files a/src/icons/pytonik.png and /dev/null differ