You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
This repo is archived. You can view files and clone it, but cannot push or open issues/pull-requests.

332 lines
8.2 KiB

5 years ago
'use strict'
/**
 * Technology-detection engine.
 *
 * Holds the loaded technology and category definitions and matches their
 * patterns against data collected from a page (URL, HTML, meta tags,
 * headers, cookies, scripts).
 */
const Wappalyzer = {
  /** Technology definitions, populated by `setTechnologies`. */
  technologies: [],

  /** Category definitions, populated by `setCategories`. */
  categories: [],

  /**
   * Convert a display name into a lowercase, dash-separated slug.
   *
   * @param {string} string - Name to convert.
   * @returns {string} Slug containing only `a-z`, `0-9` and `-`, without
   *   leading or trailing dashes.
   */
  slugify(string) {
    return (
      string
        .toLowerCase()
        .replace(/[^a-z0-9-]/g, '-')
        .replace(/--+/g, '-')
        // Global flag so that BOTH a leading and a trailing dash are removed
        .replace(/(?:^-|-$)/g, '')
    )
  },

  /**
   * Look up a loaded technology by its exact name.
   *
   * @param {string} name - Technology name.
   * @returns {object|undefined} The technology, or `undefined` if not loaded.
   */
  getTechnology(name) {
    return Wappalyzer.technologies.find(({ name: _name }) => name === _name)
  },

  /**
   * Look up a loaded category by its numeric id.
   *
   * @param {number} id - Category id.
   * @returns {object|undefined} The category, or `undefined` if not loaded.
   */
  getCategory(id) {
    return Wappalyzer.categories.find(({ id: _id }) => id === _id)
  },

  /**
   * Collapse raw detections into one entry per technology, then apply
   * exclusions and implications.
   *
   * @param {Array<{technology: object, pattern: object, match: string}>} detections
   *   Detections as produced by the `analyze*` methods.
   * @returns {Array<object>} One object per technology with `name`, `slug`,
   *   `categories`, `confidence`, `version`, `icon` and `website`.
   * @throws {Error} If an excluded or implied technology is not loaded.
   */
  resolve(detections = []) {
    const resolved = detections.reduce((unique, { technology }) => {
      const alreadyResolved = unique.some(
        ({ technology: { name } }) => name === technology.name
      )

      if (!alreadyResolved) {
        let version = ''
        let confidence = 0

        detections.forEach(({ technology: { name }, pattern, match }) => {
          if (name === technology.name) {
            const versionValue = Wappalyzer.resolveVersion(pattern, match)

            // Confidence accumulates across matching patterns, capped at 100
            confidence = Math.min(100, confidence + pattern.confidence)

            // Keep the longest version string of at most 10 characters
            version =
              versionValue.length > version.length && versionValue.length <= 10
                ? versionValue
                : version
          }
        })

        unique.push({ technology, confidence, version })
      }

      return unique
    }, [])

    Wappalyzer.resolveExcludes(resolved)
    Wappalyzer.resolveImplies(resolved)

    return resolved.map(
      ({
        technology: { name, slug, categories, icon, website },
        confidence,
        version
      }) => ({
        name,
        slug,
        categories: categories.map((id) => Wappalyzer.getCategory(id)),
        confidence,
        version,
        icon,
        website
      })
    )
  },

  /**
   * Expand a pattern's version template using the capture groups obtained by
   * running the pattern's regex against the matched value.
   *
   * The template may contain back references (`\1`, `\2`, ...) and a ternary
   * of the form `\N?valueIfMatched:valueOtherwise`.
   *
   * @param {{version: string, regex: RegExp}} pattern - Parsed pattern.
   * @param {string} match - The value the pattern matched.
   * @returns {string} The expanded version; the template itself is returned
   *   unchanged when it is empty or the regex does not match.
   */
  resolveVersion({ version, regex }, match) {
    let resolved = version

    if (version) {
      const matches = regex.exec(match)

      if (matches) {
        matches.forEach((group, index) => {
          // Parse ternary operator
          const ternary = new RegExp(`\\\\${index}\\?([^:]+):(.*)$`).exec(
            version
          )

          if (ternary && ternary.length === 3) {
            resolved = version.replace(
              ternary[0],
              group ? ternary[1] : ternary[2]
            )
          }

          // Replace back references. A replacer function is used so that
          // `$&`, `$1`, ... inside the captured text are inserted literally
          // instead of being interpreted as replacement patterns.
          resolved = resolved
            .trim()
            .replace(new RegExp(`\\\\${index}`, 'g'), () => group || '')
        })
      }
    }

    return resolved
  },

  /**
   * Remove, in place, every resolved technology that is excluded by another
   * resolved technology.
   *
   * @param {Array<{technology: object}>} resolved - Resolved entries; mutated.
   * @throws {Error} If an excluded technology name is not loaded.
   */
  resolveExcludes(resolved) {
    // Iterate over a snapshot: `resolved` is spliced inside the loop
    resolved.slice().forEach(({ technology }) => {
      const stillPresent = resolved.some(
        ({ technology: { name } }) => name === technology.name
      )

      // A technology that was itself excluded no longer excludes others
      if (!stillPresent) {
        return
      }

      technology.excludes.forEach((name) => {
        const excluded = Wappalyzer.getTechnology(name)

        if (!excluded) {
          throw new Error(`Excluded technology does not exist: ${name}`)
        }

        const index = resolved.findIndex(
          ({ technology: { name } }) => name === excluded.name
        )

        // Only splice when found: splice(-1, 1) would drop the last entry
        if (index !== -1) {
          resolved.splice(index, 1)
        }
      })
    })
  },

  /**
   * Append, in place, every technology implied (directly or transitively) by
   * the resolved technologies. An implied entry inherits the confidence of
   * the technology implying it and has an empty version.
   *
   * @param {Array<{technology: object, confidence: number}>} resolved
   *   Resolved entries; mutated.
   * @throws {Error} If an implied technology name is not loaded.
   */
  resolveImplies(resolved) {
    let done = false

    while (resolved.length && !done) {
      // Assume this pass adds nothing; cleared again whenever an entry is
      // appended so that the new entry's own implications get processed.
      done = true

      resolved.forEach(({ technology, confidence }) => {
        technology.implies.forEach((name) => {
          const implied = Wappalyzer.getTechnology(name)

          if (!implied) {
            throw new Error(`Implied technology does not exist: ${name}`)
          }

          const alreadyResolved = resolved.some(
            ({ technology: { name } }) => name === implied.name
          )

          if (!alreadyResolved) {
            resolved.push({ technology: implied, confidence, version: '' })

            done = false
          }
        })
      })
    }
  },

  /**
   * Match every loaded technology against the supplied page data.
   *
   * @param {string} url - Page URL.
   * @param {object} data - Collected page data.
   * @param {string} data.html - Page markup.
   * @param {Array<{key: string, value: string}>} data.meta - Meta entries.
   * @param {Object<string, string[]>} data.headers - Header values by name.
   * @param {Array<{key: string, value: string}>} data.cookies - Cookie entries.
   * @param {Array<{key: string, value: string}>} data.scripts - Script entries.
   * @returns {Promise<Array<{technology: object, pattern: object, match: string}>>}
   *   Flat list of detections, suitable for `resolve`.
   * @throws {Error} Re-thrown with the message of any error raised while matching.
   */
  async analyze(url, { html, meta, headers, cookies, scripts }) {
    const oo = Wappalyzer.analyzeOneToOne
    const om = Wappalyzer.analyzeOneToMany
    const mm = Wappalyzer.analyzeManyToMany

    const flatten = (array) => Array.prototype.concat.apply([], array)

    try {
      // Per technology: an array of per-type detection arrays; flattened twice
      const detections = flatten(
        flatten(
          await Promise.all(
            Wappalyzer.technologies.map((technology) =>
              Promise.all([
                oo(technology, 'url', url),
                oo(technology, 'html', html),
                om(technology, 'meta', meta),
                mm(technology, 'headers', headers),
                om(technology, 'cookies', cookies),
                om(technology, 'scripts', scripts)
              ])
            )
          )
        )
      ).filter((technology) => technology)

      return detections
    } catch (error) {
      throw new Error(error.message || error.toString())
    }
  },

  /**
   * Load technology definitions, replacing any previously loaded ones.
   *
   * @param {Object<string, object>} data - Raw definitions keyed by technology
   *   name. Recognised fields: `cats`, `url`, `html`, `meta`, `headers`,
   *   `cookies`, `script`, `js`, `implies`, `excludes`, `icon`, `website`.
   */
  setTechnologies(data) {
    const transform = Wappalyzer.transformPatterns

    Wappalyzer.technologies = Object.keys(data).reduce((technologies, name) => {
      const {
        cats,
        url,
        html,
        meta,
        headers,
        cookies,
        script,
        js,
        implies,
        excludes,
        icon,
        website
      } = data[name]

      technologies.push({
        name,
        categories: cats || [],
        slug: Wappalyzer.slugify(name),
        url: transform(url),
        // Header names are stored lower-cased
        headers: transform(
          Object.keys(headers || {}).reduce(
            (lcHeaders, header) => ({
              ...lcHeaders,
              [header.toLowerCase()]: headers[header]
            }),
            {}
          )
        ),
        cookies: transform(cookies),
        html: transform(html),
        meta: transform(meta),
        scripts: transform(script),
        js: transform(js),
        // A single name may be given as a bare string
        implies: typeof implies === 'string' ? [implies] : implies || [],
        excludes: typeof excludes === 'string' ? [excludes] : excludes || [],
        icon: icon || 'default.svg',
        website: website || ''
      })

      return technologies
    }, [])
  },

  /**
   * Load category definitions, replacing any previously loaded ones. The
   * result is ordered by descending `priority`.
   *
   * @param {Object<string, object>} data - Raw categories keyed by id; each
   *   value is expected to carry at least `name` and `priority`.
   */
  setCategories(data) {
    Wappalyzer.categories = Object.keys(data)
      .reduce((categories, id) => {
        const category = data[id]

        categories.push({
          id: parseInt(id, 10),
          slug: Wappalyzer.slugify(category.name),
          ...category
        })

        return categories
      }, [])
      // Consistent comparator (negative / positive / zero): higher first
      .sort(({ priority: a }, { priority: b }) =>
        a > b ? -1 : a < b ? 1 : 0
      )
  },

  /**
   * Parse raw pattern definitions into `{ regex, confidence, version }`
   * objects.
   *
   * Each raw pattern is a string of segments separated by `\;`. The first
   * segment is the regular expression source; the remaining segments are
   * `key:value` attributes (`confidence`, `version`).
   *
   * @param {string|string[]|Object<string, string|string[]>} [patterns]
   *   A single pattern, a list of patterns, or patterns keyed by name.
   * @returns {Array<object>|Object<string, Array<object>>} An array of parsed
   *   patterns for string/array input (and `[]` for falsy input); otherwise an
   *   object mapping each key to its array of parsed patterns.
   */
  transformPatterns(patterns) {
    if (!patterns) {
      return []
    }

    const toArray = (value) => (Array.isArray(value) ? value : [value])

    if (typeof patterns === 'string' || Array.isArray(patterns)) {
      patterns = { main: patterns }
    }

    const parsed = Object.keys(patterns).reduce((parsed, key) => {
      parsed[key] = toArray(patterns[key]).map((pattern) => {
        const { regex, confidence, version } = pattern
          .split('\\;')
          .reduce((attrs, attr, i) => {
            if (i) {
              // Key value pairs
              attr = attr.split(':')

              if (attr.length > 1) {
                attrs[attr.shift()] = attr.join(':')
              }
            } else {
              // Escape slashes in regular expression
              attrs.regex = new RegExp(attr.replace(/\//g, '\\/'), 'i')
            }

            return attrs
          }, {})

        return {
          regex,
          confidence: parseInt(confidence || 100, 10),
          version: version || ''
        }
      })

      return parsed
    }, {})

    // String/array input was wrapped under `main` above; unwrap it again
    return 'main' in parsed ? parsed.main : parsed
  },

  /**
   * Test a single value against a technology's list of patterns of one type.
   *
   * @param {object} technology - Loaded technology.
   * @param {string} type - Property holding an array of patterns (e.g. `url`).
   * @param {string} value - Value to test.
   * @returns {Array<{technology: object, pattern: object, match: string}>}
   */
  analyzeOneToOne(technology, type, value) {
    return technology[type].reduce((technologies, pattern) => {
      if (pattern.regex.test(value)) {
        technologies.push({ technology, pattern, match: value })
      }

      return technologies
    }, [])
  },

  /**
   * Test a list of `{ key, value }` items against a technology's patterns,
   * which are looked up per item key.
   *
   * @param {object} technology - Loaded technology.
   * @param {string} type - Property holding patterns keyed by name.
   * @param {Array<{key: string, value: string}>} [items] - Items to test.
   * @returns {Array<{technology: object, pattern: object, match: string}>}
   */
  analyzeOneToMany(technology, type, items = []) {
    return items.reduce((technologies, { key, value }) => {
      const patterns = technology[type][key] || []

      patterns.forEach((pattern) => {
        if (pattern.regex.test(value)) {
          technologies.push({ technology, pattern, match: value })
        }
      })

      return technologies
    }, [])
  },

  /**
   * Test lists of values keyed by name against a technology's patterns keyed
   * by the same names.
   *
   * @param {object} technology - Loaded technology.
   * @param {string} type - Property holding patterns keyed by name.
   * @param {Object<string, string[]>} [items] - Values keyed by name.
   * @returns {Array<{technology: object, pattern: object, match: string}>}
   */
  analyzeManyToMany(technology, type, items = {}) {
    return Object.keys(technology[type]).reduce((technologies, key) => {
      const patterns = technology[type][key] || []
      const values = items[key] || []

      patterns.forEach((pattern) => {
        values.forEach((value) => {
          if (pattern.regex.test(value)) {
            technologies.push({ technology, pattern, match: value })
          }
        })
      })

      return technologies
    }, [])
  }
}
5 years ago
// Expose the Wappalyzer object through `module.exports` when a `module`
// binding exists; when it does not, this block is skipped and nothing is
// exported here.
if (typeof module !== 'undefined') {
module.exports = Wappalyzer
}