mirror of
https://github.com/nmap/nmap.git
synced 2026-05-13 16:57:06 +00:00
Update to add additional blacklist entries to the httpspider library. The goal is to avoid downloading and processing certain additional video, audio and binary formats.
This should speed up crawling of certain sites. In the case of http-email-harvest, it should reduce some of the false positives generated by running the regex against binary data. The only script whose results this change appears likely to have affected is http-sitemap-generator, and that script specifically disables the blacklist.
This commit is contained in:
parent
113f1791ff
commit
b82c819afb
1 changed files with 3 additions and 1 deletions
|
|
@ -596,11 +596,13 @@ Crawler = {
|
|||
addDefaultBlacklist = function(self)
|
||||
local extensions = {
|
||||
image_extensions = {"png","jpg","jpeg","gif","bmp"},
|
||||
video_extensions = {"avi","flv","ogg","mp4","wmv"},
|
||||
audio_extensions = {"aac","m4a","mp3","wav"},
|
||||
doc_extensions = {"pdf", "doc", "docx", "docm", "xls", "xlsx", "xlsm",
|
||||
"ppt", "pptx", "pptm", "odf", "ods", "odp", "ps", "xps"},
|
||||
archive_extensions = {"zip", "tar.gz", "gz", "rar", "7z", "sit", "sitx",
|
||||
"tgz", "tar.bz", "tar", "iso"},
|
||||
exe_extensions = {"exe", "com", "msi", "bin"}
|
||||
exe_extensions = {"exe", "com", "msi", "bin","dmg"}
|
||||
}
|
||||
local blacklist = {}
|
||||
for _, cat in pairs(extensions) do
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue