2021-06-18 06:31:59 +00:00
|
|
|
id: extract-urls
|
|
|
|
|
|
|
|
info:
|
|
|
|
name: Extract URLs from HTML attributes
|
|
|
|
author: dwisiswant0
|
|
|
|
severity: info
|
|
|
|
tags: headless,extractor
|
2024-01-04 06:27:45 +00:00
|
|
|
|
2021-06-18 06:31:59 +00:00
|
|
|
# Headless browser flow: a single list of steps, declared in the order
# navigate -> waitload -> script.
headless:
|
|
|
|
- steps:
|
|
|
|
# Step 1: `navigate` action; its `url` argument is the {{BaseURL}} placeholder.
- args:
|
|
|
|
url: "{{BaseURL}}"
|
|
|
|
action: navigate
|
2022-08-29 09:10:50 +00:00
|
|
|
|
2021-06-18 06:31:59 +00:00
|
|
|
# Step 2: `waitload` action, no arguments. Presumably blocks until the page
# has finished loading so the script sees the full DOM - confirm against the
# nuclei headless documentation.
- action: waitload
|
2022-08-29 09:10:50 +00:00
|
|
|
|
2021-06-18 06:31:59 +00:00
|
|
|
# Step 3: `script` action named `extract`. The same name is used by the
# extractor's `part` and `kval` entries, so renaming it here requires
# renaming it there as well.
- action: script
|
|
|
|
name: extract
|
|
|
|
args:
|
|
|
|
code: |
|
2022-05-18 17:55:25 +00:00
|
|
|
() => {
  // Collects every distinct URL-like value carried by the src, href, url and
  // action attributes of the current document. Returns a single string: a
  // leading '\n', the entries separated by '\r\n', and a trailing '\n'.
  const attrs = ['src', 'href', 'url', 'action'];

  // Reflected DOM properties are preferred because the browser resolves them
  // against the document base URL, but they are not always plain strings:
  // SVG elements expose href as an object holding the text in `baseVal`, and
  // a form control named "action" shadows form.action with an element.
  // Anything that is not usable text is treated as missing.
  const asText = (value) => {
    if (typeof value === 'string') {
      return value;
    }
    if (value && typeof value.baseVal === 'string') {
      return value.baseVal;
    }
    return '';
  };

  const urlOf = (el) => {
    const resolved = attrs.map((attr) => asText(el[attr])).find(Boolean);
    if (resolved) {
      return resolved;
    }
    // No usable property (for example `url` is not reflected as a DOM
    // property on standard elements), so fall back to the raw attribute text.
    return attrs.map((attr) => el.getAttribute(attr)).find(Boolean) || '';
  };

  // Empty results are dropped so they do not show up as blank entries.
  const urls = Array.from(document.querySelectorAll('[src], [href], [url], [action]'))
    .map(urlOf)
    .filter(Boolean);

  return '\n' + [...new Set(urls)].join('\r\n') + '\n';
}
|
2022-08-29 09:10:50 +00:00
|
|
|
|
2021-06-18 06:31:59 +00:00
|
|
|
# Single `kval` extractor. Both its `part` and its only `kval` key are
# `extract`, the same name given to the script step above. Presumably this is
# what surfaces the script's return value in the results - confirm against
# the nuclei extractor documentation.
extractors:
|
|
|
|
- type: kval
|
|
|
|
part: extract
|
|
|
|
kval:
|
|
|
|
- extract
|
2024-01-04 06:57:22 +00:00
|
|
|
# digest: 4a0a0047304502201929be3307cd1badad321f4fce5ff44feda065bae4ab72a7817ea16fa8201afb022100be1f94a508d5d79dbff66c137c8c8959b1168743fc8bfa3f612ae4ef3210ec45:922c64590222798bb761d5b6d8e72950
|