blob: 0680c5cee9a678a78bfb6d52dcdd00cc06a04433 (
plain) (
tree)
|
|
# Extract <a href="..."> URLs from an HTML document or documents, printing
# each distinct URL once, in sorted order. Requires pup(1) on the PATH.
#
# Input is the concatenation of the files named as arguments. With no
# arguments, "${@:--}" expands to "-", so cat(1) reads standard input.
cat -- "${@:--}" |
# Pipe through pup to print the href attribute of every <a> element; -p
# (plain) asks pup not to HTML-escape its output, so a URL is emitted as
# written rather than with entities such as &amp;
pup -p 'a attr{href}' |
# Sort and drop duplicates in one step; sort -u does the work of
# "sort | uniq" without spawning a second process
sort -u
|