#!/bin/sh
#
# Extract URLs from an HTML document or documents.
#
# Usage: pass zero or more HTML file names as arguments. When no arguments
# are given, the document is read from standard input (/dev/stdin).
#
# Output: the href attribute values selected by pup's 'a attr{href}'
# selector, sorted, with duplicate lines removed.
#
# Requires: pup (command-line HTML processor) on PATH.

# cat is intentional here: it merges any number of input files into the one
# stream that pup reads from standard input, so the "useless cat" warning is
# silenced for this pipeline.
# shellcheck disable=SC2002
cat -- "${@:-/dev/stdin}" |
  pup -p 'a attr{href}' |
  sort -u