diff --git a/scrape.sh b/scrape.sh index ff9a635..8bb257a 100644 --- a/scrape.sh +++ b/scrape.sh @@ -222,6 +222,7 @@ html_to_markdown() { local f="$(mktemp)" log url=$1 cat > "$f" + grep '' "$f" | sed 's/.*>\([^<]*\)<.title>.*/\1/g' >&2 cat "$f" \ | readability "file://$(realpath $f)" \ | pandoc -f html -t markdown --ascii --toc --wrap=none --strip-comments -o - \