diff --git a/scrape.sh b/scrape.sh index 37f330d..108f990 100644 --- a/scrape.sh +++ b/scrape.sh @@ -258,6 +258,7 @@ html_to_markdown() { | perl -pe 's|

(.*?)

|\2|g' \ | perl -pe 's|\r*(?:(?!).)+\r*||g' \ | tr '\r' '\n' \ + | sed 's/]*>\([^<]*\)<\/a>/\1/g' \ | pandoc \ -f html \ -t markdown+pipe_tables-simple_tables-multiline_tables \