diff --git a/scrape.sh b/scrape.sh index 4fdb07b..8fd865c 100644 --- a/scrape.sh +++ b/scrape.sh @@ -234,10 +234,7 @@ url_to_title_candidate() { html_to_markdown() { local f="$(mktemp)" log url=$1 - log 1: url=$1 cat > "$f" - log 2: url=$1 - #grep '' "$f" | sed 's/.*>\([^<]*\)<.title>.*/# \1/g' local clean="$( cat "$f" \ | readability "file://$(realpath $f)" \ @@ -245,9 +242,7 @@ html_to_markdown() { | sed 's/{[^}]*data[^}]*}//g' \ | sed 's/\[](#[^)]*)//' )" - log 3: url=$1 rm "$f" - log 4: url=$1 echo "$clean" | ( lastline="" while read -r line; do @@ -260,9 +255,7 @@ html_to_markdown() { done cat &> /dev/null ) - log 5: url=$1 echo "$clean" - log 6: url=$1 return $? }