simplify google docs markdown

master
Bel LaPointe 2022-02-16 15:09:08 -07:00
parent c0d49d23bb
commit 8c87cdf0b2
1 changed file with 16 additions and 0 deletions

View File

@ -26,11 +26,27 @@ google() (
echo "" echo ""
if [ "${downloaded##*.}" == "csv" ]; then if [ "${downloaded##*.}" == "csv" ]; then
_csv_to_md "$downloaded" _csv_to_md "$downloaded"
elif [ "${downloaded##*.}" == "html" ]; then
_html_to_md "$downloaded"
else else
cat "$downloaded" cat "$downloaded"
fi fi
} }
# Convert an exported HTML document to CommonMark on stdout.
#
# Arguments: $1 - path to the HTML file to convert
# Outputs:   CommonMark text on stdout; diagnostics on stderr
# Returns:   1 when pandoc is not available; otherwise the status of the
#            final pipeline stage
_html_to_md() {
    local f="$1"

    # Fail loudly up front: without this guard a missing pandoc only shows up
    # as empty output, because the pipeline's status comes from the last sed.
    if ! command -v pandoc > /dev/null 2>&1; then
        echo "_html_to_md: pandoc is required but was not found on PATH" >&2
        return 1
    fi

    # Stage 1 (sed): drop everything before <body and after </body>, and
    #                remove every opening/closing <span> tag.
    # Stage 2 (perl): remove <div class="cN">...</div> elements; perl is used
    #                for the non-greedy match.
    # Stage 3 (sed): strip all attributes from opening tags. Digits are allowed
    #                in the tag name so <h1>..<h6> keep their level.
    # Stage 4 (pandoc): HTML -> CommonMark.
    # Stage 5 (sed): blank out lines that consist solely of <div> or </div>.
    sed \
        -e 's/.*<body/<body/' \
        -e 's/<\/body>.*/<\/body>/' \
        -e 's/<[\/]*span[^>]*>//g' \
        < "$f" \
        | perl -pe 's|<div class="c[0-9][0-9]*">.*?<\/div>||g' \
        | sed 's/<\([a-z][a-z0-9]*\)[^>]*/<\1/g' \
        | pandoc - -f html -t commonmark -s -o - \
        | sed 's/^<[\/]*div>$//g'
}
_csv_to_md() { _csv_to_md() {
local f="$1" local f="$1"
( (