From 780d50bb59815ada90f8441655daa476505c8e8f Mon Sep 17 00:00:00 2001 From: Bel LaPointe Date: Tue, 1 Feb 2022 14:29:13 -0700 Subject: [PATCH] notea failing scale tests with just Alerts/ --- app/crawler/main.sh | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/app/crawler/main.sh b/app/crawler/main.sh index d85aa8d..4d7f8af 100644 --- a/app/crawler/main.sh +++ b/app/crawler/main.sh @@ -78,10 +78,14 @@ crawl_with() { export ID="$(echo "$crawlable_source/$TITLE" | base64 | md5sum | awk '{print $1}')" export PID="$(echo $json | jq -r .id)" log " $PID/$ID ($TITLE): ${#CONTENT}" - notea put + push_crawled done } +push_crawled() { + notea put +} + is_crawlable() { local crawlable_source="$(extract_crawlable_source "$*")" # https://unix.stackexchange.com/questions/181254/how-to-use-grep-and-cut-in-script-to-obtain-website-urls-from-an-html-file @@ -90,6 +94,8 @@ is_crawlable() { } rewrite() { + log not impl: rewrite "#abc-def" to "#h-abc-def" + log not impl: rewrite "./asdf" to "./zyxw" or "absolute.com/asdf" log not impl rewrite, change images return 1 }