shorted pid for scraped and do not change title
This commit is contained in:
@@ -95,6 +95,8 @@ crawl_with() {
|
|||||||
local content="$(echo "$json" | jq -r .content)"
|
local content="$(echo "$json" | jq -r .content)"
|
||||||
local crawlable_source="$(extract_crawlable_source "$content")"
|
local crawlable_source="$(extract_crawlable_source "$content")"
|
||||||
|
|
||||||
|
notes put "$pid" "$(notes meta "$pid" | jq -r .Meta.Title)" "$crawlable_source"
|
||||||
|
|
||||||
local expanded=($($backend expand "$crawlable_source"))
|
local expanded=($($backend expand "$crawlable_source"))
|
||||||
|
|
||||||
log purge $crawlable_source:
|
log purge $crawlable_source:
|
||||||
@@ -150,6 +152,7 @@ crawl_with() {
|
|||||||
ID="${ID%/}"
|
ID="${ID%/}"
|
||||||
if [ "${#expanded[@]}" -lt 2 ]; then
|
if [ "${#expanded[@]}" -lt 2 ]; then
|
||||||
ID="$pid"
|
ID="$pid"
|
||||||
|
TITLE="$(notes meta "$ID" | jq -r .Meta.Title)"
|
||||||
CONTENT="$(printf "%s\n\n%s", "$crawlable_source" "$CONTENT")"
|
CONTENT="$(printf "%s\n\n%s", "$crawlable_source" "$CONTENT")"
|
||||||
fi
|
fi
|
||||||
log " $ID ($TITLE): ${#CONTENT}"
|
log " $ID ($TITLE): ${#CONTENT}"
|
||||||
|
|||||||
Reference in New Issue
Block a user