diff --git a/rag/1_download_html.sh b/rag/1_download_html.sh index 9cc5686..9147d0e 100755 --- a/rag/1_download_html.sh +++ b/rag/1_download_html.sh @@ -49,7 +49,12 @@ if [ -z "$content" ]; then fi path="$output_path/${title//\//_}.html" -echo "Страница: $title

$content" > "$path" +content=$(echo "$content" | sed "s#href=\"/#href=\"$CONF_URL/#g") +content=$(echo "$content" | sed "s#src=\"/#src=\"$CONF_URL/#g") +# content=${content//href=\"\//href=\"$CONF_URL} +# content=${content//src=\"\//src=\"$CONF_URL} + +echo "Страница: $CONF_URL/pages/viewpage.action?pageId=$PAGE_ID

$title

$content" > "$path" echo "Сохранено: $output_path/$title.html" child_ids=$(echo "$response" | jq -r '.children.page.results[]?.id' 2>/dev/null)