From a01f9037142833c08adb62843ebd0b2441215ea3 Mon Sep 17 00:00:00 2001
From: AnthonyAxenov
Date: Sat, 23 Aug 2025 11:53:23 +0800
Subject: [PATCH] =?UTF-8?q?=D0=A3=D0=BF=D1=80=D0=BE=D1=89=D0=B5=D0=BD?=
 =?UTF-8?q?=D0=BE=20=D0=B8=D0=B7=D0=BC=D0=B5=D0=BD=D0=B5=D0=BD=D0=B8=D0=B5?=
 =?UTF-8?q?=20=D0=B2=D0=BD=D1=83=D1=82=D1=80=D0=B5=D0=BD=D0=BD=D0=B8=D1=85?=
 =?UTF-8?q?=20=D1=81=D1=81=D1=8B=D0=BB=D0=BE=D0=BA=20+=20=D1=81=D0=BA?=
 =?UTF-8?q?=D1=80=D0=B8=D0=BF=D1=82=20=D0=B4=D0=BB=D1=8F=20=D0=BE=D1=87?=
 =?UTF-8?q?=D0=B8=D1=81=D1=82=D0=BA=D0=B8=20=D0=B4=D0=B0=D0=BD=D0=BD=D1=8B?=
 =?UTF-8?q?=D1=85?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
Review notes (commentary only; not part of the commit message):

* rag/1_download_html.sh: the removed sed calls rewrote href="/ and src="/
  to href="$CONF_URL/ and src="$CONF_URL/, i.e. they kept the slash that
  starts the path. The parameter-expansion replacement consumes that slash
  in its pattern, so the replacement text has to end with "/" as well;
  without it href="/x" turns into href="<CONF_URL>x". Both added lines now
  end the replacement with "${CONF_URL}/".
* NOTE(review): the abbreviated blob id on the "index" line was not
  recomputed after this correction.
* NOTE(review): the trailing context of the first hunk is reproduced as
  found and appears to span more lines than the hunk header declares;
  confirm it against the target file before applying.

 rag/1_download_html.sh | 6 ++----
 rag/clear.sh           | 7 +++++++
 2 files changed, 9 insertions(+), 4 deletions(-)
 create mode 100755 rag/clear.sh

diff --git a/rag/1_download_html.sh b/rag/1_download_html.sh
index 9147d0e..09a7e4f 100755
--- a/rag/1_download_html.sh
+++ b/rag/1_download_html.sh
@@ -49,10 +49,8 @@ if [ -z "$content" ]; then
 fi
 
 path="$output_path/${title//\//_}.html"
-content=$(echo "$content" | sed "s#href=\"/#href=\"$CONF_URL/#g")
-content=$(echo "$content" | sed "s#src=\"/#src=\"$CONF_URL/#g")
-# content=${content//href=\"\//href=\"$CONF_URL}
-# content=${content//src=\"\//src=\"$CONF_URL}
+content=${content//href=\"\//href=\"${CONF_URL}/}
+content=${content//src=\"\//src=\"${CONF_URL}/}
 echo "Страница: $CONF_URL/pages/viewpage.action?pageId=$PAGE_ID
 
 $title
 
 $content" > "$path"
 echo "Сохранено: $output_path/$title.html"
diff --git a/rag/clear.sh b/rag/clear.sh
new file mode 100755
index 0000000..4618517
--- /dev/null
+++ b/rag/clear.sh
@@ -0,0 +1,7 @@
+#!/bin/bash
+
+rm -rf ./input_html/*.html
+rm -rf ./input_pdf/*.pdf
+rm -rf ./output_md/*.md
+rm -rf ./ready_rag/*
+touch ./ready_rag/.gitkeep