From b81c1c0ae82446fe3d03d2c821b2af5ced49b18c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E8=AB=8F=E8=A8=AA=E5=AD=90?= Date: Mon, 13 Nov 2023 16:46:21 +0900 Subject: [PATCH] =?UTF-8?q?=E3=82=AB=E3=83=86=E3=82=B4=E3=83=AA=E3=83=BC?= =?UTF-8?q?=E3=81=AE=E3=83=9A=E3=83=BC=E3=82=B8=E3=83=8D=E3=83=BC=E3=82=B7?= =?UTF-8?q?=E3=83=A7=E3=83=B3?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- page.go | 56 +++++++++++++++++++++++++++++++++++++++++++++++++++++--- 1 file changed, 53 insertions(+), 3 deletions(-) diff --git a/page.go b/page.go index b9a11da..d765002 100644 --- a/page.go +++ b/page.go @@ -74,7 +74,24 @@ func getdesc(str string) string { /* 記事かの確認 */ func isarticle(url string) bool { chk := strings.Split(url, "=") - return len(chk) > 2 && chk[0] == "/view_news.pl?id" + return len(chk) > 2 && + (chk[0] == "/view_news.pl?id" || chk[0] == "/view_news.pl?from" || chk[0] == "/view_news.pl?media_id" || chk[0] == "/view_news.pl?stkt") +} + +/* 部分圏かの確認 */ +func issubcat(url string) bool { + chk := strings.Split(url, "=") + return len(chk) > 1 && + (chk[0] == "/list_news_category.pl?id" || chk[0] == "/list_news_category.pl?page" || chk[0] == "/list_news_category.pl?sort" || chk[0] == "/list_news_category.pl?type" || chk[0] == "/list_news_category.pl?sub_category_id") && + strings.Contains(url, "type=bn") +} + +/* 部分かの確認 */ +func iscategory(url string) bool { + chk := strings.Split(url, "=") + return len(chk) > 1 && + (chk[0] == "/list_news_category.pl?id" || chk[0] == "/list_news_category.pl?sub_category_id" || chk[0] == "/list_news_category?from") && + !strings.Contains(url, "type=bn") } /* 出版社かの確認 */ @@ -155,6 +172,34 @@ func rmebloat(body string, cnf Config) string { return body } +/* 部分圏だけが残るまで消す */ +func rmsbloat(body string, cnf Config) string { + var re *regexp.Regexp + + rep := []struct { + pat string + repl string + }{ + {`(?s).*?`, ""}, + {`(?s)
.*?`, ""}, + //{`(?s)
\n" + strings.TrimSpace(body)) + "\n
\n" + return body +} + /* 出版社だけが残るまで消す */ func rmpbloat(body string, cnf Config) string { var re *regexp.Regexp @@ -163,9 +208,8 @@ func rmpbloat(body string, cnf Config) string { pat string repl string }{ - {`(?s).*?
`, ""}, + {`(?s).*?`, ""}, {`(?s).*?`, ""}, - {`(?s)
.*?

`, `

`}, {`(?s)