Skip to content
This repository was archived by the owner on Feb 22, 2025. It is now read-only.

Commit 9e54fce

Browse files
authored
Merge pull request #810 from rix1337/dev
Improve RegEx search for BY
2 parents cc4aa0b + b6be404 commit 9e54fce

File tree

6 files changed

+23
-11
lines changed

6 files changed

+23
-11
lines changed

feedcrawler/external_sites/feed_search/sites/content_all_by.py

Lines changed: 17 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -30,11 +30,15 @@ def __init__(self, filename):
3030
self.url = self.hostnames.get('by')
3131
self.password = self.url.split('.')[0]
3232

33-
if "List_ContentAll_Seasons" not in filename:
33+
if "_Regex" in filename:
34+
self.URL = 'https://' + self.url + "/?cat="
35+
self.FEED_URLS = [self.URL + "1", self.URL + "2"]
36+
elif "List_ContentAll_Seasons" not in filename:
3437
self.URL = 'https://' + self.url + "/?cat=1"
38+
self.FEED_URLS = [self.URL]
3539
else:
3640
self.URL = 'https://' + self.url + "/?cat=2"
37-
self.FEED_URLS = [self.URL]
41+
self.FEED_URLS = [self.URL]
3842

3943
self.config = CrawlerConfig("ContentAll")
4044
self.feedcrawler = CrawlerConfig("FeedCrawler")
@@ -49,9 +53,17 @@ def __init__(self, filename):
4953
search = int(CrawlerConfig("ContentAll").get("search"))
5054
i = 2
5155
while i <= search:
52-
page_url = self.URL + "&start=" + str(i)
53-
if page_url not in self.FEED_URLS:
54-
self.FEED_URLS.append(page_url)
56+
if "_Regex" in filename:
57+
page_url_1 = self.URL + "1&start=" + str(i)
58+
page_url_2 = self.URL + "2&start=" + str(i)
59+
if page_url_1 not in self.FEED_URLS:
60+
self.FEED_URLS.append(page_url_1)
61+
if page_url_2 not in self.FEED_URLS:
62+
self.FEED_URLS.append(page_url_2)
63+
else:
64+
page_url = self.URL + "&start=" + str(i)
65+
if page_url not in self.FEED_URLS:
66+
self.FEED_URLS.append(page_url)
5567
i += 1
5668
self.cdc = FeedDb('cdc')
5769

feedcrawler/providers/common_functions.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -620,7 +620,7 @@ def keep_alphanumeric_with_special_characters(string):
620620

621621
def keep_alphanumeric_with_regex_characters(string):
622622
string = replace_with_stripped_ascii(string)
623-
return re.sub(r'[^0-9a-zA-Z\s\-.*+()|\[\]?!]', '', string)
623+
return re.sub(r'[^0-9a-zA-Z\s\-.*+()|\[\]\\{},?!]', '', string)
624624

625625

626626
def keep_numbers(string):

feedcrawler/providers/version.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@
88

99

1010
def get_version():
11-
return "20.1.8"
11+
return "20.1.9"
1212

1313

1414
def create_version_file():

feedcrawler/web_interface/vuejs_frontend/package-lock.json

Lines changed: 2 additions & 2 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

feedcrawler/web_interface/vuejs_frontend/package.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
{
22
"name": "feedcrawler-web",
3-
"version": "20.1.8",
3+
"version": "20.1.9",
44
"type": "module",
55
"scripts": {
66
"dev": "vite",

feedcrawler/web_interface/vuejs_frontend/src/components/Lists.vue

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -112,7 +112,7 @@ function submitLists() {
112112
@click="showRegExHelp">RegEx-Suche</span>
113113
</h5><!-- Setting variables in label is unsupported -->
114114
<FormKit v-model="store.lists.mb.regex"
115-
:validation="[['?matches', /^[a-zA-Z0-9ÄäÖöÜüß\-\s.*+()|\[\]?!]+$/]]"
115+
:validation="[['?matches', /^[a-zA-Z0-9ÄäÖöÜüß\-\s.*+()|\[\]\\{},?!]+$/]]"
116116
:validation-messages="{
117117
matches: 'Bitte nur Buchstaben, Zahlen, Leerzeichen oder folgende Sonderzeichen eingeben: . * + ( ) | [ ] ? !'
118118
}"

0 commit comments

Comments
 (0)