mirror of
https://github.com/Garmelon/PFERD.git
synced 2026-04-12 15:35:05 +02:00
Fixed: the link regex needs to match the whole href
This commit is contained in:
parent
08565b22ad
commit
9f7aff761d
1 changed file with 1 addition and 1 deletion
|
|
@ -28,7 +28,7 @@ class KitIpdCrawlerSection(HttpCrawlerSection):
|
||||||
return target
|
return target
|
||||||
|
|
||||||
def link_regex(self) -> Pattern[AnyStr]:
|
def link_regex(self) -> Pattern[AnyStr]:
|
||||||
regex = self.s.get("link_regex", ".*/[^/]*\.(?:pdf|zip|c|java)")
|
regex = self.s.get("link_regex", "^.*/[^/]*\.(?:pdf|zip|c|java)$")
|
||||||
return re.compile(regex)
|
return re.compile(regex)
|
||||||
|
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue