Fix base regex: keep the match inside the <base> tag and capture the href value up to its closing quote

This commit is contained in:
2021-03-27 23:52:16 +01:00
parent 4473d1bec9
commit 5b5a821522

View File

@@ -12,7 +12,7 @@ from httplib.httpsocket import FORMAT
from httplib.message import ClientMessage as Message from httplib.message import ClientMessage as Message
from httplib.retriever import Retriever from httplib.retriever import Retriever
BASE_REGEX = re.compile(r"<\s*base.*href\s*=\s*['\"](\S*)['\"][^>]*>", re.M | re.I) BASE_REGEX = re.compile(r"<\s*base[^>]*\shref\s*=\s*['\"]([^\"']+)['\"][^>]*>", re.M | re.I)
IMG_REGEX = re.compile(r"<\s*img[^>]*\ssrc\s*=\s*['\"]([^\"']+)['\"][^>]*>", re.M | re.I) IMG_REGEX = re.compile(r"<\s*img[^>]*\ssrc\s*=\s*['\"]([^\"']+)['\"][^>]*>", re.M | re.I)