mirror of
https://github.com/simon987/hexlib.git
synced 2025-04-10 14:06:43 +00:00
8 lines
260 B
Python
8 lines
260 B
Python
import re
|
|
|
|
# Finds http:// or https:// URLs embedded in free text.
#   group 1: the whole URL
#   group 2: whatever follows the dot + 2-4 lowercase letters that end the
#            host part; it runs until whitespace, "<", "'" or '"' (may be empty)
# The host part must contain at least one dot, so e.g. "https://localhost"
# is not matched.
LINK_RE = re.compile(
    r"(https?://[\w\-_.]+\.[a-z]{2,4}([^\s<'\"]*|$))"
)
|
|
# Captures the value of a double-quoted href="..." attribute (group 1).
# The value must be non-empty; single-quoted or unquoted attributes are
# not matched.
HTML_HREF_RE = re.compile(
    r"href=\"([^\"]+)\""
)
|
|
# Matches one or more consecutive whitespace characters (spaces, tabs,
# newlines, ...) as a single run.
WHITESPACE_RE = re.compile(
    r"\s+"
)
|
|
# Matches a run of one or more of these punctuation characters:
#   . , ; : " “ ! ? / ( ) | * = >
# NOTE(review): the closing curly quote (”) and "<" are not in the set --
# confirm whether that is intentional before relying on this for cleanup.
PUNCTUATION_RE = re.compile(
    r"[.,;:\"“!?/()|*=>]+"
)
|
|
# Matches a single XML/HTML entity or character reference:
#   - named entities, e.g. "&amp;", "&Eacute;", "&frac12;"
#   - decimal character references, e.g. "&#39;"
#   - hexadecimal character references, e.g. "&#x27;"
# The previous pattern (lowercase letters only) missed numeric references
# and names containing uppercase letters or digits. Everything it matched
# is still matched here. A bare "&" that is not followed by a name/number
# and a terminating ";" is left alone.
XML_ENTITY_RE = re.compile(
    r"&(?:#[0-9]+|#[xX][0-9a-fA-F]+|[A-Za-z][A-Za-z0-9]*);"
)
|