Browse Source

Percent-decode each line only once

master
JustAnotherArchivist 2 years ago
parent
commit
80bf010433
1 changed file with 2 additions and 1 deletion
  1. +2
    -1
      youtube-extract

+ 2
- 1
youtube-extract View File

@@ -114,10 +114,11 @@ for origLine in sys.stdin:
 origLine = origLine.strip()
 line = re.sub(r'https?://', '//', origLine)
 line = domainPattern.sub('/www.youtube.com/', line)
+decodedLine = percentdecode(line)
 hadMatches = False
 for pattern, paramSearch, f in matchers:
 results = set()
-for m in itertools.chain((x for x in pattern.finditer(line)), (x for x in pattern.finditer(percentdecode(line))) if paramSearch else ()):
+for m in itertools.chain((x for x in pattern.finditer(line)), (x for x in pattern.finditer(decodedLine)) if paramSearch else ()):
 hadMatches = True
 r = f(m)
 if r in results:


Loading…
Cancel
Save