diff options
| author | Christian Krinitsin <mail@krinitsin.com> | 2025-05-30 14:51:13 +0000 |
|---|---|---|
| committer | Christian Krinitsin <mail@krinitsin.com> | 2025-05-30 14:51:13 +0000 |
| commit | 225caa38269323af1bfc2daadff5ec8bd930747f (patch) | |
| tree | e0a5fefde9ee100ba6f32fb36de6707490e4164e /mailinglist/downloader.py | |
| parent | 904141bfb8d5385b75eb3b7afec1dcda89af65a7 (diff) | |
| download | qemu-analysis-225caa38269323af1bfc2daadff5ec8bd930747f.tar.gz qemu-analysis-225caa38269323af1bfc2daadff5ec8bd930747f.zip | |
add mailinglist scraper results
Diffstat (limited to 'mailinglist/downloader.py')
| -rwxr-xr-x | mailinglist/downloader.py | 4 |
1 file changed, 2 insertions, 2 deletions
```diff
diff --git a/mailinglist/downloader.py b/mailinglist/downloader.py
index e793271e0..ebe4d2d7e 100755
--- a/mailinglist/downloader.py
+++ b/mailinglist/downloader.py
@@ -63,13 +63,13 @@ def main():
  # existing thread
  re_match = match(r'(?i)^re:\s*(.*)', text) # matches 'Re:'
  if re_match:
- title_hash = str(hash(re_match.group(1).strip()))[0:7]
+ title_hash = str(hash(re_match.group(1).strip()))[1:8]
  if path.exists(f"output_mailinglist/{title_hash}"):
  process_thread(urljoin(url, href), title_hash)
  continue
 
  # new thread
- title_hash = str(hash(text.strip()))[0:7]
+ title_hash = str(hash(text.strip()))[1:8]
  if path.exists(f"output_mailinglist/{title_hash}"):
  print(f"ERROR: {title_hash} should not exist!")
  continue
```