From 2653c58a8f00dfc8acdb4c3f68b026cce95f7bb3 Mon Sep 17 00:00:00 2001
From: Tobias Gruetzmacher <tobias-git@23.gs>
Date: Fri, 10 Jan 2020 14:53:01 +0100
Subject: [PATCH] Tests: Ignore difference in archive.org snapshots

---
 tests/modules/check_comics.py | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/tests/modules/check_comics.py b/tests/modules/check_comics.py
index c5fc11370..b4eab6596 100644
--- a/tests/modules/check_comics.py
+++ b/tests/modules/check_comics.py
@@ -1,7 +1,7 @@
 # -*- coding: utf-8 -*-
 # Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs
 # Copyright (C) 2012-2014 Bastian Kleineidam
-# Copyright (C) 2015-2019 Tobias Gruetzmacher
+# Copyright (C) 2015-2020 Tobias Gruetzmacher
 
 from __future__ import absolute_import, division, print_function
 
@@ -16,6 +16,10 @@ _locks = {}
 MaxConnections = 2
 # Maximum number of strips to get to test a comic
 MaxStrips = 5
+# Match (already-escaped) archive.org URL
+ARCHIVE_ORG_MATCH = re.compile(r'(?<=web\\.archive\\.org/web)/\d+/')
+# Matches some (maybe-escaped - because Python 2) printf-style format specifiers
+PRINTF_MATCH = re.compile(r'\\?%[0-9]*[sd]')
 
 
 def get_lock(host):
@@ -101,7 +105,8 @@ def _check_stripurl(strip, scraperobj):
         return
     # test that the stripUrl regex matches the retrieved strip URL
     urlmatch = re.escape(scraperobj.stripUrl)
-    urlmatch = urlmatch.replace('\\%', '%').replace(r"%s", r".+")
+    urlmatch = PRINTF_MATCH.sub('.+', urlmatch)
+    urlmatch = ARCHIVE_ORG_MATCH.sub(r'/\\d+/', urlmatch)
     ro = re.compile(urlmatch)
     mo = ro.match(strip.strip_url)
     err = 'strip URL {!r} does not match stripUrl pattern {}'.format(