cs.app.pilfer.sitemap: Wikipedia: fix article path pattern, add a pattern for the commons images
1 files changed, 9 insertions(+), 1 deletions(-)

M lib/python/cs/app/pilfer/sitemap.py
M lib/python/cs/app/pilfer/sitemap.py +9 -1
@@ 230,10 230,18 @@ class Wikipedia(SiteMap):
       (
           (
               '*.wikipedia.org',
-              'wiki/(?P<title>[^:/]+)$',
+              r'/wiki/(?P<title>[^:/]+)$',
           ),
           'wiki/{title}',
       ),
+      # https://upload.wikimedia.org/wikipedia/commons/thumb/3/35/Carbonate-outcrops_world.jpg/620px-Carbonate-outcrops_world.jpg
+      (
+          (
+              'upload.wikimedia.org',
+              r'/wikipedia/commons/(?P<subpath>.*\.(jpg|gif|png))$',
+          ),
+          'wiki/commons/{subpath}',
+      ),
   ]
 
   @promote