cs.app.pilfer.sitemap: Wikipedia: fix article path pattern, add a pattern for the commons images
1 files changed, 9 insertions(+), 1 deletions(-) M lib/python/cs/app/pilfer/sitemap.py
M lib/python/cs/app/pilfer/sitemap.py +9 -1
@@ 230,10 230,18 @@ class Wikipedia(SiteMap): ( ( '*.wikipedia.org', - 'wiki/(?P<title>[^:/]+)$', + r'/wiki/(?P<title>[^:/]+)$', ), 'wiki/{title}', ), + # https://upload.wikimedia.org/wikipedia/commons/thumb/3/35/Carbonate-outcrops_world.jpg/620px-Carbonate-outcrops_world.jpg + ( + ( + 'upload.wikimedia.org', + r'/wikipedia/commons/(?P<subpath>.*\.(jpg|gif|png))$', + ), + 'wiki/commons/{subpath}', + ), ] @promote