Skip to content

Commit

Permalink
fix regex
Browse files Browse the repository at this point in the history
  • Loading branch information
jimregan committed Nov 6, 2019
1 parent ea46c00 commit 0a2089e
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion Lib/corpuscrawler/crawl_ga.py
Original file line number Diff line number Diff line change
Expand Up @@ -61,7 +61,7 @@ def _rte_writable_paragraph(text):
return True

def _check_rte_sitemap(url):
- urlmatch = re.search(r'http://www.rte.ie/sitemap-([0-9]+)0000.xml', url)
+ urlmatch = re.search(r'https?://www.rte.ie/sitemap-([0-9]+)0000.xml', url)
try:
if int(urlmatch.group(1)) < 40:
return True
Expand Down

0 comments on commit 0a2089e

Please sign in to comment.