Update sitemap generator with current series

The series list hasn't been updated in four years; we need to get
current content into the sitemap and drop unmaintained releases.

Change-Id: If2f9a3459f7570b92328002ca8c13ebcca67f54c
This commit is contained in:
Dr. Jens Harbott 2024-03-28 09:26:18 +01:00
parent a5cadb200b
commit a014b0bda9
2 changed files with 19 additions and 11 deletions

View File

@ -31,13 +31,10 @@ class SitemapSpider(spiders.CrawlSpider):
name = 'sitemap'
MAINT_SERIES = [
'ocata',
'pike',
'queens',
'rocky',
'stein',
'train',
'ussuri',
'zed',
'2023.1',
'2023.2',
'2024.1',
]
MAINT_RELEASES_PAT = re.compile('^.*/(' + '|'.join(MAINT_SERIES) + ')/')
LATEST_PAT = re.compile('^.*/latest/')
@ -69,6 +66,17 @@ class SitemapSpider(spiders.CrawlSpider):
r'/liberty/',
r'/mitaka/',
r'/newton/',
r'/ocata/',
r'/pike/',
r'/queens/',
r'/rocky/',
r'/stein/',
r'/train/',
r'/ussuri/',
r'/victoria/',
r'/wallaby/',
r'/xena/',
r'/yoga/',
],
deny_domains=[
# docs.o.o redirects to a few sites, filter

View File

@ -61,7 +61,7 @@ class TestSitemapSpider(unittest.TestCase):
path = sitemap_file.urlparse.SplitResult(
scheme='https',
netloc='docs.openstack.org',
path='/ocata/something.html',
path='/2024.1/something.html',
query='',
fragment=''
)
@ -79,7 +79,7 @@ class TestSitemapSpider(unittest.TestCase):
path = sitemap_file.urlparse.SplitResult(
scheme='https',
netloc='docs.openstackorg',
path='/ocata/something.html',
path='/2024.1/something.html',
query='',
fragment=''
)
@ -97,7 +97,7 @@ class TestSitemapSpider(unittest.TestCase):
path = sitemap_file.urlparse.SplitResult(
scheme='https',
netloc='docs.openstack.org',
path='/ocata/something.html',
path='/2024.1/something.html',
query='',
fragment=''
)
@ -131,7 +131,7 @@ class TestSitemapSpider(unittest.TestCase):
path = sitemap_file.urlparse.SplitResult(
scheme='https',
netloc='docs.openstack.org',
path='/ocata',
path='/2024.1',
query='',
fragment=''
)