From 5626caa091d02e0277734931bd3ce86d4751ce47 Mon Sep 17 00:00:00 2001 From: Andrzej Kopytko Date: Mon, 30 Dec 2024 17:48:01 +0100 Subject: [PATCH] Docs port for sitemap fix to 24.6 (#28234) ### Details: - *item1* - *...* ### Tickets: - *ticket-id* --- .../__init__.py | 23 +++++++++++-------- 1 file changed, 13 insertions(+), 10 deletions(-) diff --git a/docs/openvino_custom_sphinx_sitemap/openvino_custom_sphinx_sitemap/__init__.py b/docs/openvino_custom_sphinx_sitemap/openvino_custom_sphinx_sitemap/__init__.py index 8d31859d5bcbef..e4bb06f7fad550 100644 --- a/docs/openvino_custom_sphinx_sitemap/openvino_custom_sphinx_sitemap/__init__.py +++ b/docs/openvino_custom_sphinx_sitemap/openvino_custom_sphinx_sitemap/__init__.py @@ -126,21 +126,24 @@ def process_coveo_meta(meta, url, link): if tag_name == 'ovdoctype': ET.SubElement(namespace_element, tag_name).text = process_link(link) elif tag_name == 'ovcategory' and loc_element is not None: - ET.SubElement(namespace_element, tag_name).text = extract_hierarchy(loc_element.text) + ET.SubElement(namespace_element, tag_name).text = extract_categories(loc_element.text) elif tag_name == 'ovversion': ET.SubElement(namespace_element, tag_name).text = tag_value def process_link(link): if '/' in link: - return link.split('/')[0].replace("-", " ") - return link.split('.html')[0].replace("-", " ") + return format_segment(link.split('/')[0].replace("-", " ")) + return format_segment(link.split('.html')[0].replace("-", " ")) -def extract_hierarchy(link): +def extract_categories(link): path = link.split("://")[-1] segments = path.split('/')[1:] if segments and segments[-1].endswith('.html'): segments = segments[:-1] + if segments: + segments = segments[1:] + if segments and '.' in segments[0]: year, *rest = segments[0].split('.') if year.isdigit() and len(year) == 4: @@ -148,13 +151,13 @@ def extract_hierarchy(link): segments = [format_segment(segment) for segment in segments] - hierarchy = [] - for i in range(1, len(segments) + 1): - hierarchy.append('|'.join(segments[:i])) - - return ';'.join(hierarchy) + if segments: + hierarchy = ['|'.join(segments[:i]) for i in range(1, len(segments) + 1)] + return ';'.join(hierarchy) + + return "No category" def format_segment(segment): - if segment == 'c_cpp_api': segment = 'c/c++_api' + if segment == 'c_cpp_api': segment = 'C/C++_api' return ' '.join(word.capitalize() for word in segment.replace('-', ' ').replace('_', ' ').split()) \ No newline at end of file