documentation/tests/checkers/rst_style.py

import re

import sphinxlint


ALLOWED_HEADING_CHARS = ['=', '-', '~', '*', '^']  # In the same order as in the guidelines.
MAIN_HEADING_CHAR = ALLOWED_HEADING_CHARS[0]
MAIN_HEADING_RE = re.compile(rf'{MAIN_HEADING_CHAR}+\n[^\n]+\n{MAIN_HEADING_CHAR}+\n')
HEADING_DELIMITER_RE = re.compile(
    '^(' + '|'.join(rf'\{char}+' for char in ALLOWED_HEADING_CHARS) + ')\n$'
)
FORBIDDEN_HEADING_CHARS = [
    '#', '"', '\'', '+', '`', '@', '!', ',', '.', '/'
]  # Exhaustive list at https://docutils.sourceforge.io/docs/ref/rst/restructuredtext.html#sections.
FORBIDDEN_HEADING_DELIMITER_RE = re.compile(
    '^(' + '|'.join(rf'\{char}+' for char in FORBIDDEN_HEADING_CHARS) + ')\n$'
)
GIT_CONFLICT_MARKERS = ['<' * 7, '>' * 7]
ALLOWED_EARLY_BREAK_RE = re.compile(r'^\s*(\.\. |:\S+:\s+)', re.IGNORECASE)  # Contains markup.


@sphinxlint.checker('.rst')
def check_heading_delimiters_characters(file, lines, options=None):
    """ Check that heading delimiters use only allowed characters. """
    for lno, line in enumerate(lines):
        if FORBIDDEN_HEADING_DELIMITER_RE.search(line):
            yield lno + 1, f"illegal use of the character {line[0]} in heading delimiters; use" \
                           f" any of {', '.join(ALLOWED_HEADING_CHARS)} instead"


@sphinxlint.checker('.rst')
def check_heading_delimiters_order(file, lines, options=None):
    """ Check that heading delimiters appear in the correct order. """
    last_delimiter_char_index = -1  # The index of the heading delimiter char in the ordered list.
    for lno, line in enumerate(lines):
        if HEADING_DELIMITER_RE.search(line):  # The line is a heading delimiter.
            delimiter_char = line[0]
            delimiter_char_index = ALLOWED_HEADING_CHARS.index(delimiter_char)
            if delimiter_char_index > last_delimiter_char_index + 1:
                # There is a leap of more than 1 in the chars used for the heading delimiters.
                last_delimiter_char = ALLOWED_HEADING_CHARS[last_delimiter_char_index] \
                    if last_delimiter_char_index != -1 else None
                yield lno + 1, f"the heading delimiter {delimiter_char} is not allowed after a" \
                               f" heading with {last_delimiter_char} as delimiter; follow this" \
                               f" order: {', '.join(ALLOWED_HEADING_CHARS)}"
            last_delimiter_char_index = delimiter_char_index


@sphinxlint.checker('.rst')
def check_max_one_main_heading(file, lines, options=None):
    """ Check that there is at most one main heading (h1) per document. """
    code = "".join(lines)
    nb_main_headings = len(MAIN_HEADING_RE.findall(code))
    if nb_main_headings > 1:
        yield 0, "the document should have only one main heading"


@sphinxlint.checker('.rst')
def check_min_one_main_heading(file, lines, options=None):
    """ Check that there is a main heading (h1) on document when it contains other headings. """
    heading_found, main_heading_found = False, False
    for lno, line in enumerate(lines):
        if HEADING_DELIMITER_RE.search(line):  # The line is a heading delimiter.
            heading_found = True
            if MAIN_HEADING_RE.search(''.join(lines[lno - 2:lno + 1])):  # Lower delimiter of h1.
                main_heading_found = True
                break

    if heading_found and not main_heading_found:
        yield 0, "the document should have a main heading (h1)"


@sphinxlint.checker('.rst')
def check_heading_delimiters_length(file, lines, options=None):
    """ Check that heading delimiters have the same length as their heading. """
    for lno, line in enumerate(lines):
        if HEADING_DELIMITER_RE.search(line):  # The line is a heading delimiter.
            if MAIN_HEADING_RE.search(''.join(lines[lno:lno+3])):  # Upper delimiter of h1.
                heading_lno = lno + 1
            else:  # Lower delimiter of a heading of any level.
                heading_lno = lno - 1
            if len(line.rstrip()) != len(lines[heading_lno].rstrip()):
                yield lno + 1, "the heading delimiter should have the same length as its heading"


@sphinxlint.checker('.rst')
def check_heading_spacing(file, lines, options=None):
    """ Check that headings are preceded and followed by at least one blank line. """
    for lno, line in enumerate(lines):
        if HEADING_DELIMITER_RE.search(line):  # The line is a heading delimiter.
            if MAIN_HEADING_RE.search(''.join(lines[lno:lno+3])):  # Upper delimiter of h1.
                continue  # We handle this heading via its lower delimiter.

            heading_lno = lno - 1
            if MAIN_HEADING_RE.search(''.join(lines[lno-2:lno+1])):  # Lower delimiter of h1.
                main_heading = True
            else:  # Lower delimiter of a heading of level 2-6.
                main_heading = False
            lno_before_heading = heading_lno - (2 if main_heading else 1)
            if lno_before_heading >= 0 and lines[lno_before_heading] != '\n':
                # Heading doesn't have to be preceded by a blank line if on first line of the file.
                yield heading_lno + 1, "the heading should be preceded by a blank line"
            if lines[heading_lno + 2] != '\n':
                yield heading_lno + 1, "the heading should be followed by a blank line"


@sphinxlint.checker('.rst', enabled=False)
def check_early_line_breaks(file, lines, options=None):
    """ Checks that no line breaks early, i.e., before using as much of the max length as possible.

    Note: `make review` only
    """

    def is_valid_line(line_, forbidden_starting_chars_):
        """ Allowed to break early - handle tables and bullets """
        return not ALLOWED_EARLY_BREAK_RE.search(line_) \
            and not HEADING_DELIMITER_RE.search(line_) \
            and not line_.startswith('\n') \
            and not line_.lstrip().startswith(forbidden_starting_chars_) \
            and len(line_) <= options.max_line_length

    def get_next_line_first_word(next_line_):
        """ Return the first word of the next line """
        if next_line_.startswith(' '):
            next_line_dict = {
                '*': lambda x: x.split('* ', 1)[0],
                '-': lambda x: x.split('- ', 1)[0],
                '#.': lambda x: x.split('#. ', 1)[0],
                'default': lambda x: x.split(' ', 1)[0]
            }
            return next_line_dict.get(next_line_.lstrip()[:2], next_line_dict['default'])(
                next_line_.lstrip()
            )
        else:
            return next_line_.split(' ', 1)[0]

    for lno, line in enumerate(lines):
        if lno + 1 < len(lines):
            next_line = lines[lno + 1]
            if (is_valid_line(line, ('+', '|'))
                and is_valid_line(next_line, ('+', '|', '- ', '* ', '#. '))
            ):
                current_line_remaining_space = options.max_line_length - len(line)
                next_line_first_word = get_next_line_first_word(next_line).rstrip()
                if current_line_remaining_space > len(next_line_first_word):
                    yield lno + 1, f"consider moving \"{next_line_first_word}\" to line {lno + 1}"


@sphinxlint.checker('.rst', '.py', '.js', '.xml', '.css', '.sass', '.less', '.po', '.pot')
def check_git_conflict_markers(file, lines, options=None):
    """ Check that there are no conflict markers. """
    for lno, line in enumerate(lines):
        if any(marker in line for marker in GIT_CONFLICT_MARKERS):
            yield lno + 1, "the git conflict should be resolved"
[ADD] tests: add sphinxlint checkers for headings task-2801043 X-original-commit: ad768c33aa1b239c5fb221717036076483fabb99 Part-of: odoo/documentation#3553 Co-authored-by: Antoine Vandevenne (anv) <anv@odoo.com> 2022-11-23 00:17:30 +07:00			`import re`

			`import sphinxlint`


			`ALLOWED_HEADING_CHARS = ['=', '-', '~', '*', '^'] # In the same order as in the guidelines.`
			`MAIN_HEADING_CHAR = ALLOWED_HEADING_CHARS[0]`
			`MAIN_HEADING_RE = re.compile(rf'{MAIN_HEADING_CHAR}+\n[^\n]+\n{MAIN_HEADING_CHAR}+\n')`
			`HEADING_DELIMITER_RE = re.compile(`
			`'^(' + '\|'.join(rf'\{char}+' for char in ALLOWED_HEADING_CHARS) + ')\n$'`
			`)`
			`FORBIDDEN_HEADING_CHARS = [`
			'#', '"', '\'', '+', '`', '@', '!', ',', '.', '/'
			`] # Exhaustive list at https://docutils.sourceforge.io/docs/ref/rst/restructuredtext.html#sections.`
			`FORBIDDEN_HEADING_DELIMITER_RE = re.compile(`
			`'^(' + '\|'.join(rf'\{char}+' for char in FORBIDDEN_HEADING_CHARS) + ')\n$'`
			`)`
[IMP] rst_style: new linters X-original-commit: a33db1cbbbd40df1e982026e04f69a7e9c6584d2 Part-of: odoo/documentation#3796 2023-02-17 19:38:17 +07:00			`GIT_CONFLICT_MARKERS = ['<' * 7, '>' * 7]`
[IMP] test/rst_style, Makefile: add optional review checkers task-2801043 closes odoo/documentation#5358 X-original-commit: 8eec0e76346ec3167399ed83146e42cbf0cdcadb Signed-off-by: Antoine Vandevenne (anv) <anv@odoo.com> 2023-08-05 02:29:37 +07:00			`ALLOWED_EARLY_BREAK_RE = re.compile(r'^\s*(\.\. \|:\S+:\s+)', re.IGNORECASE) # Contains markup.`
[IMP] rst_style: new linters X-original-commit: a33db1cbbbd40df1e982026e04f69a7e9c6584d2 Part-of: odoo/documentation#3796 2023-02-17 19:38:17 +07:00
[ADD] tests: add sphinxlint checkers for headings task-2801043 X-original-commit: ad768c33aa1b239c5fb221717036076483fabb99 Part-of: odoo/documentation#3553 Co-authored-by: Antoine Vandevenne (anv) <anv@odoo.com> 2022-11-23 00:17:30 +07:00
			`@sphinxlint.checker('.rst')`
			`def check_heading_delimiters_characters(file, lines, options=None):`
			`""" Check that heading delimiters use only allowed characters. """`
			`for lno, line in enumerate(lines):`
			`if FORBIDDEN_HEADING_DELIMITER_RE.search(line):`
			`yield lno + 1, f"illegal use of the character {line[0]} in heading delimiters; use" \`
			`f" any of {', '.join(ALLOWED_HEADING_CHARS)} instead"`


			`@sphinxlint.checker('.rst')`
			`def check_heading_delimiters_order(file, lines, options=None):`
			`""" Check that heading delimiters appear in the correct order. """`
			`last_delimiter_char_index = -1 # The index of the heading delimiter char in the ordered list.`
			`for lno, line in enumerate(lines):`
			`if HEADING_DELIMITER_RE.search(line): # The line is a heading delimiter.`
			`delimiter_char = line[0]`
			`delimiter_char_index = ALLOWED_HEADING_CHARS.index(delimiter_char)`
			`if delimiter_char_index > last_delimiter_char_index + 1:`
			`# There is a leap of more than 1 in the chars used for the heading delimiters.`
			`last_delimiter_char = ALLOWED_HEADING_CHARS[last_delimiter_char_index] \`
			`if last_delimiter_char_index != -1 else None`
			`yield lno + 1, f"the heading delimiter {delimiter_char} is not allowed after a" \`
			`f" heading with {last_delimiter_char} as delimiter; follow this" \`
			`f" order: {', '.join(ALLOWED_HEADING_CHARS)}"`
			`last_delimiter_char_index = delimiter_char_index`


			`@sphinxlint.checker('.rst')`
			`def check_max_one_main_heading(file, lines, options=None):`
			`""" Check that there is at most one main heading (h1) per document. """`
			`code = "".join(lines)`
			`nb_main_headings = len(MAIN_HEADING_RE.findall(code))`
			`if nb_main_headings > 1:`
			`yield 0, "the document should have only one main heading"`


			`@sphinxlint.checker('.rst')`
			`def check_min_one_main_heading(file, lines, options=None):`
			`""" Check that there is a main heading (h1) on document when it contains other headings. """`
			`heading_found, main_heading_found = False, False`
			`for lno, line in enumerate(lines):`
			`if HEADING_DELIMITER_RE.search(line): # The line is a heading delimiter.`
			`heading_found = True`
			`if MAIN_HEADING_RE.search(''.join(lines[lno - 2:lno + 1])): # Lower delimiter of h1.`
			`main_heading_found = True`
			`break`

			`if heading_found and not main_heading_found:`
			`yield 0, "the document should have a main heading (h1)"`


			`@sphinxlint.checker('.rst')`
			`def check_heading_delimiters_length(file, lines, options=None):`
			`""" Check that heading delimiters have the same length as their heading. """`
			`for lno, line in enumerate(lines):`
			`if HEADING_DELIMITER_RE.search(line): # The line is a heading delimiter.`
			`if MAIN_HEADING_RE.search(''.join(lines[lno:lno+3])): # Upper delimiter of h1.`
			`heading_lno = lno + 1`
			`else: # Lower delimiter of a heading of any level.`
			`heading_lno = lno - 1`
			`if len(line.rstrip()) != len(lines[heading_lno].rstrip()):`
			`yield lno + 1, "the heading delimiter should have the same length as its heading"`


			`@sphinxlint.checker('.rst')`
			`def check_heading_spacing(file, lines, options=None):`
			`""" Check that headings are preceded and followed by at least one blank line. """`
			`for lno, line in enumerate(lines):`
			`if HEADING_DELIMITER_RE.search(line): # The line is a heading delimiter.`
			`if MAIN_HEADING_RE.search(''.join(lines[lno:lno+3])): # Upper delimiter of h1.`
			`continue # We handle this heading via its lower delimiter.`

			`heading_lno = lno - 1`
			`if MAIN_HEADING_RE.search(''.join(lines[lno-2:lno+1])): # Lower delimiter of h1.`
			`main_heading = True`
			`else: # Lower delimiter of a heading of level 2-6.`
			`main_heading = False`
			`lno_before_heading = heading_lno - (2 if main_heading else 1)`
			`if lno_before_heading >= 0 and lines[lno_before_heading] != '\n':`
			`# Heading doesn't have to be preceded by a blank line if on first line of the file.`
			`yield heading_lno + 1, "the heading should be preceded by a blank line"`
			`if lines[heading_lno + 2] != '\n':`
			`yield heading_lno + 1, "the heading should be followed by a blank line"`


[IMP] test/rst_style, Makefile: add optional review checkers task-2801043 closes odoo/documentation#5358 X-original-commit: 8eec0e76346ec3167399ed83146e42cbf0cdcadb Signed-off-by: Antoine Vandevenne (anv) <anv@odoo.com> 2023-08-05 02:29:37 +07:00			`@sphinxlint.checker('.rst', enabled=False)`
			`def check_early_line_breaks(file, lines, options=None):`
			`""" Checks that no line breaks early, i.e., before using as much of the max length as possible.`

			Note: `make review` only
			`"""`

			`def is_valid_line(line_, forbidden_starting_chars_):`
			`""" Allowed to break early - handle tables and bullets """`
			`return not ALLOWED_EARLY_BREAK_RE.search(line_) \`
			`and not HEADING_DELIMITER_RE.search(line_) \`
			`and not line_.startswith('\n') \`
			`and not line_.lstrip().startswith(forbidden_starting_chars_) \`
			`and len(line_) <= options.max_line_length`

			`def get_next_line_first_word(next_line_):`
			`""" Return the first word of the next line """`
			`if next_line_.startswith(' '):`
			`next_line_dict = {`
			`'': lambda x: x.split(' ', 1)[0],`
			`'-': lambda x: x.split('- ', 1)[0],`
			`'#.': lambda x: x.split('#. ', 1)[0],`
			`'default': lambda x: x.split(' ', 1)[0]`
			`}`
[ADD] tests: image compression and resource file name checkers task-2801043 closes odoo/documentation#4870 closes odoo/documentation#5436 X-original-commit: fa90e27c4e04641283d553b4d358765a4f1de113 Signed-off-by: Antoine Vandevenne (anv) <anv@odoo.com> Co-authored-by: Antoine Vandevenne (anv) <anv@odoo.com> 2023-04-17 20:46:16 +07:00			`return next_line_dict.get(next_line_.lstrip()[:2], next_line_dict['default'])(`
[IMP] test/rst_style, Makefile: add optional review checkers task-2801043 closes odoo/documentation#5358 X-original-commit: 8eec0e76346ec3167399ed83146e42cbf0cdcadb Signed-off-by: Antoine Vandevenne (anv) <anv@odoo.com> 2023-08-05 02:29:37 +07:00			`next_line_.lstrip()`
			`)`
			`else:`
			`return next_line_.split(' ', 1)[0]`

			`for lno, line in enumerate(lines):`
			`if lno + 1 < len(lines):`
			`next_line = lines[lno + 1]`
			`if (is_valid_line(line, ('+', '\|'))`
			`and is_valid_line(next_line, ('+', '\|', '- ', '* ', '#. '))`
			`):`
			`current_line_remaining_space = options.max_line_length - len(line)`
[ADD] tests: image compression and resource file name checkers task-2801043 closes odoo/documentation#4870 closes odoo/documentation#5436 X-original-commit: fa90e27c4e04641283d553b4d358765a4f1de113 Signed-off-by: Antoine Vandevenne (anv) <anv@odoo.com> Co-authored-by: Antoine Vandevenne (anv) <anv@odoo.com> 2023-04-17 20:46:16 +07:00			`next_line_first_word = get_next_line_first_word(next_line).rstrip()`
[IMP] test/rst_style, Makefile: add optional review checkers task-2801043 closes odoo/documentation#5358 X-original-commit: 8eec0e76346ec3167399ed83146e42cbf0cdcadb Signed-off-by: Antoine Vandevenne (anv) <anv@odoo.com> 2023-08-05 02:29:37 +07:00			`if current_line_remaining_space > len(next_line_first_word):`
			`yield lno + 1, f"consider moving \"{next_line_first_word}\" to line {lno + 1}"`


[REF] tests: split checkers task-2801043 closes odoo/documentation#3796 X-original-commit: 8e8c4668927681f364adb8b5904e64bece78fce8 Signed-off-by: Antoine Vandevenne (anv) <anv@odoo.com> Signed-off-by: Victor Feyens (vfe) <vfe@odoo.com> 2023-03-09 22:03:21 +07:00			`@sphinxlint.checker('.rst', '.py', '.js', '.xml', '.css', '.sass', '.less', '.po', '.pot')`
			`def check_git_conflict_markers(file, lines, options=None):`
			`""" Check that there are no conflict markers. """`
			`for lno, line in enumerate(lines):`
			`if any(marker in line for marker in GIT_CONFLICT_MARKERS):`
			`yield lno + 1, "the git conflict should be resolved"`