On Thu, Aug 7, 2025 at 4:53 PM Aaron Conole <acon...@redhat.com> wrote:
>
> Mike Pattrick via dev <ovs-dev@openvswitch.org> writes:
>
> > On Thu, Aug 7, 2025 at 2:07 PM Eli Oliver via dev
> > <ovs-dev@openvswitch.org> wrote:
> >>
> >> Checkpatch is used to do spell checking for C files, currently.  However,
> >> python code is also a routine part of the Open vSwitch suite, and it should
> >> also receive spell checking where possible.
> >>
> >> This patch adds an initial implementation of spell checking to checkpatch
> >> that will catch all of the comments starting with '#', and some of the
> >> doc-string lines.  Future work would implement a more robust python
> >> parser that will handle doc-string entries.
> >>
> >> Signed-off-by: Eli Oliver <eoli...@redhat.com>
> >> ---
> >>  tests/checkpatch.at     | 64 +++++++++++++++++++++++++++++++++--------
> >>  utilities/checkpatch.py | 31 ++++++++++++++++----
> >>  2 files changed, 78 insertions(+), 17 deletions(-)
> >>
> >> diff --git a/tests/checkpatch.at b/tests/checkpatch.at
> >> index 994876e08..17bb74c43 100755
> >> --- a/tests/checkpatch.at
> >> +++ b/tests/checkpatch.at
> >> @@ -39,34 +39,55 @@ Subject: Patch this is.
> >>      fi
> >>  }
> >>
> >> -# try_checkpatch_c_file SOURCE [ERRORS] [CHECKPATCH-ARGS] [FILTER]
> >> +# try_checkpatch_file FILENAME SOURCE [ERRORS] [CHECKPATCH-ARGS] [FILTER]
> >>  #
> >> -# Runs checkpatch against test SOURCE expecting the set of specified
> >> -# ERRORS (and warnings).  Optionally, sets [CHECKPATCH-ARGS].  The
> >> -# optional FILTER can be used to adjust the expected output before
> >> +# Runs checkpatch against FILENAME with SOURCE contents, expecting the set
> >> +# of specified ERRORS (and warnings).  Optionally, sets [CHECKPATCH-ARGS].
> >> +# The optional FILTER can be used to adjust the expected output before
> >>  # processing.
> >> -try_checkpatch_c_file() {
> >> -   echo "$1" | sed 's/^    //' > test.c
> >> +try_checkpatch_file() {
> >> +   local FILENAME="$1"
> >> +   echo "$2" | sed 's/^    //' > "$FILENAME"
> >>
> >> -   # Take expected output from $2.
> >> -   if test -n "$2"; then
> >> -       echo "$2" | sed 's/^    //' > expout
> >> +   # Take expected output from $3.
> >> +   if test -n "$3"; then
> >> +       echo "$3" | sed 's/^    //' > expout
> >>     else
> >>         : > expout
> >>     fi
> >>
> >>     if test -s expout; then
> >>         AT_CHECK([OVS_SRC_DIR=$top_srcdir $PYTHON3 \
> >> -                   $top_srcdir/utilities/checkpatch.py $3 -q -f test.c],
> >> +                   $top_srcdir/utilities/checkpatch.py $4 -q -f 
> >> "$FILENAME"],
> >>                  [1], [stdout])
> >> -       AT_CHECK([sed "$4
> >> +       AT_CHECK([sed "$5
> >>                        /^Lines checked:/d
> >>                        /^$/d" stdout], [0], [expout])
> >>     else
> >>         AT_CHECK([OVS_SRC_DIR=$top_srcdir $PYTHON3 \
> >> -                   $top_srcdir/utilities/checkpatch.py $3 -q -f test.c])
> >> +                   $top_srcdir/utilities/checkpatch.py $4 -q -f 
> >> "$FILENAME"])
> >>     fi
> >>  }
> >> +
> >> +# try_checkpatch_c_file SOURCE [ERRORS] [CHECKPATCH-ARGS] [FILTER]
> >> +#
> >> +# Runs checkpatch against "C" SOURCE contents, expecting the set of
> >> +# specified ERRORS (and warnings).  Optionally, sets [CHECKPATCH-ARGS].
> >> +# The optional FILTER can be used to adjust the expected output before
> >> +# processing.
> >> +try_checkpatch_c_file() {
> >> +    try_checkpatch_file "test.c" "$@"
> >> +}
> >> +
> >> +# try_checkpatch_py_file SOURCE [ERRORS] [CHECKPATCH-ARGS] [FILTER]
> >> +#
> >> +# Runs checkpatch against "Python" SOURCE contents, expecting the set of
> >> +# specified ERRORS (and warnings).  Optionally, sets [CHECKPATCH-ARGS].
> >> +# The optional FILTER can be used to adjust the expected output before
> >> +# processing.
> >> +try_checkpatch_py_file() {
> >> +    try_checkpatch_file "test.py" "$1"
> >> +}
> >>  OVS_END_SHELL_HELPERS
> >>
> >>  AT_SETUP([checkpatch - sign-offs])
> >> @@ -763,4 +784,23 @@ try_checkpatch_c_file \
> >>      "" \
> >>      "-S"
> >>
> >> +dnl Second check with some different words
> >> +try_checkpatch_c_file \
> >> +    "/* This code is for my private prooperty. */
> >
> > Nit: property
> >
> >
> >> +    " \
> >> +    "WARNING: Possible misspelled word: \"prooperty\"
> >> +    test.c:1:
> >> +    /* This code is for my private prooperty. */" \
> >> +    "-S" \
> >> +    "/^Did you mean:/d"
> >> +
> >> +try_checkpatch_py_file \
> >> +    "# This is a python file with an intentionaly misspelt word.
> >
> > Nit: intentionally
>
> Just a note, I think the point is for these to be misspelled and cause
> checkpatch to emit the warning.  So I think they should stay as-is :)

Opa good point

-M

>
> >> +    # The user wants to check if it's working." \
> >> +    "WARNING: Possible misspelled word: \"intentionaly\"
> >> +    test.py:1:
> >> +    # This is a python file with an intentionaly misspelt word." \
> >> +    "-S" \
> >> +    "/^Did you mean:/d"
> >> +
> >>  AT_CLEANUP
> >> diff --git a/utilities/checkpatch.py b/utilities/checkpatch.py
> >> index 28d0977eb..88d74b717 100755
> >> --- a/utilities/checkpatch.py
> >> +++ b/utilities/checkpatch.py
> >> @@ -384,15 +384,32 @@ def filter_comments(current_line, keep=False):
> >>      return sanitized_line
> >>
> >>
> >> -def check_spelling(line, comment):
> >> +NOT_COMMENT = 0
> >> +C_COMMENT = 1
> >> +PY_COMMENT = 2
> >> +
> >> +
> >> +def check_spelling(line, comment_type):
> >>      if not spell_check_dict or not spellcheck:
> >>          return False
> >>
> >>      is_name_tag = re.compile(r'^\s*([a-z-]+-by): (.*@.*)$', re.I | re.M | 
> >> re.S)
> >>      if line.startswith('Fixes: ') or is_name_tag.match(line):
> >>          return False
> >> +    if comment_type == NOT_COMMENT:
> >> +        words = line
> >> +    elif comment_type == C_COMMENT:
> >> +        words = filter_comments(line, True)
> >> +    elif comment_type == PY_COMMENT:
> >> +        words = ""
> >> +        matched = re.search(r'#[^!](.*)$', line)
> >> +        if matched:
> >> +            words = matched.group(0)[1:]
> >
> > Instead of
> >
> > matched = re.search(r'#[^!](.*)$', line)
> > matched.group(0)[1:]
> >
> > It is probably simpler to just include the whole comment in the group
> > and reference it by group ID. Eg:
> >
> > matched = re.search(r'#([^!].*)$', line)
> > matched.group(1)
>
> Agreed, it looks nicer to have matched.group(1)
>
> >> +        else:
> >> +            words = line.replace("'''", '').replace('"""', '').strip()
> >> +    else:
> >> +        return False
> >>
> >> -    words = filter_comments(line, True) if comment else line
> >>      words = words.replace(':', ' ').split(' ')
> >>
> >>      flagged_words = []
> >> @@ -599,7 +616,11 @@ checks = [
> >>
> >>      {'regex': r'(\.c|\.h)(\.in)?$', 'match_name': None,
> >>       'prereq': lambda x: has_comment(x),
> >> -     'check': lambda x: check_spelling(x, True)},
> >> +     'check': lambda x: check_spelling(x, comment_type=C_COMMENT)},
> >> +
> >> +    {'regex': r'\.py(\.in)?$', 'match_name': None,
> >> +     'prereq': lambda x: "#" in x or "'''" in x or '"""' in x,
> >
> > Not all multiline strings in python are docstrings. However, it may
> > not make too much of a difference here.
> >
> >> +     'check': lambda x: check_spelling(x, PY_COMMENT)},
> >>
> >>      {'regex': r'(\.c|\.h)(\.in)?$', 'match_name': None,
> >>       'check': lambda x: empty_return_with_brace(x),
> >> @@ -783,7 +804,7 @@ def run_file_checks(text):
> >>  def run_subject_checks(subject, spellcheck=False):
> >>      warnings = False
> >>
> >> -    if spellcheck and check_spelling(subject, False):
> >> +    if spellcheck and check_spelling(subject, comment_type=NOT_COMMENT):
> >>          warnings = True
> >>
> >>      summary = subject[subject.rindex(': ') + 2:]
> >> @@ -1005,7 +1026,7 @@ def ovs_checkpatch_parse(text, filename, 
> >> author=None, committer=None):
> >>                              '--abbrev=12 COMMIT_REF\n')
> >>                  print("%d: %s\n" % (lineno, line))
> >>              elif spellcheck:
> >> -                check_spelling(line, False)
> >> +                check_spelling(line, comment_type=NOT_COMMENT)
> >>              for typo, correct in tags_typos.items():
> >>                  m = re.match(typo, line, re.I)
> >>                  if m:
> >> --
> >> 2.49.0
> >>
> >>
> >> _______________________________________________
> >> dev mailing list
> >> d...@openvswitch.org
> >> https://mail.openvswitch.org/mailman/listinfo/ovs-dev
> >>
> >
> > _______________________________________________
> > dev mailing list
> > d...@openvswitch.org
> > https://mail.openvswitch.org/mailman/listinfo/ovs-dev
>

_______________________________________________
dev mailing list
d...@openvswitch.org
https://mail.openvswitch.org/mailman/listinfo/ovs-dev

Reply via email to