From f021598fca84eba803b39832f3436005cf1e788a Mon Sep 17 00:00:00 2001 From: Adam Bittlingmayer Date: Sun, 14 Jan 2024 00:03:27 +0400 Subject: [PATCH 1/2] Update test_enforce_style.py --- .github/tests/test_enforce_style.py | 19 +++++++++++++------ 1 file changed, 13 insertions(+), 6 deletions(-) diff --git a/.github/tests/test_enforce_style.py b/.github/tests/test_enforce_style.py index ac7a0387..128174c7 100644 --- a/.github/tests/test_enforce_style.py +++ b/.github/tests/test_enforce_style.py @@ -5,6 +5,8 @@ from .find_missing_links import walk_directory +# Checks that we use UK spellings for words that differ between the UK and US +# Permits US spellings for proper nouns. # Load the English language model for Spacy NLP = spacy.load("en_core_web_sm") @@ -54,16 +56,21 @@ def check_spellings(file_path): raw_word = re.sub(r'^[^a-zA-Z\'-]*|[^a-zA-Z\'-]*$', '', word) if raw_word: - # Skip words that have the same spelling in both US and UK English or are wrong for both - if ((us.check(raw_word) == uk.check(raw_word)) or (uk.check(raw_word) and not us.check(raw_word))): - continue + # Skip CamelCase and all-uppercase words if is_camel_case(raw_word) or raw_word.isupper(): continue - # Check if the word is a proper noun in context - assert is_proper_noun_in_context(_line, raw_word), \ - f'US-specific spelling: "{raw_word}" in {file_path} \n\n\t at the line: {line} \n\n\tsuggestions: {uk.suggest(raw_word)} \n' + # If a US word but not a UK word + if us.check(raw_word) and not uk.check(raw_word) + + # Check if the word is a proper noun in context + # This is a relatively expensive check. + assert is_proper_noun_in_context(_line, raw_word), f'''US-specific spelling: + "{ raw_word }" in { file_path } + line: { line } + suggestions: { uk.suggest(raw_word) } + ''' EXCLUDE_DIRS = ['vendor'] EXCLUDE_FILES = ['README.md', 'CHANGELOG.md'] From f0ed9d29a796af678ecd9b927a7cdb1b1030bd30 Mon Sep 17 00:00:00 2001 From: Adam Bittlingmayer Date: Mon, 22 Jan 2024 13:13:56 +0400 Subject: [PATCH 2/2] Update test_enforce_style.py --- .github/tests/test_enforce_style.py | 30 ++++++++++++++--------------- 1 file changed, 14 insertions(+), 16 deletions(-) diff --git a/.github/tests/test_enforce_style.py b/.github/tests/test_enforce_style.py index 128174c7..3c1585b1 100644 --- a/.github/tests/test_enforce_style.py +++ b/.github/tests/test_enforce_style.py @@ -55,22 +55,20 @@ def check_spellings(file_path): # Extract only the letters raw_word = re.sub(r'^[^a-zA-Z\'-]*|[^a-zA-Z\'-]*$', '', word) - if raw_word: - - # Skip CamelCase and all-uppercase words - if is_camel_case(raw_word) or raw_word.isupper(): - continue - - # If a US word but not a UK word - if us.check(raw_word) and not uk.check(raw_word) - - # Check if the word is a proper noun in context - # This is a relatively expensive check. - assert is_proper_noun_in_context(_line, raw_word), f'''US-specific spelling: - "{ raw_word }" in { file_path } - line: { line } - suggestions: { uk.suggest(raw_word) } - ''' + # Skip non-alpha, ALLCAPS and camelCase/CamelCase + if not raw_word or raw_word.isupper() or is_camel_case(raw_word): + continue + + # If a US word but not a UK word + if us.check(raw_word) and not uk.check(raw_word): + + # Check if the word is a proper noun in context + # This is a relatively expensive check. + assert is_proper_noun_in_context(_line, raw_word), f'''US-specific spelling: + "{ raw_word }" in { file_path } + line: { line } + suggestions: { uk.suggest(raw_word) } + ''' EXCLUDE_DIRS = ['vendor'] EXCLUDE_FILES = ['README.md', 'CHANGELOG.md']