Document what the spellchecker scanner is doing.

2008-11-03 08:25:16 +00:00 · 2008-11-03 08:25:16 +00:00 · 2cc7e6f954
commit 2cc7e6f954
parent 53d2b62b88
1 changed files with 11 additions and 0 deletions
--- a/data/tools/wmllint
+++ b/data/tools/wmllint
@ -1189,26 +1189,37 @@ def spellcheck(fn, d):
            # Fold continued lines
            value = re.sub(r'" *\+\s*_ *"', "", value)
            for token in value.split():
+                # Try it with simple lowercasing first
                lowered = token.lower()
                if d.check(lowered):
                    continue
+                # Strip leading punctuastion and grotty Wesnoth highlighters
                while lowered and lowered[0] in " \t(`@*'%_":
                    lowered = lowered[1:]
+                # Not interested in interpolations or numeric literals
+                if not lowered or lowered.startswith("$"):
+                    continue
+                # Suffix handling
                while lowered and lowered[-1] in "_-*').,:;?!& \t":
                    lowered = lowered[:-1]
+                # Not interested in interpolations or numeric literals
                if not lowered or lowered.startswith("$") or lowered[0].isdigit():
                    continue
+               # Nuke balanced string quotes if present
                lowered = string_strip(lowered)
                if lowered and d.check(lowered):
                    continue
+                # No match? Strip posessive suffixes and try again.
                elif lowered.endswith("'s") and d.check(lowered[:-2]):
                    continue
                elif lowered.endswith("s'") and d.check(lowered[:-2]):
                    continue
+                # Hyphenated compounds need all their parts good
                if "-" in lowered:
                    parts = lowered.split("-")
                    if filter(lambda w: not w or d.check(w), parts) == parts:
                        continue
+                # Modifier literals aren't interesting
                if re.match("[+-][0-9]", lowered):
                    continue
                # Match various onomatopoetic exclamations of variable form