From f23be008f11ff3a35963264c8c9dce6ac4060346 Mon Sep 17 00:00:00 2001
From: "Eric S. Raymond"
Date: Thu, 17 Jun 2010 21:41:45 +0000
Subject: [PATCH] Handle more UTF-8 wackiness gracefully in the spellchecker.

---
 data/tools/wmllint | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/data/tools/wmllint b/data/tools/wmllint
index afa149c9587..7a8bd96e844 100755
--- a/data/tools/wmllint
+++ b/data/tools/wmllint
@@ -1896,6 +1896,10 @@ def inner_spellcheck(nav, value, spelldict):
     value = value.replace("\xe2\x80\x94", " ") # UTF-8 em dash
     value = value.replace("\xe2\x80\x93", " ") # UTF-8 en dash
     value = value.replace("\xe2\x80\x95", " ") # UTF-8 horizontal dash
+    value = value.replace("\xe2\x80\x99", "'") # UTF-8 right single quote
+    value = value.replace("\xe2\x80\x98", "'") # UTF-8 left single quote
+    value = value.replace("\xe2\x80\x9d", " ") # UTF-8 right double quote
+    value = value.replace("\xe2\x80\x9c", " ") # UTF-8 left double quote
     value = value.replace("''", "")
     value = value.replace("female^", " ")
     value = value.replace("male^", " ")