keep apstrophies, simplifies code - plint - French poetry validator (local mirror of https://gitlab.com/a3nm/plint)

commit 537c0e4595038d9e676cf137b9703394e296450e
parent 01d617d42d2d62251e7a92c79edf4083d8b43e96
Author: Antoine Amarilli <a3nm@a3nm.net>
Date:   Sat, 19 May 2012 20:19:03 +0200

keep apstrophies, simplifies code

Diffstat:
common.py  | 11 ++++-------

1 file changed, 4 insertions(+), 7 deletions(-)
diff --git a/common.py b/common.py
@@ -5,7 +5,7 @@ import unicodedata
 import re
 
 vowels = 'aeiouyœæ'
-consonants = "bcçdfghjklmnpqrstvwxz"
+consonants = "bcçdfghjklmnpqrstvwxz'"
 legal = vowels + consonants + ' -'
 
 # a variant of x-sampa such that all french phonemes are one-character
@@ -42,12 +42,10 @@ def norm_spaces(text):
   """Remove multiple consecutive whitespace"""
   return re.sub("\s+-*\s*", ' ', text)
 
-def rm_punct(text, with_apostrophe = False):
+def rm_punct(text):
   """Remove punctuation from text"""
   text = re.sub("’", "'", text) # no weird apostrophes
   text = re.sub("' ", "'", text) # space after apostrophes
-  if not with_apostrophe:
-    text = re.sub("'", '', text)
 
   #TODO rather: keep only good chars
   pattern = re.compile("[^'\w -]", re.UNICODE)
@@ -76,10 +74,9 @@ def is_consonants(chunk):
       return False
   return True
 
-def normalize(text, with_apostrophe=False, downcase=True):
+def normalize(text, downcase=True):
   """Normalize text, ie. lowercase, no useless punctuation or whitespace"""
-  return norm_spaces(rm_punct(text.lower() if downcase else text,
-      with_apostrophe)).rstrip().lstrip()
+  return norm_spaces(rm_punct(text.lower() if downcase else text)).rstrip().lstrip()
 
 def subst(string, subs):
   if len(subs) == 0:

	plint French poetry validator (local mirror of https://gitlab.com/a3nm/plint)
	git clone https://a3nm.net/git/plint/
	Log \| Files \| Refs \| README