From 316d796e6c1d41e32a49a1813a783c0c418c4ed7 Mon Sep 17 00:00:00 2001 From: Dan Scott Date: Fri, 29 Jul 2011 14:11:05 -0400 Subject: [PATCH] S with combining acute accent (lower and uppercase) We can use the composed codepoint for these instead of going the decomposed route, for more accuracy and great justice. Signed-off-by: Dan Scott --- tools/ebooks/prep_ebook_records.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/tools/ebooks/prep_ebook_records.py b/tools/ebooks/prep_ebook_records.py index cf8e3c6e1e..79b1739268 100644 --- a/tools/ebooks/prep_ebook_records.py +++ b/tools/ebooks/prep_ebook_records.py @@ -378,8 +378,10 @@ def clean_diacritics(field): # COMBINING CEDILLA tmpsf = tmpsf.replace(u'\xb0c', u'c\u0327') - # COMBINING ACUTE ACCENT - tmpsf = tmpsf.replace(u'\xd4s', u's\u0301') + # S WITH COMBINING ACUTE ACCENT (lowercase) + tmpsf = tmpsf.replace(u'\xd4s', u'\u015b') + # S WITH COMBINING ACUTE ACCENT (uppercase) + tmpsf = tmpsf.replace(u'\xd4S', u'\u015a') # COMBINING BREVE tmpsf = tmpsf.replace(u'\xe6i', u'i\u0306') -- 2.11.0