From: Dan Scott Date: Tue, 2 Aug 2011 20:38:03 +0000 (-0400) Subject: Add more carons, based on outliers from CRKN_OUP X-Git-Url: https://old-git.evergreen-ils.org/?a=commitdiff_plain;h=0c52b2cb528a1affced5d30edb31d1cfcd761650;p=contrib%2FConifer.git Add more carons, based on outliers from CRKN_OUP Note that in at least one case, this would result in MÚSICA becoming MŠICA. Sigh. Finally the conflicts arrive. Signed-off-by: Dan Scott --- diff --git a/tools/ebooks/prep_ebook_records.py b/tools/ebooks/prep_ebook_records.py index ef39467190..2fb48596e9 100644 --- a/tools/ebooks/prep_ebook_records.py +++ b/tools/ebooks/prep_ebook_records.py @@ -392,10 +392,22 @@ def clean_diacritics(field): tmpsf = tmpsf.replace(u'\xd4S', u'\u015a') tmpsf = tmpsf.replace(u'\xd4s', u'\u015b') + # A CARON + tmpsf = tmpsf.replace(u'\xdaA', u'\u0100') + tmpsf = tmpsf.replace(u'\xdaa', u'\u0101') + + # C CARON + tmpsf = tmpsf.replace(u'\xdaC', u'\u010c') + tmpsf = tmpsf.replace(u'\xdac', u'\u010d') + # R CARON tmpsf = tmpsf.replace(u'\xdaR', u'\u0158') tmpsf = tmpsf.replace(u'\xdar', u'\u0159') + # S CARON + tmpsf = tmpsf.replace(u'\xdaS', u'\u0160') + tmpsf = tmpsf.replace(u'\xdas', u'\u0161') + # G BREVE tmpsf = tmpsf.replace(u'\xe6G', u'\u011e') tmpsf = tmpsf.replace(u'\xe6g', u'\u011f')