From a2afa21dbf79d14ebfa9234cccc2bbce5b75843b Mon Sep 17 00:00:00 2001 From: Elisabeth Henry Date: Thu, 25 Feb 2016 21:47:42 +0100 Subject: [PATCH] =?UTF-8?q?fixed=20french=20cleaner,=20now=20uses=20em=20s?= =?UTF-8?q?pace=20after=20=E2=80=94?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/lib/cleaner.rs | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) diff --git a/src/lib/cleaner.rs b/src/lib/cleaner.rs index 5c01be3..db885f9 100644 --- a/src/lib/cleaner.rs +++ b/src/lib/cleaner.rs @@ -93,7 +93,17 @@ impl Cleaner for French { new_s.push(current); match current { // handle nb space after char - '«'|'—' => { + '—' => { + if is_whitespace(next) { + // use "em space" + new_s.push('\u{2003}'); + if let Some(next) = chars.next() { + current = next; + continue; + } + } + }, + '«' => { if is_whitespace(next) { new_s.push(self.nb_char); if let Some(next) = chars.next() { @@ -101,6 +111,7 @@ impl Cleaner for French { continue; } } + }, _ => (), }