mirror of
git://github.com/kovidgoyal/calibre.git
synced 2026-01-06 05:24:56 +01:00
Conversion heuristics: Make unwrapping recognize Georgian letters as well. Fixes #1753533 [Unwrapping fails on non-latin scripts](https://bugs.launchpad.net/calibre/+bug/1753533)
This commit is contained in:
parent
a31de75a39
commit
6dbf46c43e
1 changed file with 1 addition and 1 deletion
|
|
@ -358,7 +358,7 @@ def style_unwrap(match):
|
|||
|
||||
# define the pieces of the regex
|
||||
# (?<!\&\w{4});) is a semicolon not part of an entity
|
||||
lookahead = "(?<=.{"+unicode(length)+u"}([a-zäëïöüàèìòùáćéíĺóŕńśúýâêîôûçąężıãõñæøþðßěľščťžňďřů,:)\IA\u00DF]|(?<!\&\w{4});))"
|
||||
lookahead = "(?<=.{"+unicode(length)+u"}([a-zა-ჰäëïöüàèìòùáćéíĺóŕńśúýâêîôûçąężıãõñæøþðßěľščťžňďřů,:)\IA\u00DF]|(?<!\&\w{4});))"
|
||||
em_en_lookahead = "(?<=.{"+unicode(length)+u"}[\u2013\u2014])"
|
||||
soft_hyphen = u"\xad"
|
||||
line_ending = "\s*(?P<style_close></(span|[iub])>)?\s*(</(p|div)>)?"
|
||||
|
|
|
|||
Loading…
Reference in a new issue