mirror of
git://github.com/kovidgoyal/calibre.git
synced 2026-04-24 01:03:09 +02:00
Add more characters referenced by bug #822744 to the line unwrap lookahead character list.
This commit is contained in:
parent
140b1181d1
commit
78dc53abae
1 changed file with 1 addition and 1 deletion
|
|
@@ -315,7 +315,7 @@ def punctuation_unwrap(self, length, content, format):
|
|||
supports a range of html markup and text files
|
||||
'''
|
||||
# define the pieces of the regex
|
||||
lookahead = "(?<=.{"+str(length)+u"}([a-zäëïöüàèìòùáćéíóńśúâêîôûçąężıãõñæøþðßě,:)\IA\u00DF]|(?<!\&\w{4});))" # (?<!\&\w{4});) is a semicolon not part of an entity
|
||||
lookahead = "(?<=.{"+str(length)+u"}([a-zäëïöüàèìòùáćéíóńśúâêîôûçąężıãõñæøþðßôľščťžňďěřů,:)\IA\u00DF]|(?<!\&\w{4});))" # (?<!\&\w{4});) is a semicolon not part of an entity
|
||||
em_en_lookahead = "(?<=.{"+str(length)+u"}[\u2013\u2014])"
|
||||
soft_hyphen = u"\xad"
|
||||
line_ending = "\s*</(span|[iubp]|div)>\s*(</(span|[iubp]|div)>)?"
|
||||
|
|
|
|||
Loading…
Reference in a new issue