diff --git a/picard/util/textencoding.py b/picard/util/textencoding.py index 3ce273dc9..5fb214276 100644 --- a/picard/util/textencoding.py +++ b/picard/util/textencoding.py @@ -176,6 +176,7 @@ _simplify_punctuation = { "\u226B": ">>", # MUCH GREATER-THAN "\u2985": "((", # LEFT WHITE PARENTHESIS "\u2986": "))", # RIGHT WHITE PARENTHESIS + "\u2022": "-", # BULLET "\u200B": "", # Zero Width Space } diff --git a/test/test_textencoding.py b/test/test_textencoding.py index e2533abeb..39ceae467 100644 --- a/test/test_textencoding.py +++ b/test/test_textencoding.py @@ -94,9 +94,9 @@ punctuation_from = ( u"\u301E\u00AB\u00BB\u2039\u203A\u00AD\u2010\u2012\u2013\u2014" # 〞«»‹›\u00AD‐‒–— u"\u2015\u2016\u2044\u2045\u2046\u204E\u3008\u3009\u300A\u300B" # ―‖⁄⁅⁆⁎〈〉《》 u"\u3014\u3015\u3018\u3019\u301A\u301B\u2212\u2215\u2216\u2223" # 〔〕〘〙〚〛−∕∖∣ - u"\u2225\u226A\u226B\u2985\u2986\u200B" # ∥≪≫⦅⦆· + u"\u2225\u226A\u226B\u2985\u2986\u2022\u200B" # ∥≪≫⦅⦆•· ) -punctuation_to = u"''''\"\"\"\"'\"\"<<>><>-----||/[]*<><<>>[][][]-/\\|||<<>>(())" +punctuation_to = u"''''\"\"\"\"'\"\"<<>><>-----||/[]*<><<>>[][][]-/\\|||<<>>(())-" combinations_from = ( u"\u00C6\u00D0\u00D8\u00DE\u00DF\u00E6\u00F0\u00F8\u00FE\u0110" # ÆÐØÞßæðøþĐ u"\u0111\u0126\u0127\u0131\u0138\u0141\u0142\u014A\u014B\u0152" # đĦħıĸŁłŊŋŒ