From 0c168cca9d9dee26c9ba3a82430d0ec4379dde47 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Cristian=20Garc=C3=ADa=20Romero?= Date: Tue, 15 Feb 2022 08:59:31 +0100 Subject: [PATCH] Fix paragraphs When a sentence was being split, the paragraph identifier was wrongly printed multiple times --- bifixer/monofixer.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/bifixer/monofixer.py b/bifixer/monofixer.py index 6f3c3cd..9a75f58 100644 --- a/bifixer/monofixer.py +++ b/bifixer/monofixer.py @@ -211,6 +211,9 @@ def fix_sentences(args): new_parts[args.sdeferredcol-1] = parts[args.sdeferredcol-1].rstrip("\n")+"#"+str(sent_num) if args.sparagraphid: + if "#" in parts[args.sparagraphid-1]: + new_parts[args.sparagraphid-1] = parts[args.sparagraphid-1].rstrip("\n").split("#")[0]+"#"+str(sent_num) + else: new_parts[args.sparagraphid-1] = parts[args.sparagraphid-1].rstrip("\n")+"#"+str(sent_num) if (new_parts[args.scol-1]): #sentence may be empty now because it contained only spaces or similar weird thing