From 4a49e0340fea5b1bf071601be2c8970f52fb5c13 Mon Sep 17 00:00:00 2001 From: Stefan Weil Date: Fri, 3 May 2024 07:44:57 +0200 Subject: [PATCH] Remove trailing whitespace from PAGE XML output Fixes: 577e8a8b93a9 ("Add PAGE XML renderer / export (#4214)") Signed-off-by: Stefan Weil --- src/api/pagerenderer.cpp | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/src/api/pagerenderer.cpp b/src/api/pagerenderer.cpp index 0f53dd73c5..9c27ab8316 100644 --- a/src/api/pagerenderer.cpp +++ b/src/api/pagerenderer.cpp @@ -873,7 +873,11 @@ char *TessBaseAPI::GetPAGEText(ETEXT_DESC *monitor, int page_number) { if (res_it->IsAtBeginningOf(RIL_TEXTLINE)) { // writing_direction_before = writing_direction; line_conf = ((res_it->Confidence(RIL_TEXTLINE)) / 100.); - line_content << HOcrEscape(res_it->GetUTF8Text(RIL_TEXTLINE)).c_str(); + std::string textline = res_it->GetUTF8Text(RIL_TEXTLINE); + if (textline.back() == '\n') { + textline.erase(textline.length() - 1); + } + line_content << HOcrEscape(textline.c_str()); line_str << "\t\t\t