From b46f2a1f342222301adf0ddde3b2158eff197bb2 Mon Sep 17 00:00:00 2001 From: Jochen Pfaeffle Date: Thu, 6 Feb 2025 12:25:09 +0100 Subject: [PATCH 1/2] fix multicharactor with utf-8 encoding --- src/EDI/Parser.php | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/EDI/Parser.php b/src/EDI/Parser.php index 9166f7a..d335065 100644 --- a/src/EDI/Parser.php +++ b/src/EDI/Parser.php @@ -157,7 +157,9 @@ public function parse(): self // Basic sanitization, remove non-printable chars. $lineTrim = \trim($line); - $line = (string) \preg_replace($this->stripChars, '', $lineTrim); + if (mb_detect_encoding($line, mb_list_encodings()) !== 'UTF-8') { + $line = (string) \preg_replace($this->stripChars, '', $lineTrim); + } $line_bytes = \strlen($line); if ($line_bytes !== \strlen($lineTrim)) { From 388e5e8741114cf393138a3a3bd8cfe1cdfa3168 Mon Sep 17 00:00:00 2001 From: Jochen Pfaeffle Date: Fri, 7 Feb 2025 10:08:38 +0100 Subject: [PATCH 2/2] revert change --- src/EDI/Parser.php | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/src/EDI/Parser.php b/src/EDI/Parser.php index d335065..9166f7a 100644 --- a/src/EDI/Parser.php +++ b/src/EDI/Parser.php @@ -157,9 +157,7 @@ public function parse(): self // Basic sanitization, remove non-printable chars. $lineTrim = \trim($line); - if (mb_detect_encoding($line, mb_list_encodings()) !== 'UTF-8') { - $line = (string) \preg_replace($this->stripChars, '', $lineTrim); - } + $line = (string) \preg_replace($this->stripChars, '', $lineTrim); $line_bytes = \strlen($line); if ($line_bytes !== \strlen($lineTrim)) {