From 801ca9cd5af7c86da741a601b4721bff3f94f9cd Mon Sep 17 00:00:00 2001
From: Jarkko Hietaniemi
Date: Sun, 3 Dec 2000 17:58:20 +0000
Subject: [PATCH] Raw zero bytes in text files confuse at least GNU patch 2.1.

p4raw-id: //depot/perl@7965
---
 t/pragma/utf8.t | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/t/pragma/utf8.t b/t/pragma/utf8.t
index 93a5bc4..60cbd8c 100755
--- a/t/pragma/utf8.t
+++ b/t/pragma/utf8.t
@@ -569,12 +569,15 @@ sub nok_bytes {
 # http://www.cl.cam.ac.uk/~mgk25/ucs/examples/UTF-8-test.txt,
 # version dated 2000-09-02.
 
+# Note the \0 instead of a raw zero byte in 2.1.1: for example
+# GNU patch v2.1 has "issues" with raw zero bytes.
+
 my @MK = split(/\n/, <<__EOMK__);
 1 Correct UTF-8
 1.1.1 y "κόσμε" - 11 ce:ba:e1:bd:b9:cf:83:ce:bc:ce:b5 5
 2 Boundary conditions
 2.1 First possible sequence of certain length
-2.1.1 y "" 0 1 00 1
+2.1.1 y "\0" 0 1 00 1
 2.1.2 y "€" 80 2 c2:80 1
 2.1.3 y "ࠀ" 800 3 e0:a0:80 1
 2.1.4 y "𐀀" 10000 4 f0:90:80:80 1
-- 
2.7.4