/* Test of u8_prev() function. Copyright (C) 2010-2023 Free Software Foundation, Inc. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see . */ /* Written by Bruno Haible , 2010. */ #include #include "unistr.h" #include "macros.h" static int check (const uint8_t *input, size_t input_length, ucs4_t *puc) { ucs4_t uc; /* Test recognition when at the beginning of the string. */ if (u8_prev (&uc, input + input_length, input) != input) return 1; /* Test recognition when preceded by a 1-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ucs4_t uc1; ptr = buf; *ptr++ = 'x'; for (i = 0; i < input_length; i++) ptr[i] = input[i]; if (u8_prev (&uc1, ptr + input_length, buf) != ptr) return 2; if (uc1 != uc) return 3; } /* Test recognition when preceded by a 2-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ucs4_t uc1; ptr = buf; *ptr++ = 0xC3; *ptr++ = 0x97; for (i = 0; i < input_length; i++) ptr[i] = input[i]; if (u8_prev (&uc1, ptr + input_length, buf) != ptr) return 4; if (uc1 != uc) return 5; } /* Test recognition when preceded by a 3-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ucs4_t uc1; ptr = buf; *ptr++ = 0xE2; *ptr++ = 0x84; *ptr++ = 0x82; for (i = 0; i < input_length; i++) ptr[i] = input[i]; if (u8_prev (&uc1, ptr + input_length, buf) != ptr) return 6; if (uc1 != uc) return 7; } /* Test recognition when preceded by a 4-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ucs4_t uc1; ptr = buf; *ptr++ = 0xF0; *ptr++ = 0x9D; *ptr++ = 0x94; *ptr++ = 0x9E; for (i = 0; i < input_length; i++) ptr[i] = input[i]; if (u8_prev (&uc1, ptr + input_length, buf) != ptr) return 8; if (uc1 != uc) return 9; } *puc = uc; return 0; } static int check_invalid (const uint8_t *input, size_t input_length) { ucs4_t uc; /* Test recognition when at the beginning of the string. */ uc = 0xBADFACE; if (u8_prev (&uc, input + input_length, input) != NULL) return 1; if (uc != 0xBADFACE) return 2; /* Test recognition when preceded by a 1-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ptr = buf; *ptr++ = 'x'; for (i = 0; i < input_length; i++) ptr[i] = input[i]; uc = 0xBADFACE; if (u8_prev (&uc, ptr + input_length, buf) != NULL) return 3; if (uc != 0xBADFACE) return 4; } /* Test recognition when preceded by a 2-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ptr = buf; *ptr++ = 0xC3; *ptr++ = 0x97; for (i = 0; i < input_length; i++) ptr[i] = input[i]; uc = 0xBADFACE; if (u8_prev (&uc, ptr + input_length, buf) != NULL) return 5; if (uc != 0xBADFACE) return 6; } /* Test recognition when preceded by a 3-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ptr = buf; *ptr++ = 0xE2; *ptr++ = 0x84; *ptr++ = 0x82; for (i = 0; i < input_length; i++) ptr[i] = input[i]; uc = 0xBADFACE; if (u8_prev (&uc, ptr + input_length, buf) != NULL) return 7; if (uc != 0xBADFACE) return 8; } /* Test recognition when preceded by a 4-unit character. */ { uint8_t buf[100]; uint8_t *ptr; size_t i; ptr = buf; *ptr++ = 0xF0; *ptr++ = 0x9D; *ptr++ = 0x94; *ptr++ = 0x9E; for (i = 0; i < input_length; i++) ptr[i] = input[i]; uc = 0xBADFACE; if (u8_prev (&uc, ptr + input_length, buf) != NULL) return 9; if (uc != 0xBADFACE) return 10; } return 0; } int main () { ucs4_t uc; /* Test ISO 646 unit input. */ { ucs4_t c; uint8_t buf[1]; for (c = 0; c < 0x80; c++) { buf[0] = c; uc = 0xBADFACE; ASSERT (check (buf, 1, &uc) == 0); ASSERT (uc == c); } } /* Test 2-byte character input. */ { static const uint8_t input[] = { 0xC3, 0x97 }; uc = 0xBADFACE; ASSERT (check (input, SIZEOF (input), &uc) == 0); ASSERT (uc == 0x00D7); } /* Test 3-byte character input. */ { static const uint8_t input[] = { 0xE2, 0x82, 0xAC }; uc = 0xBADFACE; ASSERT (check (input, SIZEOF (input), &uc) == 0); ASSERT (uc == 0x20AC); } /* Test 4-byte character input. */ { static const uint8_t input[] = { 0xF4, 0x8F, 0xBF, 0xBD }; uc = 0xBADFACE; ASSERT (check (input, SIZEOF (input), &uc) == 0); ASSERT (uc == 0x10FFFD); } /* Test incomplete/invalid 1-byte input. */ { static const uint8_t input[] = { 0xC1 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xC3 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xE2 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xF4 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xFE }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } /* Test incomplete/invalid 2-byte input. */ { static const uint8_t input[] = { 0xE0, 0x9F }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xE2, 0x82 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xE2, 0xD0 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xF0, 0x8F }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xF3, 0x8F }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xF3, 0xD0 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } /* Test incomplete/invalid 3-byte input. */ { static const uint8_t input[] = { 0xF3, 0x8F, 0xBF }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xF3, 0xE4, 0xBF }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } { static const uint8_t input[] = { 0xF3, 0x8F, 0xD0 }; ASSERT (check_invalid (input, SIZEOF (input)) == 0); } return 0; }