view tests/unistr/test-u8-prev.c @ 17249:e542fd46ad6f

maint: update all copyright year number ranges Run "make update-copyright". Compare to commit 1602f0a from last year. Signed-off-by: Eric Blake <eblake@redhat.com>
author Eric Blake <eblake@redhat.com>
date Tue, 01 Jan 2013 00:50:58 +0000
parents 8250f2777afc
children 344018b6e5d7
line wrap: on
line source

/* Test of u8_prev() function.
   Copyright (C) 2010-2013 Free Software Foundation, Inc.

   This program is free software: you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */

/* Written by Bruno Haible <bruno@clisp.org>, 2010.  */

#include <config.h>

#include "unistr.h"

#include "macros.h"

static int
check (const uint8_t *input, size_t input_length, ucs4_t *puc)
{
  ucs4_t uc;

  /* Test recognition when at the beginning of the string.  */
  if (u8_prev (&uc, input + input_length, input) != input)
    return 1;

  /* Test recognition when preceded by a 1-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;
    ucs4_t uc1;

    ptr = buf;
    *ptr++ = 'x';
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    if (u8_prev (&uc1, ptr + input_length, buf) != ptr)
      return 2;
    if (uc1 != uc)
      return 3;
  }

  /* Test recognition when preceded by a 2-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;
    ucs4_t uc1;

    ptr = buf;
    *ptr++ = 0xC3;
    *ptr++ = 0x97;
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    if (u8_prev (&uc1, ptr + input_length, buf) != ptr)
      return 4;
    if (uc1 != uc)
      return 5;
  }

  /* Test recognition when preceded by a 3-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;
    ucs4_t uc1;

    ptr = buf;
    *ptr++ = 0xE2;
    *ptr++ = 0x84;
    *ptr++ = 0x82;
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    if (u8_prev (&uc1, ptr + input_length, buf) != ptr)
      return 6;
    if (uc1 != uc)
      return 7;
  }

  /* Test recognition when preceded by a 4-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;
    ucs4_t uc1;

    ptr = buf;
    *ptr++ = 0xF0;
    *ptr++ = 0x9D;
    *ptr++ = 0x94;
    *ptr++ = 0x9E;
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    if (u8_prev (&uc1, ptr + input_length, buf) != ptr)
      return 8;
    if (uc1 != uc)
      return 9;
  }

  *puc = uc;
  return 0;
}

static int
check_invalid (const uint8_t *input, size_t input_length)
{
  ucs4_t uc;

  /* Test recognition when at the beginning of the string.  */
  uc = 0xBADFACE;
  if (u8_prev (&uc, input + input_length, input) != NULL)
    return 1;
  if (uc != 0xBADFACE)
    return 2;

  /* Test recognition when preceded by a 1-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;

    ptr = buf;
    *ptr++ = 'x';
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    uc = 0xBADFACE;
    if (u8_prev (&uc, ptr + input_length, buf) != NULL)
      return 3;
    if (uc != 0xBADFACE)
      return 4;
  }

  /* Test recognition when preceded by a 2-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;

    ptr = buf;
    *ptr++ = 0xC3;
    *ptr++ = 0x97;
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    uc = 0xBADFACE;
    if (u8_prev (&uc, ptr + input_length, buf) != NULL)
      return 5;
    if (uc != 0xBADFACE)
      return 6;
  }

  /* Test recognition when preceded by a 3-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;

    ptr = buf;
    *ptr++ = 0xE2;
    *ptr++ = 0x84;
    *ptr++ = 0x82;
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    uc = 0xBADFACE;
    if (u8_prev (&uc, ptr + input_length, buf) != NULL)
      return 7;
    if (uc != 0xBADFACE)
      return 8;
  }

  /* Test recognition when preceded by a 4-unit character.  */
  {
    uint8_t buf[100];
    uint8_t *ptr;
    size_t i;

    ptr = buf;
    *ptr++ = 0xF0;
    *ptr++ = 0x9D;
    *ptr++ = 0x94;
    *ptr++ = 0x9E;
    for (i = 0; i < input_length; i++)
      ptr[i] = input[i];

    uc = 0xBADFACE;
    if (u8_prev (&uc, ptr + input_length, buf) != NULL)
      return 9;
    if (uc != 0xBADFACE)
      return 10;
  }

  return 0;
}

int
main ()
{
  ucs4_t uc;

  /* Test ISO 646 unit input.  */
  {
    ucs4_t c;
    uint8_t buf[1];

    for (c = 0; c < 0x80; c++)
      {
        buf[0] = c;
        uc = 0xBADFACE;
        ASSERT (check (buf, 1, &uc) == 0);
        ASSERT (uc == c);
      }
  }

  /* Test 2-byte character input.  */
  {
    static const uint8_t input[] = { 0xC3, 0x97 };
    uc = 0xBADFACE;
    ASSERT (check (input, SIZEOF (input), &uc) == 0);
    ASSERT (uc == 0x00D7);
  }

  /* Test 3-byte character input.  */
  {
    static const uint8_t input[] = { 0xE2, 0x82, 0xAC };
    uc = 0xBADFACE;
    ASSERT (check (input, SIZEOF (input), &uc) == 0);
    ASSERT (uc == 0x20AC);
  }

  /* Test 4-byte character input.  */
  {
    static const uint8_t input[] = { 0xF4, 0x8F, 0xBF, 0xBD };
    uc = 0xBADFACE;
    ASSERT (check (input, SIZEOF (input), &uc) == 0);
    ASSERT (uc == 0x10FFFD);
  }

  /* Test incomplete/invalid 1-byte input.  */
  {
    static const uint8_t input[] = { 0xC1 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xC3 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xE2 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xF4 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xFE };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }

  /* Test incomplete/invalid 2-byte input.  */
  {
    static const uint8_t input[] = { 0xE0, 0x9F };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xE2, 0x82 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xE2, 0xD0 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xF0, 0x8F };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xF3, 0x8F };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xF3, 0xD0 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }

  /* Test incomplete/invalid 3-byte input.  */
  {
    static const uint8_t input[] = { 0xF3, 0x8F, 0xBF };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xF3, 0xE4, 0xBF };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }
  {
    static const uint8_t input[] = { 0xF3, 0x8F, 0xD0 };
    ASSERT (check_invalid (input, SIZEOF (input)) == 0);
  }

  return 0;
}