summaryrefslogtreecommitdiff
path: root/src/raptor_nfc_icu.c
blob: 9d17982ad0c92a631929749b212484ecc664e050 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
/* -*- Mode: c; c-basic-offset: 2 -*-
 *
 * raptor_nfc_icu.c - Raptor Unicode NFC checking via ICU library
 *
 * Copyright (C) 2012, David Beckett http://www.dajobe.org/
 * 
 * This package is Free Software and part of Redland http://librdf.org/
 * 
 * It is licensed under the following three licenses as alternatives:
 *   1. GNU Lesser General Public License (LGPL) V2.1 or any newer version
 *   2. GNU General Public License (GPL) V2 or any newer version
 *   3. Apache License, V2.0 or any newer version
 * 
 * You may not use this file except in compliance with at least one of
 * the above three licenses.
 * 
 * See LICENSE.html or LICENSE.txt at the top of this package for the
 * complete terms and further detail along with the license texts for
 * the licenses in COPYING.LIB, COPYING and LICENSE-2.0.txt respectively.
 * 
 * 
 */


#ifdef HAVE_CONFIG_H
#include <raptor_config.h>
#endif

#ifdef HAVE_STDLIB_H
#include <stdlib.h>
#endif

#include <stdio.h>
#include <stdarg.h>
#ifdef HAVE_STDLIB_H
#include <stdlib.h>
#endif

/* Raptor includes */
#include "raptor2.h"
#include "raptor_internal.h"

#if ICU_UC_MAJOR_VERSION >= 56
#include <unicode/unorm2.h>
#else
#include <unicode/unorm.h>
#endif


/**
 * raptor_nfc_icu_check:
 * @input: UTF-8 string
 * @length: length of string
 * @errorp: pointer to store offset of character in error (or NULL)
 *
 * Unicode Normal Form C (NFC) check function.
 *
 * If errorp is not NULL, it is set to the offset of the character
 * in error in the buffer, or <0 if there is no error.
 * 
 * Return value: Non 0 if the string is NFC
 **/
int
raptor_nfc_icu_check(const unsigned char* string, size_t len, int *error)
{
  /* unorm_quickCheck was deprecated in ICU UC V56 */

#if ICU_UC_MAJOR_VERSION >= 56
  /* norm2 is be a singleton - do not attempt to free it */
  const UNormalizer2 *norm2;
  UErrorCode error_code = U_ZERO_ERROR;
  UNormalizationCheckResult res;

  norm2 = unorm2_getNFCInstance(&error_code);
  if(!U_SUCCESS(error_code)) {
     if(error)
       *error = 1;
     return 0;
  }

  res = unorm2_quickCheck(norm2,(const UChar *)string, (int32_t)len,
                          &error_code);
   if(!U_SUCCESS(error_code)) {
     if(error)
       *error = 1;
     return 0;
   }

   return (res == UNORM_YES);
#else
   UNormalizationCheckResult res;
   UErrorCode error_code = U_ZERO_ERROR;

   res = unorm_quickCheck((const UChar *)string, (int32_t)len,
                          UNORM_NFC, &error_code);
   if(!U_SUCCESS(error_code)) {
     if(error)
       *error = 1;
     return 0;
   }
   
   return (res == UNORM_YES);
#endif
}