summaryrefslogtreecommitdiff
path: root/chromium/device/bluetooth/string_util_icu.cc
blob: 148a4ca8620b8c72fce8b8984c9ca44d2834d440 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
// Copyright 2016 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "device/bluetooth/string_util_icu.h"

#include <memory>

#include "base/macros.h"
#include "base/memory/singleton.h"
#include "base/strings/string_util.h"
#include "third_party/icu/source/common/unicode/uniset.h"

namespace device {

namespace {

// Holds the ICU set of Unicode graphic characters and answers whether a UTF-8
// string contains at least one of them. A single shared instance is obtained
// through GetInstance(), so the set is built only once.
class GraphicCharacters {
 public:
  // Returns the shared instance, created on first use via base::Singleton
  // with LeakySingletonTraits.
  static GraphicCharacters* GetInstance() {
    return base::Singleton<GraphicCharacters, base::LeakySingletonTraits<
                                                  GraphicCharacters>>::get();
  }

  // Returns true if |s| contains at least one character that belongs to the
  // graphic set, false otherwise (including for an empty string).
  //
  // |s| is interpreted as UTF-8. The method only reads the set, hence it is
  // const.
  bool HasGraphicCharacter(base::StringPiece s) const {
    // ICU takes the length as int32_t and treats a negative value as "the
    // string is NUL-terminated". Make the narrowing explicit.
    // NOTE(review): inputs larger than INT32_MAX bytes are not supported
    // here; callers are presumably passing short strings -- confirm.
    const int32_t byte_count = static_cast<int32_t>(s.size());

    // Length of the leading run of |s| that contains NO graphic character.
    // If that run does not cover the whole string, a graphic character was
    // found.
    const int32_t non_graphic_prefix = graphic_->spanUTF8(
        s.data(), byte_count, USetSpanCondition::USET_SPAN_NOT_CONTAINED);
    return static_cast<size_t>(non_graphic_prefix) != s.size();
  }

 private:
  // Grants the singleton traits access to the private constructor.
  friend struct base::DefaultSingletonTraits<GraphicCharacters>;

  GraphicCharacters();

  // Set of graphic characters.
  std::unique_ptr<icu::UnicodeSet> graphic_;

  DISALLOW_COPY_AND_ASSIGN(GraphicCharacters);
};

// Builds the set of graphic characters from the ICU "[:graph:]" pattern and
// freezes it.
GraphicCharacters::GraphicCharacters() {
  // "[:graph:]" selects the Unicode Graphic Characters as defined by
  // http://www.unicode.org/reports/tr18/#graph
  // That is every character that is NOT part of any of these sets:
  // - Whitespace (WSpace)
  // - gc=Control (Cc)
  // - gc=Surrogate (Cs)
  // - gc=Unassigned (Cn)
  const icu::UnicodeString graph_pattern = UNICODE_STRING_SIMPLE("[:graph:]");

  UErrorCode status = U_ZERO_ERROR;
  graphic_.reset(new icu::UnicodeSet(graph_pattern, status));
  // Parsing a constant, well-formed pattern is expected to succeed.
  DCHECK(U_SUCCESS(status));

  // The set is never modified after construction.
  graphic_->freeze();
}

}  // namespace

// Returns true if |s| contains at least one Unicode graphic character.
// |s| must be valid UTF-8; this is verified with a DCHECK.
bool HasGraphicCharacter(base::StringPiece s) {
  DCHECK(base::IsStringUTF8(s));

  // Delegate to the shared set of graphic characters.
  GraphicCharacters* const graphic_characters =
      GraphicCharacters::GetInstance();
  return graphic_characters->HasGraphicCharacter(s);
}

}  // namespace device