forked from swiftlang/swift
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathUnicodeGraphemeBreakTest.cpp.gyb
72 lines (56 loc) · 2.09 KB
/
UnicodeGraphemeBreakTest.cpp.gyb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
%# -*- mode: C++ -*-
%# Ignore the following admonition; it applies to the resulting .cpp file only
//// Automatically Generated From UnicodeGraphemeBreakTest.cpp.gyb.
//// Do Not Edit Directly!
//===----------------------------------------------------------------------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2014 - 2015 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See http://swift.org/LICENSE.txt for license information
// See http://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//
%{
from GYBUnicodeDataUtils import *
grapheme_cluster_break_tests = \
get_grapheme_cluster_break_tests_as_UTF8(unicodeGraphemeBreakTestFile)
}%
#include "swift/Basic/Unicode.h"
#include "gtest/gtest.h"
#include <vector>
using namespace swift;
using namespace swift::unicode;
/// Splits \p Str into consecutive extended grapheme clusters and returns the
/// byte offsets of every cluster edge.
///
/// The result always begins with 0; each later entry is the offset just past
/// one cluster, so for a fully consumed string the last entry equals
/// Str.size(). An empty string yields just { 0 }.
///
/// Note: the loop only stops once the offset equals Str.size(), so it relies
/// on extractFirstExtendedGraphemeCluster returning a non-empty piece for
/// non-empty input.
static std::vector<unsigned> FindGraphemeClusterBoundaries(StringRef Str) {
  std::vector<unsigned> Boundaries{0u};
  for (unsigned Offset = 0; Offset != Str.size();) {
    // Peel the leading cluster off the not-yet-consumed tail of the string.
    const auto Cluster = extractFirstExtendedGraphemeCluster(Str.substr(Offset));
    Offset += Cluster.size();
    Boundaries.push_back(Offset);
  }
  return Boundaries;
}
// Data-driven check of FindGraphemeClusterBoundaries. The test data is the
// grapheme_cluster_break_tests list that the gyb preamble of this template
// builds with get_grapheme_cluster_break_tests_as_UTF8 from
// unicodeGraphemeBreakTestFile (presumably the break-test data file published
// with the Unicode standard -- confirm against the build configuration).
TEST(ExtractExtendedGraphemeCluster, TestsFromUnicodeSpec) {
// The gyb loop below expands to one EXPECT_EQ per (subject string, expected
// boundaries) pair: the expected offsets are written out as a vector literal
// and compared with the boundaries computed for the subject string literal.
% for subject_string,expected_boundaries in grapheme_cluster_break_tests:
EXPECT_EQ((std::vector<unsigned>{ ${', '.join([ str(x) for x in expected_boundaries ])} }),
FindGraphemeClusterBoundaries("${subject_string}"));
% end
}
// Hand-written cases for ill-formed UTF-8 input, complementing the
// data-driven cases generated from the break-test list.
TEST(ExtractExtendedGraphemeCluster, ExtraTests) {
  using Offsets = std::vector<unsigned>;

  // Sequence with one continuation byte missing: 0xC2 is the lead byte of a
  // two-byte sequence. The lone byte is expected to form a single cluster.
  const Offsets TruncatedLead = FindGraphemeClusterBoundaries("\xc2");
  EXPECT_EQ((Offsets{0, 1}), TruncatedLead);

  // Isolated surrogate: ED A0 80 is the three-byte form of U+D800. A boundary
  // is expected after each of the three bytes.
  const Offsets LoneSurrogate = FindGraphemeClusterBoundaries("\xed\xa0\x80");
  EXPECT_EQ((Offsets{0, 1, 2, 3}), LoneSurrogate);

  // The same surrogate bytes placed between two copies of F3 A0 84 80
  // (U+E0100). Expected: the first four bytes form one cluster, the first two
  // surrogate bytes are one cluster each, and the last surrogate byte is
  // grouped with the trailing four-byte sequence (offsets 6 to 11).
  const Offsets SurroundedSurrogate = FindGraphemeClusterBoundaries(
      "\xf3\xa0\x84\x80" "\xed\xa0\x80" "\xf3\xa0\x84\x80");
  EXPECT_EQ((Offsets{0, 4, 5, 6, 11}), SurroundedSurrogate);
}