1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
|
/*
* Copyright 2009, The Android Open Source Project
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
* OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
* AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <cstdio>
#include <iostream>
#include <string>
#include <vector>
// URL that is echoed into the generated output's header comment as the place
// the emoji data was originally scraped from. It is only printed, never fetched.
static const char gSite[] = "http://www.corp.google.com/eng/doc/emoji/dev.html";
// NOTE(review): file-scope using-directive. Code in this file may rely on
// unqualified standard-library names, so it is left in place.
using namespace std;
/* Converts a single ASCII hexadecimal digit to its numeric value.
 *
 * Accepts '0'-'9', 'A'-'F' and 'a'-'f' and returns the matching value in
 * the range 0..15. Any other character yields -1.
 */
static int hexchar_to_int(char c) {
    int digit = -1;  // stays -1 unless c turns out to be a hex digit
    if ('0' <= c && c <= '9') {
        digit = c - '0';
    } else if ('A' <= c && c <= 'F') {
        digit = c - 'A' + 10;
    } else if ('a' <= c && c <= 'f') {
        digit = c - 'a' + 10;
    }
    return digit;
}
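/* Tool to build the gGmojiPUA table. It reads a text file in which every line
* starts with a five-digit hexadecimal PUA code point for a gmoji, and prints
* those values to stdout as a C array together with MIN/MAX/COUNT defines.
*/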
/* Reads PUA code points from `file`, one per line, and appends them to `out`.
 *
 * Every line must begin with five hexadecimal digits; the rest of the line is
 * ignored. The parsed value must lie in [0xFE000, 0xFEFFF] and be strictly
 * greater than the value on the previous line.
 *
 * Returns true when end of input is reached and every line was valid. On the
 * first invalid line a diagnostic is written to std::cerr (line numbers in
 * the diagnostics are zero-based) and false is returned; `out` then holds the
 * values accepted before the failure.
 */
static bool read_pua_values(FILE* file, std::vector<int>& out) {
    char buffer[10000];
    // Must live outside the per-line loop, otherwise the ordering check below
    // would always compare against 0 and never trigger.
    int prevPua = 0;
    for (int lineNo = 0; fgets(buffer, sizeof(buffer), file) != NULL; lineNo++) {
        int pua = 0;
        // Only the first 5 chars matter. A short line is caught here as well:
        // its newline or terminating NUL is not a hex digit, so the loop
        // bails out before reading past the end of the string.
        for (int i = 0; i < 5; i++) {
            const int value = hexchar_to_int(buffer[i]);
            if (value < 0) {  // bad char for hex
                std::cerr << "Expected hex char on line " << lineNo
                          << " col " << i << "\n";
                return false;
            }
            pua = (pua << 4) | value;
        }
        if (pua < 0xFE000 || pua > 0xFEFFF) {
            std::cerr << "PUA not in expected range " << pua << " line "
                      << lineNo << "\n";
            return false;
        }
        if (pua <= prevPua) {
            std::cerr << "PUA value not in ascending order line "
                      << lineNo << "\n";
            return false;
        }
        out.push_back(pua);
        prevPua = pua;
    }
    return true;
}

/* Entry point: argv[1] names the input text file.
 *
 * On success the generated table is printed to stdout and 0 is returned.
 * A missing argument, an unreadable file, an invalid line, or an input with
 * no entries produces a message on std::cerr and a return value of -1.
 */
int main (int argc, char * const argv[]) {
    if (argc < 2) {
        const char* self = (argc > 0 && argv[0] != NULL) ? argv[0] : "gmoji_pua";
        std::cerr << "Usage: " << self << " <input-file>\n";
        return -1;
    }

    FILE* file = fopen(argv[1], "r");
    if (NULL == file) {
        std::cerr << "Can't open " << argv[1] << " for input. Aborting\n";
        std::cout << "\n";
        return -1;
    }

    std::vector<int> unichars;
    const bool parsedOk = read_pua_values(file, unichars);
    // Single close point: the file is released on success and on every
    // parse-error path alike.
    fclose(file);
    if (!parsedOk) {
        return -1;
    }
    if (unichars.empty()) {
        // Without this guard the front/back accesses below would be
        // undefined behaviour on an empty input file.
        std::cerr << "No PUA values found in " << argv[1] << ". Aborting\n";
        return -1;
    }

    // Now output our resulting array to look like a C array
    const std::size_t perLine = 8;
    const std::size_t count = unichars.size();
    const int base = unichars.front();

    printf("\n");
    printf("// Compressed gmoji table, sorted\n");
    printf("// Originally scraped from %s\n", gSite);
    printf("// Input text file \"%s\"\n", argv[1]);
    printf("\n");
    printf("static const uint16_t gGmojiPUA[] = {\n");
    for (std::size_t i = 0; i < count; i++) {
        if ((i % perLine) == 0) {  // first one on a line
            printf(" ");
        }
        // Entries are stored as offsets from the smallest value; the input is
        // verified ascending, so the difference is never negative.
        printf("0x%03X", static_cast<unsigned>(unichars[i] - base));
        if (i == count - 1) {  // last one entirely
            printf("\n");
        } else if ((i % perLine) == (perLine - 1)) {  // last one on line
            printf(",\n");
        } else {
            printf(", ");
        }
    }
    printf("};\n");
    printf("\n");
    printf("#define GMOJI_PUA_MIN 0x%X\n", static_cast<unsigned>(unichars.front()));
    printf("#define GMOJI_PUA_MAX 0x%X\n", static_cast<unsigned>(unichars.back()));
    printf("#define GMOJI_PUA_COUNT (sizeof(gGmojiPUA) / sizeof(gGmojiPUA[0]))\n");
    // size_t does not match %d; convert explicitly to a type printf can name.
    printf("// GMOJI_PUA_COUNT should be %lu\n", static_cast<unsigned long>(count));
    printf("\n");
    return 0;
}
|