summaryrefslogtreecommitdiffstats
path: root/chrome/browser/sync/util/character_set_converters-linux.cc
diff options
context:
space:
mode:
Diffstat (limited to 'chrome/browser/sync/util/character_set_converters-linux.cc')
-rw-r--r--chrome/browser/sync/util/character_set_converters-linux.cc60
1 files changed, 60 insertions, 0 deletions
diff --git a/chrome/browser/sync/util/character_set_converters-linux.cc b/chrome/browser/sync/util/character_set_converters-linux.cc
new file mode 100644
index 0000000..96ad1b6
--- /dev/null
+++ b/chrome/browser/sync/util/character_set_converters-linux.cc
@@ -0,0 +1,60 @@
+// Copyright (c) 2009 The Chromium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+
+#include "chrome/browser/sync/util/character_set_converters.h"
+
+#include <string>
+
+using std::string;
+
+namespace browser_sync {
+
+// Converts input_string to UTF8 and appends the result into output_string.
+void AppendPathStringToUTF8(const PathChar *wide, int size,
+ string* output_string) {
+ output_string->append(wide, size);
+}
+
+bool AppendUTF8ToPathString(const char* utf8, size_t size,
+ PathString* output_string) {
+ output_string->append(utf8, size);
+ return true;
+}
+
+void TrimPathStringToValidCharacter(PathString* string) {
+ // Constants from http://en.wikipedia.org/wiki/UTF-8
+ CHECK(string);
+ if (string->empty())
+ return;
+ if (0 == (string->at(string->length() - 1) & 0x080))
+ return;
+ int partial_enc_bytes = 0;
+ for (partial_enc_bytes = 0 ; true ; ++partial_enc_bytes) {
+ if (4 == partial_enc_bytes || partial_enc_bytes == string->length()) {
+ // original string was broken, garbage in, garbage out.
+ return;
+ }
+ PathChar c = string->at(string->length() - 1 - partial_enc_bytes);
+ if ((c & 0x0c0) == 0x080) // utf continuation char;
+ continue;
+ if ((c & 0x0e0) == 0x0e0) // 2-byte encoded char.
+ if (1 == partial_enc_bytes)
+ return;
+ else
+ break;
+ if ((c & 0x0f0) == 0xc0) // 3-byte encoded char.
+ if (2 == partial_enc_bytes)
+ return;
+ else
+ break;
+ if ((c & 0x0f8) == 0x0f0) // 4-byte encoded char.
+ if (3 == partial_enc_bytes)
+ return;
+ else
+ break;
+ }
+ string->resize(string->length() - 1 - partial_enc_bytes);
+}
+
+} // namespace browser_sync