// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // // This file implements utility functions for eliding and formatting UI text. // // Note that several of the functions declared in text_elider.h are implemented // in this file using helper classes in an unnamed namespace. #include "ui/gfx/text_elider.h" #include #include #include "base/files/file_path.h" #include "base/i18n/break_iterator.h" #include "base/i18n/char_iterator.h" #include "base/i18n/rtl.h" #include "base/memory/scoped_ptr.h" #include "base/strings/string_split.h" #include "base/strings/string_util.h" #include "base/strings/sys_string_conversions.h" #include "base/strings/utf_string_conversions.h" #include "net/base/escape.h" #include "net/base/net_util.h" #include "net/base/registry_controlled_domains/registry_controlled_domain.h" #include "third_party/icu/source/common/unicode/rbbi.h" #include "third_party/icu/source/common/unicode/uloc.h" #include "ui/gfx/font_list.h" #include "ui/gfx/text_utils.h" #include "url/gurl.h" namespace gfx { // U+2026 in utf8 const char kEllipsis[] = "\xE2\x80\xA6"; const char16 kEllipsisUTF16[] = { 0x2026, 0 }; const char16 kForwardSlash = '/'; namespace { // Helper class to split + elide text, while respecting UTF16 surrogate pairs. class StringSlicer { public: StringSlicer(const string16& text, const string16& ellipsis, bool elide_in_middle) : text_(text), ellipsis_(ellipsis), elide_in_middle_(elide_in_middle) { } // Cuts |text_| to be |length| characters long. If |elide_in_middle_| is true, // the middle of the string is removed to leave equal-length pieces from the // beginning and end of the string; otherwise, the end of the string is // removed and only the beginning remains. If |insert_ellipsis| is true, // then an ellipsis character will be inserted at the cut point. string16 CutString(size_t length, bool insert_ellipsis) { const string16 ellipsis_text = insert_ellipsis ? ellipsis_ : string16(); if (!elide_in_middle_) return text_.substr(0, FindValidBoundaryBefore(length)) + ellipsis_text; // We put the extra character, if any, before the cut. const size_t half_length = length / 2; const size_t prefix_length = FindValidBoundaryBefore(length - half_length); const size_t suffix_start_guess = text_.length() - half_length; const size_t suffix_start = FindValidBoundaryAfter(suffix_start_guess); const size_t suffix_length = half_length - (suffix_start_guess - suffix_start); return text_.substr(0, prefix_length) + ellipsis_text + text_.substr(suffix_start, suffix_length); } private: // Returns a valid cut boundary at or before |index|. size_t FindValidBoundaryBefore(size_t index) const { DCHECK_LE(index, text_.length()); if (index != text_.length()) U16_SET_CP_START(text_.data(), 0, index); return index; } // Returns a valid cut boundary at or after |index|. size_t FindValidBoundaryAfter(size_t index) const { DCHECK_LE(index, text_.length()); if (index != text_.length()) U16_SET_CP_LIMIT(text_.data(), 0, index, text_.length()); return index; } // The text to be sliced. const string16& text_; // Ellipsis string to use. const string16& ellipsis_; // If true, the middle of the string will be elided. bool elide_in_middle_; DISALLOW_COPY_AND_ASSIGN(StringSlicer); }; // Build a path from the first |num_components| elements in |path_elements|. // Prepends |path_prefix|, appends |filename|, inserts ellipsis if appropriate. string16 BuildPathFromComponents(const string16& path_prefix, const std::vector& path_elements, const string16& filename, size_t num_components) { // Add the initial elements of the path. string16 path = path_prefix; // Build path from first |num_components| elements. for (size_t j = 0; j < num_components; ++j) path += path_elements[j] + kForwardSlash; // Add |filename|, ellipsis if necessary. if (num_components != (path_elements.size() - 1)) path += string16(kEllipsisUTF16) + kForwardSlash; path += filename; return path; } // Takes a prefix (Domain, or Domain+subdomain) and a collection of path // components and elides if possible. Returns a string containing the longest // possible elided path, or an empty string if elision is not possible. string16 ElideComponentizedPath(const string16& url_path_prefix, const std::vector& url_path_elements, const string16& url_filename, const string16& url_query, const gfx::FontList& font_list, int available_pixel_width) { const size_t url_path_number_of_elements = url_path_elements.size(); CHECK(url_path_number_of_elements); for (size_t i = url_path_number_of_elements - 1; i > 0; --i) { string16 elided_path = BuildPathFromComponents(url_path_prefix, url_path_elements, url_filename, i); if (available_pixel_width >= gfx::GetStringWidth(elided_path, font_list)) return ElideText(elided_path + url_query, font_list, available_pixel_width, ELIDE_AT_END); } return string16(); } } // namespace string16 ElideEmail(const string16& email, const gfx::FontList& font_list, int available_pixel_width) { if (gfx::GetStringWidth(email, font_list) <= available_pixel_width) return email; // Split the email into its local-part (username) and domain-part. The email // spec technically allows for @ symbols in the local-part (username) of the // email under some special requirements. It is guaranteed that there is no @ // symbol in the domain part of the email however so splitting at the last @ // symbol is safe. const size_t split_index = email.find_last_of('@'); DCHECK_NE(split_index, string16::npos); string16 username = email.substr(0, split_index); string16 domain = email.substr(split_index + 1); DCHECK(!username.empty()); DCHECK(!domain.empty()); // Subtract the @ symbol from the available width as it is mandatory. const string16 kAtSignUTF16 = ASCIIToUTF16("@"); available_pixel_width -= gfx::GetStringWidth(kAtSignUTF16, font_list); // Check whether eliding the domain is necessary: if eliding the username // is sufficient, the domain will not be elided. const int full_username_width = gfx::GetStringWidth(username, font_list); const int available_domain_width = available_pixel_width - std::min(full_username_width, gfx::GetStringWidth(username.substr(0, 1) + kEllipsisUTF16, font_list)); if (gfx::GetStringWidth(domain, font_list) > available_domain_width) { // Elide the domain so that it only takes half of the available width. // Should the username not need all the width available in its half, the // domain will occupy the leftover width. // If |desired_domain_width| is greater than |available_domain_width|: the // minimal username elision allowed by the specifications will not fit; thus // |desired_domain_width| must be <= |available_domain_width| at all cost. const int desired_domain_width = std::min(available_domain_width, std::max(available_pixel_width - full_username_width, available_pixel_width / 2)); domain = ElideText(domain, font_list, desired_domain_width, ELIDE_IN_MIDDLE); // Failing to elide the domain such that at least one character remains // (other than the ellipsis itself) remains: return a single ellipsis. if (domain.length() <= 1U) return string16(kEllipsisUTF16); } // Fit the username in the remaining width (at this point the elided username // is guaranteed to fit with at least one character remaining given all the // precautions taken earlier). available_pixel_width -= gfx::GetStringWidth(domain, font_list); username = ElideText(username, font_list, available_pixel_width, ELIDE_AT_END); return username + kAtSignUTF16 + domain; } string16 ElideEmail(const string16& email, const gfx::Font& font, int available_pixel_width) { return ElideEmail(email, gfx::FontList(font), available_pixel_width); } // TODO(pkasting): http://crbug.com/77883 This whole function gets // kerning/ligatures/etc. issues potentially wrong by assuming that the width of // a rendered string is always the sum of the widths of its substrings. Also I // suspect it could be made simpler. string16 ElideUrl(const GURL& url, const gfx::FontList& font_list, int available_pixel_width, const std::string& languages) { // Get a formatted string and corresponding parsing of the url. url_parse::Parsed parsed; const string16 url_string = net::FormatUrl(url, languages, net::kFormatUrlOmitAll, net::UnescapeRule::SPACES, &parsed, NULL, NULL); if (available_pixel_width <= 0) return url_string; // If non-standard, return plain eliding. if (!url.IsStandard()) return ElideText(url_string, font_list, available_pixel_width, ELIDE_AT_END); // Now start eliding url_string to fit within available pixel width. // Fist pass - check to see whether entire url_string fits. const int pixel_width_url_string = gfx::GetStringWidth(url_string, font_list); if (available_pixel_width >= pixel_width_url_string) return url_string; // Get the path substring, including query and reference. const size_t path_start_index = parsed.path.begin; const size_t path_len = parsed.path.len; string16 url_path_query_etc = url_string.substr(path_start_index); string16 url_path = url_string.substr(path_start_index, path_len); // Return general elided text if url minus the query fits. const string16 url_minus_query = url_string.substr(0, path_start_index + path_len); if (available_pixel_width >= gfx::GetStringWidth(url_minus_query, font_list)) return ElideText(url_string, font_list, available_pixel_width, ELIDE_AT_END); // Get Host. string16 url_host = UTF8ToUTF16(url.host()); // Get domain and registry information from the URL. string16 url_domain = UTF8ToUTF16( net::registry_controlled_domains::GetDomainAndRegistry( url, net::registry_controlled_domains::EXCLUDE_PRIVATE_REGISTRIES)); if (url_domain.empty()) url_domain = url_host; // Add port if required. if (!url.port().empty()) { url_host += UTF8ToUTF16(":" + url.port()); url_domain += UTF8ToUTF16(":" + url.port()); } // Get sub domain. string16 url_subdomain; const size_t domain_start_index = url_host.find(url_domain); if (domain_start_index != string16::npos) url_subdomain = url_host.substr(0, domain_start_index); const string16 kWwwPrefix = UTF8ToUTF16("www."); if ((url_subdomain == kWwwPrefix || url_subdomain.empty() || url.SchemeIsFile())) { url_subdomain.clear(); } // If this is a file type, the path is now defined as everything after ":". // For example, "C:/aa/aa/bb", the path is "/aa/bb/cc". Interesting, the // domain is now C: - this is a nice hack for eliding to work pleasantly. if (url.SchemeIsFile()) { // Split the path string using ":" std::vector file_path_split; base::SplitString(url_path, ':', &file_path_split); if (file_path_split.size() > 1) { // File is of type "file:///C:/.." url_host.clear(); url_domain.clear(); url_subdomain.clear(); const string16 kColon = UTF8ToUTF16(":"); url_host = url_domain = file_path_split.at(0).substr(1) + kColon; url_path_query_etc = url_path = file_path_split.at(1); } } // Second Pass - remove scheme - the rest fits. const int pixel_width_url_host = gfx::GetStringWidth(url_host, font_list); const int pixel_width_url_path = gfx::GetStringWidth(url_path_query_etc, font_list); if (available_pixel_width >= pixel_width_url_host + pixel_width_url_path) return url_host + url_path_query_etc; // Third Pass: Subdomain, domain and entire path fits. const int pixel_width_url_domain = gfx::GetStringWidth(url_domain, font_list); const int pixel_width_url_subdomain = gfx::GetStringWidth(url_subdomain, font_list); if (available_pixel_width >= pixel_width_url_subdomain + pixel_width_url_domain + pixel_width_url_path) return url_subdomain + url_domain + url_path_query_etc; // Query element. string16 url_query; const int kPixelWidthDotsTrailer = gfx::GetStringWidth( string16(kEllipsisUTF16), font_list); if (parsed.query.is_nonempty()) { url_query = UTF8ToUTF16("?") + url_string.substr(parsed.query.begin); if (available_pixel_width >= (pixel_width_url_subdomain + pixel_width_url_domain + pixel_width_url_path - gfx::GetStringWidth(url_query, font_list))) { return ElideText(url_subdomain + url_domain + url_path_query_etc, font_list, available_pixel_width, ELIDE_AT_END); } } // Parse url_path using '/'. std::vector url_path_elements; base::SplitString(url_path, kForwardSlash, &url_path_elements); // Get filename - note that for a path ending with / // such as www.google.com/intl/ads/, the file name is ads/. size_t url_path_number_of_elements = url_path_elements.size(); DCHECK(url_path_number_of_elements != 0); string16 url_filename; if ((url_path_elements.at(url_path_number_of_elements - 1)).length() > 0) { url_filename = *(url_path_elements.end() - 1); } else if (url_path_number_of_elements > 1) { // Path ends with a '/'. url_filename = url_path_elements.at(url_path_number_of_elements - 2) + kForwardSlash; url_path_number_of_elements--; } DCHECK(url_path_number_of_elements != 0); const size_t kMaxNumberOfUrlPathElementsAllowed = 1024; if (url_path_number_of_elements <= 1 || url_path_number_of_elements > kMaxNumberOfUrlPathElementsAllowed) { // No path to elide, or too long of a path (could overflow in loop below) // Just elide this as a text string. return ElideText(url_subdomain + url_domain + url_path_query_etc, font_list, available_pixel_width, ELIDE_AT_END); } // Start eliding the path and replacing elements by ".../". const string16 kEllipsisAndSlash = string16(kEllipsisUTF16) + kForwardSlash; const int pixel_width_ellipsis_slash = gfx::GetStringWidth(kEllipsisAndSlash, font_list); // Check with both subdomain and domain. string16 elided_path = ElideComponentizedPath(url_subdomain + url_domain, url_path_elements, url_filename, url_query, font_list, available_pixel_width); if (!elided_path.empty()) return elided_path; // Check with only domain. // If a subdomain is present, add an ellipsis before domain. // This is added only if the subdomain pixel width is larger than // the pixel width of kEllipsis. Otherwise, subdomain remains, // which means that this case has been resolved earlier. string16 url_elided_domain = url_subdomain + url_domain; if (pixel_width_url_subdomain > kPixelWidthDotsTrailer) { if (!url_subdomain.empty()) url_elided_domain = kEllipsisAndSlash[0] + url_domain; else url_elided_domain = url_domain; elided_path = ElideComponentizedPath(url_elided_domain, url_path_elements, url_filename, url_query, font_list, available_pixel_width); if (!elided_path.empty()) return elided_path; } // Return elided domain/.../filename anyway. string16 final_elided_url_string(url_elided_domain); const int url_elided_domain_width = gfx::GetStringWidth(url_elided_domain, font_list); // A hack to prevent trailing ".../...". if ((available_pixel_width - url_elided_domain_width) > pixel_width_ellipsis_slash + kPixelWidthDotsTrailer + gfx::GetStringWidth(ASCIIToUTF16("UV"), font_list)) { final_elided_url_string += BuildPathFromComponents(string16(), url_path_elements, url_filename, 1); } else { final_elided_url_string += url_path; } return ElideText(final_elided_url_string, font_list, available_pixel_width, ELIDE_AT_END); } string16 ElideUrl(const GURL& url, const gfx::Font& font, int available_pixel_width, const std::string& languages) { return ElideUrl(url, gfx::FontList(font), available_pixel_width, languages); } string16 ElideFilename(const base::FilePath& filename, const gfx::FontList& font_list, int available_pixel_width) { #if defined(OS_WIN) string16 filename_utf16 = filename.value(); string16 extension = filename.Extension(); string16 rootname = filename.BaseName().RemoveExtension().value(); #elif defined(OS_POSIX) string16 filename_utf16 = WideToUTF16(base::SysNativeMBToWide( filename.value())); string16 extension = WideToUTF16(base::SysNativeMBToWide( filename.Extension())); string16 rootname = WideToUTF16(base::SysNativeMBToWide( filename.BaseName().RemoveExtension().value())); #endif const int full_width = gfx::GetStringWidth(filename_utf16, font_list); if (full_width <= available_pixel_width) return base::i18n::GetDisplayStringInLTRDirectionality(filename_utf16); if (rootname.empty() || extension.empty()) { const string16 elided_name = ElideText(filename_utf16, font_list, available_pixel_width, ELIDE_AT_END); return base::i18n::GetDisplayStringInLTRDirectionality(elided_name); } const int ext_width = gfx::GetStringWidth(extension, font_list); const int root_width = gfx::GetStringWidth(rootname, font_list); // We may have trimmed the path. if (root_width + ext_width <= available_pixel_width) { const string16 elided_name = rootname + extension; return base::i18n::GetDisplayStringInLTRDirectionality(elided_name); } if (ext_width >= available_pixel_width) { const string16 elided_name = ElideText(rootname + extension, font_list, available_pixel_width, ELIDE_IN_MIDDLE); return base::i18n::GetDisplayStringInLTRDirectionality(elided_name); } int available_root_width = available_pixel_width - ext_width; string16 elided_name = ElideText(rootname, font_list, available_root_width, ELIDE_AT_END); elided_name += extension; return base::i18n::GetDisplayStringInLTRDirectionality(elided_name); } string16 ElideFilename(const base::FilePath& filename, const gfx::Font& font, int available_pixel_width) { return ElideFilename(filename, gfx::FontList(font), available_pixel_width); } string16 ElideText(const string16& text, const gfx::FontList& font_list, int available_pixel_width, ElideBehavior elide_behavior) { if (text.empty()) return text; const int current_text_pixel_width = gfx::GetStringWidth(text, font_list); const bool elide_in_middle = (elide_behavior == ELIDE_IN_MIDDLE); const bool insert_ellipsis = (elide_behavior != TRUNCATE_AT_END); const string16 ellipsis = string16(kEllipsisUTF16); StringSlicer slicer(text, ellipsis, elide_in_middle); // Pango will return 0 width for absurdly long strings. Cut the string in // half and try again. // This is caused by an int overflow in Pango (specifically, in // pango_glyph_string_extents_range). It's actually more subtle than just // returning 0, since on super absurdly long strings, the int can wrap and // return positive numbers again. Detecting that is probably not worth it // (eliding way too much from a ridiculous string is probably still // ridiculous), but we should check other widths for bogus values as well. if (current_text_pixel_width <= 0 && !text.empty()) { const string16 cut = slicer.CutString(text.length() / 2, false); return ElideText(cut, font_list, available_pixel_width, elide_behavior); } if (current_text_pixel_width <= available_pixel_width) return text; if (insert_ellipsis && gfx::GetStringWidth(ellipsis, font_list) > available_pixel_width) return string16(); // Use binary search to compute the elided text. size_t lo = 0; size_t hi = text.length() - 1; size_t guess; for (guess = (lo + hi) / 2; lo <= hi; guess = (lo + hi) / 2) { // We check the length of the whole desired string at once to ensure we // handle kerning/ligatures/etc. correctly. const string16 cut = slicer.CutString(guess, insert_ellipsis); const int guess_length = gfx::GetStringWidth(cut, font_list); // Check again that we didn't hit a Pango width overflow. If so, cut the // current string in half and start over. if (guess_length <= 0) { return ElideText(slicer.CutString(guess / 2, false), font_list, available_pixel_width, elide_behavior); } if (guess_length > available_pixel_width) hi = guess - 1; else lo = guess + 1; } return slicer.CutString(guess, insert_ellipsis); } string16 ElideText(const string16& text, const gfx::Font& font, int available_pixel_width, ElideBehavior elide_behavior) { return ElideText(text, gfx::FontList(font), available_pixel_width, elide_behavior); } SortedDisplayURL::SortedDisplayURL(const GURL& url, const std::string& languages) { net::AppendFormattedHost(url, languages, &sort_host_); string16 host_minus_www = net::StripWWW(sort_host_); url_parse::Parsed parsed; display_url_ = net::FormatUrl(url, languages, net::kFormatUrlOmitAll, net::UnescapeRule::SPACES, &parsed, &prefix_end_, NULL); if (sort_host_.length() > host_minus_www.length()) { prefix_end_ += sort_host_.length() - host_minus_www.length(); sort_host_.swap(host_minus_www); } } SortedDisplayURL::SortedDisplayURL() : prefix_end_(0) { } SortedDisplayURL::~SortedDisplayURL() { } int SortedDisplayURL::Compare(const SortedDisplayURL& other, icu::Collator* collator) const { // Compare on hosts first. The host won't contain 'www.'. UErrorCode compare_status = U_ZERO_ERROR; UCollationResult host_compare_result = collator->compare( static_cast(sort_host_.c_str()), static_cast(sort_host_.length()), static_cast(other.sort_host_.c_str()), static_cast(other.sort_host_.length()), compare_status); DCHECK(U_SUCCESS(compare_status)); if (host_compare_result != 0) return host_compare_result; // Hosts match, compare on the portion of the url after the host. string16 path = this->AfterHost(); string16 o_path = other.AfterHost(); compare_status = U_ZERO_ERROR; UCollationResult path_compare_result = collator->compare( static_cast(path.c_str()), static_cast(path.length()), static_cast(o_path.c_str()), static_cast(o_path.length()), compare_status); DCHECK(U_SUCCESS(compare_status)); if (path_compare_result != 0) return path_compare_result; // Hosts and paths match, compare on the complete url. This'll push the www. // ones to the end. compare_status = U_ZERO_ERROR; UCollationResult display_url_compare_result = collator->compare( static_cast(display_url_.c_str()), static_cast(display_url_.length()), static_cast(other.display_url_.c_str()), static_cast(other.display_url_.length()), compare_status); DCHECK(U_SUCCESS(compare_status)); return display_url_compare_result; } string16 SortedDisplayURL::AfterHost() const { const size_t slash_index = display_url_.find(sort_host_, prefix_end_); if (slash_index == string16::npos) { NOTREACHED(); return string16(); } return display_url_.substr(slash_index + sort_host_.length()); } bool ElideString(const string16& input, int max_len, string16* output) { DCHECK_GE(max_len, 0); if (static_cast(input.length()) <= max_len) { output->assign(input); return false; } switch (max_len) { case 0: output->clear(); break; case 1: output->assign(input.substr(0, 1)); break; case 2: output->assign(input.substr(0, 2)); break; case 3: output->assign(input.substr(0, 1) + ASCIIToUTF16(".") + input.substr(input.length() - 1)); break; case 4: output->assign(input.substr(0, 1) + ASCIIToUTF16("..") + input.substr(input.length() - 1)); break; default: { int rstr_len = (max_len - 3) / 2; int lstr_len = rstr_len + ((max_len - 3) % 2); output->assign(input.substr(0, lstr_len) + ASCIIToUTF16("...") + input.substr(input.length() - rstr_len)); break; } } return true; } namespace { // Internal class used to track progress of a rectangular string elide // operation. Exists so the top-level ElideRectangleString() function // can be broken into smaller methods sharing this state. class RectangleString { public: RectangleString(size_t max_rows, size_t max_cols, bool strict, string16 *output) : max_rows_(max_rows), max_cols_(max_cols), current_row_(0), current_col_(0), strict_(strict), suppressed_(false), output_(output) {} // Perform deferred initializations following creation. Must be called // before any input can be added via AddString(). void Init() { output_->clear(); } // Add an input string, reformatting to fit the desired dimensions. // AddString() may be called multiple times to concatenate together // multiple strings into the region (the current caller doesn't do // this, however). void AddString(const string16& input); // Perform any deferred output processing. Must be called after the // last AddString() call has occurred. bool Finalize(); private: // Add a line to the rectangular region at the current position, // either by itself or by breaking it into words. void AddLine(const string16& line); // Add a word to the rectangular region at the current position, // either by itself or by breaking it into characters. void AddWord(const string16& word); // Add text to the output string if the rectangular boundaries // have not been exceeded, advancing the current position. void Append(const string16& string); // Set the current position to the beginning of the next line. If // |output| is true, add a newline to the output string if the rectangular // boundaries have not been exceeded. If |output| is false, we assume // some other mechanism will (likely) do similar breaking after the fact. void NewLine(bool output); // Maximum number of rows allowed in the output string. size_t max_rows_; // Maximum number of characters allowed in the output string. size_t max_cols_; // Current row position, always incremented and may exceed max_rows_ // when the input can not fit in the region. We stop appending to // the output string, however, when this condition occurs. In the // future, we may want to expose this value to allow the caller to // determine how many rows would actually be required to hold the // formatted string. size_t current_row_; // Current character position, should never exceed max_cols_. size_t current_col_; // True when we do whitespace to newline conversions ourselves. bool strict_; // True when some of the input has been truncated. bool suppressed_; // String onto which the output is accumulated. string16* output_; DISALLOW_COPY_AND_ASSIGN(RectangleString); }; void RectangleString::AddString(const string16& input) { base::i18n::BreakIterator lines(input, base::i18n::BreakIterator::BREAK_NEWLINE); if (lines.Init()) { while (lines.Advance()) AddLine(lines.GetString()); } else { NOTREACHED() << "BreakIterator (lines) init failed"; } } bool RectangleString::Finalize() { if (suppressed_) { output_->append(ASCIIToUTF16("...")); return true; } return false; } void RectangleString::AddLine(const string16& line) { if (line.length() < max_cols_) { Append(line); } else { base::i18n::BreakIterator words(line, base::i18n::BreakIterator::BREAK_SPACE); if (words.Init()) { while (words.Advance()) AddWord(words.GetString()); } else { NOTREACHED() << "BreakIterator (words) init failed"; } } // Account for naturally-occuring newlines. ++current_row_; current_col_ = 0; } void RectangleString::AddWord(const string16& word) { if (word.length() < max_cols_) { // Word can be made to fit, no need to fragment it. if (current_col_ + word.length() >= max_cols_) NewLine(strict_); Append(word); } else { // Word is so big that it must be fragmented. int array_start = 0; int char_start = 0; base::i18n::UTF16CharIterator chars(&word); while (!chars.end()) { // When boundary is hit, add as much as will fit on this line. if (current_col_ + (chars.char_pos() - char_start) >= max_cols_) { Append(word.substr(array_start, chars.array_pos() - array_start)); NewLine(true); array_start = chars.array_pos(); char_start = chars.char_pos(); } chars.Advance(); } // Add the last remaining fragment, if any. if (array_start != chars.array_pos()) Append(word.substr(array_start, chars.array_pos() - array_start)); } } void RectangleString::Append(const string16& string) { if (current_row_ < max_rows_) output_->append(string); else suppressed_ = true; current_col_ += string.length(); } void RectangleString::NewLine(bool output) { if (current_row_ < max_rows_) { if (output) output_->append(ASCIIToUTF16("\n")); } else { suppressed_ = true; } ++current_row_; current_col_ = 0; } // Internal class used to track progress of a rectangular text elide // operation. Exists so the top-level ElideRectangleText() function // can be broken into smaller methods sharing this state. class RectangleText { public: RectangleText(const gfx::FontList& font_list, int available_pixel_width, int available_pixel_height, WordWrapBehavior wrap_behavior, std::vector* lines) : font_list_(font_list), line_height_(font_list.GetHeight()), available_pixel_width_(available_pixel_width), available_pixel_height_(available_pixel_height), wrap_behavior_(wrap_behavior), current_width_(0), current_height_(0), last_line_ended_in_lf_(false), lines_(lines), insufficient_width_(false), insufficient_height_(false) {} // Perform deferred initializions following creation. Must be called // before any input can be added via AddString(). void Init() { lines_->clear(); } // Add an input string, reformatting to fit the desired dimensions. // AddString() may be called multiple times to concatenate together // multiple strings into the region (the current caller doesn't do // this, however). void AddString(const string16& input); // Perform any deferred output processing. Must be called after the last // AddString() call has occured. Returns a combination of // |ReformattingResultFlags| indicating whether the given width or height was // insufficient, leading to elision or truncation. int Finalize(); private: // Add a line to the rectangular region at the current position, // either by itself or by breaking it into words. void AddLine(const string16& line); // Wrap the specified word across multiple lines. int WrapWord(const string16& word); // Add a long word - wrapping, eliding or truncating per the wrap behavior. int AddWordOverflow(const string16& word); // Add a word to the rectangluar region at the current position. int AddWord(const string16& word); // Append the specified |text| to the current output line, incrementing the // running width by the specified amount. This is an optimization over // |AddToCurrentLine()| when |text_width| is already known. void AddToCurrentLineWithWidth(const string16& text, int text_width); // Append the specified |text| to the current output line. void AddToCurrentLine(const string16& text); // Set the current position to the beginning of the next line. bool NewLine(); // The font list used for measuring text width. const gfx::FontList& font_list_; // The height of each line of text. const int line_height_; // The number of pixels of available width in the rectangle. const int available_pixel_width_; // The number of pixels of available height in the rectangle. const int available_pixel_height_; // The wrap behavior for words that are too long to fit on a single line. const WordWrapBehavior wrap_behavior_; // The current running width. int current_width_; // The current running height. int current_height_; // The current line of text. string16 current_line_; // Indicates whether the last line ended with \n. bool last_line_ended_in_lf_; // The output vector of lines. std::vector* lines_; // Indicates whether a word was so long that it had to be truncated or elided // to fit the available width. bool insufficient_width_; // Indicates whether there were too many lines for the available height. bool insufficient_height_; DISALLOW_COPY_AND_ASSIGN(RectangleText); }; void RectangleText::AddString(const string16& input) { base::i18n::BreakIterator lines(input, base::i18n::BreakIterator::BREAK_NEWLINE); if (lines.Init()) { while (!insufficient_height_ && lines.Advance()) { string16 line = lines.GetString(); // The BREAK_NEWLINE iterator will keep the trailing newline character, // except in the case of the last line, which may not have one. Remove // the newline character, if it exists. last_line_ended_in_lf_ = !line.empty() && line[line.length() - 1] == '\n'; if (last_line_ended_in_lf_) line.resize(line.length() - 1); AddLine(line); } } else { NOTREACHED() << "BreakIterator (lines) init failed"; } } int RectangleText::Finalize() { // Remove trailing whitespace from the last line or remove the last line // completely, if it's just whitespace. if (!insufficient_height_ && !lines_->empty()) { TrimWhitespace(lines_->back(), TRIM_TRAILING, &lines_->back()); if (lines_->back().empty() && !last_line_ended_in_lf_) lines_->pop_back(); } if (last_line_ended_in_lf_) lines_->push_back(string16()); return (insufficient_width_ ? INSUFFICIENT_SPACE_HORIZONTAL : 0) | (insufficient_height_ ? INSUFFICIENT_SPACE_VERTICAL : 0); } void RectangleText::AddLine(const string16& line) { const int line_width = gfx::GetStringWidth(line, font_list_); if (line_width <= available_pixel_width_) { AddToCurrentLineWithWidth(line, line_width); } else { // Iterate over positions that are valid to break the line at. In general, // these are word boundaries but after any punctuation following the word. base::i18n::BreakIterator words(line, base::i18n::BreakIterator::BREAK_LINE); if (words.Init()) { while (words.Advance()) { const bool truncate = !current_line_.empty(); const string16& word = words.GetString(); const int lines_added = AddWord(word); if (lines_added) { if (truncate) { // Trim trailing whitespace from the line that was added. const int line = lines_->size() - lines_added; TrimWhitespace(lines_->at(line), TRIM_TRAILING, &lines_->at(line)); } if (ContainsOnlyWhitespace(word)) { // Skip the first space if the previous line was carried over. current_width_ = 0; current_line_.clear(); } } } } else { NOTREACHED() << "BreakIterator (words) init failed"; } } // Account for naturally-occuring newlines. NewLine(); } int RectangleText::WrapWord(const string16& word) { // Word is so wide that it must be fragmented. string16 text = word; int lines_added = 0; bool first_fragment = true; while (!insufficient_height_ && !text.empty()) { string16 fragment = ElideText(text, font_list_, available_pixel_width_, TRUNCATE_AT_END); // At least one character has to be added at every line, even if the // available space is too small. if(fragment.empty()) fragment = text.substr(0, 1); if (!first_fragment && NewLine()) lines_added++; AddToCurrentLine(fragment); text = text.substr(fragment.length()); first_fragment = false; } return lines_added; } int RectangleText::AddWordOverflow(const string16& word) { int lines_added = 0; // Unless this is the very first word, put it on a new line. if (!current_line_.empty()) { if (!NewLine()) return 0; lines_added++; } if (wrap_behavior_ == IGNORE_LONG_WORDS) { current_line_ = word; current_width_ = available_pixel_width_; } else if (wrap_behavior_ == WRAP_LONG_WORDS) { lines_added += WrapWord(word); } else { const ElideBehavior elide_behavior = (wrap_behavior_ == ELIDE_LONG_WORDS ? ELIDE_AT_END : TRUNCATE_AT_END); const string16 elided_word = ElideText(word, font_list_, available_pixel_width_, elide_behavior); AddToCurrentLine(elided_word); insufficient_width_ = true; } return lines_added; } int RectangleText::AddWord(const string16& word) { int lines_added = 0; string16 trimmed; TrimWhitespace(word, TRIM_TRAILING, &trimmed); const int trimmed_width = gfx::GetStringWidth(trimmed, font_list_); if (trimmed_width <= available_pixel_width_) { // Word can be made to fit, no need to fragment it. if ((current_width_ + trimmed_width > available_pixel_width_) && NewLine()) lines_added++; // Append the non-trimmed word, in case more words are added after. AddToCurrentLine(word); } else { lines_added = AddWordOverflow(wrap_behavior_ == IGNORE_LONG_WORDS ? trimmed : word); } return lines_added; } void RectangleText::AddToCurrentLine(const string16& text) { AddToCurrentLineWithWidth(text, gfx::GetStringWidth(text, font_list_)); } void RectangleText::AddToCurrentLineWithWidth(const string16& text, int text_width) { if (current_height_ >= available_pixel_height_) { insufficient_height_ = true; return; } current_line_.append(text); current_width_ += text_width; } bool RectangleText::NewLine() { bool line_added = false; if (current_height_ < available_pixel_height_) { lines_->push_back(current_line_); current_line_.clear(); line_added = true; } else { insufficient_height_ = true; } current_height_ += line_height_; current_width_ = 0; return line_added; } } // namespace bool ElideRectangleString(const string16& input, size_t max_rows, size_t max_cols, bool strict, string16* output) { RectangleString rect(max_rows, max_cols, strict, output); rect.Init(); rect.AddString(input); return rect.Finalize(); } int ElideRectangleText(const string16& input, const gfx::FontList& font_list, int available_pixel_width, int available_pixel_height, WordWrapBehavior wrap_behavior, std::vector* lines) { RectangleText rect(font_list, available_pixel_width, available_pixel_height, wrap_behavior, lines); rect.Init(); rect.AddString(input); return rect.Finalize(); } int ElideRectangleText(const string16& input, const gfx::Font& font, int available_pixel_width, int available_pixel_height, WordWrapBehavior wrap_behavior, std::vector* lines) { return ElideRectangleText(input, gfx::FontList(font), available_pixel_width, available_pixel_height, wrap_behavior, lines); } string16 TruncateString(const string16& string, size_t length) { if (string.size() <= length) // String fits, return it. return string; if (length == 0) // No room for the elide string, return an empty string. return string16(); size_t max = length - 1; // Added to the end of strings that are too big. static const char16 kElideString[] = { 0x2026, 0 }; if (max == 0) // Just enough room for the elide string. return kElideString; // Use a line iterator to find the first boundary. UErrorCode status = U_ZERO_ERROR; scoped_ptr bi( static_cast( icu::RuleBasedBreakIterator::createLineInstance( icu::Locale::getDefault(), status))); if (U_FAILURE(status)) return string.substr(0, max) + kElideString; bi->setText(string.c_str()); int32_t index = bi->preceding(static_cast(max)); if (index == icu::BreakIterator::DONE) { index = static_cast(max); } else { // Found a valid break (may be the beginning of the string). Now use // a character iterator to find the previous non-whitespace character. icu::StringCharacterIterator char_iterator(string.c_str()); if (index == 0) { // No valid line breaks. Start at the end again. This ensures we break // on a valid character boundary. index = static_cast(max); } char_iterator.setIndex(index); while (char_iterator.hasPrevious()) { char_iterator.previous(); if (!(u_isspace(char_iterator.current()) || u_charType(char_iterator.current()) == U_CONTROL_CHAR || u_charType(char_iterator.current()) == U_NON_SPACING_MARK)) { // Not a whitespace character. Advance the iterator so that we // include the current character in the truncated string. char_iterator.next(); break; } } if (char_iterator.hasPrevious()) { // Found a valid break point. index = char_iterator.getIndex(); } else { // String has leading whitespace, return the elide string. return kElideString; } } return string.substr(0, index) + kElideString; } } // namespace gfx