// Copyright (c) 2011 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef BASE_STRINGS_UTF_OFFSET_STRING_CONVERSIONS_H_ #define BASE_STRINGS_UTF_OFFSET_STRING_CONVERSIONS_H_ #include <string> #include <vector> #include "base/base_export.h" #include "base/strings/string16.h" #include "base/strings/string_piece.h" namespace base { // Like the conversions in utf_string_conversions.h, but also takes one or more // |offset[s]_for_adjustment| representing insertion/selection points between // characters: if |src| is "abcd", then 0 is before 'a', 2 is between 'b' and // 'c', and 4 is at the end of the string. Valid input offsets range from 0 to // |src_len|. On exit, each offset will have been modified to point at the same // logical position in the output string. If an offset cannot be successfully // adjusted (e.g. because it points into the middle of a multibyte sequence), it // will be set to string16::npos. // // |offset[s]_for_adjustment| may be NULL. BASE_EXPORT bool UTF8ToUTF16AndAdjustOffset(const char* src, size_t src_len, string16* output, size_t* offset_for_adjustment); BASE_EXPORT bool UTF8ToUTF16AndAdjustOffsets( const char* src, size_t src_len, string16* output, std::vector<size_t>* offsets_for_adjustment); BASE_EXPORT string16 UTF8ToUTF16AndAdjustOffset(const base::StringPiece& utf8, size_t* offset_for_adjustment); BASE_EXPORT string16 UTF8ToUTF16AndAdjustOffsets( const base::StringPiece& utf8, std::vector<size_t>* offsets_for_adjustment); BASE_EXPORT std::string UTF16ToUTF8AndAdjustOffset( const base::StringPiece16& utf16, size_t* offset_for_adjustment); BASE_EXPORT std::string UTF16ToUTF8AndAdjustOffsets( const base::StringPiece16& utf16, std::vector<size_t>* offsets_for_adjustment); // Limiting function callable by std::for_each which will replace any value // which is greater than |limit| with npos. Typically this is called with a // string length to clamp offsets into the string to [0, length] (as opposed to // [0, length); see comments above). template <typename T> struct LimitOffset { explicit LimitOffset(size_t limit) : limit_(limit) {} void operator()(size_t& offset) { if (offset > limit_) offset = T::npos; } size_t limit_; }; // Stack object which, on destruction, will update a vector of offsets based on // any supplied adjustments. To use, declare one of these, providing the // address of the offset vector to adjust. Then Add() any number of Adjustments // (each Adjustment gives the |original_offset| of a substring and the lengths // of the substring before and after transforming). When the OffsetAdjuster // goes out of scope, all the offsets in the provided vector will be updated. class BASE_EXPORT OffsetAdjuster { public: struct BASE_EXPORT Adjustment { Adjustment(size_t original_offset, size_t original_length, size_t output_length); size_t original_offset; size_t original_length; size_t output_length; }; explicit OffsetAdjuster(std::vector<size_t>* offsets_for_adjustment); ~OffsetAdjuster(); void Add(const Adjustment& adjustment); private: void AdjustOffset(std::vector<size_t>::iterator offset); std::vector<size_t>* offsets_for_adjustment_; std::vector<Adjustment> adjustments_; }; } // namespace base #endif // BASE_STRINGS_UTF_OFFSET_STRING_CONVERSIONS_H_