// blob: bdb7c111203f3578a2d1bb170c60d2641b6a3760 [file] [log] [blame]
// Copyright (c) 2011 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#ifndef BASE_STRINGS_UTF_OFFSET_STRING_CONVERSIONS_H_
#define BASE_STRINGS_UTF_OFFSET_STRING_CONVERSIONS_H_
#include <string>
#include <vector>
#include "base/base_export.h"
#include "base/strings/string16.h"
#include "base/strings/string_piece.h"
namespace base {
// Like the conversions in utf_string_conversions.h, but also takes one or more
// |offset[s]_for_adjustment| representing insertion/selection points between
// characters: if |src| is "abcd", then 0 is before 'a', 2 is between 'b' and
// 'c', and 4 is at the end of the string. Valid input offsets range from 0 to
// |src_len|. On exit, each offset will have been modified to point at the same
// logical position in the output string. If an offset cannot be successfully
// adjusted (e.g. because it points into the middle of a multibyte sequence), it
// will be set to string16::npos.
//
// |offset[s]_for_adjustment| may be NULL.
// Pointer-and-length form taking a single offset: converts the |src_len|
// chars starting at |src| into |*output|, adjusting |*offset_for_adjustment|
// as described in the comment above.
// NOTE(review): the meaning of the bool result is not visible in this header;
// presumably it reports whether the conversion succeeded -- confirm against
// the implementation.
BASE_EXPORT bool UTF8ToUTF16AndAdjustOffset(const char* src,
size_t src_len,
string16* output,
size_t* offset_for_adjustment);
// Pointer-and-length form taking several offsets: converts the |src_len|
// chars starting at |src| into |*output|, adjusting every element of
// |*offsets_for_adjustment| as described in the comment above.
// NOTE(review): the meaning of the bool result is not visible in this header;
// presumably it reports whether the conversion succeeded -- confirm against
// the implementation.
BASE_EXPORT bool UTF8ToUTF16AndAdjustOffsets(
const char* src,
size_t src_len,
string16* output,
std::vector<size_t>* offsets_for_adjustment);
// StringPiece form taking a single offset: returns the conversion of |utf8|
// as a string16 and adjusts |*offset_for_adjustment| to refer to the returned
// string.
BASE_EXPORT string16 UTF8ToUTF16AndAdjustOffset(const base::StringPiece& utf8,
size_t* offset_for_adjustment);
// StringPiece form taking several offsets: returns the conversion of |utf8|
// as a string16 and adjusts every element of |*offsets_for_adjustment| to
// refer to the returned string.
BASE_EXPORT string16 UTF8ToUTF16AndAdjustOffsets(
const base::StringPiece& utf8,
std::vector<size_t>* offsets_for_adjustment);
// Reverse direction, single offset: returns the conversion of |utf16| as a
// std::string and adjusts |*offset_for_adjustment| to refer to the returned
// string.
BASE_EXPORT std::string UTF16ToUTF8AndAdjustOffset(
const base::StringPiece16& utf16,
size_t* offset_for_adjustment);
// Reverse direction, several offsets: returns the conversion of |utf16| as a
// std::string and adjusts every element of |*offsets_for_adjustment| to refer
// to the returned string.
BASE_EXPORT std::string UTF16ToUTF8AndAdjustOffsets(
const base::StringPiece16& utf16,
std::vector<size_t>* offsets_for_adjustment);
// Limiting functor, callable by std::for_each, which replaces any offset that
// is greater than |limit| with T::npos. Typically this is constructed with a
// string length so that offsets in [0, length] are left untouched (note the
// inclusive upper bound, as opposed to [0, length): |length| itself is a valid
// offset denoting the end of the string) and anything beyond is invalidated.
//
// |T| must be a string-like type exposing a static |npos| member, e.g.
// std::string or string16.
template <typename T>
struct LimitOffset {
  // |limit| is the largest offset value that is still considered valid.
  explicit LimitOffset(size_t limit)
      : limit_(limit) {}

  // Overwrites |offset| with T::npos when it exceeds |limit_|; otherwise
  // leaves it unchanged. Declared const because invoking the functor never
  // modifies it, which also allows calls through const instances/references.
  void operator()(size_t& offset) const {
    if (offset > limit_)
      offset = T::npos;
  }

  // Inclusive upper bound for valid offsets.
  size_t limit_;
};
// Stack object which, on destruction, will update a vector of offsets based on
// any supplied adjustments. To use, declare one of these, providing the
// address of the offset vector to adjust. Then Add() any number of Adjustments
// (each Adjustment gives the |original_offset| of a substring and the lengths
// of the substring before and after transforming). When the OffsetAdjuster
// goes out of scope, all the offsets in the provided vector will be updated.
//
// NOTE(review): the destructor has side effects but copying is not disabled
// here; a copy would presumably apply the same adjustments a second time --
// confirm whether copy construction/assignment should be disallowed.
class BASE_EXPORT OffsetAdjuster {
public:
// Describes one transformed substring: where it started in the original
// string and how long it was before and after the transformation.
struct BASE_EXPORT Adjustment {
Adjustment(size_t original_offset,
size_t original_length,
size_t output_length);
// Offset of the substring within the original string.
size_t original_offset;
// Length of the substring before transforming.
size_t original_length;
// Length of the substring after transforming.
size_t output_length;
};
// |offsets_for_adjustment| is the address of the offset vector to adjust.
// NOTE(review): ownership is not visible here; presumably the vector is not
// owned and must outlive this object -- confirm against the implementation.
explicit OffsetAdjuster(std::vector<size_t>* offsets_for_adjustment);
// Per the class comment, this is where the offsets in the provided vector
// get updated.
~OffsetAdjuster();
// Supplies one more adjustment to take into account when the offsets are
// updated.
void Add(const Adjustment& adjustment);
private:
// Helper operating on a single element of the offset vector, identified by
// |offset|. NOTE(review): presumably applies |adjustments_| to that element;
// the definition lives outside this header.
void AdjustOffset(std::vector<size_t>::iterator offset);
// The offset vector supplied at construction.
std::vector<size_t>* offsets_for_adjustment_;
// Storage for Adjustment objects (presumably those passed to Add() --
// confirm against the implementation).
std::vector<Adjustment> adjustments_;
};
} // namespace base
#endif // BASE_STRINGS_UTF_OFFSET_STRING_CONVERSIONS_H_