| /* |
| * Copyright (C) 2013 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #ifndef _CHARACTER_ENCODING_DETECTOR_H |
| #define _CHARACTER_ENCODING_DETECTOR_H |
| |
| #include <media/mediascanner.h> |
| |
| #include "StringArray.h" |
| |
| #include "unicode/ucnv.h" |
| #include "unicode/ucsdet.h" |
| #include "unicode/ustring.h" |
| |
| namespace android { |
| |
| class CharacterEncodingDetector { |
| |
| public: |
| CharacterEncodingDetector(); |
| ~CharacterEncodingDetector(); |
| |
| void addTag(const char *name, const char *value); |
| size_t size(); |
| |
| void detectAndConvert(); |
| status_t getTag(int index, const char **name, const char**value); |
| |
| private: |
| const UCharsetMatch *getPreferred( |
| const char *input, size_t len, |
| const UCharsetMatch** ucma, size_t matches, |
| bool *goodmatch, int *highestmatch); |
| |
| bool isFrequent(const uint16_t *values, uint32_t c); |
| |
| // cached name and value strings, for native encoding support. |
| // TODO: replace these with byte blob arrays that don't require the data to be |
| // singlenullbyte-terminated |
| StringArray mNames; |
| StringArray mValues; |
| |
| UConverter* mUtf8Conv; |
| }; |
| |
| |
| |
| }; // namespace android |
| |
| #endif |