blob: e834815b09f68ea1af2fd3745c4800d4b3849f48 [file] [log] [blame]
// Copyright 2017 The PDFium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#include "core/fxcrt/cfx_utf8decoder.h"
#include <utility>
CFX_UTF8Decoder::CFX_UTF8Decoder(ByteStringView input) {
for (char c : input) {
ProcessByte(c);
}
}
CFX_UTF8Decoder::~CFX_UTF8Decoder() = default;
WideString CFX_UTF8Decoder::TakeResult() {
return std::move(m_Buffer);
}
void CFX_UTF8Decoder::AppendCodePoint(uint32_t ch) {
m_Buffer += static_cast<wchar_t>(ch);
}
void CFX_UTF8Decoder::ProcessByte(uint8_t byte) {
if (byte < 0x80) {
m_PendingBytes = 0;
AppendCodePoint(byte);
} else if (byte < 0xc0) {
if (m_PendingBytes == 0) {
return;
}
m_PendingBytes--;
m_PendingChar |= (byte & 0x3f) << (m_PendingBytes * 6);
if (m_PendingBytes == 0) {
AppendCodePoint(m_PendingChar);
}
} else if (byte < 0xe0) {
m_PendingBytes = 1;
m_PendingChar = (byte & 0x1f) << 6;
} else if (byte < 0xf0) {
m_PendingBytes = 2;
m_PendingChar = (byte & 0x0f) << 12;
} else if (byte < 0xf8) {
m_PendingBytes = 3;
m_PendingChar = (byte & 0x07) << 18;
} else if (byte < 0xfc) {
m_PendingBytes = 4;
m_PendingChar = (byte & 0x03) << 24;
} else if (byte < 0xfe) {
m_PendingBytes = 5;
m_PendingChar = (byte & 0x01) << 30;
} else {
m_PendingBytes = 0;
}
}