59 lines
1.4 KiB
C++
59 lines
1.4 KiB
C++
|
|
// Copyright 2017 The PDFium Authors
|
||
|
|
// Use of this source code is governed by a BSD-style license that can be
|
||
|
|
// found in the LICENSE file.
|
||
|
|
|
||
|
|
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
|
||
|
|
|
||
|
|
#include "core/fxcrt/cfx_utf8decoder.h"
|
||
|
|
|
||
|
|
#include <utility>
|
||
|
|
|
||
|
|
CFX_UTF8Decoder::CFX_UTF8Decoder(ByteStringView input) {
|
||
|
|
for (char c : input) {
|
||
|
|
ProcessByte(c);
|
||
|
|
}
|
||
|
|
}
|
||
|
|
|
||
|
|
CFX_UTF8Decoder::~CFX_UTF8Decoder() = default;
|
||
|
|
|
||
|
|
WideString CFX_UTF8Decoder::TakeResult() {
|
||
|
|
return std::move(m_Buffer);
|
||
|
|
}
|
||
|
|
|
||
|
|
void CFX_UTF8Decoder::AppendCodePoint(uint32_t ch) {
|
||
|
|
m_Buffer += static_cast<wchar_t>(ch);
|
||
|
|
}
|
||
|
|
|
||
|
|
void CFX_UTF8Decoder::ProcessByte(uint8_t byte) {
|
||
|
|
if (byte < 0x80) {
|
||
|
|
m_PendingBytes = 0;
|
||
|
|
AppendCodePoint(byte);
|
||
|
|
} else if (byte < 0xc0) {
|
||
|
|
if (m_PendingBytes == 0) {
|
||
|
|
return;
|
||
|
|
}
|
||
|
|
m_PendingBytes--;
|
||
|
|
m_PendingChar |= (byte & 0x3f) << (m_PendingBytes * 6);
|
||
|
|
if (m_PendingBytes == 0) {
|
||
|
|
AppendCodePoint(m_PendingChar);
|
||
|
|
}
|
||
|
|
} else if (byte < 0xe0) {
|
||
|
|
m_PendingBytes = 1;
|
||
|
|
m_PendingChar = (byte & 0x1f) << 6;
|
||
|
|
} else if (byte < 0xf0) {
|
||
|
|
m_PendingBytes = 2;
|
||
|
|
m_PendingChar = (byte & 0x0f) << 12;
|
||
|
|
} else if (byte < 0xf8) {
|
||
|
|
m_PendingBytes = 3;
|
||
|
|
m_PendingChar = (byte & 0x07) << 18;
|
||
|
|
} else if (byte < 0xfc) {
|
||
|
|
m_PendingBytes = 4;
|
||
|
|
m_PendingChar = (byte & 0x03) << 24;
|
||
|
|
} else if (byte < 0xfe) {
|
||
|
|
m_PendingBytes = 5;
|
||
|
|
m_PendingChar = (byte & 0x01) << 30;
|
||
|
|
} else {
|
||
|
|
m_PendingBytes = 0;
|
||
|
|
}
|
||
|
|
}
|