You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

726 lines
21 KiB

// Copyright 2014 PDFium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
#include "xfa/fxfa/parser/cxfa_localevalue.h"
#include <cwchar>
#include <utility>
#include <vector>
#include "core/fxcrt/fx_extension.h"
#include "third_party/base/ptr_util.h"
#include "third_party/base/span.h"
#include "third_party/base/stl_util.h"
#include "xfa/fgas/crt/cfgas_stringformatter.h"
#include "xfa/fxfa/parser/cxfa_document.h"
#include "xfa/fxfa/parser/cxfa_localemgr.h"
#include "xfa/fxfa/parser/xfa_utils.h"
namespace {
// Resolves the locale category to use for a value. A category other than
// FX_LOCALECATEGORY_Unknown is returned unchanged; otherwise the category is
// derived from the XFA_VT_* value type. Value types without a mapping yield
// FX_LOCALECATEGORY_Unknown.
FX_LOCALECATEGORY ValueCategory(FX_LOCALECATEGORY eCategory,
                                uint32_t dwValueType) {
  if (eCategory == FX_LOCALECATEGORY_Unknown) {
    switch (dwValueType) {
      case XFA_VT_DATETIME:
        eCategory = FX_LOCALECATEGORY_DateTime;
        break;
      case XFA_VT_TIME:
        eCategory = FX_LOCALECATEGORY_Time;
        break;
      case XFA_VT_DATE:
        eCategory = FX_LOCALECATEGORY_Date;
        break;
      case XFA_VT_TEXT:
        eCategory = FX_LOCALECATEGORY_Text;
        break;
      case XFA_VT_BOOLEAN:
      case XFA_VT_INTEGER:
      case XFA_VT_DECIMAL:
      case XFA_VT_FLOAT:
        // All numeric-like value types share the numeric category.
        eCategory = FX_LOCALECATEGORY_Num;
        break;
      default:
        break;
    }
  }
  return eCategory;
}
// Splits |wsDateTime| into a date part and a time part. The separator is the
// first 'T' in the string or, when there is no 'T', the first space. Both
// outputs are cleared up front, so they are empty whenever this returns
// false (empty input or no separator found). The separator itself is not
// copied into either output.
bool ValueSplitDateTime(const WideString& wsDateTime,
                        WideString& wsDate,
                        WideString& wsTime) {
  wsDate.clear();
  wsTime.clear();
  if (wsDateTime.IsEmpty())
    return false;

  auto separator = wsDateTime.Find('T');
  if (!separator.has_value()) {
    separator = wsDateTime.Find(' ');
    if (!separator.has_value())
      return false;
  }

  const auto nDateLength = separator.value();
  wsDate = wsDateTime.First(nDateLength);
  // Everything after the separator character belongs to the time part.
  wsTime = wsDateTime.Last(wsDateTime.GetLength() - nDateLength - 1);
  return true;
}
// Installs |pNewLocale| as the locale manager's default locale for the
// lifetime of this object and puts the previous default back on destruction.
// When |pNewLocale| is null the object does nothing at all: the manager is
// neither queried nor modified.
class ScopedLocale {
 public:
  ScopedLocale(CXFA_LocaleMgr* pLocaleMgr, LocaleIface* pNewLocale)
      : m_pLocaleMgr(pLocaleMgr),
        m_pNewLocale(pNewLocale),
        m_pOrigLocale(pNewLocale ? pLocaleMgr->GetDefLocale() : nullptr) {
    if (!m_pNewLocale)
      return;
    m_pLocaleMgr->SetDefLocale(m_pNewLocale);
  }

  ScopedLocale(const ScopedLocale& that) = delete;
  ScopedLocale& operator=(const ScopedLocale& that) = delete;

  ~ScopedLocale() {
    if (!m_pNewLocale)
      return;
    m_pLocaleMgr->SetDefLocale(m_pOrigLocale);
  }

 private:
  UnownedPtr<CXFA_LocaleMgr> const m_pLocaleMgr;
  LocaleIface* const m_pNewLocale;   // Null means "leave the default alone".
  LocaleIface* const m_pOrigLocale;  // Default captured at construction.
};
} // namespace
// Default construction; member values come from whatever defaults the class
// declaration provides.
CXFA_LocaleValue::CXFA_LocaleValue() = default;
// Creates a value of type |dwType| with no stored text. The value is
// considered valid for every type except XFA_VT_NULL.
CXFA_LocaleValue::CXFA_LocaleValue(uint32_t dwType, CXFA_LocaleMgr* pLocaleMgr)
: m_pLocaleMgr(pLocaleMgr),
m_dwType(dwType),
m_bValid(m_dwType != XFA_VT_NULL) {}
// Creates a value from text that is expected to be in canonical form. The
// text is stored as-is; validity is the result of ValidateCanonicalValue().
CXFA_LocaleValue::CXFA_LocaleValue(uint32_t dwType,
const WideString& wsValue,
CXFA_LocaleMgr* pLocaleMgr)
: m_pLocaleMgr(pLocaleMgr),
m_wsValue(wsValue),
m_dwType(dwType),
m_bValid(ValidateCanonicalValue(wsValue, dwType)) {}
// Creates a value by parsing |wsValue| against the picture clause(s) in
// |wsFormat|. ParsePatternValue() fills in m_wsValue (and may change
// m_dwType) as a side effect of computing m_bValid.
// NOTE(review): this relies on m_pLocaleMgr, m_wsValue and m_dwType being
// declared before m_bValid in the class so they are initialized before
// ParsePatternValue() runs - confirm against the header.
CXFA_LocaleValue::CXFA_LocaleValue(uint32_t dwType,
const WideString& wsValue,
const WideString& wsFormat,
LocaleIface* pLocale,
CXFA_LocaleMgr* pLocaleMgr)
: m_pLocaleMgr(pLocaleMgr),
m_dwType(dwType),
m_bValid(ParsePatternValue(wsValue, wsFormat, pLocale)) {}
// Copying, assignment and destruction are member-wise.
CXFA_LocaleValue::CXFA_LocaleValue(const CXFA_LocaleValue& that) = default;
CXFA_LocaleValue& CXFA_LocaleValue::operator=(const CXFA_LocaleValue& that) =
default;
CXFA_LocaleValue::~CXFA_LocaleValue() = default;
bool CXFA_LocaleValue::ValidateValue(const WideString& wsValue,
const WideString& wsPattern,
LocaleIface* pLocale,
WideString* pMatchFormat) {
if (!m_pLocaleMgr)
return false;
ScopedLocale scoped_locale(m_pLocaleMgr.Get(), pLocale);
std::vector<WideString> wsPatterns =
CFGAS_StringFormatter::SplitOnBars(wsPattern);
WideString wsOutput;
bool bRet = false;
size_t i = 0;
for (; !bRet && i < wsPatterns.size(); i++) {
const WideString& wsFormat = wsPatterns[i];
auto pFormat =
pdfium::MakeUnique<CFGAS_StringFormatter>(m_pLocaleMgr.Get(), wsFormat);
switch (ValueCategory(pFormat->GetCategory(), m_dwType)) {
case FX_LOCALECATEGORY_Null:
bRet = pFormat->ParseNull(wsValue);
if (!bRet)
bRet = wsValue.IsEmpty();
break;
case FX_LOCALECATEGORY_Zero:
bRet = pFormat->ParseZero(wsValue);
if (!bRet)
bRet = wsValue.EqualsASCII("0");
break;
case FX_LOCALECATEGORY_Num: {
WideString fNum;
bRet = pFormat->ParseNum(wsValue, &fNum);
if (!bRet)
bRet = pFormat->FormatNum(wsValue, &wsOutput);
break;
}
case FX_LOCALECATEGORY_Text:
bRet = pFormat->ParseText(wsValue, &wsOutput);
wsOutput.clear();
if (!bRet)
bRet = pFormat->FormatText(wsValue, &wsOutput);
break;
case FX_LOCALECATEGORY_Date: {
CFX_DateTime dt;
bRet = ValidateCanonicalDate(wsValue, &dt);
if (!bRet) {
bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Date, &dt);
if (!bRet) {
bRet = pFormat->FormatDateTime(wsValue, FX_DATETIMETYPE_Date,
&wsOutput);
}
}
break;
}
case FX_LOCALECATEGORY_Time: {
CFX_DateTime dt;
bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Time, &dt);
if (!bRet) {
bRet =
pFormat->FormatDateTime(wsValue, FX_DATETIMETYPE_Time, &wsOutput);
}
break;
}
case FX_LOCALECATEGORY_DateTime: {
CFX_DateTime dt;
bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_DateTime, &dt);
if (!bRet) {
bRet = pFormat->FormatDateTime(wsValue, FX_DATETIMETYPE_DateTime,
&wsOutput);
}
break;
}
default:
bRet = false;
break;
}
}
if (bRet && pMatchFormat)
*pMatchFormat = wsPatterns[i - 1];
return bRet;
}
// Returns the stored text converted with wcstod() when this value is valid
// and has one of the numeric-like types (boolean, integer, decimal, float).
// Returns 0 in every other case.
double CXFA_LocaleValue::GetDoubleNum() const {
  const bool bNumericType =
      m_dwType == XFA_VT_BOOLEAN || m_dwType == XFA_VT_INTEGER ||
      m_dwType == XFA_VT_DECIMAL || m_dwType == XFA_VT_FLOAT;
  if (m_bValid && bNumericType)
    return wcstod(m_wsValue.c_str(), nullptr);
  return 0;
}
// Returns the stored canonical date as a CFX_DateTime. A value-initialized
// CFX_DateTime is returned when this value is invalid or is not of type
// XFA_VT_DATE. The result of FX_DateFromCanonical() is not checked.
CFX_DateTime CXFA_LocaleValue::GetDate() const {
  const bool bHasDate = m_bValid && m_dwType == XFA_VT_DATE;
  if (bHasDate) {
    CFX_DateTime parsed;
    FX_DateFromCanonical(m_wsValue.span(), &parsed);
    return parsed;
  }
  return CFX_DateTime();
}
// Returns the stored canonical time as a CFX_DateTime, interpreted with the
// locale manager's current default locale. A value-initialized CFX_DateTime
// is returned when this value is invalid or is not of type XFA_VT_TIME. The
// result of FX_TimeFromCanonical() is not checked.
// NOTE(review): m_pLocaleMgr is dereferenced without a null check here,
// unlike the formatting/validation methods - confirm callers guarantee it.
CFX_DateTime CXFA_LocaleValue::GetTime() const {
  const bool bHasTime = m_bValid && m_dwType == XFA_VT_TIME;
  if (bHasTime) {
    CFX_DateTime parsed;
    FX_TimeFromCanonical(m_pLocaleMgr->GetDefLocale(), m_wsValue.span(),
                         &parsed);
    return parsed;
  }
  return CFX_DateTime();
}
bool CXFA_LocaleValue::SetDate(const CFX_DateTime& d) {
m_dwType = XFA_VT_DATE;
m_wsValue = WideString::Format(L"%04d-%02d-%02d", d.GetYear(), d.GetMonth(),
d.GetDay());
return true;
}
// Turns this value into an XFA_VT_TIME holding |t| rendered as HH:MM:SS,
// followed by ".FFF" when the millisecond component is non-zero. Only the
// type and the text are updated. Always returns true.
bool CXFA_LocaleValue::SetTime(const CFX_DateTime& t) {
  m_dwType = XFA_VT_TIME;
  m_wsValue = WideString::Format(L"%02d:%02d:%02d", t.GetHour(), t.GetMinute(),
                                 t.GetSecond());
  // The fraction is introduced by '.', which is what ValidateCanonicalTime()
  // looks for. The previous "%:03d" was not a valid conversion specification,
  // so the milliseconds were never formatted correctly.
  if (t.GetMillisecond() > 0)
    m_wsValue += WideString::Format(L".%03d", t.GetMillisecond());
  return true;
}
// Turns this value into an XFA_VT_DATETIME holding |dt| rendered as
// YYYY-MM-DDTHH:MM:SS, followed by ".FFF" when the millisecond component is
// non-zero. Only the type and the text are updated. Always returns true.
bool CXFA_LocaleValue::SetDateTime(const CFX_DateTime& dt) {
  m_dwType = XFA_VT_DATETIME;
  m_wsValue = WideString::Format(L"%04d-%02d-%02dT%02d:%02d:%02d", dt.GetYear(),
                                 dt.GetMonth(), dt.GetDay(), dt.GetHour(),
                                 dt.GetMinute(), dt.GetSecond());
  // The fraction is introduced by '.', which is what ValidateCanonicalTime()
  // looks for. The previous "%:03d" was not a valid conversion specification,
  // so the milliseconds were never formatted correctly.
  if (dt.GetMillisecond() > 0)
    m_wsValue += WideString::Format(L".%03d", dt.GetMillisecond());
  return true;
}
// Formats this value with the first pattern in |wsFormat| (split with
// SplitOnBars()) that FormatSinglePattern() accepts, writing the text to
// |wsResult|. Returns false when no pattern succeeds; |wsResult| then holds
// whatever the last attempt left in it, or is empty if there were no
// patterns.
bool CXFA_LocaleValue::FormatPatterns(WideString& wsResult,
                                      const WideString& wsFormat,
                                      LocaleIface* pLocale,
                                      XFA_VALUEPICTURE eValueType) const {
  wsResult.clear();
  const std::vector<WideString> patterns =
      CFGAS_StringFormatter::SplitOnBars(wsFormat);
  for (size_t i = 0; i < patterns.size(); ++i) {
    if (FormatSinglePattern(wsResult, patterns[i], pLocale, eValueType))
      return true;
  }
  return false;
}
// Formats this value with the single pattern |wsFormat| and stores the text
// in |wsResult|. |pLocale|, when non-null, is installed as the default locale
// for the duration of the call.
//
// Returns true when the formatter produced output, or when the pattern's
// category is not one handled here (the raw value is then passed through).
// On failure |wsResult| is set to the raw value, except for a numeric
// pattern formatted for display, where it is left as the formatter left it.
// Returns false without touching |wsResult| if there is no locale manager.
bool CXFA_LocaleValue::FormatSinglePattern(WideString& wsResult,
                                           const WideString& wsFormat,
                                           LocaleIface* pLocale,
                                           XFA_VALUEPICTURE eValueType) const {
  if (!m_pLocaleMgr)
    return false;

  ScopedLocale scoped_locale(m_pLocaleMgr.Get(), pLocale);
  wsResult.clear();

  auto pFormatter =
      pdfium::MakeUnique<CFGAS_StringFormatter>(m_pLocaleMgr.Get(), wsFormat);
  const FX_LOCALECATEGORY eCategory =
      ValueCategory(pFormatter->GetCategory(), m_dwType);

  bool bFormatted = false;
  switch (eCategory) {
    case FX_LOCALECATEGORY_Null:
      // A null pattern only applies to an empty value.
      bFormatted = m_wsValue.IsEmpty() && pFormatter->FormatNull(&wsResult);
      break;
    case FX_LOCALECATEGORY_Zero:
      // A zero pattern only applies to the literal "0".
      bFormatted =
          m_wsValue.EqualsASCII("0") && pFormatter->FormatZero(&wsResult);
      break;
    case FX_LOCALECATEGORY_Num:
      bFormatted = pFormatter->FormatNum(m_wsValue, &wsResult);
      break;
    case FX_LOCALECATEGORY_Text:
      bFormatted = pFormatter->FormatText(m_wsValue, &wsResult);
      break;
    case FX_LOCALECATEGORY_Date:
      bFormatted =
          pFormatter->FormatDateTime(m_wsValue, FX_DATETIMETYPE_Date, &wsResult);
      break;
    case FX_LOCALECATEGORY_Time:
      bFormatted =
          pFormatter->FormatDateTime(m_wsValue, FX_DATETIMETYPE_Time, &wsResult);
      break;
    case FX_LOCALECATEGORY_DateTime:
      bFormatted = pFormatter->FormatDateTime(
          m_wsValue, FX_DATETIMETYPE_DateTime, &wsResult);
      break;
    default:
      wsResult = m_wsValue;
      return true;
  }
  if (bFormatted)
    return true;

  const bool bNumericDisplay = eCategory == FX_LOCALECATEGORY_Num &&
                               eValueType == XFA_VALUEPICTURE_Display;
  if (!bNumericDisplay)
    wsResult = m_wsValue;
  return false;
}
bool CXFA_LocaleValue::ValidateCanonicalValue(const WideString& wsValue,
uint32_t dwVType) {
if (wsValue.IsEmpty())
return true;
CFX_DateTime dt;
switch (dwVType) {
case XFA_VT_DATE: {
if (ValidateCanonicalDate(wsValue, &dt))
return true;
WideString wsDate;
WideString wsTime;
if (ValueSplitDateTime(wsValue, wsDate, wsTime) &&
ValidateCanonicalDate(wsDate, &dt)) {
return true;
}
return false;
}
case XFA_VT_TIME: {
if (ValidateCanonicalTime(wsValue))
return true;
WideString wsDate;
WideString wsTime;
if (ValueSplitDateTime(wsValue, wsDate, wsTime) &&
ValidateCanonicalTime(wsTime)) {
return true;
}
return false;
}
case XFA_VT_DATETIME: {
WideString wsDate, wsTime;
if (ValueSplitDateTime(wsValue, wsDate, wsTime) &&
ValidateCanonicalDate(wsDate, &dt) && ValidateCanonicalTime(wsTime)) {
return true;
}
} break;
}
return true;
}
// Validates a canonical date string: four year digits, then up to two month
// digits, then up to two day digits. If the string contains a '-' anywhere,
// a '-' is required after the year and again after the month.
//
// On success with a full year/month/day the date is written to |unDate|.
// Two shorter forms are also accepted, but leave |unDate| untouched: a
// 4-character year on its own, and a 6-character year+month without dashes.
// Years outside 1900..2029 are rejected.
bool CXFA_LocaleValue::ValidateCanonicalDate(const WideString& wsDate,
CFX_DateTime* unDate) {
// Days per month for a non-leap year; February is checked separately below.
static const uint8_t LastDay[12] = {31, 28, 31, 30, 31, 30,
31, 31, 30, 31, 30, 31};
// Maximum digit counts of the year, month and day fields.
static const uint16_t wCountY = 4;
static const uint16_t wCountM = 2;
static const uint16_t wCountD = 2;
pdfium::span<const wchar_t> spDate = wsDate.span();
// Length must be between 4 ("YYYY") and 10 ("YYYY-MM-DD") characters.
if (spDate.size() < wCountY ||
spDate.size() > wCountY + wCountM + wCountD + 2) {
return false;
}
// 0x2D is '-': its presence anywhere makes the separators mandatory.
const bool bSymbol = wsDate.Contains(0x2D);
uint16_t wYear = 0;
uint16_t wMonth = 0;
uint16_t wDay = 0;
size_t nIndex = 0;
size_t nStart = 0;
// Year: the size check above guarantees indices 0..3 are in range.
while (nIndex < wCountY && spDate[nIndex] != '\0') {
if (!FXSYS_IsDecimalDigit(spDate[nIndex]))
return false;
wYear = (spDate[nIndex] - '0') + wYear * 10;
nIndex++;
}
if (bSymbol) {
if (nIndex >= spDate.size() || spDate[nIndex] != 0x2D)
return false;
nIndex++;
}
// Month: at most wCountM digits.
nStart = nIndex;
while (nIndex < spDate.size() && spDate[nIndex] != '\0' &&
nIndex - nStart < wCountM) {
if (!FXSYS_IsDecimalDigit(spDate[nIndex]))
return false;
wMonth = (spDate[nIndex] - '0') + wMonth * 10;
nIndex++;
}
if (bSymbol) {
if (nIndex >= spDate.size() || spDate[nIndex] != 0x2D)
return false;
nIndex++;
}
// Day: at most wCountD digits.
nStart = nIndex;
while (nIndex < spDate.size() && spDate[nIndex] != '\0' &&
nIndex - nStart < wCountD) {
if (!FXSYS_IsDecimalDigit(spDate[nIndex]))
return false;
wDay = (spDate[nIndex] - '0') + wDay * 10;
nIndex++;
}
// Anything left over after the day field is an error.
if (nIndex != spDate.size())
return false;
if (wYear < 1900 || wYear > 2029)
return false;
// A missing month is only acceptable when the input was just the year.
if (wMonth < 1 || wMonth > 12)
return wMonth == 0 && spDate.size() == wCountY;
// A missing day is only acceptable for a 6-character year+month input.
if (wDay < 1)
return wDay == 0 && spDate.size() == wCountY + wCountM;
if (wMonth == 2) {
// Gregorian leap-year rule decides between 28 and 29 days.
if (wYear % 400 == 0 || (wYear % 100 != 0 && wYear % 4 == 0)) {
if (wDay > 29)
return false;
} else if (wDay > 28) {
return false;
}
} else if (wDay > LastDay[wMonth - 1]) {
return false;
}
unDate->SetDate(wYear, static_cast<uint8_t>(wMonth),
static_cast<uint8_t>(wDay));
return true;
}
// Validates a canonical time string: hour digits, then optional minute and
// second digits (up to two each), an optional '.' followed by up to three
// fraction digits, and an optional time zone that is either 'Z' or a '+'/'-'
// offset of hours and minutes. If the string contains a ':' anywhere, ':' is
// required between the hour/minute/second fields and inside the offset.
//
// Returns true only if the whole string is consumed and hour < 24,
// minute < 60, second < 60, fraction <= 999, offset hours <= 12 and offset
// minutes < 60. Nothing is returned to the caller besides the verdict.
bool CXFA_LocaleValue::ValidateCanonicalTime(const WideString& wsTime) {
pdfium::span<const wchar_t> spTime = wsTime.span();
// At least two characters are needed for the hour field.
if (spTime.size() < 2)
return false;
// Maximum digit counts of the hour, minute, second and fraction fields.
const uint16_t wCountH = 2;
const uint16_t wCountM = 2;
const uint16_t wCountS = 2;
const uint16_t wCountF = 3;
const bool bSymbol = wsTime.Contains(':');
uint16_t wHour = 0;
uint16_t wMinute = 0;
uint16_t wSecond = 0;
uint16_t wFraction = 0;
size_t nIndex = 0;
size_t nStart = 0;
// Hour: the size check above guarantees indices 0..1 are in range.
while (nIndex - nStart < wCountH && spTime[nIndex]) {
if (!FXSYS_IsDecimalDigit(spTime[nIndex]))
return false;
wHour = spTime[nIndex] - '0' + wHour * 10;
nIndex++;
}
if (bSymbol) {
// NOTE(review): this separator check is written differently from the later
// ones (`<`/`&&` here versus `>=`/`||` below) - confirm that is intended.
if (nIndex < spTime.size() && spTime[nIndex] != ':')
return false;
nIndex++;
}
// Minute.
nStart = nIndex;
while (nIndex < spTime.size() && spTime[nIndex] != '\0' &&
nIndex - nStart < wCountM) {
if (!FXSYS_IsDecimalDigit(spTime[nIndex]))
return false;
wMinute = spTime[nIndex] - '0' + wMinute * 10;
nIndex++;
}
if (bSymbol) {
if (nIndex >= spTime.size() || spTime[nIndex] != ':')
return false;
nIndex++;
}
// Second.
nStart = nIndex;
while (nIndex < spTime.size() && spTime[nIndex] != '\0' &&
nIndex - nStart < wCountS) {
if (!FXSYS_IsDecimalDigit(spTime[nIndex]))
return false;
wSecond = spTime[nIndex] - '0' + wSecond * 10;
nIndex++;
}
// Fraction: if the string has a '.' that is not its first character, the
// '.' must appear exactly here, directly after the seconds.
auto pos = wsTime.Find('.');
if (pos.has_value() && pos.value() != 0) {
if (nIndex >= spTime.size() || spTime[nIndex] != '.')
return false;
nIndex++;
nStart = nIndex;
while (nIndex < spTime.size() && spTime[nIndex] != '\0' &&
nIndex - nStart < wCountF) {
if (!FXSYS_IsDecimalDigit(spTime[nIndex]))
return false;
wFraction = spTime[nIndex] - '0' + wFraction * 10;
nIndex++;
}
}
// Optional time zone designator.
if (nIndex < spTime.size()) {
if (spTime[nIndex] == 'Z') {
nIndex++;
} else if (spTime[nIndex] == '-' || spTime[nIndex] == '+') {
// The offset is only range-checked; its value is not used otherwise.
int16_t nOffsetH = 0;
int16_t nOffsetM = 0;
nIndex++;
nStart = nIndex;
while (nIndex < spTime.size() && spTime[nIndex] != '\0' &&
nIndex - nStart < wCountH) {
if (!FXSYS_IsDecimalDigit(spTime[nIndex]))
return false;
nOffsetH = spTime[nIndex] - '0' + nOffsetH * 10;
nIndex++;
}
if (bSymbol) {
if (nIndex >= spTime.size() || spTime[nIndex] != ':')
return false;
nIndex++;
}
nStart = nIndex;
while (nIndex < spTime.size() && spTime[nIndex] != '\0' &&
nIndex - nStart < wCountM) {
if (!FXSYS_IsDecimalDigit(spTime[nIndex]))
return false;
nOffsetM = spTime[nIndex] - '0' + nOffsetM * 10;
nIndex++;
}
if (nOffsetH > 12 || nOffsetM >= 60)
return false;
}
}
// Every character must have been consumed and every field must be in range.
return nIndex == spTime.size() && wHour < 24 && wMinute < 60 &&
wSecond < 60 && wFraction <= 999;
}
bool CXFA_LocaleValue::ParsePatternValue(const WideString& wsValue,
const WideString& wsPattern,
LocaleIface* pLocale) {
if (!m_pLocaleMgr)
return false;
std::vector<WideString> wsPatterns =
CFGAS_StringFormatter::SplitOnBars(wsPattern);
ScopedLocale scoped_locale(m_pLocaleMgr.Get(), pLocale);
bool bRet = false;
for (size_t i = 0; !bRet && i < wsPatterns.size(); i++) {
const WideString& wsFormat = wsPatterns[i];
auto pFormat =
pdfium::MakeUnique<CFGAS_StringFormatter>(m_pLocaleMgr.Get(), wsFormat);
switch (ValueCategory(pFormat->GetCategory(), m_dwType)) {
case FX_LOCALECATEGORY_Null:
bRet = pFormat->ParseNull(wsValue);
if (bRet)
m_wsValue.clear();
break;
case FX_LOCALECATEGORY_Zero:
bRet = pFormat->ParseZero(wsValue);
if (bRet)
m_wsValue = L"0";
break;
case FX_LOCALECATEGORY_Num: {
WideString fNum;
bRet = pFormat->ParseNum(wsValue, &fNum);
if (bRet)
m_wsValue = std::move(fNum);
break;
}
case FX_LOCALECATEGORY_Text:
bRet = pFormat->ParseText(wsValue, &m_wsValue);
break;
case FX_LOCALECATEGORY_Date: {
CFX_DateTime dt;
bRet = ValidateCanonicalDate(wsValue, &dt);
if (!bRet) {
bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Date, &dt);
}
if (bRet)
SetDate(dt);
break;
}
case FX_LOCALECATEGORY_Time: {
CFX_DateTime dt;
bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Time, &dt);
if (bRet)
SetTime(dt);
break;
}
case FX_LOCALECATEGORY_DateTime: {
CFX_DateTime dt;
bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_DateTime, &dt);
if (bRet)
SetDateTime(dt);
break;
}
default:
m_wsValue = wsValue;
bRet = true;
break;
}
}
if (!bRet)
m_wsValue = wsValue;
return bRet;
}
// Builds a numeric template string into |wsFormat|, which must be empty on
// entry. The template is 's', then the integer digits, then (unless
// |nDecLen| is 0) a '.' followed by the fractional digits. A digit count of
// N >= 0 is written as N 'z' characters; a count of -1 is written as "z*".
void CXFA_LocaleValue::GetNumericFormat(WideString& wsFormat,
                                        int32_t nIntLen,
                                        int32_t nDecLen) {
  ASSERT(wsFormat.IsEmpty());
  ASSERT(nIntLen >= -1);
  ASSERT(nDecLen >= -1);

  // "z*" occupies two characters, hence the 2 for a count of -1.
  const int32_t nIntChars = nIntLen >= 0 ? nIntLen : 2;
  const int32_t nDecChars = nDecLen >= 0 ? nDecLen : 2;
  const int32_t nDotChars = nDecLen == 0 ? 0 : 1;
  const int32_t nTotalLen = nIntChars + 1 + nDecChars + nDotChars;
  {
    // The span must go out of scope before ReleaseBuffer() is called.
    pdfium::span<wchar_t> buffer = wsFormat.GetBuffer(nTotalLen);
    int32_t nWritten = 0;

    // Writes the placeholder run for one digit group.
    auto put_digits = [&buffer, &nWritten](int32_t nCount) {
      if (nCount == -1) {
        buffer[nWritten++] = L'z';
        buffer[nWritten++] = L'*';
        return;
      }
      for (; nCount; --nCount)
        buffer[nWritten++] = L'z';
    };

    buffer[nWritten++] = L's';
    put_digits(nIntLen);
    if (nDecLen != 0)
      buffer[nWritten++] = L'.';
    put_digits(nDecLen);
  }
  wsFormat.ReleaseBuffer(nTotalLen);
}
// Checks the numeric text |wsNumeric| against the template |wsFormat|.
// In the template, a leading 's' allows an optional '+'/'-' sign, each 'z'
// allows one digit, '*' allows any number of further digits, and '.' marks
// the decimal point. In |wsNumeric| the decimal point may be either '.' or
// the decimal symbol of |pLocale| (when |pLocale| is non-null).
//
// Returns true if either string is empty, or if the whole of |wsNumeric| is
// consumed without exceeding the digit counts the template allows. Returns
// false otherwise, including when |wsNumeric| has a fractional part but the
// template has no '.'.
bool CXFA_LocaleValue::ValidateNumericTemp(const WideString& wsNumeric,
                                           const WideString& wsFormat,
                                           LocaleIface* pLocale) {
  if (wsFormat.IsEmpty() || wsNumeric.IsEmpty())
    return true;

  pdfium::span<const wchar_t> spNum = wsNumeric.span();
  pdfium::span<const wchar_t> spFmt = wsFormat.span();
  int32_t n = 0;   // Read position in |wsNumeric|.
  int32_t nf = 0;  // Read position in |wsFormat|.
  wchar_t c = spNum[n];
  wchar_t cf = spFmt[nf];
  if (cf == L's') {
    if (c == L'-' || c == L'+')
      ++n;
    ++nf;
  }

  // Integer part. |bLimit| stays true while each digit must be matched by
  // its own 'z'; a '*' lifts the limit for the remaining digits.
  bool bLimit = true;
  int32_t nCount = wsNumeric.GetLength();
  int32_t nCountFmt = wsFormat.GetLength();
  while (n < nCount && (!bLimit || nf < nCountFmt) &&
         FXSYS_IsDecimalDigit(c = spNum[n])) {
    if (bLimit) {
      if ((cf = spFmt[nf]) == L'*')
        bLimit = false;
      else if (cf == L'z')
        nf++;
      else
        return false;
    }
    n++;
  }
  if (n == nCount)
    return true;
  if (nf == nCountFmt)
    return false;

  // Skip the integer placeholders the number did not use.
  while (nf < nCountFmt && (cf = spFmt[nf]) != L'.') {
    ASSERT(cf == L'z' || cf == L'*');
    ++nf;
  }

  WideString wsDecimalSymbol;
  if (pLocale)
    wsDecimalSymbol = pLocale->GetDecimalSymbol();
  else
    wsDecimalSymbol = WideString(L'.');

  // The skip loop above can run off the end of a template that has no '.'.
  // Check the bound before indexing so the span is never read out of range.
  if (nf >= nCountFmt || spFmt[nf] != L'.')
    return false;
  if (wsDecimalSymbol != WideStringView(c) && c != L'.')
    return false;

  // Fractional part, using the same 'z' / '*' rules as the integer part.
  ++nf;
  ++n;
  bLimit = true;
  while (n < nCount && (!bLimit || nf < nCountFmt) &&
         FXSYS_IsDecimalDigit(spNum[n])) {
    if (bLimit) {
      if ((cf = spFmt[nf]) == L'*')
        bLimit = false;
      else if (cf == L'z')
        nf++;
      else
        return false;
    }
    n++;
  }
  return n == nCount;
}