// Copyright 2014 PDFium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com #include "xfa/fxfa/parser/cxfa_localevalue.h" #include #include #include #include "core/fxcrt/fx_extension.h" #include "third_party/base/ptr_util.h" #include "third_party/base/span.h" #include "third_party/base/stl_util.h" #include "xfa/fgas/crt/cfgas_stringformatter.h" #include "xfa/fxfa/parser/cxfa_document.h" #include "xfa/fxfa/parser/cxfa_localemgr.h" #include "xfa/fxfa/parser/xfa_utils.h" namespace { FX_LOCALECATEGORY ValueCategory(FX_LOCALECATEGORY eCategory, uint32_t dwValueType) { if (eCategory != FX_LOCALECATEGORY_Unknown) return eCategory; switch (dwValueType) { case XFA_VT_BOOLEAN: case XFA_VT_INTEGER: case XFA_VT_DECIMAL: case XFA_VT_FLOAT: return FX_LOCALECATEGORY_Num; case XFA_VT_TEXT: return FX_LOCALECATEGORY_Text; case XFA_VT_DATE: return FX_LOCALECATEGORY_Date; case XFA_VT_TIME: return FX_LOCALECATEGORY_Time; case XFA_VT_DATETIME: return FX_LOCALECATEGORY_DateTime; } return FX_LOCALECATEGORY_Unknown; } bool ValueSplitDateTime(const WideString& wsDateTime, WideString& wsDate, WideString& wsTime) { wsDate.clear(); wsTime.clear(); if (wsDateTime.IsEmpty()) return false; auto nSplitIndex = wsDateTime.Find('T'); if (!nSplitIndex.has_value()) nSplitIndex = wsDateTime.Find(' '); if (!nSplitIndex.has_value()) return false; wsDate = wsDateTime.First(nSplitIndex.value()); wsTime = wsDateTime.Last(wsDateTime.GetLength() - nSplitIndex.value() - 1); return true; } class ScopedLocale { public: ScopedLocale(CXFA_LocaleMgr* pLocaleMgr, LocaleIface* pNewLocale) : m_pLocaleMgr(pLocaleMgr), m_pNewLocale(pNewLocale), m_pOrigLocale(pNewLocale ? m_pLocaleMgr->GetDefLocale() : nullptr) { if (m_pNewLocale) m_pLocaleMgr->SetDefLocale(pNewLocale); } ~ScopedLocale() { if (m_pNewLocale) m_pLocaleMgr->SetDefLocale(m_pOrigLocale); } ScopedLocale(const ScopedLocale& that) = delete; ScopedLocale& operator=(const ScopedLocale& that) = delete; private: UnownedPtr const m_pLocaleMgr; LocaleIface* const m_pNewLocale; LocaleIface* const m_pOrigLocale; }; } // namespace CXFA_LocaleValue::CXFA_LocaleValue() = default; CXFA_LocaleValue::CXFA_LocaleValue(uint32_t dwType, CXFA_LocaleMgr* pLocaleMgr) : m_pLocaleMgr(pLocaleMgr), m_dwType(dwType), m_bValid(m_dwType != XFA_VT_NULL) {} CXFA_LocaleValue::CXFA_LocaleValue(uint32_t dwType, const WideString& wsValue, CXFA_LocaleMgr* pLocaleMgr) : m_pLocaleMgr(pLocaleMgr), m_wsValue(wsValue), m_dwType(dwType), m_bValid(ValidateCanonicalValue(wsValue, dwType)) {} CXFA_LocaleValue::CXFA_LocaleValue(uint32_t dwType, const WideString& wsValue, const WideString& wsFormat, LocaleIface* pLocale, CXFA_LocaleMgr* pLocaleMgr) : m_pLocaleMgr(pLocaleMgr), m_dwType(dwType), m_bValid(ParsePatternValue(wsValue, wsFormat, pLocale)) {} CXFA_LocaleValue::CXFA_LocaleValue(const CXFA_LocaleValue& that) = default; CXFA_LocaleValue& CXFA_LocaleValue::operator=(const CXFA_LocaleValue& that) = default; CXFA_LocaleValue::~CXFA_LocaleValue() = default; bool CXFA_LocaleValue::ValidateValue(const WideString& wsValue, const WideString& wsPattern, LocaleIface* pLocale, WideString* pMatchFormat) { if (!m_pLocaleMgr) return false; ScopedLocale scoped_locale(m_pLocaleMgr.Get(), pLocale); std::vector wsPatterns = CFGAS_StringFormatter::SplitOnBars(wsPattern); WideString wsOutput; bool bRet = false; size_t i = 0; for (; !bRet && i < wsPatterns.size(); i++) { const WideString& wsFormat = wsPatterns[i]; auto pFormat = pdfium::MakeUnique(m_pLocaleMgr.Get(), wsFormat); switch (ValueCategory(pFormat->GetCategory(), m_dwType)) { case FX_LOCALECATEGORY_Null: bRet = pFormat->ParseNull(wsValue); if (!bRet) bRet = wsValue.IsEmpty(); break; case FX_LOCALECATEGORY_Zero: bRet = pFormat->ParseZero(wsValue); if (!bRet) bRet = wsValue.EqualsASCII("0"); break; case FX_LOCALECATEGORY_Num: { WideString fNum; bRet = pFormat->ParseNum(wsValue, &fNum); if (!bRet) bRet = pFormat->FormatNum(wsValue, &wsOutput); break; } case FX_LOCALECATEGORY_Text: bRet = pFormat->ParseText(wsValue, &wsOutput); wsOutput.clear(); if (!bRet) bRet = pFormat->FormatText(wsValue, &wsOutput); break; case FX_LOCALECATEGORY_Date: { CFX_DateTime dt; bRet = ValidateCanonicalDate(wsValue, &dt); if (!bRet) { bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Date, &dt); if (!bRet) { bRet = pFormat->FormatDateTime(wsValue, FX_DATETIMETYPE_Date, &wsOutput); } } break; } case FX_LOCALECATEGORY_Time: { CFX_DateTime dt; bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Time, &dt); if (!bRet) { bRet = pFormat->FormatDateTime(wsValue, FX_DATETIMETYPE_Time, &wsOutput); } break; } case FX_LOCALECATEGORY_DateTime: { CFX_DateTime dt; bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_DateTime, &dt); if (!bRet) { bRet = pFormat->FormatDateTime(wsValue, FX_DATETIMETYPE_DateTime, &wsOutput); } break; } default: bRet = false; break; } } if (bRet && pMatchFormat) *pMatchFormat = wsPatterns[i - 1]; return bRet; } double CXFA_LocaleValue::GetDoubleNum() const { if (!m_bValid || (m_dwType != XFA_VT_BOOLEAN && m_dwType != XFA_VT_INTEGER && m_dwType != XFA_VT_DECIMAL && m_dwType != XFA_VT_FLOAT)) { return 0; } return wcstod(m_wsValue.c_str(), nullptr); } CFX_DateTime CXFA_LocaleValue::GetDate() const { if (!m_bValid || m_dwType != XFA_VT_DATE) return CFX_DateTime(); CFX_DateTime dt; FX_DateFromCanonical(m_wsValue.span(), &dt); return dt; } CFX_DateTime CXFA_LocaleValue::GetTime() const { if (!m_bValid || m_dwType != XFA_VT_TIME) return CFX_DateTime(); CFX_DateTime dt; FX_TimeFromCanonical(m_pLocaleMgr->GetDefLocale(), m_wsValue.span(), &dt); return dt; } bool CXFA_LocaleValue::SetDate(const CFX_DateTime& d) { m_dwType = XFA_VT_DATE; m_wsValue = WideString::Format(L"%04d-%02d-%02d", d.GetYear(), d.GetMonth(), d.GetDay()); return true; } bool CXFA_LocaleValue::SetTime(const CFX_DateTime& t) { m_dwType = XFA_VT_TIME; m_wsValue = WideString::Format(L"%02d:%02d:%02d", t.GetHour(), t.GetMinute(), t.GetSecond()); if (t.GetMillisecond() > 0) m_wsValue += WideString::Format(L"%:03d", t.GetMillisecond()); return true; } bool CXFA_LocaleValue::SetDateTime(const CFX_DateTime& dt) { m_dwType = XFA_VT_DATETIME; m_wsValue = WideString::Format(L"%04d-%02d-%02dT%02d:%02d:%02d", dt.GetYear(), dt.GetMonth(), dt.GetDay(), dt.GetHour(), dt.GetMinute(), dt.GetSecond()); if (dt.GetMillisecond() > 0) m_wsValue += WideString::Format(L"%:03d", dt.GetMillisecond()); return true; } bool CXFA_LocaleValue::FormatPatterns(WideString& wsResult, const WideString& wsFormat, LocaleIface* pLocale, XFA_VALUEPICTURE eValueType) const { wsResult.clear(); for (const auto& pattern : CFGAS_StringFormatter::SplitOnBars(wsFormat)) { if (FormatSinglePattern(wsResult, pattern, pLocale, eValueType)) return true; } return false; } bool CXFA_LocaleValue::FormatSinglePattern(WideString& wsResult, const WideString& wsFormat, LocaleIface* pLocale, XFA_VALUEPICTURE eValueType) const { if (!m_pLocaleMgr) return false; ScopedLocale scoped_locale(m_pLocaleMgr.Get(), pLocale); wsResult.clear(); bool bRet = false; auto pFormat = pdfium::MakeUnique(m_pLocaleMgr.Get(), wsFormat); FX_LOCALECATEGORY eCategory = ValueCategory(pFormat->GetCategory(), m_dwType); switch (eCategory) { case FX_LOCALECATEGORY_Null: if (m_wsValue.IsEmpty()) bRet = pFormat->FormatNull(&wsResult); break; case FX_LOCALECATEGORY_Zero: if (m_wsValue.EqualsASCII("0")) bRet = pFormat->FormatZero(&wsResult); break; case FX_LOCALECATEGORY_Num: bRet = pFormat->FormatNum(m_wsValue, &wsResult); break; case FX_LOCALECATEGORY_Text: bRet = pFormat->FormatText(m_wsValue, &wsResult); break; case FX_LOCALECATEGORY_Date: bRet = pFormat->FormatDateTime(m_wsValue, FX_DATETIMETYPE_Date, &wsResult); break; case FX_LOCALECATEGORY_Time: bRet = pFormat->FormatDateTime(m_wsValue, FX_DATETIMETYPE_Time, &wsResult); break; case FX_LOCALECATEGORY_DateTime: bRet = pFormat->FormatDateTime(m_wsValue, FX_DATETIMETYPE_DateTime, &wsResult); break; default: wsResult = m_wsValue; bRet = true; } if (!bRet && (eCategory != FX_LOCALECATEGORY_Num || eValueType != XFA_VALUEPICTURE_Display)) { wsResult = m_wsValue; } return bRet; } bool CXFA_LocaleValue::ValidateCanonicalValue(const WideString& wsValue, uint32_t dwVType) { if (wsValue.IsEmpty()) return true; CFX_DateTime dt; switch (dwVType) { case XFA_VT_DATE: { if (ValidateCanonicalDate(wsValue, &dt)) return true; WideString wsDate; WideString wsTime; if (ValueSplitDateTime(wsValue, wsDate, wsTime) && ValidateCanonicalDate(wsDate, &dt)) { return true; } return false; } case XFA_VT_TIME: { if (ValidateCanonicalTime(wsValue)) return true; WideString wsDate; WideString wsTime; if (ValueSplitDateTime(wsValue, wsDate, wsTime) && ValidateCanonicalTime(wsTime)) { return true; } return false; } case XFA_VT_DATETIME: { WideString wsDate, wsTime; if (ValueSplitDateTime(wsValue, wsDate, wsTime) && ValidateCanonicalDate(wsDate, &dt) && ValidateCanonicalTime(wsTime)) { return true; } } break; } return true; } bool CXFA_LocaleValue::ValidateCanonicalDate(const WideString& wsDate, CFX_DateTime* unDate) { static const uint8_t LastDay[12] = {31, 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31}; static const uint16_t wCountY = 4; static const uint16_t wCountM = 2; static const uint16_t wCountD = 2; pdfium::span spDate = wsDate.span(); if (spDate.size() < wCountY || spDate.size() > wCountY + wCountM + wCountD + 2) { return false; } const bool bSymbol = wsDate.Contains(0x2D); uint16_t wYear = 0; uint16_t wMonth = 0; uint16_t wDay = 0; size_t nIndex = 0; size_t nStart = 0; while (nIndex < wCountY && spDate[nIndex] != '\0') { if (!FXSYS_IsDecimalDigit(spDate[nIndex])) return false; wYear = (spDate[nIndex] - '0') + wYear * 10; nIndex++; } if (bSymbol) { if (nIndex >= spDate.size() || spDate[nIndex] != 0x2D) return false; nIndex++; } nStart = nIndex; while (nIndex < spDate.size() && spDate[nIndex] != '\0' && nIndex - nStart < wCountM) { if (!FXSYS_IsDecimalDigit(spDate[nIndex])) return false; wMonth = (spDate[nIndex] - '0') + wMonth * 10; nIndex++; } if (bSymbol) { if (nIndex >= spDate.size() || spDate[nIndex] != 0x2D) return false; nIndex++; } nStart = nIndex; while (nIndex < spDate.size() && spDate[nIndex] != '\0' && nIndex - nStart < wCountD) { if (!FXSYS_IsDecimalDigit(spDate[nIndex])) return false; wDay = (spDate[nIndex] - '0') + wDay * 10; nIndex++; } if (nIndex != spDate.size()) return false; if (wYear < 1900 || wYear > 2029) return false; if (wMonth < 1 || wMonth > 12) return wMonth == 0 && spDate.size() == wCountY; if (wDay < 1) return wDay == 0 && spDate.size() == wCountY + wCountM; if (wMonth == 2) { if (wYear % 400 == 0 || (wYear % 100 != 0 && wYear % 4 == 0)) { if (wDay > 29) return false; } else if (wDay > 28) { return false; } } else if (wDay > LastDay[wMonth - 1]) { return false; } unDate->SetDate(wYear, static_cast(wMonth), static_cast(wDay)); return true; } bool CXFA_LocaleValue::ValidateCanonicalTime(const WideString& wsTime) { pdfium::span spTime = wsTime.span(); if (spTime.size() < 2) return false; const uint16_t wCountH = 2; const uint16_t wCountM = 2; const uint16_t wCountS = 2; const uint16_t wCountF = 3; const bool bSymbol = wsTime.Contains(':'); uint16_t wHour = 0; uint16_t wMinute = 0; uint16_t wSecond = 0; uint16_t wFraction = 0; size_t nIndex = 0; size_t nStart = 0; while (nIndex - nStart < wCountH && spTime[nIndex]) { if (!FXSYS_IsDecimalDigit(spTime[nIndex])) return false; wHour = spTime[nIndex] - '0' + wHour * 10; nIndex++; } if (bSymbol) { if (nIndex < spTime.size() && spTime[nIndex] != ':') return false; nIndex++; } nStart = nIndex; while (nIndex < spTime.size() && spTime[nIndex] != '\0' && nIndex - nStart < wCountM) { if (!FXSYS_IsDecimalDigit(spTime[nIndex])) return false; wMinute = spTime[nIndex] - '0' + wMinute * 10; nIndex++; } if (bSymbol) { if (nIndex >= spTime.size() || spTime[nIndex] != ':') return false; nIndex++; } nStart = nIndex; while (nIndex < spTime.size() && spTime[nIndex] != '\0' && nIndex - nStart < wCountS) { if (!FXSYS_IsDecimalDigit(spTime[nIndex])) return false; wSecond = spTime[nIndex] - '0' + wSecond * 10; nIndex++; } auto pos = wsTime.Find('.'); if (pos.has_value() && pos.value() != 0) { if (nIndex >= spTime.size() || spTime[nIndex] != '.') return false; nIndex++; nStart = nIndex; while (nIndex < spTime.size() && spTime[nIndex] != '\0' && nIndex - nStart < wCountF) { if (!FXSYS_IsDecimalDigit(spTime[nIndex])) return false; wFraction = spTime[nIndex] - '0' + wFraction * 10; nIndex++; } } if (nIndex < spTime.size()) { if (spTime[nIndex] == 'Z') { nIndex++; } else if (spTime[nIndex] == '-' || spTime[nIndex] == '+') { int16_t nOffsetH = 0; int16_t nOffsetM = 0; nIndex++; nStart = nIndex; while (nIndex < spTime.size() && spTime[nIndex] != '\0' && nIndex - nStart < wCountH) { if (!FXSYS_IsDecimalDigit(spTime[nIndex])) return false; nOffsetH = spTime[nIndex] - '0' + nOffsetH * 10; nIndex++; } if (bSymbol) { if (nIndex >= spTime.size() || spTime[nIndex] != ':') return false; nIndex++; } nStart = nIndex; while (nIndex < spTime.size() && spTime[nIndex] != '\0' && nIndex - nStart < wCountM) { if (!FXSYS_IsDecimalDigit(spTime[nIndex])) return false; nOffsetM = spTime[nIndex] - '0' + nOffsetM * 10; nIndex++; } if (nOffsetH > 12 || nOffsetM >= 60) return false; } } return nIndex == spTime.size() && wHour < 24 && wMinute < 60 && wSecond < 60 && wFraction <= 999; } bool CXFA_LocaleValue::ParsePatternValue(const WideString& wsValue, const WideString& wsPattern, LocaleIface* pLocale) { if (!m_pLocaleMgr) return false; std::vector wsPatterns = CFGAS_StringFormatter::SplitOnBars(wsPattern); ScopedLocale scoped_locale(m_pLocaleMgr.Get(), pLocale); bool bRet = false; for (size_t i = 0; !bRet && i < wsPatterns.size(); i++) { const WideString& wsFormat = wsPatterns[i]; auto pFormat = pdfium::MakeUnique(m_pLocaleMgr.Get(), wsFormat); switch (ValueCategory(pFormat->GetCategory(), m_dwType)) { case FX_LOCALECATEGORY_Null: bRet = pFormat->ParseNull(wsValue); if (bRet) m_wsValue.clear(); break; case FX_LOCALECATEGORY_Zero: bRet = pFormat->ParseZero(wsValue); if (bRet) m_wsValue = L"0"; break; case FX_LOCALECATEGORY_Num: { WideString fNum; bRet = pFormat->ParseNum(wsValue, &fNum); if (bRet) m_wsValue = std::move(fNum); break; } case FX_LOCALECATEGORY_Text: bRet = pFormat->ParseText(wsValue, &m_wsValue); break; case FX_LOCALECATEGORY_Date: { CFX_DateTime dt; bRet = ValidateCanonicalDate(wsValue, &dt); if (!bRet) { bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Date, &dt); } if (bRet) SetDate(dt); break; } case FX_LOCALECATEGORY_Time: { CFX_DateTime dt; bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_Time, &dt); if (bRet) SetTime(dt); break; } case FX_LOCALECATEGORY_DateTime: { CFX_DateTime dt; bRet = pFormat->ParseDateTime(wsValue, FX_DATETIMETYPE_DateTime, &dt); if (bRet) SetDateTime(dt); break; } default: m_wsValue = wsValue; bRet = true; break; } } if (!bRet) m_wsValue = wsValue; return bRet; } void CXFA_LocaleValue::GetNumericFormat(WideString& wsFormat, int32_t nIntLen, int32_t nDecLen) { ASSERT(wsFormat.IsEmpty()); ASSERT(nIntLen >= -1); ASSERT(nDecLen >= -1); int32_t nTotalLen = (nIntLen >= 0 ? nIntLen : 2) + 1 + (nDecLen >= 0 ? nDecLen : 2) + (nDecLen == 0 ? 0 : 1); { // Span's lifetime must end before ReleaseBuffer() below. pdfium::span lpBuf = wsFormat.GetBuffer(nTotalLen); int32_t nPos = 0; lpBuf[nPos++] = L's'; if (nIntLen == -1) { lpBuf[nPos++] = L'z'; lpBuf[nPos++] = L'*'; } else { while (nIntLen) { lpBuf[nPos++] = L'z'; nIntLen--; } } if (nDecLen != 0) { lpBuf[nPos++] = L'.'; } if (nDecLen == -1) { lpBuf[nPos++] = L'z'; lpBuf[nPos++] = L'*'; } else { while (nDecLen) { lpBuf[nPos++] = L'z'; nDecLen--; } } } wsFormat.ReleaseBuffer(nTotalLen); } bool CXFA_LocaleValue::ValidateNumericTemp(const WideString& wsNumeric, const WideString& wsFormat, LocaleIface* pLocale) { if (wsFormat.IsEmpty() || wsNumeric.IsEmpty()) return true; pdfium::span spNum = wsNumeric.span(); pdfium::span spFmt = wsFormat.span(); int32_t n = 0; int32_t nf = 0; wchar_t c = spNum[n]; wchar_t cf = spFmt[nf]; if (cf == L's') { if (c == L'-' || c == L'+') ++n; ++nf; } bool bLimit = true; int32_t nCount = wsNumeric.GetLength(); int32_t nCountFmt = wsFormat.GetLength(); while (n < nCount && (!bLimit || nf < nCountFmt) && FXSYS_IsDecimalDigit(c = spNum[n])) { if (bLimit) { if ((cf = spFmt[nf]) == L'*') bLimit = false; else if (cf == L'z') nf++; else return false; } n++; } if (n == nCount) return true; if (nf == nCountFmt) return false; while (nf < nCountFmt && (cf = spFmt[nf]) != L'.') { ASSERT(cf == L'z' || cf == L'*'); ++nf; } WideString wsDecimalSymbol; if (pLocale) wsDecimalSymbol = pLocale->GetDecimalSymbol(); else wsDecimalSymbol = WideString(L'.'); if (spFmt[nf] != L'.') return false; if (wsDecimalSymbol != WideStringView(c) && c != L'.') return false; ++nf; ++n; bLimit = true; while (n < nCount && (!bLimit || nf < nCountFmt) && FXSYS_IsDecimalDigit(spNum[n])) { if (bLimit) { if ((cf = spFmt[nf]) == L'*') bLimit = false; else if (cf == L'z') nf++; else return false; } n++; } return n == nCount; }