diff options
Diffstat (limited to 'xfa/fxfa/fm2js/xfa_lexer_unittest.cpp')
-rw-r--r-- | xfa/fxfa/fm2js/xfa_lexer_unittest.cpp | 239 |
1 files changed, 239 insertions, 0 deletions
diff --git a/xfa/fxfa/fm2js/xfa_lexer_unittest.cpp b/xfa/fxfa/fm2js/xfa_lexer_unittest.cpp new file mode 100644 index 0000000000..fac0c9ac55 --- /dev/null +++ b/xfa/fxfa/fm2js/xfa_lexer_unittest.cpp @@ -0,0 +1,239 @@ +// Copyright 2016 PDFium Authors. All rights reserved. +// Use of this source code is governed by a BSD-style license that can be +// found in the LICENSE file. + +#include "xfa/fxfa/fm2js/xfa_lexer.h" + +#include <vector> + +#include "testing/gtest/include/gtest/gtest.h" +#include "testing/test_support.h" +#include "third_party/base/ptr_util.h" + +TEST(CXFA_FMLexerTest, EmptyString) { + CXFA_FMLexer lexer(L"", nullptr); + CXFA_FMToken* token = lexer.NextToken(); + EXPECT_EQ(TOKeof, token->m_type); +} + +TEST(CXFA_FMLexerTest, Numbers) { + auto lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"-12", nullptr); + CXFA_FMToken* token = lexer->NextToken(); + // TODO(dsinclair): Should this return -12 instead of two tokens? + EXPECT_EQ(TOKminus, token->m_type); + token = lexer->NextToken(); + EXPECT_EQ(L"12", token->m_wstring); + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"1.5362", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"1.5362", token->m_wstring); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"0.875", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"0.875", token->m_wstring); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"5.56e-2", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"5.56e-2", token->m_wstring); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"1.234E10", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"1.234E10", token->m_wstring); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"123456789.012345678", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + // TODO(dsinclair): This should round as per IEEE 64-bit values. + // EXPECT_EQ(L"123456789.01234567", token->m_wstring); + EXPECT_EQ(L"123456789.012345678", token->m_wstring); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"99999999999999999", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + // TODO(dsinclair): This is spec'd as rounding when > 16 significant digits + // prior to the exponent. + // EXPECT_EQ(L"100000000000000000", token->m_wstring); + EXPECT_EQ(L"99999999999999999", token->m_wstring); +} + +// The quotes are stripped in CXFA_FMStringExpression::ToJavaScript. +TEST(CXFA_FMLexerTest, Strings) { + auto lexer = pdfium::MakeUnique<CXFA_FMLexer>( + L"\"The cat jumped over the fence.\"", nullptr); + CXFA_FMToken* token = lexer->NextToken(); + EXPECT_EQ(TOKstring, token->m_type); + EXPECT_EQ(L"\"The cat jumped over the fence.\"", token->m_wstring); + + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"\"\"", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKstring, token->m_type); + EXPECT_EQ(L"\"\"", token->m_wstring); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>( + L"\"The message reads: \"\"Warning: Insufficient Memory\"\"\"", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKstring, token->m_type); + EXPECT_EQ(L"\"The message reads: \"\"Warning: Insufficient Memory\"\"\"", + token->m_wstring); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>( + L"\"\\u0047\\u006f\\u0066\\u0069\\u0073\\u0068\\u0021\\u000d\\u000a\"", + nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKstring, token->m_type); + EXPECT_EQ( + L"\"\\u0047\\u006f\\u0066\\u0069\\u0073\\u0068\\u0021\\u000d\\u000a\"", + token->m_wstring); +} + +// Note, 'this' is a keyword but is not matched by the lexer. +TEST(CXFA_FMLexerTest, OperatorsAndKeywords) { + struct { + const wchar_t* op; + XFA_FM_TOKEN token; + } op[] = {{L"+", TOKplus}, + {L"/", TOKdiv}, + {L"-", TOKminus}, + {L"&", TOKand}, + {L"|", TOKor}, + {L"*", TOKmul}, + {L"<", TOKlt}, + {L">", TOKgt}, + {L"==", TOKeq}, + {L"<>", TOKne}, + {L"<=", TOKle}, + {L">=", TOKge}, + {L"and", TOKksand}, + {L"break", TOKbreak}, + {L"continue", TOKcontinue}, + {L"do", TOKdo}, + {L"downto", TOKdownto}, + {L"else", TOKelse}, + {L"elseif", TOKelseif}, + {L"end", TOKend}, + {L"endfor", TOKendfor}, + {L"endfunc", TOKendfunc}, + {L"endif", TOKendif}, + {L"endwhile", TOKendwhile}, + {L"eq", TOKkseq}, + {L"exit", TOKexit}, + {L"for", TOKfor}, + {L"foreach", TOKforeach}, + {L"func", TOKfunc}, + {L"ge", TOKksge}, + {L"gt", TOKksgt}, + {L"if", TOKif}, + {L"in", TOKin}, + {L"infinity", TOKinfinity}, + {L"le", TOKksle}, + {L"lt", TOKkslt}, + {L"nan", TOKnan}, + {L"ne", TOKksne}, + {L"not", TOKksnot}, + {L"null", TOKnull}, + {L"or", TOKksor}, + {L"return", TOKreturn}, + {L"step", TOKstep}, + {L"then", TOKthen}, + {L"throw", TOKthrow}, + {L"upto", TOKupto}, + {L"var", TOKvar}, + {L"while", TOKwhile}, + + // The following are defined but aren't in the spec. + {L"(", TOKlparen}, + {L")", TOKrparen}, + {L",", TOKcomma}, + {L".", TOKdot}, + {L"[", TOKlbracket}, + {L"]", TOKrbracket}, + {L"..", TOKdotdot}, + {L".#", TOKdotscream}, + {L".*", TOKdotstar}}; + + for (size_t i = 0; i < FX_ArraySize(op); ++i) { + auto lexer = pdfium::MakeUnique<CXFA_FMLexer>(op[i].op, nullptr); + CXFA_FMToken* token = lexer->NextToken(); + EXPECT_EQ(op[i].token, token->m_type); + } +} + +TEST(CXFA_FMLexerTest, Comments) { + auto lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"// Empty.", nullptr); + CXFA_FMToken* token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"//", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"123 // Empty.\n\"str\"", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"123", token->m_wstring); + + token = lexer->NextToken(); + EXPECT_EQ(TOKstring, token->m_type); + EXPECT_EQ(L"\"str\"", token->m_wstring); + + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L";", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"; Empty.", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"123 ;Empty.\n\"str\"", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"123", token->m_wstring); + + token = lexer->NextToken(); + EXPECT_EQ(TOKstring, token->m_type); + EXPECT_EQ(L"\"str\"", token->m_wstring); + + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); +} + +TEST(CXFA_FMLexerTest, Identifiers) { + std::vector<const wchar_t*> identifiers = { + L"a", L"an_identifier", L"_ident", L"$ident", L"!ident", L"GetAddr"}; + for (const auto* ident : identifiers) { + auto lexer = pdfium::MakeUnique<CXFA_FMLexer>(ident, nullptr); + CXFA_FMToken* token = lexer->NextToken(); + EXPECT_EQ(TOKidentifier, token->m_type); + EXPECT_EQ(ident, token->m_wstring); + } +} + +TEST(CXFA_FMLexerTest, Whitespace) { + auto lexer = pdfium::MakeUnique<CXFA_FMLexer>(L" \t\xc\x9\xb", nullptr); + CXFA_FMToken* token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); + + lexer = pdfium::MakeUnique<CXFA_FMLexer>(L"123 \t\xc\x9\xb 456", nullptr); + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"123", token->m_wstring); + + token = lexer->NextToken(); + EXPECT_EQ(TOKnumber, token->m_type); + EXPECT_EQ(L"456", token->m_wstring); + + token = lexer->NextToken(); + EXPECT_EQ(TOKeof, token->m_type); +} |