Source code
Revision control
Copy as Markdown
Other Tools
/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* vim: set ts=8 sts=2 et sw=2 tw=80: */
/* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
#include "Common.h"
#include "gtest/gtest.h"
#include "nsCRT.h"
#include "nsIDocumentEncoder.h"
#include "nsIParserUtils.h"
#include "nsServiceManagerUtils.h"
#include "nsString.h"
// Test for ASCII with format=flowed; delsp=yes
TEST(PlainTextSerializer, ASCIIWithFlowedDelSp)
{
nsString test;
nsString result;
test.AssignLiteral(
"<html><body>"
"Firefox Firefox Firefox Firefox "
"Firefox Firefox Firefox Firefox "
"Firefox Firefox Firefox Firefox"
"</body></html>");
ConvertBufToPlainText(test,
nsIDocumentEncoder::OutputFormatted |
nsIDocumentEncoder::OutputCRLineBreak |
nsIDocumentEncoder::OutputLFLineBreak |
nsIDocumentEncoder::OutputFormatFlowed |
nsIDocumentEncoder::OutputFormatDelSp,
kDefaultWrapColumn);
// create result case
result.AssignLiteral(
"Firefox Firefox Firefox Firefox "
"Firefox Firefox Firefox Firefox "
"Firefox \r\nFirefox Firefox Firefox\r\n");
ASSERT_EQ(test, result)
<< "Wrong HTML to ASCII text serialization with format=flowed; delsp=yes";
}
TEST(PlainTextSerializer, Bug1864820)
{
nsString test(
uR"#(
<html><body>
> label=master&label=experimental&product=chrome&product=firefox&product=safari&aligned&view=interop&q=label%3Ainterop-2023-property
<blockquote>
> label=master&label=experimental&product=chrome&product=firefox&product=safari&aligned&view=interop&q=label%3Ainterop-2023-property
</blockquote>
</body></html>
)#");
ConvertBufToPlainText(test,
nsIDocumentEncoder::OutputFormatted |
nsIDocumentEncoder::OutputPersistNBSP |
nsIDocumentEncoder::OutputLFLineBreak |
nsIDocumentEncoder::OutputFormatFlowed,
kDefaultWrapColumn);
nsString result(
uR"#(
>Â Â label=master&label=experimental&product=chrome&product=firefox&product=safari&aligned&view=interop&q=label%3Ainterop-2023-property
>Â Â label=master&label=experimental&product=chrome&product=firefox&product=safari&aligned&view=interop&q=label%3Ainterop-2023-property
)#");
result.Trim(" \n");
test.Trim(" \n");
ASSERT_EQ(test, result) << "Shouldn't hang with format=flowed";
}
// Test for CJK with format=flowed; delsp=yes
TEST(PlainTextSerializer, CJKWithFlowedDelSp)
{
nsString test;
nsString result;
test.AssignLiteral("<html><body>");
for (uint32_t i = 0; i < 40; i++) {
// Insert Kanji (U+5341)
test.Append(0x5341);
}
test.AppendLiteral("</body></html>");
ConvertBufToPlainText(test,
nsIDocumentEncoder::OutputFormatted |
nsIDocumentEncoder::OutputCRLineBreak |
nsIDocumentEncoder::OutputLFLineBreak |
nsIDocumentEncoder::OutputFormatFlowed |
nsIDocumentEncoder::OutputFormatDelSp,
kDefaultWrapColumn);
// create result case
for (uint32_t i = 0; i < 36; i++) {
result.Append(0x5341);
}
result.AppendLiteral(" \r\n");
for (uint32_t i = 0; i < 4; i++) {
result.Append(0x5341);
}
result.AppendLiteral("\r\n");
ASSERT_EQ(test, result)
<< "Wrong HTML to CJK text serialization with format=flowed; delsp=yes";
}
// Test for CJK with DisallowLineBreaking
TEST(PlainTextSerializer, CJKWithDisallowLineBreaking)
{
nsString test;
nsString result;
test.AssignLiteral("<html><body>");
for (uint32_t i = 0; i < 400; i++) {
// Insert Kanji (U+5341)
test.Append(0x5341);
}
test.AppendLiteral("</body></html>");
ConvertBufToPlainText(test,
nsIDocumentEncoder::OutputFormatted |
nsIDocumentEncoder::OutputCRLineBreak |
nsIDocumentEncoder::OutputLFLineBreak |
nsIDocumentEncoder::OutputFormatFlowed |
nsIDocumentEncoder::OutputDisallowLineBreaking,
kDefaultWrapColumn);
// create result case
for (uint32_t i = 0; i < 400; i++) {
result.Append(0x5341);
}
result.AppendLiteral("\r\n");
ASSERT_EQ(test, result)
<< "Wrong HTML to CJK text serialization with OutputDisallowLineBreaking";
}
// Test for Latin with DisallowLineBreaking
TEST(PlainTextSerializer, LatinWithDisallowLineBreaking)
{
nsString test;
test.AssignLiteral("<html><body>");
for (uint32_t i = 0; i < 400; i++) {
// Insert á (Latin Small Letter a with Acute) (U+00E1)
test.Append(0x00E1);
}
test.AppendLiteral("</body></html>\r\n");
ConvertBufToPlainText(test,
nsIDocumentEncoder::OutputFormatted |
nsIDocumentEncoder::OutputCRLineBreak |
nsIDocumentEncoder::OutputLFLineBreak |
nsIDocumentEncoder::OutputFormatFlowed |
nsIDocumentEncoder::OutputDisallowLineBreaking,
kDefaultWrapColumn);
// Create expect case.
nsString expect;
for (uint32_t i = 0; i < 400; i++) {
expect.Append(0x00E1);
}
expect.AppendLiteral(" \r\n\r\n");
ASSERT_EQ(test, expect) << "Wrong HTML to Latin text serialization with "
"OutputDisallowLineBreaking";
}
// Test for ASCII with format=flowed; and quoted lines in preformatted span.
TEST(PlainTextSerializer, PreformatFlowedQuotes)
{
nsString test;
nsString result;
test.AssignLiteral(
"<html><body>"
"<span style=\"white-space: pre-wrap;\" _moz_quote=\"true\">"
"> Firefox Firefox Firefox Firefox <br>"
"> Firefox Firefox Firefox <b>Firefox</b><br>"
"><br>"
">> Firefox Firefox Firefox Firefox <br>"
">> Firefox Firefox Firefox Firefox<br>"
"</span></body></html>");
ConvertBufToPlainText(test,
nsIDocumentEncoder::OutputFormatted |
nsIDocumentEncoder::OutputCRLineBreak |
nsIDocumentEncoder::OutputLFLineBreak |
nsIDocumentEncoder::OutputFormatFlowed,
kDefaultWrapColumn);
// create result case
result.AssignLiteral(
"> Firefox Firefox Firefox Firefox \r\n"
"> Firefox Firefox Firefox *Firefox*\r\n"
">\r\n"
">> Firefox Firefox Firefox Firefox \r\n"
">> Firefox Firefox Firefox Firefox\r\n");
ASSERT_EQ(test, result) << "Wrong HTML to ASCII text serialization "
"with format=flowed; and quoted "
"lines using OutputFormatted";
}
// Test for ASCII with format=flowed; and not using OutputFormatted.
TEST(PlainTextSerializer, OutputFormatFlowedAndWrapped)
{
nsString test;
nsString result;
test.AssignLiteral(
"<html><body>"
"<span style=\"white-space: pre-wrap;\" _moz_quote=\"true\">"
"> Firefox Firefox Firefox Firefox <br>"
"> Firefox Firefox Firefox <b>Firefox</b><br>"
"><br>"
">> Firefox Firefox Firefox Firefox <br>"
">> Firefox Firefox Firefox Firefox<br>"
"</span></body></html>");
ConvertBufToPlainText(test,
nsIDocumentEncoder::OutputWrap |
nsIDocumentEncoder::OutputCRLineBreak |
nsIDocumentEncoder::OutputLFLineBreak |
nsIDocumentEncoder::OutputFormatFlowed,
kDefaultWrapColumn);
// create result case
result.AssignLiteral(
"> Firefox Firefox Firefox Firefox \r\n"
"> Firefox Firefox Firefox Firefox\r\n"
">\r\n"
">> Firefox Firefox Firefox Firefox \r\n"
">> Firefox Firefox Firefox Firefox\r\n");
ASSERT_EQ(test, result) << "Wrong HTML to ASCII text serialization "
"with format=flowed; and quoted "
"lines using OutputWrap";
}
TEST(PlainTextSerializer, PrettyPrintedHtml)
{
nsString test;
test.AppendLiteral("<html>" NS_LINEBREAK "<body>" NS_LINEBREAK
" first<br>" NS_LINEBREAK " second<br>" NS_LINEBREAK
"</body>" NS_LINEBREAK "</html>");
ConvertBufToPlainText(test, 0, kDefaultWrapColumn);
nsAutoString expect;
expect.AppendLiteral("first" NS_LINEBREAK "second" NS_LINEBREAK);
ASSERT_EQ(test, expect) << "Wrong prettyprinted html to text serialization";
}
TEST(PlainTextSerializer, PreElement)
{
nsString test;
test.AppendLiteral("<html>" NS_LINEBREAK "<body>" NS_LINEBREAK
"<pre>" NS_LINEBREAK " first" NS_LINEBREAK
" second" NS_LINEBREAK "</pre>" NS_LINEBREAK
"</body>" NS_LINEBREAK "</html>");
ConvertBufToPlainText(test, 0, kDefaultWrapColumn);
nsAutoString expect;
expect.AppendLiteral(" first" NS_LINEBREAK
" second" NS_LINEBREAK NS_LINEBREAK);
ASSERT_EQ(test, expect) << "Wrong prettyprinted html to text serialization";
}
TEST(PlainTextSerializer, BlockElement)
{
nsString test;
test.AppendLiteral("<html>" NS_LINEBREAK "<body>" NS_LINEBREAK
"<div>" NS_LINEBREAK " first" NS_LINEBREAK
"</div>" NS_LINEBREAK "<div>" NS_LINEBREAK
" second" NS_LINEBREAK "</div>" NS_LINEBREAK
"</body>" NS_LINEBREAK "</html>");
ConvertBufToPlainText(test, 0, kDefaultWrapColumn);
nsAutoString expect;
expect.AppendLiteral("first" NS_LINEBREAK "second" NS_LINEBREAK);
ASSERT_EQ(test, expect) << "Wrong prettyprinted html to text serialization";
}
TEST(PlainTextSerializer, PreWrapElementForThunderbird)
{
// This test examines the magic pre-wrap setup that Thunderbird relies on.
nsString test;
test.AppendLiteral("<html>" NS_LINEBREAK
"<body style=\"white-space: pre-wrap;\">" NS_LINEBREAK
"<pre>" NS_LINEBREAK
" first line is too long" NS_LINEBREAK
" second line is even loooonger " NS_LINEBREAK
"</pre>" NS_LINEBREAK "</body>" NS_LINEBREAK "</html>");
const uint32_t wrapColumn = 10;
ConvertBufToPlainText(test, nsIDocumentEncoder::OutputWrap, wrapColumn);
// "\n\n first\nline is\ntoo long\n second\nline is\neven\nloooonger\n\n\n"
nsAutoString expect;
expect.AppendLiteral(NS_LINEBREAK NS_LINEBREAK
" first" NS_LINEBREAK "line is" NS_LINEBREAK
"too long" NS_LINEBREAK " second" NS_LINEBREAK
"line is" NS_LINEBREAK "even" NS_LINEBREAK
"loooonger" NS_LINEBREAK NS_LINEBREAK NS_LINEBREAK);
ASSERT_EQ(test, expect) << "Wrong prettyprinted html to text serialization";
}
TEST(PlainTextSerializer, Simple)
{
nsString test;
test.AppendLiteral(
"<html><base>base</base><head><span>span</span></head>"
"<body>body</body></html>");
ConvertBufToPlainText(test, 0, kDefaultWrapColumn);
nsAutoString expect;
expect.AppendLiteral("basespanbody");
ASSERT_EQ(test, expect) << "Wrong html to text serialization";
}
TEST(PlainTextSerializer, OneHundredAndOneOL)
{
nsAutoString test;
test.AppendLiteral(
"<html>"
"<body>"
"<ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><"
"ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><"
"ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><"
"ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><"
"ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><"
"ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol><ol></ol></ol></ol></"
"ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></"
"ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></"
"ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></"
"ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></"
"ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></"
"ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></"
"ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></ol></"
"ol></ol><li>X</li></ol>"
"</body>"
"</html>");
ConvertBufToPlainText(test, nsIDocumentEncoder::OutputFormatted,
kDefaultWrapColumn);
nsAutoString expected;
expected.AppendLiteral(" 1. X" NS_LINEBREAK);
ASSERT_EQ(test, expected);
}