mirror of
https://github.com/SerenityOS/serenity.git
synced 2025-01-23 01:41:59 -05:00
cfff04c9c7
This uses a non-stream xref table, and the spec says "The cross-reference table (comprising the original cross-reference section and all update sections) must contain one entry for each object number from 0 to the maximum object number used in the file". So this file isn't spec compliant. However, with xref streams this does happen in practice (the spec isn't quite clear on if it's valid there), and it's much easier to write a test file with a non-stream xref table by hand. Also, this file shows up fine in other PDF viewers. This is a regression test for #25079.
352 lines
15 KiB
C++
352 lines
15 KiB
C++
/*
|
|
* Copyright (c) 2021, Simon Woertz <simon@woertz.at>
|
|
*
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
*/
|
|
|
|
#include <AK/ByteString.h>
|
|
#include <AK/Forward.h>
|
|
#include <AK/LexicalPath.h>
|
|
#include <LibCore/MappedFile.h>
|
|
#include <LibCore/ResourceImplementationFile.h>
|
|
#include <LibCore/System.h>
|
|
#include <LibGfx/Bitmap.h>
|
|
#include <LibPDF/CommonNames.h>
|
|
#include <LibPDF/Document.h>
|
|
#include <LibPDF/Function.h>
|
|
#include <LibPDF/Renderer.h>
|
|
#include <LibTest/Macros.h>
|
|
#include <LibTest/TestCase.h>
|
|
|
|
TEST_CASE(parse_value)
|
|
{
|
|
// document isn't really used for anything, only to check there's no security_handler.
|
|
auto file = MUST(Core::MappedFile::map("linearized.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
|
|
auto contents = "<50607><10\n>"sv;
|
|
PDF::Parser parser(contents.bytes());
|
|
parser.set_document(document->make_weak_ptr());
|
|
|
|
auto value1 = MUST(parser.parse_value(PDF::Parser::CanBeIndirectValue::No));
|
|
auto string1 = value1.get<NonnullRefPtr<PDF::Object>>()->cast<PDF::StringObject>();
|
|
EXPECT(string1->is_binary());
|
|
EXPECT_EQ(string1->string(), "\x50\x60\x70"sv);
|
|
|
|
auto value2 = MUST(parser.parse_value(PDF::Parser::CanBeIndirectValue::No));
|
|
auto string2 = value2.get<NonnullRefPtr<PDF::Object>>()->cast<PDF::StringObject>();
|
|
EXPECT(string2->is_binary());
|
|
EXPECT_EQ(string2->string(), "\x10"sv);
|
|
}
|
|
|
|
TEST_CASE(linearized_pdf)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("linearized.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
}
|
|
|
|
TEST_CASE(non_linearized_pdf)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("non-linearized.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
}
|
|
|
|
TEST_CASE(complex_pdf)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("complex.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 3U);
|
|
}
|
|
|
|
TEST_CASE(empty_file_issue_10702)
|
|
{
|
|
AK::ReadonlyBytes empty;
|
|
auto document = PDF::Document::create(empty);
|
|
EXPECT(document.is_error());
|
|
}
|
|
|
|
TEST_CASE(encoding)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("encoding.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
|
|
auto info_dict = MUST(document->info_dict()).value();
|
|
EXPECT_EQ(MUST(info_dict.author()).value(), "Nico Weber");
|
|
EXPECT_EQ(MUST(info_dict.producer()).value(), (char const*)u8"Manüally Created");
|
|
EXPECT_EQ(MUST(info_dict.title()).value(), (char const*)u8"Êñ©•ding test");
|
|
|
|
auto outline_dict = document->outline();
|
|
EXPECT_EQ(outline_dict->count, 3u);
|
|
EXPECT_EQ(outline_dict->children[0]->title, (char const*)u8"Titlè 1");
|
|
EXPECT_EQ(outline_dict->children[1]->title, (char const*)u8"Titlè 2");
|
|
EXPECT_EQ(outline_dict->children[2]->title, (char const*)u8"Titlè 3");
|
|
}
|
|
|
|
TEST_CASE(offset)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("offset.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
}
|
|
|
|
TEST_CASE(truncated_pdf_header_issue_10717)
|
|
{
|
|
AK::ByteString string { "%PDF-2.11%" };
|
|
auto document = PDF::Document::create(string.bytes());
|
|
EXPECT(document.is_error());
|
|
}
|
|
|
|
TEST_CASE(encrypted_with_aes)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("password-is-sup.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
EXPECT(document->security_handler()->try_provide_user_password("sup"sv));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
|
|
auto info_dict = MUST(document->info_dict()).value();
|
|
EXPECT_EQ(MUST(info_dict.title()).value(), "sup");
|
|
EXPECT_EQ(MUST(info_dict.creator()).value(), "TextEdit");
|
|
}
|
|
|
|
TEST_CASE(encrypted_object_stream)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("encryption_nocopy.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
|
|
auto info_dict = MUST(document->info_dict()).value();
|
|
EXPECT_EQ(MUST(info_dict.author()).value(), "van der Knijff");
|
|
EXPECT_EQ(MUST(info_dict.creator()).value(), "Acrobat PDFMaker 9.1 voor Word");
|
|
}
|
|
|
|
TEST_CASE(resolve_indirect_reference_during_parsing)
|
|
{
|
|
auto file = MUST(Core::MappedFile::map("jbig2-globals.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
|
|
auto jbig2_stream_value = MUST(document->get_or_load_value(5));
|
|
auto jbig2_stream = MUST(document->resolve_to<PDF::StreamObject>(jbig2_stream_value));
|
|
EXPECT_EQ(jbig2_stream->bytes().size(), 20'000U);
|
|
}
|
|
|
|
TEST_CASE(malformed_pdf_document)
|
|
{
|
|
Array test_inputs = {
|
|
"oss-fuzz-testcase-62065.pdf"sv
|
|
};
|
|
|
|
for (auto test_input : test_inputs) {
|
|
auto file = MUST(Core::MappedFile::map(test_input));
|
|
auto document_or_error = PDF::Document::create(file->bytes());
|
|
EXPECT(document_or_error.is_error());
|
|
}
|
|
}
|
|
|
|
static PDF::Value make_array(Vector<float> floats)
|
|
{
|
|
Vector<PDF::Value> values;
|
|
for (auto f : floats)
|
|
values.append(PDF::Value { f });
|
|
return PDF::Value { make_object<PDF::ArrayObject>(move(values)) };
|
|
}
|
|
|
|
static PDF::PDFErrorOr<NonnullRefPtr<PDF::Function>> make_function(int type, ReadonlyBytes data, Vector<float> domain, Vector<float> range, Function<void(HashMap<DeprecatedFlyString, PDF::Value>&)> extra_keys = nullptr)
|
|
{
|
|
HashMap<DeprecatedFlyString, PDF::Value> map;
|
|
map.set(PDF::CommonNames::FunctionType, PDF::Value { type });
|
|
map.set(PDF::CommonNames::Domain, make_array(move(domain)));
|
|
map.set(PDF::CommonNames::Range, make_array(move(range)));
|
|
if (extra_keys)
|
|
extra_keys(map);
|
|
auto dict = make_object<PDF::DictObject>(move(map));
|
|
auto stream = make_object<PDF::StreamObject>(dict, MUST(ByteBuffer::copy(data)));
|
|
|
|
// document isn't used for anything, but UBSan complains about a (harmless) method call on a null object without it.
|
|
auto file = MUST(Core::MappedFile::map("linearized.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
return PDF::Function::create(document, stream);
|
|
}
|
|
|
|
static PDF::PDFErrorOr<NonnullRefPtr<PDF::Function>> make_sampled_function(ReadonlyBytes data, Vector<float> domain, Vector<float> range, Vector<float> sizes)
|
|
{
|
|
return make_function(0, data, move(domain), move(range), [&sizes](auto& map) {
|
|
map.set(PDF::CommonNames::Size, make_array(sizes));
|
|
map.set(PDF::CommonNames::BitsPerSample, PDF::Value { 8 });
|
|
});
|
|
}
|
|
|
|
TEST_CASE(sampled)
|
|
{
|
|
auto f1 = MUST(make_sampled_function(Vector<u8> { { 0, 255, 0 } }, { 0.0f, 1.0f }, { 0.0f, 10.0f }, { 3 }));
|
|
EXPECT_EQ(MUST(f1->evaluate(Vector<float> { 0.0f })), Vector<float> { 0.0f });
|
|
EXPECT_EQ(MUST(f1->evaluate(Vector<float> { 0.25f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f1->evaluate(Vector<float> { 0.5f })), Vector<float> { 10.0f });
|
|
EXPECT_EQ(MUST(f1->evaluate(Vector<float> { 0.75f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f1->evaluate(Vector<float> { 1.0f })), Vector<float> { 0.0f });
|
|
|
|
auto f2 = MUST(make_sampled_function(Vector<u8> { { 0, 255, 255, 0, 0, 255 } }, { 0.0f, 1.0f }, { 0.0f, 10.0f, 0.0f, 8.0f }, { 3 }));
|
|
EXPECT_EQ(MUST(f2->evaluate(Vector<float> { 0.0f })), (Vector<float> { 0.0f, 8.0f }));
|
|
EXPECT_EQ(MUST(f2->evaluate(Vector<float> { 0.25f })), (Vector<float> { 5.0f, 4.0f }));
|
|
EXPECT_EQ(MUST(f2->evaluate(Vector<float> { 0.5f })), (Vector<float> { 10.0f, 0.0f }));
|
|
EXPECT_EQ(MUST(f2->evaluate(Vector<float> { 0.75f })), (Vector<float> { 5.0f, 4.0f }));
|
|
EXPECT_EQ(MUST(f2->evaluate(Vector<float> { 1.0f })), (Vector<float> { 0.0f, 8.0f }));
|
|
|
|
auto f3 = MUST(make_sampled_function(Vector<u8> { { 0, 255, 0, 255, 0, 255 } }, { 0.0f, 1.0f, 0.0f, 1.0f }, { 0.0f, 10.0f }, { 3, 2 }));
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.0f, 0.0f })), Vector<float> { 0.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.25f, 0.0f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.5f, 0.0f })), Vector<float> { 10.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.75f, 0.0f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 1.0f, 0.0f })), Vector<float> { 0.0f });
|
|
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.0f, 0.5f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.25f, 0.5f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.5f, 0.5f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.75f, 0.5f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 1.0f, 0.5f })), Vector<float> { 5.0f });
|
|
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.0f, 1.0f })), Vector<float> { 10.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.25f, 1.0f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.5f, 1.0f })), Vector<float> { 0.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 0.75f, 1.0f })), Vector<float> { 5.0f });
|
|
EXPECT_EQ(MUST(f3->evaluate(Vector<float> { 1.0f, 1.0f })), Vector<float> { 10.0f });
|
|
|
|
auto f4 = MUST(make_sampled_function(Vector<u8> { { 0, 255, 255, 0, 0, 255, 255, 0 } }, { 0.0f, 1.0f, 0.0f, 1.0f }, { 0.0f, 10.0f, 0.0f, 8.0f }, { 2, 2 }));
|
|
EXPECT_EQ(MUST(f4->evaluate(Vector<float> { 0.0f, 0.0f })), (Vector<float> { 0.0f, 8.0f }));
|
|
EXPECT_EQ(MUST(f4->evaluate(Vector<float> { 0.5f, 0.5f })), (Vector<float> { 5.0f, 4.0f }));
|
|
}
|
|
|
|
static PDF::PDFErrorOr<NonnullRefPtr<PDF::Function>> make_postscript_function(StringView program, Vector<float> domain, Vector<float> range)
|
|
{
|
|
return make_function(4, program.bytes(), move(domain), move(range));
|
|
}
|
|
|
|
static NonnullRefPtr<PDF::Function> check_postscript_function(StringView program, Vector<float> domain, Vector<float> range)
|
|
{
|
|
auto function = make_postscript_function(program, move(domain), move(range));
|
|
if (function.is_error())
|
|
FAIL(function.error().message());
|
|
return function.value();
|
|
}
|
|
|
|
static void check_evaluate(StringView program, Vector<float> inputs, Vector<float> outputs)
|
|
{
|
|
Vector<float> domain;
|
|
for (size_t i = 0; i < inputs.size(); ++i) {
|
|
domain.append(-100.0f);
|
|
domain.append(100.0f);
|
|
}
|
|
Vector<float> range;
|
|
for (size_t i = 0; i < outputs.size(); ++i) {
|
|
range.append(-100.0f);
|
|
range.append(100.0f);
|
|
}
|
|
auto function = check_postscript_function(program, domain, range);
|
|
auto result = function->evaluate(inputs);
|
|
if (result.is_error())
|
|
FAIL(result.error().message());
|
|
EXPECT_EQ(result.value(), outputs);
|
|
}
|
|
|
|
TEST_CASE(postscript)
|
|
{
|
|
// Arithmetic operators
|
|
check_evaluate("{ abs }"sv, { 0.5f }, { 0.5f });
|
|
check_evaluate("{ add }"sv, { 0.25f, 0.5f }, { 0.75f });
|
|
check_evaluate("{ atan }"sv, { 1.0f, 0.01f }, { AK::to_degrees(atan2f(0.01f, 1.0f)) });
|
|
check_evaluate("{ ceiling }"sv, { 0.5f }, { 1.0f });
|
|
check_evaluate("{ cos }"sv, { 1.0f }, { cosf(AK::to_radians(1.0f)) });
|
|
check_evaluate("{ cvi }"sv, { 0.5f }, { 0.0f });
|
|
check_evaluate("{ cvr }"sv, { 0.5f }, { 0.5f });
|
|
check_evaluate("{ div }"sv, { 0.5f, 1.0f }, { 0.5f });
|
|
check_evaluate("{ exp }"sv, { 0.0f }, { 1.0f });
|
|
check_evaluate("{ floor }"sv, { 0.5f }, { 0.0f });
|
|
check_evaluate("{ idiv }"sv, { 0.5f, 1.0f }, { 0.0f });
|
|
check_evaluate("{ ln }"sv, { 10.0f }, { logf(10.0f) });
|
|
check_evaluate("{ log }"sv, { 10.0f }, { log10f(10.0f) });
|
|
check_evaluate("{ mod }"sv, { 0.5f, 0.25f }, { 0.0f });
|
|
check_evaluate("{ mul }"sv, { 0.5f, 0.25f }, { 0.125f });
|
|
check_evaluate("{ neg }"sv, { 0.5f }, { -0.5f });
|
|
check_evaluate("{ round }"sv, { 0.5f }, { 1.0f });
|
|
check_evaluate("{ sin }"sv, { 1.0f }, { sinf(AK::to_radians(1.0f)) });
|
|
check_evaluate("{ sqrt }"sv, { 0.5f }, { sqrtf(0.5f) });
|
|
check_evaluate("{ sub }"sv, { 0.5f, 0.25f }, { 0.25f });
|
|
check_evaluate("{ truncate }"sv, { 0.5f }, { 0.0f });
|
|
|
|
// Relational, boolean, and bitwise operators
|
|
check_evaluate("{ and }"sv, { 0.0f, 1.0f }, { 0.0f });
|
|
check_evaluate("{ bitshift }"sv, { 1.0f, 3.0f }, { 8.0f });
|
|
check_evaluate("{ bitshift }"sv, { 8.0f, -2.0f }, { 2.0f });
|
|
check_evaluate("{ eq }"sv, { 0.5f, 0.5f }, { 1.0f });
|
|
check_evaluate("{ ge }"sv, { 0.5f, 0.5f }, { 1.0f });
|
|
check_evaluate("{ gt }"sv, { 0.5f, 0.5f }, { 0.0f });
|
|
check_evaluate("{ le }"sv, { 0.5f, 0.5f }, { 1.0f });
|
|
check_evaluate("{ lt }"sv, { 0.5f, 0.5f }, { 0.0f });
|
|
check_evaluate("{ ne }"sv, { 0.5f, 0.5f }, { 0.0f });
|
|
check_evaluate("{ not }"sv, { 0.5f }, { 0.0f });
|
|
check_evaluate("{ or }"sv, { 0.0f, 1.0f }, { 1.0f });
|
|
check_evaluate("{ xor }"sv, { 0.0f, 1.0f }, { 1.0f });
|
|
|
|
// Conditional operators
|
|
check_evaluate("{ { 4 } if }"sv, { 1.0f }, { 4.0f });
|
|
check_evaluate("{ { 4 } if }"sv, { 0.0f }, {});
|
|
check_evaluate("{ { 4 } { 5 } ifelse }"sv, { 1.0f }, { 4.0f });
|
|
check_evaluate("{ { 4 } { 5 } ifelse }"sv, { 0.0f }, { 5.0f });
|
|
|
|
// Stack operators
|
|
check_evaluate("{ 2 copy }"sv, { 8.0f, 0.5f, 1.0f }, { 8.0f, 0.5f, 1.0f, 0.5f, 1.0f });
|
|
check_evaluate("{ dup }"sv, { 1.0f, 0.5f }, { 1.0f, 0.5f, 0.5f });
|
|
check_evaluate("{ exch }"sv, { 8.0f, 1.0f, 0.5f }, { 8.0f, 0.5f, 1.0f });
|
|
check_evaluate("{ 1 index }"sv, { 8.0f, 1.0f, 0.5f }, { 8.0f, 1.0f, 0.5f, 1.0f });
|
|
check_evaluate("{ pop }"sv, { 8.0f, 1.0f, 0.5f }, { 8.0f, 1.0f });
|
|
check_evaluate("{ 3 1 roll }"sv, { 0.5f, 1.0f, 2.0f }, { 2.0f, 0.5f, 1.0f });
|
|
check_evaluate("{ 3 -1 roll }"sv, { 0.5f, 1.0f, 2.0f }, { 1.0f, 2.0f, 0.5f });
|
|
}
|
|
|
|
TEST_CASE(render)
|
|
{
|
|
#if !defined(AK_OS_SERENITY)
|
|
// Get from Build/lagom/bin/TestPDF to Build/lagom/Root/res.
|
|
auto source_root = LexicalPath(MUST(Core::System::current_executable_path())).parent().parent().string();
|
|
Core::ResourceImplementation::install(make<Core::ResourceImplementationFile>(MUST(String::formatted("{}/Root/res", source_root))));
|
|
#endif
|
|
|
|
auto file = MUST(Core::MappedFile::map("colorspaces.pdf"sv));
|
|
auto document = MUST(PDF::Document::create(file->bytes()));
|
|
MUST(document->initialize());
|
|
EXPECT_EQ(document->get_page_count(), 1U);
|
|
|
|
auto page = MUST(document->get_page(0));
|
|
auto page_size = Gfx::IntSize { 310, 370 };
|
|
auto bitmap = MUST(Gfx::Bitmap::create(Gfx::BitmapFormat::BGRx8888, page_size));
|
|
MUST(PDF::Renderer::render(document, page, bitmap, Color::White, PDF::RenderingPreferences {}));
|
|
|
|
// DeviceGray
|
|
EXPECT_EQ(bitmap->get_pixel(270, 370 - 20), Gfx::Color::NamedColor::Black);
|
|
|
|
// MyCalRGB
|
|
EXPECT_EQ(bitmap->get_pixel(270, 370 - 80), Gfx::Color::NamedColor::Black);
|
|
|
|
// DeviceRGB
|
|
EXPECT_EQ(bitmap->get_pixel(270, 370 - 140), Gfx::Color::NamedColor::Black);
|
|
|
|
// DeviceCMYK (note: black one box further left)
|
|
EXPECT_EQ(bitmap->get_pixel(220, 370 - 200), Gfx::Color::NamedColor::Black);
|
|
|
|
// MyLab
|
|
EXPECT_EQ(bitmap->get_pixel(270, 370 - 260), Gfx::Color::NamedColor::Black);
|
|
|
|
// MyCalGray
|
|
EXPECT_EQ(bitmap->get_pixel(270, 370 - 320), Gfx::Color::NamedColor::Black);
|
|
}
|