#!/usr/bin/env python
# Copyright 2016 The PDFium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
import cStringIO
import functools
import multiprocessing
import optparse
import os
import re
import shutil
import subprocess
import sys
import common
import gold
import pngdiffer
import suppressor
class KeyboardInterruptError(Exception):
  """Exception subclass raised in place of KeyboardInterrupt.

  TestOneFileParallel() converts a KeyboardInterrupt into this type, which
  derives from Exception rather than directly from BaseException.
  """
# Nomenclature:
# x_root - "x"
# x_filename - "x.ext"
# x_path - "path/to/a/b/c/x.ext"
# c_dir - "path/to/a/b/c"
def TestOneFileParallel(this, test_case):
  """Runs a single test case; used as the worker function for parallel runs.

  Args:
    this: object providing GenerateAndTest(input_filename, source_dir).
    test_case: an (input_filename, source_dir) pair.

  Returns:
    A tuple (result, input_filename, source_dir), where result is whatever
    this.GenerateAndTest() returned.

  Raises:
    KeyboardInterruptError: if a KeyboardInterrupt is raised while the test
      case is being processed.
  """
  try:
    name, directory = test_case
    outcome = this.GenerateAndTest(name, directory)
    return (outcome, name, directory)
  except KeyboardInterrupt:
    # Re-raise as an Exception subclass instead of KeyboardInterrupt.
    raise KeyboardInterruptError()
class TestRunner:
  """Runs the tests found under one testing directory.

  Run() parses the command line, locates the tools it needs, collects the
  test cases and executes them (in parallel when requested), recording
  failures and unexpected successes along the way.
  """

  def __init__(self, dirname):
    """Remembers which test directory to run.

    Args:
      dirname: name of the test directory. 'corpus' is resolved directly by
        the directory finder; any other name is resolved below 'resources'.
    """
    self.test_dir = dirname

  def GenerateAndTest(self, input_filename, source_dir):
    """Generates the PDF for one test case and checks its output.

    Args:
      input_filename: file name of the test input ("x.in" or "x.pdf").
      source_dir: directory containing input_filename.

    Returns:
      A tuple (success, outputfiles). success is a boolean indicating whether
      the test passed its comparisons; outputfiles is a list of tuples
      (path_to_image, md5_hash_of_pixelbuffer), empty unless the pixel test
      was run.
    """
    input_root, _ = os.path.splitext(input_filename)
    expected_txt_path = os.path.join(source_dir, input_root + '_expected.txt')
    pdf_path = os.path.join(self.working_dir, input_root + '.pdf')

    # Remove any existing generated images from previous runs.
    actual_images = self.image_differ.GetActualFiles(input_filename, source_dir,
                                                     self.working_dir)
    for image in actual_images:
      if os.path.exists(image):
        os.remove(image)

    sys.stdout.flush()

    raised_exception = self.Generate(source_dir, input_filename, input_root,
                                     pdf_path)
    if raised_exception is not None:
      print("FAILURE: " + input_filename + "; " + str(raised_exception))
      return False, []

    # A test with an "x_expected.txt" file is a text test; every other test
    # is a pixel test.
    results = []
    if os.path.exists(expected_txt_path):
      raised_exception = self.TestText(input_root, expected_txt_path, pdf_path)
    else:
      raised_exception, results = self.TestPixel(input_root, pdf_path)

    if raised_exception is not None:
      print("FAILURE: " + input_filename + "; " + str(raised_exception))
      return False, results

    if actual_images and self.image_differ.HasDifferences(
        input_filename, source_dir, self.working_dir):
      return False, results
    return True, results

  def Generate(self, source_dir, input_filename, input_root, pdf_path):
    """Places the PDF for one test case at pdf_path.

    An "x.evt" file next to the input, if present, is copied alongside the
    PDF. When there is no "x.in" template, the original file (if it exists)
    is copied to pdf_path as is; otherwise the fixup script is run on the
    template.

    Args:
      source_dir: directory containing the test input.
      input_filename: file name of the test input.
      input_root: input_filename without its extension.
      pdf_path: where the PDF under test is to be written.

    Returns:
      None when no template had to be processed; otherwise the result of
      common.RunCommand() for the fixup script (callers treat a non-None
      value as the failure to report).
    """
    original_path = os.path.join(source_dir, input_filename)
    input_path = os.path.join(source_dir, input_root + '.in')

    input_event_path = os.path.join(source_dir, input_root + ".evt")
    if os.path.exists(input_event_path):
      output_event_path = os.path.splitext(pdf_path)[0] + ".evt"
      shutil.copyfile(input_event_path, output_event_path)

    if not os.path.exists(input_path):
      if os.path.exists(original_path):
        shutil.copyfile(original_path, pdf_path)
      return None

    sys.stdout.flush()

    return common.RunCommand(
        [sys.executable, self.fixup_path, '--output-dir=' + self.working_dir,
         input_path])

  def TestText(self, input_root, expected_txt_path, pdf_path):
    """Runs the test executable on pdf_path and diffs its text output.

    The executable's stdout is captured in "<working_dir>/<input_root>.txt"
    and compared with expected_txt_path by the text diff script.

    Args:
      input_root: test input file name without its extension.
      expected_txt_path: path of the file holding the expected text output.
      pdf_path: path of the PDF under test.

    Returns:
      The subprocess.CalledProcessError raised if the test executable exits
      with a non-zero status; otherwise the result of common.RunCommand() for
      the diff script (callers treat a non-None value as the failure to
      report).
    """
    txt_path = os.path.join(self.working_dir, input_root + '.txt')

    with open(txt_path, 'w') as outfile:
      cmd_to_run = [self.pdfium_test_path, pdf_path]
      try:
        subprocess.check_call(cmd_to_run, stdout=outfile)
      except subprocess.CalledProcessError as e:
        # Report a failing executable as a failure of this one test instead
        # of letting the exception abort the whole run.
        return e

    cmd = [sys.executable, self.text_diff_path, expected_txt_path, txt_path]
    return common.RunCommand(cmd)

  def TestPixel(self, input_root, pdf_path):
    """Runs the test executable in PNG-producing mode on pdf_path.

    Args:
      input_root: test input file name without its extension (unused).
      pdf_path: path of the PDF under test.

    Returns:
      The result of common.RunCommandExtractHashedFiles(), which the caller
      unpacks as (raised_exception, results).
    """
    cmd_to_run = [self.pdfium_test_path, '--send-events', '--png']
    # Hashes are only requested when Gold results are being collected.
    if self.gold_results:
      cmd_to_run.append('--md5')
    cmd_to_run.append(pdf_path)
    return common.RunCommandExtractHashedFiles(cmd_to_run)

  def HandleResult(self, input_filename, input_path, result):
    """Records the outcome of one test case.

    Args:
      input_filename: file name of the test input, used for the suppression
        lookup.
      input_path: full path of the test input, used in the summaries.
      result: the (success, image_paths) tuple returned by GenerateAndTest().
    """
    success, image_paths = result

    if self.gold_results and image_paths:
      for img_path, md5_hash in image_paths:
        # The output filename (without extension) becomes the test name.
        test_name = os.path.splitext(os.path.split(img_path)[1])[0]
        self.gold_results.AddTestResult(test_name, md5_hash, img_path)

    if self.test_suppressor.IsResultSuppressed(input_filename):
      # A suppressed test is expected to fail; passing is the surprise.
      if success:
        self.surprises.append(input_path)
    elif not success:
      self.failures.append(input_path)

  def _ResolveInputPath(self, walk_from_dir, file_name):
    """Returns the path of a test file named on the command line, or None.

    The name is tried as given first. If no such file exists and the name
    ends in '.pdf', the '.in' template with the same root is tried instead.

    Args:
      walk_from_dir: directory that file_name is relative to.
      file_name: test file name as given on the command line.
    """
    input_path = os.path.join(walk_from_dir, file_name)
    if os.path.isfile(input_path):
      return input_path
    root, extension = os.path.splitext(input_path)
    if extension == '.pdf' and os.path.isfile(root + '.in'):
      return root + '.in'
    return None

  def _CollectTestCases(self, args, walk_from_dir):
    """Builds the list of (input_filename, source_dir) test cases.

    Args:
      args: test file names given on the command line; when empty, every
        matching, non-suppressed file below walk_from_dir is used.
      walk_from_dir: root directory of the tests.

    Returns:
      The list of test cases, or None if a file named in args is missing
      (a message has been printed in that case).
    """
    test_cases = []

    if args:
      for file_name in args:
        input_path = self._ResolveInputPath(walk_from_dir, file_name)
        if input_path is None:
          print("Can't find test file '%s'" % file_name)
          return None
        test_cases.append((os.path.basename(input_path),
                           os.path.dirname(input_path)))
      return test_cases

    input_file_re = re.compile('^[a-zA-Z0-9_.]+[.](in|pdf)$')
    for file_dir, _, filename_list in os.walk(walk_from_dir):
      for input_filename in filename_list:
        if not input_file_re.match(input_filename):
          continue
        input_path = os.path.join(file_dir, input_filename)
        if self.test_suppressor.IsExecutionSuppressed(input_path):
          continue
        if os.path.isfile(input_path):
          test_cases.append((input_filename, file_dir))
    return test_cases

  def Run(self):
    """Parses the command line, runs the tests and prints a summary.

    Returns:
      1 if the test executable or a test file named on the command line
      cannot be found, or if any test failed and --ignore_errors was not
      given; 0 otherwise.
    """
    parser = optparse.OptionParser()
    parser.add_option('--build-dir', default=os.path.join('out', 'Debug'),
                      help='relative path from the base source directory')
    parser.add_option('-j', default=multiprocessing.cpu_count(),
                      dest='num_workers', type='int',
                      help='run NUM_WORKERS jobs in parallel')
    parser.add_option('--gold_properties', default='', dest="gold_properties",
                      help='Key value pairs that are written to the top level of the JSON file that is ingested by Gold.')
    parser.add_option('--gold_key', default='', dest="gold_key",
                      help='Key value pairs that are added to the "key" field of the JSON file that is ingested by Gold.')
    parser.add_option('--gold_output_dir', default='', dest="gold_output_dir",
                      help='Path of where to write the JSON output to be uploaded to Gold.')
    parser.add_option('--gold_ignore_hashes', default='', dest="gold_ignore_hashes",
                      help='Path to a file with MD5 hashes we wish to ignore.')
    parser.add_option('--ignore_errors', action="store_true", dest="ignore_errors",
                      help='Prevents the return value from being non-zero when image comparison fails.')
    options, args = parser.parse_args()

    finder = common.DirectoryFinder(options.build_dir)
    self.fixup_path = finder.ScriptPath('fixup_pdf_template.py')
    self.text_diff_path = finder.ScriptPath('text_diff.py')

    self.source_dir = finder.TestingDir()
    if self.test_dir != 'corpus':
      test_dir = finder.TestingDir(os.path.join('resources', self.test_dir))
    else:
      test_dir = finder.TestingDir(self.test_dir)

    self.pdfium_test_path = finder.ExecutablePath('pdfium_test')
    if not os.path.exists(self.pdfium_test_path):
      print("FAILURE: Can't find test executable '%s'" % self.pdfium_test_path)
      print("Use --build-dir to specify its location.")
      return 1

    self.working_dir = finder.WorkingDir(os.path.join('testing', self.test_dir))
    if not os.path.exists(self.working_dir):
      os.makedirs(self.working_dir)

    self.feature_string = subprocess.check_output([self.pdfium_test_path,
                                                   '--show-config'])
    self.test_suppressor = suppressor.Suppressor(finder, self.feature_string)
    self.image_differ = pngdiffer.PNGDiffer(finder)

    walk_from_dir = finder.TestingDir(test_dir)

    test_cases = self._CollectTestCases(args, walk_from_dir)
    if test_cases is None:
      return 1

    self.failures = []
    self.surprises = []

    # Collect Gold results if an output directory was named.
    self.gold_results = None
    if options.gold_output_dir:
      self.gold_results = gold.GoldResults("pdfium",
                                           options.gold_output_dir,
                                           options.gold_properties,
                                           options.gold_key,
                                           options.gold_ignore_hashes)

    if options.num_workers > 1 and len(test_cases) > 1:
      # The pool is created outside the try block so that the cleanup in
      # "finally" never refers to a pool that failed to be constructed.
      pool = multiprocessing.Pool(options.num_workers)
      try:
        worker_func = functools.partial(TestOneFileParallel, self)
        for worker_result in pool.imap(worker_func, test_cases):
          result, input_filename, source_dir = worker_result
          input_path = os.path.join(source_dir, input_filename)
          self.HandleResult(input_filename, input_path, result)
      except KeyboardInterrupt:
        pool.terminate()
      finally:
        pool.close()
        pool.join()
    else:
      for input_filename, input_file_dir in test_cases:
        result = self.GenerateAndTest(input_filename, input_file_dir)
        self.HandleResult(input_filename,
                          os.path.join(input_file_dir, input_filename), result)

    if self.gold_results:
      self.gold_results.WriteResults()

    if self.surprises:
      self.surprises.sort()
      print('\n\nUnexpected Successes:')
      for surprise in self.surprises:
        print(surprise)

    if self.failures:
      self.failures.sort()
      print('\n\nSummary of Failures:')
      # Every failure is listed before the exit status is decided.
      for failure in self.failures:
        print(failure)
      if not options.ignore_errors:
        return 1

    return 0