# Copyright 2015 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
import errno
import hashlib
import logging
import math
import mmap
import os
import re
from autotest_lib.client.common_lib import error
from autotest_lib.client.common_lib import file_utils
from autotest_lib.client.cros import chrome_binary_test
from autotest_lib.client.cros.video import device_capability
from autotest_lib.client.cros.video import helper_logger
# Base URL of the public bucket the test videos are downloaded from.
DOWNLOAD_BASE = (
    'http://commondatastorage.googleapis.com/chromiumos-test-assets-public/')

# Chrome test binary under test and the 'time' wrapper used to sample CPU.
VEA_BINARY = 'video_encode_accelerator_unittest'
TIME_BINARY = '/usr/local/bin/time'

# The format used for 'time': <real time> <kernel time> <user time>
TIME_OUTPUT_FORMAT = '%e %S %U'

# Suffixes of the per-test-case files written to the results directory.
FRAME_STATS_SUFFIX = 'frame-data.csv'
TEST_LOG_SUFFIX = 'test.log'
TIME_LOG_SUFFIX = 'time.log'

# Performance keys:

# FPS (i.e. encoder throughput)
KEY_FPS = 'fps'

# Encode latencies at the 50th, 75th, and 95th percentiles.
# Encode latency is the delay from input of a frame to output of the encoded
# bitstream.
KEY_ENCODE_LATENCY_50 = 'encode_latency.50_percentile'
KEY_ENCODE_LATENCY_75 = 'encode_latency.75_percentile'
KEY_ENCODE_LATENCY_95 = 'encode_latency.95_percentile'

# CPU usage in kernel space
KEY_CPU_KERNEL_USAGE = 'cpu_usage.kernel'

# CPU usage in user space
KEY_CPU_USER_USAGE = 'cpu_usage.user'

# Units of performance values:
UNIT_MILLISECOND = 'milliseconds'
UNIT_MICROSECOND = 'us'
UNIT_RATIO = 'ratio'
UNIT_FPS = 'fps'

# Patterns matching single lines of the unittest output log. All of them are
# compiled with re.MULTILINE so that '^' and '$' anchor at line boundaries.
RE_FPS = re.compile(r'^Measured encoder FPS: ([+\-]?[0-9.]+)$', re.MULTILINE)

# The three latency lines differ only in the percentile number.
_RE_ENCODE_LATENCY_TEMPLATE = (
    r'^Encode latency for the %dth percentile: (\d+) us$')
RE_ENCODE_LATENCY_50 = re.compile(_RE_ENCODE_LATENCY_TEMPLATE % 50,
                                  re.MULTILINE)
RE_ENCODE_LATENCY_75 = re.compile(_RE_ENCODE_LATENCY_TEMPLATE % 75,
                                  re.MULTILINE)
RE_ENCODE_LATENCY_95 = re.compile(_RE_ENCODE_LATENCY_TEMPLATE % 95,
                                  re.MULTILINE)
def _remove_if_exists(filepath):
    """
    Removes a file, silently succeeding if it does not exist.

    @param filepath: Path of the file to remove.

    @raises OSError: if the removal fails for any reason other than the file
            being absent (errno.ENOENT).
    """
    try:
        os.remove(filepath)
    # 'except ... as' is accepted by both Python 2.6+ and Python 3, unlike the
    # legacy comma form.
    except OSError as e:
        if e.errno != errno.ENOENT:  # no such file
            raise
class video_VEAPerf(chrome_binary_test.ChromeBinaryTest):
    """
    This test monitors several performance metrics reported by Chrome test
    binary, video_encode_accelerator_unittest.

    For each test case the binary is run three times: at full speed to
    measure FPS, at the requested frame rate (wrapped in 'time') to measure
    encode latency and CPU usage, and once more with --frame_stats to compute
    per-frame SSIM/PSNR quality scores.
    """

    version = 1


    def _logperf(self, test_name, key, value, units, higher_is_better=False):
        """
        Reports one perf value under the description '<test_name>.<key>'.

        @param test_name: Name of the test case the value belongs to.
        @param key: Name of the metric (one of the KEY_* constants or a
                'quality.*' key).
        @param value: The measured value.
        @param units: Unit string of the value, or None.
        @param higher_is_better: Whether a larger value is an improvement.
        """
        description = '%s.%s' % (test_name, key)
        self.output_perf_value(
                description=description, value=value, units=units,
                higher_is_better=higher_is_better)


    def _analyze_fps(self, test_name, log_file):
        """
        Analyzes FPS info from result log file.

        @param test_name: Name of the test case.
        @param log_file: Path of the unittest output log.

        @raises error.TestError: if the log does not contain exactly one FPS
                line.
        """
        # Read the log as text rather than mmap-ing it: mmap refuses empty
        # files, which would hide the real problem (no FPS line) behind an
        # unrelated ValueError.
        with open(log_file, 'r') as f:
            content = f.read()
        fps = [float(m.group(1)) for m in RE_FPS.finditer(content)]
        if len(fps) != 1:
            raise error.TestError('Parsing FPS failed w/ %d occurrence(s).' %
                                  len(fps))
        self._logperf(test_name, KEY_FPS, fps[0], UNIT_FPS, True)


    def _analyze_encode_latency(self, test_name, log_file):
        """
        Analyzes encode latency from result log file.

        @param test_name: Name of the test case.
        @param log_file: Path of the unittest output log.

        @raises error.TestError: if any of the three percentile lines is
                missing or appears more than once.
        """
        with open(log_file, 'r') as f:
            content = f.read()

        percentiles = [(KEY_ENCODE_LATENCY_50, RE_ENCODE_LATENCY_50),
                       (KEY_ENCODE_LATENCY_75, RE_ENCODE_LATENCY_75),
                       (KEY_ENCODE_LATENCY_95, RE_ENCODE_LATENCY_95)]
        latencies = [(key, [int(m.group(1)) for m in regex.finditer(content)])
                     for key, regex in percentiles]

        # Validate everything before logging so that a partial set of values
        # is never reported.
        if any(len(values) != 1 for _, values in latencies):
            raise error.TestError('Parsing encode latency failed.')

        for key, values in latencies:
            self._logperf(test_name, key, values[0], UNIT_MICROSECOND)


    def _analyze_cpu_usage(self, test_name, time_log_file):
        """
        Analyzes CPU usage from the output of 'time' command.

        The log is expected to hold exactly three numbers in the order given
        by TIME_OUTPUT_FORMAT: real, kernel and user time. User and kernel
        usage are reported as ratios of the real time.

        @param test_name: Name of the test case.
        @param time_log_file: Path of the file written by 'time -o'.

        @raises error.TestError: if the log cannot be parsed or the real time
                is not positive.
        """
        with open(time_log_file) as f:
            content = f.read()

        fields = content.split()
        if len(fields) != 3:
            raise error.TestError('Unexpected time output: %r' % content)
        try:
            real, kernel, user = [float(x) for x in fields]
        except ValueError:
            raise error.TestError('Unexpected time output: %r' % content)
        # Guard the divisions below.
        if real <= 0:
            raise error.TestError(
                    'Non-positive real time in time output: %r' % content)

        self._logperf(test_name, KEY_CPU_USER_USAGE, user / real, UNIT_RATIO)
        self._logperf(test_name, KEY_CPU_KERNEL_USAGE, kernel / real,
                      UNIT_RATIO)


    def _analyze_frame_stats(self, test_name, frame_stats_file):
        """
        Analyzes quality from --frame_stats output CSV. Assumes YUV420 (for MSE
        samples per channel).

        Each data row is expected to be
        frame,width,height,ssim_y,ssim_u,ssim_v,mse_y,mse_u,mse_v; a header
        row whose first field is 'frame' and blank lines are skipped. The
        min/max/avg of SSIM and PSNR are reported per channel and combined.

        @param test_name: Name of the test case.
        @param frame_stats_file: Path of the CSV written by the unittest.

        @raises error.TestError: if the file contains no frame rows.
        """
        def mse_to_psnr(samples, peak, mse):
            """
            Generate PSNR from MSE for a frame.
            """
            MAX_PSNR = 100.0
            # Prevent a divide-by-zero, MSE at 0 is perfect quality (no error).
            if mse == 0:
                return MAX_PSNR
            psnr = 10.0 * math.log10(peak * peak * samples / float(mse))
            return min(psnr, MAX_PSNR)

        frame_ssim = {'y': [], 'u': [], 'v': [], 'combined': []}
        frame_psnr = {'y': [], 'u': [], 'v': [], 'combined': []}
        with open(frame_stats_file) as stats:
            for line in stats:
                line = line.strip()
                if not line:
                    continue
                (frame, width, height,
                 ssim_y, ssim_u, ssim_v, mse_y, mse_u, mse_v) = line.split(',')
                # Skip CSV header.
                if frame == 'frame':
                    continue
                width = int(width)
                height = int(height)
                ssim_y = float(ssim_y)
                ssim_u = float(ssim_u)
                ssim_v = float(ssim_v)
                mse_y = int(mse_y)
                mse_u = int(mse_u)
                mse_v = int(mse_v)

                frame_ssim['y'].append(ssim_y)
                frame_ssim['u'].append(ssim_u)
                frame_ssim['v'].append(ssim_v)
                # Weighting of YUV channels for SSIM taken from libvpx.
                frame_ssim['combined'].append(
                        0.8 * ssim_y + 0.1 * (ssim_u + ssim_v))

                # Samples per MSE score assumes YUV420 subsampling. Floor
                # division keeps the sample counts integral.
                pixels = width * height
                frame_psnr['y'].append(
                        mse_to_psnr(pixels * 4 // 4, 255, mse_y))
                frame_psnr['u'].append(
                        mse_to_psnr(pixels * 1 // 4, 255, mse_u))
                frame_psnr['v'].append(
                        mse_to_psnr(pixels * 1 // 4, 255, mse_v))
                frame_psnr['combined'].append(
                        mse_to_psnr(
                                pixels * 6 // 4, 255, mse_y + mse_u + mse_v))

        # min()/max()/avg below are undefined for an empty sequence.
        if not frame_ssim['combined']:
            raise error.TestError(
                    'No frame stats found in %s.' % frame_stats_file)

        for channel in ['y', 'u', 'v', 'combined']:
            # Log stats with a key similar to 'quality.ssim.y.max'. For combined
            # stats the channel is omitted ('quality.ssim.max').
            key = 'quality.%s'
            # Compare by value: identity of string literals is an
            # implementation detail.
            if channel != 'combined':
                key += '.' + channel
            key += '.%s'
            for (stat, func) in [('min', min), ('max', max),
                                 ('avg', lambda x: sum(x) / len(x))]:
                self._logperf(test_name, key % ('ssim', stat),
                              func(frame_ssim[channel]), None,
                              higher_is_better=True)
                self._logperf(test_name, key % ('psnr', stat),
                              func(frame_psnr[channel]), None,
                              higher_is_better=True)


    def _get_profile_name(self, profile):
        """
        Gets profile name from a profile index.

        @param profile: Profile index; 1 maps to 'h264' and 11 to 'vp8'.

        @returns the profile name.

        @raises error.TestError: for any other profile index.
        """
        if profile == 1:
            return 'h264'
        elif profile == 11:
            return 'vp8'
        else:
            raise error.TestError('Internal error.')


    def _convert_test_name(self, path, on_cloud, profile):
        """Converts source path to test name and output video file name.

        For example: for the path on cloud

            "tulip2/tulip2-1280x720-1b95123232922fe0067869c74e19cd09.yuv"

        We will derive the test case's name as "tulip2-1280x720_vp8" or
        "tulip2-1280x720_h264" and the output video file name as
        "tulip2-1280x720.vp8" or "tulip2-1280x720.h264" depending on the
        profile. The MD5 checksum in path will be stripped.

        For the local file, we use the base name with its extension removed.

        @param path: The local path or download path.
        @param on_cloud: Whether the file is on cloud.
        @param profile: Profile index.

        @returns a pair of (test name, output video file name)
        """
        s = os.path.basename(path)
        separator_at = s.rfind('-' if on_cloud else '.')
        # rfind() returns -1 when the separator is absent; slicing with it
        # would silently drop the last character of the name.
        name = s if separator_at < 0 else s[:separator_at]
        profile_name = self._get_profile_name(profile)
        return (name + '_' + profile_name, name + '.' + profile_name)


    def _download_video(self, path_on_cloud, local_file):
        """
        Downloads a test video and verifies it against the MD5 in its path.

        @param path_on_cloud: Path of the video relative to DOWNLOAD_BASE; it
                must contain the MD5 hex digest of the file content.
        @param local_file: Path the video is saved to.

        @raises error.TestError: if the digest of the downloaded file does not
                appear in path_on_cloud.
        """
        url = '%s%s' % (DOWNLOAD_BASE, path_on_cloud)
        logging.info('download "%s" to "%s"', url, local_file)

        file_utils.download_file(url, local_file)

        # Hash in binary mode and in chunks so that the whole video never has
        # to be held in memory at once.
        md5 = hashlib.md5()
        with open(local_file, 'rb') as r:
            for chunk in iter(lambda: r.read(1024 * 1024), b''):
                md5.update(chunk)
        md5sum = md5.hexdigest()
        if md5sum not in path_on_cloud:
            raise error.TestError('unmatched md5 sum: %s' % md5sum)


    def _get_result_filename(self, test_name, subtype, suffix):
        """
        Builds '<resultsdir>/<test_name>_<subtype>_<suffix>'.

        @param test_name: Name of the test case.
        @param subtype: Name of the run the file belongs to.
        @param suffix: File suffix, e.g. TEST_LOG_SUFFIX.

        @returns the path of the result file.
        """
        return os.path.join(self.resultsdir,
                            '%s_%s_%s' % (test_name, subtype, suffix))


    def _get_vea_unittest_args(self, test_stream_data, test_log_file):
        """
        Builds the arguments shared by every run of the unittest binary.

        @param test_stream_data: Parameter to --test_stream_data.
        @param test_log_file: Path passed to --output_log.

        @returns a new list of command line arguments.
        """
        vea_args = [
            '--test_stream_data=%s' % test_stream_data,
            '--output_log="%s"' % test_log_file,
            '--ozone-platform=gbm',
            helper_logger.chrome_vmodule_flag()]
        return vea_args


    def _run_test_case(self, test_name, test_stream_data):
        """
        Runs a VEA unit test.

        @param test_name: Name of this test case.
        @param test_stream_data: Parameter to --test_stream_data in vea_unittest.
        """
        # Get FPS.
        test_log_file = self._get_result_filename(test_name, 'fullspeed',
                                                  TEST_LOG_SUFFIX)
        vea_args = self._get_vea_unittest_args(test_stream_data, test_log_file)
        vea_args += ['--gtest_filter=EncoderPerf/*/0']
        self.run_chrome_test_binary(VEA_BINARY, ' '.join(vea_args))
        self._analyze_fps(test_name, test_log_file)

        # Get CPU usage and encode latency under specified frame rate.
        test_log_file = self._get_result_filename(test_name, 'fixedspeed',
                                                  TEST_LOG_SUFFIX)
        time_log_file = self._get_result_filename(test_name, 'fixedspeed',
                                                  TIME_LOG_SUFFIX)
        vea_args = self._get_vea_unittest_args(test_stream_data, test_log_file)
        vea_args += ['--gtest_filter=SimpleEncode/*/0',
                     '--run_at_fps',
                     '--measure_latency']
        time_cmd = ('%s -f "%s" -o "%s" ' %
                    (TIME_BINARY, TIME_OUTPUT_FORMAT, time_log_file))
        self.run_chrome_test_binary(VEA_BINARY, ' '.join(vea_args),
                                    prefix=time_cmd)
        self._analyze_encode_latency(test_name, test_log_file)
        self._analyze_cpu_usage(test_name, time_log_file)

        # TODO(pbos): Measure quality at more bitrates.
        # Generate SSIM/PSNR scores (objective quality metrics).
        test_log_file = self._get_result_filename(test_name, 'quality',
                                                  TEST_LOG_SUFFIX)
        frame_stats_file = self._get_result_filename(test_name, 'quality',
                                                     FRAME_STATS_SUFFIX)
        vea_args = self._get_vea_unittest_args(test_stream_data, test_log_file)
        vea_args += ['--gtest_filter=SimpleEncode/*/0',
                     '--frame_stats="%s"' % frame_stats_file]
        self.run_chrome_test_binary(VEA_BINARY, ' '.join(vea_args))
        self._analyze_frame_stats(test_name, frame_stats_file)


    @helper_logger.video_log_wrapper
    @chrome_binary_test.nuke_chrome
    def run_once(self, test_cases, required_cap):
        """
        Tests ChromeOS video hardware encoder performance.

        Every test case is run even if an earlier one fails; the last error
        seen is re-raised once all of them have been attempted.

        @param test_cases: Iterable of tuples (path, on_cloud, width, height,
                requested_bit_rate, profile, requested_frame_rate).
        @param required_cap: Capability passed to
                DeviceCapability.ensure_capability() before any case runs.
        """
        last_error = None
        device_capability.DeviceCapability().ensure_capability(required_cap)
        for (path, on_cloud, width, height, requested_bit_rate,
             profile, requested_frame_rate) in test_cases:
            # Reset per iteration so that the cleanup below never sees an
            # unbound name or a path left over from the previous test case.
            input_path = None
            output_path = None
            try:
                test_name, output_name = self._convert_test_name(
                        path, on_cloud, profile)
                if on_cloud:
                    input_path = os.path.join(self.tmpdir,
                                              os.path.basename(path))
                    self._download_video(path, input_path)
                else:
                    input_path = os.path.join(self.cr_source_dir, path)
                output_path = os.path.join(self.tmpdir, output_name)
                test_stream_data = '%s:%s:%s:%s:%s:%s:%s' % (
                        input_path, width, height, profile, output_path,
                        requested_bit_rate, requested_frame_rate)
                self._run_test_case(test_name, test_stream_data)
            except Exception as e:
                # Log the error and continue to the next test case. The
                # exception is copied explicitly because the 'as' target does
                # not outlive the handler on Python 3.
                last_error = e
                logging.exception(e)
            finally:
                # Only downloaded inputs are temporary; local sources are kept.
                if on_cloud and input_path is not None:
                    _remove_if_exists(input_path)
                if output_path is not None:
                    _remove_if_exists(output_path)

        if last_error is not None:
            raise last_error