# Copyright (c) 2011 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.

import logging, os, re
from autotest_lib.client.bin import utils
from autotest_lib.client.common_lib import error
from autotest_lib.client.cros import crash_test

# Negative mtime delta, in seconds, used to make a file look 25 hours old.
_25_HOURS_AGO = -25 * 60 * 60
_CRASH_SENDER_CRON_PATH = '/etc/cron.hourly/crash_sender.hourly'
# Number of sends the rate-limiting test expects to succeed before the
# sender starts refusing.
_DAILY_RATE_LIMIT = 32
# Minimum number of distinct sleep times expected across _DAILY_RATE_LIMIT
# sends.
_MIN_UNIQUE_TIMES = 4
# Exclusive upper bound on the sleep time reported by the sender.
_SECONDS_SEND_SPREAD = 3600


class logging_CrashSender(crash_test.CrashTest):
    """
    End-to-end test of crash_sender.

    Each _test_sender_* method is one scenario; run_once() hands their names
    to run_crash_tests() from the CrashTest base class.
    """
    version = 1


    def _check_hardware_info(self, result):
        """Verify the sender output names this device's board and HWID.

        result is the dictionary returned by _call_sender_one_crash(); only
        its 'output' entry is examined.

        Raises error.TestError if /etc/lsb-release has no
        CHROMEOS_RELEASE_BOARD entry, and error.TestFail if the expected
        'Board:' or 'HWClass:' text is missing from the output.
        """
        # Get board name
        lsb_release = utils.read_file('/etc/lsb-release')
        board_match = re.search(r'CHROMEOS_RELEASE_BOARD=(.*)', lsb_release)
        if board_match is None:
            # Without this guard a missing key surfaces as an opaque
            # AttributeError on None.
            raise error.TestError(
                    'CHROMEOS_RELEASE_BOARD not found in /etc/lsb-release')
        board = board_match.group(1)
        if ('Board: %s' % board) not in result['output']:
            raise error.TestFail('Missing board name %s in output' % board)
        # Get hwid
        with os.popen("crossystem hwid 2>/dev/null", "r") as hwid_proc:
            hwclass = hwid_proc.read()
        if not hwclass:
            # No output from crossystem: expect the 'undefined' placeholder.
            hwclass = 'undefined'
        if ('HWClass: %s' % hwclass) not in result['output']:
            raise error.TestFail('Expected hwclass %s in output' % hwclass)


    def _check_simple_minidump_send(self, report, log_path=None):
        """Send one minidump report and verify every reported field.

        report is passed straight to _call_sender_one_crash(); None is
        accepted (presumably the helper then creates a default fake report
        -- confirm in crash_test.CrashTest).  When log_path is given, the
        sender output must also contain a 'log: @<log_path>' entry.

        Raises error.TestFail on any mismatch.
        """
        result = self._call_sender_one_crash(report=report)
        expected_payload = self.get_crash_dir_name(
                '%s.dmp' % self._FAKE_TEST_BASENAME)
        if (result['report_exists'] or
            result['rate_count'] != 1 or
            not result['send_attempt'] or
            not result['send_success'] or
            result['sleep_time'] < 0 or
            result['sleep_time'] >= _SECONDS_SEND_SPREAD or
            result['report_kind'] != 'minidump' or
            result['report_payload'] != expected_payload or
            result['exec_name'] != 'fake' or
            'Version: my_ver' not in result['output']):
            raise error.TestFail('Simple minidump send failed')
        if log_path and ('log: @%s' % log_path) not in result['output']:
            raise error.TestFail('Minidump send missing log')
        self._check_hardware_info(result)
        # Also test "Image type" field.  Note that it will not be "dev" even
        # on a dev build because /tmp/crash-test-in-progress will exist.
        if result['image_type']:
            raise error.TestFail('Image type "%s" should not exist' %
                                 result['image_type'])
        # Also test "Boot mode" field.  Note that it will not be "dev" even
        # when booting in dev mode because /tmp/crash-test-in-progress will
        # exist.
        if result['boot_mode']:
            raise error.TestFail('Boot mode "%s" should not exist' %
                                 result['boot_mode'])


    def _test_sender_simple_minidump(self):
        """Test sending a single minidump crash report."""
        self._check_simple_minidump_send(None)


    def _test_sender_simple_minidump_with_log(self):
        """Test that a minidump report with an auxiliary log is sent."""
        dmp_path = self.write_crash_dir_entry(
            '%s.dmp' % self._FAKE_TEST_BASENAME, '')
        log_path = self.write_crash_dir_entry(
            '%s.log' % self._FAKE_TEST_BASENAME, '')
        meta_path = self.write_fake_meta(
            '%s.meta' % self._FAKE_TEST_BASENAME, 'fake', dmp_path,
            log=log_path)
        self._check_simple_minidump_send(meta_path, log_path)


    def _shift_file_mtime(self, path, delta):
        """Add delta seconds to the mtime of path, keeping its atime."""
        statinfo = os.stat(path)
        os.utime(path, (statinfo.st_atime,
                        statinfo.st_mtime + delta))


    def _test_sender_simple_old_minidump(self):
        """Test that old minidumps and metadata are sent."""
        dmp_path = self.write_crash_dir_entry(
            '%s.dmp' % self._FAKE_TEST_BASENAME, '')
        meta_path = self.write_fake_meta(
            '%s.meta' % self._FAKE_TEST_BASENAME, 'fake', dmp_path)
        self._shift_file_mtime(dmp_path, _25_HOURS_AGO)
        self._shift_file_mtime(meta_path, _25_HOURS_AGO)
        self._check_simple_minidump_send(meta_path)


    def _test_sender_simple_kernel_crash(self):
        """Test sending a single kcrash report."""
        kcrash_fake_report = self.write_crash_dir_entry(
            'kernel.today.kcrash', '')
        self.write_fake_meta('kernel.today.meta',
                             'kernel',
                             kcrash_fake_report)
        result = self._call_sender_one_crash(report=kcrash_fake_report)
        expected_payload = self.get_crash_dir_name('kernel.today.kcrash')
        if (result['report_exists'] or
            result['rate_count'] != 1 or
            not result['send_attempt'] or
            not result['send_success'] or
            result['sleep_time'] < 0 or
            result['sleep_time'] >= _SECONDS_SEND_SPREAD or
            result['report_kind'] != 'kcrash' or
            result['report_payload'] != expected_payload or
            result['exec_name'] != 'kernel'):
            raise error.TestFail('Simple kcrash send failed')
        self._check_hardware_info(result)


    def _test_sender_pausing(self):
        """Test the sender returns immediately when the pause file is present.

        This is testing the sender's test functionality - if this regresses,
        other tests can become flaky because the cron-started sender may run
        asynchronously to these tests.  Disable child sending as normally
        this environment configuration allows our children to run in spite of
        the pause file."""
        self._set_system_sending(False)
        self._set_child_sending(False)
        result = self._call_sender_one_crash(should_fail=True)
        if (not result['report_exists'] or
            'Exiting early due to' not in result['output'] or
            result['send_attempt']):
            raise error.TestFail('Sender did not pause')


    def _test_sender_reports_disabled(self):
        """Test that when reporting is disabled, we don't send."""
        result = self._call_sender_one_crash(reports_enabled=False)
        if (result['report_exists'] or
            'Crash reporting is disabled' not in result['output'] or
            result['send_attempt']):
            raise error.TestFail('Sender did not handle reports disabled')


    def _test_sender_rate_limiting(self):
        """Test the sender properly rate limits and sends with delay."""
        sleep_times = []
        for i in range(1, _DAILY_RATE_LIMIT + 1):
            result = self._call_sender_one_crash()
            if not result['send_attempt'] or not result['send_success']:
                raise error.TestFail('Crash uploader did not send on #%d' % i)
            if result['rate_count'] != i:
                raise error.TestFail('Did not properly persist rate on #%d' %
                                     i)
            sleep_times.append(result['sleep_time'])
        logging.debug('Sleeps between sending crashes were: %s', sleep_times)
        # The delay before each send should vary, so require a minimum
        # number of distinct values.
        unique_times = set(sleep_times)
        if len(unique_times) < _MIN_UNIQUE_TIMES:
            # Both values must be passed as one tuple; formatting with a
            # single value raises TypeError instead of the intended TestFail.
            raise error.TestFail('Expected at least %d unique times: %s' %
                                 (_MIN_UNIQUE_TIMES, sleep_times))
        # The next send request, one past _DAILY_RATE_LIMIT, should be
        # refused and must not bump the rate count.
        result = self._call_sender_one_crash()
        if (not result['report_exists'] or
            'Cannot send more crashes' not in result['output'] or
            result['rate_count'] != _DAILY_RATE_LIMIT):
            raise error.TestFail('Crash rate limiting did not take effect')

        # Set one rate file a day earlier and verify can send
        rate_files = os.listdir(self._CRASH_SENDER_RATE_DIR)
        rate_path = os.path.join(self._CRASH_SENDER_RATE_DIR, rate_files[0])
        self._shift_file_mtime(rate_path, _25_HOURS_AGO)
        utils.system('ls -l ' + self._CRASH_SENDER_RATE_DIR)
        result = self._call_sender_one_crash()
        if (not result['send_attempt'] or
            not result['send_success'] or
            result['rate_count'] != _DAILY_RATE_LIMIT):
            raise error.TestFail('Crash not sent even after 25hrs pass')


    def _test_sender_single_instance(self):
        """Test the sender fails to start when another instance is running."""
        with self.hold_crash_lock():
            result = self._call_sender_one_crash(should_fail=True)
            if ('Already running; quitting.' not in result['output'] or
                result['send_attempt'] or
                not result['report_exists']):
                raise error.TestFail('Allowed multiple instances to run')


    def _test_sender_send_fails(self):
        """Test that when the send fails we try again later."""
        result = self._call_sender_one_crash(send_success=False)
        if not result['send_attempt'] or result['send_success']:
            raise error.TestError('Did not properly cause a send failure')
        if result['rate_count'] != 1:
            raise error.TestFail('Did not count a failed send against rate '
                                 'limiting')
        if not result['report_exists']:
            raise error.TestFail('Expected minidump to be saved for later '
                                 'sending')

        # Also test "Image type" field.  For testing purposes, we set it upon
        # mock failure.  Note that it will not be "dev" even on a dev build
        # because /tmp/crash-test-in-progress will exist.
        if not result['image_type']:
            raise error.TestFail('Missing image type on mock failure')
        if result['image_type'] != 'mock-fail':
            raise error.TestFail('Incorrect image type on mock failure '
                                 '("%s" != "mock-fail")' %
                                 result['image_type'])


    def _test_sender_orphaned_files(self):
        """Test that payload and unknown files that are old are removed."""
        core_file = self.write_crash_dir_entry('random1.core', '')
        unknown_file = self.write_crash_dir_entry('.unknown', '')
        # As new files, we expect crash_sender to leave these alone.
        results = self._call_sender_one_crash()
        if ('Removing old orphaned file' in results['output'] or
            not os.path.exists(core_file) or
            not os.path.exists(unknown_file)):
            raise error.TestFail('New orphaned files were removed')
        self._shift_file_mtime(core_file, _25_HOURS_AGO)
        self._shift_file_mtime(unknown_file, _25_HOURS_AGO)
        results = self._call_sender_one_crash()
        if ('Removing old orphaned file' not in results['output'] or
            os.path.exists(core_file) or
            os.path.exists(unknown_file)):
            raise error.TestFail(
                'Old orphaned files were not removed')


    def _test_sender_incomplete_metadata(self):
        """Test that incomplete metadata file is removed once old."""
        dmp_file = self.write_crash_dir_entry('incomplete.1.2.3.dmp', '')
        meta_file = self.write_fake_meta('incomplete.1.2.3.meta',
                                         'unknown',
                                         dmp_file,
                                         complete=False)
        # As new files, we expect crash_sender to leave these alone.
        results = self._call_sender_one_crash()
        if ('Removing recent incomplete report' in results['output'] or
            not os.path.exists(meta_file) or
            not os.path.exists(dmp_file)):
            raise error.TestFail('New unknown files were removed')
        # Only the metadata file is aged; the payload is expected to be
        # removed along with it.
        self._shift_file_mtime(meta_file, _25_HOURS_AGO)
        results = self._call_sender_one_crash()
        if ('Removing old incomplete metadata' not in results['output'] or
            os.path.exists(meta_file) or
            os.path.exists(dmp_file)):
            raise error.TestFail(
                'Old unknown/incomplete files were not removed')


    def _test_sender_missing_payload(self):
        """Test that a report whose payload file is missing is removed.

        The metadata names 'bad.dmp' as its payload, but that file is never
        written.  Both the metadata file and the sibling 'bad.other' file are
        expected to be gone afterwards.
        """
        meta_file = self.write_fake_meta('bad.meta',
                                         'unknown',
                                         'bad.dmp')
        other_file = self.write_crash_dir_entry('bad.other', '')
        results = self._call_sender_one_crash(report=meta_file)
        # Should remove this file.
        if ('Missing payload' not in results['output'] or
            os.path.exists(meta_file) or
            os.path.exists(other_file)):
            raise error.TestFail('Missing payload case handled wrong')


    def _test_sender_error_type(self):
        """Test that the error type in the metadata is reported.

        Also covers the force-official image type override and the mocked
        developer boot mode.
        """
        dmp_file = self.write_crash_dir_entry('error_type.dmp', '')
        # Written with complete=False so the extra keyvals can be appended
        # before the report is marked done (presumably complete=False omits
        # the "done" entry -- confirm in write_fake_meta).
        meta_file = self.write_fake_meta('error_type.meta',
                                         'fake',
                                         dmp_file,
                                         complete=False)
        utils.write_keyval(meta_file, {"error_type": "system-issue"})
        utils.write_keyval(meta_file, {"done": "1"})
        self._set_force_official(True)  # also test this
        self._set_mock_developer_mode(True)  # also test "boot_mode" field
        result = self._call_sender_one_crash(report=meta_file)
        if not result['error_type']:
            raise error.TestFail('Missing error type')
        if result['error_type'] != 'system-issue':
            raise error.TestFail('Incorrect error type "%s"' %
                                 result['error_type'])
        # Also test force-official override by checking the image type.  Note
        # that it will not be "dev" even on a dev build because
        # /tmp/crash-test-in-progress will exist.
        if not result['image_type']:
            raise error.TestFail('Missing image type when forcing official')
        if result['image_type'] != 'force-official':
            raise error.TestFail('Incorrect image type ("%s" != '
                                 '"force-official")' % result['image_type'])
        # Also test "Boot mode" field.  For testing purposes, it should
        # have been set to "dev" mode.
        if not result['boot_mode']:
            raise error.TestFail('Missing boot mode when mocking dev mode')
        if result['boot_mode'] != 'dev':
            raise error.TestFail('Incorrect boot mode when mocking dev mode '
                                 '("%s" != "dev")' % result['boot_mode'])


    def run_once(self):
        """Run every crash_sender scenario through run_crash_tests().

        Each name presumably maps to the matching _test_<name> method above
        -- confirm in crash_test.CrashTest.
        """
        self.run_crash_tests([
            'sender_simple_minidump',
            'sender_simple_old_minidump',
            'sender_simple_minidump_with_log',
            'sender_simple_kernel_crash',
            'sender_pausing',
            'sender_reports_disabled',
            'sender_rate_limiting',
            'sender_single_instance',
            'sender_send_fails',
            'sender_orphaned_files',
            'sender_incomplete_metadata',
            'sender_missing_payload',
            'sender_error_type'])