Context Navigation

← Previous Changeset
Next Changeset →

Changeset 96272 in webkit

Timestamp:

Sep 28, 2011 5:09:39 PM (13 years ago)

Author:

dpranke@chromium.org

Message:

Modify new-run-webkit-tests to return the percentage difference in image diffs where possible.

https://bugs.webkit.org/show_bug.cgi?id=67253

Reviewed by Eric Seidel.

Tools:

Nearly all of the work in this was done by Simon Fraser; I'm
just repackaging it and cleaning it up a bit. This change
modifies port.diff_image() to return a tuple of (pass/fail,
%age), adds the value to the FailureImageHashMismatch, and
writes the value into the full_results.json files to be
displayed in the results page.

Scripts/webkitpy/layout_tests/controllers/manager.py:
Scripts/webkitpy/layout_tests/controllers/single_test_runner.py:
Scripts/webkitpy/layout_tests/layout_package/test_result_writer.py:
Scripts/webkitpy/layout_tests/models/test_failures.py:
Scripts/webkitpy/layout_tests/port/base.py:
Scripts/webkitpy/layout_tests/port/chromium.py:
Scripts/webkitpy/layout_tests/port/chromium_unittest.py:
Scripts/webkitpy/layout_tests/port/port_testcase.py:
Scripts/webkitpy/layout_tests/port/test.py:
Scripts/webkitpy/layout_tests/port/webkit.py:
Scripts/webkitpy/layout_tests/run_webkit_tests_integrationtest.py:

LayoutTests:

fast/harness/resources/results-test.js:

(mockExpectation):
(runDefaultSingleRowTest):
():

fast/harness/results.html:

Location:

trunk

Files:

: 16 edited

LayoutTests/ChangeLog (modified) (1 diff)
LayoutTests/fast/harness/resources/results-test.js (modified) (5 diffs)
LayoutTests/fast/harness/results.html (modified) (1 diff)
Tools/ChangeLog (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/controllers/manager.py (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/controllers/single_test_runner.py (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/layout_package/test_result_writer.py (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/models/test_failures.py (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/port/base.py (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/port/chromium.py (modified) (2 diffs)
Tools/Scripts/webkitpy/layout_tests/port/chromium_unittest.py (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/port/port_testcase.py (modified) (4 diffs)
Tools/Scripts/webkitpy/layout_tests/port/test.py (modified) (1 diff)
Tools/Scripts/webkitpy/layout_tests/port/webkit.py (modified) (4 diffs)
Tools/Scripts/webkitpy/layout_tests/run_webkit_tests_integrationtest.py (modified) (3 diffs)
Tools/Scripts/webkitpy/to_be_moved/rebaseline_chromium_webkit_tests.py (modified) (2 diffs)

Legend:

: Unmodified
: Added
: Removed

trunk/LayoutTests/ChangeLog

-                      r96270
+                      r96272
+2011-09-28  Dirk Pranke  <dpranke@chromium.org>
+        Modify new-run-webkit-tests to return the percentage difference in image diffs where possible.
+        https://bugs.webkit.org/show_bug.cgi?id=67253
+        Reviewed by Eric Seidel.
+        * fast/harness/resources/results-test.js:
+        (mockExpectation):
+        (runDefaultSingleRowTest):
+        ():
+        * fast/harness/results.html:
 2011-09-28  Chris Rogers  <crogers@google.com>

trunk/LayoutTests/fast/harness/resources/results-test.js

-                      r89873
+                      r96272
+}
+function mockExpectation(expected, actual)
+{
+function mockExpectation(expected, actual, diff_percentage)
+{
+    diff_percentage = (typeof(diff_percentage) == undefined) ? 0 : diff_percentage;
     return {
         expected: expected,
         time_ms: 1,
         actual: actual,
+        image_diff_percent: diff_percentage,
         has_stderr: false
     };
 …
+}
 function runDefaultSingleRowTest(test, expected, actual, isExpected, textResults, imageResults)
+{
     results = mockResults();
     results.tests[test] = mockExpectation(expected, actual);
+function runDefaultSingleRowTest(test, expected, actual, diff_percentage, isExpected, textResults, imageResults)
+{
+    results = mockResults();
+    results.tests[test] = mockExpectation(expected, actual, diff_percentage);
     runSingleRowTest(results, isExpected, textResults, imageResults);
+}
 …
     });
     runDefaultSingleRowTest('bar-skip.html', 'TEXT', 'SKIP', true, '', '');
     runDefaultSingleRowTest('bar-flaky-fail.html', 'PASS FAIL', 'TEXT', true, 'expected actual diff ', '');
     runDefaultSingleRowTest('bar-flaky-fail-unexpected.html', 'PASS TEXT', 'IMAGE', false, '', 'images diff ');
     runDefaultSingleRowTest('bar-audio.html', 'TEXT', 'AUDIO', false, 'expected audio actual audio ', '');
     runDefaultSingleRowTest('bar-image.html', 'TEXT', 'IMAGE', false, '', 'images diff ');
     runDefaultSingleRowTest('bar-image-plus-text.html', 'TEXT', 'IMAGE+TEXT', false, 'expected actual diff ', 'images diff ');
     results = mockResults();
     results.tests['bar-reftest.html'] = mockExpectation('PASS', 'IMAGE');
+    runDefaultSingleRowTest('bar-skip.html', 'TEXT', 'SKIP', 0, true, '', '');
+    runDefaultSingleRowTest('bar-flaky-fail.html', 'PASS FAIL', 'TEXT', 0, true, 'expected actual diff ', '');
+    runDefaultSingleRowTest('bar-flaky-fail-unexpected.html', 'PASS TEXT', 'IMAGE', 1, false, '', 'images diff (1%) ');
+    runDefaultSingleRowTest('bar-audio.html', 'TEXT', 'AUDIO', 0, false, 'expected audio actual audio ', '');
+    runDefaultSingleRowTest('bar-image.html', 'TEXT', 'IMAGE', 1, false, '', 'images diff (1%) ');
+    runDefaultSingleRowTest('bar-image-plus-text.html', 'TEXT', 'IMAGE+TEXT', 1, false, 'expected actual diff ', 'images diff (1%) ');
+    results = mockResults();
+    results.tests['bar-reftest.html'] = mockExpectation('PASS', 'IMAGE', 1);
     results.tests['bar-reftest.html'].is_reftest = true;
     runSingleRowTest(results, false, '', 'ref html images diff ');
+    runSingleRowTest(results, false, '', 'ref html images diff (1%) ');
     results = mockResults();
 …
     results = mockResults();
     results.tests['bar.html'] = mockExpectation('PASS', 'IMAGE');
     runTest(results, function() {
         assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == 'images diff ');
+    results.tests['bar.html'] = mockExpectation('PASS', 'IMAGE', 1);
+    runTest(results, function() {
+        assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == 'images diff (1%) ');
         document.getElementById('toggle-images').checked = false;
 …
         updateTogglingImages();
         // FIXME: We get extra spaces in the DOM every time we enable/disable image toggling.
         assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == 'expected actual  diff ');
+        assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == 'expected actual  diff (1%) ');
         document.getElementById('toggle-images').checked = true;
         updateTogglingImages();
         assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == ' images   diff ');
     });
     results = mockResults();
     results.tests['reading-options-from-localstorage.html'] = mockExpectation('IMAGE+TEXT', 'IMAGE+TEXT');
+        assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == ' images   diff (1%) ');
+    });
+    results = mockResults();
+    results.tests['reading-options-from-localstorage.html'] = mockExpectation('IMAGE+TEXT', 'IMAGE+TEXT', 1);
     runTest(results, function() {
         assertTrue(window.getComputedStyle(document.querySelector('tbody'), null)['display'] != 'none');
         assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == 'expected actual  diff ');
+        assertTrue(document.querySelector('tbody td:nth-child(3)').textContent == 'expected actual  diff (1%) ');
     }, '{"toggle-images":false,"unexpected-results":false}');

trunk/LayoutTests/fast/harness/results.html

r94212	r96272
546	546	}
547	547
548		~~// FIXME: old-run-webkit-tests shows the diff percentage as the text contents of the "diff" link.~~
549		row += resultLink(test_prefix, '-diff.png', 'diff');
	548	var diff = testObject.image_diff_percent;
	549	row += resultLink(test_prefix, '-diff.png', 'diff (' + diff + '%)');
550	550	}
551	551	}

trunk/Tools/ChangeLog

-                      r96268
+                      r96272
+2011-09-28  Dirk Pranke  <dpranke@chromium.org>
+        Modify new-run-webkit-tests to return the percentage difference in image diffs where possible.
+        https://bugs.webkit.org/show_bug.cgi?id=67253
+        Reviewed by Eric Seidel.
+        Nearly all of the work in this was done by Simon Fraser; I'm
+        just repackaging it and cleaning it up a bit. This change
+        modifies port.diff_image() to return a tuple of (pass/fail,
+        %age), adds the value to the FailureImageHashMismatch, and
+        writes the value into the full_results.json files to be
+        displayed in the results page.
+        * Scripts/webkitpy/layout_tests/controllers/manager.py:
+        * Scripts/webkitpy/layout_tests/controllers/single_test_runner.py:
+        * Scripts/webkitpy/layout_tests/layout_package/test_result_writer.py:
+        * Scripts/webkitpy/layout_tests/models/test_failures.py:
+        * Scripts/webkitpy/layout_tests/port/base.py:
+        * Scripts/webkitpy/layout_tests/port/chromium.py:
+        * Scripts/webkitpy/layout_tests/port/chromium_unittest.py:
+        * Scripts/webkitpy/layout_tests/port/port_testcase.py:
+        * Scripts/webkitpy/layout_tests/port/test.py:
+        * Scripts/webkitpy/layout_tests/port/webkit.py:
+        * Scripts/webkitpy/layout_tests/run_webkit_tests_integrationtest.py:
 2011-09-25  Kentaro Hara  <haraken@chromium.org>

trunk/Tools/Scripts/webkitpy/layout_tests/controllers/manager.py

r95441	r96272
171	171	if 'is_reftest' in result.failures:
172	172	test_dict['is_reftest'] = True
	173	if type(f) is test_failures.FailureImageHashMismatch:
	174	test_dict['image_diff_percent'] = f.diff_percent
173	175
174	176	if test_failures.FailureReftestMismatchDidNotOccur in failure_types:

trunk/Tools/Scripts/webkitpy/layout_tests/controllers/single_test_runner.py

-                      r90532
+                      r96272
             failures.append(test_failures.FailureMissingImageHash())
         elif driver_output.image_hash != expected_driver_output.image_hash:
+            driver_output.image_diff = self._port.diff_image(driver_output.image, expected_driver_output.image)
+            diff_result = self._port.diff_image(driver_output.image, expected_driver_output.image)
+            driver_output.image_diff = diff_result[0]
             if driver_output.image_diff:
                 failures.append(test_failures.FailureImageHashMismatch())
+                failures.append(test_failures.FailureImageHashMismatch(diff_result[1]))
         return failures

trunk/Tools/Scripts/webkitpy/layout_tests/layout_package/test_result_writer.py

r90532	r96272
71	71	writer.write_image_files(driver_output.image, expected_driver_output.image)
72	72	# FIXME: This work should be done earlier in the pipeline (e.g., when we compare images for non-ref tests).
73		image_diff = port.diff_image(driver_output.image, expected_driver_output.image)
	73	image_diff = port.diff_image(driver_output.image, expected_driver_output.image)[0]
74	74	if image_diff:
75	75	writer.write_image_diff_files(image_diff)

trunk/Tools/Scripts/webkitpy/layout_tests/models/test_failures.py

r90532	r96272
168	168	class FailureImageHashMismatch(TestFailure):
169	169	"""Image hashes didn't match."""
	170	def __init__(self, diff_percent=0):
	171	self.diff_percent = diff_percent
170	172
171	173	@staticmethod

trunk/Tools/Scripts/webkitpy/layout_tests/port/base.py

r93166	r96272
258	258
259	259	def diff_image(self, expected_contents, actual_contents, tolerance=0):
260		"""Compare two images and return a~~n image diff~~.
	260	"""Compare two images and return a tuple of an image diff, and a percentage difference (0-100).
261	261
262	262	|tolerance| should be a percentage value (0.0 - 100.0).

trunk/Tools/Scripts/webkitpy/layout_tests/port/chromium.py

-                      r95875
+                      r96272
         # If only one of them exists, return that one.
         if not actual_contents and not expected_contents:
             return None
+            return (None, 0)
         if not actual_contents:
             return expected_contents
+            return (expected_contents, 0)
         if not expected_contents:
             return actual_contents
+            return (actual_contents, 0)
         tempdir = self._filesystem.mkdtemp()
 …
                 result = self._filesystem.read_binary_file(native_diff_filename)
             self._filesystem.rmtree(str(tempdir))
         return result
+        return (result, 0)  # FIXME: how to get % diff?
     def path_from_chromium_base(self, *comps):

trunk/Tools/Scripts/webkitpy/layout_tests/port/chromium_unittest.py

-                      r94219
+                      r96272
         # Images are different.
         port._executive = executive_mock.MockExecutive2(run_command_fn=mock_run_command)
         self.assertEquals(mock_image_diff, port.diff_image("EXPECTED", "ACTUAL"))
+        self.assertEquals(mock_image_diff, port.diff_image("EXPECTED", "ACTUAL")[0])
         # Images are the same.
         port._executive = executive_mock.MockExecutive2(exit_code=0)
         self.assertEquals(None, port.diff_image("EXPECTED", "ACTUAL"))
+        self.assertEquals(None, port.diff_image("EXPECTED", "ACTUAL")[0])
         # There was some error running image_diff.

trunk/Tools/Scripts/webkitpy/layout_tests/port/port_testcase.py

-                      r93176
+                      r96272
         tmpfd.close()
         self.assertFalse(port.diff_image(contents1, contents1))
         self.assertTrue(port.diff_image(contents1, contents2))
         self.assertTrue(port.diff_image(contents1, contents2, tmpfile))
+        self.assertFalse(port.diff_image(contents1, contents1)[0])
+        self.assertTrue(port.diff_image(contents1, contents2)[0])
+        self.assertTrue(port.diff_image(contents1, contents2, tmpfile)[0])
         port._filesystem.remove(tmpfile)
 …
         if not port:
             return
         self.assertFalse(port.diff_image(None, None))
         self.assertFalse(port.diff_image(None, ''))
         self.assertFalse(port.diff_image('', None))
         self.assertFalse(port.diff_image('', ''))
+        self.assertFalse(port.diff_image(None, None)[0])
+        self.assertFalse(port.diff_image(None, '')[0])
+        self.assertFalse(port.diff_image('', None)[0])
+        self.assertFalse(port.diff_image('', '')[0])
     def test_diff_image__missing_actual(self):
 …
         if not port:
             return
         self.assertTrue(port.diff_image(None, 'foo'))
         self.assertTrue(port.diff_image('', 'foo'))
+        self.assertTrue(port.diff_image(None, 'foo')[0])
+        self.assertTrue(port.diff_image('', 'foo')[0])
     def test_diff_image__missing_expected(self):
 …
         if not port:
             return
         self.assertTrue(port.diff_image('foo', None))
         self.assertTrue(port.diff_image('foo', ''))
+        self.assertTrue(port.diff_image('foo', None)[0])
+        self.assertTrue(port.diff_image('foo', '')[0])
     def test_check_build(self):

trunk/Tools/Scripts/webkitpy/layout_tests/port/test.py

-                      r94316
+                      r96272
         diffed = actual_contents != expected_contents
         if diffed:
             return "< %s\n---\n> %s\n" % (expected_contents, actual_contents)
         return None
+            return ["< %s\n---\n> %s\n" % (expected_contents, actual_contents), 1]
+        return (None, 0)
     def layout_tests_dir(self):

trunk/Tools/Scripts/webkitpy/layout_tests/port/webkit.py

-                      r95911
+                      r96272
         # FIXME: need unit tests for this.
         if not actual_contents and not expected_contents:
             return None
+            return (None, 0)
         if not actual_contents or not expected_contents:
             # FIXME: It's not clear what we should return in this case.
             # Maybe we should throw an exception?
             return True
+            return (True, 0)
         process = self._start_image_diff_process(expected_contents, actual_contents)
 …
         deadline = time.time() + timeout
         output = sp.read_line(timeout)
+        output_image = ""
+        diff_percent = 0
         while not sp.timed_out and not sp.crashed and output:
             if output.startswith('Content-Length'):
 …
                 content_length = int(m.group(1))
                 timeout = deadline - time.time()
+                output = sp.read(timeout, content_length)
+                output_image = sp.read(timeout, content_length)
+                output = sp.read_line(timeout)
                 break
             elif output.startswith('diff'):
 …
             m = re.match('diff: (.+)% (passed|failed)', output)
             if m.group(2) == 'passed':
+                return None
+        return output
+                return [None, 0]
+            diff_percent = float(m.group(1))
+        return (output_image, diff_percent)
     def default_results_directory(self):

trunk/Tools/Scripts/webkitpy/layout_tests/run_webkit_tests_integrationtest.py

-                      r95441
+                      r96272
     multiprocessing = None
+try:
+    import json
+except ImportError:
+    # python 2.5 compatibility
+    import webkitpy.thirdparty.simplejson as json
 # FIXME: remove this when we fix test-webkitpy to work properly on cygwin
 # (bug 63846).
 …
             def diff_image(self, expected_contents, actual_contents):
                 self.tolerance_used_for_diff_image = self._options.tolerance
                 return True
+                return (True, 1)
         def get_port_for_run(args):
 …
 MainTest = skip_if(MainTest, sys.platform == 'cygwin' and compare_version(sys, '2.6')[0] < 0, 'new-run-webkit-tests tests hang on Cygwin Python 2.5.2')
+class EndToEndTest(unittest.TestCase):
+    def parse_full_results(self, full_results_text):
+        json_to_eval = full_results_text.replace("ADD_RESULTS(", "").replace(");", "")
+        compressed_results = json.loads(json_to_eval)
+        return compressed_results
+    def test_end_to_end(self):
+        fs = unit_test_filesystem()
+        res, out, err, user = logging_run(record_results=True, tests_included=True, filesystem=fs)
+        # Six tests should fail, so the return code should be 6.
+        self.assertEquals(res, 6)
+        results = self.parse_full_results(fs.files['/tmp/layout-test-results/full_results.json'])
+        # Check to ensure we're passing back image diff %age correctly.
+        self.assertEquals(results['tests']['failures']['expected']['image.html']['image_diff_percent'], 1)
+        # Check that we attempted to display the results page in a browser.
+        self.assertTrue(user.opened_urls)
 class RebaselineTest(unittest.TestCase):

trunk/Tools/Scripts/webkitpy/to_be_moved/rebaseline_chromium_webkit_tests.py

-                      r94031
+                      r96272
         if is_image:
             return self._port.diff_image(output1, output2)
+            return self._port.diff_image(output1, output2)[0]
         return self._port.compare_text(output1, output2)
 …
             old_output = self._filesystem.read_binary_file(old_file)
             new_output = self._filesystem.read_binary_file(new_file)
             image_diff = self._port.diff_image(old_output, new_output)
+            image_diff = self._port.diff_image(old_output, new_output)[0]
             self._filesystem.write_binary_file(diff_file, image_diff)

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 96272 in webkit

Legend:

Download in other formats: