appengine/findit/util_scripts/crash_queries/delta_test/delta_test.py - Issue 2400283003: [Findit] Add skeleton code for delta test script.

Unified Diff: appengine/findit/util_scripts/crash_queries/delta_test/delta_test.py

Issue 2400283003: [Findit] Add skeleton code for delta test script. (Closed)

Patch Set: Rebase. Created 4 years, 2 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

« no previous file with comments | « appengine/findit/util_scripts/crash_queries/delta_test/__init__.py ('k') | appengine/findit/util_scripts/crash_queries/delta_test/delta_util.py » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: appengine/findit/util_scripts/crash_queries/delta_test/delta_test.py

diff --git a/appengine/findit/util_scripts/crash_queries/delta_test/delta_test.py b/appengine/findit/util_scripts/crash_queries/delta_test/delta_test.py

new file mode 100644

index 0000000000000000000000000000000000000000..b4f4a6d13cc21f752202eade8cc4efab1c42f75f

--- /dev/null

+++ b/appengine/findit/util_scripts/crash_queries/delta_test/delta_test.py

@@ -0,0 +1,211 @@

+# Use of this source code is governed by a BSD-style license that can be

+# found in the LICENSE file.

+import json

+import logging

+import os

+import pickle

+import subprocess

+from crash_queries import crash_iterator

+from crash_queries.delta_test import delta_util

+AZALEA_RESULTS_DIRECTORY = os.path.join(os.path.dirname(__file__),

+ 'azalea_results')

+DELTA_TEST_DIRECTORY = os.path.dirname(__file__)

+class Delta(object):

+ """Stands for delta between two results.

+ Note, the 2 results should be the same kind and have the same structure.

+ """

+ def __init__(self, result1, result2, fields):

+ self._result1 = result1

+ self._result2 = result2

+ self._fields = fields

+ self._delta_dict = {}

+ self._delta_str_dict = {}

+ @property

+ def delta_dict(self):

+ """Dict representation of delta.

+ Returns:

+ A dict. For example, for Culprit result, the delta dict is like below:

+ {

+ 'project': 'chromium',

+ 'components': ['Blink>API'],

+ 'cls': [],

+ 'regression_range': ['52.0.1200.1', '52.0.1200.3']

+ }

+ """

+ if self._delta_dict:

+ return self._delta_dict

+ for field in self._fields:

+ value1 = getattr(self._result1, field)

+ value2 = getattr(self._result2, field)

+ if value1 != value2:

+ if hasattr(value1, 'ToDict') and callable(value1.ToDict):

+ value1 = value1.ToDict()

+ value2 = value2.ToDict()

+ self._delta_dict[field] = (value1, value2)

+ return self._delta_dict

+ @property

+ def delta_str_dict(self):

+ """Converts delta of each field to a string."""

+ if self._delta_str_dict:

+ return self._delta_str_dict

+ for key, (value1, value2) in self.delta_dict.iteritems():

+ self._delta_str_dict[key] = '%s: %s, %s' % (key, value1, value2)

+ return self._delta_str_dict

+ def ToDict(self):

+ return self.delta_dict

+ def __str__(self):

+ return '\n'.join(self.delta_str_dict.values())

+ def __bool__(self):

+ return bool(self.delta_dict)

+ def __nonzero__(self):

+ return self.__bool__()

+def GetDeltasFromTwoSetsOfResults(set1, set2):

+ """Gets delta from two sets of results.

+ Set1 and set2 are dicts mapping id to result.

+ Results are a list of (message, matches, component_name, cr_label)

+ Returns a list of delta results (results1, results2).

+ """

+ deltas = {}

+ for result_id, result1 in set1.iteritems():

+ # Even when the command are exactly the same, it's possible that one set is

+ # loaded from local result file, another is just queried from database,

+ # sometimes some crash results would get deleted.

+ if result_id not in set2:

+ continue

+ result2 = set2[result_id]

+ delta = Delta(result1, result2, result1.fields)

+ if delta:

+ deltas[result_id] = delta

+ return deltas

+def GetResults(crashes, client_id, git_hash, result_path, verbose=False):

+ """Returns an evaluator function to compute delta between 2 findit githashes.

+ Args:

+ crashes (list): A list of crash infos.

+ client_id (str): Possible values - fracas/cracas/clustefuzz.

+ git_hash (str): A git hash of findit repository.

+ result_path (str): file path for subprocess to write results on.

+ verbose (bool): If True, print all the findit results.

+ Return:

+ A dict mapping crash id to culprit for every crashes analyzed by

+ git_hash version.

+ """

+ if not crashes:

+ return {}

+ if verbose:

+ logging.info('\n\n***************************')

+ logging.info('Switching to git %s', git_hash)

+ logging.info('***************************\n\n')

+ with open(os.devnull, 'w') as null_handle:

+ subprocess.check_call(

+ 'cd %s; git checkout %s' % (DELTA_TEST_DIRECTORY, git_hash),

+ stdout=null_handle,

+ stderr=null_handle,

+ shell=True)

+ if not os.path.exists(result_path):

+ args = ['python', 'run-predator.py', result_path, '--client', client_id]

+ if verbose:

+ args.append('--verbose')

+ p = subprocess.Popen(args, stdin=subprocess.PIPE)

+ # TODO(katesonia): Cache crashes for crash_iterator and let subprocess read

+ # corresponding cache file instead.

+ p.communicate(input=json.dumps(crashes))

+ else:

+ logging.info('\nLoading results from %s', result_path)

+ if not os.path.exists(result_path):

+ logging.error('Failed to get results.')

+ return {}

+ with open(result_path) as f:

+ return pickle.load(f)

+ return {}

+def DeltaEvaluator(git_hash1, git_hash2,

+ client_id, app_id,

+ start_date, end_date, batch_size,

+ property_values=None, verbose=False):

+ """Evaluates delta between git_hash1 and git_hash2 on a set of Testcases.

+ Args:

+ git_hash1 (str): A git hash of findit repository.

+ git_hash2 (str): A git hash of findit repository.

+ start_date (str): Run delta test on testcases after (including)

+ the start_date, format should be '%Y-%m-%d'.

+ end_date (str): Run delta test on testcases before (not including)

+ the end_date, format should be '%Y-%m-%d'.

+ client_id (CrashClient): Possible values are 'fracas', 'cracas',

+ 'cluterfuzz'.

+ app_id (str): Appengine app id to query.

+ batch_size (int): Size of a batch that can be queried at one time.

+ property_values (dict): Property values to query.

+ batch_size (int): The size of crashes that can be queried at one time.

+ verbose (bool): If True, print all the findit results.

+ Return:

+ (deltas, crash_count).

+ deltas (dict): Mappings id to delta for each culprit value.

+ crash_count (int): Total count of all the crashes.

+ """

+ head_branch_name = subprocess.check_output(

+ ['git', 'rev-parse', '--abbrev-ref', 'HEAD']).replace('\n', '')

+ try:

+ deltas = {}

+ crash_count = 0

+ for index, crashes in enumerate(

+ crash_iterator.IterateCrashes(client_id, app_id,

+ property_values=property_values,

+ start_date=start_date,

+ end_date=end_date,

+ batch_size=batch_size,

+ batch_run=True)):

+ results = []

+ for git_hash in [git_hash1, git_hash2]:

+ result_path = os.path.join(

+ AZALEA_RESULTS_DIRECTORY, delta_util.GenerateFileName(

+ client_id, property_values, start_date, end_date,

+ batch_size, index, git_hash))

+ results.append(GetResults(crashes, client_id, git_hash, result_path,

+ verbose=verbose))

+ crash_count += len(crashes)

+ deltas.update(GetDeltasFromTwoSetsOfResults(*results))

+ return deltas, crash_count

+ finally:

+ with open(os.devnull, 'w') as null_handle:

+ subprocess.check_call(['git', 'checkout', head_branch_name],

+ stdout=null_handle,

+ stderr=null_handle)