aboutsummaryrefslogtreecommitdiffhomepage
path: root/tools/flakes/detect_flakes.py
blob: b066ee613939b2341b28466d9d9ba61219d32afc (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
#!/usr/bin/env python
# Copyright 2015 gRPC authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Detect new flakes introduced in the last 24h hours with respect to the
previous six days"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import datetime
import os
import sys
import logging
logging.basicConfig(format='%(asctime)s %(message)s')

gcp_utils_dir = os.path.abspath(
    os.path.join(os.path.dirname(__file__), '../gcp/utils'))
sys.path.append(gcp_utils_dir)

import big_query_utils


def print_table(table):
    kokoro_base_url = 'https://kokoro.corp.google.com/job/'
    for k, v in table.items():
        job_name = v[0]
        build_id = v[1]
        ts = int(float(v[2]))
        # TODO(dgq): timezone handling is wrong. We need to determine the timezone
        # of the computer running this script.
        human_ts = datetime.datetime.utcfromtimestamp(ts).strftime(
            '%Y-%m-%d %H:%M:%S PDT')
        job_path = '{}/{}'.format('/job/'.join(job_name.split('/')), build_id)
        full_kokoro_url = kokoro_base_url + job_path
        print("Test: {}, Timestamp: {}, url: {}\n".format(k, human_ts,
                                                          full_kokoro_url))


def get_flaky_tests(days_lower_bound, days_upper_bound, limit=None):
    """ period is one of "WEEK", "DAY", etc.
  (see https://cloud.google.com/bigquery/docs/reference/standard-sql/functions-and-operators#date_add). """

    bq = big_query_utils.create_big_query()
    query = """
SELECT
  REGEXP_REPLACE(test_name, r'/\d+', '') AS filtered_test_name,
  job_name,
  build_id,
  timestamp
FROM
  [grpc-testing:jenkins_test_results.aggregate_results]
WHERE
    timestamp > DATE_ADD(CURRENT_DATE(), {days_lower_bound}, "DAY")
    AND timestamp <= DATE_ADD(CURRENT_DATE(), {days_upper_bound}, "DAY")
  AND NOT REGEXP_MATCH(job_name, '.*portability.*')
  AND result != 'PASSED' AND result != 'SKIPPED'
ORDER BY timestamp desc
""".format(
        days_lower_bound=days_lower_bound, days_upper_bound=days_upper_bound)
    if limit:
        query += '\n LIMIT {}'.format(limit)
    query_job = big_query_utils.sync_query_job(bq, 'grpc-testing', query)
    page = bq.jobs().getQueryResults(
        pageToken=None, **query_job['jobReference']).execute(num_retries=3)
    rows = page.get('rows')
    if rows:
        return {
            row['f'][0]['v']:
            (row['f'][1]['v'], row['f'][2]['v'], row['f'][3]['v'])
            for row in rows
        }
    else:
        return {}


def get_new_flakes():
    last_week_sans_yesterday = get_flaky_tests(-14, -1)
    last_24 = get_flaky_tests(0, +1)
    last_week_sans_yesterday_names = set(last_week_sans_yesterday.keys())
    last_24_names = set(last_24.keys())
    logging.debug('|last_week_sans_yesterday| =',
                  len(last_week_sans_yesterday_names))
    logging.debug('|last_24_names| =', len(last_24_names))
    new_flakes = last_24_names - last_week_sans_yesterday_names
    logging.debug('|new_flakes| = ', len(new_flakes))
    return {k: last_24[k] for k in new_flakes}


def main():
    new_flakes = get_new_flakes()
    if new_flakes:
        print("Found {} new flakes:".format(len(new_flakes)))
        print_table(new_flakes)
    else:
        print("No new flakes found!")


if __name__ == '__main__':
    main()