2012-02-01 17:08:03 +00:00
|
|
|
#!/usr/bin/env python
|
|
|
|
#-*- coding: utf-8 -*-
|
|
|
|
# Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
|
|
|
|
#
|
|
|
|
# Use of this source code is governed by a BSD-style license
|
|
|
|
# that can be found in the LICENSE file in the root of the source
|
|
|
|
# tree. An additional intellectual property rights grant can be found
|
|
|
|
# in the file PATENTS. All contributing project authors may
|
|
|
|
# be found in the AUTHORS file in the root of the source tree.
|
|
|
|
|
|
|
|
"""Contains functions for parsing the build master's transposed grid page."""
|
|
|
|
|
|
|
|
__author__ = 'phoglund@webrtc.org (Patrik Höglund)'
|
|
|
|
|
|
|
|
import re
|
|
|
|
|
|
|
|
|
|
|
|
class FailedToParseBuildStatus(Exception):
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
2012-03-02 12:37:28 +00:00
|
|
|
def _map_status(status):
|
|
|
|
if status == 'exception':
|
|
|
|
return 'failed'
|
|
|
|
return status
|
|
|
|
|
|
|
|
|
2012-02-01 17:08:03 +00:00
|
|
|
def _parse_builds(revision, html):
|
|
|
|
"""Parses the bot list, which is a sequence of <td></td> lines.
|
|
|
|
|
2012-03-02 12:37:28 +00:00
|
|
|
See contract for parse_tgrid_page for more information on how this function
|
|
|
|
behaves.
|
|
|
|
|
2012-02-01 17:08:03 +00:00
|
|
|
Example input:
|
|
|
|
<td class="build success"><a href="builders/Android/builds/119">OK</a></td>
|
|
|
|
The first regular expression group captures Android, second 119, third OK.
|
|
|
|
"""
|
|
|
|
result = {}
|
|
|
|
|
|
|
|
for match in re.finditer('<td.*?>.*?<a href="builders/(.+?)/builds/(\d+)">'
|
2012-03-02 12:37:28 +00:00
|
|
|
'(OK|failed|building|warnings|exception)'
|
|
|
|
'</a>.*?</td>',
|
2012-02-27 15:42:25 +00:00
|
|
|
html, re.DOTALL):
|
2012-02-01 17:08:03 +00:00
|
|
|
revision_and_bot_name = revision + "--" + match.group(1)
|
2012-03-02 12:37:28 +00:00
|
|
|
build_number_and_status = match.group(2) + "--" + _map_status(
|
|
|
|
match.group(3))
|
2012-02-01 17:08:03 +00:00
|
|
|
|
|
|
|
result[revision_and_bot_name] = build_number_and_status
|
|
|
|
|
|
|
|
return result
|
|
|
|
|
|
|
|
|
|
|
|
def parse_tgrid_page(html):
|
|
|
|
"""Parses the build master's tgrid page.
|
|
|
|
|
|
|
|
Example input:
|
|
|
|
<tr>
|
|
|
|
<td valign="bottom" class="sourcestamp">1568</td>
|
|
|
|
LIST OF BOTS
|
|
|
|
</tr>
|
|
|
|
The first regular expression group captures 1568, second group captures
|
|
|
|
everything in LIST OF BOTS. The list of bots is then passed into a
|
|
|
|
separate function for parsing.
|
|
|
|
|
|
|
|
Args:
|
|
|
|
html: The raw HTML from the tgrid page.
|
|
|
|
|
|
|
|
Returns: A dictionary with <svn revision>--<bot name> mapped to
|
2012-02-27 15:42:25 +00:00
|
|
|
<bot build number>--<status>, where status is either OK, failed,
|
2012-03-02 12:37:28 +00:00
|
|
|
building or warnings. The status may be 'exception' in the input, but
|
|
|
|
we simply map that to failed.
|
2012-02-01 17:08:03 +00:00
|
|
|
"""
|
|
|
|
result = {}
|
|
|
|
|
|
|
|
for match in re.finditer('<td.*?class="sourcestamp">(\d+)</td>(.*?)</tr>',
|
|
|
|
html, re.DOTALL):
|
|
|
|
revision = match.group(1)
|
|
|
|
builds_for_revision_html = match.group(2)
|
|
|
|
result.update(_parse_builds(revision, builds_for_revision_html))
|
|
|
|
|
|
|
|
if not result:
|
2012-02-06 10:55:12 +00:00
|
|
|
raise FailedToParseBuildStatus('Could not find any build statuses in %s.' %
|
|
|
|
html)
|
2012-02-01 17:08:03 +00:00
|
|
|
|
|
|
|
return result
|