gerritbot/gerritbot/bot.py

505 lines
17 KiB
Python
Executable File

#! /usr/bin/env python
# Copyright 2011 OpenStack LLC
# Copyright 2012 Hewlett-Packard Development Company, L.P.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
# The configuration file should look like:
"""
[ircbot]
nick=NICKNAME
pass=PASSWORD
server=irc.freenode.net
port=6697
channel_config=/path/to/yaml/config
pid=/path/to/pid_file
use_mqtt=True
[gerrit]
user=gerrit2
key=/path/to/id_rsa
host=review.example.com
port=29418
[mqtt]
host=example.com
port=1883
websocket=False
"""
# The yaml channel config should look like:
"""
openstack-dev:
events:
- patchset-created
- change-merged
projects:
- openstack/nova
- openstack/swift
- ^openstack/fuel-.*
branches:
- master
- ^stable/(newton|ocata|pike)
"""
import ConfigParser
import daemon
from ib3.auth import SASL
from ib3.connection import SSL
import irc.bot
import json
import logging.config
import os
import re
import sys
import threading
import time
import yaml
import paho.mqtt.client as mqtt
try:
import daemon.pidlockfile
pid_file_module = daemon.pidlockfile
except Exception:
# as of python-daemon 1.6 it doesn't bundle pidlockfile anymore
# instead it depends on lockfile-0.9.1
import daemon.pidfile
pid_file_module = daemon.pidfile
# https://bitbucket.org/jaraco/irc/issue/34/
# irc-client-should-not-crash-on-failed
# ^ This is why pep8 is a bad idea.
irc.client.ServerConnection.buffer_class.errors = 'replace'
# Freenode only allows a connection to join up to 120 channels
CHANNEL_MAX = 120
class Channel(object):
def __init__(self, name):
self.name = name
self.stamp()
def stamp(self):
self.last_used = time.time()
class GerritBot(SASL, SSL, irc.bot.SingleServerIRCBot):
def __init__(self, channels, nickname, password, server, port=6697):
super(GerritBot, self).__init__(
server_list=[(server, port)],
nickname=nickname,
realname=nickname,
ident_password=password,
channels=channels)
self.all_channels = {}
for name in channels:
self.all_channels[name] = Channel(name)
self.joined_channels = {}
self.nickname = nickname
self.password = password
self.log = logging.getLogger('gerritbot')
def send(self, channel_name, msg):
self.log.info('Sending "%s" to %s' % (msg, channel_name))
if channel_name not in self.joined_channels:
if len(self.joined_channels) >= CHANNEL_MAX:
drop = sorted(self.joined_channels.values(),
key=lambda x: x.last_used)[-1]
self.connection.part(drop.name)
self.log.info('Parted channel %s' % drop.name)
del self.joined_channels[drop.name]
channel = self.all_channels[channel_name]
self.connection.join(channel.name)
self.joined_channels[channel.name] = channel
self.log.info('Joined channel %s' % channel.name)
time.sleep(0.5)
self.all_channels[channel_name].stamp()
try:
self.connection.privmsg(channel_name, msg)
time.sleep(0.5)
except Exception:
self.log.exception('Exception sending message:')
self.connection.reconnect()
class Gerrit(threading.Thread):
def __init__(self, ircbot, channel_config, server,
username, port=29418, keyfile=None):
super(Gerrit, self).__init__()
self.ircbot = ircbot
self.channel_config = channel_config
self.log = logging.getLogger('gerritbot')
self.server = server
self.username = username
self.port = port
self.keyfile = keyfile
self.connected = False
def connect(self):
# Import here because it needs to happen after daemonization
import gerritlib.gerrit
try:
self.gerrit = gerritlib.gerrit.Gerrit(
self.server, self.username, self.port, self.keyfile)
self.gerrit.startWatching()
self.log.info('Start watching Gerrit event stream.')
self.connected = True
except Exception:
self.log.exception('Exception while connecting to gerrit')
self.connected = False
# Delay before attempting again.
time.sleep(1)
@staticmethod
def _get_username(patchset):
# Try to find username
for key in ('name', 'username', 'email'):
username = patchset['uploader'].get(key)
if username:
return username
return "UNKNOWN USER"
def patchset_created(self, channel, data):
msg = '%s proposed %s %s: %s %s' % (
self._get_username(data['patchSet']),
data['change']['project'],
data['change']['branch'],
data['change']['subject'],
data['change']['url'])
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
def ref_updated(self, channel, data):
refName = data['refUpdate']['refName']
m = re.match(r'(refs/tags)/(.*)', refName)
if m:
tag = m.group(2)
msg = '%s tagged project %s with %s' % (
data['submitter']['username'],
data['refUpdate']['project'],
tag
)
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
def comment_added(self, channel, data):
msg = 'A comment has been added to a proposed change to %s: %s %s' % (
data['change']['project'],
data['change']['subject'],
data['change']['url'])
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
for approval in data.get('approvals', []):
if (approval['type'] == 'VRIF' and approval['value'] == '-2'
and channel in self._channels_for('events',
'x-vrif-minus-2')):
msg = 'Verification of a change to %s failed: %s %s' % (
data['change']['project'],
data['change']['subject'],
data['change']['url'])
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
if (approval['type'] == 'VRIF' and approval['value'] == '2'
and channel in self._channels_for('events',
'x-vrif-plus-2')):
msg = 'Verification of a change to %s succeeded: %s %s' % (
data['change']['project'],
data['change']['subject'],
data['change']['url'])
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
if (approval['type'] == 'CRVW' and approval['value'] == '-2'
and channel in self._channels_for('events',
'x-crvw-minus-2')):
msg = 'A change to %s has been rejected: %s %s' % (
data['change']['project'],
data['change']['subject'],
data['change']['url'])
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
if (approval['type'] == 'CRVW' and approval['value'] == '2'
and channel in self._channels_for('events',
'x-crvw-plus-2')):
msg = 'A change to %s has been approved: %s %s' % (
data['change']['project'],
data['change']['subject'],
data['change']['url'])
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
def change_merged(self, channel, data):
msg = 'Merged %s %s: %s %s' % (
data['change']['project'],
data['change']['branch'],
data['change']['subject'],
data['change']['url'])
self.log.info('Compiled Message %s: %s' % (channel, msg))
self.ircbot.send(channel, msg)
def _channels_for(self, section, datakey):
"""Get a set of channel names for a given data value.
Finds all the channels that care about the specified datakey for a
given channel_config section. If the channel config key starts with
'^', datakey is matched by regex; otherwise it is matched by string
equality. For example, given input data:
openstack-dev:
projects:
- openstack/foo-bar
openstack-infra:
projects:
- ^openstack/foo-.*$
openstack-sdks:
projects:
- openstack/foo
...the call:
_channels_for('projects', 'openstack/foo-bar')
...will return the set:
{'#openstack-dev', '#openstack-infra'}
:param str section: The channel_config section to inspect ('projects',
'events', or 'branches')
:param str datakey: The key into the section, from the source data.
E.g. for section 'projects', the key would be the
project name (data['change']['project']).
"""
ret = set()
for key, chanset in getattr(self.channel_config, section, {}).items():
for channel in chanset or set():
if key.startswith('^'):
if re.search(key, datakey):
ret.add(channel)
else:
if key == datakey:
ret.add(channel)
return ret
def _read(self, data):
try:
# We only consider event (not project/branch) filters for these.
event_only_types = ('ref-updated',)
if data['type'] in event_only_types:
channel_set = self._channels_for('events', data['type'])
else:
channel_set = (
self._channels_for('projects', data['change']['project']) &
self._channels_for('events', data['type']) &
self._channels_for('branches', data['change']['branch'])
)
except KeyError:
# The data we care about was not present, no channels want
# this event.
channel_set = set()
if not channel_set:
channel_set = set()
self.log.info('Potential channels to receive event notification: %s' %
channel_set)
for channel in channel_set:
if data['type'] == 'comment-added':
self.comment_added(channel, data)
elif data['type'] == 'patchset-created':
self.patchset_created(channel, data)
elif data['type'] == 'change-merged':
self.change_merged(channel, data)
elif data['type'] == 'ref-updated':
self.ref_updated(channel, data)
def run(self):
while True:
while not self.connected:
self.connect()
try:
event = self.gerrit.getEvent()
self.log.info('Received event: %s' % event)
self._read(event)
except Exception:
self.log.exception('Exception encountered in event loop')
if not self.gerrit.watcher_thread.is_alive():
# Start new gerrit connection. Don't need to restart IRC
# bot, it will reconnect on its own.
self.connected = False
class GerritMQTT(Gerrit):
def __init__(self, ircbot, channel_config, server, base_topic='gerrit',
port=1883, websocket=False):
threading.Thread.__init__(self)
self.ircbot = ircbot
self.channel_config = channel_config
self.log = logging.getLogger('gerritbot')
self.server = server
self.port = port
self.websocket = websocket
self.base_topic = base_topic
self.connected = False
def connect(self):
try:
self.client.connect(self.server, port=self.port)
self.log.info('Start watching Gerrit event stream via mqtt!.')
self.connected = True
except Exception:
self.log.exception('Exception while connecting to mqtt')
self.client.reinitialise()
self.connected = False
# Delay before attempting again.
time.sleep(1)
def run(self):
def _on_connect(client, userdata, flags, rc):
client.subscribe(self.base_topic + '/#')
def _on_message(client, userdata, msg):
data = json.loads(msg.payload)
if data:
self._read(data)
if self.websocket:
self.client = mqtt.Client(transport='websockets')
else:
self.client = mqtt.Client()
self.client.on_connect = _on_connect
self.client.on_message = _on_message
while True:
while not self.connected:
self.connect()
try:
self.client.loop()
except Exception:
self.log.exception('Exception encountered in event loop')
time.sleep(5)
class ChannelConfig(object):
def __init__(self, data):
self.data = data
keys = data.keys()
for key in keys:
if key[0] != '#':
data['#' + key] = data.pop(key)
self.channels = data.keys()
self.projects = {}
self.events = {}
self.branches = {}
for channel, val in iter(self.data.items()):
for event in val['events']:
event_set = self.events.get(event, set())
event_set.add(channel)
self.events[event] = event_set
for project in val['projects']:
project_set = self.projects.get(project, set())
project_set.add(channel)
self.projects[project] = project_set
for branch in val['branches']:
branch_set = self.branches.get(branch, set())
branch_set.add(channel)
self.branches[branch] = branch_set
def _main(config):
setup_logging(config)
fp = config.get('ircbot', 'channel_config')
if fp:
fp = os.path.expanduser(fp)
if not os.path.exists(fp):
raise Exception("Unable to read layout config file at %s" % fp)
else:
raise Exception("Channel Config must be specified in config file.")
try:
channel_config = ChannelConfig(yaml.load(open(fp)))
except Exception:
log = logging.getLogger('gerritbot')
log.exception("Syntax error in chanel config file")
raise
bot = GerritBot(channel_config.channels,
config.get('ircbot', 'nick'),
config.get('ircbot', 'pass'),
config.get('ircbot', 'server'),
config.getint('ircbot', 'port'))
if config.has_option('ircbot', 'use_mqtt'):
use_mqtt = config.getboolean('ircbot', 'use_mqtt')
else:
use_mqtt = False
if use_mqtt:
g = GerritMQTT(bot,
channel_config,
config.get('mqtt', 'host'),
config.get('mqtt', 'base_topic'),
config.getint('mqtt', 'port'),
config.getboolean('mqtt', 'websocket'))
else:
g = Gerrit(bot,
channel_config,
config.get('gerrit', 'host'),
config.get('gerrit', 'user'),
config.getint('gerrit', 'port'),
config.get('gerrit', 'key'))
g.start()
bot.start()
def main():
if len(sys.argv) != 2:
print("Usage: %s CONFIGFILE" % sys.argv[0])
sys.exit(1)
config = ConfigParser.ConfigParser()
config.read(sys.argv[1])
pid_path = ""
if config.has_option('ircbot', 'pid'):
pid_path = config.get('ircbot', 'pid')
else:
pid_path = "/var/run/gerritbot/gerritbot.pid"
pid = pid_file_module.TimeoutPIDLockFile(pid_path, 10)
with daemon.DaemonContext(pidfile=pid):
_main(config)
def setup_logging(config):
if config.has_option('ircbot', 'log_config'):
log_config = config.get('ircbot', 'log_config')
fp = os.path.expanduser(log_config)
if not os.path.exists(fp):
raise Exception("Unable to read logging config file at %s" % fp)
logging.config.fileConfig(fp)
else:
logging.basicConfig(level=logging.DEBUG)
if __name__ == "__main__":
main()