Files
python-ganttclient/nova/scheduler/zone_manager.py
Chris Behrens 9e7db3860c Separate scheduler host management
This is a bit of a scheduler refactoring to support future scaling work
as a part of blueprint scaling-zones.

Also fixes bug 891971 (remove unused set_network_host in scheduler)

With or without that blueprint work, this cleans a number of things up
and paves the way for combining a lot of the schedulers by using this
new 'HostManager' for filtering and weighing (future work :)

On to the goodies:

Introduces new HostManager, splitting code out from ZoneManager.
Zone communication and management is handled in the ZoneManager.
Host filtering and weighing is handled in the HostManager.
ZoneManager is removed from the SchedulerManager and direct calls to it
  from the SchedulerManager now occur via the scheduler driver.  This
  simplifies a number of things.
ZoneManager and HostManager classes to use are now flags.  This allows
  one to extend the current classes and use them.
HostManager uses a HostState class to keep info about hosts.  This class
  needs to be extendable.  Since it's very much tied to the HostManager,
  the HostState class to use is not a flag.  It is, instead, a class
  variable in HostManager.
Filtering functions now accept a single host to filter.  This improves
  performance by not having to build a new array of hosts within every
  filter function.
Filtering functions now accept a more generic 'filter_properties'
  dictionary which we can fill with information available for filtering.
  Adding additional data to this 'filter_properties' can be done by
  subclassing.
Weighing functions now accept this 'filter_properties', also, although
  it's poorly named ATM.  Will be cleaned up in a future branch when I
  move some weighing functions into the host manager.
Filtering tests are true unit tests now.
test_zones was moved from top level to under scheduler as zone_manager
  tests and refactored to be true unit tests.
Host tests are true unit tests now.
Other minor cleanups

Change-Id: I0ef2acef6639b4500c400c18cf2c673cb80f0150
2012-01-18 05:43:36 +00:00

161 lines
5.7 KiB
Python

# Copyright (c) 2011 Openstack, LLC.
# All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
"""
Manage communication with child zones and keep state for them.
"""
import datetime
import traceback
from eventlet import greenpool
from novaclient import v1_1 as novaclient
from nova import db
from nova import flags
from nova import log as logging
from nova import utils
# Shorthand for the flags module's FLAGS object.
FLAGS = flags.FLAGS
# Read by ZoneManager.update() to decide when to re-read zones from the db.
flags.DEFINE_integer('zone_db_check_interval', 60,
'Seconds between getting fresh zone info from db.')
# Read by ZoneState.log_error() to decide when a zone is marked inactive.
flags.DEFINE_integer('zone_failures_to_offline', 3,
'Number of consecutive errors before marking zone offline')
# Module-level logger used by ZoneState and ZoneManager.
LOG = logging.getLogger('nova.scheduler.zone_manager')
class ZoneState(object):
    """Holds state for a particular zone.

    Keeps a copy of the zone's record (``zone_info``), the capabilities
    reported by the zone on its last successful poll, and a counter of
    consecutive polling failures used to decide when the zone is marked
    inactive.
    """

    def __init__(self):
        self.is_active = True
        # Metadata from the last successful poll (see update_metadata).
        self.capabilities = {}
        # Consecutive failures; reset to 0 by update_metadata().
        self.attempt = 0
        self.last_seen = datetime.datetime.min
        self.last_exception = None
        self.last_exception_time = None
        # Copy of the zone record; stays empty until update_zone_info().
        self.zone_info = {}

    def update_zone_info(self, zone):
        """Update zone credentials from db.

        :param zone: object whose ``iteritems()`` yields (field, value)
                     pairs; they are copied into ``self.zone_info``.
        """
        self.zone_info = dict(zone.iteritems())

    def update_metadata(self, zone_metadata):
        """Update zone metadata after successful communications with
        child zone.

        Every entry of ``zone_metadata`` except ``'name'`` becomes the
        zone's capabilities.  The failure counter is reset and the zone
        is marked active again.
        """
        self.last_seen = utils.utcnow()
        self.attempt = 0
        self.capabilities = dict(
                (key, value) for key, value in zone_metadata.iteritems()
                if key != 'name')
        self.is_active = True

    def get_zone_info(self):
        """Return a dict summarising this zone.

        The result holds ``is_active`` and ``capabilities`` plus the
        ``api_url``, ``id``, ``weight_scale`` and ``weight_offset``
        fields copied from ``self.zone_info``.

        :raises KeyError: if ``self.zone_info`` lacks one of those fields.
        """
        db_fields_to_return = ('api_url', 'id', 'weight_scale',
                               'weight_offset')
        zone_info = dict(is_active=self.is_active,
                         capabilities=self.capabilities)
        for field in db_fields_to_return:
            zone_info[field] = self.zone_info[field]
        return zone_info

    def log_error(self, exception):
        """Something went wrong. Check to see if zone should be
        marked as offline.

        Records ``exception`` and the current time, bumps the failure
        counter, and marks the zone inactive once the counter reaches
        ``FLAGS.zone_failures_to_offline``.
        """
        self.last_exception = exception
        self.last_exception_time = utils.utcnow()
        api_url = self.zone_info['api_url']
        LOG.warning(_("'%(exception)s' error talking to "
                      "zone %(api_url)s") %
                    {'exception': exception, 'api_url': api_url})

        max_errors = FLAGS.zone_failures_to_offline
        self.attempt += 1
        if self.attempt >= max_errors:
            self.is_active = False
            LOG.error(_("No answer from zone %(api_url)s "
                        "after %(max_errors)d "
                        "attempts. Marking inactive.") %
                      {'api_url': api_url, 'max_errors': max_errors})

    def call_novaclient(self):
        """Call novaclient. Broken out for testing purposes. Note that
        we have to use the admin credentials for this since there is no
        available context."""
        username = self.zone_info['username']
        password = self.zone_info['password']
        api_url = self.zone_info['api_url']
        region_name = self.zone_info['name']
        # NOTE(review): region_name is passed as the fifth positional
        # argument; confirm this matches the Client signature of the
        # novaclient version in use.
        client = novaclient.Client(username, password, None, api_url,
                                   region_name)
        return client.zones.info()._info

    def poll(self):
        """Eventlet worker that polls this zone.

        Does nothing when no ``api_url`` is known yet.  Otherwise asks
        the child zone for its info and stores it via update_metadata();
        any failure is handed to log_error() instead of being raised.
        """
        if 'api_url' not in self.zone_info:
            return
        name = self.zone_info['name']
        api_url = self.zone_info['api_url']
        LOG.debug(_("Polling zone: %(name)s @ %(api_url)s") %
                  {'name': name, 'api_url': api_url})
        try:
            self.update_metadata(self.call_novaclient())
        except Exception:
            # Deliberately broad: the formatted traceback is recorded and
            # counted as a failure rather than propagated to the caller.
            self.log_error(traceback.format_exc())
class ZoneManager(object):
    """Keeps the zone states updated."""

    def __init__(self):
        # datetime.min guarantees the first update() refreshes from the db.
        self.last_zone_db_check = datetime.datetime.min
        self.zone_states = {}  # { <zone_id> : ZoneState }
        self.green_pool = greenpool.GreenPool()

    @staticmethod
    def _elapsed_seconds(delta):
        """Return the full length of timedelta ``delta`` in whole seconds.

        ``delta.seconds`` alone is only the sub-day component, so the day
        count has to be folded in as well.
        """
        return delta.days * 86400 + delta.seconds

    def get_zone_list(self):
        """Return the list of zones we know about."""
        return [zone.get_zone_info() for zone in self.zone_states.values()]

    def _refresh_from_db(self, context):
        """Make our zone state map match the db."""
        # Add/update existing zones ...
        zones = db.zone_get_all(context)
        db_keys = set()
        for zone in zones:
            zone_id = zone['id']
            db_keys.add(zone_id)
            if zone_id not in self.zone_states:
                self.zone_states[zone_id] = ZoneState()
            self.zone_states[zone_id].update_zone_info(zone)

        # Cleanup zones removed from db ...
        # Iterate over a snapshot of the keys since we're deleting.
        for zone_id in list(self.zone_states):
            if zone_id not in db_keys:
                del self.zone_states[zone_id]

    def _poll_zones(self):
        """Try to connect to each child zone and get update."""
        def _worker(zone_state):
            zone_state.poll()
        self.green_pool.imap(_worker, self.zone_states.values())

    def update(self, context):
        """Update status for all zones.  This should be called
        periodically to refresh the zone states.

        The zone map is re-read from the db when at least
        ``FLAGS.zone_db_check_interval`` seconds have passed since the
        previous refresh; every known zone is polled on each call.
        """
        diff = utils.utcnow() - self.last_zone_db_check
        if self._elapsed_seconds(diff) >= FLAGS.zone_db_check_interval:
            LOG.debug(_("Updating zone cache from db."))
            self.last_zone_db_check = utils.utcnow()
            self._refresh_from_db(context)
        self._poll_zones()