neutron-vpnaas/neutron_vpnaas/services/vpn/device_drivers/ipsec.py
Niklas Schwarz f63f99d822 Add type annotations
Add type annotations to the different parameters
and return values to modernize the python used.
This will also introduce mypy as another tool
for static code analysis which will currently not
run in CI

Change-Id: Ic09e47673f916328568c413d0e8485d36c283c24
2024-04-18 10:42:46 +02:00

1207 lines
45 KiB
Python

# Copyright 2013, Nachi Ueno, NTT I3, Inc.
# All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
import typing as ty
import abc
import base64
import copy
import filecmp
import os
import re
import shutil
import socket
import sys
import eventlet
import jinja2
import netaddr
from neutron.agent.linux import ip_lib
from neutron.agent.linux import utils as agent_utils
from neutron_lib.api import validators
from neutron_lib import constants
from neutron_lib import context
from neutron_lib.exceptions import vpn as vpn_exception
from neutron_lib.plugins import utils as plugin_utils
from neutron_lib import rpc as n_rpc
from neutron_lib.utils import file as file_utils
from oslo_concurrency import lockutils
from oslo_config import cfg
from oslo_log import helpers as log_helpers
from oslo_log import log as logging
import oslo_messaging
from oslo_service import loopingcall
from oslo_utils import encodeutils
from oslo_utils import fileutils
from neutron_vpnaas._i18n import _
from neutron_vpnaas.services.vpn.common import topics
from neutron_vpnaas.services.vpn import device_drivers
LOG = logging.getLogger(__name__)
TEMPLATE_PATH = os.path.dirname(os.path.abspath(__file__))
ipsec_opts = [
cfg.StrOpt(
'config_base_dir',
default='$state_path/ipsec',
help=_('Location to store ipsec server config files')),
cfg.IntOpt('ipsec_status_check_interval',
default=60,
help=_("Interval for checking ipsec status")),
cfg.BoolOpt('enable_detailed_logging',
default=False,
help=_("Enable detail logging for ipsec pluto process. "
"If the flag set to True, the detailed logging will "
"be written into config_base_dir/<pid>/log. "
"Note: This setting applies to OpenSwan and LibreSwan "
"only. StrongSwan logs to syslog.")),
]
cfg.CONF.register_opts(ipsec_opts, 'ipsec')
openswan_opts = [
cfg.StrOpt(
'ipsec_config_template',
default=os.path.join(
TEMPLATE_PATH,
'template/openswan/ipsec.conf.template'),
help=_('Template file for ipsec configuration')),
cfg.StrOpt(
'ipsec_secret_template',
default=os.path.join(
TEMPLATE_PATH,
'template/openswan/ipsec.secret.template'),
help=_('Template file for ipsec secret configuration'))
]
cfg.CONF.register_opts(openswan_opts, 'openswan')
pluto_opts = [
cfg.IntOpt('shutdown_check_timeout',
default=1,
help=_('Initial interval in seconds for checking if pluto '
'daemon is shutdown'),
deprecated_group='libreswan'),
cfg.IntOpt('shutdown_check_retries',
default=5,
help=_('The maximum number of retries for checking for '
'pluto daemon shutdown'),
deprecated_group='libreswan'),
cfg.FloatOpt('shutdown_check_back_off',
default=1.5,
help=_('A factor to increase the retry interval for '
'each retry'),
deprecated_group='libreswan'),
cfg.BoolOpt('restart_check_config',
default=False,
help=_('Enable this flag to avoid from unnecessary restart'),
deprecated_group='libreswan')
]
cfg.CONF.register_opts(pluto_opts, 'pluto')
JINJA_ENV = None
IPSEC_CONNS = 'ipsec_site_connections'
# *Swan supports Base64 encoded binary values as PSKs. In such cases,
# a character sequence beginning with 0s is interpreted as Base64
# encoded binary data.
# - StrongSwan
# - https://wiki.strongswan.org/projects/strongswan/wiki/PskSecret
# - LibreSwan
# - https://libreswan.org/man/ipsec.secrets.5.html
# - https://libreswan.org/man/ipsec_ttodata.3.html
# - OpenSwan (no online documents, see manpages sources in the repository)
# - https://github.com/xelerance/Openswan
PSK_BASE64_PREFIX = '0s'
def _get_template(
template_file: ty.Union[str, jinja2.Template]) -> jinja2.Template:
global JINJA_ENV
if not JINJA_ENV:
templateLoader = jinja2.FileSystemLoader(searchpath="/")
JINJA_ENV = jinja2.Environment(loader=templateLoader, autoescape=True)
return JINJA_ENV.get_template(template_file)
class BaseSwanProcess(metaclass=abc.ABCMeta):
"""Swan Family Process Manager
This class manages start/restart/stop ipsec process.
This class create/delete config template
"""
binary = "ipsec"
CONFIG_DIRS = [
'var/run',
'log',
'etc',
'etc/ipsec.d/aacerts',
'etc/ipsec.d/acerts',
'etc/ipsec.d/cacerts',
'etc/ipsec.d/certs',
'etc/ipsec.d/crls',
'etc/ipsec.d/ocspcerts',
'etc/ipsec.d/policies',
'etc/ipsec.d/private',
'etc/ipsec.d/reqs',
'etc/pki/nssdb/'
]
DIALECT_MAP = {
"3des": "3des",
"aes-128": "aes128",
"aes-256": "aes256",
"aes-192": "aes192",
"sha256": "sha2_256",
"sha384": "sha2_384",
"sha512": "sha2_512",
"group2": "modp1024",
"group5": "modp1536",
"group14": "modp2048",
"group15": "modp3072",
"bi-directional": "start",
"response-only": "add",
"v2": "insist",
"v1": "never"
}
NS_WRAPPER = 'neutron-vpn-netns-wrapper'
STATUS_DICT = {
'erouted': constants.ACTIVE,
'unrouted': constants.DOWN
}
STATUS_RE = r'\d\d\d "([a-f0-9\-]+).* (unrouted|erouted);'
STATUS_NOT_RUNNING_RE = 'Command:.*ipsec.*status.*Exit code: [1|3]$'
STATUS_IPSEC_SA_ESTABLISHED_RE = (
r'\d{3} #\d+: "([a-f0-9\-]+).*established.*newest IPSEC')
STATUS_IPSEC_SA_ESTABLISHED_RE2 = (
r'\d{3} #\d+: "([a-f0-9\-\/x]+).*established.*newest IPSEC')
def __init__(self, conf, process_id: str, vpnservice, namespace: str):
self.conf = conf
self.id = process_id
self.updated_pending_status: bool = False
self.namespace = namespace
self.connection_status: ty.Dict[str, ty.Dict[str, ty.Any]] = {}
self.config_dir = os.path.join(
self.conf.ipsec.config_base_dir, self.id)
self.etc_dir = os.path.join(self.config_dir, 'etc')
self.log_dir = os.path.join(self.config_dir, 'log')
self.update_vpnservice(vpnservice)
self.STATUS_PATTERN = re.compile(self.STATUS_RE)
self.STATUS_NOT_RUNNING_PATTERN = re.compile(
self.STATUS_NOT_RUNNING_RE)
self.STATUS_IPSEC_SA_ESTABLISHED_PATTERN = re.compile(
self.STATUS_IPSEC_SA_ESTABLISHED_RE)
self.STATUS_IPSEC_SA_ESTABLISHED_PATTERN2 = re.compile(
self.STATUS_IPSEC_SA_ESTABLISHED_RE2)
self.STATUS_MAP = self.STATUS_DICT
def translate_dialect(self):
if not self.vpnservice:
return
for ipsec_site_conn in self.vpnservice["ipsec_site_connections"]:
self._dialect(ipsec_site_conn, "initiator")
self._dialect(ipsec_site_conn["ikepolicy"], "ike_version")
for key in ["encryption_algorithm", "auth_algorithm", "pfs"]:
self._dialect(ipsec_site_conn["ikepolicy"], key)
self._dialect(ipsec_site_conn["ipsecpolicy"], key)
if ("local_id" not in ipsec_site_conn.keys()) or (
not ipsec_site_conn["local_id"]
):
ipsec_site_conn["local_id"] = ipsec_site_conn["external_ip"]
def base64_encode_psk(self):
if not self.vpnservice:
return
for ipsec_site_conn in self.vpnservice["ipsec_site_connections"]:
psk = ipsec_site_conn["psk"]
encoded_psk = base64.b64encode(encodeutils.safe_encode(psk))
# NOTE(huntxu): base64.b64encode returns an instance of 'bytes'
# in Python 3, convert it to a str. For Python 2, after calling
# safe_decode, psk is converted into a unicode not containing any
# non-ASCII characters so it doesn't matter.
psk = encodeutils.safe_decode(encoded_psk, incoming="utf_8")
ipsec_site_conn["psk"] = PSK_BASE64_PREFIX + psk
def get_ns_wrapper(self) -> str:
"""
Check if we're inside a virtualenv. If we are, then we should
respect this and launch wrapper from venv as well.
"""
if (hasattr(sys, 'real_prefix') or
(hasattr(sys, 'base_prefix') and sys.base_prefix != sys.prefix)):
ns_wrapper = os.path.join(sys.prefix, "bin/", self.NS_WRAPPER)
else:
ns_wrapper = self.NS_WRAPPER
return ns_wrapper
def update_vpnservice(self, vpnservice: ty.Dict[str, ty.Any]):
self.vpnservice = vpnservice
self.translate_dialect()
self.base64_encode_psk()
def _dialect(self, obj, key):
obj[key] = self.DIALECT_MAP.get(obj[key], obj[key])
@abc.abstractmethod
def ensure_configs(self):
pass
def ensure_config_file(self, kind, template, vpnservice, file_mode=None):
"""Update config file, based on current settings for service."""
config_str = self._gen_config_content(template, vpnservice)
config_file_name = self._get_config_filename(kind)
if file_mode is None:
file_utils.replace_file(config_file_name, config_str)
else:
file_utils.replace_file(config_file_name, config_str, file_mode)
def remove_config(self):
"""Remove whole config file."""
agent_utils.execute(
cmd=["rm", "-rf", self.config_dir], run_as_root=True)
def _get_config_filename(self, kind) -> str:
config_dir = self.etc_dir
return os.path.join(config_dir, kind)
def ensure_config_dir(self, vpnservice):
"""Create config directory if it does not exist."""
fileutils.ensure_tree(self.config_dir, 0o755)
for subdir in self.CONFIG_DIRS:
dir_path = os.path.join(self.config_dir, subdir)
fileutils.ensure_tree(dir_path, 0o755)
def _gen_config_content(self, template_file, vpnservice) -> str:
template = _get_template(template_file)
return template.render(
{'vpnservice': vpnservice,
'state_path': self.conf.state_path})
def _get_rootwrap_config(self) -> ty.Optional[str]:
if 'neutron-rootwrap' in cfg.CONF.AGENT.root_helper:
rh_tokens: ty.List[str] = cfg.CONF.AGENT.root_helper.split(' ')
if len(rh_tokens) == 3 and os.path.exists(rh_tokens[2]):
return rh_tokens[2]
return None
@abc.abstractmethod
def get_status(self):
pass
@property
def status(self) -> str:
if self.active:
return constants.ACTIVE
return constants.DOWN
@property
def active(self) -> bool:
"""Check if the process is active or not."""
if not self.namespace:
return False
try:
status = self.get_status()
self._extract_and_record_connection_status(status)
if not self.connection_status:
return False
except RuntimeError:
return False
return True
def update(self):
"""Update Status based on vpnservice configuration."""
# Disable the process if a vpnservice is disabled or it has no
# enabled IPSec site connections.
vpnservice_has_active_ipsec_site_conns = any(
ipsec_site_conn['admin_state_up']
for ipsec_site_conn in
self.vpnservice['ipsec_site_connections'])
if (not self.vpnservice['admin_state_up'] or
not vpnservice_has_active_ipsec_site_conns):
self.disable()
else:
self.enable()
if plugin_utils.in_pending_status(self.vpnservice['status']):
self.updated_pending_status = True
self.vpnservice['status'] = self.status
for ipsec_site_conn in self.vpnservice['ipsec_site_connections']:
if plugin_utils.in_pending_status(ipsec_site_conn['status']):
conn_id = ipsec_site_conn['id']
conn_status = self.connection_status.get(conn_id)
if not conn_status:
continue
conn_status['updated_pending_status'] = True
ipsec_site_conn['status'] = conn_status['status']
def enable(self):
"""Enabling the process."""
try:
self.ensure_configs()
if self.active:
self.restart()
else:
self.start()
except RuntimeError:
LOG.exception(
"Failed to enable vpn process on router %s",
self.id)
def disable(self):
"""Disabling the process."""
try:
if self.active:
self.stop()
self.remove_config()
except RuntimeError:
LOG.exception(
"Failed to disable vpn process on router %s",
self.id)
@abc.abstractmethod
def restart(self):
"""Restart process."""
@abc.abstractmethod
def start(self):
"""Start process."""
@abc.abstractmethod
def stop(self):
"""Stop process."""
def _check_status_line(self,
line: str) -> ty.Tuple[ty.Optional[str], ty.Optional[str]]:
"""Parse a line and search for status information.
If a connection has an established Security Association,
it will be considered ACTIVE. Otherwise, even if a status
line shows that a connection is active, it will be marked
as DOWN-ed.
"""
# pluto is not running so just exit
if self.STATUS_NOT_RUNNING_PATTERN.search(line):
self.connection_status = {}
raise StopIteration()
m = self.STATUS_IPSEC_SA_ESTABLISHED_PATTERN.search(line)
if m:
connection_id = m.group(1)
return connection_id, constants.ACTIVE
m = self.STATUS_PATTERN.search(line)
if m:
connection_id = m.group(1)
return connection_id, constants.DOWN
return None, None
def _extract_and_record_connection_status(self,
status_output: ty.Optional[str]):
if not status_output:
self.connection_status = {}
return
for line in status_output.split('\n'):
try:
conn_id, conn_status = self._check_status_line(line)
except StopIteration:
break
if conn_id:
self._record_connection_status(conn_id, conn_status)
def _record_connection_status(self, connection_id: str, status,
force_status_update: bool = False):
conn_info = self.connection_status.get(connection_id)
if not conn_info:
self.connection_status[connection_id] = {
'status': status,
'updated_pending_status': force_status_update
}
else:
conn_info['status'] = status
if force_status_update:
conn_info['updated_pending_status'] = True
class OpenSwanProcess(BaseSwanProcess):
"""OpenSwan Process manager class.
This process class uses three commands
(1) ipsec pluto: IPsec IKE keying daemon
(2) ipsec addconn: Adds new ipsec addconn
(3) ipsec whack: control interface for IPSEC keying daemon
"""
def __init__(self, conf, process_id: str, vpnservice, namespace: str):
super().__init__(conf, process_id, vpnservice, namespace)
self.secrets_file: str = os.path.join(
self.etc_dir, 'ipsec.secrets')
self.config_file: str = os.path.join(
self.etc_dir, 'ipsec.conf')
self.pid_path: str = os.path.join(
self.config_dir, 'var', 'run', 'pluto')
self.pid_file: str = f'{self.pid_path}.pid'
def _execute(self, cmd, check_exit_code: bool = True,
extra_ok_codes: ty.Optional[ty.List[int]] = None
) -> ty.Optional[str]:
"""Execute command on namespace."""
ip_wrapper = ip_lib.IPWrapper(namespace=self.namespace)
return ip_wrapper.netns.execute(cmd, check_exit_code=check_exit_code,
extra_ok_codes=extra_ok_codes)
def ensure_configs(self):
"""Generate config files which are needed for OpenSwan.
If there is no directory, this function will create
dirs.
"""
self.ensure_config_dir(self.vpnservice)
self.ensure_config_file(
'ipsec.conf',
self.conf.openswan.ipsec_config_template,
self.vpnservice)
self.ensure_config_file(
'ipsec.secrets',
self.conf.openswan.ipsec_secret_template,
self.vpnservice,
0o600)
def _copy_configs(self):
if not cfg.CONF.pluto.restart_check_config:
return
config_file_name = self._get_config_filename('ipsec.conf')
if os.path.isfile(config_file_name):
shutil.copyfile(config_file_name, config_file_name + '.old')
config_file_name = self._get_config_filename('ipsec.secrets')
if os.path.isfile(config_file_name):
shutil.copyfile(config_file_name, config_file_name + '.old')
os.chmod(config_file_name + '.old', 0o600)
def _process_running(self) -> bool:
"""Checks if process is still running."""
# If no PID file, we assume the process is not running.
if not os.path.exists(self.pid_file):
return False
try:
# We take an ask-forgiveness-not-permission approach and rely
# on throwing to tell us something. If the pid file exists,
# delve into the process information and check if it matches
# our expected command line.
with open(self.pid_file, 'r', encoding="C") as f:
pid = f.readline().strip()
with open(f'/proc/{pid}/cmdline',
encoding="C") as cmd_line_file:
cmd_line = cmd_line_file.readline()
if self.pid_path in cmd_line and 'pluto' in cmd_line:
# Okay the process is probably a pluto process
# and it contains the pid_path in the command
# line... could be a race. Log to error and return
# that it is *NOT* okay to clean up files. We are
# logging to error instead of debug because it
# indicates something bad has happened and this is
# valuable information for figuring it out.
LOG.error('Process %(pid)s exists with command '
'line %(cmd_line)s.',
{'pid': pid, 'cmd_line': cmd_line})
return True
except IOError as e:
# This is logged as "info" instead of error because it simply
# means that we couldn't find the files to check on them.
LOG.info('Unable to find control files on startup for '
'router %(router)s: %(msg)s',
{'router': self.id, 'msg': e})
return False
def _cleanup_control_files(self):
try:
ctl_file = f'{self.pid_path}.ctl'
LOG.debug('Removing %(pidfile)s and %(ctlfile)s',
{'pidfile': self.pid_file,
'ctlfile': ctl_file})
if os.path.exists(self.pid_file):
os.remove(self.pid_file)
if os.path.exists(ctl_file):
os.remove(ctl_file)
except OSError as e:
LOG.error('Unable to remove pluto control '
'files for router %(router)s. %(msg)s',
{'router': self.id, 'msg': e})
def get_status(self) -> ty.Optional[str]:
return self._execute([self.binary,
'whack',
'--ctlbase',
self.pid_path,
'--status'], extra_ok_codes=[1, 3])
def _config_changed(self) -> bool:
secrets_file = os.path.join(
self.etc_dir, 'ipsec.secrets')
config_file = os.path.join(
self.etc_dir, 'ipsec.conf')
if not os.path.isfile(secrets_file + '.old'):
return True
if not os.path.isfile(config_file + '.old'):
return True
if not filecmp.cmp(secrets_file, secrets_file + '.old'):
return True
if not filecmp.cmp(config_file, config_file + '.old'):
return True
return False
def restart(self):
"""Restart the process."""
if cfg.CONF.pluto.restart_check_config and not self._config_changed():
return
# stop() followed immediately by a start() runs the risk that the
# current pluto daemon has not had a chance to shutdown. We check
# the current process information to see if the daemon is still
# running and if so, wait a short interval and retry.
self.stop()
wait_interval = cfg.CONF.pluto.shutdown_check_timeout
for i in range(cfg.CONF.pluto.shutdown_check_retries):
if not self._process_running():
self._cleanup_control_files()
break
eventlet.sleep(wait_interval)
wait_interval *= cfg.CONF.pluto.shutdown_check_back_off
else:
LOG.warning('Server appears to still be running, restart '
'of router %s may fail', self.id)
self.start()
def _resolve_fqdn(self, fqdn) -> ty.Optional[str]:
# The first addrinfo member from the list returned by
# socket.getaddrinfo is used for the address resolution.
# The code doesn't filter for ipv4 or ipv6 address.
try:
addrinfo: ty.Tuple[
socket.AddressFamily,
socket.SocketKind,
int,
str,
ty.Union[ty.Tuple[str, int], ty.Tuple[str, int, int, int]],
] = socket.getaddrinfo(fqdn, None)[0]
return addrinfo[-1][0]
except socket.gaierror:
LOG.exception("Peer address %s cannot be resolved", fqdn)
return None
def _get_nexthop(self, address: str, connection_id: str) -> str:
# check if address is an ip address or fqdn
invalid_ip_address = validators.validate_ip_address(address)
if invalid_ip_address:
ip_addr = self._resolve_fqdn(address)
if not ip_addr:
self._record_connection_status(connection_id, constants.ERROR,
force_status_update=True)
raise vpn_exception.VPNPeerAddressNotResolved(
peer_address=address)
else:
ip_addr = address
routes = self._execute(['ip', 'route', 'get', ip_addr])
if routes and routes.find('via') >= 0:
return routes.split(' ')[2]
return address
def _virtual_privates(self,
vpnservice: ty.Dict[str, ty.List[ty.Dict[str, ty.Any]]]) -> str:
"""Returns line of virtual_privates.
virtual_private contains the networks
that are allowed as subnet for the remote client.
"""
virtual_privates: ty.List[str] = []
nets: ty.List = []
for ipsec_site_conn in vpnservice['ipsec_site_connections']:
nets += ipsec_site_conn['local_cidrs']
nets += ipsec_site_conn['peer_cidrs']
for net in nets:
version = netaddr.IPNetwork(net).version
virtual_privates.append(f'%v{version}:{net}')
virtual_privates.sort()
return ','.join(virtual_privates)
def _gen_config_content(self,
template_file: ty.Union[str, jinja2.Template],
vpnservice) -> str:
template = _get_template(template_file)
virtual_privates = self._virtual_privates(vpnservice)
return template.render(
{'vpnservice': vpnservice,
'virtual_privates': virtual_privates})
def start_pluto(self):
cmd = [self.binary,
'pluto',
'--ctlbase', self.pid_path,
'--ipsecdir', self.etc_dir,
'--use-netkey',
'--uniqueids',
'--nat_traversal',
'--secretsfile', self.secrets_file]
if self.conf.ipsec.enable_detailed_logging:
cmd += ['--perpeerlog', '--perpeerlogbase', self.log_dir]
self._execute(cmd)
def add_ipsec_connection(self, nexthop, conn_id):
self._execute([self.binary,
'addconn',
'--ctlbase', f'{self.pid_path}.ctl',
'--defaultroutenexthop', nexthop,
'--config', self.config_file, conn_id
])
def start_whack_listening(self):
#TODO(nati) fix this when openswan is fixed
#Due to openswan bug, this command always exit with 3
self._execute([self.binary,
'whack',
'--ctlbase', self.pid_path,
'--listen'
], check_exit_code=False)
def shutdown_whack(self):
self._execute([self.binary,
'whack',
'--ctlbase', self.pid_path,
'--shutdown'
])
def initiate_connection(self, conn_name):
self._execute([self.binary,
'whack',
'--ctlbase', self.pid_path,
'--name', conn_name,
'--asynchronous',
'--initiate'
])
def terminate_connection(self, conn_name):
self._execute([self.binary,
'whack',
'--ctlbase', self.pid_path,
'--name', conn_name,
'--terminate'
])
def start(self):
"""Start the process.
Note: if there is not namespace yet,
just do nothing, and wait next event.
"""
if not self.namespace:
return
# NOTE: The restart operation calls the parent's start() instead of
# this one to avoid having to special case the startup file check.
# If anything is added to this method that needs to run whenever
# a restart occurs, it should be either added to the restart()
# override or things refactored to special-case start() when
# called from restart().
# If, by any reason, ctl and pid files weren't cleaned up, pluto
# won't be able to rewrite them and will fail to start. So we check
# to see if the process is running and if not, attempt a cleanup.
# In either case we fall through to allow the pluto process to
# start or fail in the usual way.
if not self._process_running():
self._cleanup_control_files()
#start pluto IKE keying daemon
self.start_pluto()
#add connections
for ipsec_site_conn in self.vpnservice['ipsec_site_connections']:
# Don't add a connection if its admin state is down
if not ipsec_site_conn['admin_state_up']:
continue
nexthop = self._get_nexthop(ipsec_site_conn['peer_address'],
ipsec_site_conn['id'])
self.add_ipsec_connection(nexthop, ipsec_site_conn['id'])
#start whack ipsec keying daemon
self.start_whack_listening()
for ipsec_site_conn in self.vpnservice['ipsec_site_connections']:
if (not ipsec_site_conn['initiator'] == 'start' or
not ipsec_site_conn['admin_state_up']):
continue
#initiate ipsec connection
self.initiate_connection(ipsec_site_conn['id'])
self._copy_configs()
def get_established_connections(self) -> ty.List[str]:
connections: ty.List[str] = []
status_output: ty.Optional[str] = self.get_status()
if not status_output:
return connections
for line in status_output.split('\n'):
if self.STATUS_NOT_RUNNING_PATTERN.search(line):
return connections
m = self.STATUS_IPSEC_SA_ESTABLISHED_PATTERN2.search(line)
if m:
connection = m.group(1)
if connection in connections:
continue
connections.append(connection)
return connections
def disconnect(self):
if not self.namespace:
return
if not self.vpnservice:
return
connections = self.get_established_connections()
for conn_name in connections:
self.terminate_connection(conn_name)
def stop(self):
#Stop process using whack
#Note this will also stop pluto
self.disconnect()
self.shutdown_whack()
self.connection_status = {}
class IPsecVpnDriverApi:
"""IPSecVpnDriver RPC api."""
@log_helpers.log_method_call
def __init__(self, topic):
target = oslo_messaging.Target(topic=topic, version='1.0')
self.client = n_rpc.get_client(target)
@log_helpers.log_method_call
def get_vpn_services_on_host(self, context: context.ContextBase, host):
"""Get list of vpnservices.
The vpnservices including related ipsec_site_connection,
ikepolicy and ipsecpolicy on this host
"""
cctxt = self.client.prepare()
return cctxt.call(context, 'get_vpn_services_on_host', host=host)
@log_helpers.log_method_call
def update_status(self, context: context.ContextBase, status):
"""Update local status.
This method call updates status attribute of
VPNServices.
"""
cctxt = self.client.prepare()
return cctxt.call(context, 'update_status', status=status)
class IPsecDriver(device_drivers.DeviceDriver, metaclass=abc.ABCMeta):
"""VPN Device Driver for IPSec.
This class is designed for use with L3-agent now.
However this driver will be used with another agent in future
so the use of "Router" is kept minimal now.
Instead of router_id, we are using process_id in this code.
"""
# history
# 1.0 Initial version
target = oslo_messaging.Target(version='1.0')
def __init__(self, vpn_service, host: str):
# TODO(pc_m) Replace vpn_service with config arg, once all driver
# implementations no longer need vpn_service.
self.conf = vpn_service.conf
self.host = host
self.conn = n_rpc.Connection()
self.context: context.ContextBase = \
context.get_admin_context_without_session()
self.topic: str = topics.IPSEC_AGENT_TOPIC
node_topic: str = f'{self.topic}.{self.host}'
self.processes: ty.Dict[str, BaseSwanProcess] = {}
self.routers: ty.Dict[str, ty.Any] = {}
self.process_status_cache: ty.Dict[str, ty.Dict[str, ty.Any]] = {}
self.endpoints = [self]
self.conn.create_consumer(node_topic, self.endpoints, fanout=False)
self.conn.consume_in_threads()
self.agent_rpc = IPsecVpnDriverApi(topics.IPSEC_DRIVER_TOPIC)
self.process_status_cache_check = loopingcall.FixedIntervalLoopingCall(
self.report_status, self.context)
self.process_status_cache_check.start(
interval=self.conf.ipsec.ipsec_status_check_interval)
def get_namespace(self, router_id: str) -> ty.Optional[str]:
"""Get namespace of router.
:router_id: router_id
:returns: namespace string.
Note: If the router is a DVR, then the SNAT namespace will be
provided. If the router does not exist, return None.
"""
router = self.routers.get(router_id)
if not router:
return None
# For DVR, use SNAT namespace
# TODO(pcm): Use router object method to tell if DVR, when available
if router.router['distributed']:
return router.snat_namespace.name
return router.ns_name
def get_router_based_iptables_manager(self, router):
"""Returns router based iptables manager
In DVR routers the IPsec VPN service should run inside
the snat namespace. So the iptables manager used for
snat namespace is different from the iptables manager
used for the qr namespace in a non dvr based router.
This function will check the router type and then will
return the right iptables manager. If DVR enabled router
it will return the snat_iptables_manager otherwise it will
return the legacy iptables_manager.
"""
# TODO(pcm): Use router object method to tell if DVR, when available
if router.router['distributed']:
return router.snat_iptables_manager
return router.iptables_manager
def add_nat_rule(self, router_id, chain, rule, top=False):
"""Add nat rule in namespace.
:param router_id: router_id
:param chain: a string of chain name
:param rule: a string of rule
:param top: if top is true, the rule
will be placed on the top of chain
Note if there is no router, this method does nothing
"""
router = self.routers.get(router_id)
if not router:
return
iptables_manager = self.get_router_based_iptables_manager(router)
iptables_manager.ipv4['nat'].add_rule(chain, rule, top=top)
def remove_nat_rule(self, router_id, chain, rule, top=False):
"""Remove nat rule in namespace.
:param router_id: router_id
:param chain: a string of chain name
:param rule: a string of rule
:param top: unused
needed to have same argument with add_nat_rule
"""
router = self.routers.get(router_id)
if not router:
return
iptables_manager = self.get_router_based_iptables_manager(router)
iptables_manager.ipv4['nat'].remove_rule(chain, rule, top=top)
def iptables_apply(self, router_id):
"""Apply IPtables.
:param router_id: router_id
This method do nothing if there is no router
"""
router = self.routers.get(router_id)
if not router:
return
iptables_manager = self.get_router_based_iptables_manager(router)
iptables_manager.apply()
def _update_nat(self, vpnservice, func):
"""Setting up nat rule in iptables.
We need to setup nat rule for ipsec packet.
:param vpnservice: vpnservices
:param func: self.add_nat_rule or self.remove_nat_rule
"""
router_id = vpnservice['router_id']
for ipsec_site_connection in vpnservice['ipsec_site_connections']:
for local_cidr in ipsec_site_connection['local_cidrs']:
# This ipsec rule is not needed for ipv6.
if netaddr.IPNetwork(local_cidr).version == 6:
continue
for peer_cidr in ipsec_site_connection['peer_cidrs']:
func(router_id,
'POSTROUTING',
f'-s {local_cidr} -d {peer_cidr} -m policy '
'--dir out --pol ipsec '
'-j ACCEPT ',
top=True)
self.iptables_apply(router_id)
@log_helpers.log_method_call
def vpnservice_updated(self, context: context.ContextBase, **kwargs):
"""Vpnservice updated rpc handler
VPN Service Driver will call this method
when vpnservices updated.
Then this method start sync with server.
"""
router = kwargs.get('router', None)
self.sync(context, [router] if router else [])
@abc.abstractmethod
def create_process(self, process_id: str, vpnservice,
namespace) -> BaseSwanProcess:
pass
def ensure_process(self, process_id: str,
vpnservice=None) -> BaseSwanProcess:
"""Ensuring process.
If the process doesn't exist, it will create process
and store it in self.process
"""
process = self.processes.get(process_id, None)
if not process or not process.namespace:
namespace = self.get_namespace(process_id)
process = self.create_process(
process_id,
vpnservice,
namespace)
self.processes[process_id] = process
elif vpnservice:
process.update_vpnservice(vpnservice)
return process
def create_router(self, router):
"""Handling create router event.
Agent calls this method, when the process namespace is ready.
Note: process_id == router_id == vpnservice_id
"""
process_id = router.router_id
self.routers[process_id] = router
if process_id in self.processes:
# In case of vpnservice is created
# before router's namespace
process = self.processes[process_id]
self._update_nat(process.vpnservice, self.add_nat_rule)
# Don't run ipsec process for backup HA router
if router.router['ha'] and router.ha_state == 'backup':
return
process.enable()
def destroy_process(self, process_id):
"""Destroy process.
Disable the process, remove the nat rule, and remove the process
manager for the processes that no longer are running vpn service.
"""
if process_id in self.processes:
process = self.processes[process_id]
process.disable()
vpnservice = process.vpnservice
if vpnservice:
self._update_nat(vpnservice, self.remove_nat_rule)
del self.processes[process_id]
def destroy_router(self, process_id):
"""Handling destroy_router event.
Agent calls this method, when the process namespace
is deleted.
"""
self.destroy_process(process_id)
if process_id in self.routers:
del self.routers[process_id]
def get_process_status_cache(self,
process: BaseSwanProcess) -> ty.Dict[str, ty.Any]:
if not self.process_status_cache.get(process.id):
self.process_status_cache[process.id] = {
'status': None,
'id': process.vpnservice['id'],
'updated_pending_status': False,
'ipsec_site_connections': {}}
return self.process_status_cache[process.id]
def is_status_updated(self, process: BaseSwanProcess,
previous_status: ty.Dict[str, ty.Any]) -> bool:
if process.updated_pending_status:
return True
if process.status != previous_status['status']:
return True
if (process.connection_status !=
previous_status['ipsec_site_connections']):
return True
return False
def unset_updated_pending_status(self, process):
process.updated_pending_status = False
for connection_status in process.connection_status.values():
connection_status['updated_pending_status'] = False
def copy_process_status(self,
process: BaseSwanProcess) -> ty.Dict[str, ty.Any]:
return {
'id': process.vpnservice['id'],
'status': process.status,
'updated_pending_status': process.updated_pending_status,
'ipsec_site_connections': copy.deepcopy(process.connection_status)
}
def update_downed_connections(self, process_id: str, new_status):
"""Update info to be reported, if connections just went down.
If there is no longer any information for a connection, because it
has been removed (e.g. due to an admin down of VPN service or IPSec
connection), but there was previous status information for the
connection, mark the connection as down for reporting purposes.
"""
if process_id in self.process_status_cache:
for conn in self.process_status_cache[process_id][IPSEC_CONNS]:
if conn not in new_status[IPSEC_CONNS]:
new_status[IPSEC_CONNS][conn] = {
'status': constants.DOWN,
'updated_pending_status': True
}
def should_be_reported(self, context: context.ContextBase,
process: BaseSwanProcess) -> bool:
if (context.is_admin or
process.vpnservice["tenant_id"] == context.tenant_id):
return True
return False
@log_helpers.log_method_call
def report_status(self, context: context.ContextBase):
status_changed_vpn_services = []
for process_id, process in list(self.processes.items()):
# NOTE(mnaser): It's not necessary to check status for processes
# of a backup L3 agent
router = self.routers.get(process_id)
if router and router.router['ha'] and router.ha_state == 'backup':
LOG.debug("%s router in backup state, skipping", process_id)
continue
if not self.should_be_reported(context, process):
continue
previous_status = self.get_process_status_cache(process)
if self.is_status_updated(process, previous_status):
new_status = self.copy_process_status(process)
self.update_downed_connections(process.id, new_status)
status_changed_vpn_services.append(new_status)
self.process_status_cache[process.id] = (
self.copy_process_status(process))
# We need unset updated_pending status after it
# is reported to the server side
self.unset_updated_pending_status(process)
if status_changed_vpn_services:
self.agent_rpc.update_status(
context,
status_changed_vpn_services)
@log_helpers.log_method_call
@lockutils.synchronized('vpn-agent', 'neutron-')
def sync(self, context: context.ContextBase, routers):
"""Sync status with server side.
:param context: context object for RPC call
:param routers: Router objects which is created in this sync event
There could be many failure cases should be
considered including the followings.
1) Agent class restarted
2) Failure on process creation
3) VpnService is deleted during agent down
4) RPC failure
In order to handle these failure cases,
This driver takes simple sync strategies.
"""
vpnservices = self.agent_rpc.get_vpn_services_on_host(
context, self.host)
router_ids = [vpnservice["router_id"] for vpnservice in vpnservices]
sync_router_ids = [router["id"] for router in routers]
self._sync_vpn_processes(vpnservices, sync_router_ids)
self._delete_vpn_processes(sync_router_ids, router_ids)
self._cleanup_stale_vpn_processes(router_ids)
self.report_status(context)
def _sync_vpn_processes(self, vpnservices, sync_router_ids):
# Ensure the ipsec process is enabled only for
# - the vpn services which are not yet in self.processes
# - vpn services whose router id is in 'sync_router_ids'
for vpnservice in vpnservices:
if vpnservice['router_id'] not in self.processes or (
vpnservice['router_id'] in sync_router_ids):
process: ty.Optional[BaseSwanProcess] = self.ensure_process(
vpnservice['router_id'], vpnservice=vpnservice)
if not process:
return
self._update_nat(vpnservice, self.add_nat_rule)
router = self.routers.get(vpnservice['router_id'])
if not router:
continue
# For HA router, spawn vpn process on master router
# and terminate vpn process on backup router
if router.router['ha'] and router.ha_state == 'backup':
process.disable()
else:
process.update()
def _delete_vpn_processes(self, sync_router_ids, vpn_router_ids):
# Delete any IPSec processes that are
# associated with routers, but are not running the VPN service.
for process_id in sync_router_ids:
if process_id not in vpn_router_ids:
self.destroy_process(process_id)
def _cleanup_stale_vpn_processes(self, vpn_router_ids):
# Delete any IPSec processes running
# VPN that do not have an associated router.
process_ids = [pid for pid in self.processes
if pid not in vpn_router_ids]
for process_id in process_ids:
self.destroy_process(process_id)
class OpenSwanDriver(IPsecDriver):
def create_process(self, process_id: str, vpnservice,
namespace: str) -> BaseSwanProcess:
return OpenSwanProcess(
self.conf,
process_id,
vpnservice,
namespace)