Add require_tenant_aggregate request filter
This adds a require_tenant_aggregate request filter which uses overlaid nova and placement aggregates to limit placement results during scheduling. It uses the same `filter_tenant_id` metadata key as the existing scheduler filter we have today, so people already doing this with that filter will be able to enable this and get placement to pre-filter those hosts for them automatically. This also allows making this filter advisory but not required, and supports multiple tenants per aggregate, unlike the original filter. Related to blueprint placement-req-filter Change-Id: Idb52b2a9af539df653da7a36763cb9a1d0de3d1b
This commit is contained in:
@@ -150,6 +150,34 @@ scheduler, this option has no effect.
|
||||
Number of workers for the nova-scheduler service. The default will be the
|
||||
number of CPUs available if using the "filter_scheduler" scheduler driver,
|
||||
otherwise the default will be 1.
|
||||
"""),
|
||||
cfg.BoolOpt("limit_tenants_to_placement_aggregate",
|
||||
default=False,
|
||||
help="""
|
||||
This setting causes the scheduler to look up a host aggregate with the
|
||||
metadata key of `filter_tenant_id` set to the project of an incoming
|
||||
request, and request results from placement be limited to that aggregate.
|
||||
Multiple tenants may be added to a single aggregate by appending a serial
|
||||
number to the key, such as `filter_tenant_id:123`.
|
||||
|
||||
The matching aggregate UUID must be mirrored in placement for proper
|
||||
operation. If no host aggregate with the tenant id is found, or that
|
||||
aggregate does not match one in placement, the result will be the same
|
||||
as not finding any suitable hosts for the request.
|
||||
|
||||
See also the placement_aggregate_required_for_tenants option.
|
||||
"""),
|
||||
cfg.BoolOpt("placement_aggregate_required_for_tenants",
|
||||
default=False,
|
||||
help="""
|
||||
This setting, when limit_tenants_to_placement_aggregate=True, will control
|
||||
whether or not a tenant with no aggregate affinity will be allowed to schedule
|
||||
to any available node. If aggregates are used to limit some tenants but
|
||||
not all, then this should be False. If all tenants should be confined via
|
||||
aggregate, then this should be True to prevent them from receiving unrestricted
|
||||
scheduling to any available node.
|
||||
|
||||
See also the limit_tenants_to_placement_aggregate option.
|
||||
"""),
|
||||
]
|
||||
|
||||
|
@@ -13,13 +13,55 @@
|
||||
from oslo_log import log as logging
|
||||
|
||||
import nova.conf
|
||||
from nova import exception
|
||||
from nova.i18n import _
|
||||
from nova import objects
|
||||
|
||||
|
||||
CONF = nova.conf.CONF
|
||||
LOG = logging.getLogger(__name__)
|
||||
TENANT_METADATA_KEY = 'filter_tenant_id'
|
||||
|
||||
|
||||
def require_tenant_aggregate(ctxt, request_spec):
|
||||
"""Require hosts in an aggregate based on tenant id.
|
||||
|
||||
This will modify request_spec to request hosts in an aggregate
|
||||
defined specifically for the tenant making the request. We do that
|
||||
by looking for a nova host aggregate with metadata indicating which
|
||||
tenant it is for, and passing that aggregate uuid to placement to
|
||||
limit results accordingly.
|
||||
"""
|
||||
|
||||
enabled = CONF.scheduler.limit_tenants_to_placement_aggregate
|
||||
agg_required = CONF.scheduler.placement_aggregate_required_for_tenants
|
||||
if not enabled:
|
||||
return
|
||||
|
||||
aggregates = objects.AggregateList.get_by_metadata(
|
||||
ctxt, value=request_spec.project_id)
|
||||
aggregate_uuids_for_tenant = set([])
|
||||
for agg in aggregates:
|
||||
for key, value in agg.metadata.items():
|
||||
if key.startswith(TENANT_METADATA_KEY):
|
||||
aggregate_uuids_for_tenant.add(agg.uuid)
|
||||
break
|
||||
|
||||
if aggregate_uuids_for_tenant:
|
||||
if ('requested_destination' not in request_spec or
|
||||
request_spec.requested_destination is None):
|
||||
request_spec.requested_destination = objects.Destination()
|
||||
destination = request_spec.requested_destination
|
||||
destination.require_aggregates(aggregate_uuids_for_tenant)
|
||||
elif agg_required:
|
||||
LOG.warning('Tenant %(tenant)s has no available aggregates',
|
||||
{'tenant': request_spec.project_id})
|
||||
raise exception.RequestFilterFailed(
|
||||
reason=_('No hosts available for tenant'))
|
||||
|
||||
|
||||
ALL_REQUEST_FILTERS = [
|
||||
require_tenant_aggregate,
|
||||
]
|
||||
|
||||
|
||||
|
@@ -10,7 +10,17 @@
|
||||
# License for the specific language governing permissions and limitations
|
||||
# under the License.
|
||||
|
||||
import time
|
||||
|
||||
from nova.scheduler.client import report
|
||||
|
||||
from nova import context as nova_context
|
||||
from nova import test
|
||||
from nova.tests import fixtures as nova_fixtures
|
||||
from nova.tests.functional import integrated_helpers
|
||||
import nova.tests.unit.image.fake
|
||||
from nova.tests.unit import policy_fixture
|
||||
from nova.virt import fake
|
||||
|
||||
|
||||
class AggregatesTest(integrated_helpers._IntegratedTestBase):
|
||||
@@ -39,3 +49,222 @@ class AggregatesTest(integrated_helpers._IntegratedTestBase):
|
||||
self.start_service('compute', host='compute2')
|
||||
self.host_mappings['compute2'].destroy()
|
||||
self.assertEqual(2, self._add_hosts_to_aggregate())
|
||||
|
||||
|
||||
class AggregateRequestFiltersTest(test.TestCase,
|
||||
integrated_helpers.InstanceHelperMixin):
|
||||
microversion = 'latest'
|
||||
compute_driver = 'fake.MediumFakeDriver'
|
||||
|
||||
def setUp(self):
|
||||
self.flags(compute_driver=self.compute_driver)
|
||||
super(AggregateRequestFiltersTest, self).setUp()
|
||||
|
||||
self.useFixture(policy_fixture.RealPolicyFixture())
|
||||
self.useFixture(nova_fixtures.NeutronFixture(self))
|
||||
self.useFixture(nova_fixtures.AllServicesCurrent())
|
||||
|
||||
placement = self.useFixture(nova_fixtures.PlacementFixture())
|
||||
self.placement_api = placement.api
|
||||
api_fixture = self.useFixture(nova_fixtures.OSAPIFixture(
|
||||
api_version='v2.1'))
|
||||
|
||||
self.admin_api = api_fixture.admin_api
|
||||
self.admin_api.microversion = self.microversion
|
||||
self.api = self.admin_api
|
||||
|
||||
# the image fake backend needed for image discovery
|
||||
nova.tests.unit.image.fake.stub_out_image_service(self)
|
||||
|
||||
self.start_service('conductor')
|
||||
self.scheduler_service = self.start_service('scheduler')
|
||||
|
||||
self.computes = {}
|
||||
self.aggregates = {}
|
||||
|
||||
self._start_compute('host1')
|
||||
self._start_compute('host2')
|
||||
|
||||
self.context = nova_context.get_admin_context()
|
||||
self.report_client = report.SchedulerReportClient()
|
||||
|
||||
self.flavors = self.api.get_flavors()
|
||||
|
||||
# Aggregate with only host1
|
||||
self._create_aggregate('only-host1')
|
||||
self._add_host_to_aggregate('only-host1', 'host1')
|
||||
|
||||
# Aggregate with only host2
|
||||
self._create_aggregate('only-host2')
|
||||
self._add_host_to_aggregate('only-host2', 'host2')
|
||||
|
||||
# Aggregate with neither host
|
||||
self._create_aggregate('no-hosts')
|
||||
|
||||
# Default to enabling the filter and making it mandatory
|
||||
self.flags(limit_tenants_to_placement_aggregate=True,
|
||||
group='scheduler')
|
||||
self.flags(placement_aggregate_required_for_tenants=True,
|
||||
group='scheduler')
|
||||
|
||||
def _start_compute(self, host):
|
||||
"""Start a nova compute service on the given host
|
||||
|
||||
:param host: the name of the host that will be associated to the
|
||||
compute service.
|
||||
:return: the nova compute service object
|
||||
"""
|
||||
fake.set_nodes([host])
|
||||
self.addCleanup(fake.restore_nodes)
|
||||
compute = self.start_service('compute', host=host)
|
||||
self.computes[host] = compute
|
||||
return compute
|
||||
|
||||
def _create_aggregate(self, name):
|
||||
agg = self.admin_api.post_aggregate({'aggregate': {'name': name}})
|
||||
self.aggregates[name] = agg
|
||||
|
||||
def _get_provider_uuid_by_host(self, host):
|
||||
"""Return the compute node uuid for a named compute host."""
|
||||
# NOTE(gibi): the compute node id is the same as the compute node
|
||||
# provider uuid on that compute
|
||||
resp = self.admin_api.api_get(
|
||||
'os-hypervisors?hypervisor_hostname_pattern=%s' % host).body
|
||||
return resp['hypervisors'][0]['id']
|
||||
|
||||
def _add_host_to_aggregate(self, agg, host):
|
||||
"""Add a compute host to both nova and placement aggregates.
|
||||
|
||||
:param agg: Name of the nova aggregate
|
||||
:param host: Name of the compute host
|
||||
"""
|
||||
agg = self.aggregates[agg]
|
||||
self.admin_api.add_host_to_aggregate(agg['id'], host)
|
||||
|
||||
host_uuid = self._get_provider_uuid_by_host(host)
|
||||
|
||||
# Get the existing aggregates for this host in placement and add the
|
||||
# new one to it
|
||||
aggs = self.report_client.get(
|
||||
'/resource_providers/%s/aggregates' % host_uuid,
|
||||
version='1.1').json()
|
||||
placement_aggs = aggs['aggregates']
|
||||
placement_aggs.append(agg['uuid'])
|
||||
|
||||
# Make sure we have a view of the provider we're about to mess with
|
||||
# FIXME(efried): This should be a thing we can do without internals
|
||||
self.report_client._ensure_resource_provider(self.context, host_uuid)
|
||||
|
||||
self.report_client.set_aggregates_for_provider(self.context, host_uuid,
|
||||
placement_aggs)
|
||||
|
||||
def _grant_tenant_aggregate(self, agg, tenants):
|
||||
"""Grant a set of tenants access to use an aggregate.
|
||||
|
||||
:param agg: Name of the nova aggregate
|
||||
:param tenants: A list of all tenant ids that will be allowed access
|
||||
"""
|
||||
agg = self.aggregates[agg]
|
||||
action = {
|
||||
'set_metadata': {
|
||||
'metadata': {
|
||||
'filter_tenant_id%i' % i: tenant
|
||||
for i, tenant in enumerate(tenants)
|
||||
}
|
||||
},
|
||||
}
|
||||
self.admin_api.post_aggregate_action(agg['id'], action)
|
||||
|
||||
def _wait_for_state_change(self, server, from_status):
|
||||
for i in range(0, 50):
|
||||
server = self.api.get_server(server['id'])
|
||||
if server['status'] != from_status:
|
||||
break
|
||||
time.sleep(.1)
|
||||
|
||||
return server
|
||||
|
||||
def _boot_server(self):
|
||||
server_req = self._build_minimal_create_server_request(
|
||||
self.api, 'test-instance', flavor_id=self.flavors[0]['id'],
|
||||
image_uuid='155d900f-4e14-4e4c-a73d-069cbf4541e6',
|
||||
networks='none')
|
||||
|
||||
created_server = self.api.post_server({'server': server_req})
|
||||
server = self._wait_for_state_change(created_server, 'BUILD')
|
||||
|
||||
return server
|
||||
|
||||
def test_tenant_id_required_fails_if_no_aggregate(self):
|
||||
server = self._boot_server()
|
||||
# Without granting our tenant permission to an aggregate, instance
|
||||
# creates should fail since aggregates are required
|
||||
self.assertEqual('ERROR', server['status'])
|
||||
|
||||
def test_tenant_id_not_required_succeeds_if_no_aggregate(self):
|
||||
self.flags(placement_aggregate_required_for_tenants=False,
|
||||
group='scheduler')
|
||||
server = self._boot_server()
|
||||
# Without granting our tenant permission to an aggregate, instance
|
||||
# creates should still succeed since aggregates are not required
|
||||
self.assertEqual('ACTIVE', server['status'])
|
||||
|
||||
def _get_instance_host(self, server):
|
||||
srv = self.admin_api.get_server(server['id'])
|
||||
return srv['OS-EXT-SRV-ATTR:host']
|
||||
|
||||
def test_filter_honors_tenant_id(self):
|
||||
tenant = self.api.project_id
|
||||
|
||||
# Grant our tenant access to the aggregate with only host1 in it
|
||||
# and boot some servers. They should all stack up on host1.
|
||||
self._grant_tenant_aggregate('only-host1',
|
||||
['foo', tenant, 'bar'])
|
||||
server1 = self._boot_server()
|
||||
server2 = self._boot_server()
|
||||
self.assertEqual('ACTIVE', server1['status'])
|
||||
self.assertEqual('ACTIVE', server2['status'])
|
||||
|
||||
# Grant our tenant access to the aggregate with only host2 in it
|
||||
# and boot some servers. They should all stack up on host2.
|
||||
self._grant_tenant_aggregate('only-host1',
|
||||
['foo', 'bar'])
|
||||
self._grant_tenant_aggregate('only-host2',
|
||||
['foo', tenant, 'bar'])
|
||||
server3 = self._boot_server()
|
||||
server4 = self._boot_server()
|
||||
self.assertEqual('ACTIVE', server3['status'])
|
||||
self.assertEqual('ACTIVE', server4['status'])
|
||||
|
||||
# Make sure the servers landed on the hosts we had access to at
|
||||
# the time we booted them.
|
||||
hosts = [self._get_instance_host(s)
|
||||
for s in (server1, server2, server3, server4)]
|
||||
expected_hosts = ['host1', 'host1', 'host2', 'host2']
|
||||
self.assertEqual(expected_hosts, hosts)
|
||||
|
||||
def test_filter_with_empty_aggregate(self):
|
||||
tenant = self.api.project_id
|
||||
|
||||
# Grant our tenant access to the aggregate with no hosts in it
|
||||
self._grant_tenant_aggregate('no-hosts',
|
||||
['foo', tenant, 'bar'])
|
||||
server = self._boot_server()
|
||||
self.assertEqual('ERROR', server['status'])
|
||||
|
||||
def test_filter_with_multiple_aggregates_for_tenant(self):
|
||||
tenant = self.api.project_id
|
||||
|
||||
# Grant our tenant access to the aggregate with no hosts in it,
|
||||
# and one with a host.
|
||||
self._grant_tenant_aggregate('no-hosts',
|
||||
['foo', tenant, 'bar'])
|
||||
self._grant_tenant_aggregate('only-host2',
|
||||
['foo', tenant, 'bar'])
|
||||
|
||||
# Boot several servers and make sure they all land on the
|
||||
# only host we have access to.
|
||||
for i in range(0, 4):
|
||||
server = self._boot_server()
|
||||
self.assertEqual('ACTIVE', server['status'])
|
||||
self.assertEqual('host2', self._get_instance_host(server))
|
||||
|
@@ -13,6 +13,8 @@
|
||||
import mock
|
||||
|
||||
from nova import context as nova_context
|
||||
from nova import exception
|
||||
from nova import objects
|
||||
from nova.scheduler import request_filter
|
||||
from nova import test
|
||||
from nova.tests import uuidsentinel as uuids
|
||||
@@ -23,6 +25,8 @@ class TestRequestFilter(test.NoDBTestCase):
|
||||
super(TestRequestFilter, self).setUp()
|
||||
self.context = nova_context.RequestContext(user_id=uuids.user,
|
||||
project_id=uuids.project)
|
||||
self.flags(limit_tenants_to_placement_aggregate=True,
|
||||
group='scheduler')
|
||||
|
||||
def test_process_reqspec(self):
|
||||
fake_filters = [mock.MagicMock(), mock.MagicMock()]
|
||||
@@ -33,3 +37,49 @@ class TestRequestFilter(test.NoDBTestCase):
|
||||
for filter in fake_filters:
|
||||
filter.assert_called_once_with(mock.sentinel.context,
|
||||
mock.sentinel.reqspec)
|
||||
|
||||
@mock.patch('nova.objects.AggregateList.get_by_metadata')
|
||||
def test_require_tenant_aggregate_disabled(self, getmd):
|
||||
self.flags(limit_tenants_to_placement_aggregate=False,
|
||||
group='scheduler')
|
||||
reqspec = mock.MagicMock()
|
||||
request_filter.require_tenant_aggregate(self.context, reqspec)
|
||||
self.assertFalse(getmd.called)
|
||||
|
||||
@mock.patch('nova.objects.AggregateList.get_by_metadata')
|
||||
def test_require_tenant_aggregate(self, getmd):
|
||||
getmd.return_value = [
|
||||
objects.Aggregate(
|
||||
uuid=uuids.agg1,
|
||||
metadata={'filter_tenant_id': 'owner'}),
|
||||
objects.Aggregate(
|
||||
uuid=uuids.agg2,
|
||||
metadata={'filter_tenant_id:12': 'owner'}),
|
||||
objects.Aggregate(
|
||||
uuid=uuids.agg3,
|
||||
metadata={'other_key': 'owner'}),
|
||||
]
|
||||
reqspec = objects.RequestSpec(project_id='owner')
|
||||
request_filter.require_tenant_aggregate(self.context, reqspec)
|
||||
self.assertEqual(
|
||||
','.join(sorted([uuids.agg1, uuids.agg2])),
|
||||
','.join(sorted(
|
||||
reqspec.requested_destination.aggregates[0].split(','))))
|
||||
# Make sure we called with the request spec's tenant and not
|
||||
# necessarily just the one from context.
|
||||
getmd.assert_called_once_with(self.context, value='owner')
|
||||
|
||||
@mock.patch('nova.objects.AggregateList.get_by_metadata')
|
||||
def test_require_tenant_aggregate_no_match(self, getmd):
|
||||
self.flags(placement_aggregate_required_for_tenants=True,
|
||||
group='scheduler')
|
||||
getmd.return_value = []
|
||||
self.assertRaises(exception.RequestFilterFailed,
|
||||
request_filter.require_tenant_aggregate,
|
||||
self.context, mock.MagicMock())
|
||||
|
||||
@mock.patch('nova.objects.AggregateList.get_by_metadata')
|
||||
def test_require_tenant_aggregate_no_match_not_required(self, getmd):
|
||||
getmd.return_value = []
|
||||
request_filter.require_tenant_aggregate(
|
||||
self.context, mock.MagicMock())
|
||||
|
@@ -0,0 +1,11 @@
|
||||
---
|
||||
features:
|
||||
- |
|
||||
The scheduler can now use placement to more efficiently query for hosts within a
|
||||
tenant-restricted aggregate. This requires that a host aggregate is created in
|
||||
nova with the ``filter_tenant_id`` key (optionally suffixed with any string for
|
||||
multiple tenants, like ``filter_tenant_id3=$tenantid``) and the same aggregate
|
||||
is created in placement with an identical UUID. The
|
||||
``[scheduler]/limit_tenants_to_placement_aggregate`` config option enables this
|
||||
behavior and ``[scheduler]/placement_aggregate_required_for_tenants`` makes it
|
||||
either optional or mandatory, allowing only some tenants to be restricted.
|
Reference in New Issue
Block a user