dynamo db indexes

This commit is contained in:
Matt Ferrante 2015-12-31 17:19:23 -05:00 committed by Matt Clay
parent eefd716e8c
commit 99c8e82b60

View file

@ -23,9 +23,8 @@ description:
- Can update the provisioned throughput on existing tables. - Can update the provisioned throughput on existing tables.
- Returns the status of the specified table. - Returns the status of the specified table.
author: Alan Loi (@loia) author: Alan Loi (@loia)
version_added: "2.0"
requirements: requirements:
- "boto >= 2.13.2" - "boto >= 2.37.0"
options: options:
state: state:
description: description:
@ -70,13 +69,18 @@ options:
- Write throughput capacity (units) to provision. - Write throughput capacity (units) to provision.
required: false required: false
default: 1 default: 1
region: indexes:
description: description:
- The AWS region to use. If not specified then the value of the EC2_REGION environment variable, if any, is used. - list of dictionaries describing indexes to add to the table. global indexes can be updated. local indexes don't support updates or have throughput.
- required options: ['name', 'type', 'hash_key_name']
- valid types: ['all', 'global_all', 'global_include', 'global_keys_only', 'include', 'keys_only']
- other options: ['hash_key_type', 'range_key_name', 'range_key_type', 'includes', 'read_capacity', 'write_capacity']
required: false required: false
aliases: ['aws_region', 'ec2_region'] default: []
version_added: "2.1"
extends_documentation_fragment: aws extends_documentation_fragment:
- aws
- ec2
""" """
EXAMPLES = ''' EXAMPLES = '''
@ -98,6 +102,21 @@ EXAMPLES = '''
read_capacity: 10 read_capacity: 10
write_capacity: 10 write_capacity: 10
# set index on existing dynamo table
- dynamodb_table:
name: my-table
region: us-east-1
indexes:
- name: NamedIndex
type: global_include
hash_key_name: id
range_key_name: create_time
includes:
- other_field
- other_field2
read_capacity: 10
write_capacity: 10
# Delete dynamo table # Delete dynamo table
- dynamodb_table: - dynamodb_table:
name: my-table name: my-table
@ -117,20 +136,25 @@ try:
import boto import boto
import boto.dynamodb2 import boto.dynamodb2
from boto.dynamodb2.table import Table from boto.dynamodb2.table import Table
from boto.dynamodb2.fields import HashKey, RangeKey from boto.dynamodb2.fields import HashKey, RangeKey, AllIndex, GlobalAllIndex, GlobalIncludeIndex, GlobalKeysOnlyIndex, IncludeIndex, KeysOnlyIndex
from boto.dynamodb2.types import STRING, NUMBER, BINARY from boto.dynamodb2.types import STRING, NUMBER, BINARY
from boto.exception import BotoServerError, NoAuthHandlerFound, JSONResponseError from boto.exception import BotoServerError, NoAuthHandlerFound, JSONResponseError
from boto.dynamodb2.exceptions import ValidationException
HAS_BOTO = True HAS_BOTO = True
DYNAMO_TYPE_MAP = {
'STRING': STRING,
'NUMBER': NUMBER,
'BINARY': BINARY
}
except ImportError: except ImportError:
HAS_BOTO = False HAS_BOTO = False
DYNAMO_TYPE_DEFAULT = 'STRING'
DYNAMO_TYPE_MAP = { INDEX_REQUIRED_OPTIONS = ['name', 'type', 'hash_key_name']
'STRING': STRING, INDEX_OPTIONS = INDEX_REQUIRED_OPTIONS + ['hash_key_type', 'range_key_name', 'range_key_type', 'includes', 'read_capacity', 'write_capacity']
'NUMBER': NUMBER, INDEX_TYPE_OPTIONS = ['all', 'global_all', 'global_include', 'global_keys_only', 'include', 'keys_only']
'BINARY': BINARY
}
def create_or_update_dynamo_table(connection, module): def create_or_update_dynamo_table(connection, module):
@ -141,21 +165,20 @@ def create_or_update_dynamo_table(connection, module):
range_key_type = module.params.get('range_key_type') range_key_type = module.params.get('range_key_type')
read_capacity = module.params.get('read_capacity') read_capacity = module.params.get('read_capacity')
write_capacity = module.params.get('write_capacity') write_capacity = module.params.get('write_capacity')
all_indexes = module.params.get('indexes')
for index in all_indexes:
validate_index(index, module)
schema = get_schema_param(hash_key_name, hash_key_type, range_key_name, range_key_type)
if range_key_name:
schema = [
HashKey(hash_key_name, DYNAMO_TYPE_MAP.get(hash_key_type)),
RangeKey(range_key_name, DYNAMO_TYPE_MAP.get(range_key_type))
]
else:
schema = [
HashKey(hash_key_name, DYNAMO_TYPE_MAP.get(hash_key_type))
]
throughput = { throughput = {
'read': read_capacity, 'read': read_capacity,
'write': write_capacity 'write': write_capacity
} }
indexes, global_indexes = get_indexes(all_indexes)
result = dict( result = dict(
region=module.params.get('region'), region=module.params.get('region'),
table_name=table_name, table_name=table_name,
@ -165,16 +188,18 @@ def create_or_update_dynamo_table(connection, module):
range_key_type=range_key_type, range_key_type=range_key_type,
read_capacity=read_capacity, read_capacity=read_capacity,
write_capacity=write_capacity, write_capacity=write_capacity,
indexes=all_indexes,
) )
try: try:
table = Table(table_name, connection=connection) table = Table(table_name, connection=connection)
if dynamo_table_exists(table): if dynamo_table_exists(table):
result['changed'] = update_dynamo_table(table, throughput=throughput, check_mode=module.check_mode) result['changed'] = update_dynamo_table(table, throughput=throughput, check_mode=module.check_mode, global_indexes=global_indexes)
else: else:
if not module.check_mode: if not module.check_mode:
Table.create(table_name, connection=connection, schema=schema, throughput=throughput) Table.create(table_name, connection=connection, schema=schema, throughput=throughput, indexes=indexes, global_indexes=global_indexes)
result['changed'] = True result['changed'] = True
if not module.check_mode: if not module.check_mode:
@ -225,16 +250,42 @@ def dynamo_table_exists(table):
raise e raise e
def update_dynamo_table(table, throughput=None, check_mode=False): def update_dynamo_table(table, throughput=None, check_mode=False, global_indexes=None):
table.describe() # populate table details table.describe() # populate table details
throughput_changed = False
global_indexes_changed = False
if has_throughput_changed(table, throughput): if has_throughput_changed(table, throughput):
if not check_mode: if not check_mode:
return table.update(throughput=throughput) throughput_changed = table.update(throughput=throughput)
else: else:
return True throughput_changed = True
return False removed_indexes, added_indexes, index_throughput_changes = get_changed_global_indexes(table, global_indexes)
if removed_indexes:
if not check_mode:
for name, index in removed_indexes.iteritems():
global_indexes_changed = table.delete_global_secondary_index(name) or global_indexes_changed
else:
global_indexes_changed = True
if added_indexes:
if not check_mode:
for name, index in added_indexes.iteritems():
global_indexes_changed = table.create_global_secondary_index(global_index=index) or global_indexes_changed
else:
global_indexes_changed = True
if index_throughput_changes:
if not check_mode:
# todo: remove try once boto has https://github.com/boto/boto/pull/3447 fixed
try:
global_indexes_changed = table.update_global_secondary_index(global_indexes=index_throughput_changes) or global_indexes_changed
except ValidationException as e:
pass
else:
global_indexes_changed = True
return throughput_changed or global_indexes_changed
def has_throughput_changed(table, new_throughput): def has_throughput_changed(table, new_throughput):
@ -245,6 +296,80 @@ def has_throughput_changed(table, new_throughput):
new_throughput['write'] != table.throughput['write'] new_throughput['write'] != table.throughput['write']
def get_schema_param(hash_key_name, hash_key_type, range_key_name, range_key_type):
if range_key_name:
schema = [
HashKey(hash_key_name, DYNAMO_TYPE_MAP.get(hash_key_type, DYNAMO_TYPE_MAP[DYNAMO_TYPE_DEFAULT])),
RangeKey(range_key_name, DYNAMO_TYPE_MAP.get(range_key_type, DYNAMO_TYPE_MAP[DYNAMO_TYPE_DEFAULT]))
]
else:
schema = [
HashKey(hash_key_name, DYNAMO_TYPE_MAP.get(hash_key_type, DYNAMO_TYPE_MAP[DYNAMO_TYPE_DEFAULT]))
]
return schema
def get_changed_global_indexes(table, global_indexes):
table.describe()
table_index_info = dict((index.name, index.schema()) for index in table.global_indexes)
table_index_objects = dict((index.name, index) for index in table.global_indexes)
set_index_info = dict((index.name, index.schema()) for index in global_indexes)
set_index_objects = dict((index.name, index) for index in global_indexes)
removed_indexes = dict((name, index) for name, index in table_index_info.iteritems() if name not in set_index_info)
added_indexes = dict((name, set_index_objects[name]) for name, index in set_index_info.iteritems() if name not in table_index_info)
# todo: uncomment once boto has https://github.com/boto/boto/pull/3447 fixed
# index_throughput_changes = dict((name, index.throughput) for name, index in set_index_objects.iteritems() if name not in added_indexes and (index.throughput['read'] != str(table_index_objects[name].throughput['read']) or index.throughput['write'] != str(table_index_objects[name].throughput['write'])))
# todo: remove once boto has https://github.com/boto/boto/pull/3447 fixed
index_throughput_changes = dict((name, index.throughput) for name, index in set_index_objects.iteritems() if name not in added_indexes)
return removed_indexes, added_indexes, index_throughput_changes
def validate_index(index, module):
for key, val in index.iteritems():
if key not in INDEX_OPTIONS:
module.fail_json(msg='%s is not a valid option for an index' % key)
for required_option in INDEX_REQUIRED_OPTIONS:
if required_option not in index:
module.fail_json(msg='%s is a required option for an index' % required_option)
if index['type'] not in INDEX_TYPE_OPTIONS:
module.fail_json(msg='%s is not a valid index type, must be one of %s' % (index['type'], INDEX_TYPE_OPTIONS))
def get_indexes(all_indexes):
indexes = []
global_indexes = []
for index in all_indexes:
name = index['name']
schema = get_schema_param(index.get('hash_key_name'), index.get('hash_key_type'), index.get('range_key_name'), index.get('range_key_type'))
throughput = {
'read': index.get('read_capacity', 1),
'write': index.get('write_capacity', 1)
}
if index['type'] == 'all':
indexes.append(AllIndex(name, parts=schema))
elif index['type'] == 'global_all':
global_indexes.append(GlobalAllIndex(name, parts=schema, throughput=throughput))
elif index['type'] == 'global_include':
global_indexes.append(GlobalIncludeIndex(name, parts=schema, throughput=throughput, includes=index['includes']))
elif index['type'] == 'global_keys_only':
global_indexes.append(GlobalKeysOnlyIndex(name, parts=schema, throughput=throughput))
elif index['type'] == 'include':
indexes.append(IncludeIndex(name, parts=schema, includes=index['includes']))
elif index['type'] == 'keys_only':
indexes.append(KeysOnlyIndex(name, parts=schema))
return indexes, global_indexes
def main(): def main():
argument_spec = ec2_argument_spec() argument_spec = ec2_argument_spec()
argument_spec.update(dict( argument_spec.update(dict(
@ -256,6 +381,7 @@ def main():
range_key_type=dict(default='STRING', type='str', choices=['STRING', 'NUMBER', 'BINARY']), range_key_type=dict(default='STRING', type='str', choices=['STRING', 'NUMBER', 'BINARY']),
read_capacity=dict(default=1, type='int'), read_capacity=dict(default=1, type='int'),
write_capacity=dict(default=1, type='int'), write_capacity=dict(default=1, type='int'),
indexes=dict(default=[], type='list'),
)) ))
module = AnsibleModule( module = AnsibleModule(