# python-boto3/tests/unit/dynamodb/test_table.py
# Copyright 2015 Amazon.com, Inc. or its affiliates. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"). You
# may not use this file except in compliance with the License. A copy of
# the License is located at
#
# http://aws.amazon.com/apache2.0/
#
# or in the "license" file accompanying this file. This file is
# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF
# ANY KIND, either express or implied. See the License for the specific
# language governing permissions and limitations under the License.

from tests import unittest, mock

from boto3.dynamodb.table import BatchWriter


class BaseTransformationTest(unittest.TestCase):
maxDiff = None

    def setUp(self):
self.client = mock.Mock()
self.client.batch_write_item.return_value = {'UnprocessedItems': {}}
self.table_name = 'tablename'
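        # A small flush amount lets these tests trigger a flush
        # after queueing only a couple of items.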
self.flush_amount = 2
self.batch_writer = BatchWriter(self.table_name, self.client,
self.flush_amount)

    def assert_batch_write_calls_are(self, expected_batch_writes):
self.assertEqual(self.client.batch_write_item.call_count,
len(expected_batch_writes))
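        # Each entry in call_args_list behaves like an (args, kwargs)
        # tuple, so index 1 picks out the keyword arguments that were
        # passed to batch_write_item.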
batch_write_calls = [
args[1] for args in
self.client.batch_write_item.call_args_list
]
self.assertEqual(batch_write_calls, expected_batch_writes)

    def test_batch_write_does_not_immediately_write(self):
self.batch_writer.put_item(Item={'Hash': 'foo'})
self.assertFalse(self.client.batch_write_item.called)

    def test_batch_write_flushes_at_flush_amount(self):
self.batch_writer.put_item(Item={'Hash': 'foo1'})
self.batch_writer.put_item(Item={'Hash': 'foo2'})
expected = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
]
}
}
self.assert_batch_write_calls_are([expected])

    def test_multiple_flushes_reset_items_to_put(self):
self.batch_writer.put_item(Item={'Hash': 'foo1'})
self.batch_writer.put_item(Item={'Hash': 'foo2'})
self.batch_writer.put_item(Item={'Hash': 'foo3'})
self.batch_writer.put_item(Item={'Hash': 'foo4'})
# We should have two batch calls, one for foo1,foo2 and
# one for foo3,foo4.
first_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
]
}
}
second_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
{'PutRequest': {'Item': {'Hash': 'foo4'}}},
]
}
}
self.assert_batch_write_calls_are([first_batch, second_batch])

    def test_can_handle_puts_and_deletes(self):
self.batch_writer.put_item(Item={'Hash': 'foo1'})
self.batch_writer.delete_item(Key={'Hash': 'foo2'})
expected = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'DeleteRequest': {'Key': {'Hash': 'foo2'}}},
]
}
}
self.assert_batch_write_calls_are([expected])

    def test_multiple_batch_calls_with_mixed_deletes(self):
self.batch_writer.put_item(Item={'Hash': 'foo1'})
self.batch_writer.delete_item(Key={'Hash': 'foo2'})
self.batch_writer.delete_item(Key={'Hash': 'foo3'})
self.batch_writer.put_item(Item={'Hash': 'foo4'})
first_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'DeleteRequest': {'Key': {'Hash': 'foo2'}}},
]
}
}
second_batch = {
'RequestItems': {
self.table_name: [
{'DeleteRequest': {'Key': {'Hash': 'foo3'}}},
{'PutRequest': {'Item': {'Hash': 'foo4'}}},
]
}
}
self.assert_batch_write_calls_are([first_batch, second_batch])

    def test_unprocessed_items_added_to_next_batch(self):
self.client.batch_write_item.side_effect = [
{
'UnprocessedItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo2'}}}
],
},
},
# Then the last response shows that everything went through
{'UnprocessedItems': {}}
]
self.batch_writer.put_item(Item={'Hash': 'foo1'})
self.batch_writer.put_item(Item={'Hash': 'foo2'})
self.batch_writer.put_item(Item={'Hash': 'foo3'})
        # We should have sent two batch requests of two items each:
        # foo1,foo2 and then foo2,foo3.  foo2 is sent twice because the
        # first response listed it as an unprocessed item, which means
        # it needs to be part of the next batch.
first_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
]
}
}
second_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
]
}
}
self.assert_batch_write_calls_are([first_batch, second_batch])
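
    def test_unprocessed_deletes_added_to_next_batch(self):
        # A hedged sketch that is not in the original suite: it assumes
        # BatchWriter re-queues unprocessed entries verbatim, so an
        # unprocessed DeleteRequest should flow into the next batch just
        # like the unprocessed PutRequest in the test above.
        self.client.batch_write_item.side_effect = [
            {
                'UnprocessedItems': {
                    self.table_name: [
                        {'DeleteRequest': {'Key': {'Hash': 'foo2'}}}
                    ],
                },
            },
            {'UnprocessedItems': {}},
        ]
        self.batch_writer.put_item(Item={'Hash': 'foo1'})
        self.batch_writer.delete_item(Key={'Hash': 'foo2'})
        self.batch_writer.put_item(Item={'Hash': 'foo3'})
        first_batch = {
            'RequestItems': {
                self.table_name: [
                    {'PutRequest': {'Item': {'Hash': 'foo1'}}},
                    {'DeleteRequest': {'Key': {'Hash': 'foo2'}}},
                ]
            }
        }
        second_batch = {
            'RequestItems': {
                self.table_name: [
                    {'DeleteRequest': {'Key': {'Hash': 'foo2'}}},
                    {'PutRequest': {'Item': {'Hash': 'foo3'}}},
                ]
            }
        }
        self.assert_batch_write_calls_are([first_batch, second_batch])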

    def test_all_items_flushed_on_exit(self):
with self.batch_writer as b:
b.put_item(Item={'Hash': 'foo1'})
self.assert_batch_write_calls_are([
{
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
]
},
},
])

    def test_never_send_more_than_max_batch_size(self):
        # Suppose the server sends back a response indicating that
        # all of the items were unprocessed.
self.client.batch_write_item.side_effect = [
{
'UnprocessedItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
],
},
},
{
'UnprocessedItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
],
},
},
{
'UnprocessedItems': {}
},
]
with BatchWriter(self.table_name, self.client, flush_amount=2) as b:
b.put_item(Item={'Hash': 'foo1'})
b.put_item(Item={'Hash': 'foo2'})
b.put_item(Item={'Hash': 'foo3'})
# Note how we're never sending more than flush_amount=2.
first_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
]
}
}
        # Even though the server reported both items as unprocessed,
        # we still send at most flush_amount=2 items per call, in order.
second_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
]
}
}
        # We still see one more unprocessed item, so we send a final
        # batch.  The buffered foo3 precedes the re-queued foo2 because
        # unprocessed items are appended to the end of the buffer.
third_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
]
}
}
self.assert_batch_write_calls_are([first_batch, second_batch,
third_batch])

    def test_repeated_flushing_on_exit(self):
        # Simulate the server returning unprocessed items
        # across multiple calls.
self.client.batch_write_item.side_effect = [
{
'UnprocessedItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
],
},
},
{
'UnprocessedItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
],
},
},
{
'UnprocessedItems': {}
},
]
with BatchWriter(self.table_name, self.client, flush_amount=4) as b:
b.put_item(Item={'Hash': 'foo1'})
b.put_item(Item={'Hash': 'foo2'})
b.put_item(Item={'Hash': 'foo3'})
# So when we exit, we expect three calls.
# First we try the normal batch write with 3 items:
first_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo1'}}},
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
]
}
}
# Then we see two unprocessed items so we send another batch.
second_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo2'}}},
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
]
}
}
# And then we still see one more unprocessed item so
# we need to send another batch.
third_batch = {
'RequestItems': {
self.table_name: [
{'PutRequest': {'Item': {'Hash': 'foo3'}}},
]
}
}
self.assert_batch_write_calls_are([first_batch, second_batch,
third_batch])
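
# For reference, a minimal sketch of how application code reaches
# BatchWriter through the public resource API (hypothetical table name;
# assumes the table already exists):
#
#     import boto3
#     table = boto3.resource('dynamodb').Table('tablename')
#     with table.batch_writer() as batch:
#         batch.put_item(Item={'Hash': 'foo1'})
#         batch.delete_item(Key={'Hash': 'foo2'})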