| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266 | <?phpnamespace Aws\DynamoDb;use Aws\CommandInterface;use Aws\CommandPool;use Aws\Exception\AwsException;use Aws\ResultInterface;/** * The WriteRequestBatch is an object that is capable of efficiently sending * DynamoDB BatchWriteItem requests from queued up put and delete item requests. * requests. The batch attempts to send the requests with the fewest requests * to DynamoDB as possible and also re-queues any unprocessed items to ensure * that all items are sent. */class WriteRequestBatch{    /** @var DynamoDbClient DynamoDB client used to perform write operations. */    private $client;    /** @var array Configuration options for the batch. */    private $config;    /** @var array Queue of pending put/delete requests in the batch. */    private $queue;    /**     * Creates a WriteRequestBatch object that is capable of efficiently sending     * DynamoDB BatchWriteItem requests from queued up Put and Delete requests.     *     * @param DynamoDbClient $client DynamoDB client used to send batches.     * @param array          $config Batch configuration options.     *     - table: (string) DynamoDB table used by the batch, this can be     *       overridden for each individual put() or delete() call.     *     - batch_size: (int) The size of each batch (default: 25). The batch     *       size must be between 2 and 25. If you are sending batches of large     *       items, you may consider lowering the batch size, otherwise, you     *       should use 25.     *     - pool_size: (int) This number dictates how many BatchWriteItem     *       requests you would like to do in parallel. For example, if the     *       "batch_size" is 25, and "pool_size" is 3, then you would send 3     *       BatchWriteItem requests at a time, each with 25 items. Please keep     *       your throughput in mind when choosing the "pool_size" option.     *     - autoflush: (bool) This option allows the batch to automatically     *       flush once there are enough items (i.e., "batch_size" * "pool_size")     *       in the queue. This defaults to true, so you must set this to false     *       to stop autoflush.     *     - before: (callable) Executed before every BatchWriteItem operation.     *       It should accept an \Aws\CommandInterface object as its argument.     *     - error: Executed if an error was encountered executing a,     *       BatchWriteItem operation, otherwise errors are ignored. It should     *       accept an \Aws\Exception\AwsException as its argument.     *     * @throws \InvalidArgumentException if the batch size is not between 2 and 25.     */    public function __construct(DynamoDbClient $client, array $config = [])    {        // Apply defaults        $config += [            'table'      => null,            'batch_size' => 25,            'pool_size'  => 1,            'autoflush'  => true,            'before'     => null,            'error'      => null        ];        // Ensure the batch size is valid        if ($config['batch_size'] > 25 || $config['batch_size'] < 2) {            throw new \InvalidArgumentException('"batch_size" must be between 2 and 25.');        }        // Ensure the callbacks are valid        if ($config['before'] && !is_callable($config['before'])) {            throw new \InvalidArgumentException('"before" must be callable.');        }        if ($config['error'] && !is_callable($config['error'])) {            throw new \InvalidArgumentException('"error" must be callable.');        }        // If autoflush is enabled, set the threshold        if ($config['autoflush']) {            $config['threshold'] = $config['batch_size'] * $config['pool_size'];        }        $this->client = $client;        $this->config = $config;        $this->queue = [];    }    /**     * Adds a put item request to the batch.     *     * @param array       $item  Data for an item to put. Format:     *     [     *         'attribute1' => ['type' => 'value'],     *         'attribute2' => ['type' => 'value'],     *         ...     *     ]     * @param string|null $table The name of the table. This must be specified     *                           unless the "table" option was provided in the     *                           config of the WriteRequestBatch.     *     * @return $this     */    public function put(array $item, $table = null)    {        $this->queue[] = [            'table' => $this->determineTable($table),            'data'  => ['PutRequest' => ['Item' => $item]],        ];        $this->autoFlush();        return $this;    }    /**     * Adds a delete item request to the batch.     *     * @param array       $key   Key of an item to delete. Format:     *     [     *         'key1' => ['type' => 'value'],     *         ...     *     ]     * @param string|null $table The name of the table. This must be specified     *                           unless the "table" option was provided in the     *                           config of the WriteRequestBatch.     *     * @return $this     */    public function delete(array $key, $table = null)    {        $this->queue[] = [            'table' => $this->determineTable($table),            'data'  => ['DeleteRequest' => ['Key' => $key]],        ];        $this->autoFlush();        return $this;    }    /**     * Flushes the batch by combining all the queued put and delete requests     * into BatchWriteItem commands and executing them. Unprocessed items are     * automatically re-queued.     *     * @param bool $untilEmpty If true, flushing will continue until the queue     *                         is completely empty. This will make sure that     *                         unprocessed items are all eventually sent.     *     * @return $this     */    public function flush($untilEmpty = true)    {        // Send BatchWriteItem requests until the queue is empty        $keepFlushing = true;        while ($this->queue && $keepFlushing) {            $commands = $this->prepareCommands();            $pool = new CommandPool($this->client, $commands, [                'before' => $this->config['before'],                'concurrency' => $this->config['pool_size'],                'fulfilled'   => function (ResultInterface $result) {                    // Re-queue any unprocessed items                    if ($result->hasKey('UnprocessedItems')) {                        $this->retryUnprocessed($result['UnprocessedItems']);                    }                },                'rejected' => function ($reason) {                    if ($reason instanceof AwsException) {                        $code = $reason->getAwsErrorCode();                        if ($code === 'ProvisionedThroughputExceededException') {                            $this->retryUnprocessed($reason->getCommand()['RequestItems']);                        } elseif (is_callable($this->config['error'])) {                            $this->config['error']($reason);                        }                    }                }            ]);            $pool->promise()->wait();            $keepFlushing = (bool) $untilEmpty;        }        return $this;    }    /**     * Creates BatchWriteItem commands from the items in the queue.     *     * @return CommandInterface[]     */    private function prepareCommands()    {        // Chunk the queue into batches        $batches = array_chunk($this->queue, $this->config['batch_size']);        $this->queue = [];        // Create BatchWriteItem commands for each batch        $commands = [];        foreach ($batches as $batch) {            $requests = [];            foreach ($batch as $item) {                if (!isset($requests[$item['table']])) {                    $requests[$item['table']] = [];                }                $requests[$item['table']][] = $item['data'];            }            $commands[] = $this->client->getCommand(                'BatchWriteItem',                ['RequestItems' => $requests]            );        }        return $commands;    }    /**     * Re-queues unprocessed results with the correct data.     *     * @param array $unprocessed Unprocessed items from a result.     */    private function retryUnprocessed(array $unprocessed)    {        foreach ($unprocessed as $table => $requests) {            foreach ($requests as $request) {                $this->queue[] = [                    'table' => $table,                    'data'  => $request,                ];            }        }    }    /**     * If autoflush is enabled and the threshold is met, flush the batch     */    private function autoFlush()    {        if ($this->config['autoflush']            && count($this->queue) >= $this->config['threshold']        ) {            // Flush only once. Unprocessed items are handled in a later flush.            $this->flush(false);        }    }    /**     * Determine the table name by looking at what was provided and what the     * WriteRequestBatch was originally configured with.     *     * @param string|null $table The table name.     *     * @return string     * @throws \RuntimeException if there was no table specified.     */    private function determineTable($table)    {        $table = $table ?: $this->config['table'];        if (!$table) {            throw new \RuntimeException('There was no table specified.');        }        return $table;    }}
 |