MongoDB schema comparison: large objects vs. hash buckets

Original Schema

The original-insert.php script creates 2,000 documents with the following schema:

{
    "_id" : ObjectId("52b3815de84df102428b4567"),
    "appver" : NumberLong(123456),
    "deploytype" : "production",
    "g" : NumberLong(123456),
    "guid" : "e91b59a9-eccd-5cbc-bfee-724e4394c842",
    "timeslice" : {
        "y" : NumberLong(13),
        "mo" : NumberLong(12),
        "d" : NumberLong(19),
        "h" : NumberLong(18),
        "m" : NumberLong(29)
    },
    "random" : "52b382730663e",
    "stats" : {
        "eventnames" : {
            "baz-baz-baz-baz-baz-baz-0" : NumberLong(0)
        },
        "events" : NumberLong(0)
    }
}

The stats.eventnames object has 20,000 keys, which share one of three prefixes. The sum of their values is stored in stats.events.

For the update test (original-update.php), we find a document by appver, deploytype, g, guid, and timeslice. For the atomic update, we $set the random field to a new string, $inc five random keys in stats.eventnames, and finally $inc stats.events by 5. The test executes 10,000 updates (each of the 2,000 documents is processed 5 times).
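
For illustration, a single update pairs a query on the identifying fields with a newObj along these lines (the field values are taken from the sample document above; the two event counters shown are hypothetical examples):

$query = [
    'appver' => 123456,
    'deploytype' => 'production',
    'g' => 123456,
    'guid' => 'e91b59a9-eccd-5cbc-bfee-724e4394c842',
    'timeslice' => ['y' => 13, 'mo' => 12, 'd' => 19, 'h' => 18, 'm' => 29],
];

$newobj = [
    '$set' => ['random' => uniqid()],
    '$inc' => [
        'stats.events' => 5,
        // five randomly chosen counters, e.g.:
        'stats.eventnames.foo-foo-foo-foo-foo-foo-42' => 1,
        'stats.eventnames.bar-bar-bar-bar-bar-bar-7' => 1,
        // ...
    ],
];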

This benchmark is meant to stress MongoDB's walking of BSON objects with many keys at the same level. The keys intentionally share a common prefix so that the string comparison for each key in the object is more expensive (i.e. it cannot short-circuit as quickly).

Bucket Schema

The bucket-insert.php script creates 2,000 documents with the following schema:

{
    "_id" : ObjectId("52b3815de84df102428b4567"),
    "appver" : NumberLong(123456),
    "deploytype" : "production",
    "g" : NumberLong(123456),
    "guid" : "e91b59a9-eccd-5cbc-bfee-724e4394c842",
    "timeslice" : {
        "y" : NumberLong(13),
        "mo" : NumberLong(12),
        "d" : NumberLong(19),
        "h" : NumberLong(18),
        "m" : NumberLong(29)
    },
    "random" : "52b382730663e",
    "stats" : {
        "eventnames" : {
            "15" : {
                "baz-baz-baz-baz-baz-baz-0" : NumberLong(0)
            }
        },
        "events" : NumberLong(0)
    }
}

Unlike in the original schema, keys that would otherwise appear directly in the stats.eventnames object are bucketed by the first two characters of their MD5 hash. The sum of the final values is still stored in stats.events.
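
A minimal sketch of the bucketing, mirroring the create_eventnames() function in bucket-insert.php:

$eventname  = 'baz-baz-baz-baz-baz-baz-0';
$bucketname = substr(md5($eventname), 0, 2); // first two hex characters of the hash (e.g. "15" in the sample above)

// Each counter is then addressed by a two-level dotted path
$path = "stats.eventnames.$bucketname.$eventname";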

The update test (bucket-update.php) performs the same updates as the original script, but the $inc operations target events by their bucket path. This test executes 10,000 updates (each of the 2,000 documents is processed 5 times).

This benchmark is meant to measure the improvement gained by avoiding many string comparisons while iterating through BSON object keys. Conceivably, multiple levels of bucketing could be implemented (up to a point of diminishing returns).
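
Such a multi-level scheme is not implemented by these scripts, but a second level could hypothetically be derived from the next two hash characters, along these lines:

$hash    = md5($eventname);
$bucket1 = substr($hash, 0, 2);
$bucket2 = substr($hash, 2, 2);

// Hypothetical two-level bucket path (not used in this benchmark)
$path = "stats.eventnames.$bucket1.$bucket2.$eventname";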

Benchmark Results

While inserts are rather inefficient (PHP creates the documents on demand and does not use batch insertion), the query/newObj arguments for all update operations are generated in advance so that updates can be issued to MongoDB as quickly as possible. A write concern of zero is also used so that PHP does not wait for a response from MongoDB before issuing the next update operation.
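
In the update scripts this amounts to passing the write concern as a per-operation option:

// Fire-and-forget update; the driver does not wait for a server acknowledgement
$c->update($query, $newobj, ['w' => 0]);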

Original

$ time php original-update.php
Updated 10000 documents in 18.351067 seconds (avg: 0.001835/document)

real	0m33.740s
user	0m12.820s
sys	0m0.428s

And mongostat output during the benchmark:

insert  query update delete getmore command flushes mapped  vsize    res faults  locked db idx miss %     qr|qw   ar|aw  netIn netOut  conn       time 
    *0     *0     *0     *0      21     1|0       0  8.03g  16.3g  7.38g      0  test:0.0%          0       0|0     0|0     1k    96m     3   18:18:14 
    *0     *0    373     *0       7     3|0       0  8.03g  16.3g  7.41g      0 test:66.9%          0       0|0     0|1   211k    27m     3   18:18:15 
    *0     *0    514     *0       0     1|0       0  8.03g  16.3g  6.64g      0 test:98.3%          0       0|0     0|1   292k     2k     3   18:18:16 
    *0     *0    532     *0       0     1|0       0  8.03g  16.3g  6.96g      0 test:98.0%          0       0|0     0|1   302k     2k     3   18:18:17 
    *0     *0    527     *0       0     1|0       0  8.03g  16.3g  6.33g      0 test:98.5%          0       0|0     0|1   299k     2k     3   18:18:18 
    *0     *0    522     *0       0     1|0       0  8.03g  16.3g  6.25g      0 test:98.2%          0       0|0     0|1   296k     2k     3   18:18:19 
    *0     *0    508     *0       0     1|0       0  8.03g  16.3g  6.19g      0 test:98.4%          0       0|0     0|1   288k     2k     3   18:18:20 
    *0     *0    534     *0       0     1|0       0  8.03g  16.3g   6.5g      0 test:98.2%          0       0|0     0|1   303k     2k     3   18:18:21 
    *0     *0    520     *0       0     1|0       0  8.03g  16.3g  6.29g      0 test:98.3%          0       0|0     0|1   295k     2k     3   18:18:22 
    *0     *0    526     *0       0     1|0       0  8.03g  16.3g  6.31g      0 test:98.4%          0       0|0     0|1   298k     2k     3   18:18:23 
    *0     *0    503     *0       0     2|0       0  8.03g  16.3g  6.12g      0 test:98.2%          0       0|0     0|1   285k     2k     3   18:18:24 
    *0     *0    532     *0       0     1|0       0  8.03g  16.3g  6.44g      0 test:98.2%          0       0|0     0|1   302k     2k     3   18:18:25 
    *0     *0    524     *0       0     1|0       0  8.03g  16.3g  6.34g      0 test:98.6%          0       0|0     0|1   297k     2k     3   18:18:26 
    *0     *0    522     *0       0     1|0       0  8.03g  16.3g  6.34g      0 test:98.1%          0       0|0     0|1   296k     2k     3   18:18:27 
    *0     *0    513     *0       0     1|0       0  8.03g  16.3g  6.15g      0 test:98.4%          0       0|0     0|1   291k     2k     3   18:18:28 
    *0     *0    520     *0       0     1|0       0  8.03g  16.3g  6.34g      0 test:98.3%          0       0|0     0|1   295k     2k     3   18:18:29 
    *0     *0    524     *0       0     1|0       0  8.03g  16.3g   6.3g      0 test:98.3%          0       0|0     0|1   297k     2k     3   18:18:30 
    *0     *0    525     *0       0     1|0       0  8.03g  16.3g  6.24g      0 test:98.3%          0       0|0     0|1   298k     2k     3   18:18:31 
    *0     *0    472     *0       0     1|0       0  8.03g  16.3g  5.98g      0 test:90.8%          0       0|1     0|1   268k     2k     3   18:18:32 
    *0     *0    519     *0       0     2|0       0  8.03g  16.3g  6.29g      0 test:98.1%          0       0|0     0|1   295k     2k     3   18:18:33 
    *0     *0    290     *0       0     1|0       0  8.03g  16.3g  6.27g      0 test:56.5%          0       0|0     0|0   165k     2k     2   18:18:34 
    *0     *0     *0     *0       0     1|0       0  8.03g  16.3g  5.98g      0     .:1.3%          0       0|0     0|0    62b     2k     2   18:18:35

Bucket

$ time php bucket-update.php 
Updated 10000 documents in 1.469424 seconds (avg: 0.000147/document)

real	0m15.805s
user	0m11.916s
sys	0m0.508s

And mongostat output during the benchmark:

insert  query update delete getmore command flushes mapped  vsize    res faults  locked db idx miss %     qr|qw   ar|aw  netIn netOut  conn       time 
    *0     *0     *0     *0      22     1|0       0  8.03g  16.3g  7.41g      0  test:0.1%          0       0|0     0|0     1k   101m     3   18:20:16 
    *0     *0   4210     *0       2     3|0       0  8.03g  16.3g  7.42g      0 test:71.6%          0       0|0     0|0     2m     4m     3   18:20:17 
    *0     *0   3542     *0       0     1|0       0  8.03g  16.3g  7.42g      0 test:87.8%          0       0|0     0|1     2m     2k     3   18:20:18 
    *0     *0   2248     *0       0     1|0       0  8.03g  16.3g  6.29g      0 test:46.4%          0       0|0     0|0     1m     2k     2   18:20:19 
    *0     *0     *0     *0       0     1|0       0  8.03g  16.3g  6.26g      0     .:0.2%          0       0|0     0|0    62b     2k     2   18:20:20

<?php
// bucket-insert.php: creates 2,000 documents using the bucketed schema

function create_guid() {
    $chars = md5(uniqid(rand(), true));

    return sprintf(
        '%s-%s-%s-%s-%s',
        substr($chars, 0, 8),
        substr($chars, 8, 4),
        substr($chars, 12, 4),
        substr($chars, 16, 4),
        substr($chars, 20, 12)
    );
}

function create_timeslice() {
    $date = getdate();

    return [
        'y' => $date['year'] % 100,
        'mo' => $date['mon'],
        'd' => $date['mday'],
        'h' => $date['hours'],
        'm' => $date['minutes'],
    ];
}

function create_eventnames($n) {
    static $prefixes = [
        'foo-foo-foo-foo-foo-foo',
        'bar-bar-bar-bar-bar-bar',
        'baz-baz-baz-baz-baz-baz',
    ];

    $object = new \stdClass();

    for ($i = 0; $i < $n; $i++) {
        $eventname = sprintf('%s-%d', $prefixes[rand(0, 2)], $i);
        // Bucket each event counter by the first two characters of its MD5 hash
        $bucketname = substr(md5($eventname), 0, 2);

        if ( ! isset($object->$bucketname)) {
            $object->$bucketname = new \stdClass();
        }

        $object->$bucketname->$eventname = 0;
    }

    return $object;
}

function create_document() {
    return [
        '_id' => new MongoId(),
        'appver' => 123456,
        'deploytype' => 'production',
        'g' => 123456,
        'guid' => create_guid(),
        'timeslice' => create_timeslice(),
        'random' => uniqid(),
        'stats' => [
            'eventnames' => create_eventnames(20000),
            'events' => 0,
        ],
    ];
}

$m = new MongoClient();
$c = $m->test->bucket;
$c->drop();

for ($i = 0; $i < 2000; $i++) {
    $c->insert(create_document(), ['w' => 0]);
}

<?php
// bucket-update.php: runs 10,000 updates against the bucketed schema

$m = new MongoClient();
$c = $m->test->bucket;

$c->ensureIndex([
    'appver' => 1,
    'deploytype' => 1,
    'g' => 1,
    'guid' => 1,
    'timeslice' => 1,
]);

// Pre-generate the query/newObj pairs so the timed loop only issues updates
$updates = [];

foreach ($c->find() as $document) {
    $query = array_intersect_key($document, [ 'appver' => 1, 'deploytype' => 1, 'g' => 1, 'guid' => 1, 'timeslice' => 1 ]);

    $newobj = [
        '$set' => [ 'random' => uniqid() ],
        '$inc' => [
            'stats.events' => 5,
        ],
    ];

    // Increment one random event counter in each of five random buckets
    foreach (array_rand($document['stats']['eventnames'], 5) as $bucketname) {
        $eventname = array_rand($document['stats']['eventnames'][$bucketname], 1);
        $newobj['$inc']["stats.eventnames.$bucketname.$eventname"] = 1;
    }

    $updates[] = [ $query, $newobj ];
}

$count = $c->count();
$limit = 10000;

$start = microtime(true);

for ($i = 0; $i < $limit; $i++) {
    $query = $updates[$i % $count][0];
    $newobj = $updates[$i % $count][1];
    $c->update($query, $newobj, ['w' => 0]);
}

$end = microtime(true);

printf("Updated %d documents in %f seconds (avg: %f/document)\n", $limit, ($end - $start), ($end - $start) / $limit);

<?php
// original-insert.php: creates 2,000 documents using the original schema

function create_guid() {
    $chars = md5(uniqid(rand(), true));

    return sprintf(
        '%s-%s-%s-%s-%s',
        substr($chars, 0, 8),
        substr($chars, 8, 4),
        substr($chars, 12, 4),
        substr($chars, 16, 4),
        substr($chars, 20, 12)
    );
}

function create_timeslice() {
    $date = getdate();

    return [
        'y' => $date['year'] % 100,
        'mo' => $date['mon'],
        'd' => $date['mday'],
        'h' => $date['hours'],
        'm' => $date['minutes'],
    ];
}

function create_eventnames($n) {
    static $prefixes = [
        'foo-foo-foo-foo-foo-foo',
        'bar-bar-bar-bar-bar-bar',
        'baz-baz-baz-baz-baz-baz',
    ];

    $object = new \stdClass();

    // All event counters live at the same level of the stats.eventnames object
    for ($i = 0; $i < $n; $i++) {
        $eventname = sprintf('%s-%d', $prefixes[rand(0, 2)], $i);
        $object->$eventname = 0;
    }

    return $object;
}

function create_document() {
    return [
        '_id' => new MongoId(),
        'appver' => 123456,
        'deploytype' => 'production',
        'g' => 123456,
        'guid' => create_guid(),
        'timeslice' => create_timeslice(),
        'random' => uniqid(),
        'stats' => [
            'eventnames' => create_eventnames(20000),
            'events' => 0,
        ],
    ];
}

$m = new MongoClient();
$c = $m->test->original;
$c->drop();

for ($i = 0; $i < 2000; $i++) {
    $c->insert(create_document(), ['w' => 0]);
}

<?php
// original-update.php: runs 10,000 updates against the original schema

$m = new MongoClient();
$c = $m->test->original;

$c->ensureIndex([
    'appver' => 1,
    'deploytype' => 1,
    'g' => 1,
    'guid' => 1,
    'timeslice' => 1,
]);

// Pre-generate the query/newObj pairs so the timed loop only issues updates
$updates = [];

foreach ($c->find() as $document) {
    $query = array_intersect_key($document, [ 'appver' => 1, 'deploytype' => 1, 'g' => 1, 'guid' => 1, 'timeslice' => 1 ]);

    $newobj = [
        '$set' => [ 'random' => uniqid() ],
        '$inc' => [ 'stats.events' => 5 ],
    ];

    // Increment five random event counters by their top-level key
    foreach (array_rand($document['stats']['eventnames'], 5) as $eventname) {
        $newobj['$inc']["stats.eventnames.$eventname"] = 1;
    }

    $updates[] = [ $query, $newobj ];
}

$count = $c->count();
$limit = 10000;

$start = microtime(true);

for ($i = 0; $i < $limit; $i++) {
    $query = $updates[$i % $count][0];
    $newobj = $updates[$i % $count][1];
    $c->update($query, $newobj, ['w' => 0]);
}

$end = microtime(true);

printf("Updated %d documents in %f seconds (avg: %f/document)\n", $limit, ($end - $start), ($end - $start) / $limit);