Skip to content

Commit

Permalink
Merge pull request #361 from acelaya/feature/paginated-visits
Browse files Browse the repository at this point in the history
Feature/paginated visits
  • Loading branch information
acelaya authored Feb 23, 2019
2 parents 08bd4f1 + d2fad01 commit c70077c
Show file tree
Hide file tree
Showing 7 changed files with 85 additions and 28 deletions.
3 changes: 2 additions & 1 deletion CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@ All notable changes to this project will be documented in this file.

The format is based on [Keep a Changelog](https://keepachangelog.com), and this project adheres to [Semantic Versioning](https://semver.org).

## [Unreleased]
## 1.16.0 - 2019-02-23

#### Added

Expand Down Expand Up @@ -61,6 +61,7 @@ The format is based on [Keep a Changelog](https://keepachangelog.com), and this
#### Fixed
* [#317](https://github.com/shlinkio/shlink/issues/317) Fixed error while trying to generate previews because of global config file being deleted by mistake by build script.
* [#307](https://github.com/shlinkio/shlink/issues/307) Fixed memory leak while trying to process huge amounts of visits due to the query not being properly paginated.
## 1.15.1 - 2018-12-16
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
<?php
declare(strict_types=1);

namespace ShlinkioTest\Shlink\Common\Paginator;
namespace ShlinkioTest\Shlink\Common\Paginator\Adapter;

use PHPUnit\Framework\TestCase;
use Prophecy\Prophecy\ObjectProphecy;
Expand Down
30 changes: 26 additions & 4 deletions module/Core/src/Repository/VisitRepository.php
Original file line number Diff line number Diff line change
Expand Up @@ -10,12 +10,34 @@

class VisitRepository extends EntityRepository implements VisitRepositoryInterface
{
public function findUnlocatedVisits(): iterable
/**
* This method will allow you to iterate the whole list of unlocated visits, but loading them into memory in
* smaller blocks of a specific size.
* This will have side effects if you update those rows while you iterate them.
* If you plan to do so, pass the first argument as false in order to disable applying offsets while slicing the
* dataset
*
* @return iterable|Visit[]
*/
public function findUnlocatedVisits(bool $applyOffset = true, int $blockSize = self::DEFAULT_BLOCK_SIZE): iterable
{
$dql = 'SELECT v FROM Shlinkio\Shlink\Core\Entity\Visit AS v WHERE v.visitLocation IS NULL';
$query = $this->getEntityManager()->createQuery($dql);
$dql = <<<DQL
SELECT v FROM Shlinkio\Shlink\Core\Entity\Visit AS v WHERE v.visitLocation IS NULL
DQL;
$query = $this->getEntityManager()->createQuery($dql)
->setMaxResults($blockSize);
$remainingVisitsToProcess = $this->count(['visitLocation' => null]);
$offset = 0;

return $query->iterate();
while ($remainingVisitsToProcess > 0) {
$iterator = $query->setFirstResult($applyOffset ? $offset : null)->iterate();
foreach ($iterator as $key => [$value]) {
yield $key => $value;
}

$remainingVisitsToProcess -= $blockSize;
$offset += $blockSize;
}
}

/**
Expand Down
13 changes: 12 additions & 1 deletion module/Core/src/Repository/VisitRepositoryInterface.php
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,18 @@

interface VisitRepositoryInterface extends ObjectRepository
{
public function findUnlocatedVisits(): iterable;
public const DEFAULT_BLOCK_SIZE = 10000;

/**
* This method will allow you to iterate the whole list of unlocated visits, but loading them into memory in
* smaller blocks of a specific size.
* This will have side effects if you update those rows while you iterate them.
* If you plan to do so, pass the first argument as false in order to disable applying offsets while slicing the
* dataset
*
* @return iterable|Visit[]
*/
public function findUnlocatedVisits(bool $applyOffset = true, int $blockSize = self::DEFAULT_BLOCK_SIZE): iterable;

/**
* @return Visit[]
Expand Down
20 changes: 14 additions & 6 deletions module/Core/src/Service/VisitService.php
Original file line number Diff line number Diff line change
Expand Up @@ -24,9 +24,12 @@ public function locateUnlocatedVisits(callable $geolocateVisit, ?callable $notif
{
/** @var VisitRepository $repo */
$repo = $this->em->getRepository(Visit::class);
$results = $repo->findUnlocatedVisits();
$results = $repo->findUnlocatedVisits(false);
$count = 0;
$persistBlock = 200;

foreach ($results as [$visit]) {
foreach ($results as $visit) {
$count++;
try {
/** @var Location $location */
$location = $geolocateVisit($visit);
Expand All @@ -37,20 +40,25 @@ public function locateUnlocatedVisits(callable $geolocateVisit, ?callable $notif

$location = new VisitLocation($location);
$this->locateVisit($visit, $location, $notifyVisitWithLocation);

// Flush and clear after X iterations
if ($count % $persistBlock === 0) {
$this->em->flush();
$this->em->clear();
}
}

$this->em->flush();
$this->em->clear();
}

private function locateVisit(Visit $visit, VisitLocation $location, ?callable $notifyVisitWithLocation): void
{
$visit->locate($location);

$this->em->persist($visit);
$this->em->flush();

if ($notifyVisitWithLocation !== null) {
$notifyVisitWithLocation($location, $visit);
}

$this->em->clear();
}
}
18 changes: 15 additions & 3 deletions module/Core/test-db/Repository/VisitRepositoryTest.php
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@
use Shlinkio\Shlink\Core\Model\Visitor;
use Shlinkio\Shlink\Core\Repository\VisitRepository;
use ShlinkioTest\Shlink\Common\DbTest\DatabaseTestCase;
use function Functional\map;
use function range;
use function sprintf;

class VisitRepositoryTest extends DatabaseTestCase
Expand All @@ -30,8 +32,11 @@ protected function setUp(): void
$this->repo = $this->getEntityManager()->getRepository(Visit::class);
}

/** @test */
public function findUnlocatedVisitsReturnsProperVisits(): void
/**
* @test
* @dataProvider provideBlockSize
*/
public function findUnlocatedVisitsReturnsProperVisits(int $blockSize): void
{
$shortUrl = new ShortUrl('');
$this->getEntityManager()->persist($shortUrl);
Expand All @@ -50,14 +55,21 @@ public function findUnlocatedVisitsReturnsProperVisits(): void
$this->getEntityManager()->flush();

$resultsCount = 0;
$results = $this->repo->findUnlocatedVisits();
$results = $this->repo->findUnlocatedVisits(true, $blockSize);
foreach ($results as $value) {
$resultsCount++;
}

$this->assertEquals(3, $resultsCount);
}

public function provideBlockSize(): iterable
{
return map(range(1, 5), function (int $value) {
return [$value];
});
}

/** @test */
public function findVisitsByShortCodeReturnsProperData(): void
{
Expand Down
27 changes: 15 additions & 12 deletions module/Core/test/Service/VisitServiceTest.php
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,11 @@
use Shlinkio\Shlink\Core\Service\VisitService;
use function array_shift;
use function count;
use function floor;
use function func_get_args;
use function Functional\map;
use function range;
use function sprintf;

class VisitServiceTest extends TestCase
{
Expand All @@ -35,13 +39,12 @@ public function setUp(): void
/** @test */
public function locateVisitsIteratesAndLocatesUnlocatedVisits(): void
{
$unlocatedVisits = [
[new Visit(new ShortUrl('foo'), Visitor::emptyInstance())],
[new Visit(new ShortUrl('bar'), Visitor::emptyInstance())],
];
$unlocatedVisits = map(range(1, 200), function (int $i) {
return new Visit(new ShortUrl(sprintf('short_code_%s', $i)), Visitor::emptyInstance());
});

$repo = $this->prophesize(VisitRepository::class);
$findUnlocatedVisits = $repo->findUnlocatedVisits()->willReturn($unlocatedVisits);
$findUnlocatedVisits = $repo->findUnlocatedVisits(false)->willReturn($unlocatedVisits);
$getRepo = $this->em->getRepository(Visit::class)->willReturn($repo->reveal());

$persist = $this->em->persist(Argument::type(Visit::class))->will(function () {
Expand All @@ -63,19 +66,19 @@ public function locateVisitsIteratesAndLocatesUnlocatedVisits(): void
$findUnlocatedVisits->shouldHaveBeenCalledOnce();
$getRepo->shouldHaveBeenCalledOnce();
$persist->shouldHaveBeenCalledTimes(count($unlocatedVisits));
$flush->shouldHaveBeenCalledTimes(count($unlocatedVisits));
$clear->shouldHaveBeenCalledTimes(count($unlocatedVisits));
$flush->shouldHaveBeenCalledTimes(floor(count($unlocatedVisits) / 200) + 1);
$clear->shouldHaveBeenCalledTimes(floor(count($unlocatedVisits) / 200) + 1);
}

/** @test */
public function visitsWhichCannotBeLocatedAreIgnored()
public function visitsWhichCannotBeLocatedAreIgnored(): void
{
$unlocatedVisits = [
[new Visit(new ShortUrl('foo'), Visitor::emptyInstance())],
new Visit(new ShortUrl('foo'), Visitor::emptyInstance()),
];

$repo = $this->prophesize(VisitRepository::class);
$findUnlocatedVisits = $repo->findUnlocatedVisits()->willReturn($unlocatedVisits);
$findUnlocatedVisits = $repo->findUnlocatedVisits(false)->willReturn($unlocatedVisits);
$getRepo = $this->em->getRepository(Visit::class)->willReturn($repo->reveal());

$persist = $this->em->persist(Argument::type(Visit::class))->will(function () {
Expand All @@ -92,7 +95,7 @@ public function visitsWhichCannotBeLocatedAreIgnored()
$findUnlocatedVisits->shouldHaveBeenCalledOnce();
$getRepo->shouldHaveBeenCalledOnce();
$persist->shouldNotHaveBeenCalled();
$flush->shouldNotHaveBeenCalled();
$clear->shouldNotHaveBeenCalled();
$flush->shouldHaveBeenCalledOnce();
$clear->shouldHaveBeenCalledOnce();
}
}

0 comments on commit c70077c

Please sign in to comment.