113 lines
3.5 KiB
PHP
113 lines
3.5 KiB
PHP
<?php
|
|
|
|
namespace FOQ\ElasticaBundle\Doctrine;
|
|
|
|
use FOQ\ElasticaBundle\Provider\ProviderInterface;
|
|
use FOQ\ElasticaBundle\Transformer\ModelToElasticaTransformerInterface;
|
|
use Elastica_Type;
|
|
use Elastica_Document;
|
|
use Closure;
|
|
use InvalidArgumentException;
|
|
use FOQ\ElasticaBundle\Provider\NotIndexableException;
|
|
|
|
/**
 * Base provider that indexes the objects of a Doctrine repository into an
 * Elastica type.
 *
 * Concrete subclasses supply the persistence-specific parts (building the
 * query builder, counting and slicing its results); this class drives the
 * batching, the transformation into Elastica documents and progress logging.
 */
abstract class AbstractProvider implements ProviderInterface
{
    /**
     * Elastica type that receives the documents.
     *
     * @var Elastica_Type
     */
    protected $type;

    /**
     * Object manager; only its clear() method is called by this class.
     *
     * @var object
     */
    protected $objectManager;

    /**
     * Value given as $objectClass to the constructor. It is stored here but
     * not read by this class (presumably used by subclasses).
     *
     * @var mixed
     */
    protected $objectClass;

    /**
     * Transformer turning an object into an Elastica document.
     *
     * @var ModelToElasticaTransformerInterface
     */
    protected $transformer;

    /**
     * Provider options, merged with the ones given to the constructor.
     *
     * - batch_size:            number of objects fetched and indexed per step
     * - clear_object_manager:  whether the object manager is cleared after each step
     * - query_builder_method:  not read by this class (presumably used by subclasses)
     *
     * @var array
     */
    protected $options = array(
        'batch_size'           => 100,
        'clear_object_manager' => true,
        'query_builder_method' => 'createQueryBuilder',
    );

    /**
     * @param Elastica_Type                       $type          type to populate
     * @param object                              $objectManager object manager (must expose clear())
     * @param ModelToElasticaTransformerInterface $transformer   object to document transformer
     * @param mixed                               $objectClass   stored as-is in $this->objectClass
     * @param array                               $options       overrides for the default options
     */
    public function __construct(
        Elastica_Type $type,
        $objectManager,
        ModelToElasticaTransformerInterface $transformer,
        $objectClass,
        array $options = array()
    ) {
        $this->type          = $type;
        $this->objectManager = $objectManager;
        $this->objectClass   = $objectClass;
        $this->transformer   = $transformer;
        $this->options       = array_merge($this->options, $options);
    }

    /**
     * Insert the repository objects in the type index
     *
     * Objects are processed in slices of "batch_size" elements. Objects for
     * which the transformer throws NotIndexableException are skipped. After
     * each slice a progress message is passed to the logger closure.
     *
     * @param Closure $loggerClosure called with one string argument per step
     *
     * @throws InvalidArgumentException when the "batch_size" option is not a positive number
     */
    public function populate(Closure $loggerClosure)
    {
        $batchSize = $this->options['batch_size'];
        // A zero, negative or non-numeric batch size would never advance the
        // offset and the loop below would never terminate.
        if (!is_numeric($batchSize) || $batchSize <= 0) {
            throw new InvalidArgumentException('The "batch_size" option must be a positive number.');
        }

        $queryBuilder = $this->createQueryBuilder();
        $nbObjects    = $this->countObjects($queryBuilder);
        $fields       = $this->extractTypeFields();

        for ($offset = 0; $offset < $nbObjects; $offset += $batchSize) {
            $stepStartTime = microtime(true);
            $objects       = $this->fetchSlice($queryBuilder, $batchSize, $offset);

            $documents = array();
            foreach ($objects as $object) {
                try {
                    $documents[] = $this->transformer->transform($object, $fields);
                } catch (NotIndexableException $e) {
                    // skip document
                }
            }

            // Every object of the slice may have been skipped; there is then
            // nothing to index, and Elastica's bulk API is expected to reject
            // an empty document list (verify against the installed version).
            if (count($documents) > 0) {
                $this->type->addDocuments($documents);
            }

            if ($this->options['clear_object_manager']) {
                $this->objectManager->clear();
            }

            $stepNbObjects = count($objects);
            $stepCount     = $stepNbObjects + $offset;

            // The timer may report no elapsed time for a very fast step;
            // avoid dividing by zero in that case.
            $elapsed          = microtime(true) - $stepStartTime;
            $objectsPerSecond = $elapsed > 0 ? $stepNbObjects / $elapsed : 0;

            $loggerClosure(sprintf('%0.1f%% (%d/%d), %d objects/s', 100*$stepCount/$nbObjects, $stepCount, $nbObjects, $objectsPerSecond));
        }
    }

    /**
     * Counts the objects of a query builder
     *
     * @param mixed $queryBuilder the value returned by createQueryBuilder()
     *
     * @return int
     */
    abstract protected function countObjects($queryBuilder);

    /**
     * Fetches a slice of objects
     *
     * @param mixed $queryBuilder the value returned by createQueryBuilder()
     * @param int   $limit        maximum number of objects to return
     * @param int   $offset       position of the first object to return
     *
     * @return array of objects
     */
    abstract protected function fetchSlice($queryBuilder, $limit, $offset);

    /**
     * Creates the query builder used to fetch the documents to index
     *
     * @return mixed query builder, passed back to countObjects() and fetchSlice()
     */
    abstract protected function createQueryBuilder();

    /**
     * Returns the names of the fields declared in the mapping of the type.
     *
     * @return array list of field names
     *
     * @throws \RuntimeException when the mapping contains no "properties" section
     */
    protected function extractTypeFields()
    {
        $mappings = $this->type->getMapping();

        // skip index and type name
        // < 0.16.0 has both index and type levels
        // >= 0.16.0 has only type level
        do {
            // Stop descending once there is nothing left to descend into,
            // instead of calling reset() on a non-array value forever.
            if (!is_array($mappings) || count($mappings) === 0) {
                throw new \RuntimeException('Unable to find the "properties" section in the mapping of the type.');
            }
            $mappings = reset($mappings);
        } while (!is_array($mappings) || !isset($mappings['properties']));

        $properties = $mappings['properties'];
        // "__isInitialized__" is not reported as a field; unset() is a no-op
        // when the key is absent.
        unset($properties['__isInitialized__']);

        return array_keys($properties);
    }
}
|