Code Coverage
 
Lines
Functions and Methods
Classes and Traits
Total
94.44% covered (success)
94.44%
51 / 54
83.33% covered (warning)
83.33%
5 / 6
CRAP
0.00% covered (danger)
0.00%
0 / 1
EntityReindexer
94.44% covered (success)
94.44%
51 / 54
83.33% covered (warning)
83.33%
5 / 6
9.01
0.00% covered (danger)
0.00%
0 / 1
 __construct
100.00% covered (success)
100.00%
1 / 1
100.00% covered (success)
100.00%
1 / 1
1
 getIndexClass
100.00% covered (success)
100.00%
1 / 1
100.00% covered (success)
100.00%
1 / 1
1
 updateIndex
100.00% covered (success)
100.00%
11 / 11
100.00% covered (success)
100.00%
1 / 1
2
 recalculateIdfForAll
0.00% covered (danger)
0.00%
0 / 3
0.00% covered (danger)
0.00%
0 / 1
2
 createUpdateQuery
100.00% covered (success)
100.00%
28 / 28
100.00% covered (success)
100.00%
1 / 1
2
 recalculateIdf
100.00% covered (success)
100.00%
10 / 10
100.00% covered (success)
100.00%
1 / 1
2
1<?php
2namespace Apie\DoctrineEntityDatalayer;
3
4use Apie\Core\Context\ApieContext;
5use Apie\Core\Entities\EntityInterface;
6use Apie\Core\Indexing\Indexer;
7use Apie\StorageMetadataBuilder\Interfaces\HasIndexInterface;
8use Doctrine\DBAL\ArrayParameterType;
9use Doctrine\DBAL\Platforms\SqlitePlatform;
10use ReflectionClass;
11
12final class EntityReindexer
13{
14    public function __construct(private readonly OrmBuilder $ormBuilder, private readonly Indexer $indexer)
15    {
16    }
17
18    /**
19     * @param ReflectionClass<HasIndexInterface> $doctrineEntity
20     * @return class-string<object>
21     */
22    private function getIndexClass(ReflectionClass $doctrineEntity): string
23    {
24        return $doctrineEntity->getMethod('getIndexTable')->invoke(null)->name;
25    }
26
27    /**
28     * Should be called after storing a doctrine entity from a domain entity. It recalculates the search terms
29     * for the entity. For searching we use TF IDF and recalculate the TF of the entity. The IDF needs to be
30     * recalculated in a separate function with an update query.
31     *
32     * @see https://en.wikipedia.org/wiki/Tf%E2%80%93idf
33     */
34    public function updateIndex(
35        HasIndexInterface $doctrineEntity,
36        EntityInterface $entity,
37        bool $skipIdf = false
38    ): void {
39        $entityManager = $this->ormBuilder->createEntityManager();
40        $newIndexes = $this->indexer->getIndexesForObject(
41            $entity,
42            new ApieContext()
43        );
44        $doctrineEntity->replaceIndexes($newIndexes);
45        $termsToUpdate = array_keys($newIndexes);
46        $entityManager->persist($doctrineEntity);
47        $entityManager->flush();
48        if (!$skipIdf) {
49            $this->recalculateIdf($doctrineEntity, $termsToUpdate);
50        }
51    }
52
53    /**
54     * @param ReflectionClass<HasIndexInterface> $doctrineEntity
55     */
56    public function recalculateIdfForAll(ReflectionClass $doctrineEntity): void
57    {
58        $query = $this->createUpdateQuery($doctrineEntity);
59        $entityManager = $this->ormBuilder->createEntityManager();
60        $entityManager->getConnection()->executeQuery($query);
61    }
62
63    /**
64     * @param ReflectionClass<HasIndexInterface> $doctrineEntity
65     */
66    private function createUpdateQuery(ReflectionClass $doctrineEntity): string
67    {
68        $entityManager = $this->ormBuilder->createEntityManager();
69        $tableName = (new ReflectionClass($this->getIndexClass($doctrineEntity)))->getShortName();
70        $columnName = 'ref_' . $doctrineEntity->getShortName() . '_id';
71        $totalDocumentQuery = sprintf(
72            '(SELECT total_documents FROM (SELECT COUNT(DISTINCT %s) AS total_documents FROM %s WHERE %s IS NOT NULL) AS sub1)',
73            $columnName,
74            $tableName,
75            $columnName
76        );
77        $documentWithTermQuery = sprintf(
78            'SELECT documents_with_term FROM (SELECT text, COUNT(DISTINCT %s) AS documents_with_term FROM %s WHERE %s IS NOT NULL GROUP BY text) AS sub WHERE sub.text',
79            $columnName,
80            $tableName,
81            $columnName
82        );
83        $connection = $entityManager->getConnection();
84        $query = sprintf(
85            'UPDATE %s AS t
86            SET idf = COALESCE(%s((%s)/(%s = t.text LIMIT 1)), 1)
87            WHERE %s IS NOT NULL AND EXISTS (SELECT 1 FROM (SELECT text, COUNT(DISTINCT %s) AS documents_with_term FROM %s GROUP BY text) AS sub WHERE sub.text = t.text LIMIT 1);',
88            $tableName,
89            // @phpstan-ignore class.notFound
90            $connection->getDatabasePlatform() instanceof SqlitePlatform ? '' : 'log',
91            $totalDocumentQuery,
92            $documentWithTermQuery,
93            $columnName,
94            $columnName,
95            $tableName
96        );
97
98        return $query;
99    }
100
101    /**
102     * @param array<int, string> $termsToUpdate
103     */
104    private function recalculateIdf(HasIndexInterface $doctrineEntity, array $termsToUpdate): void
105    {
106        if (empty($termsToUpdate)) {
107            return;
108        }
109        $query = $this->createUpdateQuery(new ReflectionClass($doctrineEntity));
110        $query = preg_replace('#LIMIT 1\);$#', 'AND t.text IN (:terms) LIMIT 1);', $query);
111        $entityManager = $this->ormBuilder->createEntityManager();
112        $entityManager->getConnection()->executeQuery(
113            $query,
114            ['terms' => array_values($termsToUpdate)],
115            ['terms' => ArrayParameterType::STRING]
116        );
117    }
118}