class SearchIndex
{
+ /**
+ * A list of delimiter characters used to break up parsed content into terms for indexing.
+ *
+ * @var string
+ */
+ public static $delimiters = " \n\t.,!?:;()[]{}<>`'\"";
/**
* @var EntityProvider
* - The number that have been processed so far.
* - The total number of that model to be processed.
*
- * @param callable(Entity, int, int)|null $progressCallback
+ * @param callable(Entity, int, int):void|null $progressCallback
*/
public function indexAllEntities(?callable $progressCallback = null)
{
$names = [];
$values = [];
- foreach($tags as $tag) {
+ foreach ($tags as $tag) {
$names[] = $tag->name;
$values[] = $tag->value;
}
protected function textToTermCountMap(string $text): array
{
$tokenMap = []; // {TextToken => OccurrenceCount}
- $splitChars = " \n\t.,!?:;()[]{}<>`'\"";
+ $splitChars = static::$delimiters;
$token = strtok($text, $splitChars);
while ($token !== false) {
if ($entity instanceof Page) {
$bodyTermsMap = $this->generateTermScoreMapFromHtml($entity->html);
} else {
- $bodyTermsMap = $this->generateTermScoreMapFromText($entity->description, $entity->searchFactor);
+ $bodyTermsMap = $this->generateTermScoreMapFromText($entity->description ?? '', $entity->searchFactor);
}
$mergedScoreMap = $this->mergeTermScoreMaps($nameTermsMap, $bodyTermsMap, $tagTermsMap);
$entityType = $entity->getMorphClass();
foreach ($mergedScoreMap as $term => $score) {
$dataArray[] = [
- 'term' => $term,
- 'score' => $score,
+ 'term' => $term,
+ 'score' => $score,
'entity_type' => $entityType,
- 'entity_id' => $entityId,
+ 'entity_id' => $entityId,
];
}
return $dataArray;
}
-
/**
* For the given term data arrays, Merge their contents by term
* while combining any scores.