class SearchIndex
{
+ /**
+ * A list of delimiter characters used to break up parsed content into terms for indexing.
+ *
+ * @var string
+ */
+ public static $delimiters = " \n\t.,!?:;()[]{}<>`'\"";
/**
* @var EntityProvider
protected function textToTermCountMap(string $text): array
{
$tokenMap = []; // {TextToken => OccurrenceCount}
- $splitChars = " \n\t.,!?:;()[]{}<>`'\"";
+ $splitChars = static::$delimiters;
$token = strtok($text, $splitChars);
while ($token !== false) {
$instance = new SearchOptions();
$inputs = $request->only(['search', 'types', 'filters', 'exact', 'tags']);
- $instance->searches = explode(' ', $inputs['search'] ?? []);
- $instance->exacts = array_filter($inputs['exact'] ?? []);
+
+ $parsedStandardTerms = static::parseStandardTermString($inputs['search'] ?? '');
+ $instance->searches = $parsedStandardTerms['terms'];
+ $instance->exacts = $parsedStandardTerms['exacts'];
+
+ array_push($instance->exacts, ...array_filter($inputs['exact'] ?? []));
+
$instance->tags = array_filter($inputs['tags'] ?? []);
+
foreach (($inputs['filters'] ?? []) as $filterKey => $filterVal) {
if (empty($filterVal)) {
continue;
}
$instance->filters[$filterKey] = $filterVal === 'true' ? '' : $filterVal;
}
+
if (isset($inputs['types']) && count($inputs['types']) < 4) {
$instance->filters['type'] = implode('|', $inputs['types']);
}
}
// Parse standard terms
- foreach (explode(' ', trim($searchString)) as $searchTerm) {
- if ($searchTerm !== '') {
- $terms['searches'][] = $searchTerm;
- }
- }
+ $parsedStandardTerms = static::parseStandardTermString($searchString);
+ array_push($terms['searches'], ...$parsedStandardTerms['terms']);
+ array_push($terms['exacts'], ...$parsedStandardTerms['exacts']);
// Split filter values out
$splitFilters = [];
return $terms;
}
+
+ /**
+ * Parse a standard search term string into individual search terms and
+ * extract any terms that need to be searched as exact matches.
+ *
+ * The string is split on single space characters and empty pieces (produced
+ * by leading, trailing or repeated spaces) are skipped. Any piece containing
+ * at least one character from SearchIndex::$delimiters is placed in the
+ * 'exacts' list; every other piece is placed in the 'terms' list.
+ *
+ * NOTE(review): presumably delimiter-containing terms are routed to exact
+ * matching because the index splits content on those same characters, so
+ * such a term would never equal a single indexed token - confirm against
+ * the indexing code.
+ *
+ * @param string $termString The space-separated term string to parse.
+ *
+ * @return array{terms: array<string>, exacts: array<string>}
+ */
+ protected static function parseStandardTermString(string $termString): array
+ {
+ $terms = explode(' ', $termString);
+ $indexDelimiters = SearchIndex::$delimiters;
+ $parsed = [
+ 'terms' => [],
+ 'exacts' => [],
+ ];
+
+ foreach ($terms as $searchTerm) {
+ if ($searchTerm === '') {
+ continue;
+ }
+
+ $parsedList = (strpbrk($searchTerm, $indexDelimiters) === false) ? 'terms' : 'exacts'; // strpbrk() returns false when the term contains none of the delimiter characters
+ $parsed[$parsedList][] = $searchTerm;
+ }
+
+ return $parsed;
+ }
+
/**
* Encode this instance to a search string.
*/
$exactSearchB->assertStatus(200)->assertDontSee($page->name);
}
+ public function test_search_terms_with_delimiters_are_converted_to_exact_matches() // Searching for a term that contains a delimiter character should still find the page holding that text
+ {
+ $this->asEditor();
+ $page = $this->newPage(['name' => 'Delimiter test', 'html' => '<p>1.1 2,2 3?3 4:4 5;5 (8) <9> "10" \'11\' `12`</p>']);
+ $terms = explode(' ', '1.1 2,2 3?3 4:4 5;5 (8) <9> "10" \'11\' `12`'); // Same text as the page body; every piece contains at least one delimiter character
+
+ foreach ($terms as $term) {
+ $search = $this->get('/search?term=' . urlencode($term)); // Each term is searched on its own, URL-encoded
+ $search->assertSee($page->name);
+ }
+ }
+
public function test_search_filters()
{
$page = $this->newPage(['name' => 'My new test quaffleachits', 'html' => 'this is about an orange donkey danzorbhsing']);