class SearchMatchTest

Same name and namespace in other branches
  1. 11.x core/modules/search/tests/src/Kernel/SearchMatchTest.php \Drupal\Tests\search\Kernel\SearchMatchTest
  2. 10 core/modules/search/tests/src/Kernel/SearchMatchTest.php \Drupal\Tests\search\Kernel\SearchMatchTest
  3. 9 core/modules/search/tests/src/Kernel/SearchMatchTest.php \Drupal\Tests\search\Kernel\SearchMatchTest
  4. 8.9.x core/modules/search/tests/src/Kernel/SearchMatchTest.php \Drupal\Tests\search\Kernel\SearchMatchTest

Indexes content and queries it.

Attributes

#[Group('search')] #[RunTestsInSeparateProcesses]

Hierarchy

Expanded class hierarchy of SearchMatchTest

File

core/modules/search/tests/src/Kernel/SearchMatchTest.php, line 19

Namespace

Drupal\Tests\search\Kernel
View source
class SearchMatchTest extends KernelTestBase {
  // The search index can contain different types of content. Typically the type
  // is 'node'. Here we test with three artificial types: _test_ (lorem ipsum
  // snippets), _test2_ (English snippets) and _test3_ (Japanese snippets).
  const SEARCH_TYPE = '_test_';
  const SEARCH_TYPE_2 = '_test2_';
  const SEARCH_TYPE_JPN = '_test3_';

  /**
   * {@inheritdoc}
   */
  protected static $modules = [
    'search',
  ];

  /**
   * {@inheritdoc}
   */
  protected function setUp(): void {
    parent::setUp();
    // The tests below read and write the search index tables directly.
    $this->installSchema('search', [
      'search_index',
      'search_dataset',
      'search_total',
    ]);
    // Needed so that 'search.settings' can be loaded and modified.
    $this->installConfig([
      'search',
    ]);
  }

  /**
   * Tests search indexing.
   *
   * Builds the fixture index and then runs the predefined queries against it.
   */
  public function testMatching(): void {
    $this->_setup();
    $this->_testQueries();
  }

  /**
   * Tests HTML tags with whitespace characters are parsed correctly.
   *
   * Indexes the same anchor markup with a space, newlines and a tab between
   * the tag name and its attribute, plus a plain-text control item, and checks
   * that all three tagged variants receive the same score and that this score
   * is higher than the score of the untagged text.
   */
  public function testHTMLTagsWithWhitespace(): void {
    $this->config('search.settings')
      ->set('index.minimum_word_size', 3)
      ->save();
    $search_index = \Drupal::service('search.index');
    assert($search_index instanceof SearchIndexInterface);
    $langcode = LanguageInterface::LANGCODE_NOT_SPECIFIED;

    // Fixture text keyed by search item ID (sid).
    $fixtures = [
      // Test case 1: inline anchor tag.
      101 => '<a href="https://example.com/">Drupal Rocks</a>',
      // Test case 2: anchor tag with newlines.
      102 => '<a' . "\n" . '  href="https://example.com/"' . "\n" . '>Drupal Rocks</a>',
      // Test case 3: anchor tag with tab character.
      103 => '<a' . "\t" . 'href="https://example.com/">Drupal Rocks</a>',
      // Test case 4: no tag (control).
      104 => 'Drupal Rocks',
    ];
    foreach ($fixtures as $sid => $text) {
      $search_index->index(static::SEARCH_TYPE, $sid, $langcode, $text);
    }

    // Perform search for 'rocks'.
    $result = Database::getConnection()->select('search_index', 'i')
      ->extend(SearchQuery::class)
      ->searchExpression('rocks', static::SEARCH_TYPE)
      ->execute();
    // A falsy return from execute() is treated as "no results".
    $set = $result ? $result->fetchAll() : [];

    // Build scores map, keyed by sid.
    $scores = [];
    foreach ($set as $item) {
      $scores[$item->sid] = $item->calculated_score;
    }

    // Verify all items found.
    $this->assertCount(4, $scores);
    // Items with anchor tags should have same score.
    $this->assertEquals($scores[101], $scores[102]);
    $this->assertEquals($scores[101], $scores[103]);
    // Anchor tag items should score higher than no-tag item.
    $this->assertGreaterThan($scores[104], $scores[101]);
  }

  /**
   * Set up a small index of items to test against.
   *
   * Items 1-7 are indexed under SEARCH_TYPE, items 8-12 under SEARCH_TYPE_2
   * and items 13-15 under SEARCH_TYPE_JPN. The minimum word size is set to 3.
   */
  public function _setup(): void {
    $this->config('search.settings')
      ->set('index.minimum_word_size', 3)
      ->save();
    $search_index = \Drupal::service('search.index');
    assert($search_index instanceof SearchIndexInterface);
    $langcode = LanguageInterface::LANGCODE_NOT_SPECIFIED;

    for ($i = 1; $i <= 7; ++$i) {
      $search_index->index(static::SEARCH_TYPE, $i, $langcode, $this->getText($i));
    }
    // The second type continues the sid numbering after the first seven items.
    for ($i = 1; $i <= 5; ++$i) {
      $search_index->index(static::SEARCH_TYPE_2, $i + 7, $langcode, $this->getText2($i));
    }
    // No getText builder function for Japanese text; just a simple array.
    $japanese = [
      13 => '以呂波耳・ほへとち。リヌルヲ。',
      14 => 'ドルーパルが大好きよ!',
      15 => 'コーヒーとケーキ',
    ];
    foreach ($japanese as $sid => $text) {
      $search_index->index(static::SEARCH_TYPE_JPN, $sid, $langcode, $text);
    }
  }

  /**
   * Helper to generate lorem ipsum snippets of content.
   *
   * Snippet $n is made of $n consecutive words of the source sentence,
   * starting at word $n. The returned string keeps the original
   * capitalization and periods; the list below shows the snippets lowercased
   * and without punctuation.
   *
   * Generated items to test against:
   *   1  ipsum
   *   2  dolore sit
   *   3  sit am ut
   *   4  am ut enim am
   *   5  ut enim am minim veniam
   *   6  enim am minim veniam es cillum
   *   7  am minim veniam es cillum dolore eu.
   *
   * @param int $n
   *   The 1-based snippet number.
   *
   * @return string
   *   The snippet text.
   */
  public function getText($n): string {
    $words = explode(' ', "Ipsum dolore sit am. Ut enim am minim veniam. Es cillum dolore eu.");
    return implode(' ', array_slice($words, $n - 1, $n));
  }

  /**
   * Helper to generate English language snippets of content.
   *
   * Snippet $n is made of up to $n consecutive words of the source sentence,
   * starting at word $n (the slice is cut short at the end of the sentence).
   * The returned string keeps the original capitalization and periods; the
   * list below shows the snippets lowercased, numbered by the sid under which
   * _setup() indexes them ($n + 7).
   *
   * Generated items to test against:
   *   8  dear
   *   9  king philip
   *   10 philip came over
   *   11 came over from germany
   *   12 over from germany swimming.
   *
   * @param int $n
   *   The 1-based snippet number.
   *
   * @return string
   *   The snippet text.
   */
  public function getText2($n): string {
    $words = explode(' ', "Dear King Philip came over from Germany swimming.");
    return implode(' ', array_slice($words, $n - 1, $n));
  }

  /**
   * Run predefined queries looking for indexed terms.
   *
   * Each query set maps a search expression to the sids it is expected to
   * match within one index type. Every query is checked both for the matched
   * items and for the ordering and range of the returned scores.
   */
  public function _testQueries(): void {
    // Note: OR queries that include short words in OR groups are only accepted
    // if the ORed terms are ANDed with at least one long word in the rest of
    // the query. Examples:
    // -  enim dolore OR ut = enim (dolore OR ut) = (enim dolore) OR (enim ut)
    // is good, and
    // -  dolore OR ut = (dolore) OR (ut)
    // is bad. This is a design limitation to avoid full table scans.
    $queries = [
      // Simple AND queries.
      'ipsum' => [1],
      'enim' => [4, 5, 6],
      'xxxxx' => [],
      'enim minim' => [5, 6],
      'enim xxxxx' => [],
      'dolore eu' => [7],
      'dolore xx' => [],
      'ut minim' => [5],
      'xx minim' => [],
      'enim veniam am minim ut' => [5],
      // Simple OR and AND/OR queries.
      'dolore OR ipsum' => [1, 2, 7],
      'dolore OR xxxxx' => [2, 7],
      'dolore OR ipsum OR enim' => [1, 2, 4, 5, 6, 7],
      'ipsum OR dolore sit OR cillum' => [2, 7],
      'minim dolore OR ipsum' => [7],
      'dolore OR ipsum veniam' => [7],
      'minim dolore OR ipsum OR enim' => [5, 6, 7],
      'dolore xx OR yy' => [],
      'xxxxx dolore OR ipsum' => [],
      // Sequence of OR queries.
      'minim' => [5, 6, 7],
      'minim OR xxxx' => [5, 6, 7],
      'minim OR xxxx OR minim' => [5, 6, 7],
      'minim OR xxxx minim' => [5, 6, 7],
      'minim OR xxxx minim OR yyyy' => [5, 6, 7],
      'minim OR xxxx minim OR cillum' => [6, 7, 5],
      'minim OR xxxx minim OR xxxx' => [5, 6, 7],
      // Negative queries.
      'dolore -sit' => [7],
      'dolore -eu' => [2],
      'dolore -xxxxx' => [2, 7],
      'dolore -xx' => [2, 7],
      // Phrase queries.
      '"dolore sit"' => [2],
      '"sit dolore"' => [],
      '"am minim veniam es"' => [6, 7],
      '"minim am veniam es"' => [],
      // Mixed queries.
      '"am minim veniam es" OR dolore' => [2, 6, 7],
      '"minim am veniam es" OR "dolore sit"' => [2],
      '"minim am veniam es" OR "sit dolore"' => [],
      '"am minim veniam es" -eu' => [6],
      '"am minim veniam" -"cillum dolore"' => [5, 6],
      '"am minim veniam" -"dolore cillum"' => [5, 6, 7],
      'xxxxx "minim am veniam es" OR dolore' => [],
      'xx "minim am veniam es" OR dolore' => [],
    ];
    $this->runQueries($queries, static::SEARCH_TYPE);

    // These queries are run against the second index type, SEARCH_TYPE_2.
    $queries = [
      // Simple AND queries.
      'ipsum' => [],
      'enim' => [],
      'enim minim' => [],
      'dear' => [8],
      'germany' => [11, 12],
    ];
    $this->runQueries($queries, static::SEARCH_TYPE_2);

    // These queries are run against the third index type, SEARCH_TYPE_JPN.
    $queries = [
      // Simple AND queries.
      '呂波耳' => [13],
      '以呂波耳' => [13],
      'ほへと ヌルヲ' => [13],
      'とちリ' => [],
      'ドルーパル' => [14],
      'パルが大' => [14],
      'コーヒー' => [15],
      'ヒーキ' => [],
    ];
    $this->runQueries($queries, static::SEARCH_TYPE_JPN);
  }

  /**
   * Runs a set of queries against one index type and verifies the results.
   *
   * @param array $queries
   *   Lists of expected sids, keyed by search expression.
   * @param string $type
   *   The search index type the search is restricted to.
   */
  private function runQueries(array $queries, string $type): void {
    $connection = Database::getConnection();
    foreach ($queries as $query => $results) {
      $result = $connection->select('search_index', 'i')
        ->extend(SearchQuery::class)
        ->searchExpression($query, $type)
        ->execute();
      // A falsy return from execute() is treated as "no results".
      $set = $result ? $result->fetchAll() : [];
      $this->_testQueryMatching($query, $set, $results);
      $this->_testQueryScores($query, $set, $results);
    }
  }

  /**
   * Tests the matching abilities of the engine.
   *
   * Verify if a query produces the correct results.
   *
   * @param string $query
   *   The search expression that was executed; used in the failure message.
   * @param array $set
   *   The result rows; each row must expose a 'sid' property.
   * @param array $results
   *   The expected sids, in any order.
   */
  public function _testQueryMatching($query, $set, $results): void {
    // Get result IDs.
    $found = [];
    foreach ($set as $item) {
      $found[] = $item->sid;
    }
    // Result order is irrelevant here, so compare both lists sorted.
    sort($found);
    sort($results);
    // PHPUnit expects (expected, actual); keeping that order makes failure
    // diffs label the two sides correctly. The comparison is deliberately
    // loose (assertEquals rather than assertSame) because the expected IDs are
    // integers while $item->sid is used as returned by the query.
    $this->assertEquals($results, $found, "Query matching '{$query}'");
  }

  /**
   * Tests the scoring abilities of the engine.
   *
   * Verify if a query produces normalized, monotonic scores: rows must be
   * returned in descending score order and every score must be greater than 0
   * and at most 1.0001.
   *
   * @param string $query
   *   The search expression that was executed; used in the failure messages.
   * @param array $set
   *   The result rows; each row must expose a 'calculated_score' property.
   * @param array $results
   *   The expected sids. Not used by this check; kept so that the signature
   *   mirrors _testQueryMatching().
   */
  public function _testQueryScores($query, $set, $results): void {
    // Get result scores.
    $scores = [];
    foreach ($set as $item) {
      $scores[] = $item->calculated_score;
    }
    // Check order: the scores as returned must already be sorted descending.
    $descending = $scores;
    rsort($descending);
    $this->assertEquals($descending, $scores, "Query order '{$query}'");
    // Check range. An empty result set trivially passes.
    $in_range = !count($scores) || (min($scores) > 0.0 && max($scores) <= 1.0001);
    $this->assertTrue($in_range, "Query scoring '{$query}'");
  }

}

Members

Title Sort descending Modifiers Object type Summary Overridden Title Overrides
AssertContentTrait::$content protected property The current raw content.
AssertContentTrait::$drupalSettings protected property The drupalSettings value from the current raw $content.
AssertContentTrait::$elements protected property The XML structure parsed from the current raw $content.
AssertContentTrait::$plainTextContent protected property The plain-text content of raw $content (text nodes).
AssertContentTrait::assertEscaped protected function Passes if the raw text IS found escaped on the loaded page, fail otherwise.
AssertContentTrait::assertField protected function Asserts that a field exists with the given name or ID.
AssertContentTrait::assertFieldByName protected function Asserts that a field exists with the given name and value.
AssertContentTrait::assertFieldByXPath protected function Asserts that a field exists in the current page by the given XPath.
AssertContentTrait::assertFieldsByValue protected function Asserts that a field exists in the current page with a given Xpath result.
AssertContentTrait::assertLink protected function Passes if a link with the specified label is found.
AssertContentTrait::assertLinkByHref protected function Passes if a link containing a given href (part) is found.
AssertContentTrait::assertNoLink protected function Passes if a link with the specified label is not found.
AssertContentTrait::assertNoPattern protected function Triggers a pass if the perl regex pattern is not found in raw content.
AssertContentTrait::assertNoRaw protected function Passes if the raw text is NOT found on the loaded page, fail otherwise.
AssertContentTrait::assertNoText protected function Passes if the page (with HTML stripped) does not contains the text.
AssertContentTrait::assertPattern protected function Triggers a pass if the Perl regex pattern is found in the raw content.
AssertContentTrait::assertRaw protected function Passes if the raw text IS found on the loaded page, fail otherwise.
AssertContentTrait::assertText protected function Passes if the page (with HTML stripped) contains the text.
AssertContentTrait::assertTextHelper protected function Helper for assertText and assertNoText.
AssertContentTrait::assertThemeOutput protected function Asserts themed output.
AssertContentTrait::assertTitle protected function Pass if the page title is the given string.
AssertContentTrait::buildXPathQuery protected function Builds an XPath query.
AssertContentTrait::constructFieldXpath protected function Helper: Constructs an XPath for the given set of attributes and value.
AssertContentTrait::cssSelect protected function Searches elements using a CSS selector in the raw content.
AssertContentTrait::getAllOptions protected function Get all option elements, including nested options, in a select.
AssertContentTrait::getDrupalSettings protected function Gets the value of drupalSettings for the currently-loaded page.
AssertContentTrait::getRawContent protected function Gets the current raw content.
AssertContentTrait::getSelectedItem protected function Get the selected value from a select field.
AssertContentTrait::getTextContent protected function Retrieves the plain-text content from the current raw content.
AssertContentTrait::parse protected function Parse content returned from curlExec using DOM and SimpleXML.
AssertContentTrait::removeWhiteSpace protected function Removes all white-space between HTML tags from the raw content.
AssertContentTrait::setDrupalSettings protected function Sets the value of drupalSettings for the currently-loaded page.
AssertContentTrait::setRawContent protected function Sets the raw content (e.g. HTML).
AssertContentTrait::xpath protected function Performs an xpath search on the contents of the internal browser.
BrowserHtmlDebugTrait::$htmlOutputBaseUrl protected property The Base URI to use for links to the output files.
BrowserHtmlDebugTrait::$htmlOutputClassName protected property Class name for HTML output logging.
BrowserHtmlDebugTrait::$htmlOutputCounter protected property Counter for HTML output logging.
BrowserHtmlDebugTrait::$htmlOutputCounterStorage protected property Counter storage for HTML output logging.
BrowserHtmlDebugTrait::$htmlOutputDirectory protected property Directory name for HTML output logging.
BrowserHtmlDebugTrait::$htmlOutputEnabled protected property HTML output enabled.
BrowserHtmlDebugTrait::$htmlOutputTestId protected property HTML output test ID.
BrowserHtmlDebugTrait::formatHtmlOutputHeaders protected function Formats HTTP headers as string for HTML output logging.
BrowserHtmlDebugTrait::getHtmlOutputHeaders protected function Returns headers in HTML output format. 1
BrowserHtmlDebugTrait::getResponseLogHandler protected function Provides a Guzzle middleware handler to log every response received.
BrowserHtmlDebugTrait::getTestMethodCaller protected function Retrieves the current calling line in the class under test. 1
BrowserHtmlDebugTrait::htmlOutput protected function Logs a HTML output message in a text file.
BrowserHtmlDebugTrait::initBrowserOutputFile protected function Creates the directory to store browser output.
ConfigTestTrait::configImporter protected function Returns a ConfigImporter object to import test configuration.
ConfigTestTrait::copyConfig protected function Copies configuration objects from source storage to target storage.
DrupalTestCaseTrait::$root protected property The Drupal root directory.
DrupalTestCaseTrait::checkErrorHandlerOnTearDown public function Checks the test error handler after test execution. 1
DrupalTestCaseTrait::getDrupalRoot protected static function Returns the Drupal root directory. 1
DrupalTestCaseTrait::setDebugDumpHandler public static function Registers the dumper CLI handler when the DebugDump extension is enabled.
ExtensionListTestTrait::getModulePath protected function Gets the path for the specified module.
ExtensionListTestTrait::getThemePath protected function Gets the path for the specified theme.
HttpKernelUiHelperTrait::$mink protected property Mink session manager.
HttpKernelUiHelperTrait::assertSession public function Returns WebAssert object.
HttpKernelUiHelperTrait::buildUrl protected function Builds a URL from a system path or a URL object.
HttpKernelUiHelperTrait::clickLink protected function Follows a link by complete name.
HttpKernelUiHelperTrait::drupalGet protected function Retrieves a Drupal path.
HttpKernelUiHelperTrait::getDefaultDriverInstance protected function Gets an instance of the default Mink driver.
HttpKernelUiHelperTrait::getNodeElementsByXpath protected function Performs an xpath search on the contents of the internal browser.
HttpKernelUiHelperTrait::getSession public function Returns Mink session.
HttpKernelUiHelperTrait::getUrl protected function Gets the current URL from the browser.
HttpKernelUiHelperTrait::initMink protected function Initializes Mink sessions.
KernelTestBase::$classLoader protected property The class loader.
KernelTestBase::$configImporter protected property The configuration importer.
KernelTestBase::$configSchemaCheckerExclusions protected static property An array of config object names that are excluded from schema checking. 4
KernelTestBase::$container protected property The test container.
KernelTestBase::$databasePrefix protected property The test database prefix.
KernelTestBase::$keyValue protected property The key_value service that must persist between container rebuilds.
KernelTestBase::$siteDirectory protected property The relative path to the test site directory.
KernelTestBase::$strictConfigSchema protected property Set to TRUE to strict check all configuration saved. 9
KernelTestBase::$usesSuperUserAccessPolicy protected property Set to TRUE to make user 1 a super user. 1
KernelTestBase::$vfsRoot protected property The virtual filesystem root directory.
KernelTestBase::assertPostConditions protected function 1
KernelTestBase::bootEnvironment protected function Bootstraps a basic test environment.
KernelTestBase::bootKernel protected function Bootstraps a kernel for a test. 1
KernelTestBase::config protected function Configuration accessor for tests. Returns non-overridden configuration.
KernelTestBase::disableModules protected function Disables modules for this test.
KernelTestBase::enableModules protected function Enables modules for this test. 2
KernelTestBase::getConfigSchemaExclusions protected function Gets the config schema exclusions for this test.
KernelTestBase::getDatabaseConnectionInfo protected function Returns the Database connection info to be used for this test. 3
KernelTestBase::getDatabasePrefix public function Gets the database prefix used for test isolation.
KernelTestBase::getExtensionsForModules private function Returns Extension objects for $modules to install.
KernelTestBase::getModulesToEnable protected static function Returns the modules to install for this test.
KernelTestBase::initFileCache protected function Initializes the FileCache component.
KernelTestBase::installConfig protected function Installs default configuration for a given list of modules.
KernelTestBase::installEntitySchema protected function Installs the storage schema for a specific entity type.
KernelTestBase::installSchema protected function Installs database tables from a module schema definition.
KernelTestBase::register public function Registers test-specific services. Overrides ServiceProviderInterface::register 40
KernelTestBase::render protected function Renders a render array. 1
KernelTestBase::setInstallProfile protected function Sets the install profile and rebuilds the container to update it.
KernelTestBase::setSetting protected function Sets an in-memory Settings variable.
KernelTestBase::setUpFilesystem protected function Sets up the filesystem, so things like the file directory. 3
KernelTestBase::tearDown protected function 10
KernelTestBase::tearDownCloseDatabaseConnection public function Additional tear down method to close the connection at the end.
KernelTestBase::vfsDump protected function Dumps the current state of the virtual filesystem to STDOUT.
KernelTestBase::__sleep public function Prevents serializing any properties.
RandomGeneratorTrait::getRandomGenerator protected function Gets the random generator for the utility methods.
RandomGeneratorTrait::randomMachineName protected function Generates a unique random string containing letters and numbers.
RandomGeneratorTrait::randomObject public function Generates a random PHP object.
RandomGeneratorTrait::randomString public function Generates a pseudo-random string of ASCII characters of codes 32 to 126.
SearchMatchTest::$modules protected static property Modules to install. Overrides KernelTestBase::$modules
SearchMatchTest::getText public function Helper to generate lorem ipsum snippets of content.
SearchMatchTest::getText2 public function Helper to generate English language snippets of content.
SearchMatchTest::SEARCH_TYPE constant
SearchMatchTest::SEARCH_TYPE_2 constant
SearchMatchTest::SEARCH_TYPE_JPN constant
SearchMatchTest::setUp protected function Overrides KernelTestBase::setUp
SearchMatchTest::testHTMLTagsWithWhitespace public function Tests HTML tags with whitespace characters are parsed correctly.
SearchMatchTest::testMatching public function Tests search indexing.
SearchMatchTest::_setup public function Set up a small index of items to test against.
SearchMatchTest::_testQueries public function Run predefined queries looking for indexed terms.
SearchMatchTest::_testQueryMatching public function Tests the matching abilities of the engine.
SearchMatchTest::_testQueryScores public function Tests the scoring abilities of the engine.
StorageCopyTrait::replaceStorageContents protected static function Copy the configuration from one storage to another and remove stale items.

Buggy or inaccurate documentation? Please file an issue. Need support? Need help programming? Connect with the Drupal community.