wikimedia/mediawiki-extensions-CirrusSearch

View on GitHub
includes/Query/SubPageOfFeature.php

Summary

Maintainability
A
1 hr
Test Coverage
<?php

namespace CirrusSearch\Query;

use CirrusSearch\CrossSearchStrategy;
use CirrusSearch\Parser\AST\KeywordFeatureNode;
use CirrusSearch\Query\Builder\QueryBuildingContext;
use CirrusSearch\Search\Fetch\HighlightedField;
use CirrusSearch\Search\Fetch\HighlightFieldGenerator;
use CirrusSearch\Search\SearchContext;
use CirrusSearch\WarningCollector;
use Elastica\Query\AbstractQuery;
use Elastica\Query\MatchQuery;
use Elastica\Query\MultiMatch;

/**
 * subpagesof, find subpages of a given page
 * uses the prefix field, very similar to the prefix except
 * that it enforces a trailing / and is not a greedy keyword
 */
class SubPageOfFeature extends SimpleKeywordFeature implements FilterQueryFeature, HighlightingFeature {
    /**
     * @return string[]
     */
    protected function getKeywords() {
        return [ 'subpageof' ];
    }

    /**
     * @param KeywordFeatureNode $node
     * @return CrossSearchStrategy
     */
    public function getCrossSearchStrategy( KeywordFeatureNode $node ) {
        return CrossSearchStrategy::allWikisStrategy();
    }

    /**
     * @param SearchContext $context
     * @param string $key The keyword
     * @param string $value The value attached to the keyword with quotes stripped
     * @param string $quotedValue The original value in the search string, including quotes if used
     * @param bool $negated Is the search negated? Not used to generate the returned AbstractQuery,
     *  that will be negated as necessary. Used for any other building/context necessary.
     * @return array Two element array, first an AbstractQuery or null to apply to the
     *  query. Second a boolean indicating if the quotedValue should be kept in the search
     *  string.
     */
    protected function doApply( SearchContext $context, $key, $value, $quotedValue, $negated ) {
        $parsedValue = $this->doParseValue( $value );
        if ( $parsedValue === null ) {
            return [ null, false ];
        }
        $q = $this->doGetFilterQuery( $parsedValue );
        if ( !$negated ) {
            foreach ( $this->doGetHLFields( $parsedValue, $context->getFetchPhaseBuilder() ) as $f ) {
                $context->getFetchPhaseBuilder()->addHLField( $f );
            }
        }
        return [ $q, false ];
    }

    /**
     * @param KeywordFeatureNode $node
     * @param QueryBuildingContext $context
     * @return AbstractQuery|null
     */
    public function getFilterQuery( KeywordFeatureNode $node, QueryBuildingContext $context ) {
        if ( $node->getParsedValue() === null ) {
            return null;
        }
        return $this->doGetFilterQuery( $node->getParsedValue() );
    }

    /**
     * @param array $parsedValue
     * @return AbstractQuery
     */
    private function doGetFilterQuery( array $parsedValue ): AbstractQuery {
        $query = new MultiMatch();
        $query->setFields( [ 'title.prefix', 'redirect.title.prefix' ] );
        $query->setQuery( $parsedValue['prefix'] );
        return $query;
    }

    /**
     * @inheritDoc
     */
    public function parseValue( $key, $value, $quotedValue, $valueDelimiter, $suffix, WarningCollector $warningCollector ) {
        return $this->doParseValue( $value );
    }

    /**
     * @param string $value
     * @return array|null
     */
    private function doParseValue( $value ) {
        if ( $value !== '' ) {
            $lastC = substr( $value, -1 );
            if ( $lastC !== '/' && $lastC !== '*' ) {
                $value .= '/';
            } elseif ( $lastC === '*' ) {
                $value = substr( $value, 0, -1 );
            }
            return [ 'prefix' => $value ];
        }
        return null;
    }

    /**
     * @param array $parsedValue
     * @param HighlightFieldGenerator $highlightFieldGenerator
     * @return HighlightedField[]
     */
    private function doGetHLFields( array $parsedValue, HighlightFieldGenerator $highlightFieldGenerator ) {
        $hlfields = [];
        $definition = [
            HighlightedField::TARGET_TITLE_SNIPPET => 'title.prefix',
            HighlightedField::TARGET_REDIRECT_SNIPPET => 'redirect.title.prefix',
        ];
        $first = true;
        foreach ( $definition as $target => $esfield ) {
            $field = $highlightFieldGenerator->newHighlightField( $esfield, $target,
                 HighlightedField::EXPERT_SYNTAX_PRIORITY );
            $field->setHighlightQuery( new MatchQuery( $esfield, $parsedValue['prefix'] ) );
            $field->setNumberOfFragments( 1 );
            $field->setFragmentSize( 10000 );
            if ( $first ) {
                $first = false;
            } else {
                $field->skipIfLastMatched();
            }
            $hlfields[] = $field;
        }
        return $hlfields;
    }

    /**
     * @inheritDoc
     */
    public function buildHighlightFields( KeywordFeatureNode $node, QueryBuildingContext $context ) {
        return $this->doGetHLFields( $node->getParsedValue(), $context->getHighlightFieldGenerator() );
    }
}