12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644 |
- <?php
- /**
- * Search service class using Solr server.
- */
- class SearchApiSolrService extends SearchApiAbstractService {
- /**
- * The date format that Solr uses, in PHP date() syntax.
- */
- const SOLR_DATE_FORMAT = 'Y-m-d\TH:i:s\Z';
- /**
- * A connection to the Solr server.
- *
- * @var SearchApiSolrConnection
- */
- protected $solr;
- /**
- * @var array
- */
- protected $fieldNames = array();
- /**
- * Metadata describing fields on the Solr/Lucene index.
- *
- * @see SearchApiSolrService::getFields().
- *
- * @var array
- */
- protected $fields;
- /**
- * Saves whether a commit operation was already scheduled for this server.
- *
- * @var boolean
- */
- protected $commitScheduled = FALSE;
- /**
- * Request handler to use for this search query.
- *
- * @var string
- */
- protected $request_handler = NULL;
/**
 * Constructs the Solr service for the given server.
 *
 * All initialisation is delegated to the parent service class.
 *
 * @param SearchApiServer $server
 *   The server object handed on to the parent constructor.
 */
public function __construct(SearchApiServer $server) {
  parent::__construct($server);
}
/**
 * Builds the configuration form for this Solr server.
 *
 * @param array $form
 *   The form array the service's elements are added to.
 * @param array $form_state
 *   The current form state; not used by this implementation.
 *
 * @return array
 *   The form array including all Solr-specific settings elements.
 */
public function configurationForm(array $form, array &$form_state) {
  // Stored options take precedence; anything missing falls back to these
  // defaults.
  $settings = $this->options + array(
    'host' => 'localhost',
    'port' => '8983',
    'path' => '/solr',
    'http_user' => '',
    'http_pass' => '',
    'excerpt' => FALSE,
    'retrieve_data' => FALSE,
    'highlight_data' => FALSE,
    'http_method' => Apache_Solr_Service::METHOD_POST,
    'autocorrect_spell' => TRUE,
    'autocorrect_suggest_words' => TRUE,
  );

  // Existing options mean an existing server is being edited, so show the URI
  // it currently points to.
  if ($this->options) {
    $server_uri = 'http://' . $this->options['host'] . ':' . $this->options['port'] . $this->options['path'];
    $form['server_description'] = array(
      '#type' => 'item',
      '#title' => t('Solr server URI'),
      '#description' => l($server_uri, $server_uri),
    );
  }

  // Connection settings.
  $form['host'] = array(
    '#type' => 'textfield',
    '#title' => t('Solr host'),
    '#description' => t('The host name or IP of your Solr server, e.g. <code>localhost</code> or <code>www.example.com</code>.'),
    '#default_value' => $settings['host'],
    '#required' => TRUE,
  );
  $form['port'] = array(
    '#type' => 'textfield',
    '#title' => t('Solr port'),
    '#description' => t('The Jetty example server is at port 8983, while Tomcat uses 8080 by default.'),
    '#default_value' => $settings['port'],
    '#required' => TRUE,
  );
  $form['path'] = array(
    '#type' => 'textfield',
    '#title' => t('Solr path'),
    '#description' => t('The path that identifies the Solr instance to use on the server.'),
    '#default_value' => $settings['path'],
  );

  // Basic HTTP authentication; collapsed as long as no user name is set.
  $form['http'] = array(
    '#type' => 'fieldset',
    '#title' => t('Basic HTTP authentication'),
    '#description' => t('If your Solr server is protected by basic HTTP authentication, enter the login data here.'),
    '#collapsible' => TRUE,
    '#collapsed' => empty($settings['http_user']),
    'http_user' => array(
      '#type' => 'textfield',
      '#title' => t('Username'),
      '#default_value' => $settings['http_user'],
    ),
    'http_pass' => array(
      '#type' => 'password',
      '#title' => t('Password'),
      '#default_value' => $settings['http_pass'],
    ),
  );

  // Advanced settings.
  $form['advanced'] = array(
    '#type' => 'fieldset',
    '#title' => t('Advanced'),
    '#collapsible' => TRUE,
    '#collapsed' => TRUE,
    'excerpt' => array(
      '#type' => 'checkbox',
      '#title' => t('Return an excerpt for all results'),
      '#description' => t("If search keywords are given, use Solr's capabilities to create a highlighted search excerpt for each result. " .
        'Whether the excerpts will actually be displayed depends on the settings of the search, though.'),
      '#default_value' => $settings['excerpt'],
    ),
    'retrieve_data' => array(
      '#type' => 'checkbox',
      '#title' => t('Retrieve result data from Solr'),
      '#description' => t('When checked, result data will be retrieved directly from the Solr server. ' .
        'This might make item loads unnecessary. Only indexed fields can be retrieved. ' .
        'Note also that the returned field data might not always be correct, due to preprocessing and caching issues.'),
      '#default_value' => $settings['retrieve_data'],
    ),
    'highlight_data' => array(
      '#type' => 'checkbox',
      '#title' => t('Highlight retrieved data'),
      '#description' => t('When retrieving result data from the Solr server, try to highlight the search terms in the returned fulltext fields.'),
      '#default_value' => $settings['highlight_data'],
      // Highlighting retrieved data is only offered while data retrieval is
      // enabled, so the checkbox is hidden otherwise.
      '#states' => array(
        'invisible' => array(
          ':input[name="options[form][advanced][retrieve_data]"]' => array(
            'checked' => FALSE,
          ),
        ),
      ),
    ),
    'http_method' => array(
      '#type' => 'select',
      '#title' => t('HTTP method'),
      '#description' => t('The HTTP method to use for sending queries. Usually, POST will work fine in all cases.'),
      '#default_value' => $settings['http_method'],
      '#options' => array(
        Apache_Solr_Service::METHOD_POST => 'POST',
        Apache_Solr_Service::METHOD_GET => 'GET',
      ),
    ),
  );

  // The autocomplete settings are only shown when that module is enabled.
  if (module_exists('search_api_autocomplete')) {
    $form['advanced']['autocomplete'] = array(
      '#type' => 'fieldset',
      '#title' => t('Autocomplete'),
      '#collapsible' => TRUE,
      '#collapsed' => TRUE,
      'autocorrect_spell' => array(
        '#type' => 'checkbox',
        '#title' => t('Use spellcheck for autocomplete suggestions'),
        '#description' => t('If activated, spellcheck suggestions ("Did you mean") will be included in the autocomplete suggestions. Since the used dictionary contains words from all indexes, this might lead to leaking of sensitive data, depending on your setup.'),
        '#default_value' => $settings['autocorrect_spell'],
      ),
      'autocorrect_suggest_words' => array(
        '#type' => 'checkbox',
        '#title' => t('Suggest additional words'),
        '#description' => t('If activated and the user enters a complete word, Solr will suggest additional words the user wants to search, which are often found (not searched!) together. This has been known to lead to strange results in some configurations – if you see inappropriate additional-word suggestions, you might want to deactivate this option.'),
        '#default_value' => $settings['autocorrect_suggest_words'],
      ),
    );
  }

  return $form;
}
/**
 * Validates the submitted configuration form values.
 *
 * Only the port is checked: it has to consist of decimal digits only and lie
 * between 0 and 65535. A validation error is set on the port element
 * otherwise.
 *
 * @param array $form
 *   The form returned by configurationForm().
 * @param array $values
 *   The submitted values of this form part.
 * @param array $form_state
 *   The complete form state; not used by this implementation.
 */
public function configurationFormValidate(array $form, array &$values, array &$form_state) {
  if (!isset($values['port'])) {
    return;
  }
  $port = $values['port'];
  // is_numeric() alone would also accept values such as "8983.5", "1e3" or
  // " 80", none of which is a usable port number. Require plain digits; the
  // "D" modifier keeps "$" from matching before a trailing newline.
  $is_integer = is_int($port) || (is_string($port) && preg_match('/^[0-9]+$/D', $port));
  if (!$is_integer || $port < 0 || $port > 65535) {
    form_error($form['port'], t('The port has to be an integer between 0 and 65535.'));
  }
}
/**
 * Flattens the submitted form values and passes them to the parent.
 *
 * @param array $form
 *   The form returned by configurationForm().
 * @param array $values
 *   The submitted values; restructured in place so that all settings end up
 *   on the top level.
 * @param array $form_state
 *   The complete form state, passed on to the parent implementation.
 */
public function configurationFormSubmit(array $form, array &$values, array &$form_state) {
  // This form is nested inside another one, so #parents cannot simply be used
  // to flatten the values without depending on the outer form's internals.
  // Instead, the contents of each fieldset are merged in by hand. The
  // "autocomplete" fieldset lives inside "advanced" and therefore only shows
  // up on the top level after "advanced" has been merged.
  $values += $values['http'];
  $values += $values['advanced'];
  if (!empty($values['autocomplete'])) {
    $values += $values['autocomplete'];
  }
  unset($values['http']);
  unset($values['advanced']);
  unset($values['autocomplete']);

  // Highlighting retrieved data is pointless unless data is retrieved at all.
  $values['highlight_data'] &= $values['retrieve_data'];

  parent::configurationFormSubmit($form, $values, $form_state);
}
/**
 * Determines whether this service supports a given feature.
 *
 * @param string $feature
 *   The name of the feature to check for.
 *
 * @return bool
 *   TRUE if the feature is one of the fixed Search API features listed here
 *   or a "search_api_data_type_*" feature for one of the types returned by
 *   search_api_solr_get_dynamic_field_info(); FALSE otherwise.
 */
public function supportsFeature($feature) {
  // Fixed set of supported Search API features, keyed by name for lookup.
  $feature_map = array(
    'search_api_autocomplete' => TRUE,
    'search_api_facets' => TRUE,
    'search_api_facets_operator_or' => TRUE,
    'search_api_mlt' => TRUE,
    'search_api_multi' => TRUE,
    'search_api_spellcheck' => TRUE,
    'search_api_data_type_location' => TRUE,
    'search_api_data_type_geohash' => TRUE,
  );

  // Every known dynamic field type counts as a supported custom data type.
  foreach (search_api_solr_get_dynamic_field_info() as $type => $info) {
    $feature_map['search_api_data_type_' . $type] = TRUE;
  }

  return isset($feature_map[$feature]);
}
/**
 * Renders this server's settings as an HTML definition list.
 *
 * The list contains the server URI as a link and, if an HTTP user name is
 * configured, the user name plus the password masked with asterisks.
 *
 * @return string
 *   The HTML markup describing the settings.
 */
public function viewSettings() {
  $options = $this->options;
  $server_uri = 'http://' . $options['host'] . ':' . $options['port'] . $options['path'];

  $parts = array(
    "<dl>\n <dt>",
    t('Solr server URI'),
    "</dt>\n <dd>",
    l($server_uri, $server_uri),
    '</dd>',
  );

  if ($options['http_user']) {
    // The password itself is never printed, only one asterisk per character.
    $masked_password = str_repeat('*', strlen($options['http_pass']));
    $parts[] = "\n <dt>";
    $parts[] = t('Basic HTTP authentication');
    $parts[] = "</dt>\n <dd>";
    $parts[] = t('Username: @user', array('@user' => $options['http_user']));
    $parts[] = "</dd>\n <dd>";
    $parts[] = t('Password: @pass', array('@pass' => $masked_password));
    $parts[] = '</dd>';
  }

  $parts[] = "\n</dl>";

  return implode('', $parts);
}
/**
 * Lazily creates the connection object for the configured Solr server.
 *
 * Does nothing if a connection object already exists. Otherwise a new
 * SearchApiSolrConnection is built from $this->options.
 *
 * @throws Exception
 *   If the Apache_Solr_Service class (SolrPhpClient library) is not available.
 */
protected function connect() {
  if ($this->solr) {
    return;
  }
  if (!class_exists('Apache_Solr_Service')) {
    throw new Exception(t('SolrPhpClient library not found! Please follow the instructions in search_api_solr/INSTALL.txt for installing the Solr search module.'));
  }
  $this->solr = new SearchApiSolrConnection($this->options);
}
/**
 * Reacts to an index being added to this server.
 *
 * Invalidates the Views cache when both the search_api_multi and
 * search_api_views modules are enabled.
 *
 * @param SearchApiIndex $index
 *   The added index; not inspected by this implementation.
 */
public function addIndex(SearchApiIndex $index) {
  $multi_views_enabled = module_exists('search_api_multi') && module_exists('search_api_views');
  if ($multi_views_enabled) {
    views_invalidate_cache();
  }
}
/**
 * Reacts to a change of an index's field settings.
 *
 * Invalidates the Views cache when both the search_api_multi and
 * search_api_views modules are enabled.
 *
 * @param SearchApiIndex $index
 *   The updated index; not inspected by this implementation.
 *
 * @return bool
 *   Always TRUE.
 */
public function fieldsUpdated(SearchApiIndex $index) {
  $multi_views_enabled = module_exists('search_api_multi') && module_exists('search_api_views');
  if ($multi_views_enabled) {
    views_invalidate_cache();
  }
  return TRUE;
}
/**
 * Reacts to an index being removed from this server.
 *
 * Invalidates the Views cache when both the search_api_multi and
 * search_api_views modules are enabled, then deletes all Solr documents of
 * the index unless the index object is flagged as read-only. Errors while
 * deleting are logged, not propagated.
 *
 * @param SearchApiIndex|string $index
 *   Either the index object or just the index's machine name.
 */
public function removeIndex($index) {
  if (module_exists('search_api_multi') && module_exists('search_api_views')) {
    views_invalidate_cache();
  }

  $have_object = is_object($index);
  $index_id = $have_object ? $index->machine_name : $index;

  // Data of read-only indexes must stay untouched. When only a machine name
  // was passed, the flag is not available and the data is deleted.
  if ($have_object && !empty($index->read_only)) {
    return;
  }

  try {
    $this->connect();
    $this->solr->deleteByQuery("index_id:" . $index_id);
  }
  catch (Exception $e) {
    watchdog_exception('search_api_solr', $e, "%type while deleting an index's data: !message in %function (line %line of %file).");
  }
}
/**
 * Indexes the given items on the Solr server.
 *
 * Items that cannot be converted into a Solr document (e.g. because they
 * contain an unknown field) are logged and skipped. If sending the documents
 * fails, the error is logged and no item counts as indexed.
 *
 * @param SearchApiIndex $index
 *   The index for which the items are indexed.
 * @param array $items
 *   The items to index, keyed by item ID. Each item is an array of fields
 *   keyed by field name, every field being an array with at least the keys
 *   "value" and "type".
 *
 * @return array
 *   The IDs of all items that were sent to Solr successfully; an empty array
 *   if nothing could be indexed.
 */
public function indexItems(SearchApiIndex $index, array $items) {
  $index_id = $index->machine_name;
  $field_names = $this->getFieldNames($index);
  $documents = array();
  $prepared_ids = array();

  // Step 1: convert every item into a Solr document.
  foreach ($items as $id => $item) {
    try {
      $document = new Apache_Solr_Document();
      $document->setField('id', $this->createId($index_id, $id));
      $document->setField('index_id', $index_id);
      $document->setField('item_id', $id);
      foreach ($item as $key => $field) {
        if (!isset($field_names[$key])) {
          throw new SearchApiException(t('Unknown field @field.', array('@field' => $key)));
        }
        $this->addIndexField($document, $field_names[$key], $field['value'], $field['type']);
      }
      // Only completely built documents are queued for sending.
      $documents[] = $document;
      $prepared_ids[] = $id;
    }
    catch (Exception $e) {
      watchdog_exception('search_api_solr', $e, "%type while indexing @type with ID @id: !message in %function (line %line of %file).", array('@type' => $index->item_type, '@id' => $id), WATCHDOG_WARNING);
    }
  }

  if (!$documents) {
    return array();
  }

  // Step 2: send all documents in a single request.
  try {
    $this->connect();
    $response = $this->solr->addDocuments($documents);
    $status = $response->getHttpStatus();
    if ($status != 200) {
      throw new SearchApiException(t('HTTP status @status: @msg.',
        array('@status' => $status, '@msg' => $response->getHttpStatusMessage())));
    }
    if (!empty($index->options['index_directly'])) {
      $this->scheduleCommit();
    }
    return $prepared_ids;
  }
  catch (Exception $e) {
    watchdog_exception('search_api_solr', $e, "%type while indexing: !message in %function (line %line of %file).");
  }

  return array();
}
/**
 * Builds the unique document identifier used on the Solr server.
 *
 * The identifier combines index ID and item ID, joined by a hyphen.
 *
 * @param string $index_id
 *   The ID (machine name) of the index.
 * @param mixed $item_id
 *   The ID of the item within that index.
 *
 * @return string
 *   The combined identifier, "{index ID}-{item ID}".
 */
protected function createId($index_id, $item_id) {
  return $index_id . '-' . $item_id;
}
/**
 * Returns the mapping of Search API field names to Solr field names.
 *
 * Besides the fields configured on the index, the mapping always contains
 * the special properties "search_api_id", "search_api_relevance" and
 * "search_api_item_id". The result is cached per index on this object.
 *
 * @param SearchApiIndex $index
 *   The index whose field names are mapped.
 * @param bool $reset
 *   (optional) TRUE to rebuild the mapping even if a cached one exists.
 *
 * @return array
 *   An array mapping local property names to Solr document property names.
 *
 * @see SearchApiSolrService::search()
 */
public function getFieldNames(SearchApiIndex $index, $reset = FALSE) {
  // Serve from the per-index cache unless a rebuild was requested.
  if (!$reset && isset($this->fieldNames[$index->machine_name])) {
    return $this->fieldNames[$index->machine_name];
  }

  // "local property name" => "solr doc property name".
  $mapping = array(
    'search_api_id' => 'ss_search_api_id',
    'search_api_relevance' => 'score',
    'search_api_item_id' => 'item_id',
  );

  $index_fields = array();
  if (isset($index->options['fields'])) {
    $index_fields = $index->options['fields'];
  }

  foreach ($index_fields as $key => $field) {
    // Prefer the field's real type when this server supports it.
    $type = $field['type'];
    if (isset($field['real_type'])) {
      $custom_type = search_api_extract_inner_type($field['real_type']);
      if ($this->supportsFeature('search_api_data_type_' . $custom_type)) {
        $type = $field['real_type'];
      }
    }

    // The Solr name is "{prefix}_{key}": a type-specific prefix, followed by
    // "s" (type equals its inner type) or "m" (it does not) unless the type
    // is flagged "always multiValued".
    $inner_type = search_api_extract_inner_type($type);
    $type_info = search_api_solr_get_dynamic_field_info($inner_type);
    $prefix = '';
    if (isset($type_info['prefix'])) {
      $prefix = $type_info['prefix'];
    }
    if (empty($type_info['always multiValued'])) {
      $prefix .= ($type == $inner_type) ? 's' : 'm';
    }
    $mapping[$key] = $prefix . '_' . $key;
  }

  // Give other modules the chance to adjust the mapping before caching it.
  drupal_alter('search_api_solr_field_mapping', $index, $mapping);
  $this->fieldNames[$index->machine_name] = $mapping;

  return $this->fieldNames[$index->machine_name];
}
/**
 * Adds a single field value to a Solr document.
 *
 * List types are unwrapped recursively, adding each contained value as one
 * value of a multi-valued field.
 *
 * @param Apache_Solr_Document $doc
 *   The document the field is added to.
 * @param string $key
 *   The Solr field name.
 * @param mixed $value
 *   The field value; NULL values are not indexed.
 * @param string $type
 *   The Search API type of the value.
 * @param bool $multi_valued
 *   (optional) TRUE to add the value to the field's existing values instead
 *   of setting the field.
 */
protected function addIndexField(Apache_Solr_Document $doc, $key, $value, $type, $multi_valued = FALSE) {
  // A missing field yields no value; there is nothing to index then.
  if (!isset($value)) {
    return;
  }

  if (search_api_is_list_type($type)) {
    // Strip five leading characters and one trailing character from the list
    // type to obtain the type of the contained values.
    $item_type = substr($type, 5, -1);
    foreach ($value as $item) {
      $this->addIndexField($doc, $key, $item, $item_type, TRUE);
    }
    return;
  }

  if ($type == 'tokens') {
    // Tokenized text: every token's value becomes one value of the field.
    foreach ($value as $token) {
      $doc->addField($key, $token['value']);
    }
    return;
  }

  if ($type == 'boolean') {
    $value = $value ? 'true' : 'false';
  }
  elseif ($type == 'date') {
    // Accept timestamps as well as date strings; unparsable dates are
    // silently skipped.
    $timestamp = is_numeric($value) ? (int) $value : strtotime($value);
    if ($timestamp === FALSE) {
      return;
    }
    $value = format_date($timestamp, 'custom', self::SOLR_DATE_FORMAT, 'UTC');
  }
  elseif ($type == 'integer') {
    $value = (int) $value;
  }
  elseif ($type == 'decimal') {
    $value = (float) $value;
  }

  if ($multi_valued) {
    $doc->addField($key, $value);
  }
  else {
    $doc->setField($key, $value);
  }
}
/**
 * Deletes items from an index on this server.
 *
 * This method has a custom, Solr-specific extension: if $ids is a string
 * other than "all", it is treated as a Solr query and all items matching that
 * query are deleted. If $index is additionally specified, only matching items
 * of that index are deleted. It is up to the caller to ensure $ids is a valid
 * query when the method is called in this fashion.
 *
 * Errors are logged and not propagated to the caller.
 *
 * @param array|string $ids
 *   (optional) Either an array of item IDs (only valid together with $index),
 *   the string "all", or a Solr query string.
 * @param SearchApiIndex|null $index
 *   (optional) The index to delete from, or NULL to delete from all indexes
 *   on this server.
 */
public function deleteItems($ids = 'all', SearchApiIndex $index = NULL) {
  try {
    $this->connect();

    // Compare strictly: with a loose comparison, values like TRUE (and 0 on
    // PHP versions before 8) would equal "all" and wipe everything.
    $delete_all = ($ids === 'all');

    if ($index) {
      $index_id = $index->machine_name;
      if (is_array($ids)) {
        $solr_ids = array();
        foreach ($ids as $id) {
          $solr_ids[] = $this->createId($index_id, $id);
        }
        $this->solr->deleteByMultipleIds($solr_ids);
      }
      elseif ($delete_all) {
        $this->solr->deleteByQuery("index_id:" . $index_id);
      }
      else {
        // Combine both clauses with an explicit AND, so the restriction to
        // this index does not depend on the server's default query operator.
        $this->solr->deleteByQuery('index_id:' . $index_id . ' AND (' . $ids . ')');
      }
    }
    else {
      // Item IDs can only be turned into Solr IDs with a known index, so an
      // array must not be passed on as if it were a query.
      if (is_array($ids)) {
        throw new SearchApiException(t('Cannot delete items by ID without specifying an index.'));
      }
      $this->solr->deleteByQuery($delete_all ? '*:*' : $ids);
    }

    $this->scheduleCommit();
  }
  catch (Exception $e) {
    watchdog_exception('search_api_solr', $e, '%type while deleting items from server @server: !message in %function (line %line of %file).', array('@server' => $this->server->name));
  }
}
/**
 * Executes a search on the Solr server.
 *
 * Translates the query's keys, fields, filters, sorts, facets, highlighting
 * and "More Like This" settings into Solr parameters, sends the request and
 * converts the response into a Search API result array.
 *
 * @param SearchApiQueryInterface $query
 *   The query to execute.
 *
 * @return array
 *   The results as built by extractResults(), extended by the key
 *   "search_api_facets" (if any facets were extracted) and by "performance",
 *   an array of timings with the keys "complete", "preprocessing",
 *   "execution" and "postprocessing".
 *
 * @throws SearchApiException
 *   If anything goes wrong while querying Solr, including a response status
 *   other than 200.
 */
public function search(SearchApiQueryInterface $query) {
  $time_method_called = microtime(TRUE);

  // Every search starts out without a custom request handler.
  $this->request_handler = NULL;

  $index = $query->getIndex();
  $fields = $this->getFieldNames($index);

  // Structured keys are flattened into a single Solr query string.
  $keys = $query->getKeys();
  if (is_array($keys)) {
    $keys = $this->flattenKeys($keys);
  }

  // Build the list of searched fields, appending configured boosts.
  $options = $query->getOptions();
  $search_fields = $query->getFields();
  $index_fields = $index->getFields();
  $qf = array();
  foreach ($search_fields as $f) {
    $boost_suffix = '';
    if (isset($index_fields[$f]['boost'])) {
      $boost_suffix = '^' . $index_fields[$f]['boost'];
    }
    $qf[] = $fields[$f] . $boost_suffix;
  }

  // Filter queries, always restricted to the documents of this index.
  $filter = $query->getFilter();
  $fq = $this->createFilterQueries($filter, $fields, $index->options['fields']);
  $fq[] = 'index_id:' . $index->machine_name;

  // Sorting: fields with the "ss_" prefix are sorted via their "sort_"
  // counterpart.
  $sort = array();
  foreach ($query->getSort() as $f => $order) {
    $sort_field = $fields[$f];
    if (substr($sort_field, 0, 3) == 'ss_') {
      $sort_field = 'sort_' . substr($sort_field, 3);
    }
    $sort[] = $sort_field . ' ' . strtolower($order);
  }

  // Facets and highlighting.
  $facets = $query->getOption('search_api_facets', array());
  $facet_params = $this->getFacetParams($facets, $fields, $fq);
  $highlight_params = $this->getHighlightParams($query);

  // "More Like This": search for documents similar to the given item.
  $mlt_params = array();
  $mlt = $query->getOption('search_api_mlt');
  if ($mlt) {
    $mlt_params['qt'] = 'mlt';
    // The fields to look for similarities in.
    $mlt_fl = array();
    foreach ($mlt['fields'] as $f) {
      $mlt_fl[] = $fields[$f];
      // For non-text fields, set the minimum word length to 0.
      if (isset($index->options['fields'][$f]['type']) && !search_api_is_text_type($index->options['fields'][$f]['type'])) {
        $mlt_params['f.' . $fields[$f] . '.mlt.minwl'] = 0;
      }
    }
    $mlt_params['mlt.fl'] = implode(',', $mlt_fl);
    $keys = 'id:' . SearchApiSolrConnection::phrase($this->createId($index->machine_name, $mlt['id']));
  }

  // Defaults.
  if (!$keys) {
    $keys = NULL;
  }
  $offset = isset($options['offset']) ? $options['offset'] : 0;
  $limit = isset($options['limit']) ? $options['limit'] : 1000000;

  // Collect all parameters. Existing keys are never overwritten by the "+="
  // merges below, so the returned field list can be fixed right away.
  $params = array(
    'fl' => !empty($this->options['retrieve_data']) ? '*,score' : 'item_id,score',
    'qf' => $qf,
    'fq' => $fq,
  );
  if ($sort) {
    $params['sort'] = implode(', ', $sort);
  }
  if (!empty($facet_params['facet.field'])) {
    $params += $facet_params;
  }
  if (!empty($highlight_params)) {
    $params += $highlight_params;
  }
  if (!empty($options['search_api_spellcheck'])) {
    $params['spellcheck'] = 'true';
  }
  if (!empty($mlt_params['mlt.fl'])) {
    $params += $mlt_params;
  }

  // The arguments are bundled by reference, so alter hooks and preQuery()
  // can change what is eventually sent to Solr.
  $call_args = array(
    'query' => &$keys,
    'offset' => &$offset,
    'limit' => &$limit,
    'params' => &$params,
  );
  if ($this->request_handler) {
    $this->setRequestHandler($this->request_handler, $call_args);
  }

  try {
    // Send the search request.
    $time_processing_done = microtime(TRUE);
    $this->connect();
    drupal_alter('search_api_solr_query', $call_args, $query);
    $this->preQuery($call_args, $query);

    // The HTTP method comes from the server options, defaulting to POST.
    $http_method = Apache_Solr_Service::METHOD_POST;
    if (!empty($this->options['http_method'])) {
      $http_method = $this->options['http_method'];
    }
    $response = $this->solr->search($keys, $offset, $limit, $params, $http_method);
    $time_query_done = microtime(TRUE);

    if ($response->getHttpStatus() != 200) {
      throw new SearchApiException(t('The Solr server responded with status code @status: @msg.',
        array('@status' => $response->getHttpStatus(), '@msg' => $response->getHttpStatusMessage())));
    }

    // Convert the response into results and facets.
    $results = $this->extractResults($query, $response);
    $extracted_facets = $this->extractFacets($query, $response);
    if ($extracted_facets) {
      $results['search_api_facets'] = $extracted_facets;
    }

    drupal_alter('search_api_solr_search_results', $results, $query, $response);
    $this->postQuery($results, $query, $response);

    // Record how long each phase took.
    $time_end = microtime(TRUE);
    $results['performance'] = array(
      'complete' => $time_end - $time_method_called,
      'preprocessing' => $time_processing_done - $time_method_called,
      'execution' => $time_query_done - $time_processing_done,
      'postprocessing' => $time_end - $time_query_done,
    );

    return $results;
  }
  catch (Exception $e) {
    throw new SearchApiException(t('An error occurred while trying to search with Solr: @msg.', array('@msg' => $e->getMessage())));
  }
}
/**
 * Extracts the search results from a Solr response.
 *
 * @param SearchApiQueryInterface $query
 *   The query that was executed.
 * @param Apache_Solr_Response $response
 *   A response object from SolrPhpClient.
 *
 * @return array
 *   An array with the following keys:
 *   - results: An array of search results keyed by item ID. Each result has
 *     the keys "id", "score" and "fields", plus "excerpt" if one is available.
 *   - result count: The number of total results.
 *   - search_api_spellcheck: (optional) A SearchApiSpellcheckSolr object, if
 *     spellchecking was requested and the module is enabled.
 */
protected function extractResults(SearchApiQueryInterface $query, Apache_Solr_Response $response) {
  $index = $query->getIndex();
  $fields = $this->getFieldNames($index);
  $field_options = $index->options['fields'];

  $results = array('results' => array());

  // In some rare cases (e.g., an MLT query with a nonexistent ID) the
  // response will not contain any result section.
  if (!isset($response->response)) {
    $results['result count'] = 0;
    return $results;
  }
  $results['result count'] = $response->response->numFound;

  foreach ($response->response->docs as $doc) {
    // Translate the document's properties from Solr to Search API names,
    // reversing the mapping of SearchApiSolrService::getFieldNames().
    $item_fields = array();
    foreach ($fields as $search_api_property => $solr_property) {
      if (!isset($doc->{$solr_property})) {
        continue;
      }
      $value = $doc->{$solr_property};
      // Date fields are turned back into timestamps.
      if (isset($field_options[$search_api_property]['type'])
        && $field_options[$search_api_property]['type'] == 'date'
        && preg_match('/^\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}Z$/', $value)) {
        $value = strtotime($value);
      }
      $item_fields[$search_api_property] = $value;
    }

    // Item ID and score are found in the special "search_api_*" properties
    // that getFieldNames() provides mappings for.
    $result = array(
      'id' => $item_fields['search_api_item_id'],
      'score' => $item_fields['search_api_relevance'],
      'fields' => $item_fields,
    );

    // The fields are passed by reference, as getExcerpt() may replace field
    // data with its highlighted version.
    $solr_id = $this->createId($index->machine_name, $result['id']);
    $excerpt = $this->getExcerpt($response, $solr_id, $result['fields'], $fields);
    if ($excerpt) {
      $result['excerpt'] = $excerpt;
    }

    // Results without a usable ID are dropped.
    if ($result['id']) {
      $results['results'][$result['id']] = $result;
    }
  }

  // Attach spellcheck suggestions, if requested.
  if (module_exists('search_api_spellcheck') && $query->getOption('search_api_spellcheck')) {
    $results['search_api_spellcheck'] = new SearchApiSpellcheckSolr($response);
  }

  return $results;
}
/**
 * Builds the excerpt for one item from a response's highlighting data.
 *
 * If the "highlight_data" option is set, retrieved field data is additionally
 * replaced by its highlighted version.
 *
 * @param Apache_Solr_Response $response
 *   The response containing the highlighting data.
 * @param string $id
 *   The Solr document ID of the item.
 * @param array $fields
 *   The item's field values keyed by Search API property name; highlighted
 *   values are written back into this array.
 * @param array $field_mapping
 *   The mapping of Search API property names to Solr field names.
 *
 * @return string|false
 *   The excerpt, which may be an empty string; FALSE if the response holds no
 *   highlighting data for the item.
 */
protected function getExcerpt(Apache_Solr_Response $response, $id, array &$fields, array $field_mapping) {
  if (!isset($response->highlighting->$id)) {
    return FALSE;
  }
  $highlighting = $response->highlighting->$id;

  $excerpt = '';
  if (!empty($this->options['excerpt']) && !empty($highlighting->spell)) {
    foreach ($highlighting->spell as $snippet) {
      // Remove complete tags first, then whatever is left of tags that were
      // cut off at either end of the fragment.
      $snippet = preg_replace('/^.*>|<.*$/', '', strip_tags($snippet));
      $snippet = $this->formatHighlighting($snippet);
      // Fragments sometimes start or end with punctuation. It is trimmed for
      // all common cases, but never "<" or ">", so HTML tags stay valid.
      $snippet = trim($snippet, "\00..\x2F:;=\x3F..\x40\x5B..\x60");
      $excerpt .= $snippet . ' … ';
    }
  }

  if (!empty($this->options['highlight_data'])) {
    foreach ($field_mapping as $search_api_property => $solr_property) {
      $is_text_field = substr($solr_property, 0, 2) == 't_';
      if ($is_text_field && !empty($highlighting->$solr_property)) {
        // Unlike above, HTML is preserved here; only the [HIGHLIGHT] markers
        // are replaced.
        $fields[$search_api_property] = $this->formatHighlighting($highlighting->$solr_property);
      }
    }
  }

  return $excerpt;
}
/**
 * Converts highlighting markers into HTML.
 *
 * Replaces "[HIGHLIGHT]" with "<strong>" and "[/HIGHLIGHT]" with "</strong>".
 *
 * @param string|array $snippet
 *   The text (or array of texts) containing the markers.
 *
 * @return string|array
 *   The input with all markers replaced.
 */
protected function formatHighlighting($snippet) {
  // The optional slash is captured, so opening and closing markers are
  // handled by the same pattern.
  $marker_pattern = '#\[(/?)HIGHLIGHT\]#';
  $html_tag = '<$1strong>';
  return preg_replace($marker_pattern, $html_tag, $snippet);
}
/**
 * Extracts facets from a Solr response.
 *
 * @param SearchApiQueryInterface $query
 *   The query that was executed; its "search_api_facets" option determines
 *   which facets are extracted.
 * @param Apache_Solr_Response $response
 *   A response object from SolrPhpClient.
 *
 * @return array
 *   An array describing the facets that apply to the current results, keyed
 *   by facet delta. Each facet is a list of arrays with the keys "filter"
 *   (the quoted term, or "!" for missing values) and "count". Empty if the
 *   response contains no facet data.
 */
protected function extractFacets(SearchApiQueryInterface $query, Apache_Solr_Response $response) {
  $facets = array();
  if (!isset($response->facet_counts->facet_fields)) {
    return $facets;
  }

  $index = $query->getIndex();
  $fields = $this->getFieldNames($index);
  $facet_fields = $response->facet_counts->facet_fields;
  $extract_facets = $query->getOption('search_api_facets');
  if (!$extract_facets) {
    return $facets;
  }

  foreach ($extract_facets as $delta => $info) {
    $field = $fields[$info['field']];
    if (empty($facet_fields->$field)) {
      continue;
    }
    $min_count = $info['min_count'];
    $terms = $facet_fields->$field;

    if ($info['missing']) {
      // The "_empty_" term has to be incorporated correctly.
      if (isset($terms->_empty_) && $terms->_empty_ < $min_count) {
        // Work on a copy, so the response object itself stays unchanged.
        $terms = clone $terms;
        unset($terms->_empty_);
      }
      else {
        // Make sure the term with the fewest results is dropped if the limit
        // would otherwise be exceeded. A limit of 0 (or less) means "no
        // limit", in which case nothing must be dropped.
        $terms = (array) $terms;
        arsort($terms);
        if ($info['limit'] > 0 && count($terms) > $info['limit']) {
          array_pop($terms);
        }
      }
    }
    elseif (isset($terms->_empty_)) {
      $terms = clone $terms;
      unset($terms->_empty_);
    }

    $type = 'string';
    if (isset($index->options['fields'][$info['field']]['type'])) {
      $type = $index->options['fields'][$info['field']]['type'];
    }

    foreach ($terms as $term => $count) {
      if ($count < $min_count) {
        continue;
      }
      // The "missing" term has to be recognized before any type conversion,
      // as it would otherwise be mangled (e.g., by strtotime() for dates).
      if ($term === '_empty_') {
        $filter = '!';
      }
      else {
        if ($type == 'boolean') {
          if ((string) $term === 'true') {
            $term = 1;
          }
          elseif ((string) $term === 'false') {
            $term = 0;
          }
        }
        elseif ($type == 'date') {
          $term = strtotime((string) $term);
        }
        $filter = '"' . $term . '"';
      }
      $facets[$delta][] = array(
        'filter' => $filter,
        'count' => $count,
      );
    }
  }

  return $facets;
}
- /**
-  * Flatten a keys array into a single search string.
-  *
-  * @param array $keys
-  *   The keys array to flatten, formatted as specified by
-  *   SearchApiQueryInterface::getKeys().
-  *
-  * @return string
-  *   A Solr query string representing the same keys. An empty string is
-  *   returned if the array contains no usable keys.
-  */
- protected function flattenKeys(array $keys) {
-   $k = array();
-   $or = isset($keys['#conjunction']) && $keys['#conjunction'] == 'OR';
-   $neg = !empty($keys['#negation']);
-   $nested_expressions = FALSE;
-   foreach (element_children($keys) as $i) {
-     $key = $keys[$i];
-     if (is_array($key)) {
-       // Empty nested arrays contribute nothing.
-       $subkeys = $key ? $this->flattenKeys($key) : '';
-       if ($subkeys !== '') {
-         $nested_expressions = TRUE;
-         // If this is a negated OR expression, we can't just use nested keys
-         // as-is, but have to put them into parentheses.
-         if ($or && $neg) {
-           $subkeys = "($subkeys)";
-         }
-         $k[] = $subkeys;
-       }
-       continue;
-     }
-     // Only skip keys that are really empty. A plain truthiness check would
-     // also discard the valid keyword "0".
-     $key = trim($key);
-     if ($key === '') {
-       continue;
-     }
-     $k[] = SearchApiSolrConnection::phrase($key);
-   }
-   if (!$k) {
-     return '';
-   }
-   // Formatting the keys into a Solr query can be a bit complex. The following
-   // code will produce strings that look like this:
-   //
-   // #conjunction | #negation | return value
-   // ----------------------------------------------------------------
-   // AND          | FALSE     | A B C
-   // AND          | TRUE      | -(A B C)
-   // OR           | FALSE     | ((A) OR (B) OR (C))
-   // OR           | TRUE      | -A -B -C
-   // If there was just a single, unnested key, we can ignore all this.
-   if (count($k) == 1 && !$nested_expressions) {
-     $k = reset($k);
-     return $neg ? "-$k" : $k;
-   }
-   if ($or) {
-     if ($neg) {
-       return '-' . implode(' -', $k);
-     }
-     return '((' . implode(') OR (', $k) . '))';
-   }
-   $k = implode(' ', $k);
-   return $neg ? "-($k)" : $k;
- }
- /**
-  * Transforms a query filter into a flat array of Solr filter queries, using
-  * the field names in $solr_fields.
-  *
-  * @param SearchApiQueryFilterInterface $filter
-  *   The filter to transform. Nested filters are processed recursively.
-  * @param array $solr_fields
-  *   Map of Search API field identifiers to Solr field names.
-  * @param array $fields
-  *   Field information keyed by Search API field identifier. A condition on
-  *   a field missing from this array is rejected.
-  *
-  * @return array
-  *   A list of Solr filter query strings. For an OR filter with more than one
-  *   condition, the list contains a single combined expression.
-  *
-  * @throws SearchApiException
-  *   If a condition refers to a field that is not present in $fields.
-  */
- protected function createFilterQueries(SearchApiQueryFilterInterface $filter, array $solr_fields, array $fields) {
-   $or = $filter->getConjunction() == 'OR';
-   $fq = array();
-   foreach ($filter->getFilters() as $f) {
-     if (is_array($f)) {
-       // A single condition: array(field, value, operator).
-       if (!isset($fields[$f[0]])) {
-         throw new SearchApiException(t('Filter term on unknown or unindexed field @field.', array('@field' => $f[0])));
-       }
-       if ($f[1] !== '') {
-         $fq[] = $this->createFilterQuery($solr_fields[$f[0]], $f[1], $f[2], $fields[$f[0]]);
-       }
-       continue;
-     }
-     $q = $this->createFilterQueries($f, $solr_fields, $fields);
-     // A nested filter without any conditions must not produce an empty
-     // "(())" expression, which Solr cannot parse.
-     if (!$q) {
-       continue;
-     }
-     if ($filter->getConjunction() != $f->getConjunction()) {
-       // $or == TRUE means the nested filter has conjunction AND, and vice
-       // versa.
-       $sep = $or ? ' ' : ' OR ';
-       $fq[] = count($q) == 1 ? reset($q) : '((' . implode(')' . $sep . '(', $q) . '))';
-     }
-     else {
-       $fq = array_merge($fq, $q);
-     }
-   }
-   return ($or && count($fq) > 1) ? array('((' . implode(') OR (', $fq) . '))') : $fq;
- }
- /**
-  * Builds the Solr filter expression for one field condition.
-  *
-  * @param string $field
-  *   The Solr field name. It is passed through
-  *   SearchApiSolrConnection::escapeFieldName() before use.
-  * @param mixed $value
-  *   The value to compare with. NULL tests whether the field has any value.
-  * @param string $operator
-  *   One of "=", "<>", "<", "<=", ">=" or ">". Any other operator is treated
-  *   like "=".
-  * @param array $field_info
-  *   Field information. Its "type" entry determines the value formatting.
-  *
-  * @return string
-  *   The filter query string for this condition.
-  */
- protected function createFilterQuery($field, $value, $operator, $field_info) {
-   $field = SearchApiSolrConnection::escapeFieldName($field);
-   if ($value === NULL) {
-     // "= NULL" matches documents without any value in the field, every
-     // other operator matches documents that have one.
-     $prefix = $operator == '=' ? '-' : '';
-     return $prefix . "$field:[* TO *]";
-   }
-   $trimmed = trim($value);
-   $inner_type = search_api_extract_inner_type($field_info['type']);
-   $value = $this->formatFilterValue($trimmed, $inner_type);
-   if ($operator == '<>') {
-     return "-($field:$value)";
-   }
-   if ($operator == '<') {
-     return "$field:{* TO $value}";
-   }
-   if ($operator == '<=') {
-     return "$field:[* TO $value]";
-   }
-   if ($operator == '>=') {
-     return "$field:[$value TO *]";
-   }
-   if ($operator == '>') {
-     return "$field:{{$value} TO *}";
-   }
-   return "$field:$value";
- }
- /**
-  * Prepares a filter value for use in a Solr query, depending on its type.
-  *
-  * @param mixed $value
-  *   The raw filter value.
-  * @param string $type
-  *   The field's data type. "boolean" and "date" get special treatment, all
-  *   other types are used as they are.
-  *
-  * @return string|int
-  *   The value as returned by SearchApiSolrConnection::phrase(), or the
-  *   integer 0 if a date value could not be parsed.
-  */
- protected function formatFilterValue($value, $type) {
-   if ($type == 'boolean') {
-     $value = $value ? 'true' : 'false';
-   }
-   elseif ($type == 'date') {
-     // Numeric values are taken as timestamps, anything else is parsed.
-     $timestamp = is_numeric($value) ? (int) $value : strtotime($value);
-     if ($timestamp === FALSE) {
-       return 0;
-     }
-     $value = format_date($timestamp, 'custom', self::SOLR_DATE_FORMAT, 'UTC');
-   }
-   return SearchApiSolrConnection::phrase($value);
- }
- /**
-  * Builds the Solr request parameters for the requested facets.
-  *
-  * @param array $facets
-  *   The facet definitions. Each one is read for the keys "field", "limit",
-  *   "min_count", "missing" and, optionally, "operator".
-  * @param array $fields
-  *   Map of Search API field identifiers to Solr field names. Facets on
-  *   fields without an entry are ignored.
-  * @param array $fq
-  *   The filter queries of the search, passed by reference. Filters on fields
-  *   with an "or" facet get a "{!tag=...}" prefix added.
-  *
-  * @return array
-  *   The facet parameters, or an empty array if no facets were given.
-  */
- protected function getFacetParams(array $facets, array $fields, array &$fq = array()) {
-   if (!$facets) {
-     return array();
-   }
-   // Global defaults; per-field overrides are only added where they differ.
-   $facet_params = array(
-     'facet' => 'true',
-     'facet.sort' => 'count',
-     'facet.limit' => 10,
-     'facet.mincount' => 1,
-     'facet.missing' => 'false',
-   );
-   $tags = array();
-   foreach ($facets as $info) {
-     if (empty($fields[$info['field']])) {
-       continue;
-     }
-     $field = $fields[$info['field']];
-     $is_or_facet = isset($info['operator']) && $info['operator'] === 'or';
-     if ($is_or_facet) {
-       // Filters on this field have to be tagged, so that the facet can
-       // exclude them again.
-       $escaped = SearchApiSolrConnection::escapeFieldName($fields[$info['field']]);
-       $tags[$escaped] = "{!tag=$escaped}";
-       $facet_params['facet.field'][] = "{!ex=$escaped}$field";
-     }
-     else {
-       $facet_params['facet.field'][] = $field;
-     }
-     // A limit of 0 is sent to Solr as -1.
-     if ($info['limit'] != 10) {
-       $facet_params["f.$field.facet.limit"] = $info['limit'] ? $info['limit'] : -1;
-     }
-     if ($info['min_count'] != 1) {
-       $facet_params["f.$field.facet.mincount"] = $info['min_count'];
-     }
-     if ($info['missing']) {
-       $facet_params["f.$field.facet.missing"] = 'true';
-     }
-   }
-   // Tag filters of fields with "OR" facets.
-   foreach ($tags as $escaped_field => $tag) {
-     // The field name has to be at the start of the filter, or be preceded by
-     // an opening parenthesis or a space.
-     $regex = '#(?<![^( ])' . preg_quote($escaped_field, '#') . ':#';
-     foreach ($fq as $i => $filter) {
-       // Solr can't handle two tags on the same filter, so a filter that is
-       // already tagged is left alone.
-       $already_tagged = substr($filter, 0, 6) == '{!tag=';
-       if (!$already_tagged && preg_match($regex, $filter)) {
-         $fq[$i] = $tag . $filter;
-       }
-     }
-   }
-   return $facet_params;
- }
- /**
-  * Builds the Solr highlighting parameters for a search.
-  *
-  * Which parameters are set depends on the "excerpt" and "highlight_data"
-  * options of this service.
-  *
-  * (The $query parameter currently isn't used and is only here for the
-  * potential sake of subclasses.)
-  *
-  * @param SearchApiQueryInterface $query
-  *   The query that is being executed.
-  *
-  * @return array
-  *   The highlighting parameters, or an empty array if neither option is
-  *   enabled.
-  */
- protected function getHighlightParams(SearchApiQueryInterface $query) {
-   $excerpt = !empty($this->options['excerpt']);
-   $highlight_data = !empty($this->options['highlight_data']);
-   if (!$excerpt && !$highlight_data) {
-     return array();
-   }
-   $highlight_params = array(
-     'hl' => 'true',
-     'hl.fl' => 'spell',
-     'hl.simple.pre' => '[HIGHLIGHT]',
-     'hl.simple.post' => '[/HIGHLIGHT]',
-     'hl.snippets' => 3,
-     'hl.fragsize' => 70,
-     'hl.mergeContiguous' => 'true',
-   );
-   if ($highlight_data) {
-     // It regrettably doesn't seem to be possible to set hl.fl to several
-     // values, if one contains wild cards (i.e., "t_*,spell" wouldn't work).
-     // Therefore, all fields are highlighted if an excerpt is needed, too.
-     $highlight_params['hl.fl'] = $excerpt ? '*' : 't_*';
-     $highlight_params['hl.snippets'] = 1;
-     $highlight_params['hl.fragsize'] = 0;
-     if ($excerpt) {
-       // Restore the excerpt settings for the "spell" field, which is the
-       // one used for generating the excerpt.
-       $highlight_params['f.spell.hl.snippets'] = 3;
-       $highlight_params['f.spell.hl.fragsize'] = 70;
-     }
-   }
-   return $highlight_params;
- }
- /**
-  * Sets the request handler and adjusts the request parameters accordingly.
-  *
-  * @param $handler
-  *   Name of the handler to set.
-  * @param array $call_args
-  *   An associative array containing all four arguments to the
-  *   Apache_Solr_Service::search() call ("query", "offset", "limit" and
-  *   "params") as references.
-  *
-  * @return boolean
-  *   TRUE iff this method invocation handled the given handler. This allows
-  *   subclasses to recognize whether the request handler was already set by
-  *   this method.
-  */
- protected function setRequestHandler($handler, array &$call_args) {
-   // "pinkPony" is the only handler name this implementation recognizes.
-   $handled = ($handler == 'pinkPony');
-   if ($handled) {
-     $call_args['params']['qt'] = $handler;
-   }
-   return $handled;
- }
- /**
-  * Extension point that is invoked right before a query is sent to Solr.
-  *
-  * This implementation does nothing. Subclasses can override it to apply
-  * custom changes. It works exactly like
-  * hook_search_api_solr_query_alter().
-  *
-  * @param array $call_args
-  *   An associative array containing all four arguments to the
-  *   Apache_Solr_Service::search() call ("query", "offset", "limit" and
-  *   "params") as references.
-  * @param SearchApiQueryInterface $query
-  *   The SearchApiQueryInterface object representing the executed search
-  *   query.
-  */
- protected function preQuery(array &$call_args, SearchApiQueryInterface $query) {
- }
- /**
-  * Extension point for changing search results before they are returned.
-  *
-  * This implementation does nothing. Subclasses can override it to apply
-  * custom changes. It works exactly like
-  * hook_search_api_solr_search_results_alter().
-  *
-  * @param array $results
-  *   The results array that will be returned for the search.
-  * @param SearchApiQueryInterface $query
-  *   The SearchApiQueryInterface object representing the executed search
-  *   query.
-  * @param Apache_Solr_Response $response
-  *   The response object returned by Solr.
-  */
- protected function postQuery(array &$results, SearchApiQueryInterface $query, Apache_Solr_Response $response) {
- }
- //
- // Autocompletion feature
- //
- /**
-  * Get autocompletion suggestions for some user input.
-  *
-  * Up to two Solr requests are sent. The first one only looks for terms
-  * starting with the incomplete key. If that doesn't yield enough suggestions
-  * (and the "autocorrect_suggest_words" option isn't disabled), a second one
-  * searches for the incomplete key as an additional keyword and suggests
-  * other words from the matching items.
-  *
-  * Largely copied from the apachesolr_autocomplete module.
-  *
-  * @param SearchApiQueryInterface $query
-  *   A query representing the completed user input so far.
-  * @param SearchApiAutocompleteSearch $search
-  *   An object containing details about the search the user is on, and
-  *   settings for the autocompletion.
-  * @param string $incomplete_key
-  *   The start of another fulltext keyword for the search, which should be
-  *   completed.
-  * @param string $user_input
-  *   The complete user input for the fulltext search keywords so far.
-  *
-  * @return array
-  *   An array of suggestions. Each suggestion is either a simple string
-  *   containing the whole suggested keywords, or an array containing the
-  *   following keys:
-  *   - prefix: For special suggestions, some kind of prefix describing them.
-  *   - suggestion_prefix: A suggested prefix for the entered input.
-  *   - user_input: The input entered by the user. Defaults to $user_input.
-  *   - suggestion_suffix: A suggested suffix for the entered input.
-  *   - results: If available, the estimated number of results for these keys.
-  *   An empty array is returned if Solr answers with a non-200 status code.
-  */
- public function getAutocompleteSuggestions(SearchApiQueryInterface $query, SearchApiAutocompleteSearch $search, $incomplete_key, $user_input) {
-   $suggestions = array();
-   // Reset request handler
-   $this->request_handler = NULL;
-   // Turn inputs to lower case, otherwise we get case sensitivity problems.
-   $incomp = drupal_strtolower($incomplete_key);
-   $index = $query->getIndex();
-   $fields = $this->getFieldNames($index);
-   // Extract keys
-   $keys = $query->getKeys();
-   if (is_array($keys)) {
-     // Collect all single keywords from the (possibly nested) keys array.
-     $keys_array = array();
-     while ($keys) {
-       reset($keys);
-       if (!element_child(key($keys))) {
-         array_shift($keys);
-         continue;
-       }
-       $key = array_shift($keys);
-       if (is_array($key)) {
-         $keys = array_merge($keys, $key);
-       }
-       else {
-         $keys_array[$key] = $key;
-       }
-     }
-     $keys = $this->flattenKeys($query->getKeys());
-   }
-   else {
-     $keys_array = drupal_map_assoc(preg_split('/[-\s():{}\[\]\\\\"]+/', $keys, -1, PREG_SPLIT_NO_EMPTY));
-   }
-   if (!$keys) {
-     $keys = NULL;
-   }
-   // Set searched fields. The same Solr fields are used for searching and
-   // for retrieving the facet terms that serve as suggestions.
-   $search_fields = $query->getFields();
-   $qf = array();
-   foreach ($search_fields as $f) {
-     $qf[] = $fields[$f];
-   }
-   $facet_fields = $qf;
-   // Extract filters
-   $fq = $this->createFilterQueries($query->getFilter(), $fields, $index->options['fields']);
-   $fq[] = 'index_id:' . $index->machine_name;
-   // Autocomplete magic
-   $limit = $query->getOption('limit', 10);
-   $params = array(
-     'qf' => $qf,
-     'fq' => $fq,
-     'facet' => 'true',
-     'facet.field' => $facet_fields,
-     'facet.prefix' => $incomp,
-     'facet.limit' => $limit * 5,
-     'facet.mincount' => 1,
-     'spellcheck' => (!isset($this->options['autocorrect_spell']) || $this->options['autocorrect_spell']) ? 'true' : 'false',
-     'spellcheck.count' => 1,
-   );
-   $call_args = array(
-     'query' => &$keys,
-     'offset' => 0,
-     'limit' => 0,
-     'params' => &$params,
-   );
-   if ($this->request_handler) {
-     $this->setRequestHandler($this->request_handler, $call_args);
-   }
-   $second_pass = !isset($this->options['autocorrect_suggest_words']) || $this->options['autocorrect_suggest_words'];
-   $passes = $second_pass ? 2 : 1;
-   for ($i = 0; $i < $passes; ++$i) {
-     try {
-       // Send search request
-       $this->connect();
-       drupal_alter('search_api_solr_query', $call_args, $query);
-       $this->preQuery($call_args, $query);
-       $response = $this->solr->search($keys, 0, 0, $params);
-       if ($response->getHttpStatus() != 200) {
-         watchdog('search_api_solr', 'The Solr server responded with status code @status: @msg.', array('@status' => $response->getHttpStatus(), '@msg' => $response->getHttpStatusMessage()), WATCHDOG_WARNING, 'admin/config/search/search_api/server/' . $this->server->machine_name);
-         return array();
-       }
-       if (!empty($response->spellcheck->suggestions)) {
-         $replace = array();
-         foreach ($response->spellcheck->suggestions as $word => $data) {
-           // Ignore entries that don't carry a suggestion list.
-           if (isset($data->suggestion[0])) {
-             $replace[$word] = $data->suggestion[0];
-           }
-         }
-         $corrected = str_ireplace(array_keys($replace), array_values($replace), $user_input);
-         if ($corrected != $user_input) {
-           $spell_suggestion = array(
-             'prefix' => t('Did you mean') . ':',
-             'user_input' => $corrected,
-           );
-           // Both passes can come up with the same correction; don't list it
-           // twice.
-           if (!in_array($spell_suggestion, $suggestions)) {
-             array_unshift($suggestions, $spell_suggestion);
-           }
-         }
-       }
-       $matches = array();
-       if (isset($response->facet_counts->facet_fields)) {
-         foreach ($response->facet_counts->facet_fields as $terms) {
-           foreach ($terms as $term => $count) {
-             if (isset($matches[$term])) {
-               // If we just add the result counts, we can easily get over the
-               // total number of results if terms appear in multiple fields.
-               // Therefore, we just take the highest value from any field.
-               $matches[$term] = max($matches[$term], $count);
-             }
-             else {
-               $matches[$term] = $count;
-             }
-           }
-         }
-         if ($matches) {
-           // Eliminate suggestions that are too short or already in the query.
-           // The length is measured in characters, not bytes, so multi-byte
-           // terms are treated correctly.
-           foreach ($matches as $term => $count) {
-             if (drupal_strlen($term) < 3 || isset($keys_array[$term])) {
-               unset($matches[$term]);
-             }
-           }
-           // Don't suggest terms that are too frequent (by default in more
-           // than 90% of results).
-           $result_count = $response->response->numFound;
-           $max_occurrences = $result_count * variable_get('search_api_solr_autocomplete_max_occurrences', 0.9);
-           if (($max_occurrences >= 1 || $i > 0) && $max_occurrences < $result_count) {
-             foreach ($matches as $match => $count) {
-               if ($count > $max_occurrences) {
-                 unset($matches[$match]);
-               }
-             }
-           }
-           // The $count in this array is actually a score. We want the
-           // highest ones first.
-           arsort($matches);
-           // Shorten the array to the right ones.
-           $matches = array_slice($matches, 0, $limit, TRUE);
-           // Build suggestions using returned facets
-           $incomp_length = drupal_strlen($incomp);
-           foreach ($matches as $term => $count) {
-             if (drupal_strtolower(drupal_substr($term, 0, $incomp_length)) === $incomp) {
-               // The term completes the incomplete key.
-               $suggestion_suffix = drupal_substr($term, $incomp_length);
-             }
-             else {
-               // The term is suggested as an additional keyword.
-               $suggestion_suffix = ' ' . $term;
-             }
-             $suggestions[] = array(
-               'suggestion_suffix' => $suggestion_suffix,
-               'results' => $count,
-             );
-           }
-         }
-       }
-     }
-     catch (Exception $e) {
-       watchdog_exception('search_api_solr', $e, "%type during autocomplete Solr query: !message in %function (line %line of %file).", array(), WATCHDOG_WARNING);
-     }
-     if (count($suggestions) >= $limit) {
-       break;
-     }
-     // Change parameters for second query.
-     unset($params['facet.prefix']);
-     $keys = trim ($keys . ' ' . $incomplete_key);
-   }
-   return $suggestions;
- }
- //
- // SearchApiMultiServiceInterface methods
- //
- /**
-  * Creates a multi-index query object for searching on this server.
-  *
-  * @param $options
-  *   Associative array of options configuring this query. See
-  *   SearchApiMultiQueryInterface::__construct().
-  *
-  * @throws SearchApiException
-  *   If the server is currently disabled.
-  *
-  * @return SearchApiMultiQueryInterface
-  *   An object for searching this server.
-  */
- public function queryMultiple(array $options = array()) {
-   $multi_query = new SearchApiMultiQuery($this->server, $options);
-   return $multi_query;
- }
- /**
-  * Executes a multi-index search on the server represented by this object.
-  *
-  * Fields are addressed as "INDEX_ID:FIELD" in filters, sorts and facets. The
-  * special fields "search_api_id", "search_api_relevance" and
-  * "search_api_multi_index" are available without a prefix.
-  *
-  * @param SearchApiMultiQueryInterface $query
-  *   The search query to execute.
-  *
-  * @throws SearchApiException
-  *   If an error prevented the search from completing.
-  *
-  * @return array
-  *   An associative array containing the search results, as required by
-  *   SearchApiMultiQueryInterface::execute().
-  */
- public function searchMultiple(SearchApiMultiQueryInterface $query) {
-   $time_method_called = microtime(TRUE);
-   // Get field information
-   $solr_fields = array(
-     'search_api_id' => 'ss_search_api_id',
-     'search_api_relevance' => 'score',
-     'search_api_multi_index' => 'index_id',
-   );
-   $fields = array(
-     'search_api_multi_index' => array(
-       'type' => 'string',
-     ),
-   );
-   foreach ($query->getIndexes() as $index_id => $index) {
-     if (empty($index->options['fields'])) {
-       continue;
-     }
-     $prefix = $index_id . ':';
-     foreach ($this->getFieldNames($index) as $field => $key) {
-       // The special fields defined above are shared by all indexes.
-       if (!isset($solr_fields[$field])) {
-         $solr_fields[$prefix . $field] = $key;
-       }
-     }
-     foreach ($index->options['fields'] as $field => $info) {
-       $fields[$prefix . $field] = $info;
-     }
-   }
-   // Extract keys
-   $keys = $query->getKeys();
-   if (is_array($keys)) {
-     $keys = $this->flattenKeys($keys);
-   }
-   // Set searched fields
-   $search_fields = $query->getFields();
-   $qf = array();
-   foreach ($search_fields as $f) {
-     $qf[] = $solr_fields[$f];
-   }
-   // Extract filters
-   $filter = $query->getFilter();
-   $fq = $this->createFilterQueries($filter, $solr_fields, $fields);
-   // Restrict search to searched indexes.
-   $index_filter = array();
-   foreach ($query->getIndexes() as $index_id => $index) {
-     $index_filter[] = 'index_id:' . SearchApiSolrConnection::phrase($index_id);
-   }
-   $fq[] = implode(' OR ', $index_filter);
-   // Extract sort
-   $sort = array();
-   foreach ($query->getSort() as $f => $order) {
-     $f = $solr_fields[$f];
-     // Fields starting with "ss_" are sorted via a "sort_" field instead.
-     if (substr($f, 0, 3) == 'ss_') {
-       $f = 'sort_' . substr($f, 3);
-     }
-     $order = strtolower($order);
-     $sort[] = "$f $order";
-   }
-   // Get facet fields
-   $facets = $query->getOption('search_api_facets') ? $query->getOption('search_api_facets') : array();
-   $facet_params = $this->getFacetParams($facets, $solr_fields);
-   // Set defaults
-   if (!$keys) {
-     $keys = NULL;
-   }
-   $options = $query->getOptions();
-   $offset = isset($options['offset']) ? $options['offset'] : 0;
-   $limit = isset($options['limit']) ? $options['limit'] : 1000000;
-   // Collect parameters
-   $params = array(
-     'qf' => $qf,
-     'fl' => 'item_id,index_id,score',
-     'fq' => $fq,
-   );
-   if ($sort) {
-     $params['sort'] = implode(', ', $sort);
-   }
-   if (!empty($facet_params['facet.field'])) {
-     $params += $facet_params;
-   }
-   try {
-     // Send search request
-     $time_processing_done = microtime(TRUE);
-     $this->connect();
-     $call_args = array(
-       'query' => &$keys,
-       'offset' => &$offset,
-       'limit' => &$limit,
-       'params' => &$params,
-     );
-     drupal_alter('search_api_solr_multi_query', $call_args, $query);
-     // Retrieve http method from server options.
-     $http_method = !empty($this->options['http_method']) ? $this->options['http_method'] : Apache_Solr_Service::METHOD_POST;
-     $response = $this->solr->search($keys, $offset, $limit, $params, $http_method);
-     $time_query_done = microtime(TRUE);
-     if ($response->getHttpStatus() != 200) {
-       throw new SearchApiException(t('The Solr server responded with status code @status: @msg.',
-         array('@status' => $response->getHttpStatus(), '@msg' => $response->getHttpStatusMessage())));
-     }
-     // Extract results
-     $results = array();
-     $results['result count'] = $response->response->numFound;
-     $results['results'] = array();
-     $tmp = array();
-     foreach ($response->response->docs as $id => $doc) {
-       $result = array(
-         'id' => $doc->item_id,
-         'index_id' => $doc->index_id,
-         'score' => $doc->score,
-       );
-       $excerpt = $this->getExcerpt($response, $id, $tmp, array());
-       if ($excerpt) {
-         $result['excerpt'] = $excerpt;
-       }
-       $results['results'][$id] = $result;
-     }
-     // Extract facets
-     if (isset($response->facet_counts->facet_fields)) {
-       $results['search_api_facets'] = array();
-       $facet_fields = $response->facet_counts->facet_fields;
-       foreach ($facets as $delta => $info) {
-         // Facets on unknown fields were not requested, either.
-         if (empty($solr_fields[$info['field']])) {
-           continue;
-         }
-         // The facet was requested for exactly this Solr field name (see the
-         // getFacetParams() call above), so that is also the name under which
-         // its terms are returned.
-         $field = $solr_fields[$info['field']];
-         if (empty($facet_fields->$field)) {
-           continue;
-         }
-         $min_count = $info['min_count'];
-         $terms = $facet_fields->$field;
-         if ($info['missing']) {
-           // We have to correctly incorporate the "_empty_" term. This will
-           // ensure that the term with the least results is dropped, if the
-           // limit would be exceeded. A limit of 0 means "unlimited", so
-           // nothing is dropped in that case.
-           $terms = (array) $terms;
-           arsort($terms);
-           if ($info['limit'] > 0 && count($terms) > $info['limit']) {
-             array_pop($terms);
-           }
-         }
-         foreach ($terms as $term => $count) {
-           if ($count >= $min_count) {
-             // Compare strictly: a loose comparison would also match the
-             // integer term 0 on older PHP versions.
-             $term = $term === '_empty_' ? '!' : '"' . $term . '"';
-             $results['search_api_facets'][$delta][] = array(
-               'filter' => $term,
-               'count' => $count,
-             );
-           }
-         }
-         // Facets with at most one term are not returned.
-         if (empty($results['search_api_facets'][$delta]) || count($results['search_api_facets'][$delta]) <= 1) {
-           unset($results['search_api_facets'][$delta]);
-         }
-       }
-     }
-     // Compute performance
-     $time_end = microtime(TRUE);
-     $results['performance'] = array(
-       'complete' => $time_end - $time_method_called,
-       'preprocessing' => $time_processing_done - $time_method_called,
-       'execution' => $time_query_done - $time_processing_done,
-       'postprocessing' => $time_end - $time_query_done,
-     );
-     return $results;
-   }
-   catch (Exception $e) {
-     throw new SearchApiException($e->getMessage());
-   }
- }
- //
- // Additional methods that might be used when knowing the service class.
- //
- /**
-  * Pings the Solr server to tell whether it can be accessed.
-  *
-  * Uses the admin/ping request handler.
-  *
-  * @return mixed
-  *   Whatever the ping() method of the Solr connection returns.
-  */
- public function ping() {
-   $this->connect();
-   $ping_result = $this->solr->ping();
-   return $ping_result;
- }
- /**
-  * Sends a commit command to the Solr server.
-  *
-  * Exceptions are not passed on to the caller, but only logged as a warning.
-  *
-  * @return mixed
-  *   The return value of the connection's commit() call, or NULL if the
-  *   commit failed.
-  */
- public function commit() {
-   try {
-     $this->connect();
-     $commit_result = $this->solr->commit(FALSE, FALSE, FALSE);
-     return $commit_result;
-   }
-   catch (Exception $e) {
-     $variables = array(
-       '@name' => $this->server->machine_name,
-       '@msg' => $e->getMessage(),
-     );
-     watchdog('search_api_solr', 'A commit operation for server @name failed: @msg.', $variables, WATCHDOG_WARNING);
-   }
- }
- /**
-  * Schedules a commit operation for this server.
-  *
-  * The commit will be sent at the end of the current page request. Multiple
-  * calls to this method will still only result in one commit operation.
-  */
- public function scheduleCommit() {
-   // Nothing to do if the shutdown function was already registered.
-   if ($this->commitScheduled) {
-     return;
-   }
-   $this->commitScheduled = TRUE;
-   drupal_register_shutdown_function(array($this, 'commit'));
- }
- /**
-  * Retrieves the Solr connection of this server.
-  *
-  * connect() is called first, so the connection is set up before it is
-  * returned.
-  *
-  * @return SearchApiSolrConnection
-  *   The solr connection object used by this server.
-  */
- public function getSolrConnection() {
-   $this->connect();
-   $connection = $this->solr;
-   return $connection;
- }
- /**
-  * Get metadata about fields in the Solr/Lucene index.
-  *
-  * The data is kept in this object and in the cache, under a cache ID that
-  * contains the server's machine name.
-  *
-  * @param boolean $reset
-  *   Reload the cached data?
-  *
-  * @return array
-  *   An array of SearchApiSolrField objects, keyed by field name.
-  */
- public function getFields($reset = FALSE) {
-   $cid = 'search_api_solr:fields:' . $this->server->machine_name;
-   // Unless a refresh was requested, try the cache first if the data hasn't
-   // been retrieved yet.
-   if (!$reset && !isset($this->fields)) {
-     $cache = cache_get($cid);
-     if (isset($cache->data)) {
-       $this->fields = $cache->data;
-     }
-   }
-   // Without cached data, or when refreshing, ask the Solr server for its
-   // schema information and cache it.
-   if ($reset || !isset($this->fields)) {
-     $this->connect();
-     $this->fields = array();
-     $solr_fields = $this->solr->getFields();
-     foreach ($solr_fields as $name => $info) {
-       $this->fields[$name] = new SearchApiSolrField($info);
-     }
-     cache_set($cid, $this->fields);
-   }
-   return $this->fields;
- }
- }
|