/** * Return fields to be indexed in Solr (an alternative to an XSL transformation) * * @return string[] */ public function toSolrArray() { $data = parent::toSolrArray(); if (empty($data['author'])) { $data['author'] = $data['author_fuller'] = $data['author-letter'] = $this->getFieldSubfields('110', ['a' => 1]); } $key = array_search($data['author'], $data['author2']); if ($key !== false) { unset($data['author2'][$key]); } if (isset($data['publishDate'])) { $data['main_date_str'] = MetadataUtils::extractYear($data['publishDate'][0]); $data['main_date'] = $this->validateDate($data['main_date_str'] . '-01-01T00:00:00Z'); } if ($range = $this->getPublicationDateRange()) { $data['search_sdaterange_mv'][] = $data['publication_sdaterange'] = MetadataUtils::dateRangeToNumeric($range); $data['search_daterange_mv'][] = $data['publication_daterange'] = MetadataUtils::dateRangeToStr($range); } $data['publication_place_txt_mv'] = MetadataUtils::arrayTrim($this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '260', ['a' => 1]]]), ' []'); $data['subtitle_lng_str_mv'] = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '041', ['j' => 1]], [MarcRecord::GET_NORMAL, '979', ['j' => 1]]], false, true, true); $data['original_lng_str_mv'] = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '041', ['h' => 1]], [MarcRecord::GET_NORMAL, '979', ['i' => 1]]], false, true, true); // 979cd = component part authors // 900, 910, 911 = Finnish reference field foreach ($this->getFieldsSubfields([[MarcRecord::GET_BOTH, '979', ['c' => 1]], [MarcRecord::GET_BOTH, '979', ['d' => 1]], [MarcRecord::GET_BOTH, '900', ['a' => 1]], [MarcRecord::GET_BOTH, '910', ['a' => 1, 'b' => 1]], [MarcRecord::GET_BOTH, '911', ['a' => 1, 'e' => 1]]], false, true, true) as $field) { $data['author2'][] = $field; } $key = array_search($data['author'], $data['author2']); if ($key !== false) { unset($data['author2'][$key]); } $data['author2'] = array_filter(array_values($data['author2'])); $data['title_alt'] = array_values(array_unique($this->getFieldsSubfields([[MarcRecord::GET_ALT, '245', ['a' => 1, 'b' => 1]], [MarcRecord::GET_BOTH, '130', ['a' => 1, 'd' => 1, 'f' => 1, 'g' => 1, 'h' => 1, 'k' => 1, 'l' => 1, 'n' => 1, 'p' => 1, 'r' => 1, 's' => 1, 't' => 1]], [MarcRecord::GET_BOTH, '240', ['a' => 1, 'd' => 1, 'f' => 1, 'g' => 1, 'k' => 1, 'l' => 1, 'n' => 1, 'p' => 1, 'r' => 1, 's' => 1]], [MarcRecord::GET_BOTH, '243', ['a' => 1, 'd' => 1, 'f' => 1, 'g' => 1, 'h' => 1, 'k' => 1, 'l' => 1, 'm' => 1, 'n' => 1, 'o' => 1, 'p' => 1, 'r' => 1, 's' => 1]], [MarcRecord::GET_BOTH, '246', ['a' => 1, 'b' => 1, 'g' => 1]], [MarcRecord::GET_BOTH, '700', ['t' => 1, 'm' => 1, 'r' => 1, 'h' => 1, 'i' => 1, 'g' => 1, 'n' => 1, 'p' => 1, 's' => 1, 'l' => 1, 'o' => 1, 'k' => 1], ['t' => 1]], [MarcRecord::GET_BOTH, '730', ['a' => 1, 'd' => 1, 'f' => 1, 'g' => 1, 'h' => 1, 'i' => 1, 'k' => 1, 'l' => 1, 'm' => 1, 'n' => 1, 'o' => 1, 'p' => 1, 'r' => 1, 's' => 1, 't' => 1]], [MarcRecord::GET_BOTH, '740', ['a' => 1]], [MarcRecord::GET_BOTH, '979', ['b' => 1]], [MarcRecord::GET_BOTH, '979', ['e' => 1]], [MarcRecord::GET_BOTH, '940', ['a' => 1]]]))); // Location coordinates $field = $this->getField('034'); if ($field) { $westOrig = $this->getSubfield($field, 'd'); $eastOrig = $this->getSubfield($field, 'e'); $northOrig = $this->getSubfield($field, 'f'); $southOrig = $this->getSubfield($field, 'g'); $west = MetadataUtils::coordinateToDecimal($westOrig); $east = MetadataUtils::coordinateToDecimal($eastOrig); $north = MetadataUtils::coordinateToDecimal($northOrig); $south = MetadataUtils::coordinateToDecimal($southOrig); if (!is_nan($west) && !is_nan($north)) { if ($west < -180 || $west > 180 || ($north < -90 || $north > 90)) { global $logger; $logger->log('NdlMarcRecord', "Discarding invalid coordinates {$west},{$north} decoded from " . "w={$westOrig}, e={$eastOrig}, n={$northOrig}, s={$southOrig}, " . "record {$this->source}." . $this->getID(), Logger::WARNING); } else { if (!is_nan($east) && !is_nan($south)) { if ($east < -180 || $east > 180 || $south < -90 || $south > 90) { global $logger; $logger->log('NdlMarcRecord', "Discarding invalid coordinates {$east},{$south} " . "decoded from w={$westOrig}, e={$eastOrig}, " . "n={$northOrig}, s={$southOrig}, record " . "{$this->source}." . $this->getID(), Logger::WARNING); } else { // Try to cope with weird coordinate order if ($north > $south) { list($north, $south) = [$south, $north]; } if ($west > $east) { list($west, $east) = [$east, $west]; } $data['location_geo'] = "ENVELOPE({$west}, {$east}, {$south}, {$north})"; } } else { $data['location_geo'] = "POINT({$west} {$north})"; } } } } // Classifications foreach ($this->getFields('080') as $field080) { $classification = trim($this->getSubfield($field080, 'a')); $classification .= trim($this->getSubfield($field080, 'b')); if ($classification) { $aux = $this->getSubfields($field080, ['x' => 1]); if ($aux) { $classification .= " {$aux}"; } $data['classification_txt_mv'][] = "udk {$classification}"; } } $dlc = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '050', ['a' => 1, 'b' => 1]]]); foreach ($dlc as $classification) { $data['classification_txt_mv'][] = 'dlc ' . mb_strtolower(str_replace(' ', '', $classification), 'UTF-8'); } foreach ($this->getFields('084') as $field) { $source = $this->getSubfield($field, '2'); $classification = $this->getSubfields($field, ['a' => 1, 'b' => 1]); if ($source) { $data['classification_txt_mv'][] = "{$source} " . mb_strtolower(str_replace(' ', '', $classification), 'UTF-8'); } } if (isset($data['classification_txt_mv'])) { $data['allfields'] = array_merge($data['allfields'], $data['classification_txt_mv']); } // Keep classification_str_mv for backward-compatibility for now if (isset($data['classification_txt_mv'])) { $data['classification_str_mv'] = $data['classification_txt_mv']; } // Ebrary location $ebraryLocs = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '035', ['a' => 1]]]); foreach ($ebraryLocs as $field) { if (strncmp($field, 'ebr', 3) == 0 && is_numeric(substr($field, 3))) { if (!isset($data['building']) || !in_array('EbraryDynamic', $data['building'])) { $data['building'][] = 'EbraryDynamic'; } } } // Topics if (strncmp($this->source, 'metalib', 7) == 0) { $field653 = $this->getFieldsSubfields([[MarcRecord::GET_BOTH, '653', ['a' => 1]]]); $data['topic'] = array_merge($data['topic'], $field653); $data['topic_facet'] = array_merge($data['topic_facet'], $field653); } // Original Study Number $data['ctrlnum'] = array_merge($data['ctrlnum'], $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '036', ['a' => 1]]])); // Source $data['source_str_mv'] = $this->source; $data['datasource_str_mv'] = [$this->source]; // ISSN $data['issn'] = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '022', ['a' => 1]]]); foreach ($data['issn'] as &$value) { $value = str_replace('-', '', $value); } $data['other_issn_str_mv'] = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '440', ['x' => 1]], [MarcRecord::GET_NORMAL, '480', ['x' => 1]], [MarcRecord::GET_NORMAL, '730', ['x' => 1]], [MarcRecord::GET_NORMAL, '776', ['x' => 1]]]); foreach ($data['other_issn_str_mv'] as &$value) { $value = str_replace('-', '', $value); } $data['linking_issn_str_mv'] = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '022', ['l' => 1]]]); foreach ($data['linking_issn_str_mv'] as &$value) { $value = str_replace('-', '', $value); } // URLs $fields = $this->getFields('856'); foreach ($fields as $field) { $ind2 = $this->getIndicator($field, 2); $sub3 = $this->getSubfield($field, 3); if (($ind2 == '0' || $ind2 == '1') && !$sub3) { $url = trim($this->getSubfield($field, 'u')); if (!$url) { continue; } // Require at least one dot surrounded by valid characters or a // familiar scheme if (!preg_match('/[A-Za-z0-9]\\.[A-Za-z0-9]/', $url) && !preg_match('/^(http|ftp)s?:\\/\\//', $url)) { continue; } $data['online_boolean'] = true; $data['online_str_mv'] = $this->source; $linkText = $this->getSubfield($field, 'y'); if (!$linkText) { $linkText = $this->getSubfield($field, 'z'); } $link = ['url' => $this->getSubfield($field, 'u'), 'text' => $linkText, 'source' => $this->source]; $data['online_urls_str_mv'][] = json_encode($link); } } // Holdings $data['holdings_txtP_mv'] = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '852', ['a' => 1, 'b' => 1, 'h' => 1, 'z' => 1]]]); if (!empty($data['holdings_txtP_mv'])) { $updateFunc = function (&$val, $k, $source) { $val .= " {$source}"; }; array_walk($data['holdings_txtP_mv'], $updateFunc, $this->source); } // Access restrictions if ($restrictions = $this->getAccessRestrictions()) { $data['restricted_str'] = $restrictions; } // ISMN foreach ($this->getFields('024') as $field024) { if ($this->getIndicator($field024, 1) == '2') { $ismn = $this->getSubfield($field024, 'a'); $ismn = str_replace('-', '', $ismn); if (!preg_match('{([0-9]{13})}', $ismn, $matches)) { continue; } $data['ismn_isn_mv'] = $matches[1]; } } // Project ID in 960 (Fennica) if ($this->getDriverParam('projectIdIn960', false)) { $data['project_id_str_mv'] = $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '960', ['a' => 1]]]); } // Hierarchical Categories (MetaLib) foreach ($this->getFields('976') as $field976) { $category = $this->getSubfield($field976, 'a'); $category = trim(str_replace(['/', '\\'], '', $category), " -\t\n\r\v"); if (!$category) { continue; } $sub = $this->getSubfield($field976, 'b'); $sub = trim(str_replace(['/', '\\'], '', $sub), " -\t\n\r\v"); if ($sub) { $category .= "/{$sub}"; } $data['category_str_mv'][] = $category; } // Hierarchical categories (e.g. SFX) if ($this->getDriverParam('categoriesIn650', false)) { foreach ($this->getFields('650') as $field650) { $category = $this->getSubfield($field650, 'a'); $category = trim(str_replace(['/', '\\'], '', $category)); if (!$category) { continue; } $sub = $this->getSubfield($field650, 'x'); $sub = trim(str_replace(['/', '\\'], '', $sub)); if ($sub) { $category .= "/{$sub}"; } $data['category_str_mv'][] = $category; } } // Call numbers $data['callnumber-first'] = strtoupper(str_replace(' ', '', $this->getFirstFieldSubfields([[MarcRecord::GET_NORMAL, '080', ['a' => 1, 'b' => 1]], [MarcRecord::GET_NORMAL, '084', ['a' => 1, 'b' => 1]], [MarcRecord::GET_NORMAL, '050', ['a' => 1, 'b' => 1]]]))); $data['callnumber-raw'] = array_map('strtoupper', $this->getFieldsSubfields([[MarcRecord::GET_NORMAL, '080', ['a' => 1, 'b' => 1]], [MarcRecord::GET_NORMAL, '084', ['a' => 1, 'b' => 1]], [MarcRecord::GET_NORMAL, '050', ['a' => 1, 'b' => 1]]])); $data['callnumber-sort'] = empty($data['callnumber-raw']) ? '' : $data['callnumber-raw'][0]; // Legacy callnumber fields. TODO: Remove when VuFind 1 is gone. $data['callnumber'] = strtoupper(str_replace(' ', '', $this->getFirstFieldSubfields([[MarcRecord::GET_NORMAL, '080', ['a' => 1, 'b' => 1]], [MarcRecord::GET_NORMAL, '084', ['a' => 1, 'b' => 1]], [MarcRecord::GET_NORMAL, '050', ['a' => 1, 'b' => 1]]]))); $data['callnumber-a'] = $this->getFirstFieldSubfields([[MarcRecord::GET_NORMAL, '080', ['a' => 1]], [MarcRecord::GET_NORMAL, '084', ['a' => 1]], [MarcRecord::GET_NORMAL, '050', ['a' => 1]]]); $data['callnumber-first-code'] = substr($data['callnumber-a'], 0, 1); return $data; }