|
<?php
|
|
// Project: Web Reference Database (refbase) <http://www.refbase.net>
|
|
// Copyright: Matthias Steffens <mailto:refbase@extracts.de> and the file's
|
|
// original author(s).
|
|
//
|
|
// This code is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY. Please see the GNU General Public
|
|
// License for more details.
|
|
//
|
|
// File: ./includes/srwxml.inc.php
|
|
// Repository: $HeadURL: file:///svn/p/refbase/code/branches/bleeding-edge/includes/srwxml.inc.php $
|
|
// Author(s): Matthias Steffens <mailto:refbase@extracts.de> and
|
|
// Richard Karnesky <mailto:karnesky@gmail.com>
|
|
//
|
|
// Created: 17-May-05, 16:38
|
|
// Modified: $Date: 2017-04-13 02:00:18 +0000 (Thu, 13 Apr 2017) $
|
|
// $Author: karnesky $
|
|
// $Revision: 1416 $
|
|
|
|
// This include file contains functions that'll export records to SRW XML.
|
|
// Requires ActiveLink PHP XML Package, which is available under the GPL from:
|
|
// <http://www.active-link.com/software/>. See 'sru.php' for more info.
|
|
|
|
|
|
// Incorporate some include files:
|
|
include_once 'includes/webservice.inc.php'; // include functions that are commonly used with the refbase webservices
|
|
|
|
// Import the ActiveLink Packages
|
|
require_once("classes/include.php");
|
|
import("org.active-link.xml.XML");
|
|
import("org.active-link.xml.XMLDocument");
|
|
|
|
// --------------------------------------------------------------------
|
|
|
|
// Return DC XML or MODS XML records wrapped into SRW XML ('searchRetrieveResponse'):
|
|
function srwCollection($result, $rowOffset, $showRows, $exportStylesheet, $displayType)
|
|
{
|
|
global $contentTypeCharset; // these variables are defined in 'ini.inc.php'
|
|
global $convertExportDataToUTF8;
|
|
|
|
global $exportFormat; // this is needed so that we can distinguish between "SRW_DC XML" and "SRW_MODS XML" record formats
|
|
|
|
// The array '$transtab_refbase_unicode' contains search & replace patterns
|
|
// for conversion from refbase markup to Unicode entities.
|
|
global $transtab_refbase_unicode; // defined in 'transtab_refbase_unicode.inc.php'
|
|
|
|
global $fieldSpecificSearchReplaceActionsArray;
|
|
|
|
// Individual records are objects and collections of records are strings
|
|
|
|
// Defines field-specific search & replace 'actions' that will be applied to all those refbase fields that are listed in the corresponding 'fields' element:
|
|
// (If you don't want to perform any search and replace actions, specify an empty array, like: '$fieldSpecificSearchReplaceActionsArray = array();'.
|
|
// Note that the search patterns MUST include the leading & trailing slashes -- which is done to allow for mode modifiers such as 'imsxU'.)
|
|
// "/Search Pattern/" => "Replace Pattern"
|
|
$fieldSpecificSearchReplaceActionsArray = array();
|
|
|
|
if ($convertExportDataToUTF8 == "yes")
|
|
$fieldSpecificSearchReplaceActionsArray[] = array('fields' => array("title", "publication", "abbrev_journal", "address", "keywords", "abstract", "orig_title", "series_title", "abbrev_series_title", "notes"),
|
|
'actions' => $transtab_refbase_unicode
|
|
);
|
|
|
|
$srwCollectionDoc = new XMLDocument();
|
|
|
|
if (($convertExportDataToUTF8 == "yes") AND ($contentTypeCharset != "UTF-8"))
|
|
$srwCollectionDoc->setEncoding("UTF-8");
|
|
else
|
|
$srwCollectionDoc->setEncoding($contentTypeCharset);
|
|
|
|
$srwCollection = srwGenerateBaseTags("searchRetrieveResponse");
|
|
|
|
$showRowsOriginal = $showRows; // save original value of '$showRows' (which may get modified by the 'seekInMySQLResultsToOffset()' function below)
|
|
|
|
// Find out how many rows are available and (if there were rows found) seek to the current offset:
|
|
// function 'seekInMySQLResultsToOffset()' is defined in 'include.inc.php'
|
|
list($result, $rowOffset, $showRows, $rowsFound, $previousOffset, $nextOffset, $showMaxRow) = seekInMySQLResultsToOffset($result, $rowOffset, $showRows, $displayType, "");
|
|
|
|
addNewBranch($srwCollection, "srw:numberOfRecords", array(), $rowsFound); // function 'addNewBranch()' is defined in 'webservice.inc.php'
|
|
|
|
// <srw:resultSetId> not supported
|
|
// <srw:resultSetIdleTime> not supported
|
|
|
|
$srwRecordsBranch = new XMLBranch("srw:records");
|
|
|
|
if ($showRowsOriginal != 0) // we omit the records list in the response if the SRU query did contain 'maximumRecords=0'
|
|
{
|
|
$exportArray = array(); // Array for individually exported records
|
|
|
|
// Generate the export for each record and push them onto an array:
|
|
for ($rowCounter=0; (($rowCounter < $showRows) && ($row = @ mysqli_fetch_array($result))); $rowCounter++)
|
|
{
|
|
if (preg_match("/DC/i", $exportFormat)) // export the current record as DC XML (i.e. simple Dublin Core):
|
|
$record = oaidcRecord($row, "srw_dc"); // function 'oaidcRecord()' is defined in 'oaidcxml.inc.php'
|
|
else // by default, we export the current record as MODS XML:
|
|
$record = modsRecord($row); // function 'modsRecord()' is defined in 'modsxml.inc.php'
|
|
|
|
// TODO: build 'extraRecordData' for OAI-PMH (see below) using:
|
|
// $row['serial'], $row['modified_date'], $row['modified_time']
|
|
|
|
if (!empty($record)) // unless the record buffer is empty...
|
|
array_push($exportArray, $record); // ...add it to an array of exports
|
|
}
|
|
|
|
$i = $rowOffset; // initialize counter
|
|
|
|
// for each of the DC/MODS records in the result set...
|
|
foreach ($exportArray as $record)
|
|
{
|
|
++$i; // increment $i by one, then return $i
|
|
|
|
$srwRecordBranch = new XMLBranch("srw:record");
|
|
|
|
if (preg_match("/DC/i", $exportFormat))
|
|
srwGeneratePackingSchema($srwRecordBranch, "xml", "dc");
|
|
else
|
|
srwGeneratePackingSchema($srwRecordBranch, "xml", "mods");
|
|
|
|
$srwRecordDataBranch = new XMLBranch("srw:recordData");
|
|
|
|
if (preg_match("/MODS/i", $exportFormat))
|
|
{
|
|
// NOTE: converting the MODS object into a string to perform search & replace actions
|
|
// may be very clumsy but I don't know any better... ?:-/
|
|
$recordString = $record->getXMLString();
|
|
$recordString = preg_replace('/<mods/i','<mods xmlns="http://www.loc.gov/mods/v3"',$recordString);
|
|
// alternatively to the above line we could add a 'mods:' identifier to all MODS XML tags:
|
|
// $recordString = preg_replace("#<(/)?#","<\\1mods:",$recordString);
|
|
$record->removeAllBranches();
|
|
$record->parseFromString($recordString);
|
|
}
|
|
|
|
$srwRecordDataBranch->addXMLasBranch($record);
|
|
$srwRecordBranch->addXMLBranch($srwRecordDataBranch);
|
|
|
|
// TODO: add 'extraRecordData' for OAI-PMH as explained in <http://www.dlib.org/dlib/february05/sanderson/02sanderson.html>
|
|
// Example:
|
|
// <extraRecordData>
|
|
// <oai:header xmlns:oai="http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
|
|
// <oai:identifier>...</oai:identifier>
|
|
// <oai:datestamp>...</oai:datestamp>
|
|
// <oai:setSpec>...</oai:setSpec>
|
|
// </oai:header>
|
|
// </extraRecordData>
|
|
//
|
|
// Then add to the SRW 'Explain' response:
|
|
// 1. an oai.identifier index containing a unique identifier for each record in the database
|
|
// 2. an oai.datestamp index containing the date/time the record was added or changed in the database
|
|
// 3. an optional oai.set index, browsable via the scan operation, to support selective harvesting of records
|
|
|
|
addNewBranch($srwRecordBranch, "srw:recordPosition", array(), $i);
|
|
|
|
$srwRecordsBranch->addXMLBranch($srwRecordBranch);
|
|
}
|
|
}
|
|
|
|
$srwCollection->addXMLBranch($srwRecordsBranch);
|
|
|
|
if (($showRowsOriginal != 0) && ($showMaxRow < $rowsFound)) // show 'nextRecordPosition' if the SRU query did not contain 'maximumRecords=0' and if there are any remaining records to be displayed
|
|
addNewBranch($srwCollection, "srw:nextRecordPosition", array(), ($showMaxRow + 1));
|
|
|
|
$srwCollectionDoc->setXML($srwCollection);
|
|
$srwCollectionString = $srwCollectionDoc->getXMLString();
|
|
|
|
// Add the XML Stylesheet definition:
|
|
// Note that this is just a hack (that should get fixed) since I don't know how to do it properly using the ActiveLink PHP XML Package ?:-/
|
|
if (!empty($exportStylesheet))
|
|
$srwCollectionString = preg_replace("/(?=\<srw:searchRetrieveResponse)/i","<?xml-stylesheet type=\"text/xsl\" href=\"" . $exportStylesheet . "\"?>\n",$srwCollectionString);
|
|
|
|
return $srwCollectionString;
|
|
}
|
|
|
|
// --------------------------------------------------------------------
|
|
|
|
// return an SRW 'explainResponse' if the SRW/U client issued either of the following:
|
|
// - http://.../refs/sru.php?operation=explain
|
|
// - http://.../refs/sru.php?
|
|
// - http://.../refs/sru.php
|
|
function srwExplainResponse($exportStylesheet)
|
|
{
|
|
global $contentTypeCharset; // these variables are specified in 'ini.inc.php'
|
|
global $databaseBaseURL;
|
|
global $officialDatabaseName;
|
|
global $hostInstitutionName;
|
|
global $feedbackEmail;
|
|
global $logoImageURL;
|
|
global $defaultLanguage;
|
|
global $defaultFeedFormat;
|
|
|
|
global $loc; // defined in 'locales/core.php'
|
|
|
|
$srwCollectionDoc = new XMLDocument();
|
|
$srwCollectionDoc->setEncoding($contentTypeCharset);
|
|
|
|
$srwCollection = srwGenerateBaseTags("explainResponse");
|
|
|
|
$srwRecordBranch = new XMLBranch("srw:record");
|
|
|
|
srwGeneratePackingSchema($srwRecordBranch, "xml", "zeerex");
|
|
|
|
$srwRecordDataBranch = new XMLBranch("srw:recordData");
|
|
|
|
$srwExplainBranch = new XMLBranch("explain");
|
|
$srwExplainBranch->setTagAttribute("xmlns", "http://explain.z3950.org/dtd/2.0/");
|
|
$srwExplainBranch->setTagAttribute("xmlns:refb", "http://refbase.net/");
|
|
|
|
|
|
// extract the protocol from the base URL:
|
|
if (preg_match("#^([^:]+)://.*#",$databaseBaseURL))
|
|
$databaseProtocol = preg_replace("#^([^:]+)://.*#","\\1",$databaseBaseURL);
|
|
else
|
|
$databaseProtocol = "";
|
|
|
|
// extract the host from the base URL:
|
|
if (preg_match("#^[^:]+://(?:www\.)?[^/]+.*#",$databaseBaseURL))
|
|
$databaseHost = preg_replace("#^[^:]+://(?:www\.)?([^/]+).*#","\\1",$databaseBaseURL);
|
|
else
|
|
$databaseHost = $databaseBaseURL;
|
|
|
|
// extract the path on server from the base URL:
|
|
if (preg_match("#^[^:]+://(?:www\.)?[^/]+/.+#",$databaseBaseURL))
|
|
$databasePathOnServer = preg_replace("#^[^:]+://(?:www\.)?[^/]+/(.+)#","\\1",$databaseBaseURL);
|
|
else
|
|
$databasePathOnServer = "";
|
|
|
|
// get the total number of records in the database:
|
|
$recordCount = getTotalNumberOfRecords(); // function 'getTotalNumberOfRecords()' is defined in 'include.inc.php'
|
|
|
|
// get the default number of records per page preferred by the current user:
|
|
$showRows = $_SESSION['userRecordsPerPage'];
|
|
|
|
// get date/time information when the database was last modified:
|
|
$lastModified = getLastModifiedDateTime(); // function 'getLastModifiedDateTime()' is defined in 'include.inc.php'
|
|
|
|
|
|
// --- begin server info ------------------------------------
|
|
$srwServerInfoBranch = new XMLBranch("serverInfo");
|
|
$srwServerInfoBranch->setTagAttribute("protocol", "SRU");
|
|
$srwServerInfoBranch->setTagAttribute("version", "1.1");
|
|
if (!empty($databaseProtocol))
|
|
$srwServerInfoBranch->setTagAttribute("transport", $databaseProtocol);
|
|
|
|
$srwServerInfoBranch->setTagContent($databaseHost, "serverInfo/host");
|
|
$srwServerInfoBranch->setTagContent("80", "serverInfo/port"); // NOTE: this should really be a variable in 'ini.inc.php' or such
|
|
|
|
addNewBranch($srwServerInfoBranch, "database", array("numRecs" => $recordCount, "lastUpdate" => $lastModified), $databasePathOnServer . "sru.php"); // function 'addNewBranch()' is defined in 'webservice.inc.php'
|
|
|
|
// IMPORTANT: if you want to allow remote users who are NOT logged in (userID=0) to query the refbase database
|
|
// via 'sru.php' then either the 'Export' or the 'Batch export' user permission needs to be
|
|
// enabled at 'user_options.php?userID=0'. This will allow export of XML records via 'sru.php'
|
|
// but won't allow a user who isn't logged in to export records via the web interface. However, you
|
|
// should be aware that a direct GET query like 'show.php?author=miller&submit=Export&exportFormat=MODS%20XML'
|
|
// will be also allowed then!
|
|
|
|
// As an alternative, you can provide explicit login information within the 'serverInfo/authentication' tag
|
|
// below. But, obviously, the provided login information should be only given for an account that has the
|
|
// 'Export' permission bit enabled but has otherwise limited access rights!
|
|
|
|
// If the 'authentication' element is present, but empty, then it implies that authentication is required
|
|
// to connect to the server, however there is no publically available login. If it contains a string, then
|
|
// this is the token to give in order to authenticate. Otherwise it may contain three elements:
|
|
// 1. user: The username to supply.
|
|
// 2. group: The group to supply.
|
|
// 3. password: The password to supply.
|
|
// $srwServerInfoAuthenticationBranch = new XMLBranch("authentication");
|
|
// $srwServerInfoAuthenticationBranch->setTagContent("LOGINEMAIL", "authentication/user");
|
|
// $srwServerInfoAuthenticationBranch->setTagContent("PASSWORD", "authentication/password");
|
|
// $srwServerInfoBranch->addXMLBranch($srwServerInfoAuthenticationBranch);
|
|
|
|
$srwExplainBranch->addXMLBranch($srwServerInfoBranch);
|
|
// --- end server info --------------------------------------
|
|
|
|
|
|
// --- begin database info ----------------------------------
|
|
$srwDatabaseInfoBranch = new XMLBranch("databaseInfo");
|
|
|
|
addNewBranch($srwDatabaseInfoBranch, "title", array("lang" => $defaultLanguage, "primary" => "true"), $officialDatabaseName);
|
|
|
|
addNewBranch($srwDatabaseInfoBranch, "description", array("lang" => $defaultLanguage, "primary" => "true"), encodeHTMLspecialchars($loc["ThisDatabaseAttempts"]));
|
|
|
|
$srwDatabaseInfoBranch->setTagContent(encodeHTMLspecialchars($hostInstitutionName), "databaseInfo/author");
|
|
|
|
$srwDatabaseInfoBranch->setTagContent(encodeHTMLspecialchars($hostInstitutionName) . " (" . $feedbackEmail . ")", "databaseInfo/contact");
|
|
|
|
$srwDatabaseImplementationBranch = new XMLBranch("implementation");
|
|
$srwDatabaseImplementationBranch->setTagAttribute("version", "0.9.6");
|
|
$srwDatabaseImplementationBranch->setTagAttribute("identifier", "refbase");
|
|
$srwDatabaseImplementationBranch->setTagContent("Web Reference Database (http://refbase.sourceforge.net)", "implementation/title");
|
|
$srwDatabaseInfoBranch->addXMLBranch($srwDatabaseImplementationBranch);
|
|
|
|
$srwDatabaseLinksBranch = new XMLBranch("links");
|
|
|
|
addNewBranch($srwDatabaseLinksBranch, "link", array("type" => "www"), $databaseBaseURL);
|
|
addNewBranch($srwDatabaseLinksBranch, "link", array("type" => "sru"), $databaseBaseURL . "sru.php");
|
|
addNewBranch($srwDatabaseLinksBranch, "link", array("type" => "rss"), $databaseBaseURL . generateURL("show.php", $defaultFeedFormat, array("where" => 'serial RLIKE ".+"'), true, $showRows)); // function 'generateURL()' is defined in 'include.inc.php'
|
|
addNewBranch($srwDatabaseLinksBranch, "link", array("type" => "icon"), $databaseBaseURL . $logoImageURL);
|
|
|
|
$srwDatabaseInfoBranch->addXMLBranch($srwDatabaseLinksBranch);
|
|
|
|
$srwExplainBranch->addXMLBranch($srwDatabaseInfoBranch);
|
|
// --- end database info ------------------------------------
|
|
|
|
|
|
// --- begin index info -------------------------------------
|
|
$srwIndexInfoBranch = new XMLBranch("indexInfo");
|
|
|
|
addNewBranch($srwIndexInfoBranch, "set", array("identifier" => "info:srw/cql-context-set/1/cql-v1.1", "name" => "cql"), "");
|
|
addNewBranch($srwIndexInfoBranch, "set", array("identifier" => "info:srw/cql-context-set/1/dc-v1.1", "name" => "dc"), "");
|
|
addNewBranch($srwIndexInfoBranch, "set", array("identifier" => "http://zing.z3950.org/cql/bath/2.0/", "name" => "bath"), "");
|
|
addNewBranch($srwIndexInfoBranch, "set", array("identifier" => "info:srw/cql-context-set/2/rec-1.1", "name" => "rec"), "");
|
|
|
|
// TODO: The index info of the refbase explain response should also list the original refbase field names,
|
|
// similar to how the COPAC SRU gateway does it (<http://tweed.lib.ed.ac.uk:8080/elf/search/copac>).
|
|
// Example:
|
|
// <index search="true" scan="false" sort="false">
|
|
// <title>Author</title>
|
|
|
|
// <map>
|
|
// <name>
|
|
// author
|
|
// </name>
|
|
// </map>
|
|
// <map>
|
|
// <name set="dc">
|
|
// creator
|
|
// </name>
|
|
// </map>
|
|
// </index>
|
|
|
|
$indexArray = array(); // TODO: '$indexArray' should be an array of arrays so that it can hold multiple mappings
|
|
|
|
$indexArray["dc.creator"] = array("_set" => "dc",
|
|
"_index" => "creator",
|
|
"_title" => "author(s) of the resource",
|
|
"_refbaseIndex" => "refbase-author");
|
|
|
|
$indexArray["dc.title"] = array("_set" => "dc",
|
|
"_index" => "title",
|
|
"_title" => "publication title of the resource",
|
|
"_refbaseIndex" => "refbase-title");
|
|
|
|
$indexArray["dc.date"] = array("_set" => "dc",
|
|
"_index" => "date",
|
|
"_title" => "year of publication of the resource",
|
|
"_refbaseIndex" => "refbase-year");
|
|
|
|
$indexArray["dc.language"] = array("_set" => "dc",
|
|
"_index" => "language",
|
|
"_title" => "language of the resource",
|
|
"_refbaseIndex" => "refbase-language");
|
|
|
|
$indexArray["dc.description"] = array("_set" => "dc",
|
|
"_index" => "description",
|
|
"_title" => "abstract or summary of the resource",
|
|
"_refbaseIndex" => "refbase-abstract");
|
|
|
|
$indexArray["dc.contributor"] = array("_set" => "dc",
|
|
"_index" => "contributor",
|
|
"_title" => "editor(s) of the resource",
|
|
"_refbaseIndex" => "refbase-editor"); // the mapping dc.contributor <-> refbase-editor might be suboptimal, but probably as best as we can do for now
|
|
|
|
$indexArray["dc.subject"] = array("_set" => "dc",
|
|
"_index" => "subject",
|
|
"_title" => "topic of the resource",
|
|
"_refbaseIndex" => "refbase-keywords");
|
|
|
|
$indexArray["dc.format"] = array("_set" => "dc",
|
|
"_index" => "format",
|
|
"_title" => "physical or digital manifestation of the resource",
|
|
"_refbaseIndex" => "refbase-medium");
|
|
|
|
// Note: Currently, we simply expose the contents of the refbase 'type' field as 'dc.type'.
|
|
// This may not be ideal since it differs from the approved terms that should be used as values for the 'dc.type' element: <http://dublincore.org/documents/dcmi-type-vocabulary/>.
|
|
// However, the document "Using simple Dublin Core to describe eprints" (<http://eprints-uk.rdn.ac.uk/project/docs/simpledc-guidelines/#type>)
|
|
// recommends type values that are much closer (but still not identical) to our own type values.
|
|
$indexArray["dc.type"] = array("_set" => "dc",
|
|
"_index" => "type",
|
|
"_title" => "nature or genre of the resource",
|
|
"_refbaseIndex" => "refbase-type");
|
|
|
|
$indexArray["dc.publisher"] = array("_set" => "dc",
|
|
"_index" => "publisher",
|
|
"_title" => "publisher",
|
|
"_refbaseIndex" => "refbase-publisher");
|
|
|
|
$indexArray["dc.coverage"] = array("_set" => "dc",
|
|
"_index" => "coverage",
|
|
"_title" => "geographic or topographic area of research",
|
|
"_refbaseIndex" => "refbase-area");
|
|
|
|
// Note: I'm note sure, if 'bath.name' (or maybe better: 'bath.personalName') can be also used to describe the author/creator ('dc.creator') of a publication
|
|
// "'Name Search -- Keyword' searches for complete word in headings (or references) for people, corporate bodies, conferences, and geographic names."
|
|
// $indexArray["bath.name"] = array("_set" => "bath",
|
|
// "_index" => "name",
|
|
// "_title" => "author",
|
|
// "_refbaseIndex" => "refbase-author");
|
|
|
|
// Note: Not sure again whether 'bath.topicalSubject' can be offered as synonym for 'dc.subject'
|
|
// "'Topical Subject Search -- Keyword' searches for complete word in a topical subject heading or reference."
|
|
// $indexArray["bath.topicalSubject"] = array("_set" => "bath",
|
|
// "_index" => "topicalSubject",
|
|
// "_title" => "keywords",
|
|
// "_refbaseIndex" => "refbase-keywords");
|
|
|
|
// NOTE: I'm not sure if 'isbn' is a valid name for the Bath Context Set? At least, it's not listed at <http://zing.z3950.org/srw/bath/2.0/#2>.
|
|
// However, 'bath.isbn' is used e.g. by <http://z3950.loc.gov:7090/voyager?operation=explain&version=1.1> and other SRU servers.
|
|
$indexArray["bath.isbn"] = array("_set" => "bath",
|
|
"_index" => "isbn",
|
|
"_title" => "international standard book number",
|
|
"_refbaseIndex" => "refbase-isbn");
|
|
|
|
$indexArray["bath.issn"] = array("_set" => "bath",
|
|
"_index" => "issn",
|
|
"_title" => "international standard serial number",
|
|
"_refbaseIndex" => "refbase-issn");
|
|
|
|
$indexArray["bath.corporateName"] = array("_set" => "bath",
|
|
"_index" => "corporateName",
|
|
"_title" => "corporate author of this publication",
|
|
"_refbaseIndex" => "refbase-corporate_author");
|
|
|
|
$indexArray["bath.conferenceName"] = array("_set" => "bath",
|
|
"_index" => "conferenceName",
|
|
"_title" => "conference this publication was presented at",
|
|
"_refbaseIndex" => "refbase-conference");
|
|
|
|
// NOTE: I'm not sure if 'notes' is a valid name for the Bath Context Set?
|
|
// 'bath.notes' is mentioned at <http://www.loc.gov/z3950/lcserver.html> and <http://zing.z3950.org/srw/bath/2.0/#3>.
|
|
$indexArray["bath.notes"] = array("_set" => "bath",
|
|
"_index" => "notes",
|
|
"_title" => "notes about the resource",
|
|
"_refbaseIndex" => "refbase-notes");
|
|
|
|
$indexArray["rec.identifier"] = array("_set" => "rec",
|
|
"_index" => "identifier",
|
|
"_title" => "database record number",
|
|
"_refbaseIndex" => "refbase-serial");
|
|
|
|
$indexArray["rec.creationDate"] = array("_set" => "rec",
|
|
"_index" => "creationDate",
|
|
"_title" => "date/time at which the record was created",
|
|
"_refbaseIndex" => "refbase-created_date-created_time"); // 'sru.php': CQL search term should get splitted into date & time information!
|
|
|
|
$indexArray["rec.creationAgentName"] = array("_set" => "rec",
|
|
"_index" => "creationAgentName",
|
|
"_title" => "name of the agent responsible for creation of the record",
|
|
"_refbaseIndex" => "refbase-created_by");
|
|
|
|
$indexArray["rec.lastModificationDate"] = array("_set" => "rec",
|
|
"_index" => "lastModificationDate",
|
|
"_title" => "date/time at which the record was last modified",
|
|
"_refbaseIndex" => "refbase-modified_date-modified_time"); // 'sru.php': CQL search term should get splitted into date & time information!
|
|
|
|
$indexArray["rec.lastModificationAgentName"] = array("_set" => "rec",
|
|
"_index" => "lastModificationAgentName",
|
|
"_title" => "name of the agent responsible for last modifying the record",
|
|
"_refbaseIndex" => "refbase-modified_by");
|
|
|
|
$indexArray["bib.citekey"] = array("_set" => "bib",
|
|
"_index" => "citekey",
|
|
"_title" => "user-specific cite key for the record",
|
|
"_refbaseIndex" => "refbase-cite_key");
|
|
|
|
// Not sure how these fields can be mapped:
|
|
// "publication" => "Book title or journal name",
|
|
// "abbrev_journal" => "Abbreviated journal name",
|
|
// "volume" => "Publication volume",
|
|
// "issue" => "Publication issue",
|
|
// "pages" => "Range or total number of pages",
|
|
// "place" => "Place of publication",
|
|
// "series_title" => "Series title", // -> could 'bath.seriesTitle' be used? compare with <http://www.loc.gov/z3950/lcserver.html> and <http://copac.ac.uk/interfaces/srw/>
|
|
// "abbrev_series_title" => "Abbreviated series title",
|
|
// "series_volume" => "Series volume",
|
|
// "series_issue" => "Series issue",
|
|
// "thesis" => "Thesis",
|
|
// "doi" => "Digital object identifier",
|
|
// "url" => "Uniform resource locator",
|
|
|
|
foreach ($indexArray as $indexKey => $index)
|
|
{
|
|
$srwIndexBranch = new XMLBranch("index");
|
|
$srwIndexBranch->setTagAttribute("search", "true");
|
|
$srwIndexBranch->setTagAttribute("scan", "false");
|
|
$srwIndexBranch->setTagAttribute("sort", "false");
|
|
$srwIndexBranch->setTagAttribute("refb:index", $index["_refbaseIndex"]);
|
|
|
|
addNewBranch($srwIndexBranch, "title", array("lang" => "en"), $index["_title"]);
|
|
|
|
$srwIndexMapBranch = new XMLBranch("map");
|
|
|
|
addNewBranch($srwIndexMapBranch, "name", array("set" => $index["_set"]), $index["_index"]);
|
|
|
|
$srwIndexBranch->addXMLBranch($srwIndexMapBranch);
|
|
|
|
$srwIndexInfoBranch->addXMLBranch($srwIndexBranch);
|
|
}
|
|
|
|
$srwExplainBranch->addXMLBranch($srwIndexInfoBranch);
|
|
// --- end index info ---------------------------------------
|
|
|
|
|
|
// --- begin schema info -------------------------------------
|
|
$srwSchemaInfoBranch = new XMLBranch("schemaInfo");
|
|
|
|
// MODS:
|
|
$modsSchemaBranch = new XMLBranch("schema");
|
|
$modsSchemaBranch->setTagAttribute("identifier", "http://www.loc.gov/mods/v3"); // or should 'info:srw/schema/1/mods-v3.2' be used?
|
|
$modsSchemaBranch->setTagAttribute("location", "http://www.loc.gov/standards/mods/v3/mods-3-0.xsd");
|
|
$modsSchemaBranch->setTagAttribute("sort", "false");
|
|
$modsSchemaBranch->setTagAttribute("retrieve", "true");
|
|
$modsSchemaBranch->setTagAttribute("name", "mods");
|
|
|
|
addNewBranch($modsSchemaBranch, "title", array("lang" => "en"), "Metadata Object Description Schema (MODS) v3");
|
|
|
|
$srwSchemaInfoBranch->addXMLBranch($modsSchemaBranch);
|
|
|
|
// Simple Dublin Core (DC):
|
|
$dcSchemaBranch = new XMLBranch("schema");
|
|
$dcSchemaBranch->setTagAttribute("identifier", "http://purl.org/dc/elements/1.1/"); // or should 'info:srw/schema/1/dc-v1.1' be used?
|
|
$dcSchemaBranch->setTagAttribute("location", "http://dublincore.org/schemas/xmls/simpledc20021212.xsd");
|
|
$dcSchemaBranch->setTagAttribute("sort", "false");
|
|
$dcSchemaBranch->setTagAttribute("retrieve", "true");
|
|
$dcSchemaBranch->setTagAttribute("name", "dc");
|
|
|
|
addNewBranch($dcSchemaBranch, "title", array("lang" => "en"), "Simple Dublin Core (DC) v1.1");
|
|
|
|
$srwSchemaInfoBranch->addXMLBranch($dcSchemaBranch);
|
|
|
|
// Simple Dublin Core (OAI_DC):
|
|
// See recommendations for use of simple Dublin Core metadata to describe eprints in eprint archives: <http://eprints-uk.rdn.ac.uk/project/docs/simpledc-guidelines/>
|
|
// Example SRW+DC output from LoC: <http://z3950.loc.gov:7090/voyager?query=dc.creator+%3D+%22miller%22&version=1.1&operation=searchRetrieve&recordSchema=dc&startRecord=1&maximumRecords=10>
|
|
// $oaidcSchemaBranch = new XMLBranch("schema");
|
|
// $oaidcSchemaBranch->setTagAttribute("identifier", "http://www.openarchives.org/OAI/2.0/oai_dc/");
|
|
// $oaidcSchemaBranch->setTagAttribute("location", "http://www.openarchives.org/OAI/2.0/oai_dc.xsd");
|
|
// $oaidcSchemaBranch->setTagAttribute("sort", "false");
|
|
// $oaidcSchemaBranch->setTagAttribute("retrieve", "true");
|
|
// $oaidcSchemaBranch->setTagAttribute("name", "oai_dc");
|
|
//
|
|
// addNewBranch($oaidcSchemaBranch, "title", array("lang" => "en"), "Simple Dublin Core for OAI-PMH (OAI_DC)");
|
|
//
|
|
// $srwSchemaInfoBranch->addXMLBranch($oaidcSchemaBranch);
|
|
|
|
$srwExplainBranch->addXMLBranch($srwSchemaInfoBranch);
|
|
// --- end schema info ---------------------------------------
|
|
|
|
|
|
// --- begin config info -------------------------------------
|
|
$srwConfigInfoBranch = new XMLBranch("configInfo");
|
|
|
|
// default:
|
|
addNewBranch($srwConfigInfoBranch, "default", array("type" => "retrieveSchema"), "mods");
|
|
addNewBranch($srwConfigInfoBranch, "default", array("type" => "numberOfRecords"), $showRows);
|
|
addNewBranch($srwConfigInfoBranch, "default", array("type" => "stylesheet"), $databaseBaseURL . "srwmods2html.xsl");
|
|
addNewBranch($srwConfigInfoBranch, "default", array("type" => "contextSet"), "cql");
|
|
addNewBranch($srwConfigInfoBranch, "default", array("type" => "index"), "cql.serverChoice");
|
|
addNewBranch($srwConfigInfoBranch, "default", array("type" => "relation"), "all");
|
|
|
|
// setting:
|
|
addNewBranch($srwConfigInfoBranch, "setting", array("type" => "sortSchema"), "identifier");
|
|
addNewBranch($srwConfigInfoBranch, "setting", array("type" => "recordPacking"), "xml");
|
|
|
|
// supports:
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "proximity"), "false");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "resultSets"), "false");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "relationModifier"), "false");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "booleanModifier"), "false"); // TODO: set to 'true' when Rob's CQL-PHP has been implemented successfully
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "sort"), "false");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "maskingCharacter"), "true");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "anchoring"), "true");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "emptyTerm"), "false");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "recordXPath"), "false");
|
|
addNewBranch($srwConfigInfoBranch, "supports", array("type" => "scan"), "false");
|
|
|
|
$srwExplainBranch->addXMLBranch($srwConfigInfoBranch);
|
|
// --- end config info ---------------------------------------
|
|
|
|
|
|
$srwRecordDataBranch->addXMLBranch($srwExplainBranch);
|
|
|
|
$srwRecordBranch->addXMLBranch($srwRecordDataBranch);
|
|
|
|
$srwCollection->addXMLBranch($srwRecordBranch);
|
|
|
|
$srwCollectionDoc->setXML($srwCollection);
|
|
$srwCollectionString = $srwCollectionDoc->getXMLString();
|
|
|
|
// Add the XML Stylesheet definition:
|
|
// Note that this is just a hack (that should get fixed) since I don't know how to do it properly using the ActiveLink PHP XML Package ?:-/
|
|
if (!empty($exportStylesheet))
|
|
$srwCollectionString = preg_replace("/(?=\<srw:explainResponse)/i","<?xml-stylesheet type=\"text/xsl\" href=\"" . $exportStylesheet . "\"?>\n",$srwCollectionString);
|
|
|
|
return $srwCollectionString;
|
|
}
|
|
|
|
// --------------------------------------------------------------------
|
|
|
|
// Return SRW diagnostics (i.e. SRW error information) wrapped into SRW XML ('searchRetrieveResponse'):
|
|
function srwDiagnostics($diagCode, $diagDetails, $exportStylesheet)
|
|
{
|
|
global $contentTypeCharset; // defined in 'ini.inc.php'
|
|
|
|
// Map SRU/W diagnostic numbers to their corresponding messages:
|
|
$diagMessages = mapSRWDiagnostics(); // function 'mapSRWDiagnostics()' is defined in 'webservice.inc.php'
|
|
|
|
if (isset($diagMessages[$diagCode]))
|
|
$diagMessage = $diagMessages[$diagCode];
|
|
else
|
|
$diagMessage = "Unknown error";
|
|
|
|
$srwCollectionDoc = new XMLDocument();
|
|
$srwCollectionDoc->setEncoding($contentTypeCharset);
|
|
|
|
$srwCollection = srwGenerateBaseTags("searchRetrieveResponse");
|
|
|
|
$diagnosticsBranch = new XMLBranch("srw:diagnostics");
|
|
|
|
// since we've defined the 'diag' namespace in the <searchRetrieveResponse> element (see function 'srwGenerateBaseTags()'),
|
|
// we can simply use '<diag:diagnostic>' below; otherwise we should use '<diagnostic xmlns="http://www.loc.gov/zing/srw/diagnostic/">':
|
|
// addNewBranch($diagnosticsBranch, "diagnostic", array("xmlns" => "http://www.loc.gov/zing/srw/diagnostic/"), "");
|
|
|
|
$diagnosticsBranch->setTagContent("info:srw/diagnostic/1/" . $diagCode, "srw:diagnostics/diag:diagnostic/uri");
|
|
$diagnosticsBranch->setTagContent($diagMessage, "srw:diagnostics/diag:diagnostic/message");
|
|
if (!empty($diagDetails))
|
|
$diagnosticsBranch->setTagContent(encodeHTMLspecialchars($diagDetails), "srw:diagnostics/diag:diagnostic/details");
|
|
|
|
$srwCollection->addXMLBranch($diagnosticsBranch);
|
|
|
|
$srwCollectionDoc->setXML($srwCollection);
|
|
$srwCollectionString = $srwCollectionDoc->getXMLString();
|
|
|
|
// Add the XML Stylesheet definition:
|
|
// Note that this is just a hack (that should get fixed) since I don't know how to do it properly using the ActiveLink PHP XML Package ?:-/
|
|
if (!empty($exportStylesheet))
|
|
$srwCollectionString = preg_replace("/(?=\<srw:searchRetrieveResponse)/i","<?xml-stylesheet type=\"text/xsl\" href=\"" . $exportStylesheet . "\"?>\n",$srwCollectionString);
|
|
|
|
return $srwCollectionString;
|
|
}
|
|
|
|
// --------------------------------------------------------------------
|
|
|
|
// Generate the basic SRW XML tree required for a 'searchRetrieveResponse' or 'explainResponse':
|
|
function srwGenerateBaseTags($srwOperation)
|
|
{
|
|
global $exportFormat; // this is needed so that we can distinguish between "SRW_DC XML" and "SRW_MODS XML" record formats
|
|
|
|
$srwCollection = new XML("srw:" . $srwOperation);
|
|
$srwCollection->setTagAttribute("xmlns:srw", "http://www.loc.gov/zing/srw/");
|
|
|
|
if ($srwOperation == "searchRetrieveResponse")
|
|
{
|
|
$srwCollection->setTagAttribute("xmlns:diag", "http://www.loc.gov/zing/srw/diagnostic/");
|
|
$srwCollection->setTagAttribute("xmlns:xcql", "http://www.loc.gov/zing/cql/xcql/");
|
|
|
|
if (preg_match("/DC/i", $exportFormat)) // add namespace declarations for "SRW_DC XML":
|
|
{
|
|
$srwCollection->setTagAttribute("xmlns:srw_dc", "info:srw/schema/1/dc-v1.1");
|
|
$srwCollection->setTagAttribute("xmlns:dc", "http://purl.org/dc/elements/1.1/");
|
|
$srwCollection->setTagAttribute("xmlns:prism", "http://prismstandard.org/namespaces/1.2/basic/");
|
|
}
|
|
else // add namespace declarations for "SRW_MODS XML":
|
|
$srwCollection->setTagAttribute("xmlns:mods", "http://www.loc.gov/mods/v3");
|
|
}
|
|
// elseif ($srwOperation == "explainResponse")
|
|
// {
|
|
// $srwCollection->setTagAttribute("xmlns:zr", "http://explain.z3950.org/dtd/2.0/");
|
|
// }
|
|
|
|
addNewBranch($srwCollection, "srw:version", array(), "1.1"); // function 'addNewBranch()' is defined in 'webservice.inc.php'
|
|
|
|
return $srwCollection;
|
|
}
|
|
|
|
// --------------------------------------------------------------------
|
|
|
|
// Generate the basic SRW XML elements 'recordPacking' and 'recordSchema':
|
|
function srwGeneratePackingSchema(&$thisObject, $srwPacking, $srwSchema)
|
|
{
|
|
// available schemas taken from <http://www.loc.gov/z3950/agency/zing/srw/record-schemas.html>
|
|
$srwSchemas = array("dc" => "info:srw/schema/1/dc-v1.1", // or should <http://purl.org/dc/elements/1.1/> be used?
|
|
// "dcterms" => "http://purl.org/dc/terms/",
|
|
"diag" => "info:srw/schema/1/diagnostic-v1.1", // it says 'info:srw/schema/1/diagnostics-v1.1' at <http://www.loc.gov/standards/sru/diagnostics.html> ?:-/
|
|
"zeerex" => "http://explain.z3950.org/dtd/2.0/",
|
|
"mods" => "info:srw/schema/1/mods-v3.2",
|
|
"onix" => "info:srw/schema/1/onix-v2.0",
|
|
"marcxml" => "info:srw/schema/1/marcxml-v1.1",
|
|
"ead" => "info:srw/schema/1/ead-2002",
|
|
"zthes" => "http://zthes.z3950.org/xml/0.5/",
|
|
"ccg" => "http://srw.cheshire3.org/schemas/ccg/1.0/",
|
|
"rec" => "info:srw/schema/2/rec-1.0",
|
|
"server-choice" => "info:srw/schema/1/server-choice",
|
|
"xpath" => "info:srw/schema/1/xpath-1.0");
|
|
|
|
addNewBranch($thisObject, "srw:recordPacking", array(), $srwPacking); // function 'addNewBranch()' is defined in 'webservice.inc.php'
|
|
addNewBranch($thisObject, "srw:recordSchema", array(), $srwSchemas[$srwSchema]);
|
|
}
|
|
|
|
// --------------------------------------------------------------------
|
|
?>
|