001 //$HeadURL: svn+ssh://rbezema@svn.wald.intevation.org/deegree/base/tags/2.1/src/org/deegree/ogcwebservices/csw/manager/CSWProfileHarvester.java $
002 /*---------------- FILE HEADER ------------------------------------------
003
004 This file is part of deegree.
005 Copyright (C) 2001-2006 by:
006 EXSE, Department of Geography, University of Bonn
007 http://www.giub.uni-bonn.de/deegree/
008 lat/lon GmbH
009 http://www.lat-lon.de
010
011 This library is free software; you can redistribute it and/or
012 modify it under the terms of the GNU Lesser General Public
013 License as published by the Free Software Foundation; either
014 version 2.1 of the License, or (at your option) any later version.
015
016 This library is distributed in the hope that it will be useful,
017 but WITHOUT ANY WARRANTY; without even the implied warranty of
018 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
019 Lesser General Public License for more details.
020
021 You should have received a copy of the GNU Lesser General Public
022 License along with this library; if not, write to the Free Software
023 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
024
025 Contact:
026
027 Andreas Poth
028 lat/lon GmbH
029 Aennchenstr. 19
030 53115 Bonn
031 Germany
032 E-Mail: poth@lat-lon.de
033
034 Prof. Dr. Klaus Greve
035 Department of Geography
036 University of Bonn
037 Meckenheimer Allee 166
038 53115 Bonn
039 Germany
040 E-Mail: greve@giub.uni-bonn.de
041
042
043 ---------------------------------------------------------------------------*/
044 package org.deegree.ogcwebservices.csw.manager;
045
046 import java.io.IOException;
047 import java.net.MalformedURLException;
048 import java.net.URI;
049 import java.net.URL;
050 import java.util.Date;
051 import java.util.Iterator;
052 import java.util.List;
053
054 import org.deegree.framework.log.ILogger;
055 import org.deegree.framework.log.LoggerFactory;
056 import org.deegree.framework.util.FileUtils;
057 import org.deegree.framework.util.StringTools;
058 import org.deegree.framework.xml.XMLFragment;
059 import org.deegree.framework.xml.XMLParsingException;
060 import org.deegree.framework.xml.XMLTools;
061 import org.deegree.ogcwebservices.csw.manager.HarvestRepository.ResourceType;
062 import org.xml.sax.SAXException;
063
064 /**
065 * Harverster implementation for harvesting single metadata documents.
066 *
067 *
068 * @version $Revision: 7601 $
069 * @author <a href="mailto:poth@lat-lon.de">Andreas Poth</a>
070 * @author last edited by: $Author: apoth $
071 *
072 * @version 1.0. $Revision: 7601 $, $Date: 2007-06-20 10:23:45 +0200 (Mi, 20 Jun 2007) $
073 *
074 * @since 2.0
075 */
076 public class CSWProfileHarvester extends AbstractHarvester {
077
078 private static final ILogger LOG = LoggerFactory.getLogger( CSWProfileHarvester.class );
079
080 private static CSWProfileHarvester ch = null;
081
082 /**
083 * singelton
084 *
085 * @return
086 */
087 public static CSWProfileHarvester getInstance() {
088 if ( ch == null ) {
089 ch = new CSWProfileHarvester();
090 }
091 return ch;
092 }
093
094 @Override
095 public void run() {
096 LOG.logDebug( "starting harvest iteration for CSWProfileHarvester." );
097 try {
098 HarvestRepository repository = HarvestRepository.getInstance();
099
100 List<URI> sources = repository.getSources();
101 for ( Iterator iter = sources.iterator(); iter.hasNext(); ) {
102 URI source = (URI) iter.next();
103 try {
104 // determine if source shall be harvested
105 if ( shallHarvest( source, ResourceType.csw_profile ) ) {
106 HarvestProcessor processor = new HarvestProcessor( this, source );
107 processor.start();
108 }
109 } catch ( Exception e ) {
110 LOG.logError( "Exception harvesting service: " + source, e );
111 informResponseHandlers( source, e );
112 }
113 }
114 } catch ( Exception e ) {
115 LOG.logError( "generell Exception harvesting services", e );
116 }
117
118 }
119
120 /**
121 * inner class for processing asynchronous harvesting of a csw:profile metadata document
122 *
123 * @version $Revision: 7601 $
124 * @author <a href="mailto:poth@lat-lon.de">Andreas Poth</a>
125 * @author last edited by: $Author: apoth $
126 *
127 * @version 1.0. $Revision: 7601 $, $Date: 2007-06-20 10:23:45 +0200 (Mi, 20 Jun 2007) $
128 *
129 * @since 2.0
130 */
131 protected class HarvestProcessor extends AbstractHarvestProcessor {
132
133 HarvestProcessor( AbstractHarvester owner, URI source ) {
134 super( owner, source );
135 }
136
137 @Override
138 public void run() {
139 try {
140 HarvestRepository repository = HarvestRepository.getInstance();
141 XMLFragment metaData = accessMetadata( source );
142 Date harvestingTimestamp = repository.getNextHarvestingTimestamp( source );
143 String trans = null;
144 // ensure that a resource just will be harvested if something has changed
145 if ( shallHarvest( source, ResourceType.csw_profile ) ) {
146 if ( repository.getLastHarvestingTimestamp( source ) == null ) {
147 trans = createInsertRequest( metaData );
148 } else {
149 trans = createUpdateRequest( getID( metaData ), getIdentifierXPath( metaData ), metaData );
150 }
151 performTransaction( trans );
152
153 long ts = repository.getHarvestInterval( source );
154 if ( ts <= 0 ) {
155 // if the harvest interval is less or equal to 0 the source
156 // shall just be harvested for one time and it will be
157 // removed from harvest cache db
158 informResponseHandlers( source );
159 repository.dropRequest( source );
160 } else {
161 // update timestamps just if transaction has been performed
162 // successfully
163 writeLastHarvestingTimestamp( source, harvestingTimestamp );
164 writeNextHarvestingTimestamp( source, harvestingTimestamp );
165 informResponseHandlers( source );
166 }
167 }
168
169 } catch ( Exception e ) {
170 e.printStackTrace();
171 LOG.logError( "could not perform harvest operation for source: " + source, e );
172 try {
173 owner.informResponseHandlers( source, e );
174 } catch ( Exception ee ) {
175 ee.printStackTrace();
176 }
177 }
178 }
179
180 /**
181 * returns the XPath the metadata records identifier
182 *
183 * @param metaData
184 * @return the XPath the metadata records identifier
185 */
186 private String getIdentifierXPath( XMLFragment metaData ) {
187 String xpath = "iso19115:fileIdentifier/smXML:CharacterString";
188 if ( metaData != null ) {
189 String nspace = metaData.getRootElement().getNamespaceURI();
190 nspace = StringTools.replace( nspace, "http://", "", true );
191 xpath = Messages.getString( "Identifier_" + nspace );
192 }
193 return xpath;
194 }
195
196 /**
197 * returns the identifier of a metadata record to enable its update
198 *
199 * @param metaData
200 * @return the identifier of a metadata record to enable its update
201 * @throws XMLParsingException
202 */
203 private String getID( XMLFragment metaData )
204 throws XMLParsingException {
205 String xpath = getIdentifierXPath( metaData );
206 String fileIdentifier = XMLTools.getRequiredNodeAsString( metaData.getRootElement(), xpath, nsc );
207 return fileIdentifier;
208 }
209
210 @Override
211 protected String createConstraint( String identifier, String xPath )
212 throws IOException {
213
214 // read template from file
215 // TODO
216 // read different templates depending on metadata format
217 URL url = CatalogueHarvester.class.getResource( "iso09_constraints_template.xml" );
218 String constraints = FileUtils.readTextFile( url ).toString();
219
220 constraints = StringTools.replace( constraints, "$identifier$", identifier, false );
221
222 return StringTools.replace( constraints, "$xPath$", xPath, false );
223
224 }
225
226 /**
227 *
228 * @param source
229 * @return
230 * @throws SAXException
231 * @throws IOException
232 * @throws MalformedURLException
233 */
234 private XMLFragment accessMetadata( URI source )
235 throws MalformedURLException, IOException, SAXException {
236
237 XMLFragment xml = new XMLFragment();
238 xml.load( source.toURL() );
239 return xml;
240 }
241
242 }
243
244 }