blob: 4703c41da815c3e3df8cb34ce1fb610893782233 [file] [log] [blame]
/*********************************************************************************************************************
* Copyright (c) 2008, 2011 Attensity Europe GmbH and brox IT Solutions GmbH. All rights reserved. This program and the
* accompanying materials are made available under the terms of the Eclipse Public License v1.0 which accompanies this
* distribution, and is available at http://www.eclipse.org/legal/epl-v10.html
**********************************************************************************************************************/
package org.eclipse.smila.importing.crawler.web;
import java.util.Collection;
import org.eclipse.smila.datamodel.Record;
/**
* Produces resulting records from fetched input record. Implementations may map the fetched attributes of the input
* record to output record attributes. It's also possible to split the input record to multiple output records, or to
* filter out the input record and return an empty result.
*/
public interface RecordProducer {
/** @return collection of records, maybe empty. May also return more than one if input record is split. */
Collection<Record> produceRecords(final Record record, WebCrawlingContext context) throws WebCrawlerException;
}