/*******************************************************************************
* Trombone is a flexible text processing and analysis library used
* primarily by Voyant Tools (voyant-tools.org).
*
* Copyright (©) 2007-2012 Stéfan Sinclair & Geoffrey Rockwell
*
* This file is part of Trombone.
*
* Trombone is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Trombone is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Trombone. If not, see <http://www.gnu.org/licenses/>.
******************************************************************************/
package org.voyanttools.trombone.input.source;
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.nio.charset.StandardCharsets;
import org.apache.commons.codec.digest.DigestUtils;
import org.apache.commons.lang3.StringUtils;
import org.voyanttools.trombone.model.DocumentMetadata;
/**
 * An {@link InputSource} associated with an in-memory string.
 *
 * @author Stéfan Sinclair
 */
public class StringInputSource implements InputSource {

	/**
	 * the maximum length of a title derived from the content
	 */
	private static final int TITLE_MAX_LENGTH = 50;

	/**
	 * the string (content) for this input source
	 */
	private final String string;

	/**
	 * the id (hash) for this input source
	 */
	private final String id;

	/**
	 * the metadata for this input source
	 */
	private final DocumentMetadata metadata;

	/**
	 * Create a new instance with a string (the content).
	 *
	 * The metadata is created here: the location is set to "memory", the
	 * source to {@link Source#STRING}, and the title to the content with
	 * surrounding whitespace trimmed, runs of whitespace collapsed to a
	 * single space, and the result abbreviated to at most
	 * {@value #TITLE_MAX_LENGTH} characters. The id is the value returned by
	 * {@link DigestUtils#md5Hex(String)} for the content.
	 *
	 * @param string the content
	 * @throws NullPointerException if the content is null
	 */
	public StringInputSource(String string) {
		// the original code failed on string.trim() for null content; fail
		// up front with a message that names the cause instead
		if (string == null) {
			throw new NullPointerException("string must not be null");
		}
		this.string = string;
		this.id = DigestUtils.md5Hex(string);

		String normalized = string.trim().replaceAll("\\s+", " ");
		DocumentMetadata documentMetadata = new DocumentMetadata();
		documentMetadata.setLocation("memory");
		documentMetadata.setSource(Source.STRING);
		documentMetadata.setTitle(StringUtils.abbreviate(normalized, TITLE_MAX_LENGTH));
		this.metadata = documentMetadata;
	}

	/**
	 * Create a new instance with all of the needed information.
	 *
	 * The arguments are stored as given; nothing is derived or validated.
	 *
	 * @param id
	 *            the ID (should be a relatively short alphanumeric hash code)
	 *            for the input source as generated by
	 *            {@link DigestUtils#md5Hex(String)}
	 * @param metadata
	 *            the metadata associated with the input source (this should
	 *            include information like {@link Source}, location and last
	 *            modified)
	 * @param string the string associated with this input source
	 */
	public StringInputSource(String id, DocumentMetadata metadata, String string) {
		this.id = id;
		this.metadata = metadata;
		this.string = string;
	}

	/**
	 * Get a new stream over the UTF-8 encoded bytes of the content.
	 *
	 * @return a new {@link InputStream} for each call
	 * @throws IOException declared for callers of this signature; the
	 *             in-memory implementation does not throw it
	 */
	public InputStream getInputStream() throws IOException {
		// the charset constant avoids a lookup by name
		return new ByteArrayInputStream(string.getBytes(StandardCharsets.UTF_8));
	}

	/**
	 * Get the metadata for this input source.
	 *
	 * @return the metadata instance held by this input source (not a copy)
	 */
	public DocumentMetadata getMetadata() {
		return this.metadata;
	}

	/**
	 * Get the id for this input source.
	 *
	 * @return the id that was computed or provided at construction
	 */
	public String getUniqueId() {
		return id;
	}
}