/*
* Machine Learning support for FindBugs
* Copyright (C) 2005, University of Maryland
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this library; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*/
package edu.umd.cs.findbugs.ml;
import java.io.BufferedInputStream;
import java.io.BufferedOutputStream;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.util.HashSet;
import java.util.List;
import java.util.Set;
import java.util.zip.GZIPInputStream;
import org.dom4j.Attribute;
import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.DocumentFactory;
import org.dom4j.Element;
import org.dom4j.io.OutputFormat;
import org.dom4j.io.XMLWriter;
import edu.umd.cs.findbugs.BugCollection;
import edu.umd.cs.findbugs.Project;
import edu.umd.cs.findbugs.SortedBugCollection;
import edu.umd.cs.findbugs.annotations.NonNull;
import edu.umd.cs.findbugs.xml.Dom4JXMLOutput;
/**
 * Add uid attributes to BugInstances in a BugCollection. A uid is an integer
 * that uniquely identifies a BugInstance in a BugCollection. Right now this is
 * only used in machine learning experiments.
 * <p>
 * The collection is read from the input file, re-serialized into a dom4j
 * document, and every <code>/BugCollection/BugInstance</code> element that has
 * no <code>uid</code> attribute is given one before the document is
 * pretty-printed to the output file. The filename <code>-</code> selects
 * standard input or standard output respectively.
 *
 * @author David Hovemeyer
 */
public class GenerateUIDs {
    /** Filename that selects standard input / standard output instead of a file. */
    private static final String STDIO_FILENAME = "-";

    /** Name of the attribute added to each BugInstance element. */
    private static final String UID_ATTRIBUTE = "uid";

    private final BugCollection bugCollection;
    private final String inputFilename;
    private final String outputFilename;

    /**
     * Create a uid generator.
     *
     * @param inputFilename  file to read the bug collection from; a name ending
     *                       in <code>.gz</code> is read through a gzip stream,
     *                       and <code>-</code> means standard input
     * @param outputFilename file to write the annotated XML to;
     *                       <code>-</code> means standard output
     */
    public GenerateUIDs(String inputFilename, String outputFilename) {
        this.bugCollection = new SortedBugCollection();
        this.inputFilename = inputFilename;
        this.outputFilename = outputFilename;
    }

    /**
     * Read the input collection, add the missing uid attributes, and write the
     * resulting XML document to the output.
     *
     * @throws IOException       if reading the input or writing the output fails
     * @throws DocumentException if the input cannot be read as a bug collection
     */
    public void execute() throws IOException, DocumentException {
        readBugCollection();

        Document document = DocumentFactory.getInstance().createDocument();
        Dom4JXMLOutput xmlOutput = new Dom4JXMLOutput(document);
        bugCollection.writeXML(xmlOutput);

        assignMissingUIDs(document);
        writeDocument(document);
    }

    /** Load the bug collection from the input file or from standard input. */
    private void readBugCollection() throws IOException, DocumentException {
        InputStream in = null;
        try {
            if (STDIO_FILENAME.equals(inputFilename)) {
                in = System.in;
            } else {
                in = new BufferedInputStream(new FileInputStream(inputFilename));
                if (inputFilename.endsWith(".gz")) {
                    in = new GZIPInputStream(in);
                }
            }
            bugCollection.readXML(in);
            // NOTE(review): clearing the reference skips the close() below on
            // success. Presumably readXML takes ownership of the stream and
            // closes it itself -- confirm against BugCollection.readXML.
            in = null;
        } finally {
            if (in != null) {
                in.close();
            }
        }
    }

    /**
     * Give every BugInstance element without a uid attribute a fresh one.
     * Values are handed out in document order starting at 0, skipping any
     * value that already appears (as exact attribute text) on another
     * BugInstance, so a newly assigned uid never duplicates an existing one.
     */
    @SuppressWarnings("unchecked") // converting selectNodes' result to List<Element> is unchecked
    private static void assignMissingUIDs(Document document) {
        List<Element> bugInstanceList = document.selectNodes("/BugCollection/BugInstance");

        // First pass: remember the uids that are already taken.
        Set<String> usedUIDs = new HashSet<String>();
        for (Element element : bugInstanceList) {
            String existing = element.attributeValue(UID_ATTRIBUTE);
            if (existing != null) {
                usedUIDs.add(existing);
            }
        }

        // Second pass: number the remaining elements around the taken values.
        int nextUID = 0;
        for (Element element : bugInstanceList) {
            if (element.attribute(UID_ATTRIBUTE) != null) {
                continue;
            }
            String candidate = Integer.toString(nextUID++);
            while (usedUIDs.contains(candidate)) {
                candidate = Integer.toString(nextUID++);
            }
            element.addAttribute(UID_ATTRIBUTE, candidate);
        }
    }

    /** Pretty-print the document to the output file or to standard output. */
    private void writeDocument(Document document) throws IOException {
        OutputFormat format = OutputFormat.createPrettyPrint();

        if (STDIO_FILENAME.equals(outputFilename)) {
            // Flush rather than close: closing the writer would close
            // System.out for the rest of the process.
            XMLWriter stdoutWriter = new XMLWriter(System.out, format);
            stdoutWriter.write(document);
            stdoutWriter.flush();
            return;
        }

        OutputStream out = new BufferedOutputStream(new FileOutputStream(outputFilename));
        XMLWriter xmlWriter = null;
        try {
            xmlWriter = new XMLWriter(out, format);
            xmlWriter.write(document);
        } finally {
            if (xmlWriter != null) {
                xmlWriter.close();
            } else {
                // The writer could not be created; release the file ourselves.
                out.close();
            }
        }
    }

    /**
     * Command line entry point. Expects exactly two arguments, the input file
     * and the output file; otherwise prints a usage message and exits with
     * status 1.
     *
     * @param args command line arguments
     * @throws IOException       if reading the input or writing the output fails
     * @throws DocumentException if the input cannot be read as a bug collection
     */
    public static void main(String[] args) throws IOException, DocumentException {
        if (args.length != 2) {
            System.err.println("Usage: " + GenerateUIDs.class.getName() + " <input file> <output file>");
            System.exit(1);
        }

        String inputFilename = args[0];
        String outputFilename = args[1];

        GenerateUIDs generateUIDs = new GenerateUIDs(inputFilename, outputFilename);
        generateUIDs.execute();
    }
}