/*
* Copyright [1999-2015] Wellcome Trust Sanger Institute and the EMBL-European Bioinformatics Institute
* Copyright [2016-2017] EMBL-European Bioinformatics Institute
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.ensembl.healthcheck.testcase.generic;
import java.sql.Connection;
import org.ensembl.healthcheck.DatabaseRegistryEntry;
import org.ensembl.healthcheck.ReportManager;
import org.ensembl.healthcheck.Team;
import org.ensembl.healthcheck.testcase.Priority;
import org.ensembl.healthcheck.testcase.SingleDatabaseTestCase;
import org.ensembl.healthcheck.util.DBUtils;
/**
 * Check for hit_names that aren't formatted correctly.
 *
 * <p>
 * A table fails the check when at least one of its rows has a hit_name
 * containing a '|' character. For each failing table the test reports the
 * number of offending rows together with two SQL statements (a preview SELECT
 * and the matching UPDATE) that can be used to repair 'gi|'-prefixed values.
 */
public class HitNameFormat extends SingleDatabaseTestCase {

    /** Tables whose hit_name column is inspected, in reporting order. */
    private static final String[] TABLES = { "dna_align_feature",
            "protein_align_feature", "protein_feature" };

    /**
     * MySQL expression suggested as the replacement value for a hit_name. The
     * inner SUBSTRING_INDEX keeps everything after the second-to-last '|'; the
     * outer one keeps what precedes the first '|' of that remainder.
     */
    private static final String REWRITE_EXPRESSION = "SUBSTRING_INDEX(SUBSTRING_INDEX(hit_name,'|',-2),'|',1)";

    /**
     * Row filter shared by the suggested preview SELECT and the suggested
     * UPDATE, so that the preview lists exactly the rows the UPDATE would
     * change.
     */
    private static final String REWRITE_FILTER = " WHERE hit_name LIKE 'gi|%'";

    /**
     * Creates a new instance and sets its description, priority (AMBER),
     * suggested fix and responsible team (GENEBUILD).
     */
    public HitNameFormat() {
        setDescription("Check that there are no incorrectly formatted hit_names");
        setPriority(Priority.AMBER);
        setFix("Manually fix affected values.");
        setTeamResponsible(Team.GENEBUILD);
    }

    /**
     * Run the test.
     *
     * <p>
     * Every table is checked even after an earlier one has failed, so the
     * report always contains one outcome per table.
     *
     * @param dbre
     *            The database registry entry to be checked.
     * @return true if none of the checked tables has a hit_name containing
     *         '|', false otherwise.
     */
    public boolean run(DatabaseRegistryEntry dbre) {
        boolean result = true;
        Connection con = dbre.getConnection();
        for (String table : TABLES) {
            // Deliberately not short-circuited: each table must be reported on.
            if (!checkTable(con, table)) {
                result = false;
            }
        }
        return result;
    }

    /**
     * Checks the hit_name column of a single table and reports the outcome.
     *
     * @param con
     *            The connection to run the count query on and to report
     *            against.
     * @param table
     *            The name of the table to check.
     * @return true if the count query found no hit_name containing '|', false
     *         otherwise.
     */
    private boolean checkTable(Connection con, String table) {
        int rows = DBUtils.getRowCount(con, "SELECT COUNT(*) FROM " + table
                + " WHERE hit_name LIKE '%|%'");
        if (rows <= 0) {
            ReportManager.correct(this, con, "All " + table
                    + "s have correctly formatted hit_names");
            return true;
        }

        ReportManager.problem(this, con, rows + " " + table
                + "s appear to have incorrectly formatted hit_names (containing a '|' symbol)");
        // The preview and the update are built from the same expression and
        // the same filter; previously the preview matched 'gi%|%' while the
        // update matched 'gi|%', so the preview could show rows that the
        // update would never modify.
        ReportManager.problem(this, con, "USEFUL SQL: SELECT "
                + REWRITE_EXPRESSION + " FROM " + table + REWRITE_FILTER);
        ReportManager.problem(this, con, "UPDATE " + table
                + " SET hit_name = " + REWRITE_EXPRESSION + REWRITE_FILTER);
        return false;
    }
} // HitNameFormat