/*
* Copyright [1999-2015] Wellcome Trust Sanger Institute and the EMBL-European Bioinformatics Institute
* Copyright [2016-2017] EMBL-European Bioinformatics Institute
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.ensembl.healthcheck.testcase.generic;
import java.sql.Connection;
import org.ensembl.healthcheck.DatabaseRegistryEntry;
import org.ensembl.healthcheck.DatabaseType;
import org.ensembl.healthcheck.ReportManager;
import org.ensembl.healthcheck.Team;
import org.ensembl.healthcheck.testcase.SingleDatabaseTestCase;
import org.ensembl.healthcheck.util.DBUtils;
/**
* Check that feature co-ords make sense.
*/
public class ProteinFeatures extends SingleDatabaseTestCase {
private static int THRESHOLD = 1000;
/**
* Creates a new instance of CheckFeatureCoordsTestCase
*/
public ProteinFeatures() {
setDescription("Check that protein annotation feature coords make sense and that all translations exist in the database");
setTeamResponsible(Team.GENEBUILD);
}
/**
* This only applies to core and Vega databases.
*/
public void types() {
removeAppliesToType(DatabaseType.OTHERFEATURES);
removeAppliesToType(DatabaseType.RNASEQ);
removeAppliesToType(DatabaseType.CDNA);
}
/**
* Iterate over each affected database and perform various checks.
*
* @param dbre
* The database to use.
* @return true if the test passes.
*/
public boolean run(DatabaseRegistryEntry dbre) {
boolean result = true;
Connection con = dbre.getConnection();
logger.fine("Checking protein features for " + DBUtils.getShortDatabaseName(con) + " ...");
int rows = DBUtils.getRowCount(con, "SELECT COUNT(*) FROM protein_feature WHERE seq_start > seq_end");
if (rows > THRESHOLD) {
result = false;
ReportManager.problem(this, con, rows + " protein features have seq_start > seq_end");
}
logger.fine("Checking protein features for " + DBUtils.getShortDatabaseName(con) + " ...");
rows = DBUtils.getRowCount(con, "SELECT COUNT(*) from protein_feature WHERE seq_start < 0");
if (rows > THRESHOLD) {
result = false;
ReportManager.problem(this, con, rows + " protein features have seq_start < 0");
}
logger.fine("Checking protein features for " + DBUtils.getShortDatabaseName(con) + " ...");
rows = DBUtils.getRowCount(con, "SELECT COUNT(*) FROM protein_feature WHERE hit_start < 0");
if (rows > THRESHOLD) {
result = false;
ReportManager.problem(this, con, rows + " protein features have hit_start < 0");
}
logger.fine("Checking protein features for " + DBUtils.getShortDatabaseName(con) + " ...");
rows = DBUtils.getRowCount(con, "SELECT COUNT(*) from protein_feature WHERE hit_start > hit_end");
if (rows > THRESHOLD) {
result = false;
ReportManager.problem(this, con, rows + " protein features have hit_start > hit_end");
}
return result;
} // run
} // ProteinFeatures