All Downloads are FREE. Search and download functionalities are using the official Maven repository.

protobuf.opencb.variant_annotation.proto Maven / Gradle / Ivy

The newest version!
syntax = "proto3";

package protobuf.opencb;

option java_package = "org.opencb.biodata.models.variant.protobuf";
option java_outer_classname = "VariantAnnotationProto";
option java_generate_equals_and_hash = true;
//option java_multiple_files = true;

import "protobuf/opencb/common.proto";
import "protobuf/opencb/gene.proto";
import "protobuf/opencb/evidence.proto";

// enum ExpressionCall in common.proto

message ClinVar {
    string accession = 1;
    string clinical_significance = 2;
    repeated string traits = 3;
    repeated string geneNames = 4;
    string review_status = 5;
}

message Gwas {
    string snpIdCurrent = 1;
    repeated string traits = 2;
    double risk_allele_frequency = 3;
    string reported_genes = 4;
}

message Cosmic {
    string mutation_id = 1;
    string primary_site = 2;
    string site_subtype = 3;
    string primary_histology = 4;
    string histology_subtype = 5;
    string sample_source = 6;
    string tumour_origin = 7;
    string gene_name = 8;
    string mutation_somatic_status = 9;
}

message VariantTraitAssociation {
    repeated ClinVar clinvar = 1;
    repeated Gwas gwas = 2;
    repeated Cosmic cosmic = 3;
}

// message GeneDrugInteraction in common.proto
// message Expression in common.proto

//message GeneTraitAssociation {
//    string id = 1;
//    string name = 2;
//    string hpo = 3;
//    float score = 4;
//    int32 number_of_pubmeds = 5;
//    repeated string association_types = 6;
//    repeated string sources = 7;
//    string source = 8;
//}

message PopulationFrequency {
    string study = 1;
    string population = 2;
    string ref_allele = 3;
    string alt_allele = 4;
    float ref_allele_freq = 5;
    float alt_allele_freq = 6;
    float ref_hom_genotype_freq = 7;
    float het_genotype_freq = 8;
    float alt_hom_genotype_freq = 9;
}

message SequenceOntologyTerm {
    string accession = 1;
    string name = 2;
}

message ProteinFeature {
    string id = 1;
    int32 start = 2;
    int32 end = 3;
    string type = 4;
    string description = 5;
}

message Score {
    double score = 1;
    string source = 2;
    string description = 3;
}

message ProteinVariantAnnotation {
    string uniprot_accession = 1;
    string uniprot_name = 2;
    int32 position = 3;
    //string aaChange = 4;
    string reference = 5;
    string alternate = 6;
    string uniprot_variant_id = 7;
    string functional_description = 8;
    repeated Score substitution_scores = 9;
    repeated string keywords = 10;
    repeated ProteinFeature features = 11;
}

message ExonOverlap {
    string number = 1;
    float percentage = 2;
}

message ConsequenceType {
    string gene_name = 1;
    string ensembl_gene_id = 2;
    string ensembl_transcript_id = 3;
    string strand = 4;
    string biotype = 5;
    repeated ExonOverlap exon_overlap = 6;
    repeated string transcript_annotation_flags = 7;
    int32 c_dna_position = 8;
    int32 cds_position = 9;
    string codon = 10;
    ProteinVariantAnnotation protein_variant_annotation = 11;
    repeated SequenceOntologyTerm sequence_ontology_terms = 12;
}

message Repeat {
    string id = 1;
    string chromosome = 2;
    int32 start = 3;
    int32 end = 4;
    int32 period = 5;
    int32 consensusSize = 6;
    float copy_number = 7;
    float percentage_match = 8;
    float score = 9;
    string sequence = 10;
    string source = 11;
}

message Cytoband {
    string chromosome = 1;
    string stain = 2;
    string name = 3;
    int32 start = 4;
    int32 end = 5;
}

message Drug {
    string therapeuticContext = 1;
    string pathway = 2;
    string effect = 3;
    string association = 4;
    string status = 5;
    string evidence = 6;
    repeated string bibliography = 7;
}

message VariantAnnotation {
    string chromosome = 1;
    int32 start = 2;
    int32 end = 3;
    string reference = 4;
    string alternate = 5;
    string ancestral_allele = 6;
    string id = 7;

    message Xref {
        string id = 1;
        string source = 2;
    }
    repeated Xref xrefs = 8;
    repeated string hgvs = 9;
    string display_consequence_type= 10;
    repeated ConsequenceType consequence_types = 11;
    repeated PopulationFrequency population_frequencies = 12;
    string minorAllele = 13;
    float minorAlleleFreq = 14;
    repeated Score conservation = 15;
    repeated Expression gene_expression = 16;
    repeated GeneTraitAssociation gene_trait_association = 17;
    repeated GeneDrugInteraction gene_drug_interaction = 18;
    VariantTraitAssociation variant_trait_association = 19;
    repeated EvidenceEntry trait_association = 24;
    repeated Score functional_score = 20;
    repeated Repeat repeat = 21;
    repeated Cytoband cytoband = 22;
    repeated Drug drugs = 25;

    message AdditionalAttribute {
        map attribute = 1;
    }
    map additional_attributes = 23;
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy