-
Notifications
You must be signed in to change notification settings - Fork 58
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Fix gtf2gff converter to remove cds in special cases - add tests for …
…gtf to gff conversion and for gff to gff to check stop codon when starting an exon or split over 2 exons (#125)
- Loading branch information
Showing
72 changed files
with
4,125 additions
and
134 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,9 @@ | ||
chr6 HAVANA transcript 143060901 143061606 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA exon 143060901 143061066 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA CDS 143060926 143061065 . + 0 gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA start_codon 143060926 143060928 . + 0 gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA exon 143061214 143061606 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA stop_codon 143061066 143061066 . + 0 gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA stop_codon 143061214 143061215 . + 0 gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA UTR 143060901 143060925 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA UTR 143061214 143061606 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,12 @@ | ||
##gff-version 3 | ||
chr6 HAVANA gene 143060901 143061606 . + . ID=ENSG00000146416.19;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA transcript 143060901 143061606 . + . ID=ENST00000367596.5;Parent=ENSG00000146416.19;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA exon 143060901 143061066 . + . ID=exon-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA exon 143061214 143061606 . + . ID=exon-2;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA CDS 143060926 143061066 . + 0 ID=cds-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA CDS 143061214 143061215 . + 1 ID=nbis-cds-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA start_codon 143060926 143060928 . + 0 ID=start_codon-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA stop_codon 143061066 143061066 . + 0 ID=stop_codon-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA stop_codon 143061214 143061215 . + 0 ID=stop_codon-2;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA UTR 143060901 143060925 . + . ID=utr-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA UTR 143061216 143061606 . + . ID=utr-2;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,8 @@ | ||
chr6 HAVANA transcript 143060901 143061606 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA exon 143060901 143061066 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA CDS 143060926 143061066 . + 0 gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA start_codon 143060926 143060928 . + 0 gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA exon 143061214 143061606 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA stop_codon 143061214 143061216 . + 0 gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA UTR 143060901 143060925 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; | ||
chr6 HAVANA UTR 143061214 143061606 . + . gene_id "ENSG00000146416.19"; transcript_id "ENST00000367596.5"; gene_type "protein_coding"; gene_name "AIG1"; |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,11 @@ | ||
##gff-version 3 | ||
chr6 HAVANA gene 143060901 143061606 . + . ID=ENSG00000146416.19;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA transcript 143060901 143061606 . + . ID=ENST00000367596.5;Parent=ENSG00000146416.19;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA exon 143060901 143061066 . + . ID=exon-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA exon 143061214 143061606 . + . ID=exon-2;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA CDS 143060926 143061066 . + 0 ID=cds-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA CDS 143061214 143061216 . + 0 ID=nbis-cds-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA start_codon 143060926 143060928 . + 0 ID=start_codon-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA stop_codon 143061214 143061216 . + 0 ID=stop_codon-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA UTR 143060901 143060925 . + . ID=utr-1;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 | ||
chr6 HAVANA UTR 143061217 143061606 . + . ID=utr-2;Parent=ENST00000367596.5;gene_id=ENSG00000146416.19;gene_name=AIG1;gene_type=protein_coding;transcript_id=ENST00000367596.5 |
This file was deleted.
Oops, something went wrong.
Oops, something went wrong.