Command line: [exonerate -m p2g --showtargetgff -q ./SPP00000363_2.0.fa -t ./SPP00000363_2.0/fastasubseq/KV389506.1_fastasubseq.fa] Hostname: [ws101092U] C4 Alignment: ------------ Query: SPP00000363_2.0 # Protein # Selenoprotein P (SELENOP) # Marmoset Target: KV389506.1:subseq(2207742,100551) Cebus capucinus imitator isolate Cc_AM_T3 unplaced genomic scaffold Scaffold80, whole genome shotgun sequence:[revcomp] Model: protein2genome:local Raw score: 1796 Query range: 0 -> 381 Target range: 56210 -> 49942 1 : MetTrpArgSerLeuGlyLeuAlaLeuAlaLeuCysLeuLeuProSerGlyGlyThrGlu : 20 |||||||||||||||||||||||||||||||||||||||||||||||||||||||||||| MetTrpArgSerLeuGlyLeuAlaLeuAlaLeuCysLeuLeuProSerGlyGlyThrGlu 56210 : ATGTGGAGAAGCCTGGGGCTTGCCCTGGctctctgtctcctcccctcAGGAGGAACAGAG : 56153 21 : SerGlnAspGlnSerSerSerCysLysHisProProAlaTrpSerIleArgAspGlnAsp : 40 ||||||||||||||||||! !||||||!!.|||||||||||||||||||||||||||||| SerGlnAspGlnSerSerLeuCysLysGlnProProAlaTrpSerIleArgAspGlnAsp 56152 : AGCCAGGACCAAAGCTCCTTATGTAAGCAACCCCCAGCCTGGAGCATAAGAGATCAAGAT : 56093 41 : ProMetLeuAsnSerSerGlySerValThrValValAlaLeuLeuGlnAlaSerUnkTyr : 60 |||||||||||||||!!!|||||||||||||||||||||||||||||||||||| ||| ProMetLeuAsnSerThrGlySerValThrValValAlaLeuLeuGlnAlaSer***Tyr 56092 : CCAATGCTGAACTCCACTGGTTCAGTGACTGTGGTTGCTCTTCTTCAAGCCAGTTGATAC : 56033 61 : LeuCysIleLeuGlnAlaSer{Ar} >>>> Target Intron 1 >>>> {g}Leu : 69 |||||||||||||||||||||{||} 1063 bp {|}||| LeuCysIleLeuGlnAlaSer{Ar}++ ++{g}Leu 56032 : CTGTGCATTCTGCAGGCATCT{AG}gt.........................ag{A}TTG : 54943 70 : GluAspLeuArgValLysLeuGluLysGluGlyTyrSerAsnIleSerTyrIleIleVal : 89 |||||||||||||||||||||||||||||||||||||||||||||||||||||||||||| GluAspLeuArgValLysLeuGluLysGluGlyTyrSerAsnIleSerTyrIleIleVal 54942 : GAAGACCTGCGAGTAAAACTGGAGAAAGAAGGATATTctaatatttcttatattattgTT : 54883 90 : AsnHisGlnGlyLeuSerSerGlnLeuArgTyrThrHisLeuLysAsnGlnValSerGlu : 109 |||||||||||||||||||||||||||||||||||||||||||||||||||||||||||| AsnHisGlnGlyLeuSerSerGlnLeuArgTyrThrHisLeuLysAsnGlnValSerGlu 54882 : AATCATCAAGGACTCTCTTCTCAATTAAGATACACACATCTTAAGAATCAGGTTTCAGAG : 54823 110 : HisIleProValTyrGlnGlnGluGluAsnGlnProAspValTrpThrLeuLeuAsnGly : 129 |||||||||||||||||||||||||||||||||||||||||||||.!!|||||||||||| HisIleProValTyrGlnGlnGluGluAsnGlnProAspValTrpAlaLeuLeuAsnGly 54822 : CATATTCCTGTTTATCAGCAAGAAGAAAACCAACCAGATGTCTGGGCTCttttaaatgga : 54763 130 : AsnLysAspAspPheLeuIleTyrAsp{Ar} >>>> Target Intron 2 >>>> : 139 |||||||||||||||||||||||||||{||} 2125 bp AsnLysAspAspPheLeuIleTyrAsp{Ar}++ ++ 54762 : aacaaagaTGACTTCCTCATATATGAC{AG}gt.........................ag : 52608 140 : {g}CysGlyArgLeuValTyrHisLeuGlyLeuProPheSerPheLeuThrPheProTyr : 158 {|}||||||||||||||||||||||||||||||||||||||||||||||||||||||||| {g}CysGlyArgLeuValTyrHisLeuGlyLeuProPheSerPheLeuThrPheProTyr 52607 : {A}TGTGGCCGTCTTGTATATCATCTTGGTTTGCCTTTTTCCTTCCTAACATTCCCATAT : 52551 159 : ValGluGluAlaIleLysIleAlaTyrCysGluLysLysCysGlyAsnCysProLeuThr : 178 ||||||||||||||||||||||||||||||||||||||||||||||||||| !!|||||| ValGluGluAlaIleLysIleAlaTyrCysGluLysLysCysGlyAsnCysSerLeuThr 52550 : GTAGAAGAAGCCATTAAGATTGCTTACTGTGAAAAGAAATGTGGAAACTGCTCTCTCACg : 52491 179 : >>>> Target Intron 3 >>>> ThrLeuAsnAspGluAspPheCysLysAsnV : 189 1937 bp ||||||!!.|||||||||||||||||||||| ++ ++ThrLeuLysAspGluAspPheCysLysAsnV 52490 : gt.........................agACTCTCAAAGATGAAGACTTTTGTAAAAATG : 50521 190 : alSerLeuAlaThrValAsnLysThrThrGluAlaProGlnProHisHisHisHisLysH : 209 |||||||||||||||||||||||||||||||||||||||||||||||||||||||||||| alSerLeuAlaThrValAsnLysThrThrGluAlaProGlnProHisHisHisHisLysH 50520 : TAtctttggctactgtgaataaaacAACTGAAGCTCCACAGCCCCATCACCATCATAAGC : 50461 210 : isHisHisAsnHisArgHisGlnHisLeuGlySerSerGluLeuSerLysAsnGlnGlnP : 229 |||||!.!|||||| !!||||||||||||||||||||||||||||||||||||||||||| isHisArgAsnHisGlyHisGlnHisLeuGlySerSerGluLeuSerLysAsnGlnGlnP 50460 : ATCATCGCAATCATGGACATCAGCACCTTGGCAGCAGTGAGCTTTCAAAGAATCAGCAAC : 50401 230 : roGlyAlaProAspAlaProThrHisLeuThrProLeuAspLeuTyrHisHisHisLysH : 249 |||||||||||||||||||||||||||||||||||! !||||||:!!||||||||||||| roGlyAlaProAspAlaProThrHisLeuThrProSerAspLeuHisHisHisHisLysH 50400 : CAGGAGCACCAGATGCTCCTACTCATCTCACTCCTTCAGATCTTCATCACCACCATAAGC : 50341 250 : isLysGlyGlnHisArgGlnGlyHisProGluAsnUnkTyrMetProGlySerGluGlyL : 269 ||||||||||||||||||||||||||||||||||| |||!!:|||||||||||||||| isLysGlyGlnHisArgGlnGlyHisProGluAsn***TyrIleProGlySerGluGlyL 50340 : ACAAGGGTCAACATAGGCAGGGTCACCCAGAGAACTGATATATACCAGGAAGTGAAGGTT : 50281 270 : euGlnHisProArgAsnLysLeuUnkGlnArgArgCysIleAsnGlnLeuLeuUnkLysL : 289 ||||||||||||||||||||||| |||!:!||||||||||||||||||||| |||| euGlnHisProArgAsnLysLeu***GlnLysArgCysIleAsnGlnLeuLeu***LysL 50280 : TACAACATCCACGAAACAAGCTCTGACAAAAGAGATGTATAAATCAATTACTCTGAAAAT : 50221 290 : euProLysAspSerGluLeuAlaProArgSerUnkCysUnkHisCysArgHisLeuIleP : 309 |||||||||||||||||||||||||||||||| ||| ||||||||||||||||||| euProLysAspSerGluLeuAlaProArgSer***Cys***HisCysArgHisLeuIleP 50220 : TGCCCAAAGATTCAGAGTTGGCTCCTAGGAGCTGATGCTGACATTGTCGACATCTGATAT : 50161 310 : heGluLysThrGlySerAlaIleThrUnkGlnCysLysGluAsnLeuProSerLeuCysS : 329 |||||||||||||||||||||||||| ||||||! !|||||||||||||||||||||| heGluLysThrGlySerAlaIleThr***GlnCysThrGluAsnLeuProSerLeuCysS 50160 : TTGAAAAAACGGGGTCTGCAATCACCTGACAGTGTACAGAAAACCTTCCATCTTTATGTA : 50101 330 : erUnkGlnGlyLeuArgAlaGluGluAsnIleThrGluSerCysGlnUnkArgLeuProP : 349 || |||||||||||||||||||||||||||||||||||||||||| |||||||||| er***GlnGlyLeuArgAlaGluGluAsnIleThrGluSerCysGln***ArgLeuProP 50100 : GCTGACAGGGACTTCGGGCAGAGGAGAATATAACTGAATCTTGTCAGTGACGTTTGCCTC : 50041 350 : roAlaAlaUnkGlnThrSerGlnGlnLeuIleProThrGluAlaSerThrAsnUnkSerU : 369 |||||||| :!!||||||||||||||||||||||||||||||||||||||| ||| roAlaAla***LysThrSerGlnGlnLeuIleProThrGluAlaSerThrAsn***Ser* 50040 : CAGCTGCCTGAAAGACAAGTCAGCAGCTTATACCTACAGAAGCCAGTACCAATTGAAGCT : 49981 370 : nkLysAsnLysAlaLysLysUnkGluCysSerSerAsn : 381 ||||||! !||||||||| |||!! !!|||||| **LysAsnMetAlaLysLys***Glu***ProSerAsn 49980 : GAAAGAATATGGCAAAAAAGTGAGAATGACCTtcaaac : 49943 vulgar: SPP00000363_2.0 0 381 . KV389506.1:subseq(2207742,100551) 56210 49942 - 1796 M 67 201 S 0 2 5 0 2 I 0 1059 3 0 2 S 1 1 M 70 210 S 0 2 5 0 2 I 0 2121 3 0 2 S 1 1 M 39 117 5 0 2 I 0 1933 3 0 2 M 203 609 # --- START OF GFF DUMP --- # # ##gff-version 2 ##source-version exonerate:protein2genome:local 2.2.0 ##date 2016-11-18 ##type DNA # # # seqname source feature start end score strand frame attributes # KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local gene 49943 56210 1796 - . gene_id 1 ; sequence SPP00000363_2.0 ; gene_orientation + KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local cds 56008 56210 . - . KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local exon 56008 56210 . - . insertions 0 ; deletions 0 KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local splice5 56006 56007 . - . intron_id 1 ; splice_site "GT" KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local intron 54945 56007 . - . intron_id 1 KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local splice3 54945 54946 . - . intron_id 0 ; splice_site "AG" KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local cds 54732 54944 . - . KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local exon 54732 54944 . - . insertions 0 ; deletions 0 KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local splice5 54730 54731 . - . intron_id 2 ; splice_site "Gt" KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local intron 52607 54731 . - . intron_id 2 KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local splice3 52607 52608 . - . intron_id 1 ; splice_site "AG" KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local cds 52489 52606 . - . KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local exon 52489 52606 . - . insertions 0 ; deletions 0 KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local splice5 52487 52488 . - . intron_id 3 ; splice_site "gt" KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local intron 50552 52488 . - . intron_id 3 KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local splice3 50552 50553 . - . intron_id 2 ; splice_site "AG" KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local cds 49943 50551 . - . KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local exon 49943 50551 . - . insertions 0 ; deletions 0 KV389506.1:subseq(2207742,100551) exonerate:protein2genome:local similarity 49943 56210 1796 - . alignment_id 1 ; Query SPP00000363_2.0 ; Align 56211 1 201 ; Align 54944 69 210 ; Align 52606 140 117 ; Align 50552 179 609 # --- END OF GFF DUMP --- # -- completed exonerate analysis