# Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008), # Using native and syntenically mapped cDNA alignments to improve de novo gene finding # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013 # No extrinsic information on sequences given. # Initialising the parameters using config directory /augustus/config/ ... # Using protein profile unknown # --[14..112]--> unknown_B (17) <--[1..4]--> unknown_C (21) <--[86..536]--> unknown_D (33) <--[0..9]--> unknown_E (13) <--[0..1]--> unknown_F (8) <--[0..6]--> unknown_G (27) <--[2..5]--> unknown_H (14) <--[0..5]--> unknown_I (58) <--[0..29]--> unknown_J (20) <--[4..18]--> unknown_K (24) <--[2..12]--> unknown_L (46) <--[0..163]--> unknown_M (108) <--[0..3]--> unknown_N (27) <--[0..1]--> unknown_O (31) <--[2..20]--> unknown_P (27) <--[12..95]--> unknown_R (16) <--[3..8]--> unknown_S (18) <--[0..5]--> unknown_T (32) <--[0..30]--> unknown_U (32) <--[9..50]--> unknown_V (8) <--[5..11]--> unknown_W (13) <--[0..15]--> unknown_X (21) <--[0..2]--> unknown_Y (8) <--[6..23]--> unknown_Z (13) <--[0..11]--> unknown_AA (16) <--[8..132]-- # fly version. Using default transition matrix. # Looks like ./tmp/Contig6587520180911_busco_2432604931_.temp is in fasta format. # We have hints for 0 sequences and for 0 of the sequences in the input set. # # ----- prediction on sequence number 1 (length = 9606, name = Contig65875) ----- # # Constraints/Hints: # (none) # Predicted genes for sequence number 1 on both strands # start gene g1 Contig65875 AUGUSTUS gene 4166 9334 0.01 + . g1 Contig65875 AUGUSTUS transcript 4166 9334 0.01 + . g1.t1 Contig65875 AUGUSTUS tss 4166 4166 . + . transcript_id "g1.t1"; gene_id "g1"; Contig65875 AUGUSTUS exon 4166 4220 . + . transcript_id "g1.t1"; gene_id "g1"; Contig65875 AUGUSTUS exon 5459 6580 . + . transcript_id "g1.t1"; gene_id "g1"; Contig65875 AUGUSTUS start_codon 5652 5654 . + 0 transcript_id "g1.t1"; gene_id "g1"; Contig65875 AUGUSTUS CDS 5652 6506 0.25 + 0 transcript_id "g1.t1"; gene_id "g1"; Contig65875 AUGUSTUS stop_codon 6504 6506 . + 0 transcript_id "g1.t1"; gene_id "g1"; Contig65875 AUGUSTUS exon 9048 9334 . + . transcript_id "g1.t1"; gene_id "g1"; Contig65875 AUGUSTUS tts 9334 9334 . + . transcript_id "g1.t1"; gene_id "g1"; # coding sequence = [atgaaacaaaatttctccaaacgaaatgaagacaagaaaaaggatgttggtactccaaaaaataaagaccagaaaaagc # atgatcagcttccaccaggtaggattctgtcatgtccagacaattcaaaaagcactggaacacggatgacgactgaaacacaaaagagtgccagtgta # gaagttaaagggagcatgaaaatgggagacatgttggataaggaatgctttggggatgacaaagctggaaacaatgaaaatctgtctaatgtgacttc # agaaaatccacaacaagtttcgtgtaaccaaagccttagtgtagaagaagacaagaatatggtgaaatacatctttactgttttaaagcagttagaag # atgaaaatgagctactgatacatctcattggtgttgtggtagatgttaaatttcgagttgcttcctttgaaaaagattcaaaaaacaataccgttgtt # gtagaaattcacttcaaaagcaattcagatgcaagaagatttcaaagttgcttggcacaaagtaggaaaaaattgtccttcagatacaaatttcaaaa # gcttgaaataggagctccatctaaaacgagacgagaaagcatacaaattttgcagaacatatgtaagaagactgagaacgttttagggaaacatttag # aaaagatcaaggagactgacagtaaaatttcaaaattaaacaaagcaccttcaaaaaagaagacaaaatatattgatatctcacttcatgaagagaga # gaattgcagaagaaagctttggaatacaaaaaattagaactgaaacaacaacagggtgagtttcaaacctatcctgatctgacactataa] # protein sequence = [MKQNFSKRNEDKKKDVGTPKNKDQKKHDQLPPGRILSCPDNSKSTGTRMTTETQKSASVEVKGSMKMGDMLDKECFGD # DKAGNNENLSNVTSENPQQVSCNQSLSVEEDKNMVKYIFTVLKQLEDENELLIHLIGVVVDVKFRVASFEKDSKNNTVVVEIHFKSNSDARRFQSCLA # QSRKKLSFRYKFQKLEIGAPSKTRRESIQILQNICKKTENVLGKHLEKIKETDSKISKLNKAPSKKKTKYIDISLHEERELQKKALEYKKLELKQQQG # EFQTYPDLTL] # end gene g1 ### # command line: # /augustus/bin/augustus --codingseq=1 --proteinprofile=eukaryota_odb9/prfl/EOG0937060I.prfl --predictionStart=0 --predictionEnd=27988 --species=fly ./tmp/Contig6587520180911_busco_2432604931_.temp