# Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008), # Using native and syntenically mapped cDNA alignments to improve de novo gene finding # Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013 # No extrinsic information on sequences given. # Initialising the parameters using config directory /augustus/config/ ... # Using protein profile unknown # --[0..222]--> unknown_A (15) <--[0..3]--> unknown_B (23) <--[0..18]--> unknown_C (35) <--[0..18]--> unknown_D (63) <--[0..143]--> unknown_E (8) <--[0..1]--> unknown_F (15) <--[6..9]--> unknown_H (17) <--[0..3]--> unknown_I (19) <--[0..2]--> unknown_J (70) <--[4..12]--> unknown_K (13) <--[0..1]--> unknown_L (93) <--[0..2]--> unknown_M (17) <--[1..2]--> unknown_N (26) <--[4..11]--> unknown_O (81) <--[0..8]--> unknown_P (8) <--[3..11]--> unknown_Q (48) <--[2..148]--> unknown_R (26) <--[10..42]--> unknown_S (17) <--[3..30]--> unknown_T (10) <--[0..18]-- # BUSCO_20180911_busco_2432604931 version. Using default transition matrix. # admissible start codons and their probabilities: ATG(1), CTG(0), TTG(0) # Looks like ./tmp/Contig10300920180911_busco_2432604931_.temp is in fasta format. # We have hints for 0 sequences and for 0 of the sequences in the input set. # # ----- prediction on sequence number 1 (length = 4186, name = Contig103009) ----- # # Constraints/Hints: # (none) # Predicted genes for sequence number 1 on both strands # start gene g1 Contig103009 AUGUSTUS gene 1 3397 0.14 + . g1 Contig103009 AUGUSTUS transcript 1 3397 0.14 + . g1.t1 Contig103009 AUGUSTUS intron 1 147 0.44 + . transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS intron 343 911 0.96 + . transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS intron 1049 1160 1 + . transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS intron 1249 3271 0.33 + . transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS CDS 148 342 0.46 + 0 transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS CDS 912 1048 0.97 + 0 transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS CDS 1161 1248 0.97 + 1 transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS CDS 3272 3397 0.41 + 0 transcript_id "g1.t1"; gene_id "g1"; Contig103009 AUGUSTUS stop_codon 3395 3397 . + 0 transcript_id "g1.t1"; gene_id "g1"; # coding sequence = [actataccagcccgcatgtttagacgggttctgactatcgtgaacgcccactgcaagcttggactgaccgcgacattgg # tacgagaggatgacaaaattgcggacctgaattttctgattggaccaaaactgtatgaggcgaactggatggagctacagaataacgggtacatcgcc # agagtgcagtgtgcagagttgttggcagttgtgaatcctaacaagtttcgagcttgccagttcctgatccgataccatgaaagacgcaacgacaaaat # cattgtgttctcggataatgtgtttgccctgaaaagttacgccattaaactgaacaagccatacttgtatggacccacctcacaaggggagagaatgc # agatcttgcagaactttgtccataatccaaaagtcaacaccatctttgacaaaaggaaacgggagattgctcggctctttggtgaagctgagaaagac # attacaggaagcaaaatttctagtgcaatcattggaaaggaaactgaacagatgtctcgttgtgcttgtgaatga] # protein sequence = [TIPARMFRRVLTIVNAHCKLGLTATLVREDDKIADLNFLIGPKLYEANWMELQNNGYIARVQCAELLAVVNPNKFRAC # QFLIRYHERRNDKIIVFSDNVFALKSYAIKLNKPYLYGPTSQGERMQILQNFVHNPKVNTIFDKRKREIARLFGEAEKDITGSKISSAIIGKETEQMS # RCACE] # end gene g1 ### # command line: # /augustus/bin/augustus --codingseq=1 --proteinprofile=eukaryota_odb9/prfl/EOG093703C8.prfl --predictionStart=0 --predictionEnd=21281 --species=BUSCO_20180911_busco_2432604931 ./tmp/Contig10300920180911_busco_2432604931_.temp