GENSCAN 1.0 Date run: 3-Nov-116 Time: 16:22:06 Sequence gi568815595f:47182966_47443938 : 260973 bp : 47.25% C+G : Isochore 2 (43 - 51 C+G%) Parameter matrix: HumanIso.smat Predicted genes/exons: Gn.Ex Type S .Begin ...End .Len Fr Ph I/Ac Do/T CodRg P.... Tscr.. ----- ---- - ------ ------ ---- -- -- ---- ---- ----- ----- ------ 1.01 Intr + 4816 4871 56 2 2 121 52 48 0.046 3.20 1.02 Term + 44400 44474 75 2 0 145 41 3 0.040 -0.86 1.03 PlyA + 47118 47123 6 1.05 2.22 PlyA - 47155 47150 6 1.05 2.21 Term - 52042 51989 54 1 0 63 44 59 0.466 -3.44 2.20 Intr - 52652 52548 105 2 0 50 88 154 0.985 12.01 2.19 Intr - 53184 53069 116 1 2 101 93 167 0.961 18.67 2.18 Intr - 53654 53478 177 0 0 106 45 372 0.937 34.59 2.17 Intr - 58050 57836 215 2 2 57 94 314 0.999 27.26 2.16 Intr - 60280 60086 195 0 0 87 57 130 0.994 8.33 2.15 Intr - 60824 60727 98 2 2 49 63 58 0.425 -1.79 2.14 Intr - 61727 61613 115 1 1 60 81 87 0.474 5.65 2.13 Intr - 61959 61826 134 0 2 62 109 58 0.998 4.74 2.12 Intr - 62546 62456 91 1 1 52 121 138 0.999 13.50 2.11 Intr - 63287 63232 56 2 2 140 78 84 0.999 10.38 2.10 Intr - 64512 64408 105 0 0 79 77 223 0.662 20.71 2.09 Intr - 65121 65053 69 0 0 96 99 104 0.981 11.68 2.08 Intr - 74595 74518 78 0 0 109 77 75 0.925 8.25 2.07 Intr - 81385 81321 65 2 2 109 92 100 0.990 10.94 2.06 Intr - 82912 82765 148 1 1 35 66 225 0.991 14.81 2.05 Intr - 84103 84011 93 1 0 83 98 41 0.964 4.76 2.04 Intr - 88496 88272 225 2 0 84 78 179 0.984 14.68 2.03 Intr - 90693 90587 107 1 2 65 80 59 0.922 2.73 2.02 Intr - 92525 92360 166 2 1 99 48 113 0.926 7.93 2.01 Init - 94409 94317 93 2 0 62 89 94 0.163 7.28 2.00 Prom - 94767 94728 40 -8.86 3.00 Prom + 95073 95112 40 -2.96 3.01 Init + 99821 100129 309 1 0 58 81 499 0.653 43.51 3.02 Term + 100416 100553 138 2 0 93 43 55 0.878 -0.54 3.03 PlyA + 101109 101114 6 1.05 4.04 PlyA - 101860 101855 6 1.05 4.03 Term - 119632 119564 69 1 0 94 39 104 0.978 4.04 4.02 Intr - 120321 120184 138 0 0 -3 98 190 0.665 11.56 4.01 Init - 120606 120496 111 0 0 59 72 88 0.650 4.51 4.00 Prom - 131395 131356 40 -4.26 5.00 Prom + 136029 136068 40 -4.76 5.01 Init + 136543 136584 42 0 0 79 51 37 0.555 -0.23 5.02 Intr + 136688 136818 131 1 2 93 79 130 0.996 12.09 5.03 Intr + 139603 139743 141 1 0 94 89 221 0.984 22.27 5.04 Intr + 146986 147184 199 1 1 86 91 270 0.944 26.45 5.05 Intr + 150192 150352 161 2 2 58 109 141 0.990 11.99 5.06 Intr + 151718 151854 137 2 2 80 82 125 0.991 11.31 5.07 Intr + 153570 153792 223 1 1 44 61 339 0.801 23.99 5.08 Intr + 157607 157711 105 2 0 73 80 169 0.142 13.93 5.09 Intr + 159754 159865 112 1 1 41 65 4 0.182 -6.22 5.10 Term + 160590 160976 387 2 0 125 48 429 0.653 37.54 5.11 PlyA + 163830 163835 6 1.05 6.00 Prom + 167478 167517 40 -7.16 6.01 Init + 175620 175755 136 2 1 67 31 136 0.513 6.10 6.02 Intr + 179829 179943 115 1 1 79 75 52 0.200 2.51 6.03 Intr + 187087 187165 79 1 1 30 119 36 0.101 0.45 6.04 Term + 187231 187332 102 0 0 46 49 251 0.124 15.28 6.05 PlyA + 188210 188215 6 1.05 7.03 PlyA - 188645 188640 6 -0.45 7.02 Term - 188740 188722 19 0 1 75 44 4 0.059 -7.51 7.01 Init - 189305 189199 107 2 2 75 77 107 0.279 7.99 7.00 Prom - 190612 190573 40 1.24 8.00 Prom + 192892 192931 40 -6.16 8.01 Init + 197928 198215 288 2 0 63 105 257 0.636 20.02 8.02 Intr + 213178 213252 75 0 0 98 91 116 0.992 12.61 8.03 Intr + 221687 221814 128 1 2 105 85 138 0.990 14.68 8.04 Intr + 222040 222116 77 1 2 58 85 162 0.999 12.06 8.05 Intr + 222784 222833 50 2 2 128 78 60 0.998 7.40 8.06 Intr + 222950 223081 132 1 0 67 81 254 0.734 23.44 8.07 Intr + 223360 223440 81 0 0 44 91 87 0.887 4.43 8.08 Intr + 223516 223647 132 0 0 112 56 196 0.977 19.64 8.09 Intr + 223738 223785 48 0 0 70 88 92 0.630 6.28 8.10 Intr + 224165 224221 57 1 0 71 98 121 0.958 10.48 8.11 Intr + 224344 224402 59 0 2 96 87 57 0.993 4.08 8.12 Intr + 224540 224619 80 2 2 114 58 43 0.991 3.09 8.13 Intr + 224732 224846 115 0 1 87 94 100 0.996 10.01 8.14 Intr + 224925 224990 66 0 0 77 64 127 0.993 7.22 8.15 Intr + 225380 225525 146 2 2 105 113 206 0.999 24.73 8.16 Intr + 225811 226122 312 2 0 48 99 384 0.829 31.66 8.17 Intr + 226198 226361 164 2 2 88 80 299 0.641 28.79 8.18 Intr + 226452 226603 152 2 2 71 32 317 0.962 23.36 8.19 Intr + 226690 226869 180 1 0 73 72 327 0.924 28.58 8.20 Intr + 226963 227362 400 1 1 93 77 208 0.708 14.71 8.21 Intr + 227963 228721 759 1 0 74 100 820 0.438 73.47 8.22 Intr + 228818 229002 185 1 2 75 62 157 0.998 10.39 8.23 Intr + 229129 229233 105 1 0 99 80 208 0.999 20.43 8.24 Intr + 229318 229456 139 1 1 65 100 190 0.999 18.37 8.25 Intr + 229549 229662 114 0 0 67 100 42 0.893 3.94 8.26 Term + 229741 230220 480 0 0 116 47 276 0.925 21.10 8.27 PlyA + 230450 230455 6 1.05 9.26 PlyA - 230755 230750 6 -0.45 9.25 Term - 231134 230889 246 2 0 104 53 297 0.999 23.59 9.24 Intr - 231421 231215 207 1 0 95 80 200 0.999 19.17 9.23 Intr - 231687 231607 81 0 0 59 115 105 0.511 10.13 9.22 Intr - 232028 231862 167 0 2 97 70 55 0.551 4.28 9.21 Intr - 232215 232133 83 2 2 84 36 79 0.567 1.58 9.20 Intr - 234242 234157 86 2 2 32 105 115 0.988 6.22 9.19 Intr - 234861 234339 523 2 1 107 64 453 0.894 37.75 9.18 Intr - 235284 235169 116 0 2 66 73 147 0.883 10.25 9.17 Intr - 235557 235356 202 2 1 69 89 323 0.999 29.79 9.16 Intr - 235878 235690 189 2 0 69 80 136 0.998 9.60 9.15 Intr - 236739 236363 377 0 2 96 83 321 0.992 26.21 9.14 Intr - 237423 237367 57 0 0 70 92 33 0.560 0.98 9.13 Intr - 237807 237589 219 0 0 73 37 343 0.809 26.20 9.12 Intr - 238064 237966 99 2 0 55 75 92 0.863 4.91 9.11 Intr - 239571 239477 95 1 2 114 110 220 0.999 26.48 9.10 Intr - 241080 240968 113 2 2 125 92 134 0.999 17.52 9.09 Intr - 242646 242520 127 1 1 128 77 221 0.999 24.74 9.08 Intr - 243204 243032 173 2 2 65 46 276 0.637 20.69 9.07 Intr - 244297 244192 106 2 1 87 71 134 0.998 10.87 9.06 Intr - 244702 244482 221 0 2 83 63 222 0.854 17.15 9.05 Intr - 245705 245548 158 2 2 114 80 144 0.998 15.01 9.04 Intr - 248009 247931 79 1 1 91 97 14 0.581 2.15 9.03 Intr - 250369 250202 168 0 0 116 89 21 0.409 4.06 9.02 Intr - 252172 252047 126 0 0 83 11 132 0.458 4.79 9.01 Init - 260028 259907 122 0 2 63 84 79 0.875 4.66 Suboptimal exons with probability > 0.800 Exnum Type S .Begin ...End .Len Fr Ph B/Ac Do/T CodRg P.... Tscr.. ----- ---- - ------ ------ ---- -- -- ---- ---- ----- ----- ------ S.001 Intr - 94414 94317 98 2 2 115 89 87 0.835 11.23 S.002 Term + 198389 198487 99 1 0 94 54 67 0.887 2.03 Predicted peptide sequence(s): Predicted coding sequence(s): >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_1|43_aa XSTHNYISLRKKTHVRYKEVSRPSSFHLSSYKVVPELDITHQK >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_1|132_bp natagcactcacaactatatctctctcagaaagaagactcatgtacgctacaaggaggta agcagacctagttccttccatctttcctcatacaaagtggtcccagagctagatatcacc catcagaagtga >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_2|834_aa MGTRKKVHAFVRVKPTDDFAHEMIRYGDDKRSIDIHLKKDIRRGVVNNQQTDWSFKLDGV LHDASQDLVYETVAKDVVSQALDGYNGTIMCYGQTGAGKTYTMMGATENYKHRGILPRAL QQVFRMIEERPTHAITVRVSYLEIYNESLFDLLSTLPYVGPSVTPMTIVENPQGVFIKGL SVHLTSQEEDAFSLLFEAHSRTLSEEKYITSKINLVDLAGSERLGKSGSEGQVLKEATYI NKSLSFLEQAIIALGDQKRDHIPFRQCKLTHALKDSLGGNCNMVLVTNIYGEAAQLEETL SSLRFASRMKLVTTEPAINEKYDAERMVKNLEKELALLKQELAIHDSLTNRTFVTYDPMD EIQIAEINSQVRRYLEGTLDEIDIISLRQIKEVFNQFRVVLSQQEQEVESTLRRKYTLID RNDFAAISAIQKAGLVDVDGHLVGEPEGQNFGLGVAPFSTKPGKKAKSKKTFKEPLSYWV GTMDVTAANTSKSVGPGLGLVWNRTRIISRPHSNLICLFSEKGTKHCHFSREDSYFSGSW CGEQGVDHSLARKEGASSPVNGKDLDYVSTSKTQLVPSSKDGDVKDMLSRDRETSSIEPL PSDSPKEELRPIRPDTPPSKPVAFEEFKNEQGSEINRIFKENKSILNERRKRASETTQHI NAIKREIDVTKEALNFQKSLREKQGKYENKGLMIIDEEEFLLILKLKDLKKQYRSEYQDL RDLRAEIQYCQHLVDQCRHRLLMEFDIWYNESFVIPEDMQMALKPGGSIRPGMVPVNRIV SLGEDDQDKFSQLQQRVLPEGPDSISFYNAKVKIEQKRQCLYSKWQMHTGQKPK >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_2|2505_bp atgggtactaggaaaaaagttcatgcatttgtccgtgtcaaacccaccgatgactttgct catgaaatgatcagatacggagatgacaaaagaagcattgatattcacttaaaaaaagac attcggagaggagttgtcaataaccaacagacagactggtcgtttaagttggatggagtt cttcacgatgcctcccaggacttggtttatgagacagttgcaaaggatgtggtttctcag gccctcgatggctataatggcaccatcatgtgttatgggcagacgggagctggcaagaca tacaccatgatgggggcaactgagaattacaagcaccgggggatcctccctcgtgccctg cagcaggtttttaggatgatcgaagaacgccccacacatgccatcactgtgcgtgtttcc tacttggaaatctataatgagagcctgtttgatctcctgtccactctgccctatgttgga ccctcagtcacaccaatgaccatcgtggaaaaccctcaaggagtcttcattaagggcttg tcagttcacctcacaagtcaggaggaggatgcattcagcctcctttttgaggcccattcc cggaccttatcagaggaaaagtacatcacttccaaaattaacttggtggatctggcaggc tcagagaggctggggaagtctgggtctgagggccaagtcctgaaggaagccacctacatc aacaaatcgctctcattcctggagcaggccatcattgcccttggggaccagaagcgggac cacatcccctttcggcagtgcaagctcacccacgctctgaaggactcgttagggggaaac tgcaatatggtcctcgtgacaaacatctatggagaagctgcccagttagaagaaacgcta tcttcactgagatttgccagcaggatgaagctagtcaccactgagcctgccatcaatgaa aagtatgatgctgagagaatggtcaagaacctggagaaggaactagcactactcaagcag gagctggctatccatgacagcctgaccaaccgcacctttgtgacctatgaccccatggat gaaatccagattgctgagatcaactcccaggtgcggaggtacctggaggggacactggac gagatcgacataatcagccttagacagatcaaggaggtgttcaaccagttccgggtggtt ctgagccaacaggaacaggaagtggagtccactttgcgcaggaagtacaccctcattgac aggaatgactttgcagccatttctgctatccagaaggcggggcttgtggatgttgatggc cacctagtgggtgagcctgaaggacaaaactttggactcggagtcgcccctttctctacc aaacctgggaagaaagccaagtccaagaagacattcaaagagccactcagctactgggtt ggcacaatggacgtcactgctgccaatactagcaagtctgtggggcccgggctggggctg gtttggaaccgcacaagaatcatctctcgtcctcacagcaacctgatctgcctcttctcg gagaaaggcaccaagcactgtcacttcagcagggaggacagctacttttctgggagctgg tgtggagaacagggtgtggaccactccttggcaagaaaggaaggtgccagcagccctgtg aatgggaaggacttggattacgtttccacctccaagacccagctggtcccatcctccaaa gatggggatgtcaaagacatgctttcgcgggaccgggaaacttccagcattgagcccctt ccctcagactccccgaaggaggaattacgcccaattaggcccgacaccccaccctccaaa ccagtggcctttgaggagtttaagaatgagcaaggtagtgagatcaaccgaattttcaaa gaaaacaaatccatcttgaatgaacggaggaaaagggccagcgagaccacacagcacatc aatgccatcaagcgggagattgatgtgaccaaggaggccctgaatttccagaagtcacta cgggagaagcaaggcaagtacgaaaacaaggggctgatgatcatcgatgaggaagaattc ctgctgatcctcaagctcaaagacctcaagaagcagtaccgcagcgagtaccaggacctg cgtgacctcagggctgagatccagtattgccagcacctagtggatcagtgtcgccaccgc ctgctcatggaatttgacatctggtacaatgagtcctttgtcatccctgaggacatgcag atggcactgaagccaggcggcagcatccggccaggcatggtccctgtgaacaggattgtg tctctgggagaagatgaccaggacaaattcagccagctgcagcagagggtgcttcctgag ggccctgattccatctccttctacaatgccaaagtcaagatagagcagaagaggcagtgc ttatacagcaagtggcagatgcacacggggcagaagcccaagtga >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_3|148_aa MNQEAEWRGFRRRGDSTTAAAEARPIAAPRSERLSACAIAPPWLVSSRPARPAQLQRPGK MVEDGAEELEDLVHFSVSELPSRGYGVMEEIRRQGKLCDVTLKTRENGLTFYGGRGGGRL HMLMGTTEEPSLVTTDISLCLSNLAVLF >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_3|447_bp atgaaccaggaagcggagtggcggggcttccggcgccgaggagattcaactacggcggcc gcggaggcccgtccgattgctgctccgcgctccgagcggctgtcggcgtgcgctatcgcc ccgccctggttagtgtctagccggccggcgaggcctgcgcagttgcagcggccggggaag atggtggaggacggcgcggaggagctggaggatctggtgcacttctccgtgtctgagttg cctagtcgcggctacggcgtcatggaggagatccggcggcagggcaagctgtgcgacgtg accctcaagacaagagaaaatggacttaccttctatggaggcaggggcggtggccggctc cacatgctgatgggcaccactgaagaaccttctcttgtcactacagatatttctttgtgc ctgtcgaacttggctgtgctgttctag >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_4|105_aa MTPAASLLVVQEDKDDENFFWIGSFEVLSLKSGSTLPYCMERIANAMEENPSRENIIKAW KDYTMEDAIIVIEKAVKAIKTETTTQCEDDDGDEGLYDDPLPLNE >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_4|318_bp atgacaccagctgccagtcttttggttgtacaagaagataaggatgatgaaaactttttc tggattggttcctttgaagttttgtcactgaagtcaggaagtaccttgccatactgtatg gaaaggattgccaatgctatggaagagaaccctagtagagagaacatcataaaagcctgg aaggattataccatggaagatgccatcattgttatagaaaaagctgtgaaagccatcaag actgaaacaactactcaatgtgaagatgatgatggtgatgaaggcctttatgatgatcca cttccacttaatgaatag >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_5|545_aa MPWDAFTAFAVGSGIGDHKFSAHRIVLAASIPYFHAMFTNDMMECKQDEIVMQGMDPSAL EALINFAYNGNLAIDQQNVQSLLMGASFLQLQSIKDACCTFLRERLHPKNCLGVRQFAET MMCAVLYDAANSFIHQHFVEVSMSEEFLALPLEDVLELVSRDELNVKSEEQVFEAALAWV RYDREQRGPYLPELLSNIRLPLCRPQFLSDRVQQDDLVRCCHKCRDLVDEAKDYHLMPER RPHLPAFRTRPRCCTSIAGLIYAVGGLNSAGDSLNVVEVFDPIANCWERCRPMTTARSRV GVAVVNGLLYAIGGYDGQLRLSTVEAYNPETDTWTRVGSMNSKRSAMGTVVLDGQIYVCG GYDGNSSLSSVETYSPETDKWTVVTSMSSNRSAAGVTVFEGRIYVSGGHDGLQIFSSVEH YNHHTATWHPAAGMLNKRCRHGAASLGSKMFVCGGYDGSGFLSIAEMYSSVADQWCLIVP MHTRRSRVSLVASCGRLYAVGGYDGQSNLSSVEMYDPETDCWTFMAPMACHEGGVGVGCI PLLTI >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_5|1638_bp atgccctgggatgccttcaccgcctttgcagtgggcagtgggattggggaccacaaattc agtgcccaccggattgtcttagcagcctcgatcccgtatttccatgctatgtttacaaat gacatgatggagtgcaagcaggatgagattgtaatgcaaggaatggacccaagtgccctg gaggctctgatcaactttgcctacaacggcaaccttgccattgaccagcaaaatgtccag tcattgctgatgggggcgagcttcctgcagctgcagagcatcaaagacgcctgctgcaca ttccttcgagaacggcttcacccaaaaaactgcctgggtgtgcgccagtttgctgagaca atgatgtgtgctgtgctgtacgacgctgccaacagcttcatccaccagcactttgtggag gtgtccatgtcagaagagttcctggccctgcccttggaagacgtgcttgagctggtgtct cgggatgagctgaatgtcaaatctgaggagcaggtctttgaagctgcattggcctgggtc agatacgaccgggagcagaggggtccctacctgcctgagctgctgtccaatatccgcctg cccctctgtcggccccagttcctttcagacagagtacagcaggatgacctggtgcgttgc tgccacaaatgcagggacctggtagacgaagcaaaggactaccacctcatgccagagcgc cggccccacctgccagctttcagaacccggccacgctgctgcacatccatcgctggactt atctacgctgtagggggcctcaactcagcaggtgattccctgaatgtggtggaagtgttc gaccccattgccaattgctgggagagatgccgtcccatgacaacagcccgcagccgcgtt ggcgtggctgtggtgaacgggcttctctatgccatcggaggatatgacggccagctacgg ctgagcactgtggaggcctacaacccggagacagacacatggaccagagtggggagcatg aatagcaagagaagtgccatggggacagtcgtgctggatgggcagatctacgtctgtggg ggctacgatggcaactcttccctcagctccgtggagacctactcacctgagacggacaaa tggacagtggtgacctcgatgagctcgaatcgcagtgctgctggggttacagtctttgag ggcaggatatatgtgtcaggcggccatgatggtttgcagatcttcagcagtgtggaacac tacaaccaccacacagccacctggcaccctgcagctggcatgctcaacaagcgctgccgg cacggagccgcctccctggggagcaagatgtttgtctgcgggggctacgatggctctggc ttcctcagcattgccgagatgtacagctctgtggcagaccagtggtgcctgattgtcccc atgcacacgcgcaggagccgggtctccctggtggccagctgtgggcgcctctacgctgtt gggggctacgacggacagtcaaacctaagctcagtggagatgtatgacccagagacagac tgctggacattcatggcccccatggcgtgccatgagggaggggtcggtgtgggctgcatc cctctcctcaccatctaa >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_6|143_aa MRESLELLRDWLNGCDQNADSDMDNEVQAAKVSDGNEELIGNWSKTMQERPNTSHFLSLS LNFLLCVRKQEEESLPCVFSCHVSLGNKSETPSQKQQQQQQQKQDPGTELSEEERQSEEE RQSEEERQSEEERQSDVGLAAGA >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_6|432_bp atgagggaaagtttggaacttcttagagactggttaaatggctgtgaccaaaatgctgat agtgatatggacaatgaagtccaggctgccaaagtctcagatggaaatgaggaacttatt ggtaactggagcaaaacaatgcaagaacggcctaatacaagtcacttcctgtctttgtcc ctcaatttcctcctctgtgtgaggaaacaggaagaagaatccctgccctgcgtattcagc tgccacgtgagcctgggcaacaagagtgaaactccatctcaaaaacaacaacaacaacaa caacaaaaacaggacccaggcacagagctgtcagaggaggagcggcagtcagaggaggag cggcagtcagaggaggagcggcagtcagaggaggagcggcagtctgatgttggtttggct gctggggcctga >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_7|41_aa MSNLISNQENANPNYTEMPLDSHQNDEYTSVNNKCCHQPGS >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_7|126_bp atgtccaacctcatcagtaaccaggaaaatgcaaaccccaactacactgaaatgccactt gatagtcatcagaatgatgagtatacatctgtcaataataagtgttgccaccagccagga tcctag >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_8|1507_aa MRNRDSACAKDYASGWLGSLQLPAGRWHFSFPPVTSDFRHEGAGLGSWLSQQLQQLREWP GGRRVPAAMEAVPRMPMIWLDLKEAGDFHFQPAVKKFVLKNYGENPEAYNEELKKLELLR QNAVRVPRDFEGCSVLRKYLGQLHYLQSRVPMGSGQEAAVPVTWTEIFSGKSVAHEDIKY EQACILYNLGALHSMLGAMDKRVSEEGMKVSCTHFQCAAGAFAYLREHFPQAYSVDMSRQ ILTLNVNLMLGQAQECLLEKSMLDNRKSFLVARISAQVVDYYKEACRALENPDTASLLGR IQKDWKKLVQMKIYYFAAVAHLHMGKQAEEQQKFGERVAYFQSALDKLNEAIKLAKGQPD TVQDALRFTMDVIGGKYNSAKKDNDFIYHEAVPALDTLQPVKGAPLVKPLPVNPTDPAVT GPDIFAKLVPMAAHEASSLYSEEKAKLLREMMAKIEDKNEVLDQFMDSMQLDPETVDNLD AYSHIPPQLMEKCAALSVRPDTVRNLVQSMQVLSGVFTDVEASLKDIRDLLEEDELLEQK FQEAVGQAGAISITSKAELAEVRREWAKYMEVHEKASFTNSELHRAMNLHVGNLRLLSGP LDQVRAALPTPALSPEDKAVLQNLKRILAKVQEMRDQRVSLEQQLRELIQKDDITASLVT TDHSEMKVGWKLFEEQLKKYDQLKVYLEQNLAAQDRVLCALTEANVQYAAVRRVLSDLDQ KWNSTLQTLVASYEAYEDLMKKSQEGRDFYADLESKVAALLERTQSTCQAREAARQQLLD RELKKKPPPRPTAPKPLLPRREESEAVEAGDPPEELRSLPPDMVAGPRLPDTFLGSATPL HFPPSPFPSSTGPGPHYLSGPLPPGTYSGPTQLIQPRAPGPHAMPVAPGPALYPAPAYTP ELGLVPRSSPQHGVPPHPPLAYGPAPSTRPMGPQAAPLTIRGPSSAGQSTPSPHLVPSPA PSPGPGPVPPRPPAAEPPPCLRRGAAAADLLSSSPESQHGGTQSPGGGQPLLQPTKVDAA EGRRPQALRLIERDPYEHPERLRQLQQELEAFRGQLGDVGALDTVWRELQDAQEHDARGR SIAIARCYSLKNRHQDVMPYDSNRVVLRSGKDDYINASCVEGLSPYCPPLVATQAPLPGT AADFWLMVHEQKVSVIVMLVSEAEMEKQKVARYFPTERGQPMVHGALSLALSSVRSTETH VERVLSLQFRDQSLKRSLVHLHFPTWPELGLPDSPSNLLRFIQEVHAHYLHQRPLHTPII VHCSSGVGRTGAFALLYAAVQEVEAGNGIPELPQLVRRMRQQRKHMLQEKLHLRFCYEAV VRHVEQVLQRHGVPPPCKPLASASISQKNHLPQDSQDLVLGGDVPISSIQATIAKLSIRP PGGLESPVASLPGPAEPPGLPPASLPESTPIPSSSPPPLSSPLPEAPQPKEEPPVPEAPS SGPPSSSLELLASLTPEAFSLDSSLRGKQRMSKHNFLQAHNGQGLRATRPSDDPLSLLDP LWTLNKT >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_8|4524_bp atgcgcaacagggacagcgcctgcgcaaaagactacgcgagcgggtggctgggttcactg caactcccggcaggccgctggcatttttcattccctcccgtgaccagtgacttccggcac gaaggggcggggctgggctcgtggctgagccagcagctgcagcagctacgggagtggccg ggtggccggcgggtgccagccgccatggaggccgtgccccgcatgcccatgatctggctg gacctgaaggaggccggtgactttcacttccagccagctgtgaagaagtttgtcctgaag aattatggagagaacccagaagcctacaatgaagaactgaagaagctggagttgctcaga cagaatgctgtccgtgtcccacgagactttgagggctgtagtgtcctccgcaagtacctc ggccagcttcattacctgcagagtcgggtccccatgggctcgggccaggaggccgctgtc cctgtcacctggacagagatcttctcaggcaagtctgtggcccatgaggacatcaagtac gagcaggcctgtattctctacaaccttggagcgctgcactccatgctgggggccatggac aagcgggtgtctgaggagggcatgaaggtctcctgtacccatttccagtgcgcagccggc gccttcgcctacctacgggagcacttccctcaagcctacagcgtcgacatgagccgccag atccttacgctcaacgtcaacctcatgctgggccaggctcaggagtgcctcctggagaag tcgatgttggacaacaggaagagctttctggtggcccgcatcagtgcacaggtggtagat tactacaaggaggcatgccgggccttggagaaccccgacactgcctcactgctgggccgg atccagaaggactggaagaaacttgtgcagatgaagatctactacttcgcagccgtggct catctgcacatgggaaagcaggccgaggagcagcagaagttcggggagcgggttgcatac ttccagagcgccctggacaagctcaatgaagccatcaagttggccaagggccagcctgac actgtgcaagacgcgcttcgcttcactatggatgtcattgggggaaagtacaattctgcc aagaaggacaacgacttcatttaccatgaggctgtcccagcattggacactcttcagcct gtaaaaggagcccccttggtgaagcccttgccagtgaaccccacagacccagctgttaca ggccctgacatctttgccaaactggtacccatggctgcccacgaggcctcgtcactgtac agtgaggagaaggccaagctgctccgggagatgatggccaagattgaggacaagaatgag gtcctggaccagttcatggattcaatgcagttggatcccgagacggtggacaaccttgat gcctacagccacatcccaccccagctcatggagaagtgcgcggctctcagcgtccggccc gacactgtcaggaaccttgtacagtccatgcaagtgctgtcaggtgtgttcacggatgtg gaggcttccctgaaggacatcagagatctgttggaggaggatgagctgctagagcagaag tttcaggaggcggtgggccaggcaggggccatctccatcacctccaaggctgagctggca gaggtgaggcgagaatgggccaagtacatggaagtccatgagaaggcctccttcaccaac agtgagctgcaccgtgccatgaacctgcacgtcggcaacctgcgcctgctcagcgggccg cttgaccaggtccgggctgccctgcccacaccggccctctccccagaggacaaggccgtg ctgcaaaacctaaagcgcatcctggctaaggtgcaggagatgcgggaccagcgcgtgtcc ctggagcagcagctgcgtgagcttatccagaaagatgacatcactgcctcgctggtcacc acagaccactcagagatgaaggtgggctggaagttgttcgaggagcagctgaaaaagtat gaccagctgaaggtgtacctggagcagaacctggccgcccaggaccgtgtcctctgtgca ctgacagaggccaacgtgcagtacgcagccgtgcggcgggtactcagcgacttggaccaa aagtggaactccacgctgcagaccctggtggcctcgtatgaagcctatgaggacctgatg aagaagtcgcaggagggcagggacttctacgcagatctggagagcaaggtggctgctctg ctggagcgcacgcagtccacctgccaggcccgcgaggctgcccgccagcagctcctggac agggagctgaagaagaagccgccgccacggcccacagccccaaagccgctgctgccccgc agggaggagagtgaggcagtggaagcaggagacccccctgaggagctgcgcagcctcccc cctgacatggtggctggcccacgactgcctgacaccttcctgggaagtgccaccccgctc cactttcctcccagccccttccccagctccacaggcccaggaccccactatctctcaggc cccttgccccctggtacctactcgggccccacccagctgatacagcccagggccccaggg ccccatgcaatgcccgtagcacctgggcctgccctctacccagcccctgcctacacaccg gagctgggccttgtgccccgatcctccccacagcatggcgtgcctccccatcccccactg gcatatggtcctgccccttctaccagacccatgggcccccaggcagcccctcttaccatt cgagggccctcgtctgctggccagtccacccctagtccccacctggtgccttcacctgcc ccatctccagggcctggtccggtaccccctcgccccccagcagcagaaccacccccttgc ctgcgccgaggcgccgcagctgcagacctgctctcctccagcccggagagccagcatggc ggcactcagtctcctgggggtgggcagcccctgctgcagcccaccaaggtggatgcagct gagggtcgtcggccgcaggccctgcggctgattgagcgggacccctatgagcatcctgag aggctgcggcagttgcagcaggagctggaggcctttcggggtcagctgggggatgtggga gctctggacactgtctggcgagagctgcaagatgcgcaggaacatgatgcccgaggccgt tccatcgccattgcccgctgctactcactgaagaaccggcaccaggatgtcatgccctat gacagtaaccgtgtggtgctgcgctcaggcaaggatgactacatcaatgccagctgcgtg gaggggctctccccatactgccccccgctagtggcaacccaggccccactgcctggcaca gctgctgacttctggctcatggtccatgagcagaaagtgtcagtcattgtcatgctggtt tctgaggctgagatggagaagcaaaaagtggcacgctacttccccaccgagaggggccag cccatggtgcacggtgccctgagcctggcattgagcagcgtccgcagcaccgaaacccat gtggagcgcgtgctgagcctgcagttccgagaccagagcctcaagcgctctcttgtgcac ctgcacttccccacttggcctgagttaggcctgcccgacagccccagcaacttgctgcgc ttcatccaggaggtgcacgcacattacctgcatcagcggccgctgcacacgcccatcatt gtgcactgcagctctggtgtgggccgcacgggagcctttgcactgctctatgcagctgtg caggaggtggaggctgggaacggaatccctgagctgcctcagctggtgcggcgcatgcgg cagcagagaaagcacatgctgcaggagaagctgcacctcaggttctgctatgaggcagtg gtgagacacgtggagcaggtcctgcagcgccatggtgtgcctcctccatgcaaacccttg gccagtgcaagcatcagccagaagaaccaccttcctcaggactcccaggacctggtcctc ggtggggatgtgcccatcagctccatccaggccaccattgccaagctcagcattcggcct cctggggggttggagtccccggttgccagcttgccaggccctgcagagcccccaggcctc ccgccagccagcctcccagagtctaccccaatcccatcttcctccccgccccccctttcc tccccactacctgaggctccccagcctaaggaggagccgccagtgcctgaagcccccagc tcggggcccccctcctcctccctggaattgctggcctccttgaccccagaggccttctcc ctggacagctccctgcggggcaaacagcggatgagcaagcataactttctgcaggcccat aacgggcaagggctgcgggccacccggccctctgacgaccccctcagccttctggatcca ctctggacactcaacaagacctga >gi568815595f:47182966_47443938|GENSCAN_predicted_peptide_9|1379_aa MTLTERLREKISRAFYNHGLLCASYPIPIILFTGFCILACCYPLLKLPLPGTGPVEFTTP VKDYSPPPVDSDRKQGEPTEQPEIEKEMGPGQSPGVTQLSGQLSHLHWLSLIKIQASDTE VGGKDCFSYEEQEIQPKSEVPGGINLLCLVSILALAYAVTWSTALYVGAPVAYVQQIFVK SSVFPWHKNLLAVDVFRSPLSRAFQLVEEIRNHVLRDSSGIRSLEELCLQVTDLLPGLRK LRNLLPEHGCLLLSPGNFWQNDWERFHADPDIIGTIHQHEPKTLQTSATLKDLLFGVPGK YSGVSLYTRKRMVSYTITLVFQHYHAKFLGSLRARLMLLHPSPNCSLRAESLVHVHFKEE IGVAELIPLVTTYIILFAYIYFSTRKIDMVKSKWGLALAAVVTVLSSLLMSVGLCTLFGL TPTLNGGEIFPYLVVVIGLENVLVLTKSVVSTPVDLEVKLRIAQGLSSESWSIMKNMATE LGIILIGYFTLVPAIQEFCLFAVVGLVSDFFLQMLFFTTVLSIDIRRMELADLNKRLPPE ACLPSAKPVGQPTRYERQLAVRPSTPHTITLQPSSFRNLRLPKRLRVVYFLARTRLAQRL IMTLVASEEISLWEKQLQGSQAGTVVWIGILVYTDPAGLRNYLAAQVTEQSPLGEGALAP MPVPSGMLPPSHPDPAFSIFPPDAPKLPENQTSPGESPERGGPAEVVHDSPVPEVTWGPE DEELWRKLSFRHWPTLFSYYNITLAKRYISLLPVIPVTLRLNPREALEGRHPQDGRSAWP PPGPIPAGHWEAGPKGPGGVQAHGDVTLYKVAALGLATGIVLVLLLLCLYRVLCPRNYGQ LGGGPGRRRRGELPCDDYGYAPPETEIVPLVLRGHLMDIECLASDGMLLVSCCLAGHVCV WDAQTGDCLTRIPRPGRQRRDSGVGSGLEAQESWERLSDGGKAGPEEPGDSPPLRHRPRG PPPPSLFGDQPDLTCLIDTNFSAQPRSSQPTQPEPRHRAVCGRSRDSPGYDFSCLVQRVY QEEGLAAVCTPALRPPSPGPVLSQAPEDEGGSPEKGSPSLAWAPSAEGSIWSLELQGNLI VVGRSSGRLEVWDAIEGVLCCSSEEVSSGITALVFLDKRIVAARLNGSLDFFSLETHTAL SPLQFRGTPGRGSSPASPVYSSSDTVACHLTHTVPCAHQKPITALKAAAGRLVTGSQDHT LRVFRLEDSCCLFTLQGHSGAITTVYIDQTMVLASGGQDGAICLWDVLTGSRVSHVFAHR GDVTSLTCTTSCVISSGLDDLISIWDRSTGIKFYSIQQDLGCGASLGVISDNLLVTGGQG CVSFWDLNYGDLLQTVYLGKNSEAQPARQILVLDNAAIVCNFGSELSLVYVPSVLEKLD >gi568815595f:47182966_47443938|GENSCAN_predicted_CDS_9|4140_bp atgaccctgactgaaaggctgcgtgagaagatatctcgggccttctacaaccatgggctc ctctgtgcatcctatcccatccccatcatcctcttcacagggttctgcatcttagcctgc tgctacccactgctgaaactccccttgccaggaacaggacctgtggaattcaccacccct gtgaaggattactcgcccccacctgtggactctgaccgcaaacaaggagagcctactgag cagcctgagattgagaaggagatgggcccagggcagtcacctggtgtcacacagctcagt ggtcagttatctcacctccattggctgtccttgataaagatacaggccagcgatactgaa gtgggtggtaaggactgttttagttatgaagaacaggaaattcaacccaaatcagaggtc ccaggaggcattaacttgctgtgcttggtcagcatcttggcccttgcctatgctgtaacc tggagtactgcattgtatgtgggtgccccggtggcttatgtccagcagatatttgtgaag tcctcagtgtttccctggcacaagaacctcctggcagtagatgtatttcgttcacctttg tcccgggcattccaactggtggaggagatccggaaccacgtgctgagagacagctctggg atcaggagcttggaggagttgtgtctgcaagtgaccgacctgctgccaggccttaggaag ctcaggaacctactccctgagcatggatgcctgctgctgtcccctgggaacttctggcag aatgactgggaacgcttccatgctgatcctgacatcattgggaccatccaccagcacgag cctaaaaccctgcagacttcagccacactcaaagacttgttatttggtgttcctgggaag tacagcggggtgagcctctacaccaggaagaggatggtctcctacaccatcaccctggtc ttccagcactaccatgccaagttcctgggcagcctgcgtgcccgcctgatgcttctgcac cccagccccaactgcagccttcgggcggagagcctggtccacgtgcacttcaaggaggag attggtgtcgctgagctcatcccccttgtgaccacctacatcatcttgtttgcctacatc tacttctccacgcggaagatcgacatggtcaagtccaagtgggggctggccctggctgcc gtggtcacagtgctcagctcgctgctcatgtctgtgggactctgcacactcttcggcctg acgcccaccctcaatggcggcgagattttcccctaccttgtggtggttattgggttagag aatgtgttggtgctcaccaagtctgtggtctcaaccccggtagacctggaggtgaagctg cggatcgcccaaggcctaagcagcgagagctggtccatcatgaagaacatggccacggag ctgggcatcatcctcatcggctacttcaccctagtgcccgccatccaggagttctgtctc tttgctgtcgtggggctggtgtctgacttcttccttcagatgctgtttttcaccactgtc ctgtccattgacattcgccggatggagctagcagacctgaacaagcgactgccccctgag gcctgcctgccctcagccaagccagtgggacagccaacgcgctacgagcggcagctggct gtgaggccgtccacaccccacaccatcacgttgcagccgtcttccttccgaaacctgcgg ctccccaagaggctgcgtgttgtctacttcctggcccgcacccgcctggcacagcgcctc atcatgaccctagtggcttctgaggagataagcctgtgggagaagcagctccagggttct caggctggcaccgttgtctggattggcatcctggtatacacagacccagcagggctgcgc aactacctcgctgcccaggtgacggaacagagcccattgggtgagggagccctggctccc atgcccgtgcctagtggcatgctgccccccagccacccggaccctgccttctccatcttc ccacctgatgcccctaagctacctgagaaccagacgtcgccaggcgagtcacctgagcgt ggaggtccagcagaggttgtccatgacagcccagtcccagaggtaacctgggggcctgag gatgaggaactttggaggaaattgtccttccgccactggccgacgctcttcagctattac aacatcacactggccaagaggtacatcagcctgctgcccgtcatcccagtcacgctccgc ctgaacccgagggaggctctggagggccggcaccctcaggacggccgcagtgcctggccc ccaccggggcccatacctgctgggcactgggaagcaggacccaagggcccaggtggggtg caggcccatggagacgtcacgctgtacaaggtggcggcgctgggcctggccaccggcatc gtcttggtgctgctgctgctctgcctctaccgcgtgctatgcccgcgcaactacgggcag ctgggtggtgggcccgggcggcggaggcgcggggagctgccctgcgacgactacggctat gcgccacccgagacggagatcgtgccgcttgtgctgcgcggccacctcatggacatcgag tgcctggccagcgacggcatgctgctggtgagctgctgcctggcaggccacgtctgcgtg tgggacgcgcagaccggggattgcctaacgcgcattccgcgcccaggcaggcagcgccgg gacagtggcgtgggcagcgggcttgaggctcaggagagctgggaacgactttcagatggt gggaaggctggtccagaggagcctggggacagccctcccctgagacaccgcccccggggc cctccgccgccttccctcttcggggaccagcctgacctcacctgcttaattgacaccaac ttttcagcgcagcctcggtcctcacagcccactcagcccgagccccggcaccgggcggtc tgtggccgctctcgggactccccaggctatgacttcagctgcctggtgcagcgggtgtac caggaggaggggctggcggccgtctgcacaccagccctgcgcccaccctcgcctgggccg gtgctgtcccaggcccctgaggacgagggtggctcccccgagaaaggctccccttccctc gcctgggcccccagtgccgagggttccatctggagcttggagctgcagggcaacctcatc gtggtggggcggagcagcggccggctggaggtgtgggacgccattgaaggggtgctgtgc tgcagcagcgaggaggtctcctcaggcattaccgctctggtgttcttggacaaaaggatt gtggctgcacggctcaacggttcccttgatttcttctccttggagacccacactgccctc agccccctgcagtttagagggaccccagggcggggcagttcccctgcctctccagtgtac agcagcagcgacacagtggcctgtcacctgacccacacagtgccctgtgcacaccaaaaa cccatcacagccctgaaagccgctgctgggcgcttggtgactgggagccaagaccacaca ctgagagtgttccgtctggaggactcgtgctgcctcttcacccttcagggccactcaggg gccatcacgaccgtgtacattgaccagaccatggtgctggccagtggaggacaagatggg gccatctgcctgtgggatgtactgactggcagccgggtcagccatgtgtttgctcaccgt ggggatgtcacctcccttacctgtaccacctcctgtgtcatcagcagtggcctggatgac ctcatcagcatctgggaccgcagcacaggcatcaagttctactccattcagcaggacctg ggctgtggtgcaagcttgggtgtcatctcagacaacctgctggtgactggcggccagggc tgtgtctccttttgggacctaaactacggggacctgttacagacagtctacctggggaag aacagtgaggcccagcctgcccgccagatcctggtgctggacaacgctgccattgtctgc aactttggcagtgagctcagcctggtgtatgtgccctctgtgctggagaagctggactga