AV436090 ( PM066f05_r )

[UP]


[1][TOP]
>UniRef100_B3NX29 GG19316 n=1 Tax=Drosophila erecta RepID=B3NX29_DROER
          Length = 906

 Score = 65.1 bits (157), Expect = 3e-09
 Identities = 60/175 (34%), Positives = 67/175 (38%), Gaps = 18/175 (10%)
 Frame = +1

Query: 4    QQPP------SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSY-----AP 150
            QQPP       YG   P +  GG    G ++G P  PG Y  +G GG P  S       P
Sbjct: 559  QQPPPGPPQSQYGPPPPQNFAGGPPPMG-YAGYPPNPGQYGQAGAGGGPPPSGYWPPPPP 617

Query: 151  SSSASLP-------QGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQM 309
            +SSA  P       Q A  G   GAPP     Y    PTS               AP Q 
Sbjct: 618  TSSAQSPYQAYQQQQQAAAGGGAGAPPG--SSYPGGPPTSGAAPPPPPGGAYSTTAPSQT 675

Query: 310  PPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
            PPP G     A GG T           NGP +  S   P    GGG GP+ P GA
Sbjct: 676  PPPQGGGG--AGGGNT---------NPNGPNAQQSTPPPQGGAGGGAGPSGPGGA 719

[2][TOP]
>UniRef100_UPI0001791D37 PREDICTED: similar to lim domain binding protein n=1
           Tax=Acyrthosiphon pisum RepID=UPI0001791D37
          Length = 722

 Score = 64.7 bits (156), Expect = 4e-09
 Identities = 50/157 (31%), Positives = 57/157 (36%), Gaps = 2/157 (1%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPY--APGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAP 207
           P S+VGG S  G   G      PG Y G  PG H                      GG P
Sbjct: 9   PSSMVGGPSGPGGGGGRRGYGGPGGYGGGPPGHH----------------------GGGP 46

Query: 208 PSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHG 387
           P   GG    GP      +  G      P+     PP+GP PH   GG    HG P HHG
Sbjct: 47  PGHHGGSVLGGPHGGPPGHLGGGVHHSGPSGHHGGPPSGP-PHHGGGGPPGHHGGPPHHG 105

Query: 388 ANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTA 498
             GP        P +  GGG  P +  G  + P S A
Sbjct: 106 --GPPGSGPHGGPPHPHGGGGPPHHGAGVPLHPHSGA 140

[3][TOP]
>UniRef100_Q9W3G1 CG10555 n=1 Tax=Drosophila melanogaster RepID=Q9W3G1_DROME
          Length = 926

 Score = 64.7 bits (156), Expect = 4e-09
 Identities = 59/177 (33%), Positives = 67/177 (37%), Gaps = 20/177 (11%)
 Frame = +1

Query: 4    QQPP------SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSY-----AP 150
            QQPP       YG   P +  GG    G ++G P  PG Y  +G GG P  S       P
Sbjct: 571  QQPPPGPPQSQYGPPPPQNSAGGPPPMG-YAGYPPNPGQYGQAGAGGGPPPSGYWPPPPP 629

Query: 151  SSSASLP---------QGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPP 303
            +SSA  P         Q A  G   GAPP     Y    PTS               AP 
Sbjct: 630  TSSAQSPYQAYQQQQQQQAAAGGGAGAPPG--SSYPGGPPTSGAAPPPPPGGAYSTTAPS 687

Query: 304  QMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
            Q PPP G       GG    +  P     NGP +  S   P    GGG GP+ P GA
Sbjct: 688  QTPPPQGG------GGAGGGNNNP-----NGPNAQQSTPPPQGGAGGGAGPSGPGGA 733

[4][TOP]
>UniRef100_A1UQ37 Putative methyl-accepting chemotaxis sensory transducer n=1
           Tax=Mycobacterium sp. KMS RepID=A1UQ37_MYCSK
          Length = 845

 Score = 64.3 bits (155), Expect = 5e-09
 Identities = 69/200 (34%), Positives = 88/200 (44%), Gaps = 22/200 (11%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAGSFSG---PPYAPGVYAGSGPGGHPASSYAPSS--SAS 165
           A  PP       GS  GG+S+ GS      PP A G+ + +G GG   SS + ++  S+S
Sbjct: 312 AMTPPMTPVSSGGS--GGASSLGSIGSGFKPPSASGL-SSAGTGGLSPSSLSSNAGLSSS 368

Query: 166 LPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAH 345
           LP      S GG P + AGG GA G  +AT S+ S  F +       +PPP  P P    
Sbjct: 369 LPSSVSPAS-GGLPSAAAGGGGAPG--AATSSDFSRGFNAGLGTGSVLPPPVAPPPAQPL 425

Query: 346 GGVTAAHGVPRHHG------ANGPASLNS----AALPAYATGGGNGPAYPPGAIVSPAS- 492
              T A  VP   G      A GPA + S    A  PA   G    P  PP A  +PA  
Sbjct: 426 SSTTGASSVPVSAGPAPVSAAGGPAHVASPTPAAGAPAGHMGSMGAPMMPPAA--APAGP 483

Query: 493 TATFN------RLSPAAAAA 534
              FN      +++PA A A
Sbjct: 484 LPPFNSDLQPRQVAPAGAGA 503

[5][TOP]
>UniRef100_UPI000186E27B hypothetical protein Phum_PHUM355640 n=1 Tax=Pediculus humanus
            corporis RepID=UPI000186E27B
          Length = 844

 Score = 63.2 bits (152), Expect = 1e-08
 Identities = 65/210 (30%), Positives = 85/210 (40%), Gaps = 37/210 (17%)
 Frame = +1

Query: 7    QPPSYGSHVPGSVVGGSSAAGSF------SGPPYAPGVYAGSGPGGHPASSYAPSSSASL 168
            Q PS  S   G   G S  +GSF      SGP +  G    SGP G    S  PSSS S 
Sbjct: 551  QGPSGPSGSFGGSQGPSGPSGSFDGSQGPSGPSFGGGNQGPSGPSGSFGGSQGPSSSVSF 610

Query: 169  ---------PQGAHLGSRG--------GAPPSVAGGYGASGPTSATFSNESGSF---QSL 288
                     P G+  GS+G        GAP   +G  G+ G +    S  SGSF    + 
Sbjct: 611  GGGNQGPSGPSGSFGGSQGPSGPSGSYGAPQGPSGSTGSFGGSQRPSSPSSGSFGGPGNQ 670

Query: 289  QPAPP--QMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAY 462
             P+PP     PP+GPS   + GG     G     G  GP+  ++ +    A  G +GP+ 
Sbjct: 671  GPSPPSGSYGPPSGPSG--SFGGSQGPSGPSFGGGNQGPSGPSTPSGSYGAPQGSSGPSV 728

Query: 463  P---------PGAIVSPASTATFNRLSPAA 525
                      P    SP  ++TF   +P A
Sbjct: 729  SFVGQQGSRVPVTGGSPGPSSTFGPTTPTA 758

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 57/175 (32%), Positives = 72/175 (41%), Gaps = 12/175 (6%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGS------SAAGSFSGPPYAPGVYAGS-GPGGHPASSYAPSSSASLPQ 174
           S G   P    GGS      S  G   GP    G + GS GP G P+ S+  S   S P 
Sbjct: 512 SQGPSGPSGSFGGSQGPSGPSFGGGNQGPSGPSGSFGGSQGPSG-PSGSFGGSQGPSGPS 570

Query: 175 GAHLGSRGGAPPSVAGG-YGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGG 351
           G+  GS+G + PS  GG  G SGP        SGSF   Q          GPS  ++ GG
Sbjct: 571 GSFDGSQGPSGPSFGGGNQGPSGP--------SGSFGGSQ----------GPSSSVSFGG 612

Query: 352 VTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP----ASTATF 504
                      G  GP+       P+ + GG  GP+ P G+  +P     ST +F
Sbjct: 613 -----------GNQGPSG------PSGSFGGSQGPSGPSGSYGAPQGPSGSTGSF 650

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 55/172 (31%), Positives = 68/172 (39%), Gaps = 18/172 (10%)
 Frame = +1

Query: 13  PSYGSHVP------GSVVGGSSAAGSFSGPPY---APGVYAGS----GPGGHP---ASSY 144
           PS+G   P      GS  G + A   FSG P    +PG    S    G GG+P   +SS+
Sbjct: 66  PSFGPSPPSSRPDFGSQSGSTPAGNGFSGRPSGSSSPGSGYPSAGQGGQGGYPGSSSSSF 125

Query: 145 APSSSASLPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTG 324
            P        G   GS+G +P +  GGY + GP   TFS+  G        P       G
Sbjct: 126 GPGYQGGSGGGGRPGSQGSSPGTSNGGYPSGGP---TFSSGVGG----SSGPGYQGGAGG 178

Query: 325 PSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAY--ATGGGNGPAYPPGA 474
            S     GG     G     GA G +       P Y    GGG+GP Y  GA
Sbjct: 179 GSGPGYQGGAGGGSGPGYQGGAGGGSG------PGYQGGAGGGSGPGYQGGA 224

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 48/162 (29%), Positives = 61/162 (37%), Gaps = 8/162 (4%)
 Frame = +1

Query: 13  PSY-GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGP------GGHPASSYAPSSSASLP 171
           P Y G    GS  G    AG  SGP Y  G   GSGP      GG     Y   +     
Sbjct: 194 PGYQGGAGGGSGPGYQGGAGGGSGPGYQGGAGGGSGPGYQGGAGGGSGPGYQGGAGGGSG 253

Query: 172 QGAHLGSRGGAPPSVAGGYGASG-PTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG 348
            G   G+ GG+ P   GG G  G P S   S  +  +Q            +GPS     G
Sbjct: 254 PGYQGGAGGGSGPGFQGGAGGGGRPGSQGGSGGNSGYQG----------GSGPS---FQG 300

Query: 349 GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
           G    +G     G+ GP     +  P +   GG+GP +  G+
Sbjct: 301 GAGGGNGPSSQGGSGGPGFQGGSGGPGFQ--GGSGPGFQGGS 340

[6][TOP]
>UniRef100_UPI0000222BCC Hypothetical protein CBG04553 n=1 Tax=Caenorhabditis briggsae AF16
           RepID=UPI0000222BCC
          Length = 723

 Score = 62.8 bits (151), Expect = 2e-08
 Identities = 54/179 (30%), Positives = 69/179 (38%), Gaps = 17/179 (9%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGV-YAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGG 225
           GG  ++G ++ PP   G  YA  G GG     YA      +  G +    GG   S  GG
Sbjct: 86  GGGGSSGGYAKPPGGGGGGYASGGGGGGGGGGYASGGGGGVSSGGYAKPSGGGGGSSGGG 145

Query: 226 YGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPAS 405
           Y + G +S       G +    PAP   P P  P+P  A  G  A+ G     G++G   
Sbjct: 146 YSSGGGSSG--GGGGGGYSQSAPAPAAAPAP-APAPAPAPSGGYASSG--GGGGSSGGGY 200

Query: 406 LNSAALPA----------YATGG------GNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
             SA  PA          YA+GG      G G  Y   A   P   A     +PA A A
Sbjct: 201 SQSAPAPAPAPAPAPSGGYASGGGAGGSSGGGGGYSQSAPPPPPQPAPAPEPAPAPAPA 259

 Score = 59.3 bits (142), Expect = 2e-07
 Identities = 47/164 (28%), Positives = 68/164 (41%), Gaps = 1/164 (0%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
           A +P    +  P      S   G  SG  Y+ G  +  G GG  +  Y+ S+    P  A
Sbjct: 249 APEPAPAPAPAPSGGYASSGGGGGSSGGGYSSGGGSSGGGGGGSSGGYSQSAPPPPPAPA 308

Query: 181 HLGSRGGAP-PSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVT 357
              +   AP P+ +GGY +SG  S+      G +   Q APP   P + P+P  A  G  
Sbjct: 309 PAPAPAPAPAPAPSGGYASSGGGSS--GGGGGGYS--QSAPPPPAPESAPAPAPAPSGGY 364

Query: 358 AAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
           A+ G     G  G +S +S    +   GGG G  Y   +   P+
Sbjct: 365 ASSGGGESSG--GGSSASSGGYASSGGGGGGGGGYASASAPPPS 406

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 53/164 (32%), Positives = 63/164 (38%), Gaps = 15/164 (9%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAG---SFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLP 171
           A  P   G +  G   GGSS  G   S S PP  P       P   PA + AP+     P
Sbjct: 210 APAPAPSGGYASGGGAGGSSGGGGGYSQSAPPPPPQ----PAPAPEPAPAPAPA-----P 260

Query: 172 QGAHLGSRGGAPPSVAGGYGASGPTS-ATFSNESGSFQSLQPAPPQMPPPT---GPSPHL 339
            G +  S GG   S  GGY + G +S       SG +    P PP  P P     P+P  
Sbjct: 261 SGGYASSGGGGG-SSGGGYSSGGGSSGGGGGGSSGGYSQSAPPPPPAPAPAPAPAPAPAP 319

Query: 340 AHGGVTAAHGVPRHHGANG--------PASLNSAALPAYATGGG 447
           A  G  A+ G     G  G        P +  SA  PA A  GG
Sbjct: 320 APSGGYASSGGGSSGGGGGGYSQSAPPPPAPESAPAPAPAPSGG 363

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 57/201 (28%), Positives = 78/201 (38%), Gaps = 28/201 (13%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSS-------ASLPQ 174
           S G +   S  GG S+ G +S      G   G G GG+  S+ AP+++       A  P 
Sbjct: 127 SSGGYAKPSGGGGGSSGGGYSS---GGGSSGGGGGGGYSQSAPAPAAAPAPAPAPAPAPS 183

Query: 175 GAHLGSRGG-----------------AP-PSVAGGYGASGPTSATFSNESGSFQSLQPAP 300
           G +  S GG                 AP P+ +GGY ASG  +   S   G +    P P
Sbjct: 184 GGYASSGGGGGSSGGGYSQSAPAPAPAPAPAPSGGY-ASGGGAGGSSGGGGGYSQSAPPP 242

Query: 301 PQMPPPT---GPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPG 471
           P  P P     P+P  A  G  A+ G     G +     +S    +   GGG+   Y   
Sbjct: 243 PPQPAPAPEPAPAPAPAPSGGYASSG---GGGGSSGGGYSSGGGSSGGGGGGSSGGYSQS 299

Query: 472 AIVSPASTATFNRLSPAAAAA 534
           A   P + A     +PA A A
Sbjct: 300 APPPPPAPAPAPAPAPAPAPA 320

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 47/164 (28%), Positives = 62/164 (37%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
           A  P   G +  G   GG S+ G   G   AP       P   P  + AP+ S+      
Sbjct: 482 APAPAPSGGYSSGGGGGGGSSGGYSGGSAPAPASEPAPAPAPEPEPAPAPAPSS------ 535

Query: 181 HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA 360
             G   G   S  GG G+SG +S  +S   GS     P PP   P   P+P  A  G  +
Sbjct: 536 --GGYSGGSSSGGGGGGSSGGSSGGYS--GGSAAPPPPPPPAPEPAPAPAPAPAPSGGYS 591

Query: 361 AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS 492
           + G     G       +  + PA A+     PA  P    +PAS
Sbjct: 592 SEG---GGGGGSSGGYSGGSAPAPASEPAPAPAPEPEPAPAPAS 632

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 48/170 (28%), Positives = 60/170 (35%), Gaps = 7/170 (4%)
 Frame = +1

Query: 19  YGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG 198
           Y S   GS  GG       + PP AP   +   P   P+  YA S       G    S G
Sbjct: 325 YASSGGGSSGGGGGGYSQSAPPPPAPE--SAPAPAPAPSGGYASSGGGESSGGGSSASSG 382

Query: 199 GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA------ 360
           G   S  GG G  G  SA+    SG       A    PPP  P+P  A     A      
Sbjct: 383 GYASSGGGGGGGGGYASASAPPPSGGGGGGYSASAAPPPPPPPAPEPAPAPAPAPAPSRG 442

Query: 361 -AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFN 507
            + G     G++G  S  SA  PA        P   P    +PA +  ++
Sbjct: 443 YSSGGGGGGGSSGGYSGGSAPAPASEPAPAPAPEQAPAPAPAPAPSGGYS 492

[7][TOP]
>UniRef100_Q5NT95 Type 1 collagen alpha 2 n=1 Tax=Paralichthys olivaceus
            RepID=Q5NT95_PAROL
          Length = 1352

 Score = 62.8 bits (151), Expect = 2e-08
 Identities = 53/170 (31%), Positives = 65/170 (38%), Gaps = 19/170 (11%)
 Frame = +1

Query: 22   GSHVPGSVVG--GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
            G+  P    G  GS      +G    PG     G  G   ++ AP       +G H G  
Sbjct: 598  GARGPAGAPGPDGSKGEPGITGAAGGPGHQGPGGMPGERGAAGAPGGKGEKGEGGHRGPE 657

Query: 196  GGAPPSVAGGY-GASGPTSATFSN----ESGSFQSLQPAPPQMPP----PTGPSPHLAHG 348
            G A    A G  G +GP   T +N    ESGSF    PA P+         GP+      
Sbjct: 658  GNAGRDGARGMPGPAGPPGPTGANGDKGESGSFGPAGPAGPRGASGERGEVGPAGAPGFA 717

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATG--------GGNGPAYPPGA 474
            G   A G P   G  GPA +     P+  +G        G NGPA PPGA
Sbjct: 718  GPPGADGQPGARGERGPAGIKGEVGPSGPSGPAGQSGPAGPNGPAGPPGA 767

[8][TOP]
>UniRef100_Q16988 Fibroin-4 (Fragment) n=1 Tax=Araneus diadematus RepID=Q16988_ARADI
          Length = 410

 Score = 62.8 bits (151), Expect = 2e-08
 Identities = 59/179 (32%), Positives = 77/179 (43%), Gaps = 16/179 (8%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGP-------PYAPGVYAGSGPGGHPASSYAPSSSASL 168
           P +YG   P S    ++AAGS  G        P  PG Y   GPGG  +S+ A +++AS 
Sbjct: 27  PVAYGPGGPVSSAAAAAAAGSGPGGYGPENQGPSGPGGY---GPGGSGSSAAAAAAAASG 83

Query: 169 PQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG 348
           P G   GS+G + P  +GGYG  G   A+     G+  +   A      P G  P     
Sbjct: 84  PGGYGPGSQGPSGPGGSGGYG-PGSQGASGPGGPGASAAAAAAAAAASGPGGYGP----- 137

Query: 349 GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP---------AYPPGAIVSPASTA 498
           G     G P  +G  GP S  +AA  A +  GG GP          Y PG   S A+ A
Sbjct: 138 GSQGPSG-PGAYGPGGPGSSAAAAAAAASGPGGYGPGSQGPSGPGVYGPGGPGSSAAAA 195

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 52/157 (33%), Positives = 69/157 (43%), Gaps = 8/157 (5%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGP-------PYAPGVYAGSGPGGHPASSYAPSSSASL 168
           P +YG   PGS    ++AA S  G        P  PGVY   GPG   +S+ A +++ S 
Sbjct: 145 PGAYGPGGPGSSAAAAAAAASGPGGYGPGSQGPSGPGVYGPGGPG---SSAAAAAAAGSG 201

Query: 169 PQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG 348
           P G    ++G   PS  GGYG  G         SGS  +   A    P   GP      G
Sbjct: 202 PGGYGPENQG---PSGPGGYGPGG---------SGSSAAAAAAAASGPGGYGPGSQGPSG 249

Query: 349 -GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP 456
            G +  +G P   G +GP +  +AA  A +  GG GP
Sbjct: 250 PGGSGGYG-PGSQGGSGPGASAAAAAAAASGPGGYGP 285

 Score = 57.4 bits (137), Expect = 6e-07
 Identities = 48/166 (28%), Positives = 73/166 (43%), Gaps = 13/166 (7%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGP---------PYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
           PG+    ++AA + SGP         P  PG Y   GPGG  +S+ A +++AS P G   
Sbjct: 116 PGASAAAAAAAAAASGPGGYGPGSQGPSGPGAY---GPGGPGSSAAAAAAAASGPGGYGP 172

Query: 187 GSRGGAPPSV--AGGYGASGPTSATFSNESGSF--QSLQPAPPQMPPPTGPSPHLAHGGV 354
           GS+G + P V   GG G+S   +A   +  G +  ++  P+ P    P G     A    
Sbjct: 173 GSQGPSGPGVYGPGGPGSSAAAAAAAGSGPGGYGPENQGPSGPGGYGPGGSGSSAAAAAA 232

Query: 355 TAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS 492
            A+       G+ GP+    +      + GG+GP     A  + AS
Sbjct: 233 AASGPGGYGPGSQGPSGPGGSGGYGPGSQGGSGPGASAAAAAAAAS 278

 Score = 57.0 bits (136), Expect = 8e-07
 Identities = 50/169 (29%), Positives = 74/169 (43%), Gaps = 19/169 (11%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGP-------PYAPGVYAGSGPGGHPASSYAPSSSASL 168
           P  YG   PGS    ++AAGS  G        P  PG Y   GPGG  +S+ A +++AS 
Sbjct: 180 PGVYGPGGPGSSAAAAAAAGSGPGGYGPENQGPSGPGGY---GPGGSGSSAAAAAAAASG 236

Query: 169 PQGAHLGSRGGAPPSVAGGY----------GASGPTSATFSNESGSF--QSLQPAPPQMP 312
           P G   GS+G + P  +GGY          GAS   +A  ++  G +   S  P+ P   
Sbjct: 237 PGGYGPGSQGPSGPGGSGGYGPGSQGGSGPGASAAAAAAAASGPGGYGPGSQGPSGPGYQ 296

Query: 313 PPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPA 459
            P+GP  +      +A+     +        ++SA     ++G  NG A
Sbjct: 297 GPSGPGAYGPSPSASASVAASVYLRLQPRLEVSSAVSSLVSSGPTNGAA 345

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 58/189 (30%), Positives = 78/189 (41%), Gaps = 32/189 (16%)
 Frame = +1

Query: 4   QQPPSYGSHVP-GSVVGGSSAAGSFSGP-----------------PYAPGVYAGSGPGGH 129
           Q P   G + P GS    ++AA + SGP                  Y PG    SGPGG 
Sbjct: 57  QGPSGPGGYGPGGSGSSAAAAAAAASGPGGYGPGSQGPSGPGGSGGYGPGSQGASGPGGP 116

Query: 130 PAS--SYAPSSSASLPQGAHLGSRGGAPPSV--AGGYGASGPTSATFSNESGSF--QSLQ 291
            AS  + A +++AS P G   GS+G + P     GG G+S   +A  ++  G +   S  
Sbjct: 117 GASAAAAAAAAAASGPGGYGPGSQGPSGPGAYGPGGPGSSAAAAAAAASGPGGYGPGSQG 176

Query: 292 PAPPQMPPPTGPSPHLA--------HGGVTAAHGVPRHHGANGPASLNSAALPAYATGGG 447
           P+ P +  P GP    A         GG    +  P   G  GP    S+A  A A   G
Sbjct: 177 PSGPGVYGPGGPGSSAAAAAAAGSGPGGYGPENQGPSGPGGYGPGGSGSSAAAAAAAASG 236

Query: 448 NGPAYPPGA 474
            G  Y PG+
Sbjct: 237 PG-GYGPGS 244

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 51/172 (29%), Positives = 72/172 (41%), Gaps = 2/172 (1%)
 Frame = +1

Query: 25  SHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGA 204
           S    +   GS   G  +  P  P  Y   GPGG  +S+ A +++ S P G    ++G  
Sbjct: 4   SAAAAAAASGSGGYGPENQGPSGPVAY---GPGGPVSSAAAAAAAGSGPGGYGPENQG-- 58

Query: 205 PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG-GVTAAHGVPRH 381
            PS  GGYG  G         SGS  +   A    P   GP      G G +  +G P  
Sbjct: 59  -PSGPGGYGPGG---------SGSSAAAAAAAASGPGGYGPGSQGPSGPGGSGGYG-PGS 107

Query: 382 HGANGPASLNSAALPAYATGGGNGP-AYPPGAIVSPASTATFNRLSPAAAAA 534
            GA+GP    ++A  A A    +GP  Y PG+   P+    +    P ++AA
Sbjct: 108 QGASGPGGPGASAAAAAAAAAASGPGGYGPGS-QGPSGPGAYGPGGPGSSAA 158

[9][TOP]
>UniRef100_C4XYJ5 Predicted protein n=1 Tax=Clavispora lusitaniae ATCC 42720
            RepID=C4XYJ5_CLAL4
          Length = 953

 Score = 62.4 bits (150), Expect = 2e-08
 Identities = 66/188 (35%), Positives = 77/188 (40%), Gaps = 13/188 (6%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGP-----PYAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
            P S GS  PGS  G S A GS   P     P +PG    SG  G P S  +PSS +  P 
Sbjct: 616  PGSPGS--PGSP-GASGAPGSPGSPGSPGSPGSPGSPGASGSPGSPGSPGSPSSPSGSPG 672

Query: 175  GAHLGSRGGA-----PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHL 339
                 S  GA      P   G  GASG   +  S  S S  S  P  P  P   G S   
Sbjct: 673  SPSSPSSPGASGSPGSPGSPGSPGASGSPGSPGSPGSPSSPSGSPGSPSSPSSPGAS--- 729

Query: 340  AHGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATFNR 510
               G   + G P   GA+G P S  S   P+  +G    P+ P  PGA  SP S  +   
Sbjct: 730  ---GSPGSPGSPGSPGASGSPGSPGSPGSPSSPSGSPGSPSSPSSPGASGSPGSPGSPG- 785

Query: 511  LSPAAAAA 534
             SP A+ A
Sbjct: 786  -SPGASGA 792

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 59/180 (32%), Positives = 71/180 (39%), Gaps = 8/180 (4%)
 Frame = +1

Query: 13   PSYGSHVPGSVVGGSSAAGSFS-GPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
            PS  S  PGS    SS   S S G P +PG    SG  G P S  +PSS +  P      
Sbjct: 664  PSSPSGSPGSPSSPSSPGASGSPGSPGSPGSPGASGSPGSPGSPGSPSSPSGSPGSPSSP 723

Query: 190  SRGGA-----PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGV 354
            S  GA      P   G  GASG   +  S  S S  S  P  P  P   G S      G 
Sbjct: 724  SSPGASGSPGSPGSPGSPGASGSPGSPGSPGSPSSPSGSPGSPSSPSSPGAS------GS 777

Query: 355  TAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATFNRLSPAAA 528
              + G P   GA+G            A G    P  P  PG+  SP S+ + +  SP+A+
Sbjct: 778  PGSPGSPGSPGASG------------APGAPGSPGSPGSPGSPSSPGSSESGSPSSPSAS 825

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 56/165 (33%), Positives = 70/165 (42%), Gaps = 4/165 (2%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
            P S GS  PGS    SS +GS  G P +PG    SG  G P S  +P +S +       G
Sbjct: 582  PGSPGS--PGSPGSPSSPSGS-PGSPSSPGSPGASGSPGSPGSPGSPGASGAPGSPGSPG 638

Query: 190  SRGG-APPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAH 366
            S G    P   G  G+ G   +  S  S S     P+ P  P  +G SP         + 
Sbjct: 639  SPGSPGSPGSPGASGSPGSPGSPGSPSSPSGSPGSPSSPSSPGASG-SP--------GSP 689

Query: 367  GVPRHHGANG-PASLNSAALPAYATGGGNGPAYP--PGAIVSPAS 492
            G P   GA+G P S  S   P+  +G    P+ P  PGA  SP S
Sbjct: 690  GSPGSPGASGSPGSPGSPGSPSSPSGSPGSPSSPSSPGASGSPGS 734

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 56/170 (32%), Positives = 66/170 (38%), Gaps = 15/170 (8%)
 Frame = +1

Query: 37  GSVVGGSSAAGS--------FSGPPYAPGVYAGSGPGG--HPASSYAPSSSASLPQGAHL 186
           G+  G  S +GS         SG P APG    +GP G   PA    PS  A  P     
Sbjct: 362 GNGSGNGSGSGSPGSPGSPGASGAPGAPGAPGPAGPAGPAGPAGPAGPSGPAGSPGSPGS 421

Query: 187 GSRGGAP--PSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA 360
               G+P  P   G  GASG   +  S  S S  S  P  P  P   G S      G   
Sbjct: 422 PGASGSPESPGSPGSPGASGAPGSPGSPGSPSSPSGAPGSPGSPGSPGASGSPGSPGSPG 481

Query: 361 AHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYP--PGAIVSPASTAT 501
           + G P   GA G P S  S   P  A+G    P  P  PG+  SP S ++
Sbjct: 482 SPGSPGASGAPGSPGSPGSPGSPG-ASGAPGSPGSPGSPGSPGSPGSPSS 530

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 62/180 (34%), Positives = 76/180 (42%), Gaps = 5/180 (2%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
           P S GS  PGS  G S A GS  G P +PG    SG  G P S  +P S  S        
Sbjct: 477 PGSPGS--PGSP-GASGAPGS-PGSPGSPGSPGASGAPGSPGSPGSPGSPGS-------- 524

Query: 190 SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMP--PPTGPSPHLAHGGVTAA 363
              G+P S +G  G+ G   A     SGS     P  P  P  P +  SP  +  G   +
Sbjct: 525 --PGSPSSPSGSPGSPGSPGA-----SGS-----PGSPGSPGSPGSPSSPGSSESGSPGS 572

Query: 364 HGVPRHHGANG-PASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATFNRLSPAAAAA 534
            G P   G+ G P S  S   P+  +G    P+ P  PGA  SP S  +    SP A+ A
Sbjct: 573 PGSPGASGSPGSPGSPGSPGSPSSPSGSPGSPSSPGSPGASGSPGSPGSPG--SPGASGA 630

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 63/182 (34%), Positives = 76/182 (41%), Gaps = 21/182 (11%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSG-PG--GHPASSYAPSSSASLPQGA 180
            P S GS  PGS    SS +GS  G P +PG     G PG  G P S  +P SS S   G+
Sbjct: 516  PGSPGS--PGSPGSPSSPSGS-PGSPGSPGASGSPGSPGSPGSPGSPSSPGSSESGSPGS 572

Query: 181  HLGSRG--------------GAPPSVAGGYGA-SGPTSATFSNESGSFQSLQPAPPQMPP 315
              GS G              G+P S +G  G+ S P S   S   GS     P  P  P 
Sbjct: 573  P-GSPGASGSPGSPGSPGSPGSPSSPSGSPGSPSSPGSPGASGSPGS-----PGSPGSPG 626

Query: 316  PTGPSPHLAHGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYP--PGAIVSP 486
             +G        G   + G P   GA+G P S  S   P+  +G    P+ P  PGA  SP
Sbjct: 627  ASGAPGSPGSPGSPGSPGSPGSPGASGSPGSPGSPGSPSSPSGSPGSPSSPSSPGASGSP 686

Query: 487  AS 492
             S
Sbjct: 687  GS 688

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 52/157 (33%), Positives = 60/157 (38%), Gaps = 1/157 (0%)
 Frame = +1

Query: 25  SHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGA 204
           S  PGS  G   +  S SG P +PG     G  G P S  +P S  S       GS G  
Sbjct: 440 SGAPGSP-GSPGSPSSPSGAPGSPGSPGSPGASGSPGSPGSPGSPGSPGASGAPGSPGS- 497

Query: 205 PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMP-PPTGPSPHLAHGGVTAAHGVPRH 381
            P   G  GASG   +  S  S       P  P  P  P+ PS      G   A G P  
Sbjct: 498 -PGSPGSPGASGAPGSPGSPGS-------PGSPGSPGSPSSPSGSPGSPGSPGASGSPGS 549

Query: 382 HGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS 492
            G+  P S  S + P  +  G  G    PGA  SP S
Sbjct: 550 PGS--PGSPGSPSSPGSSESGSPGSPGSPGASGSPGS 584

[10][TOP]
>UniRef100_Q692G1 Major ampullate spidroin 2 (Fragment) n=1 Tax=Nephila clavipes
           RepID=Q692G1_NEPCL
          Length = 332

 Score = 62.0 bits (149), Expect = 3e-08
 Identities = 64/200 (32%), Positives = 82/200 (41%), Gaps = 23/200 (11%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGP------PYAPGVY--AGSGPGGHPASSYAPSSS 159
           Q P  YG    G    GS+AA + +GP       Y PG     G GPG      Y P S+
Sbjct: 36  QGPGGYGPGQQGPSGAGSAAAAAAAGPGQQGLGGYGPGQQGPGGYGPGQQGPGGYGPGSA 95

Query: 160 ASLPQGAHLGSR--GGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP-PQMPPPTGPS 330
           ++    A  G +  GG  P   G  G    ++A  +   G +   Q  P    P   GPS
Sbjct: 96  SAAAAAAGPGQQGPGGYGPGQQGPSGPGSASAAAAAAGPGGYGPGQQGPGGYAPGQQGPS 155

Query: 331 -PHLAHGGVTAAHGVPRHHG--ANGPASLNSAALPAYATGGGNGPA------YPPGAIVS 483
            P  A     AA   P  +G    GP+    AA  A A  GG GPA      Y PG+ V+
Sbjct: 156 GPGSAAAAAAAARAGPGGYGPAQQGPSGPGIAASAASAGPGGYGPAQQGPAGYGPGSAVA 215

Query: 484 P---ASTATFNRLSPAAAAA 534
               A +A +   S A+AAA
Sbjct: 216 ASAGAGSAGYGPGSQASAAA 235

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 56/192 (29%), Positives = 66/192 (34%), Gaps = 30/192 (15%)
 Frame = +1

Query: 7   QPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
           +P   G   PGS    ++AA    G  Y PG     GPGG+      PS + S    A  
Sbjct: 6   RPGQQGPSGPGSAAAAAAAAAGPGG--YGPGQ---QGPGGYGPGQQGPSGAGSAAAAAAA 60

Query: 187 G----SRGGAPPSVAG--GYGASGPTSATFSNESGSFQSLQPAPPQMPP---------PT 321
           G      GG  P   G  GYG        +   S S  +    P Q  P         P+
Sbjct: 61  GPGQQGLGGYGPGQQGPGGYGPGQQGPGGYGPGSASAAAAAAGPGQQGPGGYGPGQQGPS 120

Query: 322 GPSPHLAHGGVTAAHG-----------VPRHHGANGPASLNSAALPAYATGGGNGPAYP- 465
           GP    A        G            P   G +GP S  +AA  A A  GG GPA   
Sbjct: 121 GPGSASAAAAAAGPGGYGPGQQGPGGYAPGQQGPSGPGSAAAAAAAARAGPGGYGPAQQG 180

Query: 466 ---PGAIVSPAS 492
              PG   S AS
Sbjct: 181 PSGPGIAASAAS 192

[11][TOP]
>UniRef100_B0F656 Major ampullate spidroin 2 (Fragment) n=1 Tax=Latrodectus
           geometricus RepID=B0F656_9ARAC
          Length = 388

 Score = 62.0 bits (149), Expect = 3e-08
 Identities = 50/174 (28%), Positives = 64/174 (36%), Gaps = 4/174 (2%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGP----PYAPGVYAGSGPGGHPASSYAPSSSASLPQG 177
           P   G+    +  GGS   G   GP    P  PG   G GPGG  A+S A ++++S P G
Sbjct: 199 PGGSGAAAAAAATGGSGPGGYGQGPASYAPSGPGGQQGYGPGGSGAASAAAAAASSGPGG 258

Query: 178 AHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVT 357
              G+ G       G YG SGP          +  +   + P      GP    A     
Sbjct: 259 YGPGASG------PGSYGPSGP-----GGSGAAAAAAAASAPGGQQGYGPGGSGAAAAAA 307

Query: 358 AAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSP 519
           A    P    A GP    +AA  A   G G    Y PG   + A+ A      P
Sbjct: 308 AGGAGPGSQQAYGPGGSGAAAAAAAGPGSGGQQGYGPGGSAAAAAAAAAGGSGP 361

 Score = 57.4 bits (137), Expect = 6e-07
 Identities = 53/169 (31%), Positives = 69/169 (40%), Gaps = 6/169 (3%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
           P +YG   PG   G S+AA + +     PG     GPGG  A++ A ++  S P G   G
Sbjct: 166 PGAYGPSAPG---GPSAAAAAAASGGAGPGRQQSYGPGGSGAAAAAAATGGSGPGGYGQG 222

Query: 190 SRGGAPPSVAG--GYGASGPTSATFSNESGSFQSLQPAPPQMPPPT-GPSPHLAHGGVTA 360
               AP    G  GYG  G  +A+ +  + S       P    P + GPS     G   A
Sbjct: 223 PASYAPSGPGGQQGYGPGGSGAASAAAAAASSGPGGYGPGASGPGSYGPSGPGGSGAAAA 282

Query: 361 AHGVPRHHGANGPASLNSAALPAYATGG---GNGPAYPPGAIVSPASTA 498
           A       G  G     S A  A A GG   G+  AY PG   + A+ A
Sbjct: 283 AAAASAPGGQQGYGPGGSGAAAAAAAGGAGPGSQQAYGPGGSGAAAAAA 331

[12][TOP]
>UniRef100_Q9BIT8 Major ampullate spidroin 2 (Fragment) n=1 Tax=Latrodectus
           geometricus RepID=Q9BIT8_9ARAC
          Length = 399

 Score = 61.6 bits (148), Expect = 3e-08
 Identities = 53/164 (32%), Positives = 71/164 (43%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
           P SYG   PG   G ++AA + SGP    G   G GPGG  AS+ A +++     G +  
Sbjct: 3   PGSYGPSGPGGS-GAAAAAAAASGP----GGQQGYGPGGPGASAAAAAAAGGSGPGGY-- 55

Query: 190 SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
              G  PS   GYG SGP +       G   S   A       +GP      GG      
Sbjct: 56  ---GQGPS---GYGPSGPGAQQGYGPGGQGGSGAAAAAAAAAGSGP------GGYGPGAA 103

Query: 370 VPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTAT 501
            P ++G +GP    +AA  A A+G G    Y PG   + A+ A+
Sbjct: 104 GPGNYGPSGPGGSGAAASAAAASGPGGQQGYGPGGSGAAAAAAS 147

 Score = 57.0 bits (136), Expect = 8e-07
 Identities = 51/154 (33%), Positives = 63/154 (40%), Gaps = 3/154 (1%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSS-SASLPQGAHLGSRGGAPPSVAGG 225
           GGS AA + +     PG   G GPGG  A++ A ++   S P G   G  G  P    GG
Sbjct: 137 GGSGAAAAAASGGAGPGRQQGYGPGGSGAAAAAAAAXGGSGPGGYGQGPXGYGP----GG 192

Query: 226 YGASGPTSATFSNESGSFQSLQP--APPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGP 399
            G SG  +A  +  S       P  A P    P+GP    A     AA G     G    
Sbjct: 193 QGGSGGAAAAAAAASSGPXGYGPGAAGPGNYGPSGPGGSGAAAAAAAASGPGGQQGYGPG 252

Query: 400 ASLNSAALPAYATGGGNGPAYPPGAIVSPASTAT 501
            S  SAA  A   G G   AY PG   + A+ A+
Sbjct: 253 GSGASAAAAAGGAGXGRQQAYGPGGSGAAAAAAS 286

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 60/208 (28%), Positives = 75/208 (36%), Gaps = 43/208 (20%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGH-----PASSYAPS----- 153
           Q P  YG   PG+  G        SG   A    AGSGPGG+        +Y PS     
Sbjct: 57  QGPSGYGPSGPGAQQGYGPGGQGGSGAAAAAAAAAGSGPGGYGPGAAGPGNYGPSGPGGS 116

Query: 154 ------SSASLPQG-----------AHLGSRGGAPPSVAGGY--GASGPTSATFSNESGS 276
                 ++AS P G           A   + GGA P    GY  G SG  +A  +   GS
Sbjct: 117 GAAASAAAASGPGGQQGYGPGGSGAAAAAASGGAGPGRQQGYGPGGSGAAAAAAAAXGGS 176

Query: 277 FQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGV--------------PRHHGANGPASLNS 414
                    Q P   GP      GG  AA                 P ++G +GP    +
Sbjct: 177 GPG---GYGQGPXGYGPGGQGGSGGAAAAAAAASSGPXGYGPGAAGPGNYGPSGPGGSGA 233

Query: 415 AALPAYATGGGNGPAYPPGAIVSPASTA 498
           AA  A A+G G    Y PG   + A+ A
Sbjct: 234 AAAAAAASGPGGQQGYGPGGSGASAAAA 261

[13][TOP]
>UniRef100_B3N0G2 GF21726 n=1 Tax=Drosophila ananassae RepID=B3N0G2_DROAN
          Length = 947

 Score = 61.2 bits (147), Expect = 4e-08
 Identities = 59/189 (31%), Positives = 74/189 (39%), Gaps = 31/189 (16%)
 Frame = +1

Query: 10   PPS--YGSHVPGSVVGGSSAAGSFSG-PPYAPGVYAGSGPGGHPA-SSYAP-----SSSA 162
            PP   YG   P +  GG     S++G PP   G Y  +G GG P   SY P     +SSA
Sbjct: 597  PPQSQYGPPPPQNTAGGPPPPMSYAGYPPNPVGQYGQAGAGGGPPPGSYGPPPPVPTSSA 656

Query: 163  SLPQGAHLGSRGGAPPSVAGGYGASGPTSATFS---NESGSFQSLQPAPPQMPPP-TGPS 330
              P  A+  + GGA  +  G     GP ++         G++ S   AP Q PPP  G +
Sbjct: 657  QSPYQAYQTAAGGATGAPPGSSYPGGPPTSVAGPPPPPGGAYSSSTTAPSQTPPPQAGGA 716

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPA----------------- 459
               A GG     G P     NGP +  S   P    GG  G A                 
Sbjct: 717  GGGAGGGGAGGSGNP-----NGPNAQQSTPPPQGGAGGAAGGAGGAPQQYAGPPPQQQQQ 771

Query: 460  -YPPGAIVS 483
              PPG +VS
Sbjct: 772  QQPPGVVVS 780

[14][TOP]
>UniRef100_UPI0000E46467 PREDICTED: similar to MGC139263 protein n=1 Tax=Strongylocentrotus
           purpuratus RepID=UPI0000E46467
          Length = 589

 Score = 60.8 bits (146), Expect = 6e-08
 Identities = 61/191 (31%), Positives = 74/191 (38%), Gaps = 30/191 (15%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGP---GGHP---ASSYAPSSSASLP 171
           PP+ G++ P     G   AG    PP A G   G+ P   GG P   A  Y P+  A  P
Sbjct: 23  PPAPGTYPPAGGAPGYPPAGVPGYPPAAAGYPTGAAPPPAGGQPYGAAPGYPPAGGAGYP 82

Query: 172 QGAHLGSRG---------GAPPSVAGGYGASG--PTSATFSNE---SGSFQSLQPAPP-- 303
                G            GAPP  A GY  +G  P +  +  +   +  +   QP P   
Sbjct: 83  PAPGYGGYPSAQPPAPGYGAPPGGAPGYPPAGGYPAAGGYPGQQPPAAGYPGQQPPPAAG 142

Query: 304 ---QMPPPT----GPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNG-PA 459
              Q PPP     G  P  A  G   A G P+   A   A    AA  AYA GG  G P+
Sbjct: 143 YPGQQPPPAAGYPGQQPPPAGYGQPPAAGYPQQPPA---AGYPGAAPAAYAAGGAPGYPS 199

Query: 460 YPPGAIVSPAS 492
            P GA   P S
Sbjct: 200 QPAGAQPPPPS 210

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 54/157 (34%), Positives = 62/157 (39%), Gaps = 4/157 (2%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGPPYAPGVY--AGSGPGGHPASSYA-PSSSASLPQGAHL 186
           SY  + P    G   A     G P APG Y  AG  PG  PA     P ++A  P GA  
Sbjct: 2   SYPGYPPAGAPGYPPAGQP--GYPPAPGTYPPAGGAPGYPPAGVPGYPPAAAGYPTGAAP 59

Query: 187 GSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQ-PAPPQMPPPTGPSPHLAHGGVTAA 363
              GG P   A GY  +G      +   G + S Q PAP    PP G   +   GG  AA
Sbjct: 60  PPAGGQPYGAAPGYPPAGGAGYPPAPGYGGYPSAQPPAPGYGAPPGGAPGYPPAGGYPAA 119

Query: 364 HGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
            G P   G   PA+      P  A  G  G   PP A
Sbjct: 120 GGYP---GQQPPAAGYPGQQPPPA-AGYPGQQPPPAA 152

[15][TOP]
>UniRef100_B6CM01 Putative uncharacterized protein n=1 Tax=Mycobacterium liflandii
           128FXT RepID=B6CM01_9MYCO
          Length = 795

 Score = 60.8 bits (146), Expect = 6e-08
 Identities = 59/185 (31%), Positives = 77/185 (41%), Gaps = 14/185 (7%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS--- 192
           G  V     GG +A  +  GP ++ GV AG+G G  P     PS+    P  A  GS   
Sbjct: 323 GLPVSAPAAGGQAAQAAQLGPAFSRGVSAGAGLGSLP-----PSTGIGTPAAAQTGSAPA 377

Query: 193 ----RGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTG---PSPHLAHGG 351
                GG  P+     GA+  T         +      AP  M PP G   P+  +A GG
Sbjct: 378 AGLASGGVAPTGVAAAGATPVTVTPAGAGVATGSGTAHAPAMMLPPPGLGAPAAPVAAGG 437

Query: 352 VTAAHGVPRHHGANGPASLNSAALPAYATGG---GNGPA-YPPGAIVSPASTATFNRLSP 519
             AA G      A   A+ + +A PA  TGG   G+G A   P ++VS  +T      SP
Sbjct: 438 --AAGGAAAVTPAGSSATPSGSAGPAGPTGGSPAGSGAAMVVPASVVSAGTTNRSRAESP 495

Query: 520 AAAAA 534
             AAA
Sbjct: 496 ELAAA 500

[16][TOP]
>UniRef100_Q9BIT9 Major ampullate spidroin 2 (Fragment) n=1 Tax=Latrodectus
           geometricus RepID=Q9BIT9_9ARAC
          Length = 373

 Score = 60.8 bits (146), Expect = 6e-08
 Identities = 54/193 (27%), Positives = 72/193 (37%), Gaps = 27/193 (13%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSS---SASLPQ 174
           Q P  YG   PG+  G        SG   A    AGSGPGG+   +  P S   S     
Sbjct: 40  QGPSGYGPSGPGAQQGYGPGGQGGSGAAAAAAAAAGSGPGGYGPGAAGPGSYGPSGPGGS 99

Query: 175 GAHLGSRGGAPPSVAGGYGASGP--TSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG 348
           GA   +   + P    GYG  GP  ++A  +   GS        P    P+GP     +G
Sbjct: 100 GAAAAAAAASGPGGQQGYGPGGPGASAAAAAAAGGSGPGGYGQGPSGYGPSGPGAQQGYG 159

Query: 349 -------GVTAAHGV---------------PRHHGANGPASLNSAALPAYATGGGNGPAY 462
                  G  AA                  P ++G +GP    +AA  A A+G G    Y
Sbjct: 160 PGGQGGSGAAAAAAAAAGSGRGGYGPGAAGPGNYGPSGPGGSGAAASAAAASGPGGQQGY 219

Query: 463 PPGAIVSPASTAT 501
            PG   + A+ A+
Sbjct: 220 GPGGSGAAAAAAS 232

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 46/151 (30%), Positives = 62/151 (41%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGY 228
           GGS AA + +     PG   G GPGG  A++ A +++     G +     G  P   GG 
Sbjct: 222 GGSGAAAAAASGGAGPGRQQGYGPGGSGAAAAAAAAAGGSGPGGYGQGPAGYGPGGQGGS 281

Query: 229 GASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASL 408
           G +   +A  S+  G +     A P    P+GP    A     AA G     G     S 
Sbjct: 282 GGAAAAAAAASSGPGGY-GPGAAGPGNYGPSGPGGSGAAAAAAAASGPGGQQGYGPGGSG 340

Query: 409 NSAALPAYATGGGNGPAYPPGAIVSPASTAT 501
            SAA  A   G G   AY PG   + A+ A+
Sbjct: 341 ASAAAAAGGAGPGRQQAYGPGGSGAAAAAAS 371

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 62/208 (29%), Positives = 79/208 (37%), Gaps = 43/208 (20%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVG-------GSSAAGSFS----------GPPYA-PGVYAGSGPGGH 129
           Q P  YG   PG+  G       GS AA + +          GP  A PG Y  SGPGG 
Sbjct: 142 QGPSGYGPSGPGAQQGYGPGGQGGSGAAAAAAAAAGSGRGGYGPGAAGPGNYGPSGPGGS 201

Query: 130 PASSYAPSSSASLPQ---------GAHLGSRGGAPPSVAGGY--GASGPTSATFSNESGS 276
            A++ A ++S    Q          A   + GGA P    GY  G SG  +A  +   GS
Sbjct: 202 GAAASAAAASGPGGQQGYGPGGSGAAAAAASGGAGPGRQQGYGPGGSGAAAAAAAAAGGS 261

Query: 277 FQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGV--------------PRHHGANGPASLNS 414
                    Q P   GP      GG  AA                 P ++G +GP    +
Sbjct: 262 GPG---GYGQGPAGYGPGGQGGSGGAAAAAAAASSGPGGYGPGAAGPGNYGPSGPGGSGA 318

Query: 415 AALPAYATGGGNGPAYPPGAIVSPASTA 498
           AA  A A+G G    Y PG   + A+ A
Sbjct: 319 AAAAAAASGPGGQQGYGPGGSGASAAAA 346

[17][TOP]
>UniRef100_B4KC52 GI21960 n=1 Tax=Drosophila mojavensis RepID=B4KC52_DROMO
          Length = 725

 Score = 60.8 bits (146), Expect = 6e-08
 Identities = 62/192 (32%), Positives = 85/192 (44%), Gaps = 17/192 (8%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPP---YAPGVYAGSGPGGHPAS--------SYAPSS 156
           PPS     P S     S++ SFS P     AP   A SG G +PA+        S  PSS
Sbjct: 274 PPSSSYGAPSSSSSSHSSSSSFSAPSSSYSAPSPSANSG-GSYPAAPSKSYGAPSSGPSS 332

Query: 157 SASLPQ-GAHLGSRGGAPPSVAGGYGASGPTS-----ATFSNESGSFQSLQPAPPQMPPP 318
           S S P   A++G    A PS + G  +SGP+S     +  +N  GS+    PA P     
Sbjct: 333 SYSAPSPSANVGGSYPAAPSSSYGAPSSGPSSSYSAPSPSANRGGSY----PAAPS-SSY 387

Query: 319 TGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTA 498
           + PSP    GG   A     +     P+S  SA  P+ A  GG+ PA P  +  +P+  A
Sbjct: 388 SAPSPGANSGGPYPAAPSSSYGAPAAPSSSYSAPSPS-ANSGGSYPAAPTSSYSAPSPGA 446

Query: 499 TFNRLSPAAAAA 534
                 P+A ++
Sbjct: 447 NSGGPYPSAPSS 458

 Score = 59.7 bits (143), Expect = 1e-07
 Identities = 60/182 (32%), Positives = 83/182 (45%), Gaps = 10/182 (5%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAG---SFSGPPYAPGV-YAGSGPGGHPASSY--APSSSASLPQ- 174
           SY +  P + VGGS  A    S+  P   P   Y+   P  +   SY  APSSS S P  
Sbjct: 333 SYSAPSPSANVGGSYPAAPSSSYGAPSSGPSSSYSAPSPSANRGGSYPAAPSSSYSAPSP 392

Query: 175 GAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQS--LQPAPPQMPPPTGPSPHLAHG 348
           GA+ G  G  P + +  YGA    S+++S  S S  S    PA P     + PSP    G
Sbjct: 393 GANSG--GPYPAAPSSSYGAPAAPSSSYSAPSPSANSGGSYPAAPTSSY-SAPSPGANSG 449

Query: 349 GVTAAHGVPRHHGANGPASLNSAALPA-YATGGGNGPAYPPGAIVSPASTATFNRLSPAA 525
           G   +      +GA    S NS + P+  A  GG+ PA P  +  +PAS  + +  +P  
Sbjct: 450 GPYPS-APSSSYGAPSSGSSNSYSAPSPSANSGGSYPAAPSSSYGAPASAPSSSYSAPNP 508

Query: 526 AA 531
           +A
Sbjct: 509 SA 510

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 55/182 (30%), Positives = 87/182 (47%), Gaps = 12/182 (6%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGS-------GPGGH---PASSYAPSSSAS 165
           SYG+  P S   G+ +  SF   P AP    G+       G  G+   P++   PSSS  
Sbjct: 202 SYGAPAPPSSSYGAPSVSSFVPLPSAPSTNYGAPSKTQVLGSNGYTSGPSAPAPPSSSYG 261

Query: 166 LPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAH 345
            P  +    R  +PPS    YGA  P+S++ S+ S S  S   +    P P+  S     
Sbjct: 262 APSSSS-SFRPISPPS--SSYGA--PSSSSSSHSSSSSFSAPSSSYSAPSPSANSGGSYP 316

Query: 346 GGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS--TATFNRLSP 519
              + ++G P    ++GP+S  SA  P+ A  GG+ PA P  +  +P+S  +++++  SP
Sbjct: 317 AAPSKSYGAP----SSGPSSSYSAPSPS-ANVGGSYPAAPSSSYGAPSSGPSSSYSAPSP 371

Query: 520 AA 525
           +A
Sbjct: 372 SA 373

[18][TOP]
>UniRef100_UPI0001B53F45 hypothetical protein StAA4_02603 n=1 Tax=Streptomyces sp. AA4
           RepID=UPI0001B53F45
          Length = 1500

 Score = 60.5 bits (145), Expect = 8e-08
 Identities = 57/173 (32%), Positives = 69/173 (39%), Gaps = 18/173 (10%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
           P + G    G   GGS + G  +G P  PG   G G  G P    A S  A  P     G
Sbjct: 311 PGAGGPGAGGPGAGGSGSGGPGAGGPGGPGTAGGPGAAGGPGGPGAGSPGAGGPSSGGPG 370

Query: 190 SRG-GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAH 366
           + G G   +V G  GA+ P+     N  G   +  P  P    P GP+   A G    AH
Sbjct: 371 AGGPGGVGAVGGPGGAAAPSGPGGPNGPGGAGA--PGGPAAGGPGGPNGVGAPGDGFDAH 428

Query: 367 GVPR-----------HHGANG----PASLNSAALPAYATG--GGNGPAYPPGA 474
           G               HGA G     A L +A L A A G  GG+GPA  PG+
Sbjct: 429 GPASTGPGADSPGSGGHGAAGVAAAAAGLGAAGLGAAALGAAGGSGPADGPGS 481

[19][TOP]
>UniRef100_UPI0001797576 PREDICTED: collagen, type XI, alpha 2 n=1 Tax=Equus caballus
            RepID=UPI0001797576
          Length = 1627

 Score = 60.5 bits (145), Expect = 8e-08
 Identities = 56/178 (31%), Positives = 61/178 (34%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  S       H 
Sbjct: 738  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPSGKDGLPGHP 797

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 798  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 850

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 851  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 908

[20][TOP]
>UniRef100_Q636W5 Collagen-like triple helix repeat protein, glycine-rich n=1
           Tax=Bacillus cereus E33L RepID=Q636W5_BACCZ
          Length = 748

 Score = 60.5 bits (145), Expect = 8e-08
 Identities = 50/154 (32%), Positives = 65/154 (42%), Gaps = 3/154 (1%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGG 201
           G+  P    G +   G+ +GP  A G    +GP G  A   A ++ A+ PQGA   +   
Sbjct: 326 GATGPQGAQGPAGVTGA-TGPQGAQGNTGATGPQG--AQGPAGATGATGPQGAQGNTGAT 382

Query: 202 APPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPP-PTGPSPHLAHGGVTAAHGVPR 378
            P  + G  GA+G T    +  +G        P   PP PTGP  +    G T   GV  
Sbjct: 383 GPQGIQGNTGATGATGIGVTGPTG--------PSGGPPGPTGPQGNTGATGATGPQGVQG 434

Query: 379 HHGANGPASLNSAALPAYATG--GGNGPAYPPGA 474
           + GA G         PA ATG  G  GPA   GA
Sbjct: 435 NTGATGATGPQGVQGPAGATGPQGAQGPAGATGA 468

[21][TOP]
>UniRef100_C1ENE5 Collagen triple helix repeat protein n=1 Tax=Bacillus cereus
           03BB102 RepID=C1ENE5_BACC3
          Length = 1191

 Score = 60.5 bits (145), Expect = 8e-08
 Identities = 50/156 (32%), Positives = 65/156 (41%), Gaps = 5/156 (3%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGG 201
           G+  P    G + A G+ +GP  A G    +GP G  A   A ++ A+ PQGA   +   
Sbjct: 212 GATGPQGAQGPAGATGA-TGPQGAQGNTGATGPQG--AQGPAGATGATGPQGAQGNTGAT 268

Query: 202 APPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRH 381
            P  + G  GA+G T    +  +G            P PTGP  +    G T   GV  +
Sbjct: 269 GPQGIQGNTGATGATGIGVTGPTGP-----------PGPTGPQGNTGATGATGPQGVQGN 317

Query: 382 HGANGPASLNSAALPAYATG-----GGNGPAYPPGA 474
            GA G      A  PA ATG     G  GPA   GA
Sbjct: 318 TGATGATGPQGAQGPAGATGATGPQGVQGPAGATGA 353

[22][TOP]
>UniRef100_Q22260 Protein T06E4.6, confirmed by transcript evidence n=1
           Tax=Caenorhabditis elegans RepID=Q22260_CAEEL
          Length = 290

 Score = 60.5 bits (145), Expect = 8e-08
 Identities = 47/161 (29%), Positives = 59/161 (36%), Gaps = 2/161 (1%)
 Frame = +1

Query: 52  GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYG 231
           G+ + G  +GPP  PG     G  GH   +  P ++     G  +G  GG  P +    G
Sbjct: 80  GAQSNGCPAGPPGPPGQPGAQGEAGHAGEAGKPGAN-----GVTIGLTGGNGPCITCPAG 134

Query: 232 ASGPTSATFSN--ESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPAS 405
           A GP  A  +   +  S    Q A  + P P GP       G     G P H GA G   
Sbjct: 135 APGPAGAPGAPGPQGPSGAPGQDAVGEGPGPAGPQGPAGDAGAPGQAGAPGHPGAPGQGG 194

Query: 406 LNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
             S   P  A  G  GP  P G    P  +       PA A
Sbjct: 195 QRSRGTPGPA--GAPGPQGPAGGPGQPGQSGGAGAPGPAGA 233

[23][TOP]
>UniRef100_Q0Q5Z0 Tropoelastin 2 n=1 Tax=Danio rerio RepID=Q0Q5Z0_DANRE
          Length = 2054

 Score = 60.1 bits (144), Expect = 1e-07
 Identities = 56/168 (33%), Positives = 70/168 (41%), Gaps = 19/168 (11%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSGPPYAPG--VYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
            G + PG V  G    G      Y PG     G GPGG PA  Y P     +P G +    
Sbjct: 1283 GGYRPGGVPAGGYGPGGVPAGGYGPGGVPAGGYGPGGVPAGGYGP---GGVPAGGY--GP 1337

Query: 196  GGAPPSVAGGYGASGPTSATFSNESGSF----QSLQPAPP----------QMPPPTGPSP 333
            GG P   AGGYG  G  +  F   SG++    ++L+  P           Q    TGP+ 
Sbjct: 1338 GGVP---AGGYGPGGVPAGGFGPGSGAYPGGAKALKYGPGGSGGIPGLGLQGQVGTGPAG 1394

Query: 334  HLAH--GGVTAAHGVPRHHGANGPASLNSAALPAYATG-GGNGPAYPP 468
             L +  G   A +G+P   GA     L + ALP   TG GG G A  P
Sbjct: 1395 GLGYGPGSKAAKYGLPGFGGA-----LGTGALPGAGTGAGGYGGAQKP 1437

[24][TOP]
>UniRef100_Q4DW77 Mucin-associated surface protein (MASP), putative n=1
           Tax=Trypanosoma cruzi RepID=Q4DW77_TRYCR
          Length = 364

 Score = 60.1 bits (144), Expect = 1e-07
 Identities = 58/179 (32%), Positives = 73/179 (40%), Gaps = 6/179 (3%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAA-GSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
           S G   PG V GGS+A+ G  SG    PG  AGS P G      +  S  S   G   G 
Sbjct: 104 SAGGPGPGGVAGGSAASSGDSSGAVAPPGASAGSSPDGGSGGGVSSGSGGS--SGTPTGD 161

Query: 193 RGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGV 372
           +G    S AGG G  G    +   +     S  PA    PPP  P+              
Sbjct: 162 QGTGDVSSAGGGGGGGSGDGSTGGDGTGSVSSAPAAAPAPPPVSPA-------------- 207

Query: 373 PRHHGANGPA-SLNSAALPAY--ATGGGNGPAYPPGAIVSPAS--TATFNRLSPAAAAA 534
                  GPA +L S A P      G  +G A  PG+ +S  +  + T N+ +PAAAAA
Sbjct: 208 -------GPAVALPSDAPPGVDPPAGSSDGKAGSPGSNLSDTTGDSQTGNQ-TPAAAAA 258

[25][TOP]
>UniRef100_UPI0000F1F788 PREDICTED: similar to Galectin-3 (Galactose-specific lectin 3)
           (Mac-2 antigen) (IgE-binding protein) (35 kDa lectin)
           (Carbohydrate-binding protein 35) (CBP 35)
           (Laminin-binding protein) (Lectin L-29) (L-34
           galactoside-binding lectin) n=1 Tax=Danio rerio
           RepID=UPI0000F1F788
          Length = 368

 Score = 59.7 bits (143), Expect = 1e-07
 Identities = 49/162 (30%), Positives = 58/162 (35%), Gaps = 4/162 (2%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAG--SGPGGHPASSYAPSSSASLP--QGA 180
           P      PGS   G  A G F G P APG + G  + PGG+P     P      P   G 
Sbjct: 64  PQTWPSAPGSFPPGPGAPGQFPGAPAAPGQFPGAPAAPGGYPPGPGVPGQFPPNPGAPGQ 123

Query: 181 HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA 360
                G  PP   GG     P    F +  G+ Q   P  P  P P+GP           
Sbjct: 124 FPSMPGQFPP---GGAPMPYPVPGQFPSPPGAPQGPNPNVPYPPGPSGPG---------- 170

Query: 361 AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
                  +G  GP +      P Y  GGG  P  PPG+   P
Sbjct: 171 ------MYGPGGPGAFPPDGGPGY--GGGMFPPVPPGSWGQP 204

[26][TOP]
>UniRef100_Q9RKR9 Putative multi-domain regulatory protein n=1 Tax=Streptomyces
           coelicolor RepID=Q9RKR9_STRCO
          Length = 1334

 Score = 59.7 bits (143), Expect = 1e-07
 Identities = 53/154 (34%), Positives = 61/154 (39%), Gaps = 1/154 (0%)
 Frame = +1

Query: 37  GSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSV 216
           G+  G   A+G  SGP  APG   G  PG  PA   AP SS + P             S 
Sbjct: 288 GAASGPDPASGPASGPAVAPGSGGGPAPGWWPAPGTAPGSSTAPPHDT---------ASA 338

Query: 217 AGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAH-GGVTAAHGVPRHHGAN 393
           A    A GPTSA  +  +    +  P      P T  +P  A   G T A G     G  
Sbjct: 339 ADTAPAPGPTSAPGTAPAAGTAAPAPGTAGPAPGTSYAPGTAPVAGTTPAPGTAPAPGTA 398

Query: 394 GPASLNSAALPAYATGGGNGPAYPPGAIVSPAST 495
           GPA   S A P  A   G  PA  PG   +P ST
Sbjct: 399 GPARDTSYA-PGTAPVAGTTPA--PGTAPAPGST 429

[27][TOP]
>UniRef100_A3Q0W3 Putative uncharacterized protein n=1 Tax=Mycobacterium sp. JLS
           RepID=A3Q0W3_MYCSJ
          Length = 946

 Score = 59.7 bits (143), Expect = 1e-07
 Identities = 52/173 (30%), Positives = 68/173 (39%), Gaps = 17/173 (9%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           PG+ VG S   G+ + PP  P     S  G  P +  AP +    P    +     A  +
Sbjct: 193 PGAPVGASGGVGAPAAPPAVPAGVVDSSSGVTPPAPAAPPAGVVQPAAGAVPPAPRAVGA 252

Query: 214 VAGGYGASG-------PTSATFSNESGSFQSLQPAPPQ--------MPPPTGPSPHLAHG 348
            AGG G +G       P +A     +G+     PAPP           PP  P+P  A  
Sbjct: 253 PAGGSGGAGAPAAPPAPPAAVVEPAAGATPPAPPAPPAAVVEPAAGATPPAPPAPPAA-- 310

Query: 349 GVTAAHGV--PRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTAT 501
            V  A GV  P      GPA  +  A+         GP  PP A+V PA+ AT
Sbjct: 311 VVEPASGVTPPAPPAPGGPAGGSGGAVTP------PGPPAPPAAVVEPAAGAT 357

[28][TOP]
>UniRef100_Q283I7 Fibrillar collagen (Fragment) n=1 Tax=Saccoglossus kowalevskii
           RepID=Q283I7_SACKO
          Length = 454

 Score = 59.7 bits (143), Expect = 1e-07
 Identities = 53/163 (32%), Positives = 63/163 (38%), Gaps = 11/163 (6%)
 Frame = +1

Query: 52  GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-GAPPSVAGGY 228
           GS      SGP  APG    +GP G P     PS     P+GA  GSRG    P +AG  
Sbjct: 25  GSPGPAGMSGPMGAPGPSGEAGPQG-PTGDPGPSGPVG-PEGAR-GSRGPSGEPGIAGAP 81

Query: 229 GASGPTSATFSNESGSFQSLQPAPPQMPPP-----TGPSPHLAHGGVTAAHGVPRHHGAN 393
           G +G   A  +     F  LQ  P  M  P     TGP       G T   G P  +G +
Sbjct: 82  GDAGIQGARGAKGHRGFPGLQGIPGSMGVPGEDGMTGPPGPNGPRGATGPRGSPGLNGKD 141

Query: 394 GPASLNSAALPAYATG-----GGNGPAYPPGAIVSPASTATFN 507
           GP        P  + G     G +GP  PPG    P     F+
Sbjct: 142 GPMGQPGPEGPRGSRGDRGDSGTSGPPGPPGPPGPPGDAQGFD 184

[29][TOP]
>UniRef100_Q26052 Alpha collagen type 1 (Fragment) n=1 Tax=Paracentrotus lividus
           RepID=Q26052_PARLI
          Length = 730

 Score = 59.7 bits (143), Expect = 1e-07
 Identities = 56/164 (34%), Positives = 62/164 (37%), Gaps = 10/164 (6%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGS--FSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
           P + G        G S A GS    GP  APG    SGPGG   S  AP    S   GAH
Sbjct: 307 PGAQGPRGEKGDTGASGANGSPGAPGPIGAPGPAGASGPGGDTGSVGAPGPPGS--TGAH 364

Query: 184 LGSRGGA----PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG- 348
            GS G A    P   AG  G +GP              LQ  P  M  P  P      G 
Sbjct: 365 -GSTGPAGPAGPAGPAGERGETGPAGHKGHTGVPGLPGLQGTPGPMGEPGAPGEQGQQGT 423

Query: 349 -GVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
            G+  A G   + G  GP   +    P    G  GG+GP  PPG
Sbjct: 424 RGLPGARGSNGNDGPAGPRGFDGPEGPRGPRGESGGSGPPGPPG 467

[30][TOP]
>UniRef100_Q206M1 Major ampullate spidroin 2 (Fragment) n=1 Tax=Latrodectus hesperus
           RepID=Q206M1_9ARAC
          Length = 1198

 Score = 59.7 bits (143), Expect = 1e-07
 Identities = 55/176 (31%), Positives = 72/176 (40%), Gaps = 13/176 (7%)
 Frame = +1

Query: 13  PSYGS---HVPGSVVGGSSAAGSFSGPP---YAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
           P YG    + PG   G ++AA + +GP    Y PG    SGPGG  A++ A ++  S P 
Sbjct: 103 PGYGGQQGYGPGGA-GAAAAAAAAAGPGPSGYGPGTAGPSGPGGAGAAAAAAAAGGSGPG 161

Query: 175 GAHLGSRGGAPPSVAG----GYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLA 342
           G   G  G  P    G    G G SG  +A  +   G+    Q          G  P  +
Sbjct: 162 GYGQGPSGYGPSGSGGQQGFGPGGSGAAAAAAAAAGGAGPGRQ---------QGYGPGSS 212

Query: 343 HGGVTAAHGVPRHHGANGPASLNSAALPAYATGG---GNGPAYPPGAIVSPASTAT 501
                AA G P + G  G     + A  A A GG   G   AY PG   + A+ AT
Sbjct: 213 GAAAAAAAGGPGYGGQQGYGPGGAGAAAAAAAGGAGPGTQQAYGPGGSGAAAAAAT 268

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 54/194 (27%), Positives = 69/194 (35%), Gaps = 22/194 (11%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
           P YG    G   GG+ AA + +     PG     GPGG  A++ A +++   P G   G+
Sbjct: 223 PGYGGQ-QGYGPGGAGAAAAAAAGGAGPGTQQAYGPGGSGAAAAAATAAGPGPSGYGPGA 281

Query: 193 RGGAPPSVAG---------------------GYGASGPTSATFSNESGSFQSLQPAPPQM 309
            G + P  AG                     GYG SGP         GS  +   A    
Sbjct: 282 AGPSGPGGAGAAAAAAAAGGSGPGGYGQGPSGYGPSGPGGQQGYGPGGSGAAAAAAAAAG 341

Query: 310 PPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPA-YPPGAIVSP 486
               G       G   AA G P + G  G     + A  A A   G GP+ Y PGA  S 
Sbjct: 342 GAGPGRQQGYGQGSSGAAAGGPGYGGQQGYGPGGAGAAAAAAAAAGPGPSGYGPGAAGSS 401

Query: 487 ASTATFNRLSPAAA 528
                    + AAA
Sbjct: 402 GPGGAGAAAAAAAA 415

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/173 (32%), Positives = 70/173 (40%), Gaps = 11/173 (6%)
 Frame = +1

Query: 13  PSYGS---HVPGSVVGGSSAAGSFSGPP---YAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
           P YG    + PG   G ++AA + +GP    Y PG    SGPGG  A++ A ++  S P 
Sbjct: 363 PGYGGQQGYGPGGA-GAAAAAAAAAGPGPSGYGPGAAGSSGPGGAGAAAAAAAAGGSGPG 421

Query: 175 GAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGG- 351
           G       G  PSV   YG SGP         GS  +   A        G       GG 
Sbjct: 422 GY------GQGPSV---YGPSGPGGQQGYGPGGSGAAAAAAAAAGGAGPGRQQGYGPGGA 472

Query: 352 -VTAAHGVPRHHGANGPASLNSAALPAYATGG---GNGPAYPPGAIVSPASTA 498
              AA G P + G  G     + A  A A GG   G   AY PG   + A+ A
Sbjct: 473 AAAAAAGGPGYGGQQGYGPGGAGAAAAAAAGGAGPGRQQAYGPGGSGAAAAAA 525

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/174 (31%), Positives = 73/174 (41%), Gaps = 1/174 (0%)
 Frame = +1

Query: 13   PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
            P YG    G   GG+ AA + +     PG     GPGG  A++ A +++ S P G    +
Sbjct: 962  PGYGGQ-QGFGPGGAGAAAAAAAGGAGPGRQQAYGPGGSGAAAAAAAAAGSGPSGYGPSA 1020

Query: 193  RGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGV 372
             G   PS  GG GA+   +A  S   GSF        Q P   GPS              
Sbjct: 1021 AG---PSGPGGSGAAAAAAAGGSG-PGSF-------GQGPTGYGPSG------------- 1056

Query: 373  PRHHGANGPASLNSAALPAYATGGGNGPA-YPPGAIVSPASTATFNRLSPAAAA 531
            P      GP +  +AA  A +  GG GP+ Y P ++ S A++A     SP   A
Sbjct: 1057 PGGQQGYGPGASGAAAAAAASGSGGYGPSQYVPSSVASSAASAASALSSPTTHA 1110

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 54/181 (29%), Positives = 72/181 (39%), Gaps = 18/181 (9%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGP----PYAPGVYAGSGPGGHPASSYAPSSSASLPQG 177
           P   G+    +  GGS   G   GP    P  PG   G GPGG  A++ A +++     G
Sbjct: 403 PGGAGAAAAAAAAGGSGPGGYGQGPSVYGPSGPGGQQGYGPGGSGAAAAAAAAAGGAGPG 462

Query: 178 AHLG-SRGGAPPSVAG---------GYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGP 327
              G   GGA  + A          GYG  G  +A  +   G+    Q A    P  +G 
Sbjct: 463 RQQGYGPGGAAAAAAAGGPGYGGQQGYGPGGAGAAAAAAAGGAGPGRQQA--YGPGGSGA 520

Query: 328 SPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP----AYPPGAIVSPAST 495
           +   A G   + +G     GA GP    +AA    A  GG GP    AY PG   + A+ 
Sbjct: 521 AAAAAAGSGPSGYG----PGAAGPGGAGAAAA---AAAGGAGPGRQQAYGPGGSGAAAAA 573

Query: 496 A 498
           A
Sbjct: 574 A 574

[31][TOP]
>UniRef100_UPI000023F34A hypothetical protein FG00916.1 n=1 Tax=Gibberella zeae PH-1
            RepID=UPI000023F34A
          Length = 1758

 Score = 59.3 bits (142), Expect = 2e-07
 Identities = 57/192 (29%), Positives = 77/192 (40%), Gaps = 26/192 (13%)
 Frame = +1

Query: 22   GSHVPG---SVVGGSSAAGSFSGP--PYAPGVYAGSGPGGHPASSYAPSSSASL-PQGAH 183
            GS  P    +V GG S     + P  PY  G  +       P SS +P+S  S  P   +
Sbjct: 1532 GSDTPAGFDTVYGGGSVGFGGTTPMSPYNRGAAS-------PFSSTSPTSPFSYSPTSPN 1584

Query: 184  LGSRGGAPPSVAGGYGASGPTSATFSNESGSFQ----SLQPAPPQMPPPTGPSPHLAHGG 351
            +G    +P    GG G  GPTS +FS  S SF      L+P  P  P  +  SP  +   
Sbjct: 1585 MGYSPTSPLIDGGGMGRYGPTSPSFSPSSPSFSPTSPMLRPTSPASPSYSPTSPSYS--- 1641

Query: 352  VTAAHGVPRHHGANGPASLNSAALPAYA---------------TGGGNGPAYPPGA-IVS 483
               +   PRH+    PA  NS   P+Y+                GG   P+Y P +   S
Sbjct: 1642 -PTSPSSPRHYSPTSPAQFNSPTSPSYSPASPNYSPTSPNVHGAGGPTSPSYSPASPSWS 1700

Query: 484  PASTATFNRLSP 519
            P S   ++  SP
Sbjct: 1701 PTSPEAYSPTSP 1712

[32][TOP]
>UniRef100_A1CEV2 Extracellular threonine rich protein, putative n=1 Tax=Aspergillus
           clavatus RepID=A1CEV2_ASPCL
          Length = 893

 Score = 59.3 bits (142), Expect = 2e-07
 Identities = 61/182 (33%), Positives = 73/182 (40%), Gaps = 6/182 (3%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAG--SFSGPPYAPGVYAGSGPGGH---PASSYAPSSSAS 165
           A  PP  G+  P +  G   A G    +GPP   G  A +GP G    PA++  P ++  
Sbjct: 205 ATGPP--GATGPPAATGPPGATGPPGATGPPPETGPPAATGPPGATGPPAATGPPGATG- 261

Query: 166 LPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPP-PTGPSPHLA 342
            P GA        PP+  G  GA+GP +AT     G   +  P     PP  TGP P   
Sbjct: 262 -PPGATGPPPETGPPAATGPPGATGPPAAT-----GPPAATGPPGATGPPGATGPPPET- 314

Query: 343 HGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPA 522
             G  AA G P   G  G         P  ATG   G   PPGA   PA T       P 
Sbjct: 315 --GPPAATGPPAATGPPGATGPPPETGPPAATGPPPGATGPPGATGPPAPTGPGAPTCPP 372

Query: 523 AA 528
           AA
Sbjct: 373 AA 374

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 59/175 (33%), Positives = 70/175 (40%), Gaps = 3/175 (1%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGH---PASSYAPSSSASLPQGAH 183
           P  G+  PG+   G  AA   +GPP   G  A +GP G    PA++  P ++   P GA 
Sbjct: 178 PPAGTGPPGAT--GPPAA---TGPPPETGPPAATGPPGATGPPAATGPPGATG--PPGAT 230

Query: 184 LGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAA 363
                  PP+  G  GA+GP +AT            P     P  TGP P     G  AA
Sbjct: 231 GPPPETGPPAATGPPGATGPPAATG----------PPGATGPPGATGPPPET---GPPAA 277

Query: 364 HGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
            G P   GA GP     AA    A  G  G   PPGA   P  T       P AA
Sbjct: 278 TGPP---GATGP----PAATGPPAATGPPGATGPPGATGPPPETGPPAATGPPAA 325

[33][TOP]
>UniRef100_Q0RG05 Putative serine/threonine-protein kinase n=1 Tax=Frankia alni
           ACN14a RepID=Q0RG05_FRAAA
          Length = 933

 Score = 58.9 bits (141), Expect = 2e-07
 Identities = 50/158 (31%), Positives = 65/158 (41%), Gaps = 2/158 (1%)
 Frame = +1

Query: 7   QPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
           QPP  G+   GSV G   AAG  S P    G    SG G   A   AP  +A+       
Sbjct: 340 QPP--GTAGAGSVTGSEGAAGR-SAPGRFTGSAGASGSGRSVAPHAAPGGAATDAPAGSF 396

Query: 187 GSRGGA--PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA 360
           G R     PP  AGG   +G   AT  + +    S  P P + PPP  P P     G  +
Sbjct: 397 GGRPATAVPPPTAGGGPPAGAMPATQMSPA-PLASPPPVPSRTPPPGNPPPGGLPPGAVS 455

Query: 361 AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
              V     +  P++ +  ++P  A G G+  A P GA
Sbjct: 456 PGAVSGSVPSAAPSASSPGSVPPRAQGPGDAYAPPGGA 493

[34][TOP]
>UniRef100_C7IJQ8 Collagen triple helix repeat protein n=1 Tax=Clostridium
           papyrosolvens DSM 2782 RepID=C7IJQ8_9CLOT
          Length = 466

 Score = 58.9 bits (141), Expect = 2e-07
 Identities = 53/157 (33%), Positives = 68/157 (43%), Gaps = 10/157 (6%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHP-ASSYAPSSSASLPQGAHLGSRGGAPP 210
           P    G + A G+ +GP  A G    +GP G   A+    ++ A+ P GA  G+ G  P 
Sbjct: 176 PTGATGATGATGA-TGPAGATGATGATGPAGATGATGPVGATGATGPAGA-TGATG--PA 231

Query: 211 SVAGGYGASGPTSAT-FSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHG 387
              G  GA+GP  AT  +  +G+  +  PA       TGP+      G T A G     G
Sbjct: 232 GATGATGATGPAGATGATGPAGATGATGPAGA-----TGPTGPAGATGATGATGATGATG 286

Query: 388 ANGPASLNSAALPAYATG--------GGNGPAYPPGA 474
           A GPA    A  PA ATG        G  GPA   GA
Sbjct: 287 ATGPAGATGATGPAGATGATGATGATGATGPAGATGA 323

[35][TOP]
>UniRef100_Q692F8 Major ampullate spidroin 2 (Fragment) n=1 Tax=Nephila clavipes
           RepID=Q692F8_NEPCL
          Length = 296

 Score = 58.9 bits (141), Expect = 2e-07
 Identities = 63/202 (31%), Positives = 82/202 (40%), Gaps = 27/202 (13%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPP------YAPGVYA--GSGPGGHPASSYAPSSSAS 165
           P  YG    G    GS+AA + +GP       Y PG     G GPG      Y P S+++
Sbjct: 1   PGGYGPGQQGPSGAGSAAAAAAAGPGQQGLGGYGPGQQGPGGYGPGQQGPGGYGPGSASA 60

Query: 166 LPQGAHLGSR--GGAPPSVAG--GYGASGPTSATFSNESGSFQSLQPAP----PQMPPPT 321
               A  G +  GG  P   G  G G++   +A  +   G +   Q  P    P    P+
Sbjct: 61  AAAAAGPGQQGPGGYGPGQQGPSGPGSASAAAAAAAAGPGGYGPGQQGPGGYAPGQQGPS 120

Query: 322 GPSPHLAHGGVTAAHG--VPRHHGANGPASLNSAALPAYATGGGNGPA------YPPGAI 477
           GP    A     A  G   P   G +GP     AA  A A  GG GPA      Y PG+ 
Sbjct: 121 GPGSAAAAAAAAAGPGGYGPAQQGPSGP---GIAASAASAGPGGYGPAQQGPAGYGPGSA 177

Query: 478 VSP---ASTATFNRLSPAAAAA 534
           V+    A +A +   S A+AAA
Sbjct: 178 VAASAGAGSAGYGPGSQASAAA 199

[36][TOP]
>UniRef100_B4Q0C4 GE15779 n=1 Tax=Drosophila yakuba RepID=B4Q0C4_DROYA
          Length = 920

 Score = 58.9 bits (141), Expect = 2e-07
 Identities = 55/173 (31%), Positives = 64/173 (36%), Gaps = 17/173 (9%)
 Frame = +1

Query: 4    QQPP------SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSY-----AP 150
            QQPP       YG   P +  GG    G ++G P  PG Y  S  GG P  S       P
Sbjct: 567  QQPPPGPPQSQYGPPPPQNSAGGPPPMG-YAGYPPNPGQYGQSAAGGGPPPSGYWPPPPP 625

Query: 151  SSSASLPQGAH------LGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMP 312
            +SSA  P  A+        + GGA       Y    PTS               AP Q P
Sbjct: 626  TSSAQSPYQAYQQQQQQAAAAGGAGAPPGSSYPGGPPTSGAAPPPPPGGAYSTTAPSQTP 685

Query: 313  PPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPG 471
            PP       A GG    +  P     NGP +  S   P    GGG GP+ P G
Sbjct: 686  PPQ------AGGGAGGGNTNP-----NGPNAQQSTPPPQGGAGGGAGPSGPGG 727

[37][TOP]
>UniRef100_UPI00005A264B PREDICTED: similar to collagen, type XI, alpha 2 isoform 2
            preproprotein isoform 2 n=1 Tax=Canis lupus familiaris
            RepID=UPI00005A264B
          Length = 1647

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 758  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 817

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 818  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 870

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 871  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGLGLKGNEGPAGPPGPAGSP 928

[38][TOP]
>UniRef100_Q5TJG3 Collagen type XI alpha 2 (Fragment) n=2 Tax=Canis lupus familiaris
           RepID=Q5TJG3_CANFA
          Length = 1009

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
           G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 120 GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 179

Query: 187 GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
           G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 180 GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 232

Query: 337 LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
               G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 233 AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGLGLKGNEGPAGPPGPAGSP 290

[39][TOP]
>UniRef100_UPI00004BBB4F PREDICTED: similar to collagen, type XI, alpha 2 isoform 1
            preproprotein isoform 1 n=1 Tax=Canis lupus familiaris
            RepID=UPI00004BBB4F
          Length = 1733

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 844  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 903

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 904  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 956

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 957  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGLGLKGNEGPAGPPGPAGSP 1014

[40][TOP]
>UniRef100_UPI0000EB2E40 Collagen type XI alpha 2 n=1 Tax=Canis lupus familiaris
            RepID=UPI0000EB2E40
          Length = 1734

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 845  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 904

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 905  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 957

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 958  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGLGLKGNEGPAGPPGPAGSP 1015

[41][TOP]
>UniRef100_UPI0000EB2C0B Collagen type XI alpha 2 n=1 Tax=Canis lupus familiaris
            RepID=UPI0000EB2C0B
          Length = 1813

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 907  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 966

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 967  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 1019

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 1020 AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGLGLKGNEGPAGPPGPAGSP 1077

[42][TOP]
>UniRef100_UPI0000EB2C0A Collagen type XI alpha 2 n=1 Tax=Canis lupus familiaris
            RepID=UPI0000EB2C0A
          Length = 1615

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 744  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 803

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 804  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 856

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 857  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGLGLKGNEGPAGPPGPAGSP 914

[43][TOP]
>UniRef100_UPI000179D0F0 Proline/arginine-rich protein. n=1 Tax=Bos taurus RepID=UPI000179D0F0
          Length = 1659

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 770  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 829

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 830  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 882

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 883  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 940

[44][TOP]
>UniRef100_UPI000179D0EF Proline/arginine-rich protein. n=1 Tax=Bos taurus RepID=UPI000179D0EF
          Length = 1737

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 848  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 907

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 908  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 960

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 961  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 1018

[45][TOP]
>UniRef100_A4RRF2 Predicted protein n=1 Tax=Ostreococcus lucimarinus CCE9901
           RepID=A4RRF2_OSTLU
          Length = 1000

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 53/175 (30%), Positives = 74/175 (42%), Gaps = 2/175 (1%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
           P ++G+   G   G SS  G F  P  AP  + G+     P++  AP+SSA  P G   G
Sbjct: 237 PSAFGAPSGGGAFG-SSPTGGFGAPAAAPSPFGGAAT---PSAFGAPASSA--PSGGLFG 290

Query: 190 SRGGAPPSVAGGYGASGPTSATFS--NESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAA 363
                  S  GG+GAS P S+ F   + + +F +  P P         SP  A      A
Sbjct: 291 -------STTGGFGAS-PASSAFGAPSTTSAFGASAPTPGAFGATPSASPFGAAPSTPGA 342

Query: 364 HGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
            G P             A+ PA+   G  G A  P A  +P+ST  F   +PA++
Sbjct: 343 FGAP-------------ASTPAFGASGAFGAAPTPSAFGAPSSTPAFG-AAPASS 383

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 48/163 (29%), Positives = 67/163 (41%), Gaps = 4/163 (2%)
 Frame = +1

Query: 55  SSAAGSFSGP----PYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAG 222
           +++AG F  P    P+      GS  GG    ++  S++ + P GA  G   GA  S  G
Sbjct: 170 ATSAGGFGAPAATSPFGGTTGGGSAFGGASGGAFGASATPASPFGAPSGGAFGASTSTPG 229

Query: 223 GYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPA 402
           G+GAS   SA  +   G      P      P   PSP    GG       P   GA  PA
Sbjct: 230 GFGASAAPSAFGAPSGGGAFGSSPTGGFGAPAAAPSP---FGGA----ATPSAFGA--PA 280

Query: 403 SLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAA 531
           S   +     +T GG G +    A  +P++T+ F   +P   A
Sbjct: 281 SSAPSGGLFGSTTGGFGASPASSAFGAPSTTSAFGASAPTPGA 323

[46][TOP]
>UniRef100_Q5TJG0 Collagen type XI alpha 2 (Fragment) n=1 Tax=Canis lupus familiaris
            RepID=Q5TJG0_CANFA
          Length = 1596

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 758  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 817

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 818  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 870

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 871  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGLGLKGNEGPAGPPGPAGSP 928

[47][TOP]
>UniRef100_A5D9K7 Collagen type XI alpha 2 n=1 Tax=Sus scrofa RepID=A5D9K7_PIG
          Length = 1651

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 820

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 821  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 873

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 874  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 931

[48][TOP]
>UniRef100_Q5U0Y6 LD20133p n=1 Tax=Drosophila melanogaster RepID=Q5U0Y6_DROME
          Length = 840

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 53/155 (34%), Positives = 58/155 (37%), Gaps = 13/155 (8%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGVYAGSGPGGHPASSY----APSSSASLP---------QGAHLG 189
           G + AA   SG  Y P   AG GP   P S Y     P+SSA  P         Q A  G
Sbjct: 509 GPAGAATGASGHGYQPNAGAGQGP---PPSGYWPPPPPTSSAQSPYQAYQQQQQQQAAAG 565

Query: 190 SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
              GAPP     Y    PTS               AP Q PPP G       GG    + 
Sbjct: 566 GGAGAPPG--SSYPGGPPTSGAAPPPPPGGAYSTTAPSQTPPPQGG------GGAGGGNN 617

Query: 370 VPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
            P     NGP +  S   P    GGG GP+ P GA
Sbjct: 618 NP-----NGPNAQQSTPPPQGGAGGGAGPSGPGGA 647

[49][TOP]
>UniRef100_B0CPK9 Predicted protein n=1 Tax=Laccaria bicolor S238N-H82
           RepID=B0CPK9_LACBS
          Length = 584

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 59/193 (30%), Positives = 76/193 (39%), Gaps = 18/193 (9%)
 Frame = +1

Query: 10  PPSY---GSHVPGSVVG--GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
           PP Y   G + P S++   G S  G+  GP   P    GS   G P    A SS   +  
Sbjct: 189 PPVYSASGPNAPSSILAAPGPSPTGAQGGPAQDPQTPTGSNTPGGPLPPPASSSFPPVNG 248

Query: 175 GAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGV 354
            A  G++GG  P  +   G++ PT     N+ G      PA   +PP  G +P  A G  
Sbjct: 249 PAPTGAQGGPAPYSSPPTGSNAPTDP--ENQGGPV--APPASLTLPPVNGSAPTGAQGDP 304

Query: 355 TAAHGVP---------RHHGANGPASLNSAALPAYA---TGGGNGPA-YPPGAIVSPAST 495
           T     P         +  GA  P   +S+  P      TGG  GPA Y P    S A T
Sbjct: 305 TPNSPPPSGGDAPTDSKESGARPPPPASSSLPPVNGPAPTGGQGGPAPYSPPHTDSNAPT 364

Query: 496 ATFNRLSPAAAAA 534
              N+  P A  A
Sbjct: 365 ELKNQGGPVAPPA 377

[50][TOP]
>UniRef100_Q32S24 Collagen alpha-2(XI) chain n=1 Tax=Bos taurus RepID=COBA2_BOVIN
          Length = 1736

 Score = 58.5 bits (140), Expect = 3e-07
 Identities = 55/178 (30%), Positives = 60/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 847  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 906

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G +  
Sbjct: 907  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLTGT 959

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 960  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 1017

[51][TOP]
>UniRef100_Q72Z02 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           ATCC 10987 RepID=Q72Z02_BACC1
          Length = 1321

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 47/154 (30%), Positives = 62/154 (40%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  V G +   G   GPP   G    +GPGG P+ S   ++ A+   GA   +       
Sbjct: 192 PTGVTGPTGITGPSGGPPGPTGPTGATGPGGGPSGS-TGATGATGNTGATGSTGVTGSTG 250

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G++GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 251 VTGATGSTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 310

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G     G  GP  +  A  P  ATG  G  GP
Sbjct: 311 IQGATGATGDQGPQGIQGAIGPQGATGATGDQGP 344

[52][TOP]
>UniRef100_A1UCV0 Putative uncharacterized protein n=2 Tax=Mycobacterium
           RepID=A1UCV0_MYCSK
          Length = 816

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 51/161 (31%), Positives = 67/161 (41%), Gaps = 14/161 (8%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGVYAGSG-PGGHPAS---SYAPSSSASLPQGAHLGSRGGAPPSV 216
           GG    GS  G P  PG   GSG  G +P S      P ++  LP    + + GGA P  
Sbjct: 288 GGGGGLGSGGGVPKMPGGLGGSGLSGSNPLSGGVGQMPGAAGWLPNSGAVSAAGGASPLS 347

Query: 217 AGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGG-----VTAAHG---- 369
           +    A     AT +   G   S QP     P P  PSP L+ GG     V+AA G    
Sbjct: 348 S----AFNQGMATTAGMGGGIPSTQP-----PAPASPSPALSAGGGHAAPVSAAPGGGVS 398

Query: 370 -VPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
                 G   PA+ ++      ++GGG     PPG++  PA
Sbjct: 399 PAAAQPGMVAPAAPSALTGTGVSSGGGAPMMLPPGSMGPPA 439

[53][TOP]
>UniRef100_C3CQG2 Collagen triple helix repeat domain protein n=2 Tax=Bacillus
           thuringiensis RepID=C3CQG2_BACTU
          Length = 1225

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 49/154 (31%), Positives = 64/154 (41%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   ++ A+   GA  GS G     
Sbjct: 177 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGS-TGATGATGSTGA-TGSTG----- 229

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G +GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 230 VTGATGTTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGITGEQGIQGVQG 289

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G+    G  GP  +  A  P  ATG  G  GP
Sbjct: 290 IQGIMGATGDQGPQGIQGAIGPQGATGATGDQGP 323

[54][TOP]
>UniRef100_Q868B4 Protein ZK643.8, partially confirmed by transcript evidence n=1
           Tax=Caenorhabditis elegans RepID=Q868B4_CAEEL
          Length = 774

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 46/148 (31%), Positives = 55/148 (37%), Gaps = 3/148 (2%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG- 189
           PS G    G   GGSS  G ++  P   G YA SG GG    +   SS      G   G 
Sbjct: 206 PSGGGGCGG---GGSSGGGGYASAPSGGGGYATSGGGGSGGYATGGSSGGGYSSGGSSGG 262

Query: 190 --SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAA 363
             S GG      GG G  G +     +  G   S   A P  PPP  P P  A   V++ 
Sbjct: 263 GYSTGGGGGYAGGGGGGGGSSGGYAGSSGGGGYSAPAAAPPPPPPPPPPP--APAPVSSG 320

Query: 364 HGVPRHHGANGPASLNSAALPAYATGGG 447
            G        G  S  S    A ++ GG
Sbjct: 321 GGYSEQSSGGGGGSSYSGGGEASSSSGG 348

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/176 (30%), Positives = 72/176 (40%), Gaps = 3/176 (1%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
           S G     S  GG S+ G  S    + G Y+G   G   +SS + SS      G   G+ 
Sbjct: 365 SSGGDSSSSSGGGYSSGGDSSSSSSSSGGYSG---GSDSSSSSSSSSGGYSSGGGDAGAS 421

Query: 196 GGAPPSVAGGYGASGPT--SATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
            G   S AGGY  S  +   A+    SG      PAP   P  +G     +     AA  
Sbjct: 422 SGGESSSAGGYSGSSSSGGEASSGGYSGGSSEPAPAPEAAPASSGGYSGGSEAAPEAAPA 481

Query: 370 VPRHHGANGPASLNSAALPAYATGGGNG-PAYPPGAIVSPASTATFNRLSPAAAAA 534
            P   G +G  +   AA PA  +GG +G  A P  A  +P+   + +  +P AA A
Sbjct: 482 AP-SGGYSGSEAAPEAA-PAAPSGGYSGSEAAPEAAPAAPSGGYSGSEAAPEAAPA 535

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 48/175 (27%), Positives = 68/175 (38%), Gaps = 17/175 (9%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAA---------GSFSGPPYAPGVYAGSGPGGHPASSYAPS 153
           ++  P      P     GS AA         G +SG   AP     +  GG+  S  AP 
Sbjct: 508 SEAAPEAAPAAPSGGYSGSEAAPEAAPAAPSGGYSGSEAAPEAAPAAPSGGYSGSEAAPE 567

Query: 154 SSASLPQGAHLGSRGGAPPSV-----AGGYGASG---PTSATFSNESGSFQSLQPAPPQM 309
           ++ + P G + GS   AP +      +GGY   G    ++A  SN SG  ++   APP  
Sbjct: 568 AAPAAPSGGYSGSESSAPAAPEPAPSSGGYSGGGGDAGSAAGGSNYSGGGETAPAAPPPA 627

Query: 310 PPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
           P P                    + GA G    ++AA PA + GG +G     GA
Sbjct: 628 PEP-----------------AQTYSGAGGE---SAAAAPAPSGGGYSGSGGAGGA 662

[55][TOP]
>UniRef100_Q22256 Protein T06E4.4, confirmed by transcript evidence n=1
           Tax=Caenorhabditis elegans RepID=Q22256_CAEEL
          Length = 290

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 46/161 (28%), Positives = 57/161 (35%), Gaps = 2/161 (1%)
 Frame = +1

Query: 52  GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYG 231
           G+ + G  +GPP  PG     G  GH   +  P ++     G  +G  GG  P +    G
Sbjct: 80  GAQSNGCPAGPPGPPGQPGAQGEAGHAGEAGKPGAN-----GVTIGLTGGNGPCITCPAG 134

Query: 232 ASGPTSATFSN--ESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPAS 405
           A GP  A  +   +  S    Q A    P P GP       G     G P H GA G   
Sbjct: 135 APGPAGAPGAPGPQGPSGAPGQDAVGGGPGPAGPQGPAGDAGAPGQAGAPGHPGAPGQGG 194

Query: 406 LNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
             S   P     G  GP  P G    P  +       PA A
Sbjct: 195 QRSRGTP--GPSGAPGPQGPAGGPGQPGQSGGAGAPGPAGA 233

[56][TOP]
>UniRef100_Q20739 Protein F54B11.2, partially confirmed by transcript evidence n=1
           Tax=Caenorhabditis elegans RepID=Q20739_CAEEL
          Length = 304

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 54/169 (31%), Positives = 65/169 (38%), Gaps = 10/169 (5%)
 Frame = +1

Query: 52  GSSAAGSFSG--PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSV--- 216
           G+S+ G   G   P  PGV    G  G P    AP +  +  +GA +      PP     
Sbjct: 95  GASSGGQCEGCCNPGPPGVAGNPGKPGKPGKPGAPGNPGAPGKGAAVPCEAKTPPPCKPC 154

Query: 217 -AGGYGASGPTS----ATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRH 381
            AG  G  GP      A    E+GS     PA P  P P GPS      G   A G P  
Sbjct: 155 PAGPPGPPGPDGPAGPAGPDGEAGS-----PAAPSPPGPPGPSGPAGPAGNDGAAGTP-- 207

Query: 382 HGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
            G +GPA  ++   PA       GPA PPG    P         +P AA
Sbjct: 208 -GPDGPAGESTYPEPA-----APGPAGPPGPAGPPGPDGASPTAAPGAA 250

[57][TOP]
>UniRef100_C5DX72 ZYRO0F02728p n=1 Tax=Zygosaccharomyces rouxii CBS 732
            RepID=C5DX72_ZYGRC
          Length = 2302

 Score = 58.2 bits (139), Expect = 4e-07
 Identities = 56/163 (34%), Positives = 74/163 (45%), Gaps = 2/163 (1%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFS-GPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            PPS  S    S  G SSA G+ S G P AP   +GSG  G   +S A  +S+S   G+  
Sbjct: 792  PPSTSSSA-SSTSGSSSAPGTSSTGSPSAP---SGSGNSGASGASGASGASSSEASGSGN 847

Query: 187  GSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG-GVTAA 363
             +  GA    +G  GASG +SA  S  SG+  +   AP      +G S   A G G +A 
Sbjct: 848  SATSGA-SGASGASGASGASSAPSSGASGASGASSSAPTS---TSGASSSEASGSGNSAT 903

Query: 364  HGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS 492
             G     GA+G +S  S+     +    + P    GA  S AS
Sbjct: 904  SGASGASGASGASSAPSSGASGASGASSSAPTSTSGASSSEAS 946

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 48/170 (28%), Positives = 71/170 (41%), Gaps = 5/170 (2%)
 Frame = +1

Query: 40   SVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVA 219
            S   G+S A   SG   A    +    G   ASS AP+S++        GS   A    +
Sbjct: 848  SATSGASGASGASGASGASSAPSSGASGASGASSSAPTSTSGASSSEASGSGNSATSGAS 907

Query: 220  GGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGP----SPHLAHGGVTAAHGVPRHHG 387
            G  GASG +SA  S  SG+  +   AP      +      S + A  G+ +A   P    
Sbjct: 908  GASGASGASSAPSSGASGASGASSSAPTSTSGASSSEASGSGNSATSGIVSASSAP---S 964

Query: 388  ANGPASLNSAALPAYATG-GGNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
             NG ++ + A+  + A+G   + P    GA  S AS +  +  S A  A+
Sbjct: 965  GNGNSATSGASGASGASGASSSAPTSTSGASSSEASGSGNSATSGATGAS 1014

[58][TOP]
>UniRef100_UPI00005029C8 Procollagen, type XI, alpha 2. n=1 Tax=Rattus norvegicus
            RepID=UPI00005029C8
          Length = 1629

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 740  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 799

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 800  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 851

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 852  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 910

[59][TOP]
>UniRef100_UPI00005029C7 Procollagen, type XI, alpha 2. n=1 Tax=Rattus norvegicus
            RepID=UPI00005029C7
          Length = 1650

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 820

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 821  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 872

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 873  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 931

[60][TOP]
>UniRef100_UPI00005029C6 Procollagen, type XI, alpha 2. n=1 Tax=Rattus norvegicus
            RepID=UPI00005029C6
          Length = 1655

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 766  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 825

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 826  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 877

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 878  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 936

[61][TOP]
>UniRef100_UPI00005029C5 Procollagen, type XI, alpha 2. n=1 Tax=Rattus norvegicus
            RepID=UPI00005029C5
          Length = 1689

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 800  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 859

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 860  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 911

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 912  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 970

[62][TOP]
>UniRef100_UPI00005029C4 Procollagen, type XI, alpha 2. n=1 Tax=Rattus norvegicus
            RepID=UPI00005029C4
          Length = 1710

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 821  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 880

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 881  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 932

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 933  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 991

[63][TOP]
>UniRef100_UPI00005029C3 Procollagen, type XI, alpha 2. n=1 Tax=Rattus norvegicus
            RepID=UPI00005029C3
          Length = 1715

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 826  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 885

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 886  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 937

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 938  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 996

[64][TOP]
>UniRef100_UPI00005029C2 Procollagen, type XI, alpha 2. n=1 Tax=Rattus norvegicus
            RepID=UPI00005029C2
          Length = 1736

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 847  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 906

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 907  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 958

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 959  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 1017

[65][TOP]
>UniRef100_Q6MGB2 Procollagen, type XI, alpha 2 n=1 Tax=Rattus norvegicus
            RepID=Q6MGB2_RAT
          Length = 1617

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 55/179 (30%), Positives = 61/179 (34%), Gaps = 24/179 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P  +       H 
Sbjct: 746  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPAGKDGLPGHP 805

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSF-QSLQPAPPQMPPPTGPSP 333
            G RG            PP V G  GA+G        ESG   +   P PP  P   G   
Sbjct: 806  GQRGEVGFQGKTGPPGPPGVVGPQGAAG--------ESGPMGERGHPGPPGPPGEQGLPG 857

Query: 334  HLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                 G     G P   G +GPA L        LP  A G    G  GPA PPG   SP
Sbjct: 858  TAGKDGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPAGPPGPAGSP 916

[66][TOP]
>UniRef100_C2XI26 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           F65185 RepID=C2XI26_BACCE
          Length = 1309

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 45/154 (29%), Positives = 61/154 (39%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGSTGATGAT-----GNTGATGST--G 247

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G++GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 248 VTGATGSTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 307

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G     G  GP  +  A  P  ATG  G  GP
Sbjct: 308 IQGATGATGDQGPQGIQGAIGPQGATGATGDQGP 341

[67][TOP]
>UniRef100_C2P552 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           172560W RepID=C2P552_BACCE
          Length = 1325

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 45/154 (29%), Positives = 61/154 (39%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGSTGATGAT-----GNTGATGST--G 247

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G++GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 248 VTGATGSTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 307

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G     G  GP  +  A  P  ATG  G  GP
Sbjct: 308 IQGAKGATGDQGPQGIQGAIGPQGATGATGDQGP 341

[68][TOP]
>UniRef100_B5UNT5 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           AH1134 RepID=B5UNT5_BACCE
          Length = 1309

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 45/154 (29%), Positives = 61/154 (39%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGSTGATGAT-----GNTGATGST--G 247

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G++GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 248 VTGATGSTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 307

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G     G  GP  +  A  P  ATG  G  GP
Sbjct: 308 IQGAKGATGDQGPQGIQGAIGPQGATGATGDQGP 341

[69][TOP]
>UniRef100_Q7YXA3 Protein H06A10.2, partially confirmed by transcript evidence n=1
           Tax=Caenorhabditis elegans RepID=Q7YXA3_CAEEL
          Length = 305

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 51/161 (31%), Positives = 59/161 (36%), Gaps = 1/161 (0%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGVYAGSGPGGH-PASSYAPSSSASLPQGAHLGSRGGAPPSVAGG 225
           GGS       G P APG    +G G   P  +  P      P G         PP   G 
Sbjct: 115 GGSPGKPGKPGKPGAPGAPGAAGKGASAPCEAKTPPPCQPCPAG---------PPGPPGP 165

Query: 226 YGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPAS 405
            G +GP       E+GS     PA P  P P GP       G   A G P   G +GPA 
Sbjct: 166 DGPAGPAGP--DGEAGS-----PAAPSPPGPPGPPGPAGPAGNDGAAGTP---GPDGPAG 215

Query: 406 LNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
            ++   PA     G GPA PPG    P         +P AA
Sbjct: 216 ESTYPEPA-----GPGPAGPPGPAGPPGPDGASPTAAPGAA 251

[70][TOP]
>UniRef100_A8X4T9 C. briggsae CBR-COL-44 protein n=1 Tax=Caenorhabditis briggsae
           RepID=A8X4T9_CAEBR
          Length = 301

 Score = 57.8 bits (138), Expect = 5e-07
 Identities = 51/171 (29%), Positives = 65/171 (38%), Gaps = 7/171 (4%)
 Frame = +1

Query: 37  GSVVGGSSAAGSFSG--PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPP 210
           G    G++A G  SG   P  PGV    G  G P    AP S  +  +GA +      PP
Sbjct: 87  GGADAGAAAGGGCSGCCNPGPPGVAGNPGKPGKPGKPGAPGSPGAPGKGAAVPCEAKNPP 146

Query: 211 SV----AGGYGASGPTSATFSNESG-SFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVP 375
                 AG  G  GP     + E+G + ++  PA P  P P GP     + G     G P
Sbjct: 147 PCQPCPAGPPGPPGPDGP--AGEAGPAGEAGAPAAPSPPGPPGPPGPPGNPGADGGAGTP 204

Query: 376 RHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
              GA G ++        Y    G GPA PPG    P         +P  A
Sbjct: 205 GPDGAGGEST--------YPEPAGPGPAGPPGPPGPPGPDGASPTAAPGEA 247

[71][TOP]
>UniRef100_A0JM00 Collagen, type 1, alpha 2 n=1 Tax=Xenopus (Silurana) tropicalis
            RepID=A0JM00_XENTR
          Length = 1354

 Score = 57.4 bits (137), Expect = 6e-07
 Identities = 60/179 (33%), Positives = 72/179 (40%), Gaps = 22/179 (12%)
 Frame = +1

Query: 1    AQQPPSYGSHVPGSVVGGSSAAGSFSGPPY---------------APGVYAGSGPGGHPA 135
            AQ PP    +       G + A  F G P                APG +  +GP G   
Sbjct: 521  AQGPPGLAGNTGDKGEQGPAGAPGFQGLPGPGGAAGELGKHGERGAPGDFGPAGPAGPRG 580

Query: 136  SSYAPSSS-ASLPQGAHLGSRG--GAPPS--VAGGYGASGPTSATFSNESGSFQSLQPAP 300
               AP  S A+ P GA LG RG  GAP S    G  GA+G   A   +  G     + A 
Sbjct: 581  ERGAPGESGAAGPLGA-LGPRGPTGAPGSDGAKGEPGAAGLNGALGPSGPGGIPGERGAA 639

Query: 301  PQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
              +P P G      H G    +G P   GA GPA  + A  PA A G  G +GPA P G
Sbjct: 640  G-VPGPKGEKGDAGHSG---EYGNPGRDGARGPAGASGAPGPAGAAGDRGESGPAGPSG 694

[72][TOP]
>UniRef100_B7IKZ3 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           G9842 RepID=B7IKZ3_BACC2
          Length = 951

 Score = 57.4 bits (137), Expect = 6e-07
 Identities = 49/154 (31%), Positives = 63/154 (40%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   ++ A+   GA  GS G     
Sbjct: 192 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGS-TGATGATGDTGA-TGSTG----- 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G +GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 245 VTGATGTTGPTGSTGAQGLQGIQGIQGSIGPTGPEGPQGIQGIPGPTGITGEQGIQGVQG 304

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             GV    G  GP  +  A  P   TG  G  GP
Sbjct: 305 IQGVTGATGDQGPQGIQGAIGPQGVTGATGDQGP 338

[73][TOP]
>UniRef100_C2YXV7 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           AH1271 RepID=C2YXV7_BACCE
          Length = 924

 Score = 57.4 bits (137), Expect = 6e-07
 Identities = 44/154 (28%), Positives = 60/154 (38%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 192 PTGITGPTGITGPSGGPPGPTGATGATGPGGGPSGSTGATGAT-----GNTGATGST--G 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           + G  G +GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 245 ITGAAGTTGPTGSTGAQGLQGIQGVQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 304

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             GV    G  GP  +  A  P   TG  G  GP
Sbjct: 305 IQGVTGATGDQGPQGIQGAIGPQGVTGATGDQGP 338

[74][TOP]
>UniRef100_A8WXW9 Putative uncharacterized protein n=1 Tax=Caenorhabditis briggsae
            RepID=A8WXW9_CAEBR
          Length = 1075

 Score = 57.4 bits (137), Expect = 6e-07
 Identities = 45/153 (29%), Positives = 64/153 (41%), Gaps = 1/153 (0%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAP-P 210
            P      S   G  SG  Y+ G  +  G GG  +  Y+ S+    P  A   +   AP P
Sbjct: 612  PSGGYASSGGGGGSSGGGYSSGGGSSGGGGGGSSGGYSQSAPPPPPAPAPAPAPAPAPAP 671

Query: 211  SVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGA 390
            + +GGY +SG  S+      G +   Q APP   P + P+P  A  G  A+ G     G 
Sbjct: 672  APSGGYASSGGGSS--GGGGGGYS--QSAPPPPAPESAPAPAPAPSGGYASSGGGESSG- 726

Query: 391  NGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
             G +S +S    +   GGG G  Y   +   P+
Sbjct: 727  -GGSSASSGGYASSGGGGGGGGGYASASAPPPS 758

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 47/164 (28%), Positives = 62/164 (37%)
 Frame = +1

Query: 1    AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
            A  P   G +  G   GG S+ G   G   AP       P   P  + AP+ S+      
Sbjct: 834  APAPAPSGGYSSGGGGGGGSSGGYSGGSAPAPASEPAPAPAPEPEPAPAPAPSS------ 887

Query: 181  HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA 360
              G   G   S  GG G+SG +S  +S   GS     P PP   P   P+P  A  G  +
Sbjct: 888  --GGYSGGSSSGGGGGGSSGGSSGGYS--GGSAAPPPPPPPAPEPAPAPAPAPAPSGGYS 943

Query: 361  AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS 492
            + G     G       +  + PA A+     PA  P    +PAS
Sbjct: 944  SEG---GGGGGSSGGYSGGSAPAPASEPAPAPAPEPEPAPAPAS 984

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 48/170 (28%), Positives = 60/170 (35%), Gaps = 7/170 (4%)
 Frame = +1

Query: 19   YGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG 198
            Y S   GS  GG       + PP AP   +   P   P+  YA S       G    S G
Sbjct: 677  YASSGGGSSGGGGGGYSQSAPPPPAPE--SAPAPAPAPSGGYASSGGGESSGGGSSASSG 734

Query: 199  GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA------ 360
            G   S  GG G  G  SA+    SG       A    PPP  P+P  A     A      
Sbjct: 735  GYASSGGGGGGGGGYASASAPPPSGGGGGGYSASAAPPPPPPPAPEPAPAPAPAPAPSRG 794

Query: 361  -AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFN 507
             + G     G++G  S  SA  PA        P   P    +PA +  ++
Sbjct: 795  YSSGGGGGGGSSGGYSGGSAPAPASEPAPAPAPEQAPAPAPAPAPSGGYS 844

[75][TOP]
>UniRef100_P46804 Spidroin-2 (Fragment) n=1 Tax=Nephila clavipes RepID=SPD2_NEPCL
          Length = 627

 Score = 57.4 bits (137), Expect = 6e-07
 Identities = 58/187 (31%), Positives = 71/187 (37%), Gaps = 10/187 (5%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGPP------YAPGVYA--GSGPGGHPASSYAPSSS 159
           Q P  YG    G    GS+AA + +GP       Y PG     G GPG      Y P S+
Sbjct: 293 QGPGGYGPGQQGPSGAGSAAAAAAAGPGQQGLGGYGPGQQGPGGYGPGQQGPGGYGPGSA 352

Query: 160 ASLPQGAHLGSRGGAPPSVAGGYGAS--GPTSATFSNESGSFQSLQPAPPQMPPPTGPSP 333
           ++    A  G +G       GGYG    GP+        GS  +   A    P   GP  
Sbjct: 353 SAAAAAAGPGQQG------PGGYGPGQQGPSGP------GSASAAAAAAAAGPGGYGPGQ 400

Query: 334 HLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRL 513
               GG       P   G +GP S ++AA  A A  GG GP        +P         
Sbjct: 401 Q-GPGGYA-----PGQQGPSGPGSASAAAAAAAAGPGGYGPGQQGPGGYAPGQQGPSGPG 454

Query: 514 SPAAAAA 534
           S AAAAA
Sbjct: 455 SAAAAAA 461

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 63/207 (30%), Positives = 83/207 (40%), Gaps = 31/207 (14%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGPP------YAPGVYAGSGPGGHPASSYAPSSSAS 165
           Q P  YG    G    GS+AA + +GP       Y PG    SGPG    S+ A +++A+
Sbjct: 228 QGPGGYGPGQQGLSGPGSAAAAAAAGPGQQGPGGYGPGQQGPSGPG----SAAAAAAAAA 283

Query: 166 LPQGAHLGSR--GGAPPSVAGGYGASGPTSATFSNES----GSFQSLQPAP----PQMPP 315
            P G   G +  GG  P   G  GA    +A  +       G +   Q  P    P    
Sbjct: 284 GPGGYGPGQQGPGGYGPGQQGPSGAGSAAAAAAAGPGQQGLGGYGPGQQGPGGYGPGQQG 343

Query: 316 PTGPSPHLAHGGVTAA---------HGVPRHHGANGPASLNSAALPAYATGGGNGP---- 456
           P G  P  A     AA         +G P   G +GP S ++AA  A A  GG GP    
Sbjct: 344 PGGYGPGSASAAAAAAGPGQQGPGGYG-PGQQGPSGPGSASAAAAAAAAGPGGYGPGQQG 402

Query: 457 --AYPPGAIVSPASTATFNRLSPAAAA 531
              Y PG    P+   + +  + AAAA
Sbjct: 403 PGGYAPGQ-QGPSGPGSASAAAAAAAA 428

[76][TOP]
>UniRef100_UPI00015B5FE6 PREDICTED: similar to CG15920-PA n=1 Tax=Nasonia vitripennis
           RepID=UPI00015B5FE6
          Length = 752

 Score = 57.0 bits (136), Expect = 8e-07
 Identities = 51/169 (30%), Positives = 65/169 (38%), Gaps = 7/169 (4%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSG--PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
           PP+ G    G   GG+     F G  P  +PG + G G GG P+ SY P S      G+ 
Sbjct: 261 PPAAGGGGFGGNAGGNGGGNGFGGGRPSGSPGGFGGQGGGGRPSDSYLPPSG-----GSG 315

Query: 184 LGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAA 363
            G   G  P   GG+G  G   A   N  G   + +P+    PP  G        G    
Sbjct: 316 FGGGNGRQP---GGFGQQGGNGAGQQNGGGG--AGRPSSSYGPPSNGNGG--GFSGQNGG 368

Query: 364 HGVPRHHGANGPAS---LNSAALPAYATGGGN--GPAYPPGAIVSPAST 495
            G P   G  G A     +S   PA  +G GN  G    P +   P S+
Sbjct: 369 RGSPSSGGGFGGAGGSPSSSYGPPAGGSGFGNNGGAGGRPSSSYGPPSS 417

[77][TOP]
>UniRef100_Q1D888 General secretory system II protein E, N-terminal domain protein n=1
            Tax=Myxococcus xanthus DK 1622 RepID=Q1D888_MYXXD
          Length = 2136

 Score = 57.0 bits (136), Expect = 8e-07
 Identities = 67/199 (33%), Positives = 80/199 (40%), Gaps = 21/199 (10%)
 Frame = +1

Query: 1    AQQPPSYGSHVP-GSVVGG--SSAAGSFSGPPYAPGVYAGSGPG--GHPASSYAPSSSAS 165
            A+ PP+ G  +P G V  G   S   S  G P  PG      PG  G P SS      A 
Sbjct: 803  ARPPPAPGLPMPHGPVPPGMMGSRPPSSPGLPAVPGGRGAKPPGMTGAPPSSVHRGPQAP 862

Query: 166  LPQGAHLGSRGGAPPSVAGGYGASGP----------TSATFSNESGSFQSLQPAPPQMPP 315
             P G       GAP + A G GA  P          T A F+   G   +  P PP   P
Sbjct: 863  GPHGTKPPGMTGAPFATAHG-GADAPVPPGTKPPGMTGAPFATAHGGADA--PVPPGTMP 919

Query: 316  P--TGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP----AYPPGAI 477
            P  TG  P  AHG   A    P   GA  P ++  AA PA A GG + P    A PPG +
Sbjct: 920  PGMTGAPPATAHGVPDA----PVPPGAVPPGTM--AAQPAAAHGGPDTPVSPGAVPPGMM 973

Query: 478  VSPASTATFNRLSPAAAAA 534
             +P  +      +P A  A
Sbjct: 974  GAPPPSVHGGPHAPVALGA 992

[78][TOP]
>UniRef100_A4T238 Putative uncharacterized protein n=1 Tax=Mycobacterium gilvum
           PYR-GCK RepID=A4T238_MYCGI
          Length = 811

 Score = 57.0 bits (136), Expect = 8e-07
 Identities = 58/165 (35%), Positives = 68/165 (41%), Gaps = 14/165 (8%)
 Frame = +1

Query: 37  GSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSA--SLPQ-GAHLGSRGGAP 207
           G +VGG   +G   G P  PG   G G GG P     P  S    +P  G+ L S GG P
Sbjct: 286 GGMVGGGMGSG---GAPKLPG---GLGSGGLPGMGSNPLGSGVDQMPSAGSGLPSAGGVP 339

Query: 208 PSVAGGYGASGPTSATFSNES--GSFQSLQPAPPQMPPPTGPSPHLAHGG------VTAA 363
                G GA  P  A     S  G+     PA P  P P  PSP L+ G        TA 
Sbjct: 340 ---GDGSGAGSPAVAFSQGMSTGGAIGGGMPAAP-APAPASPSPALSAGAQAAPVPATAG 395

Query: 364 HGVP---RHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
            GVP      G   PA+  + A     TGGG     PPG++  PA
Sbjct: 396 GGVPPAAAQSGLVAPAAPPTGA--GMGTGGGAPMMLPPGSMGPPA 438

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 62/185 (33%), Positives = 76/185 (41%), Gaps = 11/185 (5%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAP---SSSASLPQGAH 183
           PS G  VPG   G  S A +FS      G+  G   GG   ++ AP   S S +L  GA 
Sbjct: 333 PSAGG-VPGDGSGAGSPAVAFS-----QGMSTGGAIGGGMPAAPAPAPASPSPALSAGAQ 386

Query: 184 LG-----SRGGAPPSVAGG---YGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHL 339
                  + GG PP+ A       A+ PT A      G+   L P    M PP GP P  
Sbjct: 387 AAPVPATAGGGVPPAAAQSGLVAPAAPPTGAGMGTGGGAPMMLPPG--SMGPPAGPVPPP 444

Query: 340 AHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSP 519
           A      A G     G+N P    SAA PA A G   GP   P ++V+   TA       
Sbjct: 445 AATVPAGALGA----GSNAP----SAAPPAAAAGA--GPTLIPASVVAAGQTAAARERRE 494

Query: 520 AAAAA 534
           +A AA
Sbjct: 495 SADAA 499

[79][TOP]
>UniRef100_A8I4M6 Predicted protein n=1 Tax=Chlamydomonas reinhardtii
           RepID=A8I4M6_CHLRE
          Length = 647

 Score = 57.0 bits (136), Expect = 8e-07
 Identities = 60/189 (31%), Positives = 69/189 (36%), Gaps = 41/189 (21%)
 Frame = +1

Query: 13  PSYGSHVPGS------VVGGSSAAG------SFSGPPYAPGVYAGSGPGG---------- 126
           PSYGS +PGS      V+G  + A       SF G     G++ G G GG          
Sbjct: 175 PSYGSSLPGSGGTAAVVLGAGTGANVPAPSSSFLGGSLLSGLFGGRGGGGGGSAAGGAAG 234

Query: 127 -------------------HPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGASGPTS 249
                               PA    P+SSA L       S G       GG      T 
Sbjct: 235 AAVTPDSSVHGPDSYYGVPEPAFGSLPTSSALLRARGLNASAGSILTKATGGL----KTQ 290

Query: 250 ATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPA 429
              S  SG+F SL P PP  PPP   +   A GG   A GVP   GA   A L+ AA   
Sbjct: 291 MKKSTSSGNFGSLWPQPPPPPPPAAAAQRNAGGG---AAGVPL--GAGPGAGLSGAA--- 342

Query: 430 YATGGGNGP 456
              GGG  P
Sbjct: 343 ---GGGRAP 348

[80][TOP]
>UniRef100_Q9N2N7 Fibrillar collagen alpha 120 and 140 chains (Fragment) n=1
           Tax=Hemicentrotus pulcherrimus RepID=Q9N2N7_HEMPU
          Length = 632

 Score = 57.0 bits (136), Expect = 8e-07
 Identities = 54/164 (32%), Positives = 61/164 (37%), Gaps = 10/164 (6%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGS--FSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
           P   G+       G S A GS    GP  APG    SGP G   S+ AP      P GA 
Sbjct: 207 PGPQGARGEKGDTGASGANGSPGAPGPIGAPGAAGASGPRGETGSTGAPGPQG--PTGAR 264

Query: 184 LGSRGGAPPS----VAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG- 348
            GS G A PS     AG  G +GP              LQ  P  M  P  P      G 
Sbjct: 265 -GSTGPAGPSGPAGPAGERGETGPAGHKGHPGVSGLPGLQGTPGPMGEPGAPGEQGQQGT 323

Query: 349 -GVTAAHGVPRHHGANGPASLNSAALP--AYATGGGNGPAYPPG 471
            G+  A G   + G  GP   +    P      GG +GP  PPG
Sbjct: 324 RGLPGARGSNGNDGPAGPRGFDGPEGPRGPRGEGGSSGPPGPPG 367

[81][TOP]
>UniRef100_Q5QN39 Os01g0201600 protein n=2 Tax=Oryza sativa Japonica Group
           RepID=Q5QN39_ORYSJ
          Length = 301

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 45/136 (33%), Positives = 55/136 (40%), Gaps = 3/136 (2%)
 Frame = +1

Query: 67  GSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGASGPT 246
           G  + P   PG + G G  G   S     S  +LP  +H    GGA PS  GGYGAS P 
Sbjct: 67  GGTTTPTPIPGHHGGGGSSGTTPSHGGGPSGGALPSPSH----GGAAPSHGGGYGASPPV 122

Query: 247 SATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGG---VTAAHGVPRHHGANGPASLNSA 417
           +    +  G +    PAP       G SP    GG    T +HG   + G   PA+    
Sbjct: 123 T---PSPGGGYGGGSPAPSHGGGAYGSSPSTPSGGGSSPTPSHGGGAYGGGGAPAT---- 175

Query: 418 ALPAYATGGGNGPAYP 465
             PA   G G  P  P
Sbjct: 176 --PASHDGHGLIPTTP 189

[82][TOP]
>UniRef100_UPI0000DB7202 PREDICTED: hypothetical protein n=1 Tax=Apis mellifera
           RepID=UPI0000DB7202
          Length = 344

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 55/173 (31%), Positives = 74/173 (42%), Gaps = 19/173 (10%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSY-APSSSASLPQGAH-L 186
           P  GS++P S   G+   G   GP    G  +G G GG P+SSY APSS+   P   +  
Sbjct: 29  PISGSYLPPSTSYGTPNLGG-GGPSSTYGAPSGGG-GGRPSSSYGAPSSTYGAPSSTYGA 86

Query: 187 GSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQ---MPPPTGPSPHLAHG--- 348
            S GG  PS    YGA        S+  G+  S   AP      P   G  P  ++G   
Sbjct: 87  PSNGGGRPS--STYGAPSNGGGRPSSSYGAPSSSYGAPSSTYGAPSNGGGRPSSSYGAPS 144

Query: 349 -----------GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA 474
                      G++ ++G P   G  G  S+ S++  A   GGG GP+   GA
Sbjct: 145 FGGGGGFGGGNGLSTSYGAPSRGGGGGGGSI-SSSYGAPTGGGGGGPSTTYGA 196

[83][TOP]
>UniRef100_UPI0001AE7353 UPI0001AE7353 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE7353
          Length = 1629

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 740  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 799

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 800  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 852

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 853  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 910

[84][TOP]
>UniRef100_UPI0001AE734E UPI0001AE734E related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE734E
          Length = 1655

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 766  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 825

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 826  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 878

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 879  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 936

[85][TOP]
>UniRef100_UPI0001AE734D UPI0001AE734D related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE734D
          Length = 1676

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 787  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 846

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 847  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 899

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 900  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 957

[86][TOP]
>UniRef100_UPI0001AE734C UPI0001AE734C related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE734C
          Length = 1689

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 800  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 859

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 860  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 912

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 913  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 970

[87][TOP]
>UniRef100_UPI0001AE734B UPI0001AE734B related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE734B
          Length = 1710

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 821  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 880

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 881  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 933

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 934  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 991

[88][TOP]
>UniRef100_UPI0001AE734A UPI0001AE734A related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE734A
          Length = 1715

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 826  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 885

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 886  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 938

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 939  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 996

[89][TOP]
>UniRef100_UPI0001AE7349 UPI0001AE7349 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE7349
          Length = 1736

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 847  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 906

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 907  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 959

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 960  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 1017

[90][TOP]
>UniRef100_UPI0001AE71E7 UPI0001AE71E7 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE71E7
          Length = 1655

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 766  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 825

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 826  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 878

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 879  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 936

[91][TOP]
>UniRef100_UPI0001AE71E6 UPI0001AE71E6 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE71E6
          Length = 1676

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 787  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 846

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 847  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 899

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 900  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 957

[92][TOP]
>UniRef100_UPI0001AE71E5 UPI0001AE71E5 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE71E5
          Length = 1715

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 826  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 885

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 886  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 938

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 939  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 996

[93][TOP]
>UniRef100_UPI0001AE71E4 UPI0001AE71E4 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE71E4
          Length = 1736

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 847  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 906

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 907  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 959

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 960  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 1017

[94][TOP]
>UniRef100_UPI000173A163 UPI000173A163 related cluster n=1 Tax=Homo sapiens
            RepID=UPI000173A163
          Length = 1623

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 734  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 793

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 794  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 846

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 847  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 904

[95][TOP]
>UniRef100_Q3TP88 Putative uncharacterized protein (Fragment) n=1 Tax=Mus musculus
           RepID=Q3TP88_MOUSE
          Length = 959

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 49/171 (28%), Positives = 61/171 (35%), Gaps = 17/171 (9%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGG 201
           GS  P    G     G  +G   APG    SGPGG P    A        +    G RG 
Sbjct: 200 GSRGPSGAPGPDGNKGE-AGAVGAPGSAGASGPGGLPGERGAAGIPGGKGEKGETGLRGD 258

Query: 202 APPS-------VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPH 336
              +       + G  GA GP  A+    E+G+     PA P+  P       P GP+  
Sbjct: 259 TGNTGRDGARGIPGAVGAPGPAGASGDRGEAGAAGPSGPAGPRGSPGERGEVGPAGPNGF 318

Query: 337 LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPGAIVS 483
               G     G     G  GP   N    P  + G  G +GP  PPG + S
Sbjct: 319 AGPAGAAGQPGAKEEKGTKGPKGENGIVGPTGSVGAAGPSGPNGPPGPVGS 369

[96][TOP]
>UniRef100_B7H785 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           B4264 RepID=B7H785_BACC4
          Length = 1297

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 48/154 (31%), Positives = 63/154 (40%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   ++ A+   GA  GS G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGS-TGATGATGSTGA-TGSTG----- 247

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-PAPPQ----------MPPPTGPSPHLAHGGVTA 360
           V G  G +GPT +T +      Q +Q P  P           +P PTG +      GV  
Sbjct: 248 VTGATGTTGPTGSTGAQGLQGIQGIQGPIGPTGSEGPQGIQGIPGPTGVTGEQGIQGVQG 307

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G+    G  GP  +  A  P  ATG  G  GP
Sbjct: 308 IQGITGATGDQGPQGIQGAIGPQGATGATGDQGP 341

[97][TOP]
>UniRef100_C8RSP5 Ferredoxin, 4Fe-4S (Fragment) n=1 Tax=Corynebacterium jeikeium ATCC
            43734 RepID=C8RSP5_CORJE
          Length = 1064

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/183 (29%), Positives = 76/183 (41%), Gaps = 5/183 (2%)
 Frame = +1

Query: 1    AQQPPSYGSHV----PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASL 168
            A   PS G+      PG+    ++ +   +G P APG  A     G PA+  APS+ A  
Sbjct: 845  APSAPSAGTPAAPAAPGAPAAPAAPSAPSAGAPAAPGAPAAPAAPGAPAAPSAPSAGAPA 904

Query: 169  PQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGP-SPHLAH 345
              GA         P+  G   A G  +A  +  +   +  Q AP     P  P +P    
Sbjct: 905  APGA---------PAAPGAPAAPGAPAAPGAPAAPKSEDTQEAPKTSGAPAAPGAPSAPS 955

Query: 346  GGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAA 525
             G  AA G P       PA+  + A P+  + G   PA  PGA  +P++ A     +PAA
Sbjct: 956  AGAPAAPGAPA-----APAAPGAPAAPSAPSAG--APA-APGAPSAPSAGAPAAPGAPAA 1007

Query: 526  AAA 534
             AA
Sbjct: 1008 PAA 1010

[98][TOP]
>UniRef100_C3DRK5 Collagen triple helix repeat domain protein n=1 Tax=Bacillus
           thuringiensis serovar sotto str. T04001
           RepID=C3DRK5_BACTS
          Length = 951

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 49/154 (31%), Positives = 63/154 (40%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   ++ A+   GA  GS G     
Sbjct: 192 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGS-TGATGATGDTGA-TGSTG----- 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G +GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 245 VTGETGTTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGITGEQGIQGVQG 304

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             GV    G  GP  +     P  ATG  G  GP
Sbjct: 305 IQGVTGATGDQGPQGIQGTIGPQGATGATGDQGP 338

[99][TOP]
>UniRef100_Q8WSZ3 Dragline silk protein spidroin 2 (Fragment) n=1 Tax=Nephila clavata
           RepID=Q8WSZ3_NEPCV
          Length = 301

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 57/190 (30%), Positives = 73/190 (38%), Gaps = 25/190 (13%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGP-PYAPGV---------------YAGSGPGGHPA 135
           Q P  YG   P    G S+AA + +GP  Y PG                Y  SGP G P 
Sbjct: 30  QGPGGYGPSGPSGPGGASAAAAAAAGPGGYGPGQQGPGQQGPGQQGPAGYGPSGPSG-PG 88

Query: 136 SSYAPSSSASLPQGAHLGSRG----GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP- 300
            + A +++A+ P G  LG +G    G       GYG SG      S   G+  +    P 
Sbjct: 89  GAAAAAAAAAGPGGYGLGQQGPGQQGPGQQGPAGYGPSG-----LSGPGGAAAAAAAGPG 143

Query: 301 ---PQMPPPTGPSPHLAHGGVTAAHGV-PRHHGANGPASLNSAALPAYATGGGNGPAYPP 468
              P    P+GP    A        G  P   G +GP S  +AA  A   G G G   P 
Sbjct: 144 GYGPGQQRPSGPGGAAAAAAAAGPGGYGPSQRGPSGPGSAAAAAAGAGPGGYGPGQKGPS 203

Query: 469 GAIVSPASTA 498
           G   + A+ A
Sbjct: 204 GPGSAAAAAA 213

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 58/183 (31%), Positives = 69/183 (37%), Gaps = 6/183 (3%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGPP-YAPGVYAGS--GPGGHPASSYAPSSSASLPQ 174
           Q P  YG   P    G ++AA + +GP  Y  G       GPG    + Y PS       
Sbjct: 74  QGPAGYGPSGPSGPGGAAAAAAAAAGPGGYGLGQQGPGQQGPGQQGPAGYGPSG------ 127

Query: 175 GAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPP--QMPPPTGPS-PHLAH 345
              L   GGA  + A G G  GP     S   G+  +   A P    P   GPS P  A 
Sbjct: 128 ---LSGPGGAAAAAAAGPGGYGPGQQRPSGPGGAAAAAAAAGPGGYGPSQRGPSGPGSAA 184

Query: 346 GGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAA 525
                A       G  GP+   SAA  A A  GG GP+    A   P+        S AA
Sbjct: 185 AAAAGAGPGGYGPGQKGPSGPGSAAAAAAAGPGGYGPSQQGPARYGPSGPG-----SAAA 239

Query: 526 AAA 534
           AAA
Sbjct: 240 AAA 242

[100][TOP]
>UniRef100_Q4E3X8 Mucin-associated surface protein (MASP), putative n=1
           Tax=Trypanosoma cruzi RepID=Q4E3X8_TRYCR
          Length = 325

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 44/134 (32%), Positives = 62/134 (46%), Gaps = 3/134 (2%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGY 228
           GGS+ A   SG P  PG   GSG G    S+ + +S A +P+G    S GG+     GG 
Sbjct: 80  GGSAGATGASGGP-GPGDAGGSG-GTQKNSNSSETSDAGVPRGGD--SDGGSAAGEKGGS 135

Query: 229 GASGPTSATFSNESGSFQS---LQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGP 399
           G  G  ++T  + +GS  S     PAP    PP+ P         T A GV    G++G 
Sbjct: 136 GGGGSGTSTDGHGTGSVSSGLSAVPAPAPAAPPSAPGHSGGPSAPTDAPGVDPSAGSSGG 195

Query: 400 ASLNSAALPAYATG 441
            ++   + P+  TG
Sbjct: 196 TAVPPGSNPSNTTG 209

[101][TOP]
>UniRef100_B9PJ47 Putative uncharacterized protein n=1 Tax=Toxoplasma gondii GT1
            RepID=B9PJ47_TOXGO
          Length = 994

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 56/185 (30%), Positives = 69/185 (37%), Gaps = 11/185 (5%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSG--PGGHPASSYAPSSSASLPQGAH 183
            PP+  +  PG+  G   AA +   PP  P   A  G  PG  PA++    +    P G  
Sbjct: 630  PPAAAA--PGAPPGTPPAAAAPGAPPGTPPAAAAPGAPPGTPPATAATSGAPPGTPPGTP 687

Query: 184  LGSRG---GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPT----GPSPHLA 342
              + G   G+PP+ A   GA   +    +  SG       APP  PP T    G SP   
Sbjct: 688  AAASGAPPGSPPATATAAGAPPGSPPATAAASG-------APPGSPPATATASGASPGTP 740

Query: 343  HGGVTAAHGVPRHHGANGPASLNSA--ALPAYATGGGNGPAYPPGAIVSPASTATFNRLS 516
             G   AA G P       PA    A    P    G     A PP A  +P   A    L 
Sbjct: 741  PGTPAAASGAPPGTPPGTPAEALGAVPGAPVATPGAAPTTATPPAAAGTPGVVAGGPGLV 800

Query: 517  PAAAA 531
            PA  A
Sbjct: 801  PAVVA 805

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 54/183 (29%), Positives = 71/183 (38%), Gaps = 21/183 (11%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSG-PGGHPASSYAPSSSASLPQGAHLGSRGGAPP 210
            P  V GG +AA   +  P A  V   +G P G P ++ A  ++ S   GA   +  GAPP
Sbjct: 555  PNLVAGGIAAAIPAAAFPQATMVAGSNGLPQGVPVAAPAVPTAPSAAAGAPAAAASGAPP 614

Query: 211  SVAGGYGASG------PTSATFSNESGS-FQSLQPAPPQMPPPTGPSPHLAHG---GVTA 360
                   ASG      P +A      G+   +  P  P   PP   +P    G      A
Sbjct: 615  GTPSAAAASGAPPGTPPAAAAPGAPPGTPPAAAAPGAPPGTPPAAAAPGAPPGTPPATAA 674

Query: 361  AHGVPRHHGANGPASLNSA---ALPAYATGGGNGPAYPPGAIV-------SPASTATFNR 510
              G P       PA+ + A   + PA AT  G  P  PP           SP +TAT + 
Sbjct: 675  TSGAPPGTPPGTPAAASGAPPGSPPATATAAGAPPGSPPATAAASGAPPGSPPATATASG 734

Query: 511  LSP 519
             SP
Sbjct: 735  ASP 737

[102][TOP]
>UniRef100_B7PZI3 Smarca4, putative n=1 Tax=Ixodes scapularis RepID=B7PZI3_IXOSC
          Length = 434

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 44/126 (34%), Positives = 48/126 (38%), Gaps = 3/126 (2%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGS-FSGPPYAPGVYAGSGP--GGHPASSYAPSSSASLPQGAHLGS 192
           G    G   GGSS A S   GPP  P  + G  P  G  P   YAP      P       
Sbjct: 37  GKPPAGGGSGGSSGAPSPIMGPPPVPQQHMGMPPEGGAPPHHGYAPQPHMG-PGAVQPQV 95

Query: 193 RGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGV 372
            GG PP     YG   P           +Q  QP PPQ   P G  P L H GV  +H  
Sbjct: 96  YGGPPPQQQPPYGGGAP-----------YQQQQPYPPQQGVPPGGGPPLQHQGVPPSH-- 142

Query: 373 PRHHGA 390
             HHG+
Sbjct: 143 -PHHGS 147

[103][TOP]
>UniRef100_B3NY10 GG17589 n=1 Tax=Drosophila erecta RepID=B3NY10_DROER
          Length = 2024

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 60/181 (33%), Positives = 78/181 (43%), Gaps = 14/181 (7%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGP-PYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAP- 207
           P +    SS AG+ +G    +  V +G G G    S+ A S+  S  QGA  G+ GG+  
Sbjct: 162 PATPKSSSSGAGASTGSGTSSAAVTSGPGSGSTKVSTAASSAQQSGLQGA-TGAGGGSSS 220

Query: 208 -PSVAGGYGASGPTSA-TFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGG----VTAAHG 369
            P    G GA G T+A   S   G+  S     P +PP +   PH   G      TA  G
Sbjct: 221 TPGTQTGSGAGGATAARPVSAMGGTVSSTAGGAPSIPPISTMPPHTVPGSTNTTTTALAG 280

Query: 370 VPRHHGANGP----ASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATFNRLSPAAAA 531
                GA GP    A+ N+AAL A     G   AYP  PG     +S+      +  AAA
Sbjct: 281 -----GAGGPGAAAANPNAAALMASLLSAGQTGAYPGAPGQTAVNSSSLLDGSTAAVAAA 335

Query: 532 A 534
           A
Sbjct: 336 A 336

[104][TOP]
>UniRef100_Q5JP94 Collagen type XI alpha 2 n=4 Tax=Homo sapiens RepID=Q5JP94_HUMAN
          Length = 1650

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 820

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 821  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 873

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 874  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 931

[105][TOP]
>UniRef100_C9J8W5 Putative uncharacterized protein ENSP00000410951 n=1 Tax=Homo sapiens
            RepID=C9J8W5_HUMAN
          Length = 1693

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 820

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 821  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 873

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 874  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 931

[106][TOP]
>UniRef100_B0UXE9 Collagen, type XI, alpha 2 n=1 Tax=Homo sapiens RepID=B0UXE9_HUMAN
          Length = 1650

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 820

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 821  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 873

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 874  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 931

[107][TOP]
>UniRef100_A6NI54 Putative uncharacterized protein ENSP00000363829 n=2 Tax=Homo sapiens
            RepID=A6NI54_HUMAN
          Length = 1693

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 820

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 821  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 873

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 874  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 931

[108][TOP]
>UniRef100_Q9UMD9-2 Isoform 2 of Collagen alpha-1(XVII) chain n=1 Tax=Homo sapiens
            RepID=Q9UMD9-2
          Length = 1415

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/173 (31%), Positives = 70/173 (40%), Gaps = 23/173 (13%)
 Frame = +1

Query: 34   PGSVVGGS-SAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL-------- 186
            PG +V    S+  +  GPP  PG     GP G P     P+  A LP    +        
Sbjct: 805  PGKIVTSEGSSMLTVPGPPGPPGAMGPPGPPGAPG----PAGPAGLPGHQEVLNLQGPPG 860

Query: 187  --GSRGGAPPSVAGGYGASGPTS----------ATFSNESGSFQSLQPAPPQMPPPTGPS 330
              G RG   PS+ G  G  GP             +F + S +F S    PP  P P GP 
Sbjct: 861  PPGPRGPPGPSIPGPPGPRGPPGEGLPGPPGPPGSFLSNSETFLS---GPPGPPGPPGPK 917

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPGAIVS 483
                  GV  A G+P     +GP+   S++   Y +G  G  GP  PPG+I S
Sbjct: 918  GDQGDPGVPGALGIP-----SGPSEGGSSS-TMYVSGPPGPPGPPGPPGSISS 964

[109][TOP]
>UniRef100_P13942-5 Isoform 5 of Collagen alpha-2(XI) chain n=2 Tax=Homo sapiens
            RepID=P13942-5
          Length = 1689

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 800  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 859

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 860  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 912

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 913  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 970

[110][TOP]
>UniRef100_P13942-2 Isoform 2 of Collagen alpha-2(XI) chain n=2 Tax=Homo sapiens
            RepID=P13942-2
          Length = 1710

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 821  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 880

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 881  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 933

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 934  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 991

[111][TOP]
>UniRef100_P13942-7 Isoform 7 of Collagen alpha-2(XI) chain n=1 Tax=Homo sapiens
            RepID=P13942-7
          Length = 1655

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 766  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 825

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 826  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 878

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 879  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 936

[112][TOP]
>UniRef100_P13942-3 Isoform 3 of Collagen alpha-2(XI) chain n=1 Tax=Homo sapiens
            RepID=P13942-3
          Length = 1715

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 826  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 885

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 886  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 938

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 939  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 996

[113][TOP]
>UniRef100_P13942-4 Isoform 4 of Collagen alpha-2(XI) chain n=1 Tax=Homo sapiens
            RepID=P13942-4
          Length = 1676

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 787  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 846

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 847  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 899

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 900  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 957

[114][TOP]
>UniRef100_P13942-8 Isoform 8 of Collagen alpha-2(XI) chain n=2 Tax=Homo sapiens
            RepID=P13942-8
          Length = 1629

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 740  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 799

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 800  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 852

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 853  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 910

[115][TOP]
>UniRef100_P13942 Collagen alpha-2(XI) chain n=1 Tax=Homo sapiens RepID=COBA2_HUMAN
          Length = 1736

 Score = 56.6 bits (135), Expect = 1e-06
 Identities = 54/178 (30%), Positives = 59/178 (33%), Gaps = 23/178 (12%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
            G   P    G S A G+  G     PP   G+    GP G P     P          H 
Sbjct: 847  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPPGPPGKDGLPGHP 906

Query: 187  GSRG----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
            G RG            PP V G  GA+G T      E G      P PP  P   G    
Sbjct: 907  GQRGEVGFQGKTGPPGPPGVVGPQGAAGETGP--MGERG-----HPGPPGPPGEQGLPGT 959

Query: 337  LAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 960  AGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 1017

[116][TOP]
>UniRef100_UPI0000E1F855 PREDICTED: similar to COL3A1 protein isoform 12 n=1 Tax=Pan
           troglodytes RepID=UPI0000E1F855
          Length = 1457

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 62/204 (30%), Positives = 75/204 (36%), Gaps = 32/204 (15%)
 Frame = +1

Query: 13  PSYGSH--VPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHL 186
           P Y S+    G  VGG +     +GPP  PG     G  GHP S  +P       +    
Sbjct: 153 PQYDSYDVKSGVAVGGLAGYPGPAGPPGPPG---PPGTSGHPGSPGSPGYQGPPGEPGQA 209

Query: 187 GSRGGAPPSVAGGYGASGPTSATFSNESG----SFQSLQPAPPQMPPPTG--PSPHL-AH 345
           G  G  PP   G  G SGP  A    ESG      +   P PP +  P G    P +  H
Sbjct: 210 GPSG--PPGPPGAIGPSGP--AGKDGESGRPGRPGERGLPGPPGIKGPAGIPGFPGMKGH 265

Query: 346 GGVTAA------HGVPRHHGANGPASLNSA-------ALPAYATGGGN----------GP 456
            G T A      +G+P  +GA GP     A        LP  A   GN          GP
Sbjct: 266 RGETGAPGLKGENGLPGENGAPGPMGPRGAPGERGRPGLPGAAGARGNDGARGSDGQPGP 325

Query: 457 AYPPGAIVSPASTATFNRLSPAAA 528
             PPG    P S      + PA +
Sbjct: 326 PGPPGTAGFPGSPGAKGEVGPAGS 349

[117][TOP]
>UniRef100_UPI0000D9A866 PREDICTED: similar to alpha 2 type I collagen isoform 1 n=1
            Tax=Macaca mulatta RepID=UPI0000D9A866
          Length = 1248

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 51/156 (32%), Positives = 60/156 (38%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG +  AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAAGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G +GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPSGPNGPPG 772

[118][TOP]
>UniRef100_UPI0000D9A865 PREDICTED: similar to alpha 2 type I collagen isoform 2 n=1
            Tax=Macaca mulatta RepID=UPI0000D9A865
          Length = 1363

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 51/156 (32%), Positives = 60/156 (38%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG +  AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 621  PG-VVGAAGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 675

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 676  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 733

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G +GP  PPG
Sbjct: 734  AKGERGAKGPKGENGVVGPTGPVGAAGPSGPNGPPG 769

[119][TOP]
>UniRef100_UPI0000D9A864 PREDICTED: similar to alpha 2 type I collagen isoform 3 n=1
            Tax=Macaca mulatta RepID=UPI0000D9A864
          Length = 1366

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 51/156 (32%), Positives = 60/156 (38%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG +  AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAAGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G +GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPSGPNGPPG 772

[120][TOP]
>UniRef100_UPI00016E5ECF UPI00016E5ECF related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E5ECF
          Length = 1261

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 51/168 (30%), Positives = 58/168 (34%), Gaps = 4/168 (2%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
            P   G   P    G S   G    P  A GV A  GP G P     P  S   P G    
Sbjct: 737  PGPAGPPGPAGAPGLSGPIGPAGLPGPAGGVSALPGPPGPPGPPGRPGDSRQGPPG---- 792

Query: 190  SRGGAPPSVAGGYGASGPT----SATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVT 357
                  P    GYG  GP        FS+ SG+F +  P PP    P G S     GG  
Sbjct: 793  ------PPGPPGYGRPGPKGDKGDPGFSSSSGTFYTGPPGPPGPAGPKGSSVATYSGG-- 844

Query: 358  AAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTAT 501
              +G+P   G  GP              G  GP  PPG    P + A+
Sbjct: 845  --NGIPGPPGPPGPPGPQGFKGSISVASGPPGPPGPPGPAGRPGTFAS 890

[121][TOP]
>UniRef100_B1JZ05 Putative uncharacterized protein n=1 Tax=Burkholderia cenocepacia
           MC0-3 RepID=B1JZ05_BURCC
          Length = 387

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 53/156 (33%), Positives = 68/156 (43%), Gaps = 5/156 (3%)
 Frame = +1

Query: 82  PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGASGPTSATFS 261
           P   PGV  GSG    PA++ A ++ A++   A   + G    S AG   AS P  A+ S
Sbjct: 226 PLSVPGVAPGSGANAVPAAASAVTAPAAMRAAAPAAASGSGTVSGAGAAPASAPAPAS-S 284

Query: 262 NESGSFQSLQPAPPQMP-----PPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALP 426
                  +   AP   P     P T P+P  A G   A    P    A+ PA    A  P
Sbjct: 285 GGPAPAPASAAAPASAPKPISGPATAPAPSSASGSTAAPVSAP----ASAPA---PATAP 337

Query: 427 AYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
           A AT   + PA P  A  +PAS +  +  SPA AAA
Sbjct: 338 ATAT--PSSPA-PSSAASTPASASAPSSASPAPAAA 370

[122][TOP]
>UniRef100_Q9NHW4 Flagelliform silk protein (Fragment) n=1 Tax=Nephila clavipes
           RepID=Q9NHW4_NEPCL
          Length = 2249

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 60/162 (37%), Positives = 65/162 (40%), Gaps = 8/162 (4%)
 Frame = +1

Query: 10  PPSYGSHVP-GSVVGGSSAAG---SFSGPPYAPGVYAGSGP-GGHPASSYAPSSSASLPQ 174
           P   G + P G    GS A G   S SGP       +GSGP GG   SS  PS +   P 
Sbjct: 3   PSGTGGYAPTGYAPSGSGAGGVRPSASGP-------SGSGPSGGSRPSSSGPSGTRPSPN 55

Query: 175 GAHLGSRGGAPP--SVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG 348
           GA   S GG  P  S +GG G SG T    S  SGS+      P       GPS      
Sbjct: 56  GASGSSPGGIAPGGSNSGGAGVSGATGGPAS--SGSY-----GPGSTGGTYGPSGGSEPF 108

Query: 349 GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP-AYPPG 471
           G   A G P   G  GP     A  P     GG GP  Y PG
Sbjct: 109 GPGVAGG-PYSPGGAGPGGAGGAYGPGGVGTGGAGPGGYGPG 149

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 55/169 (32%), Positives = 60/169 (35%), Gaps = 19/169 (11%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSF----SGPPYAPGVYAGSGPGG-----------HPASSYAPSS 156
            G   PG V  G S  G      +G PY PG   GSGPGG            P  +Y P  
Sbjct: 830  GGFGPGGVGPGGSGPGGVGPGGAGRPYGPG---GSGPGGAGGAGGTGGAYGPGGAYGPGG 886

Query: 157  SASLPQGAHLGSRGGAPPSVAGG-YGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSP 333
            S   P GA  G  GG  P  AGG YG  G         +G        P     P GP  
Sbjct: 887  SGG-PGGA--GGPGGEGPGGAGGPYGPGGAGGPYGPGGAGG----PYGPGGEGGPYGPGV 939

Query: 334  HLAHGGVTAAHGV--PRHHGANGPASLNSAALPAYATGGGNGP-AYPPG 471
                GG    +G   P   G  GP        P     GG+GP  Y PG
Sbjct: 940  SYGPGGAGGPYGPGGPYGPGGEGPGGAGGPYGPGGVGPGGSGPGGYGPG 988

[123][TOP]
>UniRef100_Q4G1Y1 Major ampullate spidroin 2 (Fragment) n=1 Tax=Latrodectus hesperus
           RepID=Q4G1Y1_9ARAC
          Length = 542

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 52/174 (29%), Positives = 71/174 (40%), Gaps = 1/174 (0%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
           P YG    G   GG+ AA + +     PG     GPGG  A++ A +++ S P G    +
Sbjct: 306 PGYGGQ-QGFGPGGAGAAAAAAAGGAGPGRQQAYGPGGSGAAAAAAAAAGSGPSGYGPSA 364

Query: 193 RGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGV 372
            G   PS  GG GA+   +A  S   G  Q           PTG  P             
Sbjct: 365 AG---PSGPGGSGAAAAAAAGGSGPGGFGQG----------PTGYGP-----------SG 400

Query: 373 PRHHGANGPASLNSAALPAYATGGGNGPA-YPPGAIVSPASTATFNRLSPAAAA 531
           P      GP +  +AA  A +  GG GP+ Y P ++ S A++A     SP   A
Sbjct: 401 PGGQQGYGPGASGAAAAAAASGSGGYGPSQYVPSSVASSAASAASALSSPTTHA 454

[124][TOP]
>UniRef100_B6K9K2 Putative uncharacterized protein n=2 Tax=Toxoplasma gondii
            RepID=B6K9K2_TOXGO
          Length = 994

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 56/185 (30%), Positives = 69/185 (37%), Gaps = 11/185 (5%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSG--PGGHPASSYAPSSSASLPQGAH 183
            PP+  +  PG+  G   AA +   PP  P   A  G  PG  PA++    +    P G  
Sbjct: 630  PPAAAA--PGAPPGTPPAAAAPGAPPGTPPAAAAPGAPPGTPPATAATSGAPPGTPPGTP 687

Query: 184  LGSRG---GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPT----GPSPHLA 342
              + G   G+PP+ A   GA   +    +  SG       APP  PP T    G SP   
Sbjct: 688  AAASGAPPGSPPATATAAGAPPGSPPATAAASG-------APPGSPPATATASGASPGTP 740

Query: 343  HGGVTAAHGVPRHHGANGPASLNSA--ALPAYATGGGNGPAYPPGAIVSPASTATFNRLS 516
             G   AA G P       PA    A    P    G     A PP A  +P   A    L 
Sbjct: 741  PGTPAAASGAPPGTPPGTPAEALGAVPGAPIATPGAAPTTATPPAAAGTPGVVAGGPGLV 800

Query: 517  PAAAA 531
            PA  A
Sbjct: 801  PAVVA 805

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 54/183 (29%), Positives = 71/183 (38%), Gaps = 21/183 (11%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSG-PGGHPASSYAPSSSASLPQGAHLGSRGGAPP 210
            P  V GG +AA   +  P A  V   +G P G P ++ A  ++ S   GA   +  GAPP
Sbjct: 555  PNLVAGGIAAAIPAAAFPQATMVAGSNGLPQGVPVAAPAVPTAPSAAAGAPAAAASGAPP 614

Query: 211  SVAGGYGASG------PTSATFSNESGS-FQSLQPAPPQMPPPTGPSPHLAHG---GVTA 360
                   ASG      P +A      G+   +  P  P   PP   +P    G      A
Sbjct: 615  GTPSAAAASGAPPGTPPAAAAPGAPPGTPPAAAAPGAPPGTPPAAAAPGAPPGTPPATAA 674

Query: 361  AHGVPRHHGANGPASLNSA---ALPAYATGGGNGPAYPPGAIV-------SPASTATFNR 510
              G P       PA+ + A   + PA AT  G  P  PP           SP +TAT + 
Sbjct: 675  TSGAPPGTPPGTPAAASGAPPGSPPATATAAGAPPGSPPATAAASGAPPGSPPATATASG 734

Query: 511  LSP 519
             SP
Sbjct: 735  ASP 737

[125][TOP]
>UniRef100_B2W108 Putative uncharacterized protein n=1 Tax=Pyrenophora
           tritici-repentis Pt-1C-BFP RepID=B2W108_PYRTR
          Length = 842

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 47/156 (30%), Positives = 69/156 (44%)
 Frame = +1

Query: 19  YGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG 198
           YG  VPG  +  +  +G+ S PP      AG   GG+ + S + S S S P GA      
Sbjct: 160 YGGDVPGVSMSSAVPSGAVSSPP------AGGYGGGYGSPSPSSSPSPSTPAGAV----- 208

Query: 199 GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPR 378
             PP  AGGYG     +    + S    S   + P +P  T  +P  A    ++A G   
Sbjct: 209 STPP--AGGYGGGYGGNVPGVSMSSVVPSGASSTPAIPAATTSTPAGAVS-TSSAGGYGG 265

Query: 379 HHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            +G N P    S+ +P+ A+ G    + P GA+ +P
Sbjct: 266 GYGGNVPGVSMSSVVPSGASSGSPSASTPAGAVSTP 301

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 55/181 (30%), Positives = 75/181 (41%), Gaps = 20/181 (11%)
 Frame = +1

Query: 19  YGSHVPGSVVGGSSAAGSFSGPPYAP--GVYAGSGPG---------GHPASSYAPSSSAS 165
           YGS  P S    S+ AG+ S PP     G Y G+ PG         G  ++   P+++ S
Sbjct: 190 YGSPSPSSSPSPSTPAGAVSTPPAGGYGGGYGGNVPGVSMSSVVPSGASSTPAIPAATTS 249

Query: 166 LPQGAHLGSRGGAPPSVAGGYGASGPTSATFS-----NESGSFQSLQPAPPQMPPPTGPS 330
            P GA   S  G      GGYG + P  +  S       SGS  +  PA     PP G  
Sbjct: 250 TPAGAVSTSSAGG---YGGGYGGNVPGVSMSSVVPSGASSGSPSASTPAGAVSTPPAGGY 306

Query: 331 PHLAHG---GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP-ASTA 498
                G   GV+ +  VP    +       + + PA   GG   P+  PG  V+P A+T+
Sbjct: 307 GGGYGGNVPGVSMSSVVPSGASSTPAIPAATTSTPAGGNGGYGSPSSTPGKPVTPDAATS 366

Query: 499 T 501
           T
Sbjct: 367 T 367

[126][TOP]
>UniRef100_P02459 Collagen alpha-1(II) chain (Fragments) n=1 Tax=Bos taurus
           RepID=CO2A1_BOVIN
          Length = 747

 Score = 56.2 bits (134), Expect = 1e-06
 Identities = 51/173 (29%), Positives = 63/173 (36%), Gaps = 12/173 (6%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPAS--SYAPSSSASLPQGAH 183
           PP       G    G+  A   +GP  A G     GP G P +  S  P+ +A  P    
Sbjct: 170 PPGPVGPAGGPGFPGAPGAKGEAGPTGARGPEGAQGPRGEPGTPGSPGPAGAAGNPGTDG 229

Query: 184 L-GSRGGA-PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVT 357
           + G++G A  P +AG  G  GP                P P     P GP       G+ 
Sbjct: 230 IPGAKGSAGAPGIAGAPGFPGPRGP-------------PGPQGATGPLGPKGQTGEPGIA 276

Query: 358 AAHGVPRHHGANGPASLNSAALPAYATG--------GGNGPAYPPGAIVSPAS 492
              G     G  GPA +  A  PA   G        GG GPA PPG   +P S
Sbjct: 277 GFKGEQGPKGEPGPAGVQGAPGPAGEEGKRGARGEPGGAGPAGPPGERGAPGS 329

[127][TOP]
>UniRef100_Q3TU64 Putative uncharacterized protein n=2 Tax=Mus musculus
            RepID=Q3TU64_MOUSE
          Length = 1372

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 49/171 (28%), Positives = 61/171 (35%), Gaps = 17/171 (9%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGG 201
            GS  P    G     G  +G   APG    SGPGG P    A        +    G RG 
Sbjct: 613  GSRGPSGAPGPDGNKGE-AGAVGAPGSAGASGPGGLPGERGAAGIPGGKGEKGETGLRGD 671

Query: 202  APPS-------VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPH 336
               +       + G  GA GP  A+    E+G+     PA P+  P       P GP+  
Sbjct: 672  TGNTGRDGARGIPGAVGAPGPAGASGDRGEAGAAGPSGPAGPRGSPGERGEVGPAGPNGF 731

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPGAIVS 483
                G     G     G  GP   N    P  + G  G +GP  PPG + S
Sbjct: 732  AGPAGAAGQPGAKGEKGTKGPKGENGIVGPTGSVGAAGPSGPNGPPGPVGS 782

[128][TOP]
>UniRef100_A9EYY3 Putative uncharacterized protein n=1 Tax=Sorangium cellulosum 'So
           ce 56' RepID=A9EYY3_SORC5
          Length = 421

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 50/172 (29%), Positives = 67/172 (38%), Gaps = 16/172 (9%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
           PPS  +  P  +     A+ +    P AP  +A  GPG   A+  AP ++ +     H G
Sbjct: 155 PPSQAAFQPAPITDRMGASATQPPAPAAPPGFASPGPGA--AAPAAPEAARAPMPSPHAG 212

Query: 190 S--RGGAPPSVAG-GYGASGP-TSATFSNESGSFQSLQPAPPQMPPPTGPSPHL--AHGG 351
                 APP     G+GA+ P  S        S  +  PA    PP   P+P +  A G 
Sbjct: 213 QPPAPAAPPGFGSPGFGAAAPAVSEAARTPMPSLHAGMPAQAGPPPAAAPAPAMSAAPGA 272

Query: 352 VTAAHGVPRHHG----------ANGPASLNSAALPAYATGGGNGPAYPPGAI 477
             AAHG P+  G          A   A L   ALP+        P  PP A+
Sbjct: 273 GAAAHGAPQAAGGWDGAAESPWATTSARLEMPALPSTFVQERPEPQKPPAAV 324

[129][TOP]
>UniRef100_A0K683 Putative uncharacterized protein n=2 Tax=Burkholderia cenocepacia
           RepID=A0K683_BURCH
          Length = 383

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 52/154 (33%), Positives = 68/154 (44%), Gaps = 3/154 (1%)
 Frame = +1

Query: 82  PPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGASGPTSATFS 261
           P  APGV  GSG    PA++ A ++ A++   A   + G    S A    A  P SA  S
Sbjct: 226 PLSAPGVAPGSGANAVPAAASAVAAPAAMRAAAPTAASGAGAVSGAAPASAPAPASAGGS 285

Query: 262 ---NESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAY 432
                S +  +L P P    P T P+P    G   A         A+ PA   SA+ PA 
Sbjct: 286 APAPASAAAPALAPKPVS-GPVTAPAPSSTSGSTAAP--------ASAPA---SASAPAP 333

Query: 433 ATGGGNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
           AT   + PA P  A  +PAS +  +  SPA A A
Sbjct: 334 ATATPSSPA-PSSAASTPASASAPSSASPAPATA 366

[130][TOP]
>UniRef100_Q2I6N4 Uncharacterized Gly-rich protein n=1 Tax=uncultured delta
           proteobacterium DeepAnt-1F12 RepID=Q2I6N4_9DELT
          Length = 784

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 56/177 (31%), Positives = 69/177 (38%), Gaps = 7/177 (3%)
 Frame = +1

Query: 22  GSHVPGSVVG--GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
           G   P   VG  G+  A   +GP    G    +GPGG  A    P+           G+ 
Sbjct: 153 GEAGPQGAVGPAGADGAAGPAGPQGLQGERGPAGPGGGEAGPAGPA-----------GAD 201

Query: 196 GGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMP-----PPTGPSPHLAHGGVTA 360
           G A P  AG  GA GP  A     +G+  +  PA P  P      P GP+      G   
Sbjct: 202 GVAGP--AGADGADGPDGA--QGPAGADGAQGPAGPVGPGGGEAGPAGPAGADGVAGPAG 257

Query: 361 AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAA 531
           A G     GA GPA  + A  PA A  G  GP  P G    PA  A  + ++  A A
Sbjct: 258 ADGADGPDGAQGPAGADGAQGPAGA-DGAQGPVGPGGGEAGPAGPAGADGVAGPAGA 313

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 49/163 (30%), Positives = 61/163 (37%), Gaps = 7/163 (4%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASL--PQGAHLGSR 195
           G+  P    G + A G+  GP  A G     GPGG  A    P+ +  +  P GA     
Sbjct: 260 GADGPDGAQGPAGADGA-QGPAGADGAQGPVGPGGGEAGPAGPAGADGVAGPAGADGADG 318

Query: 196 GGAPPSVAGGYGASGPTSATFSNES---GSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAH 366
                  AG  GA GP  A  +      G  ++    P       GP+      G   A 
Sbjct: 319 PDGAQGPAGADGAQGPAGADGAQGPVGPGGGEAGPAGPAGADGVAGPAGADGADGPDGAQ 378

Query: 367 GVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA--IVSPA 489
           G     GA GPA  + A  P    GG  GPA P GA  +  PA
Sbjct: 379 GPAGADGAQGPAGADGAQGPVGPGGGEAGPAGPAGADGVAGPA 421

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 49/163 (30%), Positives = 61/163 (37%), Gaps = 7/163 (4%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASL--PQGAHLGSR 195
           G+  P    G + A G+  GP  A G     GPGG  A    P+ +  +  P GA     
Sbjct: 315 GADGPDGAQGPAGADGA-QGPAGADGAQGPVGPGGGEAGPAGPAGADGVAGPAGADGADG 373

Query: 196 GGAPPSVAGGYGASGPTSATFSNES---GSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAH 366
                  AG  GA GP  A  +      G  ++    P       GP+      G   A 
Sbjct: 374 PDGAQGPAGADGAQGPAGADGAQGPVGPGGGEAGPAGPAGADGVAGPAGADGADGPDGAQ 433

Query: 367 GVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGA--IVSPA 489
           G     GA GPA  + A  P    GG  GPA P GA  +  PA
Sbjct: 434 GPAGADGAQGPAGADGAQGPVGPGGGEAGPAGPAGADGVAGPA 476

[131][TOP]
>UniRef100_C3RI07 Putative uncharacterized protein (Fragment) n=1 Tax=Mollicutes
           bacterium D7 RepID=C3RI07_9MOLU
          Length = 424

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 51/181 (28%), Positives = 63/181 (34%), Gaps = 13/181 (7%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSF-----SGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
           S G+  P    G + A GS      +G   A G    +GP G      A  ++ S     
Sbjct: 49  STGAIGPTGPTGSTGATGSTGPTGATGEDGATGATGSTGPTGATGEDGATGATGSTGPTG 108

Query: 181 HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA 360
             G+ G   P+  G  GA+GPT AT   E G+             PTGP+      G T 
Sbjct: 109 STGATGPTGPT--GATGATGPTGAT--GEDGA-----------TGPTGPTGATGEDGATG 153

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--------GGNGPAYPPGAIVSPASTATFNRLS 516
             G     GA GP        P  ATG        G  GP  P GA     +T       
Sbjct: 154 PTGATGEDGATGPTGATGPTGPTGATGEDGATGATGSTGPTGPTGATGEDGATGATGSTG 213

Query: 517 P 519
           P
Sbjct: 214 P 214

[132][TOP]
>UniRef100_C2N7W6 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           ATCC 10876 RepID=C2N7W6_BACCE
          Length = 1282

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 46/168 (27%), Positives = 63/168 (37%), Gaps = 22/168 (13%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGSTGATGAT-----GNTGATGST--G 247

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G++GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 248 VTGATGSTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 307

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG-----------GGNGPAYPPG 471
             G     G  GP  +     P+ ATG           G  GP  P G
Sbjct: 308 IQGAKGATGDQGPQGIQGVPGPSGATGPQGVQGIQGPMGDIGPTGPEG 355

[133][TOP]
>UniRef100_B4V7M7 Putative uncharacterized protein n=1 Tax=Streptomyces sp. Mg1
           RepID=B4V7M7_9ACTO
          Length = 269

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 49/163 (30%), Positives = 63/163 (38%), Gaps = 4/163 (2%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAP--GVYAGSGPGGHPASSYAPSSSASLP--QGAHLG 189
           G+  PG   G        SG  + P     A +G  G PASS + S+SAS P  +GA   
Sbjct: 40  GAAAPGPERGAGENVAPRSGVEFQPLSAPDAPAGSTGSPASSASSSTSASAPGSEGAAGS 99

Query: 190 SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
           + G  PP+  GG       SAT           +P     P  + P P    GG  A   
Sbjct: 100 TPGAGPPAAPGG-------SAT-----------RPGTSPAPGGSSPGPGAPSGGPAATQP 141

Query: 370 VPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTA 498
                G  GP +  +   P     GG GPA P    +SP + A
Sbjct: 142 ATPRPGTPGPVTPTAPTTPP----GGGGPATPANLTLSPPARA 180

[134][TOP]
>UniRef100_A8IZP2 Hydroxyproline-rich glycoprotein n=1 Tax=Chlamydomonas reinhardtii
           RepID=A8IZP2_CHLRE
          Length = 585

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 48/160 (30%), Positives = 64/160 (40%), Gaps = 13/160 (8%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPY------APGVYAGSGPGGHPASSYAPSSSASLPQ 174
           P YG   PG+  G + A      PPY      AP  YA + PG  PA   AP      P 
Sbjct: 331 PPYGYAPPGAPPGAAGAP-----PPYGYALAGAPPPYAYAPPGAAPAPYGAPPPRPYAPA 385

Query: 175 GAHLGSR-------GGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSP 333
           GA+ GS         GA P  AG Y   G  +  ++++          P Q      P+P
Sbjct: 386 GAYPGSAPPGAYAPSGAGPGPAGAYQPPGTVAPAYASQ----------PVQGSAAGAPAP 435

Query: 334 HLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNG 453
             AHGG   +        A G A+  ++ +   A+G GNG
Sbjct: 436 --AHGGAYGSSAAATGPAAAGAAAGGNSTVANNASGSGNG 473

[135][TOP]
>UniRef100_Q4FX62 Proteophosphoglycan 5 n=1 Tax=Leishmania major strain Friedlin
            RepID=Q4FX62_LEIMA
          Length = 17392

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 48/176 (27%), Positives = 79/176 (44%), Gaps = 2/176 (1%)
 Frame = +1

Query: 13   PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPA--SSYAPSSSASLPQGAHL 186
            PS  S  P +    SSA  S S  P A    A S     P+  SS APSSS+S    A  
Sbjct: 8789 PSSSSSAPSA--SSSSAPSSSSSAPSASSSSAPSSSSSAPSASSSSAPSSSSSSALSASS 8846

Query: 187  GSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAH 366
             S   +  S      +S P+S++ S  S S  S     P     + PS   +    +++ 
Sbjct: 8847 SSAPSSSSSAPSASSSSAPSSSSSSAPSASSSSA----PSSSSSSAPSASSSSAPSSSSS 8902

Query: 367  GVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
              P    ++ P+S +S+A PA+++   +  +  P A  S A +++ +  S ++++A
Sbjct: 8903 SAPSASSSSAPSSSSSSAPPAFSSSAPSSSSSAPSASSSSAPSSSSSAPSASSSSA 8958

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 45/176 (25%), Positives = 79/176 (44%), Gaps = 2/176 (1%)
 Frame = +1

Query: 13   PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPA--SSYAPSSSASLPQGAHL 186
            PS  S  P S    S+ + S S  P A    A S     P+  SS APSSS+S P  +  
Sbjct: 7609 PSSSSSAP-SASSSSAPSSSSSSAPSASSSSAPSSSSSAPSASSSSAPSSSSSAPSASSS 7667

Query: 187  GSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAH 366
             +   +  S      +S P+S++ S  SGS  S     P     + PS   +    +++ 
Sbjct: 7668 SAPSSSSSSAPSASSSSAPSSSSSSAPSGSSSSA----PSSSSSSAPSASSSSAPSSSSS 7723

Query: 367  GVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
              P    ++ P+S +SA   + ++   +  + P G+  S  S+++ +  S ++++A
Sbjct: 7724 SAPSASSSSAPSSSSSAPSASSSSAPSSSSSAPSGSSSSAPSSSSSSAPSASSSSA 7779

[136][TOP]
>UniRef100_B5DXL6 GA27145 n=1 Tax=Drosophila pseudoobscura pseudoobscura
            RepID=B5DXL6_DROPS
          Length = 875

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 50/171 (29%), Positives = 79/171 (46%), Gaps = 8/171 (4%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGP-PYAPGVYAGSGPGGHPASSY-----APSSSASLPQGAH-LGS 192
            P S     S++ +  GP P AP + + S P   P+SSY      PSSS S P  ++   S
Sbjct: 688  PSSSYSAPSSSSNSGGPYPAAPSI-SYSAPAAPPSSSYGAPATGPSSSYSAPSSSYGAPS 746

Query: 193  RGGAPPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
             G +  S + G G+S  T+ +F S+ SGS     P+ P        S +    G  A  G
Sbjct: 747  SGSSSGSFSSGSGSSFSTAPSFGSSSSGSGSGGYPSAPSSSYSAPSSSY----GAPATGG 802

Query: 370  VPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPA 522
                   +GP+S  S+A  + ++  G+ P+ P  +  +PA  + +N   P+
Sbjct: 803  DSALSFPSGPSSSYSSAPASGSSSSGSYPSAPSSSYGAPAQDSGYNYSGPS 853

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 53/189 (28%), Positives = 81/189 (42%), Gaps = 16/189 (8%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAA--GSFSGP-----PYAP-GVYAGSGPGGHPASSY--APSSSAS 165
           SYG+   GS  G  S+A   S+  P     P AP   Y+   P  +   SY  APSSS S
Sbjct: 424 SYGAPSAGSSSGSFSSAPSSSYGAPSKGSFPSAPSSSYSAPSPSANSGGSYPSAPSSSYS 483

Query: 166 LPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAH 345
            P  +   S G  P + +  Y A  P+    +N  GS+ +   +    P P+  S     
Sbjct: 484 APSPS-ANSGGSYPAAPSSSYSAPSPS----ANSGGSYPAAPSSSYSAPSPSANSGGSYP 538

Query: 346 GGVTAAHGVPRHHGANG------PASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFN 507
              ++++  P     +G      P+S  SA  P  A  GG  P+ P  +  +P+S++   
Sbjct: 539 AAPSSSYSAPSPSANSGGSYPAAPSSSYSAPSPG-ANSGGPYPSAPSSSYSAPSSSSNSG 597

Query: 508 RLSPAAAAA 534
              PAA ++
Sbjct: 598 GPYPAAPSS 606

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 50/178 (28%), Positives = 78/178 (43%), Gaps = 8/178 (4%)
 Frame = +1

Query: 16   SYGSHVPGSVVGGSSAAGSFSGPPYAP-GVYAGSGPGGHPASSY--APSSSASLPQGAHL 186
            SY +    S    S +A S    P AP   Y+   PG +    Y  APSSS S P  +  
Sbjct: 536  SYPAAPSSSYSAPSPSANSGGSYPAAPSSSYSAPSPGANSGGPYPSAPSSSYSAPSSSS- 594

Query: 187  GSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAH 366
             S G  P + +  Y A  P+    +N  GS+ S   +    P P+  S        ++++
Sbjct: 595  NSGGPYPAAPSSSYSAPSPS----ANSGGSYPSAPSSSYSAPSPSANSGGSYPSAPSSSY 650

Query: 367  GVP---RHHGANGPASLNSA--ALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAA 525
              P    + G + P++ +S+  A  A + GGG  PA P  +  +P+S++      PAA
Sbjct: 651  SAPSPSANSGGSYPSAPSSSYGAPSASSNGGGPYPAAPSSSYSAPSSSSNSGGPYPAA 708

[137][TOP]
>UniRef100_B3MRJ3 GF20989 n=1 Tax=Drosophila ananassae RepID=B3MRJ3_DROAN
          Length = 907

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 50/158 (31%), Positives = 61/158 (38%)
 Frame = +1

Query: 61  AAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGASG 240
           AA S SG   A G    S  GG  A+  + +SSA    G   G+  G+    A G G   
Sbjct: 167 AASSGSGAG-ASGAGTVSSGGGSSANKVSAASSAQQLPGMATGAGAGSATPGAAGSGGGA 225

Query: 241 PTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAA 420
             S   S   G+  S     P +PP +   PH   G            GA  PA    AA
Sbjct: 226 TASRPVSAMGGTVSSTAGGAPSIPPISTMPPHTVPGSTNTTTTAMSGAGAAAPA----AA 281

Query: 421 LPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
           L A     G    YP    V+ AS    N ++ AAAAA
Sbjct: 282 LMASLLNPGQVGGYPGQTAVNNASLMDANSVTAAAAAA 319

[138][TOP]
>UniRef100_Q01149 Collagen alpha-2(I) chain n=2 Tax=Mus musculus RepID=CO1A2_MOUSE
          Length = 1372

 Score = 55.8 bits (133), Expect = 2e-06
 Identities = 49/171 (28%), Positives = 61/171 (35%), Gaps = 17/171 (9%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGG 201
            GS  P    G     G  +G   APG    SGPGG P    A        +    G RG 
Sbjct: 613  GSRGPSGAPGPDGNKGE-AGAVGAPGSAGASGPGGLPGERGAAGIPGGKGEKGETGLRGD 671

Query: 202  APPS-------VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPH 336
               +       + G  GA GP  A+    E+G+     PA P+  P       P GP+  
Sbjct: 672  TGNTGRDGARGIPGAVGAPGPAGASGDRGEAGAAGPSGPAGPRGSPGERGEVGPAGPNGF 731

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPGAIVS 483
                G     G     G  GP   N    P  + G  G +GP  PPG + S
Sbjct: 732  AGPAGAAGQPGAKGEKGTKGPKGENGIVGPTGSVGAAGPSGPNGPPGPVGS 782

[139][TOP]
>UniRef100_UPI0001B513DD multidomain-containing protein family n=1 Tax=Streptomyces lividans
           TK24 RepID=UPI0001B513DD
          Length = 413

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 51/153 (33%), Positives = 57/153 (37%)
 Frame = +1

Query: 37  GSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSV 216
           G+  G   A+G  SGP  APG   G  PG  PA   AP SS + P             S 
Sbjct: 288 GAASGPDPASGPASGPAVAPGSGGGPAPGWWPAPGTAPGSSTAPPHDT---------ASA 338

Query: 217 AGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANG 396
           A    A GPTSA                P   P  G +P  A G   +  G     G  G
Sbjct: 339 ADTAPAPGPTSA----------------PGTAPAPGSTPAPAPGTTGSTPGTSPAPGTAG 382

Query: 397 PASLNSAALPAYATGGGNGPAYPPGAIVSPAST 495
           PA   S A P  A   G  PA  PG   +P ST
Sbjct: 383 PARDTSYA-PGTAPVAGTTPA--PGTAPAPGST 412

[140][TOP]
>UniRef100_UPI0001AE71B1 UPI0001AE71B1 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0001AE71B1
          Length = 1676

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 787  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 844

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 845  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 897

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 898  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 957

[141][TOP]
>UniRef100_UPI0000D60E9C UPI0000D60E9C related cluster n=1 Tax=Homo sapiens
            RepID=UPI0000D60E9C
          Length = 1629

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 740  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 797

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 798  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 850

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 851  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 910

[142][TOP]
>UniRef100_UPI0000D60E9B UPI0000D60E9B related cluster n=1 Tax=Homo sapiens
            RepID=UPI0000D60E9B
          Length = 1655

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 766  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 823

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 824  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 876

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 877  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 936

[143][TOP]
>UniRef100_UPI0000D60E9A UPI0000D60E9A related cluster n=1 Tax=Homo sapiens
            RepID=UPI0000D60E9A
          Length = 1689

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 800  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 857

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 858  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 910

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 911  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 970

[144][TOP]
>UniRef100_UPI0000D60E99 UPI0000D60E99 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0000D60E99
          Length = 1710

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 821  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 878

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 879  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 931

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 932  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 991

[145][TOP]
>UniRef100_UPI0000D60E98 UPI0000D60E98 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0000D60E98
          Length = 1715

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 826  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 883

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 884  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 936

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 937  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 996

[146][TOP]
>UniRef100_UPI0000D60E97 UPI0000D60E97 related cluster n=1 Tax=Homo sapiens
            RepID=UPI0000D60E97
          Length = 1736

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 847  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 904

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 905  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 957

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 958  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 1017

[147][TOP]
>UniRef100_B9J1C9 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           Q1 RepID=B9J1C9_BACCQ
          Length = 1330

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 42/154 (27%), Positives = 60/154 (38%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGSTGATGAT-----GNTGATGNT--G 247

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           + G  G++GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 248 ITGATGSTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 307

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G+    G  GP  +     P   TG  G  GP
Sbjct: 308 IQGITGATGDQGPQGIQGVIGPQGVTGATGDQGP 341

[148][TOP]
>UniRef100_Q4MVJ1 Putative uncharacterized protein n=1 Tax=Bacillus cereus G9241
           RepID=Q4MVJ1_BACCE
          Length = 1300

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 43/154 (27%), Positives = 59/154 (38%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 192 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGSTGATGAT-----GNTGATGST--G 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G +GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 245 VTGATGTTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 304

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G+    G  GP  +     P   TG  G  GP
Sbjct: 305 IQGITGATGDQGPQGIQGVIGPQGVTGATGDQGP 338

[149][TOP]
>UniRef100_C3GYK9 Putative uncharacterized protein n=1 Tax=Bacillus thuringiensis
           serovar huazhongensis BGSC 4BD1 RepID=C3GYK9_BACTU
          Length = 389

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 52/160 (32%), Positives = 64/160 (40%), Gaps = 8/160 (5%)
 Frame = +1

Query: 19  YGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASL-PQGAH--LG 189
           YGS   G   GG++ A   +GP    G    +GP G   ++ A        PQGA    G
Sbjct: 31  YGSGCLGG--GGATGATGATGPQGPAGATGATGPPGPAGATGATGPQGPQGPQGAQGPAG 88

Query: 190 SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
           ++G   P   G  G  GP  AT +  +   Q +Q          GP+      G T A G
Sbjct: 89  AQGATGPQ--GPQGIQGPAGATGATGATGAQGVQ----------GPAGATGATGATGAQG 136

Query: 370 VPRHHGANGPASLNSAALPAYATG-----GGNGPAYPPGA 474
           V    GA GP  L     PA ATG     G  GPA   GA
Sbjct: 137 VQGPAGATGPQGLQGIQGPAGATGPQGLQGIQGPAGATGA 176

[150][TOP]
>UniRef100_C3ERC2 Collagen triple helix repeat domain protein n=1 Tax=Bacillus
           thuringiensis serovar kurstaki str. T03a001
           RepID=C3ERC2_BACTK
          Length = 594

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 58/182 (31%), Positives = 70/182 (38%), Gaps = 13/182 (7%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAG--SFSGPPYAPGVYAGSGPGGH-----PASSYAPSSSASLPQGA 180
           GS  P    G + A G    +GP  + G    +GP G      P  S  P+ S     GA
Sbjct: 127 GSTGPTGATGPTGATGPTGSTGPTGSTGPTGSTGPTGSTGSTGPTGSTGPTGSTG-STGA 185

Query: 181 HLGSRGGAPPSVA----GGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG 348
             GS G   P+ A    G  GA+GPT AT S  +GS  S           TGP+      
Sbjct: 186 -TGSTGSTGPTGATGPTGSTGATGPTGATGS--TGSTGS-----------TGPTGATGST 231

Query: 349 GVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPGAIVSPASTATFNRLSPA 522
           GVT   G     GA GP     +  P  ATG  G  GP    G+  S  ST       P 
Sbjct: 232 GVTGPTGATGSTGATGPTGSTGSTGPTGATGPTGATGPTGSTGSTGSTGSTGPTGATGPT 291

Query: 523 AA 528
            +
Sbjct: 292 GS 293

[151][TOP]
>UniRef100_C2V1W3 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           Rock3-28 RepID=C2V1W3_BACCE
          Length = 937

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 47/157 (29%), Positives = 62/157 (39%), Gaps = 16/157 (10%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+     S+  + P GA  G+ G     
Sbjct: 206 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSG----STGVTGPTGA-TGNTG----- 255

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ----------PAPPQ----MPPPTGPSPHLAHGG 351
            A G G +GPT +T    +   Q +Q          P  PQ    +P PTG +      G
Sbjct: 256 -ATGQGLTGPTGSTGETGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQG 314

Query: 352 VTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
           V    G+    G  GP  +  A  P   TG  G  GP
Sbjct: 315 VQGIQGITGATGDQGPQGIQGAIGPQGVTGATGDQGP 351

[152][TOP]
>UniRef100_B5H071 Putative uncharacterized protein (Fragment) n=1 Tax=Streptomyces
            clavuligerus ATCC 27064 RepID=B5H071_STRCL
          Length = 1007

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 54/177 (30%), Positives = 65/177 (36%), Gaps = 13/177 (7%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPG-GHPASSYAPSSSASLPQGAHLGSRGGAPP 210
            PG    G+  AG+F   P   G   G+GP  G P    A      LP  A     GG  P
Sbjct: 773  PGQGRQGTGLAGAFGNRPPKNGSGRGTGPQQGGPGGPNAGDRGRQLPTPA----AGGPRP 828

Query: 211  SVAGGYGAS--GPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHH 384
             + GG GA   GP  A             P P   P    P  H  +GG+    G P+  
Sbjct: 829  ELPGGPGAPQRGPNQA-------------PGPFGGPAADAPRGHEENGGLRGPGGSPQQG 875

Query: 385  GANGP-------ASLNSAALPAYATG---GGNGPAYPPGAIVSPASTATFNRLSPAA 525
            G  GP        S    A+   A G   GG   +  PGA   P +TA   R+ P A
Sbjct: 876  GPGGPFVRPDVFGSSQQCAVGGRAGGNPAGGPFASRNPGAEQDPTATAPMPRIDPGA 932

[153][TOP]
>UniRef100_Q9BIT7 Major ampullate spidroin 2-like protein (Fragment) n=1 Tax=Nephila
            inaurata madagascariensis RepID=Q9BIT7_9ARAC
          Length = 1953

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 59/190 (31%), Positives = 73/190 (38%), Gaps = 15/190 (7%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPP-YAPG---------VYAGSGPGGHPASSYAPSSS 159
            P  YG    G   GGSSAA + +GP  Y PG           AGSGPGG+      P   
Sbjct: 1223 PGGYGPGQQGP--GGSSAAAAAAGPGRYGPGQQGPGAAAAAAAGSGPGGYGPGQQGPGGP 1280

Query: 160  ASLPQGAHLG-SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
             +    A  G   GG  P   G  G  GP +A  +   G +   Q  P       G +  
Sbjct: 1281 GAAAAAAAAGRGPGGYGP---GQQGPGGPGAAAAAAGPGGYGPGQQGP-------GAAAA 1330

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATF-- 504
             A G     +G P   G  GP +  +AA      G G G   P  PGA  + A    +  
Sbjct: 1331 AAAGSGPGGYG-PGQQGPGGPGAAAAAAAGRGPGGYGQGQQGPGGPGAAAAAAGPGGYGP 1389

Query: 505  NRLSPAAAAA 534
             +  P AAAA
Sbjct: 1390 GQQGPGAAAA 1399

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 52/172 (30%), Positives = 64/172 (37%), Gaps = 11/172 (6%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPP-YAPG---------VYAGSGPGGHPASSYAPSSS 159
            P  YG    G   GG  AA + +GP  Y PG           AG GPGG+      P  S
Sbjct: 816  PGGYGPGQQGP--GGPGAAAAAAGPGGYGPGQQGPGAAAAASAGRGPGGYGPGQQGPGGS 873

Query: 160  ASLPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHL 339
             +    A  G  GG  P   G  G     +A      G +   Q  P Q  P    +   
Sbjct: 874  GAAAAAAGRGP-GGYGPGQQGPGGPGAAAAAAAGRGPGGYGPGQQGPGQQGPGGSGAAAA 932

Query: 340  AHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYP-PGAIVSPAS 492
            A G     +G P   G  GP +  +AA P     GG GP    PGA  + A+
Sbjct: 933  AAGRGPGGYG-PGQQGPGGPGAAAAAAGP-----GGYGPGQQGPGAAAAAAA 978

[154][TOP]
>UniRef100_Q2VLH2 Major ampullate spidroin 2-like (Fragment) n=1 Tax=Nephila inaurata
            madagascariensis RepID=Q2VLH2_9ARAC
          Length = 2069

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 59/190 (31%), Positives = 73/190 (38%), Gaps = 15/190 (7%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPP-YAPG---------VYAGSGPGGHPASSYAPSSS 159
            P  YG    G   GGSSAA + +GP  Y PG           AGSGPGG+      P   
Sbjct: 1356 PGGYGPGQQGP--GGSSAAAAAAGPGRYGPGQQGPGAAAAAAAGSGPGGYGPGQQGPGGP 1413

Query: 160  ASLPQGAHLG-SRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPH 336
             +    A  G   GG  P   G  G  GP +A  +   G +   Q  P       G +  
Sbjct: 1414 GAAAAAAAAGRGPGGYGP---GQQGPGGPGAAAAAAGPGGYGPGQQGP-------GAAAA 1463

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATF-- 504
             A G     +G P   G  GP +  +AA      G G G   P  PGA  + A    +  
Sbjct: 1464 AAAGSGPGGYG-PGQQGPGGPGAAAAAAAGRGPGGYGQGQQGPGGPGAAAAAAGPGGYGP 1522

Query: 505  NRLSPAAAAA 534
             +  P AAAA
Sbjct: 1523 GQQGPGAAAA 1532

[155][TOP]
>UniRef100_Q26634 Alpha-1 collagen n=1 Tax=Strongylocentrotus purpuratus
            RepID=Q26634_STRPU
          Length = 1414

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 54/164 (32%), Positives = 61/164 (37%), Gaps = 10/164 (6%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGS--FSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
            P   GS       G S A GS    GP  APG    SGP G   S+ AP      P GA 
Sbjct: 989  PGPQGSRGEKGDTGASGANGSPGAPGPIGAPGAAGASGPRGETGSTGAPGPLG--PTGAR 1046

Query: 184  LGSRGGAPPS----VAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG- 348
             GS G A PS     AG  G +GP              LQ     M  P  P      G 
Sbjct: 1047 -GSTGPAGPSGPSGPAGERGETGPAGHKGHPGVSGLPGLQGTSGPMGEPGAPGEQGQQGT 1105

Query: 349  -GVTAAHGVPRHHGANGPASLNSAALP--AYATGGGNGPAYPPG 471
             G+  A G   + G +GP   +    P      GG +GP  PPG
Sbjct: 1106 RGLPGARGSNGNDGPSGPRGFDGPEGPRGPRGEGGSSGPPGPPG 1149

[156][TOP]
>UniRef100_Q16985 Fibroin-1 (Fragment) n=1 Tax=Araneus diadematus RepID=Q16985_ARADI
          Length = 360

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 53/169 (31%), Positives = 69/169 (40%), Gaps = 7/169 (4%)
 Frame = +1

Query: 49  GGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGY 228
           GG S AG+     Y  G  AGSG G   A++   S+ A+   G   G   GA    AGGY
Sbjct: 129 GGGSGAGAGGAGGYGQGYGAGSGAGAGAAAAAGASAGAAGGYGGGAGVGAGAGAGAAGGY 188

Query: 229 GASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASL 408
           G S  + A     +G+  +                  A  G  AA G    +GA   A  
Sbjct: 189 GQSYGSGAGAGAGAGAAAA------------------AGAGARAAGGYGGGYGAGAGAGA 230

Query: 409 NSAALPAYATGGGNGPAYPPGA---IVSPASTATF----NRLSPAAAAA 534
            +AA  +    GG G  Y  GA    V+ AS  ++    NRLS A AA+
Sbjct: 231 GAAA--SAGASGGYGGGYGGGAGAGAVAGASAGSYGGAVNRLSSAGAAS 277

[157][TOP]
>UniRef100_B4IJR5 GM13722 n=1 Tax=Drosophila sechellia RepID=B4IJR5_DROSE
          Length = 747

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 59/198 (29%), Positives = 71/198 (35%), Gaps = 25/198 (12%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGG------SSAAGSFSGPPYAPGVYAGSGP---------GGHPASS- 141
            PP  G H P   + G       +   ++ GPP+ P      GP         GGHP    
Sbjct: 549  PPHMGPHQPPPGMSGLPPPPPHTGYANYGGPPHGPPPGPPGGPARPYYQPQYGGHPTPQP 608

Query: 142  -YAPSS----SASLPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQ 306
             YAP S    S   P G+H  S    PP   G  G        ++ E GS     P PPQ
Sbjct: 609  YYAPFSPYQQSYGPPPGSHYMSPRPPPPQHNGNLGHP------YAPEHGS----NPPPPQ 658

Query: 307  MPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYAT-GGGNGPAYPP---GA 474
                  P P   H       G P   G  G A+  +     Y T G G GP  PP   GA
Sbjct: 659  QQQQQQPPPGHLHEPSAGGPGAP--GGGAGAAAAAAPGAGVYPTPGAGAGPGAPPAAGGA 716

Query: 475  IVSPASTATFNRLSPAAA 528
             +  A+ A      PA A
Sbjct: 717  TLGEAAVAGGVAPPPATA 734

[158][TOP]
>UniRef100_B3M1V5 GF17870 n=1 Tax=Drosophila ananassae RepID=B3M1V5_DROAN
          Length = 871

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 49/173 (28%), Positives = 64/173 (36%), Gaps = 4/173 (2%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
           S+G+  P S  G  +A     G P  P   +   P   P+SSY   +  S          
Sbjct: 221 SFGTSAPSSSYGAQAAPSKSYGAPAPPPSKSYGAPAAPPSSSYGAPAPPS--------KS 272

Query: 196 GGAPPSVAGGYGASGPTSATFSNESGSFQS--LQPAPPQMP--PPTGPSPHLAHGGVTAA 363
            GAPP+ +  YGA    SA  S+     +S    PAPP      P  PSP         +
Sbjct: 273 YGAPPAPSSSYGAPSAPSAPSSSYGSPSKSYGAPPAPPSQSYGAPAAPSP---------S 323

Query: 364 HGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPA 522
           +G P       PA   S   PA  +     PA P  +  +P      N L PA
Sbjct: 324 YGAP-------PAPSKSYGAPAPPSPSYGAPAPPSSSYGAPPQAPVSNYLPPA 369

[159][TOP]
>UniRef100_Q5STP6 Collagen, type XI, alpha 2 n=1 Tax=Homo sapiens RepID=Q5STP6_HUMAN
          Length = 1650

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 818

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 819  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 871

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 872  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 931

[160][TOP]
>UniRef100_C9J3N1 Putative uncharacterized protein ENSP00000405291 n=1 Tax=Homo sapiens
            RepID=C9J3N1_HUMAN
          Length = 1693

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 56/180 (31%), Positives = 61/180 (33%), Gaps = 25/180 (13%)
 Frame = +1

Query: 22   GSHVPGSVVGGSSAAGSFSG-----PPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGA 180
            G   P    G S A G+  G     PP   G+    GP G P       P     LP   
Sbjct: 761  GQRGPRGATGKSGAKGTSGGDGPHGPPGERGLPGPQGPNGFPGPKGPLGPPGKDGLP--G 818

Query: 181  HLGSRGGA----------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
            H G RG            PP V G  GA+G T      E G      P PP  P   G  
Sbjct: 819  HPGQRGEVGFQGKTGPPGPPGVVGPQGAAGETGPM--GERG-----HPGPPGPPGEQGLP 871

Query: 331  PHLAHGGVTAAHGVPRHHGANGPASL----NSAALPAYATG----GGNGPAYPPGAIVSP 486
                  G     G P   G +GPA L        LP  A G    G  GP+ PPG   SP
Sbjct: 872  GTAGKEGTKGDPGPPGAPGKDGPAGLRGFPGERGLPGTAGGPGLKGNEGPSGPPGPAGSP 931

[161][TOP]
>UniRef100_A0RUH1 Collagen type XI alpha 2 n=1 Tax=Cenarchaeum symbiosum
           RepID=A0RUH1_CENSY
          Length = 468

 Score = 55.5 bits (132), Expect = 2e-06
 Identities = 59/185 (31%), Positives = 66/185 (35%), Gaps = 29/185 (15%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGS-----FSGPPYAPGVYAGSGPGGHPASSYAPSSSASL 168
           +QPP+     P S  G    AG        GP  APG +   GP G P     P S    
Sbjct: 120 EQPPA---EPPASSRGEKGPAGQPGERGDKGPAGAPGEHGDKGPIGPPGERGIPGSPG-- 174

Query: 169 PQG-----------AHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQP------- 294
           PQG             +G RG   P  AG  G +GP     + + G    L P       
Sbjct: 175 PQGDKGPAGDKGITGDMGDRGDKGP--AGEPGETGPDGP--AGDKGDRGPLGPQGLPGER 230

Query: 295 --APPQMPP----PTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP 456
             A P  PP    PTG        G T   G P   G  GPA       PA    GG GP
Sbjct: 231 GDAGPHGPPGDKGPTGERGPTGTKGETGPPGTPGDKGLQGPAGPEGGKGPA-GVEGGKGP 289

Query: 457 AYPPG 471
           A PPG
Sbjct: 290 AGPPG 294

[162][TOP]
>UniRef100_UPI00016E6475 UPI00016E6475 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E6475
          Length = 1741

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 838  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 895

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 896  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 949

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 950  HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 993

[163][TOP]
>UniRef100_UPI00016E6474 UPI00016E6474 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E6474
          Length = 1792

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 889  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 946

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 947  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 1000

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 1001 HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1044

[164][TOP]
>UniRef100_UPI00016E6473 UPI00016E6473 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E6473
          Length = 1796

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 893  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 950

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 951  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 1004

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 1005 HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1048

[165][TOP]
>UniRef100_UPI00016E644C UPI00016E644C related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E644C
          Length = 1799

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 896  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 953

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 954  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 1007

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 1008 HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1051

[166][TOP]
>UniRef100_UPI00016E644B UPI00016E644B related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E644B
          Length = 1801

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 898  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 955

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 956  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 1009

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 1010 HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1053

[167][TOP]
>UniRef100_UPI00016E644A UPI00016E644A related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E644A
          Length = 1812

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 909  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 966

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 967  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 1020

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 1021 HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1064

[168][TOP]
>UniRef100_UPI00016E6426 UPI00016E6426 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E6426
          Length = 1810

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 907  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 964

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 965  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 1018

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 1019 HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1062

[169][TOP]
>UniRef100_UPI00016E6263 UPI00016E6263 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E6263
          Length = 1729

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 849  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 906

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 907  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 960

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 961  HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1004

[170][TOP]
>UniRef100_UPI00016E6262 UPI00016E6262 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E6262
          Length = 1725

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 845  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 902

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 903  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 956

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 957  HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 1000

[171][TOP]
>UniRef100_UPI00016E6261 UPI00016E6261 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E6261
          Length = 1737

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/169 (31%), Positives = 59/169 (34%), Gaps = 24/169 (14%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASS--YAPSSSASLPQGAHLGSRGGA------- 204
            G+S +   +GPP   G     GP G P       P     LP   H G RG         
Sbjct: 834  GTSGSDGPAGPPGERGPQGPQGPLGFPGPKGPNGPPGKDGLP--GHPGQRGETGFQGKTG 891

Query: 205  PPSVAGGYGASGPTSATF-SNESGSFQSLQPAPPQMPPPTG-------------PSPHLA 342
            PP   G  G  GPT  T  S E G      P PP  P   G             P P   
Sbjct: 892  PPGPGGVVGPQGPTGGTGPSGERG-----HPGPPGPPGEQGLPGAAGKEGGKGDPGPQ-G 945

Query: 343  HGGVTAAHGVPRHHGANG-PASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            H G     G+P   G  G P  +  A L      GG GP  PPG I SP
Sbjct: 946  HSGKAGPPGLPGFQGQRGLPGGMGPAGLK-----GGEGPQGPPGPIGSP 989

[172][TOP]
>UniRef100_UPI00016E0385 UPI00016E0385 related cluster n=1 Tax=Takifugu rubripes
           RepID=UPI00016E0385
          Length = 1425

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/191 (28%), Positives = 68/191 (35%), Gaps = 21/191 (10%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGS----------GPGGHPASSYAPSSS 159
           PP + SH PG +  G+  A  F G     G+ +GS          GP G P  + A    
Sbjct: 105 PPGHPSH-PGGI--GAQMASGFDGKSGPQGMLSGSRGEAGTRGPPGPSGSPGQAGAQGPP 161

Query: 160 ASLPQGAHLGSRG-GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP--PQMPPPTGPS 330
             +    H+GS G   P  + G  G  G      +N    F     A   P MP P G  
Sbjct: 162 GEVGDPGHMGSSGQRGPEGLMGKPGEDGEPGKPGNNGEMGFSGSPGARGFPGMPGPPGLK 221

Query: 331 PHLAHGGV---TAAHGVPRHHGANGPASLNSAALPAYATG-----GGNGPAYPPGAIVSP 486
            H  H G+      +G     GA GP     A  P    G     G +GP+  PG    P
Sbjct: 222 GHKGHLGILGQKGENGAVGSKGATGPHGPMGAPGPMGPAGMPGERGRSGPSGTPGKRGVP 281

Query: 487 ASTATFNRLSP 519
            S      L P
Sbjct: 282 GSVGKPGSLGP 292

[173][TOP]
>UniRef100_UPI00016E0384 UPI00016E0384 related cluster n=1 Tax=Takifugu rubripes
           RepID=UPI00016E0384
          Length = 1435

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/191 (28%), Positives = 68/191 (35%), Gaps = 21/191 (10%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGS----------GPGGHPASSYAPSSS 159
           PP + SH PG +  G+  A  F G     G+ +GS          GP G P  + A    
Sbjct: 115 PPGHPSH-PGGI--GAQMASGFDGKSGPQGMLSGSRGEAGTRGPPGPSGSPGQAGAQGPP 171

Query: 160 ASLPQGAHLGSRG-GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP--PQMPPPTGPS 330
             +    H+GS G   P  + G  G  G      +N    F     A   P MP P G  
Sbjct: 172 GEVGDPGHMGSSGQRGPEGLMGKPGEDGEPGKPGNNGEMGFSGSPGARGFPGMPGPPGLK 231

Query: 331 PHLAHGGV---TAAHGVPRHHGANGPASLNSAALPAYATG-----GGNGPAYPPGAIVSP 486
            H  H G+      +G     GA GP     A  P    G     G +GP+  PG    P
Sbjct: 232 GHKGHLGILGQKGENGAVGSKGATGPHGPMGAPGPMGPAGMPGERGRSGPSGTPGKRGVP 291

Query: 487 ASTATFNRLSP 519
            S      L P
Sbjct: 292 GSVGKPGSLGP 302

[174][TOP]
>UniRef100_UPI00016E0382 UPI00016E0382 related cluster n=1 Tax=Takifugu rubripes
           RepID=UPI00016E0382
          Length = 1420

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/191 (28%), Positives = 68/191 (35%), Gaps = 21/191 (10%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGS----------GPGGHPASSYAPSSS 159
           PP + SH PG +  G+  A  F G     G+ +GS          GP G P  + A    
Sbjct: 100 PPGHPSH-PGGI--GAQMASGFDGKSGPQGMLSGSRGEAGTRGPPGPSGSPGQAGAQGPP 156

Query: 160 ASLPQGAHLGSRG-GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP--PQMPPPTGPS 330
             +    H+GS G   P  + G  G  G      +N    F     A   P MP P G  
Sbjct: 157 GEVGDPGHMGSSGQRGPEGLMGKPGEDGEPGKPGNNGEMGFSGSPGARGFPGMPGPPGLK 216

Query: 331 PHLAHGGV---TAAHGVPRHHGANGPASLNSAALPAYATG-----GGNGPAYPPGAIVSP 486
            H  H G+      +G     GA GP     A  P    G     G +GP+  PG    P
Sbjct: 217 GHKGHLGILGQKGENGAVGSKGATGPHGPMGAPGPMGPAGMPGERGRSGPSGTPGKRGVP 276

Query: 487 ASTATFNRLSP 519
            S      L P
Sbjct: 277 GSVGKPGSLGP 287

[175][TOP]
>UniRef100_UPI00016E035C UPI00016E035C related cluster n=1 Tax=Takifugu rubripes
           RepID=UPI00016E035C
          Length = 1427

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/191 (28%), Positives = 68/191 (35%), Gaps = 21/191 (10%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGS----------GPGGHPASSYAPSSS 159
           PP + SH PG +  G+  A  F G     G+ +GS          GP G P  + A    
Sbjct: 107 PPGHPSH-PGGI--GAQMASGFDGKSGPQGMLSGSRGEAGTRGPPGPSGSPGQAGAQGPP 163

Query: 160 ASLPQGAHLGSRG-GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP--PQMPPPTGPS 330
             +    H+GS G   P  + G  G  G      +N    F     A   P MP P G  
Sbjct: 164 GEVGDPGHMGSSGQRGPEGLMGKPGEDGEPGKPGNNGEMGFSGSPGARGFPGMPGPPGLK 223

Query: 331 PHLAHGGV---TAAHGVPRHHGANGPASLNSAALPAYATG-----GGNGPAYPPGAIVSP 486
            H  H G+      +G     GA GP     A  P    G     G +GP+  PG    P
Sbjct: 224 GHKGHLGILGQKGENGAVGSKGATGPHGPMGAPGPMGPAGMPGERGRSGPSGTPGKRGVP 283

Query: 487 ASTATFNRLSP 519
            S      L P
Sbjct: 284 GSVGKPGSLGP 294

[176][TOP]
>UniRef100_UPI00016E0359 UPI00016E0359 related cluster n=1 Tax=Takifugu rubripes
           RepID=UPI00016E0359
          Length = 1419

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/191 (28%), Positives = 68/191 (35%), Gaps = 21/191 (10%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGS----------GPGGHPASSYAPSSS 159
           PP + SH PG +  G+  A  F G     G+ +GS          GP G P  + A    
Sbjct: 105 PPGHPSH-PGGI--GAQMASGFDGKSGPQGMLSGSRGEAGTRGPPGPSGSPGQAGAQGPP 161

Query: 160 ASLPQGAHLGSRG-GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP--PQMPPPTGPS 330
             +    H+GS G   P  + G  G  G      +N    F     A   P MP P G  
Sbjct: 162 GEVGDPGHMGSSGQRGPEGLMGKPGEDGEPGKPGNNGEMGFSGSPGARGFPGMPGPPGLK 221

Query: 331 PHLAHGGV---TAAHGVPRHHGANGPASLNSAALPAYATG-----GGNGPAYPPGAIVSP 486
            H  H G+      +G     GA GP     A  P    G     G +GP+  PG    P
Sbjct: 222 GHKGHLGILGQKGENGAVGSKGATGPHGPMGAPGPMGPAGMPGERGRSGPSGTPGKRGVP 281

Query: 487 ASTATFNRLSP 519
            S      L P
Sbjct: 282 GSVGKPGSLGP 292

[177][TOP]
>UniRef100_UPI00016E0334 UPI00016E0334 related cluster n=1 Tax=Takifugu rubripes
           RepID=UPI00016E0334
          Length = 1479

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/191 (28%), Positives = 68/191 (35%), Gaps = 21/191 (10%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGS----------GPGGHPASSYAPSSS 159
           PP + SH PG +  G+  A  F G     G+ +GS          GP G P  + A    
Sbjct: 159 PPGHPSH-PGGI--GAQMASGFDGKSGPQGMLSGSRGEAGTRGPPGPSGSPGQAGAQGPP 215

Query: 160 ASLPQGAHLGSRG-GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP--PQMPPPTGPS 330
             +    H+GS G   P  + G  G  G      +N    F     A   P MP P G  
Sbjct: 216 GEVGDPGHMGSSGQRGPEGLMGKPGEDGEPGKPGNNGEMGFSGSPGARGFPGMPGPPGLK 275

Query: 331 PHLAHGGV---TAAHGVPRHHGANGPASLNSAALPAYATG-----GGNGPAYPPGAIVSP 486
            H  H G+      +G     GA GP     A  P    G     G +GP+  PG    P
Sbjct: 276 GHKGHLGILGQKGENGAVGSKGATGPHGPMGAPGPMGPAGMPGERGRSGPSGTPGKRGVP 335

Query: 487 ASTATFNRLSP 519
            S      L P
Sbjct: 336 GSVGKPGSLGP 346

[178][TOP]
>UniRef100_B2I413 Conserved hypothetical membrane protein n=2 Tax=Mycobacterium
           RepID=B2I413_MYCMM
          Length = 814

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 62/203 (30%), Positives = 73/203 (35%), Gaps = 28/203 (13%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
           A  P   G+     +  G    GS  G P  PG   G G GG P +   P S      GA
Sbjct: 268 AASPLGGGAPSMSGLGSGGGGMGSGGGIPKMPG---GLGSGGMPGTGSNPLSGVGQMPGA 324

Query: 181 HLG--SRGGAPP-SVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSP------ 333
             G  + GG P  S AGG       +   +  +G    + PAPP  P P  PSP      
Sbjct: 325 GSGLPNAGGLPTASNAGGASPLSAFNQGAAATAGMGGGIPPAPP--PAPASPSPAPSAGG 382

Query: 334 HLA------HGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP------------- 456
           H A       GGV+ A   P   G   PA+  SA        GG  P             
Sbjct: 383 HAAPAAAAPGGGVSPAAAQP---GVVAPAAPASAPTGVGVGAGGGAPMMLPPGSMGPPAA 439

Query: 457 AYPPGAIVSPASTATFNRLSPAA 525
           A PP A   PA T      +PAA
Sbjct: 440 AIPPPAATVPAGTVGSTNTAPAA 462

[179][TOP]
>UniRef100_A9VS75 Collagen triple helix repeat n=1 Tax=Bacillus weihenstephanensis
           KBAB4 RepID=A9VS75_BACWK
          Length = 385

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 52/176 (29%), Positives = 64/176 (36%), Gaps = 14/176 (7%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPS--SSASLPQGAH 183
           PP  G   P  + G +  +G   GP    G+   +GP G P     P+  + A+ P G  
Sbjct: 86  PP--GPTGPTGITGATGPSGGPPGPTGPTGITGATGPSGGPPGPIGPTGITGATGPSGGP 143

Query: 184 LGSRG-----------GAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPP-PTGP 327
            G  G           G PP   G  G +G T AT              P   PP PTGP
Sbjct: 144 PGPTGPTGITGATGPSGGPPGPTGPTGITGATGAT-------------GPSGGPPGPTGP 190

Query: 328 SPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAST 495
           +      G T   G P   G  GP  +  A  P+    G  GP    GA  S  ST
Sbjct: 191 T---GITGATGPSGGP--PGPTGPTGITGATGPSGGPPGPTGPTGITGATGSTGST 241

[180][TOP]
>UniRef100_A9EZ28 Protein kinase n=1 Tax=Sorangium cellulosum 'So ce 56'
           RepID=A9EZ28_SORC5
          Length = 721

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 58/198 (29%), Positives = 79/198 (39%), Gaps = 25/198 (12%)
 Frame = +1

Query: 13  PSYGSHV-PGSVVGGSSAAGSFS--GPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA- 180
           P+ GS + PGS    S  A + +  G P    + A    GGHP  + A   + + P  A 
Sbjct: 344 PAIGSELGPGSSGASSWEAATMAAHGAPRGSAMDAAQAHGGHPGMAQAAPGAPNGPPSAL 403

Query: 181 ------HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLA 342
                 H G+ G APPS  G  GA      +  N      +  PA     P  GPS    
Sbjct: 404 HNTGAGHAGAHG-APPSWQGA-GAPHSAPVSLHNTGSGLHNTGPAYGAPAPAHGPS---- 457

Query: 343 HGGVTAAHGVPRHHGANGPASLNSAALPAYATGGG--------------NGPAYPPGAIV 480
                A HG P H    GP++ +SA +  + TG G              +GP+ P GA V
Sbjct: 458 -----APHGAPAH----GPSAPHSAPVSLHNTGSGLHNAGPAYGALAPAHGPSAPHGAPV 508

Query: 481 SPASTAT-FNRLSPAAAA 531
           S  +T +  +   PA  A
Sbjct: 509 SLHNTGSGLHNAGPAYGA 526

[181][TOP]
>UniRef100_A4T503 Conserved hypothetical alanine and proline rich protein n=1
           Tax=Mycobacterium gilvum PYR-GCK RepID=A4T503_MYCGI
          Length = 664

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 52/164 (31%), Positives = 64/164 (39%), Gaps = 6/164 (3%)
 Frame = +1

Query: 25  SHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGA 204
           S    S    SS   S  GPP   G  +GS       +S +PS+++    GA      GA
Sbjct: 202 SAASASTPSASSPMSSSGGPPSTGGASSGSPSASTSPASGSPSTASPTTSGA-----AGA 256

Query: 205 PPSVAGGYGAS----GPTSATFSNESGSFQSLQPA-PPQMPPPTGPSPHLAHGGVTAAHG 369
            PS A   GA+     P    F N+S    S  PA  P  PP + P+P    G    A  
Sbjct: 257 QPSNASPAGAAKAQPSPIQQVF-NQSAPLASSAPAQSPAAPPSSAPAPTTPAGAAPTA-- 313

Query: 370 VPRHHGANGPASLNSAALP-AYATGGGNGPAYPPGAIVSPASTA 498
                GA G  S +    P A A  G   PA PP  +  P S A
Sbjct: 314 ---GTGAGGGLSTSGGPAPVAGAPAGAAPPAAPPVPLAPPTSPA 354

[182][TOP]
>UniRef100_A4JMC1 Putative uncharacterized protein n=1 Tax=Burkholderia vietnamiensis
           G4 RepID=A4JMC1_BURVG
          Length = 715

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 42/138 (30%), Positives = 64/138 (46%)
 Frame = +1

Query: 121 GGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAP 300
           G   AS  + +S+A+   GA   ++ GA  +  G    + PT++  S+       + PA 
Sbjct: 122 GAGAASGASAASAAAAGSGAAASAQHGASAAHPGSAAVAAPTASAVSSAP-----IAPAA 176

Query: 301 PQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIV 480
           P  P  +  +P  A  G +++ G    HGA+  A+    A PA   GG +GP    GAI 
Sbjct: 177 PAAPTSSANAP--AANGASSSAGASATHGASSAAT----AQPAAPVGGASGPHVWNGAIQ 230

Query: 481 SPASTATFNRLSPAAAAA 534
           S  S+A+     PAA  A
Sbjct: 231 SAPSSASEAAAQPAAGGA 248

[183][TOP]
>UniRef100_C2X3H2 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           Rock4-18 RepID=C2X3H2_BACCE
          Length = 1289

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 47/157 (29%), Positives = 62/157 (39%), Gaps = 16/157 (10%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+     S+  + P GA  G+ G     
Sbjct: 206 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSG----STGVTGPTGA-TGNTG----- 255

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ----------PAPPQ----MPPPTGPSPHLAHGG 351
            A G G +GPT +T    +   Q +Q          P  PQ    +P PTG +      G
Sbjct: 256 -ATGQGLTGPTGSTGETGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQG 314

Query: 352 VTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
           V    G+    G  GP  +  A  P   TG  G  GP
Sbjct: 315 VQGIQGIMGATGDQGPQGIQGAIGPQGVTGATGDQGP 351

[184][TOP]
>UniRef100_C2VI92 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           Rock3-29 RepID=C2VI92_BACCE
          Length = 956

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 47/157 (29%), Positives = 62/157 (39%), Gaps = 16/157 (10%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+     S+  + P GA  G+ G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSG----STGMTGPTGA-TGNTG----- 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ----------PAPPQ----MPPPTGPSPHLAHGG 351
            A G G +GPT +T    +   Q +Q          P  PQ    +P PTG +      G
Sbjct: 245 -ATGQGLTGPTGSTGETGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQG 303

Query: 352 VTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
           V    G+    G  GP  +  A  P   TG  G  GP
Sbjct: 304 VQGIQGITGATGDQGPQGIQGAIGPQGVTGVTGDQGP 340

[185][TOP]
>UniRef100_C2U3W8 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           Rock1-3 RepID=C2U3W8_BACCE
          Length = 926

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 48/160 (30%), Positives = 62/160 (38%), Gaps = 19/160 (11%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+     S+  + P GA  G+ G     
Sbjct: 195 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSG----STGVTGPTGA-TGNTG----- 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------------PAPPQ----MPPPTGPSPHLA 342
            A G G +GPT +T    +   Q LQ             P  PQ    +P PTG +    
Sbjct: 245 -ATGQGLTGPTGSTGETGAQGLQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQG 303

Query: 343 HGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             GV    G+    G  GP  +  A  P   TG  G  GP
Sbjct: 304 IQGVQGIQGITGATGDQGPQGIQGAIGPQGVTGVTGDQGP 343

[186][TOP]
>UniRef100_C2MS36 Collagen triple helix repeat domain protein n=1 Tax=Bacillus cereus
           m1293 RepID=C2MS36_BACCE
          Length = 1246

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 42/154 (27%), Positives = 59/154 (38%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G+ G     
Sbjct: 192 PTGITGPTGITGPSGGPPGPTGPTGATGPGGGPSGSTGATGAT-----GNTGATGNT--G 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           + G  G +GPT +T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 245 ITGATGTTGPTGSTGAQGLQGIQGIQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 304

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G+    G  GP  +     P   TG  G  GP
Sbjct: 305 IQGITGATGDQGPQGIQGVIGPQGVTGATGDQGP 338

[187][TOP]
>UniRef100_Q9BIU8 Flagelliform silk protein (Fragment) n=1 Tax=Argiope trifasciata
           RepID=Q9BIU8_ARGTR
          Length = 1002

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 56/179 (31%), Positives = 63/179 (35%), Gaps = 22/179 (12%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASL-----PQGAHLGSRG 198
           P  V GG   AG   G  + PG  AG GPGG P +   P           P G   G  G
Sbjct: 385 PEGVGGGPGGAGP-GGAGFGPGGGAGFGPGGAPGAPGGPGGPGGPGGPGGPGGVGPGGAG 443

Query: 199 GAPPSVAGGYGASGPTSATFSNESGSFQ-------------SLQPAPPQMPPPTGPSPHL 339
           G  P  AGG G +G T       +G F                 PA      P G  P  
Sbjct: 444 GYGPGGAGGVGPAG-TGGFGPGGAGGFGPGGAGGFGPGGAGGFGPAGAGGYGPGGVGPGG 502

Query: 340 AHG----GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATF 504
           A G    GV      P   G  GP +++       A GGG G A P GA   P   A F
Sbjct: 503 AGGFGPGGVGPGGSGPGGAGGEGPVTVDVDVSVGGAPGGGPGGAGPGGAGFGPGGGAGF 561

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 55/179 (30%), Positives = 62/179 (34%), Gaps = 22/179 (12%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASL-----PQGAHLGSRG 198
            P  V GG   AG   G  + PG  AG GPGG P +   P           P G   G  G
Sbjct: 653  PEGVGGGPGGAGP-GGAGFGPGGGAGFGPGGAPGAPGGPGGPGGPGGPGGPGGVGPGGAG 711

Query: 199  GAPPSVAGGYGASGPTSATFSNESGSFQ-------------SLQPAPPQMPPPTGPSPHL 339
            G  P  AGG+G  G T       +G F                 P       P G  P  
Sbjct: 712  GYGPGGAGGFGPGG-TGGFGPGGAGGFGPGGAGGFGPGGAGGFGPGGAGGYGPGGVGPGG 770

Query: 340  AHG----GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATF 504
            A G    GV      P   G  GP +++       A GGG G A P GA   P   A F
Sbjct: 771  AGGFGPGGVGPGGSGPGGAGGEGPVTVDVDVSVGGAPGGGPGGAGPGGAGFGPGGGAGF 829

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 55/182 (30%), Positives = 59/182 (32%), Gaps = 25/182 (13%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGP----PYAPGVYAGSGPGG---HPASSYAPSSS------ASLPQ 174
            PG   GG S  G   GP     Y PG   G GPGG     A  Y P  +       S P 
Sbjct: 839  PGGAAGGPSGPGGPGGPGGAGGYGPGGAGGYGPGGVGPGGAGGYGPGGAGGYGPGGSGPG 898

Query: 175  GAHLGSRGG------------APPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPP 318
            GA  G  GG             P  V GG G +GP  A F    G+      AP     P
Sbjct: 899  GAGPGGAGGEGPVTVDVDVTVGPEGVGGGPGGAGPGGAGFGPGGGAGFGPGGAPGAPGGP 958

Query: 319  TGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTA 498
             GP      GG           G  GP  +       Y  GG  G        V PA T 
Sbjct: 959  GGP------GG---------PGGPGGPGGVGPGGAGGYGPGGAGG--------VGPAGTG 995

Query: 499  TF 504
             F
Sbjct: 996  GF 997

[188][TOP]
>UniRef100_B7QAA1 Alpha-1 collagen type III, putative (Fragment) n=1 Tax=Ixodes
           scapularis RepID=B7QAA1_IXOSC
          Length = 507

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/179 (30%), Positives = 64/179 (35%), Gaps = 32/179 (17%)
 Frame = +1

Query: 52  GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSS--------SASLPQG----AHLGSR 195
           GS  AG  SGP Y PG  +    GG+P S  AP S        S   P G       G+ 
Sbjct: 20  GSGGAGRPSGPAYRPG--SSGAAGGYPGSGGAPGSGGAGGYPGSGGYPGGGGAPGAAGAG 77

Query: 196 GGAPPSVAGGY------------------GASGPTSATFSNESGSFQSLQPAPPQMPPPT 321
           GG P   AGGY                  G +G   +     SG +    P     P   
Sbjct: 78  GGYPKPGAGGYPGSGGVGPGAPGSGGYGPGGAGKPGSGGKPGSGGYGGGYPGSGGYPGSG 137

Query: 322 GPSPHLAHGGVTAAHGVPRHHGA--NGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS 492
           G   +   GG +   G P   GA  +GP S  S     Y   GG G A  PG+   P S
Sbjct: 138 GSGGYPGSGGSSGPGGYPGPGGASSSGPGSYPSGGGGGYRPSGGTG-AGAPGSYGKPGS 195

[189][TOP]
>UniRef100_A8XVD3 C. briggsae CBR-COL-147 protein n=1 Tax=Caenorhabditis briggsae
           RepID=A8XVD3_CAEBR
          Length = 290

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 45/161 (27%), Positives = 57/161 (35%), Gaps = 2/161 (1%)
 Frame = +1

Query: 52  GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYG 231
           G+ + G  +GPP  PG     G  GHP  +  P ++     G  +G  GG  P +    G
Sbjct: 80  GAQSNGCPAGPPGPPGQPGAQGDAGHPGEAGKPGAN-----GVTIGLTGGNGPCITCPAG 134

Query: 232 ASGPTSATFS--NESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPAS 405
           A GP  A  +   +  S    Q A    P P GP       G     G P   G  G   
Sbjct: 135 APGPAGAPGAPGPQGPSGAPGQDAVGGGPGPAGPQGPAGDAGAPGQPGAPGQPGNAGRGG 194

Query: 406 LNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
             S   P  A  G  GP  P G    P  +       PA +
Sbjct: 195 QRSRGTPGPA--GAPGPQGPAGGPGQPGQSGGAGAPGPAGS 233

[190][TOP]
>UniRef100_A6YIY0 Major ampullate spidroin 2 n=1 Tax=Latrodectus hesperus
            RepID=A6YIY0_9ARAC
          Length = 3779

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 54/181 (29%), Positives = 70/181 (38%), Gaps = 18/181 (9%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
            P     + PGS   G++AA +  GP Y  G   G GPGG  A++ A +++   P G   G
Sbjct: 2525 PDRQQGYGPGS--SGAAAAAAAGGPGY--GGQQGYGPGGAGAAAAAAAAAGPGPSGYGPG 2580

Query: 190  SRGGAPPSVA-------------GGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS 330
              G A  + A              GYG SGP     +   GS  +   A        G  
Sbjct: 2581 GAGAAAAAAAAGGSGPGGYGQGPSGYGPSGPGGQQGNGPGGSGAAAAAAAAAGGAGPGRQ 2640

Query: 331  PHLAHGG--VTAAHGVPRHHGANGPASLNSAALPAYATGG---GNGPAYPPGAIVSPAST 495
                 GG    AA G P + G  G     + A  A A GG   G   AY PG   + A+ 
Sbjct: 2641 QGYGPGGAAAAAAAGGPGYGGQQGYGPGGAGAAAAAAAGGAGPGRQQAYGPGGAGAAAAA 2700

Query: 496  A 498
            A
Sbjct: 2701 A 2701

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 51/174 (29%), Positives = 70/174 (40%), Gaps = 1/174 (0%)
 Frame = +1

Query: 13   PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
            P +G    G   GGS AA + +     PG     GPGG  A++ A +++ S P G    +
Sbjct: 3548 PGFGGQ-QGYGPGGSGAAAAAAAGGAGPGRQQAYGPGGSGAAAAAAAAAGSGPSGYGPSA 3606

Query: 193  RGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGV 372
             G + P  +G  G SGP         G F        Q P   GPS              
Sbjct: 3607 AGPSGPGGSGAAGGSGP---------GGF-------GQGPAGYGPSG------------- 3637

Query: 373  PRHHGANGPASLNSAALPAYATGGGNGPA-YPPGAIVSPASTATFNRLSPAAAA 531
            P      GP +  +AA  A +  GG GP+ Y P ++ S A++A     SP   A
Sbjct: 3638 PGGQQGYGPGASGAAAAAAASGSGGYGPSQYVPSSVASSAASAASALSSPTTHA 3691

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 49/172 (28%), Positives = 69/172 (40%), Gaps = 8/172 (4%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGP----PYAPGVYAGSGPGGHPASSYAPSSSASLPQG 177
           P   G+    +  GGS   G   GP    P  P    G GPGG  A++ A +++ S P G
Sbjct: 231 PGGAGAAAGAAAAGGSGPGGYGQGPAAYGPSGPSGQQGYGPGGSGAAAAAAAAAGSGPSG 290

Query: 178 AHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG--- 348
              G   G P    GG GA+   +A   +  G +   Q +      P+GPS    +G   
Sbjct: 291 --YGPGAGGP----GGAGAAAAAAAAGGSGPGGYGQGQAS----YGPSGPSGQQGYGPGG 340

Query: 349 -GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTAT 501
            G  AA       G +G     +AA  A + G G    Y PG   + A+  +
Sbjct: 341 SGAAAAAAAAAGSGPSGYGPGAAAAAAAGSAGPGTQQGYGPGGSGAAAAAGS 392

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 51/169 (30%), Positives = 68/169 (40%), Gaps = 7/169 (4%)
 Frame = +1

Query: 13   PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
            P YG    G   GG+ AA + +     PG     GPGG  A++ A +++   P G   G+
Sbjct: 2657 PGYGGQ-QGYGPGGAGAAAAAAAGGAGPGRQQAYGPGGAGAAAAAAAAAGPGPSGYGPGA 2715

Query: 193  RGGAPPSVAGGYGASGPTSATFSNESGSF----QSLQPAPPQMPPPTGPSPHLAHGGVTA 360
             G   PS  GG GA+   +A   +  G +        P+ P      GP    A     A
Sbjct: 2716 SG---PSGTGGAGAAAAAAAAGGSGPGGYGQGASGYGPSGPGGQQGYGPGGSGAAAAAAA 2772

Query: 361  AHGV--PRHHGANGPASLNSAALPAYATGGGNGP-AYPPGAIVSPASTA 498
            A G   P      GP S  +AA  A    G  GP  Y PG   + A+ A
Sbjct: 2773 AAGGAGPGRQQGYGPGSSGAAAAAAAGGPGYGGPQGYGPGGAGAAAAAA 2821

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 57/178 (32%), Positives = 71/178 (39%), Gaps = 5/178 (2%)
 Frame = +1

Query: 13   PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASL---PQGAH 183
            P YG    G  +G + AA + +     PG     GPGG  A++ A + S      P  A 
Sbjct: 3137 PGYGGQ-QGYGLGVAGAAAAVAAGGAGPGRQQAYGPGGSGAAAAAAAGSGRSGYGPGAAG 3195

Query: 184  LGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAA 363
             G  G A  + AGG G SG   A     SG+  +     P      G  P  A     AA
Sbjct: 3196 TGGAGAAAAAAAGGAG-SGRQQAYGPGGSGAAAASAAGGPGYGGQQGYGPGGAGAAAAAA 3254

Query: 364  HG--VPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAA 531
             G   P    A GP    +AA  A A+G G    Y PGA   P+  A     + AAAA
Sbjct: 3255 AGGAGPGTQQAYGPGGSGAAAAAAAASGPGPS-GYEPGA-AGPSGPAGAGAAAAAAAA 3310

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 55/182 (30%), Positives = 79/182 (43%), Gaps = 7/182 (3%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSFSGPP---YAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
            P +  ++ PG   G ++AA + SGP    Y PG    SGP G  A++ A ++  S P G 
Sbjct: 3260 PGTQQAYGPGGS-GAAAAAAAASGPGPSGYEPGAAGPSGPAGAGAAAAAAAAGGSGPGGY 3318

Query: 181  HLGSRGGAPPSVAG----GYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHG 348
              G  G  P    G    G G SG  +A  +   G+    Q    Q    +G +   A G
Sbjct: 3319 GQGPSGYGPSGPGGQQGYGPGGSGAAAAAAAAAGGAGPGRQQGYGQ--GSSGAAAAAAAG 3376

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
            G    +G  + +G  G  +  +AA+ A   G G   AY PG   + A +   +   P AA
Sbjct: 3377 G--PGYGGQQVYGPGGAGA--AAAVAAGGAGPGRQQAYGPGGSGAAAGSGP-SGYGPGAA 3431

Query: 529  AA 534
            AA
Sbjct: 3432 AA 3433

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 50/165 (30%), Positives = 64/165 (38%), Gaps = 8/165 (4%)
 Frame = +1

Query: 4    QQPPSYGSHVPGSVVG------GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSAS 165
            Q P  YG   PG   G      G++AA + +     PG   G GPGG  A++ A      
Sbjct: 2601 QGPSGYGPSGPGGQQGNGPGGSGAAAAAAAAAGGAGPGRQQGYGPGGAAAAAAAGGPGYG 2660

Query: 166  LPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAH 345
              QG   G  G A  + AGG   +GP         G+  +   A    P P+G  P    
Sbjct: 2661 GQQGYGPGGAGAAAAAAAGG---AGPGRQQAYGPGGAGAAAAAAAAAGPGPSGYGP---- 2713

Query: 346  GGVTAAHGVPRHHGANGPASLNSA-ALPAYATGGGNGP-AYPPGA 474
                         GA+GP+    A A  A A  GG+GP  Y  GA
Sbjct: 2714 -------------GASGPSGTGGAGAAAAAAAAGGSGPGGYGQGA 2745

[191][TOP]
>UniRef100_A2R1W4 Differential expressed Arsa-7 from patent
           US2003215950-A1-Aspergillus niger n=1 Tax=Aspergillus
           niger CBS 513.88 RepID=A2R1W4_ASPNC
          Length = 406

 Score = 55.1 bits (131), Expect = 3e-06
 Identities = 59/150 (39%), Positives = 67/150 (44%), Gaps = 5/150 (3%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGPPYAP-GVYAGSGPGGHPASSY---APSSSASLPQGAH 183
           S GS   GS     S + SF G   AP GV  G+GP   P+ S+   APS  A     + 
Sbjct: 273 SQGSFEQGSSSEQGSGSSSFGGNGAAPSGVAGGNGPS--PSGSFGGAAPSGVAGGNGPSP 330

Query: 184 LGSRGGAPPS-VAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTA 360
            GS GGA PS VAGG G S          SGSF     AP  +    GPSP  + GG  A
Sbjct: 331 SGSFGGAAPSGVAGGNGPS---------PSGSFGGNGAAPSGVAGGNGPSPSGSFGGNGA 381

Query: 361 AHGVPRHHGANGPASLNSAALPAYATGGGN 450
           A       GA G A   S A PA A  G +
Sbjct: 382 APS-----GAAGGAPAASGA-PAAAPSGAS 405

[192][TOP]
>UniRef100_UPI000186E27C conserved hypothetical protein n=1 Tax=Pediculus humanus corporis
           RepID=UPI000186E27C
          Length = 607

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 52/174 (29%), Positives = 76/174 (43%), Gaps = 15/174 (8%)
 Frame = +1

Query: 34  PGSVVGGSSA----AGSFSG---PPYAPGVYAGS-GPGGHPASSYAPSSSASLPQGAHLG 189
           PGS  GG+      +GSF G   P    G + GS GP G P+ S+  +   S P G+  G
Sbjct: 424 PGSSFGGAQGPFGPSGSFGGSQGPSGPSGTFGGSQGPSG-PSESFGGNQGPSGPSGSFGG 482

Query: 190 SRGGAPPSVA--GGYGASGPTSATFSNESGSFQSLQPAP--PQMPP---PTGPSPHLAHG 348
           S+G + PSV+  G  G+  P +      S +F    P    P   P   P G SP    G
Sbjct: 483 SQGTSGPSVSFVGQQGSRVPVTGGSPGPSSTFGPTTPTAGYPSASPTQRPGGYSPSGTSG 542

Query: 349 GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNR 510
           G T +       G +  ++  ++  P  AT    GP++ P +   P S+   N+
Sbjct: 543 GYTPS-------GPSSTSAFGNSQRPVSAT--TTGPSFGPSSTFGPPSSRPNNQ 587

[193][TOP]
>UniRef100_UPI0000DD8F95 Os04g0245000 n=1 Tax=Oryza sativa Japonica Group RepID=UPI0000DD8F95
          Length = 1541

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 54/169 (31%), Positives = 60/169 (35%), Gaps = 6/169 (3%)
 Frame = +1

Query: 1    AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
            A  PPS G+  P          G  +G P  P +    G GGH A    P     LP+G 
Sbjct: 1098 APPPPSIGAGAPPP----PPPPGGITGVPPPPPI---GGLGGHQAPPAPP-----LPEGI 1145

Query: 181  HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTG-----PSPHLAH 345
                 G  PP   GG G                      PP  PPP G     P P+ AH
Sbjct: 1146 G----GVPPPPPVGGLGG---------------------PPAPPPPAGFRGGTPPPN-AH 1179

Query: 346  GGVTAAHGVPRHHGA-NGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
            GGV      PR HG   GP +   A  P    G   GP  PPG    PA
Sbjct: 1180 GGVAPPPPPPRGHGGVGGPPTPPGAPAPPMPPGVPGGPPPPPGGRGLPA 1228

[194][TOP]
>UniRef100_UPI00017B2D12 UPI00017B2D12 related cluster n=1 Tax=Tetraodon nigroviridis
           RepID=UPI00017B2D12
          Length = 1568

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 57/187 (30%), Positives = 77/187 (41%), Gaps = 27/187 (14%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVG---GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
           PP    H PG  V    G  + GS SGP Y P        G +   SY  S + S     
Sbjct: 120 PPVSPHHTPGGPVYPGMGPYSQGSPSGP-YGPQGSQYGHQGNYHRPSYGGSGATSYSGSN 178

Query: 181 HLGSRGGAPPSVAGGYGASGPTSATFSNESGS----FQSLQPAPPQMPPPTGPS---PHL 339
           +LG   G+P     G G+S P     ++ SGS    + ++ P  P MP P GP    P L
Sbjct: 179 NLGMNAGSPGL---GQGSSQPIPVRRNHGSGSQNRGYPAMAPISPSMPHPVGPGMGPPSL 235

Query: 340 A------HGGVTAA------HGVPRHHGANGPASLNSAALPAYATGG-----GNGPAYPP 468
           A        G  AA      HG  +  G + P+++ +    +  TG      GNG A  P
Sbjct: 236 AASNRKPQEGTVAANSTQSRHGTYQGPGVSQPSTMATIVPYSQPTGNNSSDMGNGQA--P 293

Query: 469 GAIVSPA 489
           G  ++PA
Sbjct: 294 GYTIAPA 300

[195][TOP]
>UniRef100_Q1B7N1 Putative uncharacterized protein n=1 Tax=Mycobacterium sp. MCS
           RepID=Q1B7N1_MYCSS
          Length = 771

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 51/184 (27%), Positives = 70/184 (38%), Gaps = 28/184 (15%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           PG+ V  S   G+ + PP  P     S  G  P +  AP +    P    +     A  +
Sbjct: 18  PGAPVAASGGVGAPAAPPAVPAGVVDSSSGVTPPAPAAPPAGVVQPAAGAVPPAPSAVGA 77

Query: 214 VAGGYGASG-------PTSATFSNESGSFQSLQPAPPQ--------MPPPTGPSPHLAHG 348
            AGG G +G       P +A     +G+     PAPP         + PP  P+P    G
Sbjct: 78  PAGGSGGAGAPAAPPAPPAAVVEPAAGATPPAPPAPPAAVVEPASGVTPPAPPAPGGPAG 137

Query: 349 GVTAAHGVPRH--------HGANG--PASLNSAALPAYATGGG---NGPAYPPGAIVSPA 489
           G   A   P            A+G  P +  +   PA  +GG     GP  PP A+V PA
Sbjct: 138 GSGGAVTPPGPPAPPAAVVEPASGVTPPAPPAPGGPAGGSGGAVTPPGPPAPPAAVVEPA 197

Query: 490 STAT 501
           +  T
Sbjct: 198 AGVT 201

[196][TOP]
>UniRef100_A8LHL3 Putative uncharacterized protein n=1 Tax=Frankia sp. EAN1pec
           RepID=A8LHL3_FRASN
          Length = 391

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 53/172 (30%), Positives = 73/172 (42%), Gaps = 7/172 (4%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGPPYA---PGVYAGSGPGGHPASSYAPSSSASLPQ 174
           +  PS G  VP S  GG+    S SGPP A   P   AG  P  H   S+A  S AS   
Sbjct: 11  ESSPSSGP-VP-SPAGGNPQPLSTSGPPQASTWPAPQAGGEPAPHATGSHAAGSGASQAP 68

Query: 175 GAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPP---TGPSPHLAH 345
           G   GS   + P   G   A G  S+  +   G+     P P   PPP   +G  P  + 
Sbjct: 69  G-WTGSPAWSGPPPPGPGSAPGEVSSRAAASPGA-----PVPGVSPPPRVASGALPRWSL 122

Query: 346 GGVTAAHGVPRHHGANGPASLNSAALPAYATGGG-NGPAYPPGAIVSPASTA 498
           G    A  +         A++N+++L +   GGG  G    P  +++PA +A
Sbjct: 123 GRTAVAGAIALALAVGAAAAVNASSLGSDGAGGGPGGLRGGPFQVMNPAGSA 174

[197][TOP]
>UniRef100_Q01HL2 H0211F06-OSIGBa0153M17.6 protein n=1 Tax=Oryza sativa
            RepID=Q01HL2_ORYSA
          Length = 1510

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 54/169 (31%), Positives = 60/169 (35%), Gaps = 6/169 (3%)
 Frame = +1

Query: 1    AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
            A  PPS G+  P          G  +G P  P +    G GGH A    P     LP+G 
Sbjct: 1098 APPPPSIGAGAPPP----PPPPGGITGVPPPPPI---GGLGGHQAPPAPP-----LPEGI 1145

Query: 181  HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTG-----PSPHLAH 345
                 G  PP   GG G                      PP  PPP G     P P+ AH
Sbjct: 1146 G----GVPPPPPVGGLGG---------------------PPAPPPPAGFRGGTPPPN-AH 1179

Query: 346  GGVTAAHGVPRHHGA-NGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
            GGV      PR HG   GP +   A  P    G   GP  PPG    PA
Sbjct: 1180 GGVAPPPPPPRGHGGVGGPPTPPGAPTPPMPPGVPGGPPPPPGGRGLPA 1228

[198][TOP]
>UniRef100_B9FE31 Putative uncharacterized protein n=1 Tax=Oryza sativa Japonica Group
            RepID=B9FE31_ORYSJ
          Length = 1980

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 54/169 (31%), Positives = 60/169 (35%), Gaps = 6/169 (3%)
 Frame = +1

Query: 1    AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
            A  PPS G+  P          G  +G P  P +    G GGH A    P     LP+G 
Sbjct: 1409 APPPPSIGAGAPPP----PPPPGGITGVPPPPPI---GGLGGHQAPPAPP-----LPEGI 1456

Query: 181  HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTG-----PSPHLAH 345
                 G  PP   GG G                      PP  PPP G     P P+ AH
Sbjct: 1457 G----GVPPPPPVGGLGG---------------------PPAPPPPAGFRGGTPPPN-AH 1490

Query: 346  GGVTAAHGVPRHHGA-NGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
            GGV      PR HG   GP +   A  P    G   GP  PPG    PA
Sbjct: 1491 GGVAPPPPPPRGHGGVGGPPTPPGAPAPPMPPGVPGGPPPPPGGRGLPA 1539

[199][TOP]
>UniRef100_B1B5J3 RHYTHM OF CHLOROPLAST 15 n=1 Tax=Chlamydomonas reinhardtii
           RepID=B1B5J3_CHLRE
          Length = 631

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 49/155 (31%), Positives = 64/155 (41%), Gaps = 3/155 (1%)
 Frame = +1

Query: 4   QQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
           QQ PS G+       G S AA S      +P V A +     P S+ A +++ S P  AH
Sbjct: 485 QQRPSDGATAADGTAGCSPAAVS------SPAVAAAA-----PPSTAAAAATPSAPHSAH 533

Query: 184 LGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAA 363
             S  G   S +GG G  G  S +  + SGS         +  PP+ P+P  A     AA
Sbjct: 534 KPSTHGQGSSGSGGSGCGGSGSGSGGHGSGSSARAGSKRSEPEPPSRPTPQRAVAVTEAA 593

Query: 364 HGVPRHHGANGPASLNSA---ALPAYATGGGNGPA 459
                H   +  +  NSA   A  A A   GNG A
Sbjct: 594 LASSAHPAGSSGSGRNSAGGSAAAATAAAAGNGVA 628

[200][TOP]
>UniRef100_Q58MY1 Phage tail fiber-like protein n=1 Tax=Prochlorococcus phage P-SSM2
           RepID=Q58MY1_BPPRM
          Length = 597

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 53/180 (29%), Positives = 67/180 (37%), Gaps = 28/180 (15%)
 Frame = +1

Query: 76  SGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGG-------APPSVAGG--- 225
           +GPP   G+   SGP G       P  +   PQG  +G  GG        PP  AGG   
Sbjct: 177 AGPPGPTGITGPSGPPGPSGPGGGPGPAG--PQG-DVGPSGGPGPTGPAGPPGPAGGPPG 233

Query: 226 ----YGASGPTSATFSNESGS-FQSLQPAPPQMPPPTGPSPHLAHGGVT----------- 357
                G +GPT  T    +GS   +  P P   P PTGP+      G T           
Sbjct: 234 PQGPQGDAGPTGPTGPPGTGSPGPAGPPGPSGGPGPTGPAGPTGPDGPTGPTGPAGGPPG 293

Query: 358 --AAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAA 531
                G P   G +GPA  + +  P   +GG  GP+  PG    P          PA +A
Sbjct: 294 PPGPSGPPGPSGGDGPAGPSGSPGPPGPSGGPPGPSGGPGPAGPPGPDGPSGPPGPAGSA 353

[201][TOP]
>UniRef100_Q9BIU1 Major ampullate spidroin 2 (Fragment) n=1 Tax=Gasteracantha
           cancriformis RepID=Q9BIU1_GASCA
          Length = 342

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 57/199 (28%), Positives = 68/199 (34%), Gaps = 29/199 (14%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASS-----YAPSSSASLPQGAHL 186
           G + PGS  GG    G  SG    PG     GPG   A++     Y P S     QG   
Sbjct: 66  GGYGPGSGQGGPGQQGPGSGGQQGPGGQGPYGPGAAAAAAAAAGGYGPGSGQGGQQGPGS 125

Query: 187 GSRGGAPPSVAGGYGASGPTSATFSNESGSF--QSLQPAPPQMPPPTGP----------S 330
              G       GG G  GP++A  +   G +   + Q  P Q  P +G            
Sbjct: 126 QGPGSGGQQGPGGQGPYGPSAAAAAAAVGGYGPGAGQQGPGQQGPGSGGQRGPGGQGPYG 185

Query: 331 PHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGP------------AYPPGA 474
           P  A     AA G     G  GP      +       GG GP             Y PG+
Sbjct: 186 PGAAAAAAAAAGGYGPASGQQGPGQQGPGS-GGQRGPGGQGPYGPGAAAAASAGGYGPGS 244

Query: 475 IVSPASTATFNRLSPAAAA 531
             SPAS A     SP A A
Sbjct: 245 GGSPASGAASRLSSPQAGA 263

[202][TOP]
>UniRef100_C3XWW9 Putative uncharacterized protein n=1 Tax=Branchiostoma floridae
           RepID=C3XWW9_BRAFL
          Length = 309

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 50/156 (32%), Positives = 59/156 (37%), Gaps = 8/156 (5%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGP-PYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPP 210
           P   VG   A G    P P  PG  AG+GP G P S  +P    +       G  G  P 
Sbjct: 113 PEGPVGPKGAEGERGAPGPPGPGGQAGTGPPGPPGSPGSPGEKGATGPAGPKGREG--PR 170

Query: 211 SVAGGYGASGPTSATFSNES-GSFQSLQPAPPQ----MPPPTGPSPHLAHGGVTAAHGVP 375
              G  G  GP     S  S G   ++ PA P+     P P GP+      G +   G P
Sbjct: 171 GPVGPQGLRGPVGPPGSPGSPGLKGAVGPAGPKGRGGPPGPRGPT------GPSGLPGSP 224

Query: 376 RHHGANGPASLNSAALPAYATG--GGNGPAYPPGAI 477
              GA GPA       P    G  G  GP  PPG +
Sbjct: 225 GEKGATGPAGPKGGEGPLGPVGPQGRVGPPGPPGPV 260

[203][TOP]
>UniRef100_B9PUT7 Protein transport protein sec13, putative n=2 Tax=Toxoplasma gondii
           RepID=B9PUT7_TOXGO
          Length = 654

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 54/181 (29%), Positives = 67/181 (37%), Gaps = 4/181 (2%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
           A Q   +GS  P      S      S PP  P   A      HP  S  PSS  SLPQ  
Sbjct: 412 APQLQPHGSAAPLGAYPPSHPPSLSSSPPTHPAHGAS-----HPPLSSFPSSHPSLPQNP 466

Query: 181 HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTG---PSPHL-AHG 348
             G     PPS A      GP +                PPQ  P  G   P+P   A+ 
Sbjct: 467 APGPLSATPPSTAATPRPLGPAAG--------------QPPQGSPTPGVAFPAPGAPAYP 512

Query: 349 GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAA 528
           G  A+ G+        P    S   PA+A     G A+PP   V PA T+   + +P+ A
Sbjct: 513 GTPASAGLYGPPTPGAPGGAQSYPQPAFAAPYPQGSAFPPA--VQPAQTSLGGQQAPSPA 570

Query: 529 A 531
           +
Sbjct: 571 S 571

[204][TOP]
>UniRef100_B4IKV7 GM11218 n=1 Tax=Drosophila sechellia RepID=B4IKV7_DROSE
          Length = 1272

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 61/182 (33%), Positives = 78/182 (42%), Gaps = 14/182 (7%)
 Frame = +1

Query: 31  VPGSVVGGSSAAGSFSGP-PYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGA- 204
           VP +    SS AG+ +G    +  V +G G G    S  A S+  S  QGA  G+ GG+ 
Sbjct: 161 VPATPKSSSSGAGASTGSGTSSAAVTSGPGSGSTKVSVAASSAQQSGLQGA-TGAGGGSS 219

Query: 205 ------PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGG----V 354
                 P S AGG  A+ P SA      G+  S     P +PP +   PH   G      
Sbjct: 220 SAPGTQPGSGAGGAIAARPVSAM----GGTVSSTAGGAPSIPPISTMPPHTVPGSTNTTT 275

Query: 355 TAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATFNRLSPAAA 528
           TA  G     GA G A+ N+AAL A     G   AYP  PG     +S+      +  AA
Sbjct: 276 TAMAGGVGGPGAAG-ANPNAAALMASLLNAGQTGAYPGAPGQTAVNSSSLLDGSTAAVAA 334

Query: 529 AA 534
           AA
Sbjct: 335 AA 336

[205][TOP]
>UniRef100_B3RLH9 Putative uncharacterized protein (Fragment) n=1 Tax=Trichoplax
           adhaerens RepID=B3RLH9_TRIAD
          Length = 181

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 48/164 (29%), Positives = 64/164 (39%), Gaps = 8/164 (4%)
 Frame = +1

Query: 55  SSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGA 234
           SS A   SG  Y P   A S    HP+++Y PSS+   P G        A P  + GY  
Sbjct: 10  SSTAYPPSGTAYPPSSTAQS----HPSTAYPPSSTGYPPSGTAYPPSSTAQPHPSTGYPP 65

Query: 235 SG---PTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPAS 405
           SG   P S+T      + Q         PP +    H        + G P    A  P+S
Sbjct: 66  SGTAYPPSSTAQPHPSTAQPHPSTGTAYPPSSTAQKHPPTAQPPPSTGYPPSGAAYPPSS 125

Query: 406 L-----NSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPA 522
                  +   P+ A    +  AYPP    +P STAT+   +PA
Sbjct: 126 TVYPPSGAVYPPSTAAYPPSTAAYPPSGTANPTSTATYPPSAPA 169

[206][TOP]
>UniRef100_A9UV04 Predicted protein (Fragment) n=1 Tax=Monosiga brevicollis
           RepID=A9UV04_MONBE
          Length = 237

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 48/188 (25%), Positives = 66/188 (35%), Gaps = 24/188 (12%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLG 189
           PP   S    +     SA G     P  P   A S     P  ++AP S+  +P  A   
Sbjct: 10  PPMPNSAAYATPPTQPSATGPVPSAPQGPSTSAQSAGSVFPGPNHAPQSAPPMPNSAAYA 69

Query: 190 S-------RGGAPPSVAGGYGASGPTSATFSNESGSFQSLQP--------APPQMPPPTG 324
           +        G AP +  G   ++    + F     + QS  P         PP  P  TG
Sbjct: 70  TPPTQPSATGPAPSAPQGSSTSAQSAGSVFPGPHHAPQSAPPMPNSAAYATPPTQPSATG 129

Query: 325 PSPHLAHGGVTAAHGV------PRHHGANGPASLNSAAL---PAYATGGGNGPAYPPGAI 477
           P+P    G  T+A         P H   + P   NSAA    P   +  G  P+ P G+ 
Sbjct: 130 PAPSAPQGSSTSAQSAGSVFPGPNHAPQSAPPMPNSAAYATPPTQPSATGPAPSAPQGSS 189

Query: 478 VSPASTAT 501
            S  S  +
Sbjct: 190 TSAQSAGS 197

[207][TOP]
>UniRef100_C9SR21 DNA-directed RNA polymerase II subunit RPB1 n=1 Tax=Verticillium
            albo-atrum VaMs.102 RepID=C9SR21_9PEZI
          Length = 1756

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 51/176 (28%), Positives = 72/176 (40%), Gaps = 15/176 (8%)
 Frame = +1

Query: 43   VVGGSSAAGSFSGPPYAP--GVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSV 216
            +VG  S   +  G  Y    G + G+ PG   A+S   +S  S P  +  G+ G +P S 
Sbjct: 1526 IVGAGSDDNTGFGTEYGGTYGGFGGASPGRAGATSPFTTSPTS-PFSSFAGAGGYSPTSP 1584

Query: 217  AGGYGASGP---------TSATFSNESGSFQSL----QPAPPQMPPPTGPSPHLAHGGVT 357
             GGY  + P         TS  FS  S SF       +P  P  P  +  SP  +    T
Sbjct: 1585 GGGYSPTSPLMDGGARYATSPQFSPSSPSFSPTSPVHRPTSPASPNYSPTSPSYSPTSPT 1644

Query: 358  AAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAA 525
            +    PRH+    PA  NS   P+Y+      P+Y P +     +  T    SPA+
Sbjct: 1645 S----PRHYSPTSPAQFNSPTSPSYSPA---SPSYSPTSPNLHGAGPTSPSYSPAS 1693

[208][TOP]
>UniRef100_Q7XWS7 Formin-like protein 12 n=1 Tax=Oryza sativa Japonica Group
            RepID=FH12_ORYSJ
          Length = 1669

 Score = 54.7 bits (130), Expect = 4e-06
 Identities = 54/169 (31%), Positives = 60/169 (35%), Gaps = 6/169 (3%)
 Frame = +1

Query: 1    AQQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGA 180
            A  PPS G+  P          G  +G P  P +    G GGH A    P     LP+G 
Sbjct: 1098 APPPPSIGAGAPPP----PPPPGGITGVPPPPPI---GGLGGHQAPPAPP-----LPEGI 1145

Query: 181  HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTG-----PSPHLAH 345
                 G  PP   GG G                      PP  PPP G     P P+ AH
Sbjct: 1146 G----GVPPPPPVGGLGG---------------------PPAPPPPAGFRGGTPPPN-AH 1179

Query: 346  GGVTAAHGVPRHHGA-NGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
            GGV      PR HG   GP +   A  P    G   GP  PPG    PA
Sbjct: 1180 GGVAPPPPPPRGHGGVGGPPTPPGAPAPPMPPGVPGGPPPPPGGRGLPA 1228

[209][TOP]
>UniRef100_UPI0001868CED hypothetical protein BRAFLDRAFT_129955 n=1 Tax=Branchiostoma
           floridae RepID=UPI0001868CED
          Length = 703

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 58/175 (33%), Positives = 65/175 (37%), Gaps = 13/175 (7%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFS-GPPYAPGVYAGSGPGGHPASSYAPS----SSASLPQG-AHLGSR 195
           P    G    AG  S GPP  PG     GP G PAS   P       A  P G   +G  
Sbjct: 121 PPGPPGEKGPAGPVSVGPPGPPGEKGAMGPAG-PASVGPPGPPEEKGAMGPAGPVSVGPP 179

Query: 196 GGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVP 375
           G  PP   G  G +GP S       G   ++ PA P    P GP       G     G P
Sbjct: 180 G--PPGEKGAMGPAGPVSVGPPGPPGDKGAMGPAGPVSVGPPGPP---GEKGAMGPPGPP 234

Query: 376 RHHGANGPA---SLNSAALPAYATG--GGNGPAYPPGAI--VSPASTATFNRLSP 519
              GA GPA       A  P   +G  G  GPA P G    + PA   +F R  P
Sbjct: 235 GEKGAMGPAGPPGEKGAMGPTGPSGEKGAVGPAGPLGKTGPIGPAGPVSFGRPGP 289

[210][TOP]
>UniRef100_UPI00015B6358 PREDICTED: hypothetical protein n=1 Tax=Nasonia vitripennis
           RepID=UPI00015B6358
          Length = 441

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 52/166 (31%), Positives = 72/166 (43%), Gaps = 7/166 (4%)
 Frame = +1

Query: 13  PSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSY-APSSSASLPQGAHLG 189
           P+ G    G    G  A  S  G P + G + GS  GG P+SSY APS+  S   GA   
Sbjct: 42  PNLGGGGGGGGGFGGGAPSSSYGAPSSGGGFGGSFGGGAPSSSYGAPSTGGSFGGGAPSS 101

Query: 190 SRGGAPPSVAGGYGAS-GPTSATFSNESGSFQSLQPAPPQMPPPTGPS-----PHLAHGG 351
           S G   PS  G +G S G  + + S  + SF    P+     P  G S     P  ++G 
Sbjct: 102 SYGA--PSSGGSFGGSFGGGAPSSSYGAPSFGGNAPSSSYGAPSAGGSFGGGAPSNSYGP 159

Query: 352 VTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPA 489
            ++++G P   G+ G +S  S        GG  G   P  +  +PA
Sbjct: 160 PSSSYGAPSAGGSFGGSSGGS-------FGGSFGGGAPSSSYGAPA 198

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/165 (32%), Positives = 72/165 (43%), Gaps = 6/165 (3%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSY-APSSSASLPQGAHLGS 192
           SYG+   G   GGS   G+ S    AP    GS  GG P+SSY APSS  S   G   G 
Sbjct: 62  SYGAPSSGGGFGGSFGGGAPSSSYGAPST-GGSFGGGAPSSSYGAPSSGGSF--GGSFG- 117

Query: 193 RGGAPPSVAG--GYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTGPSPHLAHG--GVT 357
            GGAP S  G   +G + P+S+  + +  GSF    P+    PP +      A G  G +
Sbjct: 118 -GGAPSSSYGAPSFGGNAPSSSYGAPSAGGSFGGGAPSNSYGPPSSSYGAPSAGGSFGGS 176

Query: 358 AAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPAS 492
           +        G   P+S   A  P+  +     P+ P     +P+S
Sbjct: 177 SGGSFGGSFGGGAPSSSYGAPAPSRPSSNYGAPSRPSSNYGAPSS 221

[211][TOP]
>UniRef100_UPI000056A77D collagen, type I, alpha 2 n=1 Tax=Danio rerio RepID=UPI000056A77D
          Length = 1352

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 50/170 (29%), Positives = 64/170 (37%), Gaps = 19/170 (11%)
 Frame = +1

Query: 22   GSHVPGSVVG--GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
            G+  P    G  G+       GP  APG    +G  G   ++  P +     +  + G  
Sbjct: 597  GARGPSGTPGPDGNKGEPGAVGPAGAPGPQGAAGMPGERGAAGTPGAKGEKGEAGYRGLE 656

Query: 196  GGAPPSVA-GGYGASGPTSATFSN----ESGSFQSLQPAPPQMPP----PTGPSPHLAHG 348
            G A    A G  G SGP     +N    E+GSF    PA P+  P     +GP+      
Sbjct: 657  GNAGKDGARGAPGPSGPPGPAGANGDKGETGSFGPPGPAGPRGAPGERGESGPAGPSGFA 716

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATG--------GGNGPAYPPGA 474
            G   A G     G  GPA     A PA   G        G +GP  PPGA
Sbjct: 717  GPPGADGQTGPRGEKGPAGGKGDAGPAGPAGPAGNTGPLGPSGPVGPPGA 766

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 57/167 (34%), Positives = 65/167 (38%), Gaps = 13/167 (7%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSF-----SGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
            P   G   P    G     GSF     +GP  APG    SGP G       PS  A  P 
Sbjct: 668  PGPSGPPGPAGANGDKGETGSFGPPGPAGPRGAPGERGESGPAG-------PSGFAG-PP 719

Query: 175  GA--HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPP----PTGPSPH 336
            GA    G RG   P  AGG G +GP     +  +G+   L P+ P  PP     +GP+  
Sbjct: 720  GADGQTGPRGEKGP--AGGKGDAGPAGP--AGPAGNTGPLGPSGPVGPPGARGDSGPTGL 775

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                G     G P   G  GPA L   A      G  G  GPA PPG
Sbjct: 776  TGFPGAPGRVGPPGPAGIVGPAGLTGPAGKDGPRGPRGDVGPAGPPG 822

[212][TOP]
>UniRef100_UPI00016E45BB UPI00016E45BB related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E45BB
          Length = 1632

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 756  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 815

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 816  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 866

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 867  GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 911

[213][TOP]
>UniRef100_UPI00016E45BA UPI00016E45BA related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E45BA
          Length = 1724

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 838  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 897

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 898  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 948

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 949  GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 993

[214][TOP]
>UniRef100_UPI00016E45B9 UPI00016E45B9 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E45B9
          Length = 1732

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 843  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 902

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 903  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 953

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 954  GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 998

[215][TOP]
>UniRef100_UPI00016E45B8 UPI00016E45B8 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E45B8
          Length = 1743

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 867  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 926

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 927  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 977

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 978  GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 1022

[216][TOP]
>UniRef100_UPI00016E4599 UPI00016E4599 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E4599
          Length = 1789

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 890  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 949

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 950  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 1000

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 1001 GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 1045

[217][TOP]
>UniRef100_UPI00016E4598 UPI00016E4598 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E4598
          Length = 1803

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 904  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 963

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 964  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 1014

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 1015 GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 1059

[218][TOP]
>UniRef100_UPI00016E4597 UPI00016E4597 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E4597
          Length = 1813

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 914  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 973

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 974  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 1024

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 1025 GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 1069

[219][TOP]
>UniRef100_UPI00016E4575 UPI00016E4575 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E4575
          Length = 1763

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 864  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 923

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 924  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 974

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 975  GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 1019

[220][TOP]
>UniRef100_UPI00016E4574 UPI00016E4574 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E4574
          Length = 1686

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 787  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 846

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 847  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 897

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 898  GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 942

[221][TOP]
>UniRef100_UPI00016E4573 UPI00016E4573 related cluster n=1 Tax=Takifugu rubripes
            RepID=UPI00016E4573
          Length = 1815

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/166 (31%), Positives = 56/166 (33%), Gaps = 21/166 (12%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRG-------GAPP 210
            G+S +   SGPP   G     GP G P     P          H G RG         PP
Sbjct: 916  GTSGSDGPSGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLPGHPGQRGETGFQGKTGPP 975

Query: 211  SVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTG-------------PSPHLAHG 348
               G  G  GPT  T    E G      P PP  P   G             P P     
Sbjct: 976  GPGGVVGPQGPTGETGPVGERG-----HPGPPGPPGEQGLPGSAGKEGAKGDPGPQ---- 1026

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSP 486
            G +   G P   G  G   L  AA PA    GG GP  PPG I SP
Sbjct: 1027 GPSGKDGPPGLRGFPGERGLPGAAGPA-GLKGGEGPQGPPGPIGSP 1071

[222][TOP]
>UniRef100_Q90YJ0 Procollagen type I alpha 2 chain n=1 Tax=Danio rerio
            RepID=Q90YJ0_DANRE
          Length = 1352

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 50/170 (29%), Positives = 64/170 (37%), Gaps = 19/170 (11%)
 Frame = +1

Query: 22   GSHVPGSVVG--GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
            G+  P    G  G+       GP  APG    +G  G   ++  P +     +  + G  
Sbjct: 597  GARGPSGTPGPDGNKGEPGAVGPAGAPGPQGAAGMPGERGAAGTPEAKGEKGEAGYRGLE 656

Query: 196  GGAPPSVA-GGYGASGPTSATFSN----ESGSFQSLQPAPPQMPP----PTGPSPHLAHG 348
            G A    A G  G SGP     +N    E+GSF    PA P+  P     +GP+      
Sbjct: 657  GNAGKDGARGAPGPSGPPGPAGANGDKGETGSFGPPGPAGPRGAPGERGESGPAGPSGFA 716

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATG--------GGNGPAYPPGA 474
            G   A G     G  GPA     A PA   G        G +GP  PPGA
Sbjct: 717  GPPGADGQTGPRGEKGPAGGKGDAGPAGPAGPAGNTGPLGPSGPVGPPGA 766

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 57/167 (34%), Positives = 65/167 (38%), Gaps = 13/167 (7%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSF-----SGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
            P   G   P    G     GSF     +GP  APG    SGP G       PS  A  P 
Sbjct: 668  PGPSGPPGPAGANGDKGETGSFGPPGPAGPRGAPGERGESGPAG-------PSGFAG-PP 719

Query: 175  GA--HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPP----PTGPSPH 336
            GA    G RG   P  AGG G +GP     +  +G+   L P+ P  PP     +GP+  
Sbjct: 720  GADGQTGPRGEKGP--AGGKGDAGPAGP--AGPAGNTGPLGPSGPVGPPGARGDSGPTGL 775

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                G     G P   G  GPA L   A      G  G  GPA PPG
Sbjct: 776  TGFPGAPGRVGPPGPAGIVGPAGLTGPAGKDGPRGPRGDVGPAGPPG 822

[223][TOP]
>UniRef100_Q6IQX2 Collagen, type I, alpha 2 n=1 Tax=Danio rerio RepID=Q6IQX2_DANRE
          Length = 1352

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 50/170 (29%), Positives = 64/170 (37%), Gaps = 19/170 (11%)
 Frame = +1

Query: 22   GSHVPGSVVG--GSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSR 195
            G+  P    G  G+       GP  APG    +G  G   ++  P +     +  + G  
Sbjct: 597  GARGPSGTPGPDGNKGEPGAVGPAGAPGPQGAAGMPGERGAAGTPGAKGEKGEAGYRGLE 656

Query: 196  GGAPPSVA-GGYGASGPTSATFSN----ESGSFQSLQPAPPQMPP----PTGPSPHLAHG 348
            G A    A G  G SGP     +N    E+GSF    PA P+  P     +GP+      
Sbjct: 657  GNAGKDGARGAPGPSGPPGPAGANGDKGETGSFGPPGPAGPRGAPGERGESGPAGPSGFA 716

Query: 349  GVTAAHGVPRHHGANGPASLNSAALPAYATG--------GGNGPAYPPGA 474
            G   A G     G  GPA     A PA   G        G +GP  PPGA
Sbjct: 717  GPPGADGQTGPRGEKGPAGGKGDAGPAGPAGPAGNTGPLGPSGPVGPPGA 766

 Score = 53.5 bits (127), Expect = 9e-06
 Identities = 57/167 (34%), Positives = 65/167 (38%), Gaps = 13/167 (7%)
 Frame = +1

Query: 10   PPSYGSHVPGSVVGGSSAAGSF-----SGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
            P   G   P    G     GSF     +GP  APG    SGP G       PS  A  P 
Sbjct: 668  PGPSGPPGPAGANGDKGETGSFGPPGPAGPRGAPGERGESGPAG-------PSGFAG-PP 719

Query: 175  GA--HLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPP----PTGPSPH 336
            GA    G RG   P  AGG G +GP     +  +G+   L P+ P  PP     +GP+  
Sbjct: 720  GADGQTGPRGEKGP--AGGKGDAGPAGP--AGPAGNTGPLGPSGPVGPPGARGDSGPTGL 775

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                G     G P   G  GPA L   A      G  G  GPA PPG
Sbjct: 776  TGFPGAPGRVGPPGPAGIVGPAGLTGPAGKDGPRGPRGDVGPAGPPG 822

[224][TOP]
>UniRef100_Q8K173 Col3a1 protein (Fragment) n=1 Tax=Mus musculus RepID=Q8K173_MOUSE
          Length = 1222

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 49/155 (31%), Positives = 58/155 (37%), Gaps = 10/155 (6%)
 Frame = +1

Query: 31  VPGSVVGGSSAAGSFSGPPY------APGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
           +PG+  GG        G P       APG   G G  G P     P  +A +P     G+
Sbjct: 400 IPGT--GGPPGENGKPGEPGPKGEVGAPGAPGGKGDSGAPGER-GPPGTAGIP-----GA 451

Query: 193 RGGA-PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
           RGGA PP   GG G +GP     ++ S   Q + P     P   GP       G   A G
Sbjct: 452 RGGAGPPGPEGGKGPAGPPGPPGASGSPGLQGM-PGERGGPGSPGPKGEKGEPGGAGADG 510

Query: 370 VPRHHGANGPASLNSAALPAYATGG---GNGPAYP 465
           VP   G  GPA       PA   G    G  P  P
Sbjct: 511 VPGKDGPRGPAGPIGPPGPAGQPGDKGEGGSPGLP 545

[225][TOP]
>UniRef100_Q8BLW4 Putative uncharacterized protein n=1 Tax=Mus musculus
            RepID=Q8BLW4_MOUSE
          Length = 1464

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 49/155 (31%), Positives = 58/155 (37%), Gaps = 10/155 (6%)
 Frame = +1

Query: 31   VPGSVVGGSSAAGSFSGPPY------APGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
            +PG+  GG        G P       APG   G G  G P     P  +A +P     G+
Sbjct: 642  IPGT--GGPPGENGKPGEPGPKGEVGAPGAPGGKGDSGAPGER-GPPGTAGIP-----GA 693

Query: 193  RGGA-PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
            RGGA PP   GG G +GP     ++ S   Q + P     P   GP       G   A G
Sbjct: 694  RGGAGPPGPEGGKGPAGPPGPPGASGSPGLQGM-PGERGGPGSPGPKGEKGEPGGAGADG 752

Query: 370  VPRHHGANGPASLNSAALPAYATGG---GNGPAYP 465
            VP   G  GPA       PA   G    G  P  P
Sbjct: 753  VPGKDGPRGPAGPIGPPGPAGQPGDKGEGGSPGLP 787

[226][TOP]
>UniRef100_Q7TT32 Collagen, type III, alpha 1 n=1 Tax=Mus musculus RepID=Q7TT32_MOUSE
          Length = 1464

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 49/155 (31%), Positives = 58/155 (37%), Gaps = 10/155 (6%)
 Frame = +1

Query: 31   VPGSVVGGSSAAGSFSGPPY------APGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
            +PG+  GG        G P       APG   G G  G P     P  +A +P     G+
Sbjct: 642  IPGT--GGPPGENGKPGEPGPKGEVGAPGAPGGKGDSGAPGER-GPPGTAGIP-----GA 693

Query: 193  RGGA-PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
            RGGA PP   GG G +GP     ++ S   Q + P     P   GP       G   A G
Sbjct: 694  RGGAGPPGPEGGKGPAGPPGPPGASGSPGLQGM-PGERGGPGSPGPKGEKGEPGGAGADG 752

Query: 370  VPRHHGANGPASLNSAALPAYATGG---GNGPAYP 465
            VP   G  GPA       PA   G    G  P  P
Sbjct: 753  VPGKDGPRGPAGPIGPPGPAGQPGDKGEGGSPGLP 787

[227][TOP]
>UniRef100_P08121 Collagen alpha-1(III) chain n=3 Tax=Mus musculus RepID=CO3A1_MOUSE
          Length = 1464

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 49/155 (31%), Positives = 58/155 (37%), Gaps = 10/155 (6%)
 Frame = +1

Query: 31   VPGSVVGGSSAAGSFSGPPY------APGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
            +PG+  GG        G P       APG   G G  G P     P  +A +P     G+
Sbjct: 642  IPGT--GGPPGENGKPGEPGPKGEVGAPGAPGGKGDSGAPGER-GPPGTAGIP-----GA 693

Query: 193  RGGA-PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
            RGGA PP   GG G +GP     ++ S   Q + P     P   GP       G   A G
Sbjct: 694  RGGAGPPGPEGGKGPAGPPGPPGASGSPGLQGM-PGERGGPGSPGPKGEKGEPGGAGADG 752

Query: 370  VPRHHGANGPASLNSAALPAYATGG---GNGPAYP 465
            VP   G  GPA       PA   G    G  P  P
Sbjct: 753  VPGKDGPRGPAGPIGPPGPAGQPGDKGEGGSPGLP 787

[228][TOP]
>UniRef100_Q3UH72 Putative uncharacterized protein n=1 Tax=Mus musculus
            RepID=Q3UH72_MOUSE
          Length = 1464

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 49/155 (31%), Positives = 58/155 (37%), Gaps = 10/155 (6%)
 Frame = +1

Query: 31   VPGSVVGGSSAAGSFSGPPY------APGVYAGSGPGGHPASSYAPSSSASLPQGAHLGS 192
            +PG+  GG        G P       APG   G G  G P     P  +A +P     G+
Sbjct: 642  IPGT--GGPPGENGKPGEPGPKGEVGAPGAPGGKGDSGAPGER-GPPGTAGIP-----GA 693

Query: 193  RGGA-PPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHG 369
            RGGA PP   GG G +GP     ++ S   Q + P     P   GP       G   A G
Sbjct: 694  RGGAGPPGPEGGKGPAGPPGPPGASGSPGLQGM-PGERGGPGSPGPKGEKGEPGGAGADG 752

Query: 370  VPRHHGANGPASLNSAALPAYATGG---GNGPAYP 465
            VP   G  GPA       PA   G    G  P  P
Sbjct: 753  VPGKDGPRGPAGPIGPPGPAGQPGDKGEGGSPGLP 787

[229][TOP]
>UniRef100_Q9L252 Putative uncharacterized protein SCO2669 n=1 Tax=Streptomyces
           coelicolor RepID=Q9L252_STRCO
          Length = 604

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 53/162 (32%), Positives = 63/162 (38%), Gaps = 10/162 (6%)
 Frame = +1

Query: 16  SYGSHVPGSVVGGSSAAGSFSGP--PYAPGVYAGSGPGGHPASSYAPSSSASLP----QG 177
           S G   PG   GG    G F  P  P  PG + G G    P  S  P+ +         G
Sbjct: 195 SGGPGAPGGP-GGPGGPGGFGSPDGPNRPGGFGGPGSPDGPGGSGGPNGAGGFGGPGGPG 253

Query: 178 AHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSL-QPAPPQMP-PPTGPSPHLAHGG 351
              G  G   P+ AGG+G  GP     S  SG F     P  P  P  P GP  +   GG
Sbjct: 254 GPNGPGGPGGPNGAGGFG--GPGGPGGSGGSGGFGGPGGPGGPSGPNSPGGPGGYNGPGG 311

Query: 352 VTAAHGVPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
               +G P + G  GP   N    P   +G  G +GP  PPG
Sbjct: 312 PGGPNG-PNNPG--GPGGYNGPGGPGGPSGPNGPSGPPAPPG 350

[230][TOP]
>UniRef100_C3AC52 Collagen triple helix repeat domain protein n=1 Tax=Bacillus
           mycoides DSM 2048 RepID=C3AC52_BACMY
          Length = 922

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 45/154 (29%), Positives = 58/154 (37%), Gaps = 13/154 (8%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
           P  + G +   G   GPP   G    +GPGG P+ S   + +       + G  G A   
Sbjct: 192 PTGITGPTGITGPSGGPPGPTGATGATGPGGGPSGSTGATGAT-----GNTGVTGSA--G 244

Query: 214 VAGGYGASGPTSATFSNESGSFQSLQ-------PAPPQ----MPPPTGPSPHLAHGGVTA 360
           V G  G SG T  T +      Q +Q       P  PQ    +P PTG +      GV  
Sbjct: 245 VTGNTGPSGSTGETGAQGLQGIQGVQGPIGPTGPEGPQGIQGIPGPTGVTGEQGIQGVQG 304

Query: 361 AHGVPRHHGANGPASLNSAALPAYATG--GGNGP 456
             G+    G  GP  +  A  P   TG  G  GP
Sbjct: 305 IQGITGATGDQGPQGIQGAIGPQGITGATGDQGP 338

[231][TOP]
>UniRef100_Q9LKA4 AT3G15010 protein n=1 Tax=Arabidopsis thaliana RepID=Q9LKA4_ARATH
          Length = 404

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 49/157 (31%), Positives = 66/157 (42%), Gaps = 5/157 (3%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAGSF--SGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQ 174
           AQ   S   HV G  +G    AG +  +G   A G Y+G  P  H  S+++     S   
Sbjct: 256 AQDGGSGHGHVHGEGMGMVRPAGPYGAAGGISAYGGYSGGPPAHHMNSTHSSMGVGSAGY 315

Query: 175 GAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGV 354
           G H G  GG  P   G YG  G         SG ++     PP   P  G  P   H G+
Sbjct: 316 GGHYGGYGG--PGGTGVYGGLGGGYGGPGTGSGQYR----MPPSSMPGGGGYPESGHYGL 369

Query: 355 TAAHGVP-RHHGANGPASLNSAALPAYATGG--GNGP 456
           +++ G P +HH A G     ++ +P    GG   NGP
Sbjct: 370 SSSAGYPGQHHQAVG-----TSPVPRVPHGGMYPNGP 401

[232][TOP]
>UniRef100_A8IZJ6 RWP-RK transcription factor n=1 Tax=Chlamydomonas reinhardtii
           RepID=A8IZJ6_CHLRE
          Length = 1428

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 45/157 (28%), Positives = 57/157 (36%), Gaps = 7/157 (4%)
 Frame = +1

Query: 22  GSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPAS-SYAPS-SSASLPQGAHLGSR 195
           G    G V GG    G + GPP + GV  GSGP G P S    P      +P  A     
Sbjct: 540 GQQRGGGVRGGMPGDGGWIGPP-SGGVAGGSGPLGRPHSPDLGPHMGGGGMPLQALQSGG 598

Query: 196 GGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVP 375
            G  P+ +GGYG  G          G      P P      +G   H ++G    ++G  
Sbjct: 599 SGYGPAHSGGYGGPGGGGGDMGAGPG------PGPGHYNDMSGRGHHDSYGSAPGSYGPN 652

Query: 376 R-----HHGANGPASLNSAALPAYATGGGNGPAYPPG 471
                 + G  G        +  Y  GGG G  Y PG
Sbjct: 653 SASGGGYGGPGGGGGGQGGGMGGYGGGGGRGGGYGPG 689

[233][TOP]
>UniRef100_B9QKW0 HECT domain-containing protein n=1 Tax=Toxoplasma gondii VEG
            RepID=B9QKW0_TOXGO
          Length = 11061

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 58/190 (30%), Positives = 78/190 (41%), Gaps = 13/190 (6%)
 Frame = +1

Query: 4    QQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
            + PP   +H PG+ + G+   G+ SGP  +PG           +     SSSASLPQ   
Sbjct: 5198 RDPPRPSNH-PGTPLAGAGTGGA-SGPSVSPGF---------ASVPLLASSSASLPQNPE 5246

Query: 184  LGSRG----GAPPSVA-------GGYGASGPTSATFSNESGSFQSLQPAPPQMPPP--TG 324
            L +      G+ PS +       GG G+ G    +F   S  F   QP P  MP P  +G
Sbjct: 5247 LSASPNQLEGSVPSPSQRLQFRRGGLGSDG-WDGSFDASSTPFLRAQPVPTAMPMPALSG 5305

Query: 325  PSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATF 504
            P+       + AA  +PR       +S +SA  P        GPA  P  IVSP  T   
Sbjct: 5306 PASRPPVSSLPAAMSLPRGPAPPSGSSRDSALPPI-------GPA--PVQIVSPPLTPAL 5356

Query: 505  NRLSPAAAAA 534
                P +  A
Sbjct: 5357 PLAGPVSGLA 5366

[234][TOP]
>UniRef100_B6KP87 HECT-domain (Ubiquitin-transferase) containing protein n=1
            Tax=Toxoplasma gondii ME49 RepID=B6KP87_TOXGO
          Length = 10999

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 58/190 (30%), Positives = 78/190 (41%), Gaps = 13/190 (6%)
 Frame = +1

Query: 4    QQPPSYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
            + PP   +H PG+ + G+   G+ SGP  +PG           +     SSSASLPQ   
Sbjct: 5198 RDPPRPSNH-PGTPLAGAGTGGA-SGPSVSPGF---------ASVPLLASSSASLPQNPE 5246

Query: 184  LGSRG----GAPPSVA-------GGYGASGPTSATFSNESGSFQSLQPAPPQMPPP--TG 324
            L +      G+ PS +       GG G+ G    +F   S  F   QP P  MP P  +G
Sbjct: 5247 LSASPNQLEGSVPSPSQRLQFRRGGLGSDG-WDGSFDASSTPFLRAQPVPTAMPMPALSG 5305

Query: 325  PSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATF 504
            P+       + AA  +PR       +S +SA  P        GPA  P  IVSP  T   
Sbjct: 5306 PASRPPVSSLPAAMSLPRGPAPPSGSSRDSALPPI-------GPA--PVQIVSPPLTPAL 5356

Query: 505  NRLSPAAAAA 534
                P +  A
Sbjct: 5357 PLAGPVSGLA 5366

[235][TOP]
>UniRef100_B4Q0N7 GE17489 n=1 Tax=Drosophila yakuba RepID=B4Q0N7_DROYA
          Length = 2036

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 57/177 (32%), Positives = 75/177 (42%), Gaps = 10/177 (5%)
 Frame = +1

Query: 34  PGSVVGGSSAAGSFSGP-PYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAP- 207
           P +    SS AG+ +G    +  V +G G G    S+ A S+  S  QGA  G+ GG+  
Sbjct: 162 PATPKSSSSGAGATTGSGTSSAAVTSGPGSGSTKVSAAASSAQQSGLQGA-TGAGGGSSS 220

Query: 208 -PSVAGGYGASGPTSA-TFSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRH 381
            P    G GA G T+A   S   G+  S     P +PP +   PH   G  T        
Sbjct: 221 TPGTQPGSGAGGATAARPVSAMGGTVSSTAGGAPSIPPISTMPPHTVPGS-TNTTTTAMA 279

Query: 382 HGANGP----ASLNSAALPAYATGGGNGPAYP--PGAIVSPASTATFNRLSPAAAAA 534
            GA GP    A+ N+ AL A     G   AYP  PG     +S+      +  AAAA
Sbjct: 280 GGAGGPGAAAANRNAEALMASLLNTGQTGAYPGAPGQTAVNSSSLLDGSTAAVAAAA 336

[236][TOP]
>UniRef100_B4NI92 GK13553 n=1 Tax=Drosophila willistoni RepID=B4NI92_DROWI
          Length = 779

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 55/189 (29%), Positives = 81/189 (42%), Gaps = 13/189 (6%)
 Frame = +1

Query: 1   AQQPPSYGSHVPGSVVGGSSAAGSFSGP-PYAPGV-YAGSGPGGHPASSY---APSSSAS 165
           A +  SY +  P S     S+  +  GP P AP   Y+   P  +   SY   APSSS S
Sbjct: 385 ANRGGSYPAASPSSSYSAPSSGSNNGGPYPSAPSSSYSAPSPSANAGGSYPAAAPSSSYS 444

Query: 166 LPQGAHLGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPT-----GPS 330
            P    L S  G P   A     S P+ +  +N  GS+ +  P+     P +     GP 
Sbjct: 445 APS---LDSSSGGPYRSAPSSSYSAPSPS--ANVGGSYPAATPSSSYSAPSSDSSRGGPY 499

Query: 331 PHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYATGGGNG---PAYPPGAIVSPASTAT 501
           P  A     +A     + G + PA+  S++  A ++G  NG   P+ P  +  +P+ +A 
Sbjct: 500 PS-APSSSYSAPSPSANRGGSYPAASPSSSYSAPSSGSNNGGPYPSAPSSSYSAPSPSAN 558

Query: 502 FNRLSPAAA 528
                PAAA
Sbjct: 559 VGGSYPAAA 567

[237][TOP]
>UniRef100_C5DNK9 KLTH0G17886p n=1 Tax=Lachancea thermotolerans CBS 6340
           RepID=C5DNK9_LACTC
          Length = 804

 Score = 54.3 bits (129), Expect = 5e-06
 Identities = 58/178 (32%), Positives = 71/178 (39%), Gaps = 3/178 (1%)
 Frame = +1

Query: 10  PPSYGSHVPGSVVGGSSAA--GSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAH 183
           PP+    +P S   G+ A      S PP  P  +A + P   PASS APS   S P  A 
Sbjct: 205 PPASAPPLPSSNAPGTPAPLLPQSSAPPAPPVPFAAAPPA--PASS-APSVPKSSPSSAP 261

Query: 184 LGSRGGAPPSVAGGYGASGPTSATFSNESGSFQSLQPAPPQMPPPTGPS-PHLAHGGVTA 360
                 + P V G   +S P +              PAPP  P P  PS P L   G   
Sbjct: 262 PAPPAPSAPPVPGLPKSSAPPAPPAP-------PAPPAPPAPPAPPVPSAPALPKSGAPP 314

Query: 361 AHGVPRHHGANGPASLNSAALPAYATGGGNGPAYPPGAIVSPASTATFNRLSPAAAAA 534
           A  VP       P S    A PA      + P  PP     PAS+A   R +P+AA+A
Sbjct: 315 APPVPSAPAL--PKSGAPPAPPAPTLPKSSVPPAPPAPPALPASSAAPQRRAPSAASA 370

[238][TOP]
>UniRef100_UPI0000F2C218 PREDICTED: similar to collagen, type XI, alpha 1, isoform 3 n=1
            Tax=Monodelphis domestica RepID=UPI0000F2C218
          Length = 1768

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 56/189 (29%), Positives = 61/189 (32%), Gaps = 21/189 (11%)
 Frame = +1

Query: 16   SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGG-----HPASSYAPSSSASLPQGA 180
            S G+  P    G    +GS  GPP  PG     GP G      P     P     LP   
Sbjct: 852  SRGARGPTGKPGPKGTSGS-DGPPGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLP--G 908

Query: 181  HLGSRG-------GAPPSVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTGPSPH 336
            H G RG         PP   G  G  GPT  T    E G      P PP  P   G    
Sbjct: 909  HPGQRGETGFQGKTGPPGPGGVVGPQGPTGETGPIGERG-----HPGPPGPPGEQGLPGA 963

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNS--------AALPAYATGGGNGPAYPPGAIVSPAS 492
                G     G     G +GPA L           A  A    GG GP  PPG + SP  
Sbjct: 964  AGKEGAKGDPGPQGVSGKDGPAGLRGFPGERGLPGAQGAPGLKGGEGPQGPPGPLGSPGE 1023

Query: 493  TATFNRLSP 519
              +     P
Sbjct: 1024 RGSAGTAGP 1032

[239][TOP]
>UniRef100_UPI0000F2C1FC PREDICTED: similar to collagen, type XI, alpha 1, isoform 2 n=1
            Tax=Monodelphis domestica RepID=UPI0000F2C1FC
          Length = 1819

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 56/189 (29%), Positives = 61/189 (32%), Gaps = 21/189 (11%)
 Frame = +1

Query: 16   SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGG-----HPASSYAPSSSASLPQGA 180
            S G+  P    G    +GS  GPP  PG     GP G      P     P     LP   
Sbjct: 903  SRGARGPTGKPGPKGTSGS-DGPPGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLP--G 959

Query: 181  HLGSRG-------GAPPSVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTGPSPH 336
            H G RG         PP   G  G  GPT  T    E G      P PP  P   G    
Sbjct: 960  HPGQRGETGFQGKTGPPGPGGVVGPQGPTGETGPIGERG-----HPGPPGPPGEQGLPGA 1014

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNS--------AALPAYATGGGNGPAYPPGAIVSPAS 492
                G     G     G +GPA L           A  A    GG GP  PPG + SP  
Sbjct: 1015 AGKEGAKGDPGPQGVSGKDGPAGLRGFPGERGLPGAQGAPGLKGGEGPQGPPGPLGSPGE 1074

Query: 493  TATFNRLSP 519
              +     P
Sbjct: 1075 RGSAGTAGP 1083

[240][TOP]
>UniRef100_UPI0000E215D9 PREDICTED: similar to prepro-alpha2(I) collagen isoform 1 n=1 Tax=Pan
            troglodytes RepID=UPI0000E215D9
          Length = 1039

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 772

[241][TOP]
>UniRef100_UPI0000E215D8 PREDICTED: similar to alpha2(I) collagen isoform 5 n=1 Tax=Pan
            troglodytes RepID=UPI0000E215D8
          Length = 1201

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 772

[242][TOP]
>UniRef100_UPI0000E215D7 PREDICTED: alpha 2 type I collagen isoform 7 n=1 Tax=Pan troglodytes
            RepID=UPI0000E215D7
          Length = 1300

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 558  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 612

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 613  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 670

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 671  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 706

[243][TOP]
>UniRef100_UPI0000E215D6 PREDICTED: similar to prepro-alpha2(I) collagen isoform 2 n=1 Tax=Pan
            troglodytes RepID=UPI0000E215D6
          Length = 1249

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 772

[244][TOP]
>UniRef100_UPI0000E215D5 PREDICTED: alpha 2 type I collagen isoform 4 n=1 Tax=Pan troglodytes
            RepID=UPI0000E215D5
          Length = 1363

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 621  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 675

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 676  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 733

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 734  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 769

[245][TOP]
>UniRef100_UPI0000E215D4 PREDICTED: similar to alpha2(I) collagen isoform 8 n=1 Tax=Pan
            troglodytes RepID=UPI0000E215D4
          Length = 1312

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 772

[246][TOP]
>UniRef100_UPI0000E215D3 PREDICTED: alpha 2 type I collagen isoform 3 n=1 Tax=Pan troglodytes
            RepID=UPI0000E215D3
          Length = 1365

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 772

[247][TOP]
>UniRef100_UPI0000E215D2 PREDICTED: alpha 2 type I collagen isoform 10 n=1 Tax=Pan troglodytes
            RepID=UPI0000E215D2
          Length = 1366

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 51/156 (32%), Positives = 58/156 (37%), Gaps = 10/156 (6%)
 Frame = +1

Query: 34   PGSVVGGSSAAGSFSGPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPS 213
            PG VVG    AG  SGP   PG    +G  G       P     +      G+RG AP  
Sbjct: 624  PG-VVGAVGTAGP-SGPSGLPGERGAAGIPGGKGEKGEPGLRGEIGNPGRDGARG-AP-- 678

Query: 214  VAGGYGASGPTSATFSN-ESGSFQSLQPAPPQMPP-------PTGPSPHLAHGGVTAAHG 369
              G  GA GP  AT    E+G+     PA P+  P       P GP+      G     G
Sbjct: 679  --GAVGAPGPAGATGDRGEAGAAGPAGPAGPRGSPGERGEVGPAGPNGFAGPAGAAGQPG 736

Query: 370  VPRHHGANGPASLNSAALPAYATG--GGNGPAYPPG 471
                 GA GP   N    P    G  G  GP  PPG
Sbjct: 737  AKGERGAKGPKGENGVVGPTGPVGAAGPAGPNGPPG 772

[248][TOP]
>UniRef100_UPI00005E7048 PREDICTED: similar to collagen, type XI, alpha 1, isoform 1 n=1
            Tax=Monodelphis domestica RepID=UPI00005E7048
          Length = 1807

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 56/189 (29%), Positives = 61/189 (32%), Gaps = 21/189 (11%)
 Frame = +1

Query: 16   SYGSHVPGSVVGGSSAAGSFSGPPYAPGVYAGSGPGG-----HPASSYAPSSSASLPQGA 180
            S G+  P    G    +GS  GPP  PG     GP G      P     P     LP   
Sbjct: 891  SRGARGPTGKPGPKGTSGS-DGPPGPPGERGPQGPQGPVGFPGPKGPPGPPGKDGLP--G 947

Query: 181  HLGSRG-------GAPPSVAGGYGASGPTSATFS-NESGSFQSLQPAPPQMPPPTGPSPH 336
            H G RG         PP   G  G  GPT  T    E G      P PP  P   G    
Sbjct: 948  HPGQRGETGFQGKTGPPGPGGVVGPQGPTGETGPIGERG-----HPGPPGPPGEQGLPGA 1002

Query: 337  LAHGGVTAAHGVPRHHGANGPASLNS--------AALPAYATGGGNGPAYPPGAIVSPAS 492
                G     G     G +GPA L           A  A    GG GP  PPG + SP  
Sbjct: 1003 AGKEGAKGDPGPQGVSGKDGPAGLRGFPGERGLPGAQGAPGLKGGEGPQGPPGPLGSPGE 1062

Query: 493  TATFNRLSP 519
              +     P
Sbjct: 1063 RGSAGTAGP 1071

[249][TOP]
>UniRef100_UPI0000121787 Hypothetical protein CBG05354 n=1 Tax=Caenorhabditis briggsae AF16
           RepID=UPI0000121787
          Length = 299

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 41/132 (31%), Positives = 47/132 (35%)
 Frame = +1

Query: 79  GPPYAPGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVAGGYGASGPTSATF 258
           GPP  PG     G  G P S   P   A+  +    G  G  PP   G  G  G      
Sbjct: 151 GPPGPPGPPGPPGDSGEPGSPGLPGQDAAPGEPGPKGPPG--PPGAPGAPGTPGEPGVPA 208

Query: 259 SNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHGANGPASLNSAALPAYAT 438
            +E       +P PP  P P GP       G   + G P   G NGP     A       
Sbjct: 209 QSEP--LIPGEPGPPGEPGPQGPPGPPGQPGADGSPGQPGPKGPNGPDGQPGAD----GN 262

Query: 439 GGGNGPAYPPGA 474
            G  GPA PPG+
Sbjct: 263 PGAPGPAGPPGS 274

[250][TOP]
>UniRef100_UPI00017B24B3 UPI00017B24B3 related cluster n=1 Tax=Tetraodon nigroviridis
            RepID=UPI00017B24B3
          Length = 973

 Score = 53.9 bits (128), Expect = 7e-06
 Identities = 50/150 (33%), Positives = 59/150 (39%), Gaps = 10/150 (6%)
 Frame = +1

Query: 52   GSSAAGSFSGPPYA---PGVYAGSGPGGHPASSYAPSSSASLPQGAHLGSRGGAPPSVA- 219
            GS     F+GPP A   PG+    G  G    + AP      PQG   G+ G A P+   
Sbjct: 764  GSPGPAGFAGPPGADGQPGIKGEQGETGQKGDAGAPG-----PQGPS-GAPGPAGPTGVF 817

Query: 220  ---GGYGASGPTSAT-FSNESGSFQSLQPAPPQMPPPTGPSPHLAHGGVTAAHGVPRHHG 387
               G  GA GP  AT F   +G      P P   P P GP+      G     G     G
Sbjct: 818  GPKGARGAQGPPGATGFPGAAGRVGP--PGPNGNPGPAGPAGSPGKDGPKGIRGDAGPPG 875

Query: 388  ANGPASLNSAALPAYATG--GGNGPAYPPG 471
              G A L   A P+   G  G +GP  PPG
Sbjct: 876  RQGDAGLRGPAGPSGEKGDAGEDGPVGPPG 905