Query lcl|Aclame:protein:vir:103370|NCBI_annot:hypothetical protein|genbank:acc:YP_024741;genbank:gi:48697083;genbank:GeneID:2846038 Match_columns 418 No_of_seqs 89 out of 98 Neff 6.3 Searched_HMMs 1612 Date Sun Dec 1 11:53:25 2013 Command /home/guerois/workspace/virfam/python/lib/hhsearch//hhsearch2 -i .//seq/seq_18 -d /home/guerois/workspace/virfam/python/profile_database/capsid_neck_tail.hhm -glob -cpu 7 -o .//seq/HHR/seq_18_vs_rec_db.hhr No Hit Prob E-value P-value Score SS Cols Query HMM Template HMM 1 protein:vir:96442 Length: 418 100.0 5E-140 3E-143 784.1 35.4 414 1-418 1-418 (418) 2 protein:vir:103370 Length: 418 100.0 5E-138 3E-141 773.2 34.3 414 1-418 1-418 (418) 3 protein:vir:8843 Length: 317 # 100.0 1.3E-81 8.2E-85 464.0 26.7 304 1-408 1-317 (317) 4 protein:vir:104479 Length: 310 99.6 4.5E-19 2.8E-22 121.2 8.6 157 1-176 149-310 (310) 5 protein:vir:97255 Length: 310 98.8 2.4E-10 1.5E-13 73.3 13.7 296 68-406 1-310 (310) 6 protein:vir:94933 Length: 330 98.3 2.8E-08 1.7E-11 62.0 12.6 314 27-407 1-330 (330) 7 protein:vir:95763 Length: 297 97.6 2.6E-05 1.6E-08 45.7 17.0 286 68-407 1-297 (297) 8 protein:vir:94142 Length: 304 97.4 4.4E-05 2.8E-08 44.4 15.0 290 61-405 1-304 (304) 9 protein:vir:105905 Length: 304 97.4 4.4E-05 2.8E-08 44.4 15.0 290 61-405 1-304 (304) 10 protein:vir:99424 Length: 360 97.3 6.9E-05 4.3E-08 43.4 15.5 317 43-409 1-360 (360) 11 protein:vir:41 Length: 299 # N 97.3 3.7E-05 2.3E-08 44.9 13.6 294 61-408 1-299 (299) 12 protein:vir:7771 Length: 330 # 97.2 0.00012 7.7E-08 42.0 16.5 311 61-418 1-329 (330) 13 protein:vir:102823 Length: 470 97.2 2.3E-05 1.5E-08 46.0 12.2 330 35-418 1-355 (470) 14 protein:vir:2504 Length: 305 # 97.1 9.7E-05 6E-08 42.6 14.2 297 69-418 1-305 (305) 15 protein:vir:97148 Length: 324 97.0 5.9E-05 3.6E-08 43.8 12.7 318 4-416 1-324 (324) 16 protein:vir:348 Length: 321 # 97.0 5.8E-05 3.6E-08 43.8 12.5 296 35-404 1-321 (321) 17 protein:vir:8187 Length: 311 # 96.9 7.7E-05 4.8E-08 43.1 12.3 286 69-407 1-311 (311) 18 protein:vir:99749 Length: 324 96.9 9.6E-05 6E-08 42.6 12.7 314 27-416 1-324 (324) 19 protein:vir:103955 Length: 324 96.7 0.00014 8.7E-08 41.7 12.5 312 27-418 1-323 (324) 20 protein:vir:9759 Length: 303 # 96.4 0.00021 1.3E-07 40.8 11.6 284 79-406 1-303 (303) 21 protein:vir:9309 Length: 324 # 96.3 0.00021 1.3E-07 40.7 11.3 304 4-418 1-321 (324) 22 protein:vir:2344 Length: 397 # 96.2 0.00079 4.9E-07 37.6 13.5 302 61-418 1-318 (397) 23 protein:vir:104085 Length: 320 96.0 0.00039 2.4E-07 39.3 11.3 298 61-417 1-320 (320) 24 protein:vir:96392 Length: 324 96.0 0.0008 5E-07 37.6 12.9 310 44-416 1-324 (324) 25 protein:vir:78830 Length: 324 96.0 0.0008 5E-07 37.6 12.9 310 44-416 1-324 (324) 26 protein:vir:94771 Length: 298 96.0 0.0012 7.3E-07 36.6 13.6 281 79-405 1-298 (298) 27 protein:vir:3158 Length: 321 # 95.9 0.00083 5.1E-07 37.5 12.3 308 52-416 1-321 (321) 28 protein:vir:96223 Length: 324 95.8 0.0008 5E-07 37.6 12.0 310 27-418 1-323 (324) 29 protein:vir:4159 Length: 315 # 95.4 0.0022 1.4E-06 35.2 14.1 299 61-403 1-315 (315) 30 protein:vir:2430 Length: 318 # 95.3 0.0024 1.5E-06 34.9 13.3 301 41-411 1-318 (318) 31 protein:vir:9574 Length: 300 # 95.3 0.0024 1.5E-06 34.9 14.0 287 69-406 1-300 (300) 32 protein:vir:4339 Length: 395 # 94.9 0.0032 2E-06 34.3 17.9 320 1-407 68-395 (395) 33 protein:vir:4226 Length: 326 # 94.7 0.0037 2.3E-06 33.9 15.9 308 27-409 1-326 (326) 34 protein:vir:80684 Length: 315 94.6 0.003 1.9E-06 34.4 11.7 296 69-418 1-314 (315) 35 protein:vir:99311 Length: 463 94.5 0.0044 2.7E-06 33.5 12.2 324 6-418 1-352 (463) 36 protein:vir:95603 Length: 463 94.5 0.0044 2.7E-06 33.5 12.2 324 6-418 1-352 (463) 37 protein:vir:4856 Length: 293 # 94.4 0.0045 2.8E-06 33.4 15.4 280 65-418 1-293 (293) 38 protein:vir:78523 Length: 338 93.7 0.0067 4.1E-06 32.5 14.3 318 54-411 1-338 (338) 39 protein:vir:100135 Length: 418 93.6 0.0069 4.3E-06 32.4 19.0 289 1-409 110-418 (418) 40 protein:vir:96666 Length: 462 93.6 0.007 4.4E-06 32.4 13.1 317 27-418 1-359 (462) 41 protein:vir:80835 Length: 464 93.0 0.0091 5.6E-06 31.8 13.2 328 4-418 1-356 (464) 42 protein:vir:1638 Length: 298 # 93.0 0.0091 5.7E-06 31.8 16.0 281 81-405 1-298 (298) 43 protein:vir:1886 Length: 385 # 92.9 0.0096 6E-06 31.6 18.8 322 1-407 61-385 (385) 44 protein:vir:191 Length: 385 # 92.9 0.0096 6E-06 31.6 18.8 322 1-407 61-385 (385) 45 protein:vir:100851 Length: 514 92.5 0.011 6.8E-06 31.3 14.7 354 27-418 1-391 (514) 46 protein:vir:80068 Length: 301 92.2 0.0031 1.9E-06 34.4 7.7 274 80-404 1-301 (301) 47 protein:vir:6242 Length: 390 # 90.4 0.021 1.3E-05 29.8 14.2 299 1-408 72-390 (390) 48 protein:vir:81070 Length: 390 90.3 0.022 1.4E-05 29.7 17.8 316 1-404 70-390 (390) 49 protein:vir:103285 Length: 296 89.6 0.014 8.4E-06 30.8 8.6 282 68-407 1-296 (296) 50 protein:vir:81227 Length: 413 88.8 0.03 1.9E-05 28.9 18.3 326 1-416 74-413 (413) 51 protein:vir:96123 Length: 274 88.1 0.035 2.2E-05 28.6 19.6 254 81-412 1-274 (274) 52 protein:vir:4197 Length: 314 # 85.3 0.054 3.4E-05 27.5 17.0 299 61-399 1-314 (314) 53 protein:vir:97053 Length: 390 84.8 0.057 3.6E-05 27.4 17.9 317 1-405 68-390 (390) 54 protein:vir:10364 Length: 390 84.0 0.064 4E-05 27.1 16.4 318 1-405 61-390 (390) 55 protein:vir:108211 Length: 318 82.5 0.077 4.8E-05 26.7 14.6 292 61-407 1-318 (318) 56 protein:vir:9820 Length: 272 # 81.5 0.085 5.3E-05 26.5 19.7 265 61-410 1-272 (272) 57 protein:vir:3033 Length: 272 # 81.5 0.085 5.3E-05 26.5 19.7 265 61-410 1-272 (272) 58 protein:vir:8102 Length: 543 # 81.0 0.089 5.5E-05 26.3 17.9 309 1-407 212-543 (543) 59 protein:vir:63741 Length: 468 80.8 0.041 2.6E-05 28.2 6.8 328 13-418 1-369 (468) 60 protein:vir:3613 Length: 272 # 74.7 0.16 9.6E-05 25.0 17.8 253 81-406 1-272 (272) 61 protein:vir:93742 Length: 274 74.1 0.16 0.0001 24.9 19.0 256 81-411 1-274 (274) 62 protein:vir:78223 Length: 333 73.9 0.16 0.0001 24.9 16.9 314 54-416 1-333 (333) 63 protein:vir:94494 Length: 274 66.0 0.27 0.00017 23.7 18.9 259 81-411 1-274 (274) 64 protein:vir:97433 Length: 274 66.0 0.27 0.00017 23.7 18.9 259 81-411 1-274 (274) 65 protein:vir:107687 Length: 319 61.2 0.12 7.4E-05 25.6 4.6 298 52-404 1-319 (319) 66 protein:vir:100247 Length: 425 60.4 0.37 0.00023 22.9 15.7 311 1-408 91-425 (425) 67 protein:vir:5739 Length: 366 # 59.6 0.39 0.00024 22.8 13.5 338 1-406 1-366 (366) 68 protein:vir:4953 Length: 397 # 59.5 0.39 0.00024 22.8 14.7 312 1-418 66-397 (397) 69 protein:vir:99920 Length: 311 59.2 0.4 0.00025 22.8 14.7 288 69-408 1-311 (311) 70 protein:vir:80491 Length: 467 58.1 0.42 0.00026 22.6 10.7 327 14-418 1-368 (467) 71 protein:vir:7409 Length: 408 # 58.0 0.42 0.00026 22.6 21.4 319 1-418 77-403 (408) 72 protein:vir:80376 Length: 435 57.8 0.43 0.00026 22.6 14.9 337 1-408 65-435 (435) 73 protein:vir:103886 Length: 302 57.1 0.38 0.00023 22.9 6.5 271 91-412 1-302 (302) 74 protein:vir:98566 Length: 355 56.1 0.46 0.00029 22.4 7.6 300 68-418 1-353 (355) 75 protein:vir:739 Length: 231 # 55.9 0.47 0.00029 22.4 17.2 226 104-406 1-231 (231) 76 protein:vir:4456 Length: 401 # 55.4 0.48 0.0003 22.3 16.8 305 1-407 76-401 (401) 77 protein:vir:4997 Length: 397 # 53.9 0.52 0.00032 22.2 14.4 317 1-418 67-396 (397) 78 protein:vir:485 Length: 407 # 53.0 0.54 0.00033 22.1 18.9 313 1-417 79-407 (407) 79 protein:vir:6061 Length: 357 # 51.8 0.14 8.9E-05 25.2 3.3 327 17-418 1-354 (357) 80 protein:vir:8420 Length: 477 # 50.9 0.6 0.00037 21.8 11.1 355 1-412 77-477 (477) 81 protein:vir:1829 Length: 355 # 50.0 0.6 0.00037 21.8 6.5 314 17-418 1-354 (355) 82 protein:vir:95318 Length: 328 49.0 0.65 0.0004 21.6 8.6 240 61-337 1-328 (328) 83 protein:vir:1328 Length: 392 # 48.4 0.67 0.00042 21.5 18.0 287 1-408 91-392 (392) 84 protein:vir:94070 Length: 339 45.9 0.75 0.00047 21.3 10.6 315 27-404 1-339 (339) 85 protein:vir:94673 Length: 419 44.3 0.81 0.0005 21.1 19.8 320 1-414 91-419 (419) 86 protein:vir:7855 Length: 497 # 42.2 0.9 0.00056 20.8 14.6 329 1-410 111-497 (497) 87 protein:vir:101650 Length: 497 42.2 0.9 0.00056 20.8 14.6 329 1-410 111-497 (497) 88 protein:vir:100331 Length: 342 39.1 0.76 0.00047 21.2 5.2 259 115-410 1-342 (342) 89 protein:vir:78777 Length: 358 38.4 1.1 0.00066 20.4 8.2 313 1-418 1-353 (358) 90 protein:vir:80930 Length: 278 38.2 1.1 0.00067 20.4 18.7 262 81-410 1-278 (278) 91 protein:vir:4830 Length: 397 # 37.7 1.1 0.00069 20.3 13.2 318 1-418 39-395 (397) 92 protein:vir:79642 Length: 329 37.4 1.1 0.0007 20.3 6.4 295 43-407 1-329 (329) 93 protein:vir:94622 Length: 341 37.3 1.1 0.0007 20.3 15.7 288 61-411 1-341 (341) 94 protein:vir:9410 Length: 415 # 36.2 1.2 0.00073 20.2 17.7 324 1-417 62-415 (415) 95 protein:vir:105038 Length: 428 34.9 1.3 0.00078 20.0 16.4 321 1-406 98-428 (428) 96 protein:vir:1433 Length: 435 # 34.3 1.3 0.00081 20.0 15.1 350 1-408 65-435 (435) 97 protein:vir:96833 Length: 275 33.3 1.4 0.00085 19.8 17.7 256 81-411 1-275 (275) 98 protein:vir:5694 Length: 357 # 33.1 0.53 0.00033 22.1 3.4 327 17-418 1-355 (357) 99 protein:vir:2016 Length: 357 # 29.8 0.7 0.00044 21.4 3.4 327 17-418 1-354 (357) 100 protein:vir:104342 Length: 314 29.2 1.7 0.001 19.4 6.0 292 50-407 1-314 (314) 101 protein:vir:105334 Length: 276 28.9 1.7 0.0011 19.3 19.5 258 81-415 1-276 (276) 102 protein:vir:1239 Length: 274 # 27.2 1.9 0.0012 19.1 18.6 256 81-411 1-274 (274) 103 protein:vir:107826 Length: 331 25.2 2.1 0.0013 18.8 8.1 238 61-337 1-331 (331) 104 protein:vir:107388 Length: 331 25.2 2.1 0.0013 18.8 8.1 238 61-337 1-331 (331) 105 protein:vir:98525 Length: 331 25.2 2.1 0.0013 18.8 8.1 238 61-337 1-331 (331) 106 protein:vir:81160 Length: 371 23.7 2.3 0.0014 18.6 13.3 297 1-407 57-371 (371) 107 protein:vir:1025 Length: 408 # 22.4 2.5 0.0015 18.4 21.1 318 1-418 75-405 (408) 108 protein:vir:101607 Length: 379 22.2 2.5 0.0015 18.4 18.2 305 1-404 71-379 (379) 109 protein:vir:107593 Length: 392 21.1 2.7 0.0017 18.3 19.0 300 1-418 78-392 (392) 110 protein:vir:102082 Length: 392 21.1 2.7 0.0017 18.3 19.0 300 1-418 78-392 (392) 111 protein:vir:105004 Length: 392 21.1 2.7 0.0017 18.3 19.0 300 1-418 78-392 (392) 112 protein:vir:102873 Length: 392 21.1 2.7 0.0017 18.3 19.0 300 1-418 78-392 (392) 113 protein:vir:98339 Length: 415 20.5 2.8 0.0017 18.2 21.5 314 1-417 89-415 (415) 114 protein:vir:79987 Length: 415 20.5 2.8 0.0017 18.2 21.5 314 1-417 89-415 (415) 115 protein:vir:81100 Length: 415 20.5 2.8 0.0017 18.2 21.5 314 1-417 89-415 (415) 116 protein:vir:3845 Length: 395 # 20.1 2.8 0.0018 18.1 14.4 327 1-418 43-394 (395) No 1 >protein:vir:96442 Length: 418 # NCBI annotation: hypothetical protein # Family: family:all:11266 # MgeID: mge:1616 # MgeName: 119X # Cross-refs: genbank:acc:YP_001218814;genbank:gi:147917331;genbank:GeneID:5142645 Probab=100.00 E-value=5.4e-140 Score=784.11 Aligned_cols=414 Identities=92% Similarity=1.305 Sum_probs=391.8 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) |||++|+||+||||+|||++||+++++++.||+|+||++|+++|+..++++++|+||||+|++..++++++..+++|+|+ T Consensus 1 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~PN~~~p~l~~i~~g~~~~~~~~t~~w~~d~l~~~~~~~ta~~~a~~T~i~ 80 (418) T protein:vir:96 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEALADATVLT 80 (418) T ss_pred CceeeeecccCCChhhhchhhhhhhhhhhcCCcccchhhhhcccCccccceeEEEEEeeEeeeeeEEEEEEEecCceEEE Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred EccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecccee Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFT 160 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~t 160 (418) |+++++|+++++|++++++|+|||++|||++|||.|||++|+|++|++|++|+++|.+++||+|++++++..+++++||| T Consensus 81 V~~~~~f~~~~l~~~~~~~EvirVtsVng~~lTV~RG~~~t~aa~iaag~~~~~ig~~~eEGsd~~ta~~~k~~~vsN~t 160 (418) T protein:vir:96 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRIAAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFT 160 (418) T ss_pred ecCCcccccccEEEEecCCeEEEEEEEeCCEEEEEEccCCeeeeeeecCceEEEeecCcccccccCCcceecceeccchh Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred EEEeeeeeechhHHHH-hhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccc Q lcl|Aclame:pro 161 QIFRNAWALTDTARAS-YAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNA 239 (418) Q Consensus 161 QIf~~~v~VSgTa~Av-~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~ 239 (418) |||++.|+||+||||+ .++|+.+++++| +++|+++|.++|+++++|++.+++++++|-+.+.|+++.++++.++|++. T Consensus 161 QIf~e~vsVSgTAqA~v~qaGvsn~~~~e-~d~l~~~kv~iE~ali~g~~~~~~~ng~p~~~t~R~m~gI~~f~~~Nvi~ 239 (418) T protein:vir:96 161 QIFRNAWALTDTARASYAEAGYSNITESR-RDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAIRQYAPDNVNA 239 (418) T ss_pred heehhhhhhhhhhhhhhhhcCcchhHHHH-HHHHHHHHHHHHHhhhccccccCCCCCcccccccchhHHHHhhccccccc Confidence 9999999999999995 667988776666 89999999999999999999998888776534444444455667899999 Q ss_pred cCCCCccchHHHHHHHHHHHHhcccCCCcee---EEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEE Q lcl|Aclame:pro 240 MPNPTAVTYDDVVDATIDAFKWSVNVGDNTQ---RVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRL 316 (418) Q Consensus 240 ~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~---~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v 316 (418) +++.+++++++|.++++++|++|.+.+++.+ .+++|++.+|++|++|+ +++++.++++.+|.+|++|+||||++ T Consensus 240 ag~~~~~t~d~L~~~~~~a~~~g~n~G~~~~~~~y~~~V~a~~k~~I~k~~---~~I~~~~~en~~G~vv~~~~Td~G~v 316 (418) T protein:vir:96 240 MPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFF---GEVTVTQRETSYGMVFTEWKFFKGRL 316 (418) T ss_pred cCCCCcCCHHHHHHHHHHHHhhcCCCCCcccceEEEEEeChHHHHHHhhhh---ceeEeccccceeceEEEEEEeeccEE Confidence 8888899999999999999999988877776 45689999999999985 46999999999999999999999999 Q ss_pred EEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEeccc Q lcl|Aclame:pro 317 ILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQ 396 (418) Q Consensus 317 ~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~k 396 (418) .|++||+|++.++|+++||||||++|+++||+||++++|+|+|+|.+......+++..||.|+++|||++|||||++||+ T Consensus 317 ~ii~n~~~pad~I~~g~mlVvD~~~vkL~yL~~R~~~~E~l~k~G~~~~~~~~~~~~~~~~D~~~G~l~~Eltle~~N~~ 396 (418) T protein:vir:96 317 IIKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQ 396 (418) T ss_pred EEEecCCCCccccCcceEEEEecCceEEEEecCCCccchhcccCCCcccccccccccccccccccCEEEEEEEEEeeccc Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred ceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 397 GCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 397 A~a~I~gL~~~~~~~~~~~~~~ 418 (418) |||+|+||+||||+||||+|+| T Consensus 397 a~a~itgl~~~~~~~~~~~~~~ 418 (418) T protein:vir:96 397 GCAVITGLQKAKERVYLTAPAP 418 (418) T ss_pred ccEEeecccccccccccCCCCC Confidence 9999999999999999999999 No 2 >protein:vir:103370 Length: 418 # NCBI annotation: hypothetical protein # Family: family:all:11266 # MgeID: mge:1621 # MgeName: PaP2 # Cross-refs: genbank:acc:YP_024741;genbank:gi:48697083;genbank:GeneID:2846038 Probab=100.00 E-value=5.2e-138 Score=773.21 Aligned_cols=414 Identities=92% Similarity=1.269 Sum_probs=397.5 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) |||++|+||+||||+|||+|||+++++++.||+|+||++|+++|+..++++++|+||+|+|++++++++|++++++|+|+ T Consensus 1 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~PN~~~pll~li~~g~~~ta~ast~~w~~d~~~~~~~~~ta~a~a~~T~l~ 80 (418) T protein:vir:10 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) T ss_pred CceeccccccCCChhhhchhhhhhhhhhhcCCcchhhhhhhhcccccccceeEEEEEEEEEeeeeEEEEEEEecCceEEE Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred EccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecccee Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFT 160 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~t 160 (418) |+++++|.++++|++++++|+|+|++|||++|||.|||++|++++|++|++|+++|++++||+|++++++..+++++||| T Consensus 81 ve~~~~f~~~~l~~~~~~~Evirv~sVng~~lTV~Rg~~~t~aaaia~n~~~~~Ig~~~eEGsd~~ta~~~k~~~vsNvt 160 (418) T protein:vir:10 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFT 160 (418) T ss_pred EcCcceeccccEEEEccCCeEEEEEEEeCCEEEEEEecCCeeEEEEecCceEEEeccccccccccCCcceecceeccchh Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred EEEeeeeeechhHHHH-hhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccc Q lcl|Aclame:pro 161 QIFRNAWALTDTARAS-YAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNA 239 (418) Q Consensus 161 QIf~~~v~VSgTa~Av-~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~ 239 (418) |||+++|+||+|+||+ ..+|..|++++|..+++++ +++||+++|+|+++++++++++.|+|+||+.+++++.++|++. T Consensus 161 QIF~~avsvSgTaqAs~~q~Gvsn~~ese~drk~~~-av~iEkalI~G~~~~~~~~~g~~R~m~GIl~~vr~~~~gnVv~ 239 (418) T protein:vir:10 161 QIFRNAWALTDTARASYAEAGYSNITESRRDCMDFH-ATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNA 239 (418) T ss_pred hhhhhhhhhhhhhhhccccccCchHHHHHHHHHHHH-HHHHHHHHhcccccCCCcCCcchhhHHHHHHHHhhhcccceec Confidence 9999999999999996 5568889999995555555 6799999999999999999999999999999999999999999 Q ss_pred cCCCCccchHHHHHHHHHHHHhcccCCCcee---EEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEE Q lcl|Aclame:pro 240 MPNPTAVTYDDVVDATIDAFKWSVNVGDNTQ---RVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRL 316 (418) Q Consensus 240 ~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~---~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v 316 (418) +++++++++++|.++++++|++|.+.++.++ .+++|++++|++|++|. +++++.++++.+|++|++|.+..|.+ T Consensus 240 a~~~t~~s~d~l~~a~~~af~~g~~~G~~~q~~~f~~~V~~~~k~~I~k~~---~~I~~~~~e~~~G~vv~~~~~~~G~I 316 (418) T protein:vir:10 240 MPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFF---GEVTVTQRETSYGMVFTEWKFFKGRL 316 (418) T ss_pred cCCCCccCHHHHHHHHHHHhhccCCCcccccceeEEEEeChHHHHHhhhhh---hheeecccceeeeEEEEEEEcceEEE Confidence 9888899999999999999999888777765 66789999999999985 35899999999999999998888999 Q ss_pred EEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEeccc Q lcl|Aclame:pro 317 ILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQ 396 (418) Q Consensus 317 ~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~k 396 (418) .+..||+|.+.|||+|+|+|+||++++++||++|++++|.|+|+|.+......+++..||.|++||||++|||||++||+ T Consensus 317 ~L~~~p~~~~~~lp~g~mlVvD~~~vkL~~L~~R~~~~E~l~k~G~~~~~~~~~~~~~~~~D~~kG~iv~E~tLe~~N~~ 396 (418) T protein:vir:10 317 ILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQ 396 (418) T ss_pred EeecccccccccCCCceEEEEccccceEEEeccccccchhcccCCCcccccccccccccccccccceEEEEeeeeeeccc Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred ceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 397 GCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 397 A~a~I~gL~~~~~~~~~~~~~~ 418 (418) |||+|+||+|||||||||||+| T Consensus 397 a~avitgl~~~~~~~~~t~p~~ 418 (418) T protein:vir:10 397 GCAVITGLQKAKERVYLTAPAP 418 (418) T ss_pred ceEEeeccceecccccCCCCCC Confidence 9999999999999999999999 No 3 >protein:vir:8843 Length: 317 # NCBI annotation: major head protein # Family: family:all:3919 # MgeID: mge:158 # MgeName: PaP3 # Cross-refs: genbank:acc:NP_775251;genbank:gi:27476049;genbank:GeneID:2700597 Probab=100.00 E-value=1.3e-81 Score=463.99 Aligned_cols=304 Identities=13% Similarity=0.115 Sum_probs=261.2 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) ||.-+.-|-+ .-+-.++++|+|+|.++.|. .||++.|++ +.+++++.|+|..|.+.... T Consensus 1 ma~~~~~~~t--~~~~g~~~dl~~~I~~isp~-dTPf~S~i~---~~~a~~~~~~W~~d~l~~~~--------------- 59 (317) T protein:vir:88 1 MATPTNAVST--VEINGKREDLIDIIYNIAPY-DTPFMSAIG---KGVATAITHEWQTDELRQPG--------------- 59 (317) T ss_pred CCccccceEe--eeeeeeeechhhhheecCCc-cCcceeeec---CceecccEEEEEeeecCCcc--------------- Confidence 8888877765 33467889999999999995 999998753 36799999999887652100 Q ss_pred EccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecccee Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFT 160 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~t 160 (418) -|+++||+|+++++..+|++++||| T Consensus 60 -------------------------------------------------------~~~~~EG~da~~~~~~~r~~~~N~t 84 (317) T protein:vir:88 60 -------------------------------------------------------KNTRVEGEDATIKAGSFTTMLNNYC 84 (317) T ss_pred -------------------------------------------------------ccccccCcccccccccCCEEeccEE Confidence 0566799999999999999999999 Q ss_pred EEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccc------ Q lcl|Aclame:pro 161 QIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAP------ 234 (418) Q Consensus 161 QIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~------ 234 (418) |||+|+++||||++|++.+|+.+|++||++||++|||||||++||+|++..++++.+.+|+|+||+.|+++... T Consensus 85 QIf~k~v~VSgTa~av~~~G~~~ela~q~~kk~~EikrdmE~~li~g~~a~~~~~~t~~r~~~Gl~~~i~t~~~~~~~g~ 164 (317) T protein:vir:88 85 QISDETLQVTGTADRVKKAGRKNELAYQLAKKSKELKLDMEYALVGAPQAKVQRNTTTPGQMANIFAYYKTNGSLGANGV 164 (317) T ss_pred EEEEeEEEEeehhhhhhhcCccchhHHHHHHHHHHHHHHHHHHHhcCeeeccCCCCccchhhhhHHHHhccCceeccCcc Confidence 99999999999999999999999999999999999999999999999988766666667999999999865211 Q ss_pred ------cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhh-ccceEEEcccceeeceEEE Q lcl|Aclame:pro 235 ------DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGR-FFGEVTVTQRETSYGMVFT 307 (418) Q Consensus 235 ------~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~-~~~~~~~~~~~~~~G~~v~ 307 (418) ++....+...++||++|.++++++|+.|+..+ .+||++.+|++|++|.+ ...+++..+.++.+|.+|+ T Consensus 165 ~~~~~~~~~~t~~t~~~lte~~l~~~l~~i~~~Gg~~~-----~i~v~a~~k~~i~~~~~~~~~~i~~~~~~~~~g~~v~ 239 (317) T protein:vir:88 165 APVGDGSNTGTAGDLRLLTEDMLLNASESIWRNGGQAN-----SIQTSSSIKKAISKNMKGRATEITLDASDNRIAQTVD 239 (317) T ss_pred ccccCCCccccccccccccHHHHHHHHHHHHhcCCCCC-----EEEeChHHHHHHHHHhcCCceeEEEcccCeEEEEEEE Confidence 01112223346899999999999999876544 58999999999999964 3345677889999999999 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSE 387 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E 387 (418) +|+||||+++||+||+ ||+|++++|||++|+++|| |+++.|+|+|+| |++++||++| T Consensus 240 ~~~tdfG~v~ii~~r~-----lp~~~~~~~D~~~~~l~~L--r~~~~e~laKtG----------------d~~k~~i~~E 296 (317) T protein:vir:88 240 VYESDFGKYTIRANRW-----FHENTLFVFDPKMHSLCYL--RPFFQHELAKTG----------------DSEKRQLLVE 296 (317) T ss_pred EEEeCCeEEEEEeCCC-----CCCCeEEEEcccccceeec--ccceeeccCCCc----------------ccceeEEEEE Confidence 9999999999999976 5889999999999999999 999999999999 9999999999 Q ss_pred EEEEEecccceEEeecCcccc Q lcl|Aclame:pro 388 WALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 388 ~tLev~N~kA~a~I~gL~~~~ 408 (418) +|||||||+|||+|+||.+.- T Consensus 297 ~tLe~~N~~a~a~i~~l~~~~ 317 (317) T protein:vir:88 297 YTFRVNNEKSGALIRDVVAQL 317 (317) T ss_pred EEEEEcCccceeEEEEecccC Confidence 999999999999999997763 No 4 >protein:vir:104479 Length: 310 # NCBI annotation: gp15 # Family: family:all:1105 # MgeID: mge:1548 # MgeName: P-SSM4 # Cross-refs: genbank:acc:YP_214651;genbank:gi:61806292;genbank:GeneID:3294534 Probab=99.63 E-value=4.5e-19 Score=121.16 Aligned_cols=157 Identities=13% Similarity=0.064 Sum_probs=100.5 Q ss_pred Ccceeeeec-cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEE Q lcl|Aclame:pro 1 MSVYAGIFN-TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVL 79 (418) Q Consensus 1 ~~~~~~~~~-~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~ 79 (418) |--+-|-+= .--+..+ +|.-..|...-.+.. .+ .+.. --+..++...|.-....++++++..+++|+| T Consensus 149 ~Ft~kg~lY~Pv~~~~~-Ik~i~idf~~~~~~~-----~~-~~~~----~~sv~~~~~~D~dG~~~Ttlsa~Isa~~ts~ 217 (310) T protein:vir:10 149 QFTAKTYLYGPVTDAKV-VRKTQVDYYANTDVN-----TA-PRAR----RYTVQPESTIDRDGTVATTLSATISKTATGF 217 (310) T ss_pred EEEEeEEecCcccCcce-eeeEeeeeccCcccc-----cc-ccce----eeecceEEEccccceeEEEecccccccceee Confidence 111111111 0001111 222111111100000 00 0011 1122222223333345577888999999999 Q ss_pred EEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEee---ccccc-ccCCcCccccccee Q lcl|Aclame:pro 80 TVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIG---TAFEE-GSQRPTARSIQPVY 155 (418) Q Consensus 80 tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g---~a~~E-Gada~~~~~~~~~~ 155 (418) .|+++++|..+..+ .|++|+|+|++|+|++|||.||+.+|+|++|..|++|.++. ++-+| |+|+ ..... T Consensus 218 ~V~d~s~~~~~~~i--~Id~E~i~i~~isgn~LTV~RG~~~T~aa~H~~g~~V~~in~~d~~lle~gddf-----g~~e~ 290 (310) T protein:vir:10 218 AVANASGINQYDNI--YIGAELMRVTNKVGNNLSVIRGYEKSTPTVHSVGSNVFIVNAADNALLESDDDF-----GFGEI 290 (310) T ss_pred eecccccccccceE--EECcEEEEEEeeccceEEEEecccCCchhhhhcCCcEEEEccCCCccCCccccc-----ccccc Confidence 99999999999965 69999999999999999999999999999999999999885 22344 7774 45567 Q ss_pred ccceeEEEeeeeeechhHHHH Q lcl|Aclame:pro 156 VPNFTQIFRNAWALTDTARAS 176 (418) Q Consensus 156 ~~N~tQIf~~~v~VSgTa~Av 176 (418) ++||+||.... .+|++++|+ T Consensus 291 ~s~~~d~~~~~-~~~~~~~a~ 310 (310) T protein:vir:10 291 YSEYTDMKKYN-PVSGQDEAI 310 (310) T ss_pred ccccccceeec-cccceeecC Confidence 89999977666 999999999 No 5 >protein:vir:97255 Length: 310 # NCBI annotation: hypothetical protein ORF017 # Family: family:all:1120 # MgeID: mge:1657 # MgeName: M6 # Cross-refs: genbank:acc:YP_001294525;genbank:gi:149408246;genbank:GeneID:5237120 Probab=98.83 E-value=2.4e-10 Score=73.28 Aligned_cols=296 Identities=10% Similarity=0.059 Sum_probs=156.7 Q ss_pred EEEEeecCceEEEEccccccccCceeEecc-CceEEE---EEEecCceeEEEccccccchhhhhCCceEEEeeccccccc Q lcl|Aclame:pro 68 VTAEAAADATVLTVENSDGLTKGMIFYNEA-TGENMR---LELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGS 143 (418) Q Consensus 68 ~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~-~~E~~~---Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGa 143 (418) ++ +++-+... +.+.+.. ...+++.-+ ..+++. -..|.|+.....|-.-.+.++....+.+. -.+|. T Consensus 1 mp-altLaea~--k~~~d~l-~~~ViE~~~~~s~lL~~LpF~~veg~~~~ynR~~~~~~~~~~~v~~~~------~~~g~ 70 (310) T protein:vir:97 1 MA-SVTLAESA--KLAQDEL-VAGVIENIITVNRMFDVLPFDSIEGNSLAYNRENVLGDVIMAGVGTTF------SGAGA 70 (310) T ss_pred Cc-ccchHHHh--hcCcchH-HHHHHHHHhccchHHHhCCcccccCCcceeeEeeccCCcccccccccc------cCCCc Confidence 22 12111111 1111111 111111111 223332 24566776554443333333222223222 11222 Q ss_pred CCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhH Q lcl|Aclame:pro 144 QRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQ 223 (418) Q Consensus 144 da~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~ 223 (418) .-..... .+.+--+-|+...++|-.--.........++.++|++.+.+.|++..|..||+|-... +.-. T Consensus 71 ~~~~~t~---~~~~~~L~i~~g~~~Vd~~i~dl~~~~~~dq~~~Ql~~~iea~~~~~e~~lINGD~a~--------n~F~ 139 (310) T protein:vir:97 71 GKAAATF---TKVNSNLTTIMGDAEVNGLIQATRSGDGNDQTAVQIASKAKSAGRKYQDQLINGNGAG--------NEFA 139 (310) T ss_pred ccccccc---ceeeeeeeeeeehhhhhhHHHhhhcCChHHHHHHHHHHHHHHHHHHHHHHhhccccCC--------Cccc Confidence 2222222 2334467788888887654433322224478999999999999999999999987531 2244 Q ss_pred HHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccce-EEEcccceee Q lcl|Aclame:pro 224 GIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGE-VTVTQRETSY 302 (418) Q Consensus 224 GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~-~~~~~~~~~~ 302 (418) |++..+. .....+..+.++.+|.++|.+++..+|.+.+. +.++++++..+++|.+|.+..++ -.+......+ T Consensus 140 GL~~~~~--~~q~i~~~~~gg~~t~d~LDeLl~~v~~~~g~-----p~~~l~~~~~~r~i~A~~R~~~~~g~~~~~~~~~ 212 (310) T protein:vir:97 140 GLIQLCA--SGQKATTGATGSAISFAILDELMDLVVDKDGQ-----VDYLTMHARTLRSYKALLRALGGASINEVVELPS 212 (310) T ss_pred chhhcCC--ccceeecCCCCCCCCHHHHHHHHHHHhcCCCC-----CCEEEecHHHHHHHHHHHHHhcCCCCCCccccCC Confidence 6654432 12223444566789999999999999975433 34799999999999999875543 2333345677 Q ss_pred ceEEEEEEcCCeEEEEEECccccccCCC-----CCeEEEEchhh--c--eeeeccCCCcccccccccCcccccccccccc Q lcl|Aclame:pro 303 GMVFTEWKFFKGRLILKEHPLFSAIGIS-----PGFAVVVDVPA--V--KLAYMDGRNAKVENYGQGGGENKSGATDYSY 373 (418) Q Consensus 303 G~~v~~~~SdfG~v~vv~n~~l~~~~mp-----~d~~lv~D~~~--~--~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~ 373 (418) |..|..| +-+.|+++.++..-..+ .-.++++-.-. + -+.=| .....++-+.+.-+ . T Consensus 213 G~~v~~~----~GiPi~~~d~ip~~~~~~~~~gtTsIya~r~Ge~~~~~Gv~Gl--------~~~~~~glsVr~~G---~ 277 (310) T protein:vir:97 213 GAEVPAY----SGTPIFRNDYIPTNQTKGGTTGCTTIFAGTLDDGSRTHGIAGL--------TATQAAGIQVVDVG---E 277 (310) T ss_pred CCEEeee----CCeEEEEeCccCCCccccccCCceeEEEEeeCccccccceecc--------ccCCccceeEEeCC---c Confidence 8777543 34677777654221000 01122222111 0 01000 00011111111100 0 Q ss_pred ccCccccccEEEEEEEEEEecccceEEeecCcc Q lcl|Aclame:pro 374 GHGVDAQGGSLTSEWALELLNPQGCAVITGLQK 406 (418) Q Consensus 374 ~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~ 406 (418) .+..+..++.+.+=|++-+.|++|.|+++|..- T Consensus 278 ~~~~~v~~~~V~~Y~~~av~~~~A~a~L~~V~~ 310 (310) T protein:vir:97 278 SEDSDEHIWRVKWYCGLALFSEKGLACADGITN 310 (310) T ss_pred ccCCcceeEEEEEeeeEEEecccceeeeccccC Confidence 223367888888889999999999999999977 No 6 >protein:vir:94933 Length: 330 # NCBI annotation: putative phage structural protein # Family: family:all:1120 # MgeID: mge:1538 # MgeName: Xp15 # Cross-refs: genbank:acc:YP_239278;genbank:gi:66392060;genbank:GeneID:5076578 Probab=98.34 E-value=2.8e-08 Score=62.00 Aligned_cols=314 Identities=12% Similarity=0.087 Sum_probs=157.9 Q ss_pred eEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEecc-CceE---E Q lcl|Aclame:pro 27 LRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEA-TGEN---M 102 (418) Q Consensus 27 ~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~-~~E~---~ 102 (418) |.++- +||+-. || -+.+|++=.-.| ++-..+.+..+ +. +.+ ...++..-. ..|+ | T Consensus 1 ~~~~~--~~~~~~--~~------~~~~~~~p~l~m-------~alTLaea~~l-~~--d~~-~~~VIE~l~~~s~iL~~l 59 (330) T protein:vir:94 1 MVRIC--TPPLRG--RW------RTLTHQFPELKM-------PTVTLAESAKL-SQ--DHL-VSGLIETIVEVNPLYEMM 59 (330) T ss_pred Cceec--CCcccc--ce------eehhccccccch-------hhhhhhHHhhc-Cc--hhh-HHHHHHhhhccchHHhhc Confidence 33332 344431 11 122333322222 22111111111 11 111 111111111 1122 2 Q ss_pred EEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhc-c Q lcl|Aclame:pro 103 RLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEA-G 181 (418) Q Consensus 103 ~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g-~ 181 (418) -.+.|+++..+..|-.. ..+..+..++....| ......+.++--|-++.-.++|..--.- .++ . T Consensus 60 pf~~ve~~~~~~~r~~~-------lp~a~~r~~n~~~~~------~~~~Tf~q~t~~l~~l~~~~~Vd~~iad--l~g~~ 124 (330) T protein:vir:94 60 PFTEIEGNALAYNRENV-------LGDVQFLAVGGTITA------KNPATFTKVTSELTTLIGDAEVNGLIQA--TRSDF 124 (330) T ss_pred ccccccCCcceeeeeec-------CCcceeeeccccccc------cCcceeeeeeechhhhhhhHHHHHHHHH--hcCCH Confidence 34667777654433111 123334333211111 1111122333345566665555543322 233 2 Q ss_pred cchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCc-cccCCCCccchHHHHHHHHHHHH Q lcl|Aclame:pro 182 YSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNV-NAMPNPTAVTYDDVVDATIDAFK 260 (418) Q Consensus 182 ~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv-~~~~~~a~~te~~l~d~~~~~~~ 260 (418) .+..++|.+.+.+.|+..+|..||+|-.. .+.-.||+..+ ...+. ++.++++.+|.++|.+++..+|. T Consensus 125 ~d~~~~q~~~~ieal~~~~e~~linGDs~--------~~~F~GL~~~~---~~~q~i~tg~~gg~~T~d~LDeLl~~v~~ 193 (330) T protein:vir:94 125 MDQTSVQVASKAKSIGRQYQASMITGDGT--------GNSFQGMMGLV---AASQTISAGANGGTLTFELLDQLLDLVKD 193 (330) T ss_pred HHHHHHHHHHHHHHHHHHHHHHhhccCCC--------CccccchhhcC---CcccEEecCCCCCCCCHHHHHHHHHHhcC Confidence 36788999999999999999999999421 13456765443 23333 34456788999999999999997 Q ss_pred hcccCCCceeEEEEeChHHHHHHHhhhhccceEEEc-ccceeeceEEEEEEcCCeEEEEEECccccccCCCC------Ce Q lcl|Aclame:pro 261 WSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVT-QRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISP------GF 333 (418) Q Consensus 261 ~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~-~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~------d~ 333 (418) ..+. +.+++.+....++|.+|.+..+++-+. .....+|..|-.| +-+.|+++.++..- ..+ -. T Consensus 194 ~~g~-----~~~~l~n~a~~r~I~a~~R~~~~~~v~~~~~~~~G~~v~~~----~GvPi~~~d~ip~~-~~~~~~~~tts 263 (330) T protein:vir:94 194 KDGQ-----VDYLMSSFAMRRKYFSLLRALGGAAIGEVMTLPSGRQIPTY----RGVPWFVNDFIPSN-MTQGTATNATA 263 (330) T ss_pred CCCC-----CcEEEechhHHHHHHHHHHhccCCCCCCcccccCCCEEeee----CCeEEEecccccCC-CCcccCCCcee Confidence 5533 347889999999999998766654443 3445677766443 23566666544210 000 12 Q ss_pred EEEEchh--hceeeeccCCCcccccccccCcccccccccccc-ccCccccccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 334 AVVVDVP--AVKLAYMDGRNAKVENYGQGGGENKSGATDYSY-GHGVDAQGGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 334 ~lv~D~~--~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~-~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) ++++... ...... -=|-.+|. ........+ .+..+..++.+.+=|++-+.|++|.|+++|+..- T Consensus 264 Iyav~~G~~~~~qgV--------~Gl~~~g~--~glsVr~~G~~~~k~v~~~~v~~y~~~av~~~~a~~~L~~V~~g 330 (330) T protein:vir:94 264 IFAGTFDDGSNKYGI--------AGLTARGS--AGLRVQNVGAKENADETITRVKMYCGFANFSQLGLAAIKGLIPG 330 (330) T ss_pred EEEEeecccccccce--------EeecCCCC--CcceeeeCCCccccceeeEEEEEeeeeEEechhheeeeccccCC Confidence 2222211 100000 00111110 000000111 2233677888999999999999999999999777 No 7 >protein:vir:95763 Length: 297 # NCBI annotation: head protein # Family: family:all:507 # MgeID: mge:1578 # MgeName: SMP # Cross-refs: genbank:acc:YP_950590;genbank:gi:119953785;genbank:GeneID:5076833 Probab=97.64 E-value=2.6e-05 Score=45.70 Aligned_cols=286 Identities=12% Similarity=0.063 Sum_probs=131.7 Q ss_pred EEEEeecCceEEEEccccccccCceeEeccCce---------EEEEEEecCce-eEEEccccccchhhhhCCceEEEeec Q lcl|Aclame:pro 68 VTAEAAADATVLTVENSDGLTKGMIFYNEATGE---------NMRLELVNGLN-LTVKRQTGRISAAIIAANTKLIVIGT 137 (418) Q Consensus 68 ~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E---------~~~Vtav~g~~-~tv~rg~~~tta~~~~~gt~v~~~g~ 137 (418) +++..-.+....+-.++..+.+..+. +++-+. ...+.-+.+.. .++.+-..+. ...| T Consensus 1 m~~~~~~~~~~~~t~~~~~lvP~~~~-~~ii~~~~~~s~l~~~~~~~~~~~~~~~~~~~~~~~~-------~a~~----- 67 (297) T protein:vir:95 1 MTVQTFNPENVLVSQKKDGTLHKEFT-DIIMKEVAQNSLVMQLGQYQEMEGEQEKTVYVQTDGI-------SAYW----- 67 (297) T ss_pred CCccccccccccccCCCcceechhHH-HHHHHHHHhhchhhhhcceeecCCCccEEEEEEcCCc-------eeEE----- Confidence 22221111111111111222222211 111111 11223333322 2222111111 1112 Q ss_pred ccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCc Q lcl|Aclame:pro 138 AFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQ 217 (418) Q Consensus 138 a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~ 217 (418) ..||++.+..... . -..-..+++-...+.-|.+..+.. ..+-..+-..+-...+.+.+|.++|+|.-. + . T Consensus 68 -v~Eg~~~~~~~~~-f--~~v~l~~~k~~~~~~is~ell~ds-~~~l~~~i~~~la~ai~~~~d~a~l~G~g~----~-~ 137 (297) T protein:vir:95 68 -VNETEKIKTDKPE-V--VPVTLKAHKLGIILVTSREALNYT-WKKFFEDMKPQIVEAFYKKIDEAGLLGHDT----P-F 137 (297) T ss_pred -eecCccccccccc-e--eEEEEeeEEEEEeehhhHHHHhcC-HHHHHHHHHHHHHHHHHHHHHHHHhcccCC----c-c Confidence 2477665543311 1 112234444444555555555432 223334444555556899999999988531 1 1 Q ss_pred cchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcc Q lcl|Aclame:pro 218 PLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQ 297 (418) Q Consensus 218 ~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~ 297 (418) + .||+..+.. .+ ...++.++.+++.++..++...+... ..++++++....|.++....|++.+.. T Consensus 138 ~----~gi~~~~~~---~~---~~~~~~~t~~~i~~~~~~l~~~~~~~-----~~~v~~~~~~~~L~~l~d~~G~~i~~~ 202 (297) T protein:vir:95 138 A----NSVAKAAKD---AN---KVIGGPINYDNILKLQDALYDADVEP-----NAFVSKIQNRSALREARDGNKVSIYDK 202 (297) T ss_pred c----ccccccccc---cc---eecccccCHHHHHHHHHHhhhccCCc-----CEEEEcHHHHHHHHHhhccCCceeecC Confidence 1 244332211 11 12334678999999998887654332 246789988888888755555544432 Q ss_pred cceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccc-cccccccC Q lcl|Aclame:pro 298 RETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGA-TDYSYGHG 376 (418) Q Consensus 298 ~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~-~~~~~~~g 376 (418) ... +-+|. .++..+ +..++++.+++.|++.+-+..- .+...+.+........... +.....-. T Consensus 203 ~~~----------~l~G~-Pv~~~~---~~~~~~~~~~~gd~s~~~~~~~--~~~~i~~~~~~~~~~~~~~~~~~~~~~~ 266 (297) T protein:vir:95 203 AAN----------TIDGI-TTVDLK---SARFEKGDLLAGDFDNLIYGVP--YNITYKISEEGQISTITNADGTPINLFE 266 (297) T ss_pred CCC----------cccce-eeEeec---CCCCCCceEEEEecccEEEEEe--cCeEEEEeeccccccccccCccchhhhh Confidence 211 11232 223222 2345778999999988754433 3333333333221100000 00000011 Q ss_pred ccccccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 377 VDAQGGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 377 ~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) .|...-+....+...+.||+|.++|+.-.+. T Consensus 267 ~~~~~~r~~~~~d~~v~~~~a~~~l~~at~~ 297 (297) T protein:vir:95 267 QEMIAIRATMDIAVMITKTDAFAKLTPAERV 297 (297) T ss_pred cCcEEEEEEEEeccEeecccceEEEeecCCC Confidence 1455556778899999999999998633322 No 8 >protein:vir:94142 Length: 304 # NCBI annotation: ORF013 # Family: family:all:507 # MgeID: mge:1494 # MgeName: 96 # Cross-refs: genbank:acc:YP_240234;genbank:gi:66395898;genbank:GeneID:5133311 Probab=97.35 E-value=4.4e-05 Score=44.45 Aligned_cols=290 Identities=9% Similarity=-0.037 Sum_probs=124.8 Q ss_pred cccceeEEEEEeecCceEEEEccccccccCceeEeccCc---------eEEEEEEecCceeEEEccccccchhhhhCCce Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLTVKRQTGRISAAIIAANTK 131 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~ 131 (418) |.....+ ....+..+..+...+..+..++-+ ....+.-+.+...++-+-..+.. .. T Consensus 1 ma~~~~~--------~~~~~~t~~gg~lip~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~ip~~~~~~~-------a~ 65 (304) T protein:vir:94 1 MATPTYT--------PGNVILSDFKNGVIPAEQGTLIMKDIMANSAIMKLAKNEPMTAQKKKFTYLAKGVG-------AY 65 (304) T ss_pred Ccccccc--------cccccccCCCceecchhHHHHHHHHHHhccchhhhcceeeccCCceEEEEEeCCcc-------eE Confidence 2111111 111122222222222111111100 11223334444444333222111 12 Q ss_pred EEEeecccccccCCcCcccccceecccee-EEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCccc Q lcl|Aclame:pro 132 LIVIGTAFEEGSQRPTARSIQPVYVPNFT-QIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAF 210 (418) Q Consensus 132 v~~~g~a~~EGada~~~~~~~~~~~~N~t-QIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~ 210 (418) |. .||+..+... +. +++.+ ..++-...+.-|.++.... ..+-..+-...-...+.+.+|.++|+|... T Consensus 66 ~v------~E~~~~~~~~--~~--~~~i~~~~~k~~~~~~iS~ell~ds-~~~l~~~i~~~l~~~ia~~~d~~~l~G~g~ 134 (304) T protein:vir:94 66 WV------SETERIQTSK--PE--YAQAEMEAKKIGVIIPLSKEFLKWT-AKDFFNEVKPLIAEAFYKAFDQAVIFGTKS 134 (304) T ss_pred Ee------ecCccccccc--ce--eeEEEEEEEEEEEeehhhHHHHhcc-hHHHHHHHHHHHHHHHHHHHHhhheeccCC Confidence 22 3665544322 11 11111 1222223333444554432 223334444444566899999999998653 Q ss_pred ccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhcc Q lcl|Aclame:pro 211 MGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFF 290 (418) Q Consensus 211 ~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~ 290 (418) ..+.+ -...|++..+. .......++..+.++|.++..++-..... ...+++++.....|.++.... T Consensus 135 ~~~~~----~~~~~~~~~~~-----~~~~~~~~~~~~~~~i~~~~~~l~~~~~~-----~~~~v~~~~~~~~L~~lkd~~ 200 (304) T protein:vir:94 135 PYNTS----TSGKPLVEGAE-----EKGNVVTDTNNLYVDLSALMATIEDEELD-----PNGVLTTRSFRSKMRNALDAN 200 (304) T ss_pred Ccccc----ccccccccccc-----ccccccccccchHHHHHHHHHHhhhccCC-----cCEEEEcHHHHHHHHHhhccC Confidence 21111 11222222111 11112233456788888887776543222 224778988888888775555 Q ss_pred ceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccc Q lcl|Aclame:pro 291 GEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATD 370 (418) Q Consensus 291 ~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~ 370 (418) +++.+..... +=+| +.|+..+.+.. .-+...+++.|++++.+..- .+...+.+.+.+..... +.+ T Consensus 201 G~~l~~~~~~----------~l~G-~PV~~~~~~~~-~~~~~~~~~gd~~~~~~~~~--~~~~i~~~~e~~~~~~~-~~~ 265 (304) T protein:vir:94 201 DRPLFDANGN----------EIMG-LPLSYTGADVY-DKKKSLALMGDWDYARYGIL--QGIEYAISEDATLTTLQ-ASD 265 (304) T ss_pred CcEeecCCCc----------cccc-eeeEEeccccc-CCCCcEEEEEehhhEEEEEe--cceEEEEeecceeeeec-ccc Confidence 5544432211 1133 24444443321 11234578888887654433 22322333222210000 000 Q ss_pred ccc----ccCccccccEEEEEEEEEEecccceEEeecCc Q lcl|Aclame:pro 371 YSY----GHGVDAQGGSLTSEWALELLNPQGCAVITGLQ 405 (418) Q Consensus 371 ~~~----~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~ 405 (418) .+. .-..|-...+....+.+.+++|+|..+|+.=. T Consensus 266 ~~g~~~~~f~~~~~~~r~~~r~~~~v~~~~a~~~l~~a~ 304 (304) T protein:vir:94 266 ASGQPVSLFERDMFALRATMHIAYMNVKPEAFATLKPTE 304 (304) T ss_pred cCccchhhhhcCcEEEEEEEEeccEeecccceEEEEecC Confidence 000 00114455567789999999999998876543 No 9 >protein:vir:105905 Length: 304 # NCBI annotation: major capsid protein # Family: family:all:507 # MgeID: mge:1514 # MgeName: phiETA3 # Cross-refs: genbank:acc:YP_001004375;genbank:gi:122891830;genbank:GeneID:4712376 Probab=97.35 E-value=4.4e-05 Score=44.45 Aligned_cols=290 Identities=9% Similarity=-0.037 Sum_probs=124.8 Q ss_pred cccceeEEEEEeecCceEEEEccccccccCceeEeccCc---------eEEEEEEecCceeEEEccccccchhhhhCCce Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLTVKRQTGRISAAIIAANTK 131 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~ 131 (418) |.....+ ....+..+..+...+..+..++-+ ....+.-+.+...++-+-..+.. .. T Consensus 1 ma~~~~~--------~~~~~~t~~gg~lip~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~ip~~~~~~~-------a~ 65 (304) T protein:vir:10 1 MATPTYT--------PGNVILSDFKNGVIPAEQGTLIMKDIMANSAIMKLAKNEPMTAQKKKFTYLAKGVG-------AY 65 (304) T ss_pred Ccccccc--------cccccccCCCceecchhHHHHHHHHHHhccchhhhcceeeccCCceEEEEEeCCcc-------eE Confidence 2111111 111122222222222111111100 11223334444444333222111 12 Q ss_pred EEEeecccccccCCcCcccccceecccee-EEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCccc Q lcl|Aclame:pro 132 LIVIGTAFEEGSQRPTARSIQPVYVPNFT-QIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAF 210 (418) Q Consensus 132 v~~~g~a~~EGada~~~~~~~~~~~~N~t-QIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~ 210 (418) |. .||+..+... +. +++.+ ..++-...+.-|.++.... ..+-..+-...-...+.+.+|.++|+|... T Consensus 66 ~v------~E~~~~~~~~--~~--~~~i~~~~~k~~~~~~iS~ell~ds-~~~l~~~i~~~l~~~ia~~~d~~~l~G~g~ 134 (304) T protein:vir:10 66 WV------SETERIQTSK--PE--YAQAEMEAKKIGVIIPLSKEFLKWT-AKDFFNEVKPLIAEAFYKAFDQAVIFGTKS 134 (304) T ss_pred Ee------ecCccccccc--ce--eeEEEEEEEEEEEeehhhHHHHhcc-hHHHHHHHHHHHHHHHHHHHHhhheeccCC Confidence 22 3665544322 11 11111 1222223333444554432 223334444444566899999999998653 Q ss_pred ccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhcc Q lcl|Aclame:pro 211 MGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFF 290 (418) Q Consensus 211 ~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~ 290 (418) ..+.+ -...|++..+. .......++..+.++|.++..++-..... ...+++++.....|.++.... T Consensus 135 ~~~~~----~~~~~~~~~~~-----~~~~~~~~~~~~~~~i~~~~~~l~~~~~~-----~~~~v~~~~~~~~L~~lkd~~ 200 (304) T protein:vir:10 135 PYNTS----TSGKPLVEGAE-----EKGNVVTDTNNLYVDLSALMATIEDEELD-----PNGVLTTRSFRSKMRNALDAN 200 (304) T ss_pred Ccccc----ccccccccccc-----ccccccccccchHHHHHHHHHHhhhccCC-----cCEEEEcHHHHHHHHHhhccC Confidence 21111 11222222111 11112233456788888887776543222 224778988888888775555 Q ss_pred ceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccc Q lcl|Aclame:pro 291 GEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATD 370 (418) Q Consensus 291 ~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~ 370 (418) +++.+..... +=+| +.|+..+.+.. .-+...+++.|++++.+..- .+...+.+.+.+..... +.+ T Consensus 201 G~~l~~~~~~----------~l~G-~PV~~~~~~~~-~~~~~~~~~gd~~~~~~~~~--~~~~i~~~~e~~~~~~~-~~~ 265 (304) T protein:vir:10 201 DRPLFDANGN----------EIMG-LPLSYTGADVY-DKKKSLALMGDWDYARYGIL--QGIEYAISEDATLTTLQ-ASD 265 (304) T ss_pred CcEeecCCCc----------cccc-eeeEEeccccc-CCCCcEEEEEehhhEEEEEe--cceEEEEeecceeeeec-ccc Confidence 5544432211 1133 24444443321 11234578888887654433 22322333222210000 000 Q ss_pred ccc----ccCccccccEEEEEEEEEEecccceEEeecCc Q lcl|Aclame:pro 371 YSY----GHGVDAQGGSLTSEWALELLNPQGCAVITGLQ 405 (418) Q Consensus 371 ~~~----~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~ 405 (418) .+. .-..|-...+....+.+.+++|+|..+|+.=. T Consensus 266 ~~g~~~~~f~~~~~~~r~~~r~~~~v~~~~a~~~l~~a~ 304 (304) T protein:vir:10 266 ASGQPVSLFERDMFALRATMHIAYMNVKPEAFATLKPTE 304 (304) T ss_pred cCccchhhhhcCcEEEEEEEEeccEeecccceEEEEecC Confidence 000 00114455567789999999999998876543 No 10 >protein:vir:99424 Length: 360 # NCBI annotation: hypothetical protein # Family: family:all:1377 # ACLAME annotation(s): phi:0000161 - phage head/capsid # MgeID: mge:1595 # MgeName: BJ1 # Cross-refs: genbank:acc:YP_919080;genbank:gi:119757038;genbank:GeneID:4606077 Probab=97.30 E-value=6.9e-05 Score=43.39 Aligned_cols=317 Identities=11% Similarity=0.044 Sum_probs=140.0 Q ss_pred hccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccc Q lcl|Aclame:pro 43 VVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRIS 122 (418) Q Consensus 43 ~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tt 122 (418) +|....+.++.+...+--.+. +++++... ...+.+.-...|.....=...+-... ++ +++.+-..... T Consensus 1 ~~~~~~~~~~~n~~~~~i~k~---~it~~~l~-~g~L~p~~a~~Fl~~v~~~t~iL~~~-r~-------~~~~s~~~ei~ 68 (360) T protein:vir:99 1 MSSNSTIDSVRNQNMNSLSQK---DIGLAELD-GFQLPVDVTEEFLERMQKGVQILGMA-DT-------MTLARLEMEVP 68 (360) T ss_pred CcchhHHHHHhhhHHHHHHhh---hccccccC-ceeecHHHHHHHHHHHhhccchhhhc-ce-------eeccccccccc Confidence 333333444444443322222 23333332 34555554444433221111111111 11 11111111110 Q ss_pred hhhhhCCceEEEeecccccccCCcC-ccccc-ceeccceeEEEeeeeeechhHHHH--hhhcccchHHHHHHHH-HHHHH Q lcl|Aclame:pro 123 AAIIAANTKLIVIGTAFEEGSQRPT-ARSIQ-PVYVPNFTQIFRNAWALTDTARAS--YAEAGYSNITESRRDC-MDFHA 197 (418) Q Consensus 123 a~~~~~gt~v~~~g~a~~EGada~~-~~~~~-~~~~~N~tQIf~~~v~VSgTa~Av--~~~g~~dela~q~~kk-~~Eik 197 (418) -+..|. ++.+++.|+.+.++ +.... .+. -|.+.=++-.+.+ +.+.+ +.+..+.++..-+... .+.+. T Consensus 69 --kig~G~---r~~r~~~e~~~~~~~~~~~~~~v~-~~~~~~~~~~~~i--~~~~~~~n~~~~~~~f~~~i~~~~ae~~~ 140 (360) T protein:vir:99 69 --QFGVPR---LSGHTRDEEGSRTENSEAESGSVK-FNATDKSYYILVE--PKRDALKNTHYGPDQFGDYIVDQFIERYG 140 (360) T ss_pred --ccccce---eeccccccCCCCCcCCcCccccCc-cccccceeeEeec--hHHHHHhhhhcccchhHHHHHHHHHHHHH Confidence 011222 34456656333222 22111 111 1222222222222 23332 2233334444443444 45679 Q ss_pred HHHhHHHhcCcccc-----cCcCCccchhhHHHHHHHhhcccc---------------------------CccccCCCCc Q lcl|Aclame:pro 198 TEQETAIFFGQAFM-----GTYNGQPLHTTQGIVDAVRQYAPD---------------------------NVNAMPNPTA 245 (418) Q Consensus 198 rdmE~a~i~G~k~~-----~~s~~~~~r~t~GI~~~i~~~~~~---------------------------nv~~~~~~a~ 245 (418) +|||..+++|-+.. +++..+.-+.+.|++-.+..+... |.+..+...+ T Consensus 141 ~Dle~l~~~g~~ds~d~~~~~~~d~fl~~~dGwlKka~~~~~~id~a~d~t~~~~~~~~~~~~~~~~~~~~~~g~~~~~~ 220 (360) T protein:vir:99 141 NDLGLMGIRAGASSGNLQSIGGAAELDNTFKGWIARAEGDAQSVDDAGDSTRIGLEDTATADADSMPSIANTDGSGNPQP 220 (360) T ss_pred HHHHHHHhhccchhcccccCcccchhhhhhHHHHHHhhcccchhhccccccccccccccccccccchhhhcccccccccc Confidence 99999999987632 233334557789988766433211 1111122233 Q ss_pred cchHHHHHHHHHHHHhcccCC-CceeEEEEeChHHHHHHHh-hhhccceEEEcccceeeceEE---EEEEcCCeEEEEEE Q lcl|Aclame:pro 246 VTYDDVVDATIDAFKWSVNVG-DNTQRVMFCDTVGMRTMQD-IGRFFGEVTVTQRETSYGMVF---TEWKFFKGRLILKE 320 (418) Q Consensus 246 ~te~~l~d~~~~~~~~g~~~~-g~~~~~i~v~a~~k~~i~~-~~~~~~~~~~~~~~~~~G~~v---~~~~SdfG~v~vv~ 320 (418) +.+..|.++++.+=.+ .-.+ ....+ ++.+......-.. +.. .....|-.+ ....+.+| +.++. T Consensus 221 ~~~~lf~~~~~~Lp~k-yr~~~~~~~~-~~~s~~~~~~yr~~L~~---------R~t~LGd~~l~g~~~~~~~G-ipi~~ 288 (360) T protein:vir:99 221 VDTSLFNETIQTLDSR-YRESDAYSPV-LMTSPNQVQSYTMSLTE---------REDPLGSAVIFGDSDITPFS-YDLVG 288 (360) T ss_pred chHHHHHHHHHhcchh-hhcCcccceE-EEccCchHHHHHHHHhc---------cCcccchhheecccccccce-eeeEE Confidence 4555555655544222 1111 11223 3344332222222 211 112222221 23456678 66777 Q ss_pred CccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcc-ccccEEEEEEEEEEecccceE Q lcl|Aclame:pro 321 HPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVD-AQGGSLTSEWALELLNPQGCA 399 (418) Q Consensus 321 n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~D-a~k~~i~~E~tLev~N~kA~a 399 (418) -|. ||.+.+++-+|.++.+..- |++..+....+- +.... + +.+..+.+-+...++++.|++ T Consensus 289 v~~-----~pd~~~mlT~p~NLi~g~~--~~iri~~~~e~~---~~~~~--------~~~~~~~~~~~~D~~iee~~Av~ 350 (360) T protein:vir:99 289 VNG-----FPDEYMMFTDPNNLAFGLY--EEMELDQSTDTD---KVHEQ--------RLHSRNWLEGQFDFQIKEQQAGV 350 (360) T ss_pred cCC-----CCCCceEEeccCceeEEee--eeeEEeecccch---hhhhh--------ceeeeEEEEEEeeEEEEecccEE Confidence 765 5779999999999965544 777654333321 10000 1 112234556777889999999 Q ss_pred EeecCccccc Q lcl|Aclame:pro 400 VITGLQKAKE 409 (418) Q Consensus 400 ~I~gL~~~~~ 409 (418) +++|+..++- T Consensus 351 ~vt~~~~~~~ 360 (360) T protein:vir:99 351 LVTDLETPTA 360 (360) T ss_pred EEecCCCCCC Confidence 9999977643 No 11 >protein:vir:41 Length: 299 # NCBI annotation: major capsid protein # Family: family:all:507 # MgeID: mge:2 # MgeName: A118 # Cross-refs: genbank:acc:NP_463467;swissprot:trembl:q9t1b7;genbank:gi:16798789;uniprot:Q9T1B7;genbank:GeneID:922353 Probab=97.26 E-value=3.7e-05 Score=44.90 Aligned_cols=294 Identities=12% Similarity=0.052 Sum_probs=134.2 Q ss_pred cccceeEEEEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccc Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFE 140 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~ 140 (418) |-+.....+....++.+ ++-.-+..+.... ....+-.-...+..+.+....+.... + + ...|. . T Consensus 1 ~g~~a~~~~~~~~~~~~-iP~~~~~~ii~~~-~~~s~l~~~~~~~~~~~~~~~~~~~~-~--~-----~a~~v------~ 64 (299) T protein:vir:41 1 MGFNPDTTTMQSAKTGS-IPINISEQIITGV-KNGSAAMKLAKAVPMTKPEEEFTFMS-G--V-----GAFWV------D 64 (299) T ss_pred CCcCCCcccccCCCcee-cchhHHHHHHHHH-HhcchhhhhceeeecCCCcEEEEEEc-C--C-----ceeee------e Confidence 22222222221111111 1000000000000 00000001123444445544443211 1 1 11222 3 Q ss_pred cccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccch Q lcl|Aclame:pro 141 EGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLH 220 (418) Q Consensus 141 EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r 220 (418) ||.+.+... +. .-.-...+.+-...+.-|.+..+... .+-..+-...-...+.+.+|.++|+|.. ++ .+ T Consensus 65 E~~~~~~~~--~~-f~~v~l~~~k~~~~~~is~ell~ds~-~~~~~~i~~~l~~a~~~~~d~a~l~G~g----~~-~~-- 133 (299) T protein:vir:41 65 EAERIQTSK--PT-FTKAKMRSKKMGVIIPTTKENLNYSV-TNFFSLMQAEIVEAFYKKFDQAVFTGVE----SP-YN-- 133 (299) T ss_pred cCccccccc--cc-eeEEEEeeEEEEEeehhhHHHHhcCH-HHHHHHHHHHHHHHHHHHHHHHHhhccc----Cc-cc-- Confidence 666554332 11 11123334444455556666665322 2333445555556689999999998863 22 11 Q ss_pred hhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce Q lcl|Aclame:pro 221 TTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET 300 (418) Q Consensus 221 ~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~ 300 (418) -||+..... . ......+..+.++|.+++.++-..+.. ...+++++.....|.++...++++-+... . T Consensus 134 --~gil~~~~~---~--~~~~~~~~~~~~~l~~~~~~l~~~~~~-----~~~~v~n~~~~~~L~~lkd~~G~~l~~~~-~ 200 (299) T protein:vir:41 134 --WNILKSATD---A--SNLVEETANKYDDLNEAIGLIEAEDLE-----PNGIATIRKQRVKYRSTKDGNGMPIFNTA-T 200 (299) T ss_pred --ccccccccc---c--ceeeccccccHHHHHHHHHhhhcccCC-----cCEEEEcHHHHHHHHHhhccCCceeecCC-c Confidence 244432211 1 111123456788898888776543322 22478999888899987655555443321 1 Q ss_pred eeceEEEEEEcCCeEEEEEECccccccCCCCCe----EEEEchhhceeeeccCCCcccccccccCcccccccccc-cccc Q lcl|Aclame:pro 301 SYGMVFTEWKFFKGRLILKEHPLFSAIGISPGF----AVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDY-SYGH 375 (418) Q Consensus 301 ~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~----~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~-~~~~ 375 (418) ..|.. +=+| +.|+..+. ||++. +++.|++++.+..- .++..+.+.........-.... ...- T Consensus 201 ~~~~~-----~l~G-~PV~~~~~-----~~~~~~~~~~~~gdfs~~~i~~~--~~~~i~~~~~~~~~~~~~~~~~~~~~~ 267 (299) T protein:vir:41 201 SNGVD-----DVLG-LPIAYTPK-----YTFGDKDISELVGDWNQAYYGIL--RGVEYEILTEATLTTVADETGKPLNLA 267 (299) T ss_pred CCCCc-----eecc-eeeEEecc-----cCCCCCceEEEEEecccEEEEEe--cCcEEEEeecccccccccccccchhhh Confidence 11211 1245 46666654 45554 88889887644332 3455454443331110000000 0001 Q ss_pred CccccccEEEEEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 376 GVDAQGGSLTSEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 376 g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~ 408 (418) ..|...-+....+.+.+++|+|..+|+.- .|- T Consensus 268 ~~~~~~~r~~~~~d~~v~~~~A~~~l~~~-aa~ 299 (299) T protein:vir:41 268 ERDMAAIKATFEVGFMVVKDEAFSAVQPK-AGN 299 (299) T ss_pred hcCcEEEEEEEEeccEEecccceEEEEec-cCC Confidence 12445556678899999999999999653 222 No 12 >protein:vir:7771 Length: 330 # NCBI annotation: gp17 # Family: family:all:507 # MgeID: mge:149 # MgeName: Bxz2 # Cross-refs: genbank:acc:NP_817605;genbank:gi:29566035;genbank:GeneID:1259229 Probab=97.23 E-value=0.00012 Score=42.01 Aligned_cols=311 Identities=11% Similarity=0.001 Sum_probs=128.0 Q ss_pred cccceeEEEEEeecCceEEEE-ccccccccCcee----Eec----cCceEEEEEEecCceeEEEccccccchhhhhCCce Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTV-ENSDGLTKGMIF----YNE----ATGENMRLELVNGLNLTVKRQTGRISAAIIAANTK 131 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV-~~~~~~~~~~~~----~~~----~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~ 131 (418) |........ ..+. .++.++.+..+. ... .-...+.+..+.+..+++-+-..+.. .. T Consensus 1 m~~~~~~a~--------~~~~t~~~g~~i~~~~~~~ii~~~~~~s~l~~~~~~~~~~~~~~~~p~~~~~~~-------a~ 65 (330) T protein:vir:77 1 MAGSTVPST--------QVALTGDFSAFLTPEQSQDYFAEIEKTSIVQRIARKVPMGPTGISIPHWTGAVS-------AS 65 (330) T ss_pred Ccccccchh--------hccccCCCcceechhHHHHHHHHHHhccchhhhcceeeccCCceEEEEEcCCcc-------ee Confidence 322221111 1111 111122222211 100 00111223334444444333222211 12 Q ss_pred EEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccc Q lcl|Aclame:pro 132 LIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFM 211 (418) Q Consensus 132 v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~ 211 (418) |. .||...+..... -.. --..+++-...+.-|.+..... ..+-.++-...-.+.+.+.+|++||+|.- T Consensus 66 ~v------~Eg~~~~~~~~~-f~~--i~~~~~k~~~~~~is~ell~ds-~~~~~~~i~~~l~~ai~~~~~~~~l~G~g-- 133 (330) T protein:vir:77 66 WT------GEAERKPITKGS-FGK--QELEPVKITTIFAESAEVVRLN-PLNYLNTMRTKIAEAIALKFDAAAIHGID-- 133 (330) T ss_pred Ee------cCCCccccccce-eeE--EEEeEEEEEEeehhhHHHHhcc-hHHHHHHHHHHHHHHHHHHHHHHhhcccC-- Confidence 22 366655543211 111 1223333333444455555432 22334555566667789999999998864 Q ss_pred cCcCCccchhhHHHHHHHhhc---cccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhh Q lcl|Aclame:pro 212 GTYNGQPLHTTQGIVDAVRQY---APDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGR 288 (418) Q Consensus 212 ~~s~~~~~r~t~GI~~~i~~~---~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~ 288 (418) ++.+ ..||+..+... ...+............+++.+++.++...... ...+++++.....|.++.. T Consensus 134 --~~~~----~~g~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l~~~~~~~~~~~~~-----~~~~vmn~~~~~~l~~lkd 202 (330) T protein:vir:77 134 --KPSA----FKGYLAETTKVVSLADTNLTTASGPQGNAYLAVNNALSLLVNSGKK-----WTGTLLDNVTEPILNTAVD 202 (330) T ss_pred --CCCc----cccccccccccceeecccccccccccchhHHHHHHHHHhhhhcCCC-----ccEEEEcHHHHHHHHHHhc Confidence 2222 23444322110 01111111122234456677777776654322 2247788888888888755 Q ss_pred ccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccC-CCCCeEEEEchhhceeeeccCCCcccccccccCcccccc Q lcl|Aclame:pro 289 FFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIG-ISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSG 367 (418) Q Consensus 289 ~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~-mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~ 367 (418) .++++-+.......+..--.-.+=+| +.|+..+.+..-. -....+++.|++...+..- .++..+.+.......... T Consensus 203 ~~G~~l~~~~~~~~~~~~~~~~~l~G-~PV~~~~~~p~~~~~~~~~~~~gd~s~~~i~~~--~~~~i~~~~e~~~~~~~~ 279 (330) T protein:vir:77 203 GNGRPLFVESTYTEQVGAIREGRILG-RPTYVADNVVNGTVGNRVVGVMGDFSQVIWGQI--GGLSFDVTDQATLDFGEE 279 (330) T ss_pred cCCceeecCccccccccccCCceecc-eeeEEeccccCCCCCCccEEEEEecceEEEEEe--cCcEEEEeecceeeeccc Confidence 55554443221111100000001134 3555554432100 0012366778777643322 233222222211000000 Q ss_pred c-ccccccc----CccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 368 A-TDYSYGH----GVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 368 ~-~~~~~~~----g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) . ..+...+ ..|....+...-+...+++|+|.++|++-... ++|.. T Consensus 280 ~~~~~~~~~~~~f~~~~~~~r~~~r~d~~v~~~~a~~~i~~~~~~------~~~~~ 329 (330) T protein:vir:77 280 QGGVWVPKLISLWQHNMVAVRCEAEFAFMVNDKDAFVKLTDQVAG------TDPEE 329 (330) T ss_pred ccccccccccchhhcCcEEEEEEEEeccEEecccceEEEEeccCC------cCCCC Confidence 0 0000000 11445556778889999999999998765422 22222 No 13 >protein:vir:102823 Length: 470 # NCBI annotation: major structural protein # Family: family:all:2450 # MgeID: mge:1610 # MgeName: YS40 # Cross-refs: genbank:acc:YP_874086;genbank:gi:118197693;genbank:GeneID:4496015 Probab=97.23 E-value=2.3e-05 Score=45.96 Aligned_cols=330 Identities=15% Similarity=0.085 Sum_probs=144.9 Q ss_pred chhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEE Q lcl|Aclame:pro 35 APLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTV 114 (418) Q Consensus 35 ~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv 114 (418) -|+-+|--+- +.+.--+.++...+.+ +.+.+ -++.|+......+.+|. T Consensus 1 ~~~~~~~~~~-----------------~a~~~al~~a~~~g~A-lR~Es--------------Ld~~l~~lt~~~~~ftf 48 (470) T protein:vir:10 1 MPYEHLKHLD-----------------EATLKALNAAGQVAES-LERED--------------LEPEVTQLNVLDTPLTD 48 (470) T ss_pred CChhHhhhhh-----------------HHHHHHHHHhhhcchh-hhhhh--------------hccceeEeeecCccchh Confidence 3344332221 1111111112221111 22221 22222222222222211 Q ss_pred E--ccccccchhhhhCCceEEEeec----ccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHH Q lcl|Aclame:pro 115 K--RQTGRISAAIIAANTKLIVIGT----AFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITES 188 (418) Q Consensus 115 ~--rg~~~tta~~~~~gt~v~~~g~----a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q 188 (418) - -..-...+..|..+....+=|+ +..||.........-+ |..=..-.+..+..||.-+--....+..|-++.+ T Consensus 49 ~~~i~k~~a~STV~ey~~~~~rhG~~g~s~~~E~~l~~~~d~~~~-Rr~v~~K~l~~~~~VT~~a~~~~~n~v~d~~~~~ 127 (470) T protein:vir:10 49 LLSKNAVKAKAYEHEYNVVTARHDKIGYAAFREGGLPRTVEVNVV-RRRIRPMLVGHRITVTELATRTTQNGVMQIDELV 127 (470) T ss_pred hhhcCCchhhhHhhhhhhhccccccccceeecccccCccCCCceE-EEEEEEEEEeecchhhhhhhhhhhccccchHHHH Confidence 1 1111222333444433333222 2236655443321111 1111223333334444332112234777889999 Q ss_pred HHHHHHHHHHHHhHHHhcCccccc-C-cCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCC Q lcl|Aclame:pro 189 RRDCMDFHATEQETAIFFGQAFMG-T-YNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVG 266 (418) Q Consensus 189 ~~kk~~EikrdmE~a~i~G~k~~~-~-s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~ 266 (418) .++++.-+...+|++++.|-.... . .+++..-+-+||...|..-.+.|+... .|..++++.|..+..++-.. .+ T Consensus 128 ~~dai~~ia~tiE~a~FyGDs~l~s~~~g~~~gleFDGl~~lId~~~~~NViDa-rG~~Ls~~~L~~aa~~I~~~---~~ 203 (470) T protein:vir:10 128 KREKMIAVANEFEYLAFYGDNLLGDDVPGSPNNLQQDGIINIIKRGAPQNVLDA-GGRPLSIDLLWEAESRVVST---QA 203 (470) T ss_pred HHHHHHHHHHHHHhhhhhhccccccccCcccCceeccchhhhccCCCCcccccc-CCCCccHHHHHHHHhhhccc---cc Confidence 999999999999999999965332 0 122333457888776665556677654 34578999998888777532 23 Q ss_pred CceeEEEEeChHHHHHHHhhhhccceEEEcccc----eeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhc Q lcl|Aclame:pro 267 DNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRE----TSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAV 342 (418) Q Consensus 267 g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~----~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~ 342 (418) .+++.-+|.+...+..|..- ...+.|+.... ...|..+..|+|-.|.+++-++-+|+..++. .-++||-+ T Consensus 204 fGt~TD~~lp~~vka~f~~~--~~~~qRv~~~~N~~~~~~G~~v~~f~sa~G~I~L~~s~~m~~~~k~--~p~~l~~~-- 277 (470) T protein:vir:10 204 FANPTAVFISYVDKLNLQAS--FYQISRVMTTADRRAGLLGADAQSYIGVRGEHSLYPSQFLGDFHKF--NPARFGAE-- 277 (470) T ss_pred ccChhhhccchhHHHHHHHh--hcCceEEEEecCCCceeeeeeccceeeeeeeeeecccccccchhhc--CcccCCcc-- Confidence 44445577777667666553 22445555443 3568999999999998888666555332221 11222221 Q ss_pred eeeeccCCCcccccccccCccccccccccccccCccccccE----EEEEEEEEEecccce--EEeecC----cccccccC Q lcl|Aclame:pro 343 KLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGS----LTSEWALELLNPQGC--AVITGL----QKAKERVY 412 (418) Q Consensus 343 ~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~----i~~E~tLev~N~kA~--a~I~gL----~~~~~~~~ 412 (418) ..+++.+....-....+-...-..|+.+|. =+++|..++.|-.+- ..|.+- ..+-..+- T Consensus 278 -----------v~~~aAP~~~~tv~~t~~~~a~~~~sk~g~~~~~~v~sy~y~v~~~~gds~s~~v~vt~t~~~v~kgv~ 346 (470) T protein:vir:10 278 -----------VGDFAAPSNSWTVSTTDNFVTLPYNSGLGDPANTTVYSYAFKAANFYGESAAKYIDVYIDSTEAGKGVR 346 (470) T ss_pred -----------cCCcccCceeEEeecCCCceeecccCCCCcccCcceeEEEEEEEEecCCCCcceEEEEEeeehhcceeE Confidence 122222211000000000011111233231 233555565553321 112111 00111111 Q ss_pred CCC-CC--C Q lcl|Aclame:pro 413 LTA-PA--P 418 (418) Q Consensus 413 ~~~-~~--~ 418 (418) ++- ++ + T Consensus 347 ltI~~~~~v 355 (470) T protein:vir:10 347 FQFHGLVNV 355 (470) T ss_pred EEEecCCCC Confidence 111 11 1 No 14 >protein:vir:2504 Length: 305 # NCBI annotation: major capsid subunit gp9 # Family: family:all:507 # MgeID: mge:53 # MgeName: TM4 # Cross-refs: genbank:acc:NP_569745;genbank:gi:18496895;genbank:GeneID:932268 Probab=97.06 E-value=9.7e-05 Score=42.57 Aligned_cols=297 Identities=11% Similarity=0.031 Sum_probs=126.3 Q ss_pred EEEeecCceEEEEccccccccCceeEeccC----ceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccC Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEAT----GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQ 144 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~----~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGad 144 (418) .+..+.++....|.. .+. ..|+..... ...+.+..+.+..+++-+-..+.. ..|. .||+. T Consensus 1 ma~~t~~~gg~liP~--~~~-~~Ii~~~~~~s~l~~l~~~~~~~~~~~~~p~~~~~~~-------a~wv------~E~~~ 64 (305) T protein:vir:25 1 MADISRAEVASLIQE--AYS-DTLLAAAKQGSTVLSAFQNVNMGTKTTHLPVLATLPE-------ADWV------GESAT 64 (305) T ss_pred CCCccCCccceecCH--HHH-HHHHHHHHhhchhhhhcceeeccCCcEEEEEEeCCcc-------eEEe------ecccc Confidence 222222222212210 000 111110000 011234444444444433222211 1222 35544 Q ss_pred CcCcccccceeccceeEE----EeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccch Q lcl|Aclame:pro 145 RPTARSIQPVYVPNFTQI----FRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLH 220 (418) Q Consensus 145 a~~~~~~~~~~~~N~tQI----f~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r 220 (418) .+..... .. -..+.+| ++-...+.-|.+..+... .+-.++-.+.-.+.+.+.+|.++|+|.-. ..+ . T Consensus 65 ~~~~~~~-~s-~~~f~~i~~~~~k~~~~~~is~ell~ds~-~~~~~~i~~~l~~~~a~~~d~a~~~G~g~----~~~--~ 135 (305) T protein:vir:25 65 DPKGVKP-TS-KVTWANRTLVAEEIAVIIPVHENVIDDAT-VAVLTEVAELGGQAIGKKLDQAVIFGTDK----PAS--W 135 (305) T ss_pred ccccccc-cc-ccceeeEEeeeEEEEEeehhhHHHHhcch-HHHHHHHHHHHHHHHHHHHhhhheeccCC----CCC--c Confidence 3322111 10 1123333 333333444555554322 23345555666688999999999988631 111 1 Q ss_pred hhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce Q lcl|Aclame:pro 221 TTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET 300 (418) Q Consensus 221 ~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~ 300 (418) ...++..... ..........+..+..++.+.+.++......... ...-+++++.....|.++...++++.+ +.+. T Consensus 136 ~~~~~~~~~~---~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~-~~~~~v~~~~~~~~l~~lkd~~G~~i~-~~~~ 210 (305) T protein:vir:25 136 VSPALIPAAV---TAGQAVEVVGGVANESDIVGATNRAAKAVASAGW-APDTLLSSLALRYEVANIRDANGNPVF-RDDS 210 (305) T ss_pred cccccccccc---cccccccccccchhhhHHHHHHHHHHHhhhhccc-ccceeEecHHHHHHHHHhhccCCceee-cCCc Confidence 1111111110 0111112233344556666666665543222111 111255688777788877555565544 3344 Q ss_pred eeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccc Q lcl|Aclame:pro 301 SYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQ 380 (418) Q Consensus 301 ~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~ 380 (418) -+|.-| +.+++ +.. ......+++.|++.+.+..-. +...+......+.+... ....-..|-. T Consensus 211 l~G~Pv--~~~~~----------~~~-~~~~~~~~~gd~s~~~i~~~~--~~~i~~~~~~~~~~~~~---~~~~~~~~~~ 272 (305) T protein:vir:25 211 FAGFRT--FFNRN----------GAW-DADAAIEVIADSSRVKIGVRQ--DITVKFLDQATLGTGEN---QINLAERDMV 272 (305) T ss_pred ccccce--EEcCc----------cCC-CCCccEEEEEecceEEEEEec--CeEEEEeeeeeeecCCc---eeeeeecCcE Confidence 455443 22222 111 122345677787765443332 22222221111100000 0001111344 Q ss_pred ccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 381 GGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 381 k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) .-+.+..+.+.+.||+|..+++++..+ +..||. T Consensus 273 ~~R~~~r~~~~v~~p~a~v~~~~~~~~-----~~~pa~ 305 (305) T protein:vir:25 273 ALRLKARFAYVLGVSATAQGANKTPVA-----VVAPAA 305 (305) T ss_pred EEEEEEeecceeeCcccEEEEcccccc-----ccCCCC Confidence 445667799999999999999999877 334444 No 15 >protein:vir:97148 Length: 324 # NCBI annotation: ORF010 # Family: family:all:507 # MgeID: mge:1654 # MgeName: 85 # Cross-refs: genbank:acc:YP_239726;genbank:gi:66394880;genbank:GeneID:5130881 Probab=97.03 E-value=5.9e-05 Score=43.78 Aligned_cols=318 Identities=12% Similarity=0.020 Sum_probs=134.1 Q ss_pred eeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEcc Q lcl|Aclame:pro 4 YAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVEN 83 (418) Q Consensus 4 ~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~ 83 (418) |+ .+++++.+ ++ .|..+...............+.+...|.. T Consensus 1 ~~-------~~~~~~~~----------------------~~----------~f~~~~~~~~~~~a~~~~~~~~~~~~iP~ 41 (324) T protein:vir:97 1 ME-------QTQKLKLN----------------------LQ----------HFASNNVKPQVFNPDNVMMHEKKDGTLMN 41 (324) T ss_pred Cc-------cchhHHHH----------------------HH----------HHHHhhhhhhhhccccccccCCCcceech Confidence 10 00111000 00 01111111111000000001111111110 Q ss_pred ccccccCceeEe----ccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccce Q lcl|Aclame:pro 84 SDGLTKGMIFYN----EATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNF 159 (418) Q Consensus 84 ~~~~~~~~~~~~----~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~ 159 (418) .+. ..|+.. ..-...+.+.-+++.++++-+-..... ..|. .||...+..... .++. T Consensus 42 --~~~-~~ii~~~~~~s~l~~~~~~~~~~~~~~~ip~~~~~~~-------a~~v------~Eg~~~~~~~~~----f~~v 101 (324) T protein:vir:97 42 --EFT-TPILQEVMENSKIMQLGKYEPMEGTEKKFTFWADKPG-------AYWV------GEGQKIETSKAT----WVNA 101 (324) T ss_pred --hHH-HHHHHHHHhhcchhhhcceeeccCCceEEEEEecCcc-------eeEe------ccCccccccccc----eeEE Confidence 000 011110 000111233334444444333221111 1222 366655433211 1222 Q ss_pred e-EEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCcc Q lcl|Aclame:pro 160 T-QIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVN 238 (418) Q Consensus 160 t-QIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~ 238 (418) + ..++=..-+.=|.+..... ..+-..+-...-...+.+.+|.++|+|.. .+.. -.||+.... ..+ T Consensus 102 ~~~~~k~~~~~~is~ell~ds-~~~l~~~i~~~l~~aia~~~d~a~l~G~g----~~~~----~~gi~~~~~---~~~-- 167 (324) T protein:vir:97 102 TMRAFKLGVILPVTKEFLNYT-YSQFFEEMKPMIAEAFYKKFDEAGILNQG----NNPF----GKSIAQSIE---KTN-- 167 (324) T ss_pred EEeeEEEEEeehhhHHHHhcc-hHHHHHHHHHHHHHHHHHHHHHHhhccCC----CCcc----Ccccccccc---ccc-- Confidence 2 1222222333344444332 23444555566667789999999998863 2212 234433221 111 Q ss_pred ccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEEEE Q lcl|Aclame:pro 239 AMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRLIL 318 (418) Q Consensus 239 ~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~v 318 (418) ....+.++.+++.++...+-...... ..+++++.....|.++....+++.+..... .+=+|. .| T Consensus 168 -~~~~~~~~~~~i~~~~~~l~~~~~~~-----~~~v~n~~~~~~L~~lkd~~g~~~~~~~~~---------~tl~G~-PV 231 (324) T protein:vir:97 168 -KVIKGDFTQDNIIDLEALLEDDELEA-----NAFISKTQNRSLLRKIVDPETKERIYDRNS---------DTLDGL-PV 231 (324) T ss_pred -eeccccCCHHHHHHHHHhhhhccCCC-----CEEEEcHHHHHHHHHhhcCCCceeecCCCC---------ccccce-ee Confidence 22335678999998887765433222 246788888888887755555544431110 011332 23 Q ss_pred EECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccc-cccCccccccEEEEEEEEEEecccc Q lcl|Aclame:pro 319 KEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYS-YGHGVDAQGGSLTSEWALELLNPQG 397 (418) Q Consensus 319 v~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~-~~~g~Da~k~~i~~E~tLev~N~kA 397 (418) +.++. ...+.+.+++.|++++-+..- .++..+.+............... ..--.|...-+....+...+++++| T Consensus 232 ~~~~~---~~~~~~~~~~gd~~~~~i~~~--~~~~i~~~~~~~~~~~~~~~~~~~~~f~~d~~~~r~~~r~d~~v~~~~a 306 (324) T protein:vir:97 232 VNLKS---SNLKRGELITGDFDKLIYGIP--QLIEYKIDETAQLSTVKNEDGTPVNLFEQDMVALRATMHVALHIADDKA 306 (324) T ss_pred EeecC---CCCCcceEEEEecccEEEEEe--cCcEEEEeecccccccccccccchhhhhcCcEEEEEEEEeccEEecccc Confidence 33332 234567788889988765554 33333333322210000000000 0001155556677888999999999 Q ss_pred eEEeecCcccccccCCCCC Q lcl|Aclame:pro 398 CAVITGLQKAKERVYLTAP 416 (418) Q Consensus 398 ~a~I~gL~~~~~~~~~~~~ 416 (418) +++|++..... +++|.+- T Consensus 307 ~~~l~~~~~~~-~~~~~~~ 324 (324) T protein:vir:97 307 FAKLVPADKKT-DSVPGEV 324 (324) T ss_pred eEEEEeccCCC-CCCCCCC Confidence 99999976664 2332222 No 16 >protein:vir:348 Length: 321 # NCBI annotation: major virion structural protein # Family: family:all:3198 # MgeID: mge:9 # MgeName: Mx8 # Cross-refs: genbank:acc:NP_203462;genbank:gi:15320618;genbank:GeneID:921734 Probab=97.00 E-value=5.8e-05 Score=43.81 Aligned_cols=296 Identities=11% Similarity=0.043 Sum_probs=142.0 Q ss_pred chhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccC----ceeEeccCceEEEEEEecCc Q lcl|Aclame:pro 35 APLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKG----MIFYNEATGENMRLELVNGL 110 (418) Q Consensus 35 ~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~----~~~~~~~~~E~~~Vtav~g~ 110 (418) -|+-+|+-+... + +...+....- .|.....+... -.+....+.+.|++.---.. T Consensus 1 mp~~~lsel~t~---t------l~~rs~~~~D-------------~v~~~n~LL~~L~~kG~~~~~~gg~~I~~~l~y~~ 58 (321) T protein:vir:34 1 MPFPNISDIITT---T------IESRSGVIAD-------------NVTKNNAILARLAKRGKPRLVSGGYTILEELSFSG 58 (321) T ss_pred CCCchHHHHHHH---H------HHhhcchhhh-------------hhhcccHHHHHHHhcCcccccCCCeeEEEEEeecc Confidence 333334444211 0 1111111000 11111111100 00011122222211111111 Q ss_pred eeEEEccccccchhhhhCCceEEEe-ecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhh--hcccchHHH Q lcl|Aclame:pro 111 NLTVKRQTGRISAAIIAANTKLIVI-GTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYA--EAGYSNITE 187 (418) Q Consensus 111 ~~tv~rg~~~tta~~~~~gt~v~~~-g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~--~g~~dela~ 187 (418) ..+-.+-++..+ .-+ -+.-.+.+.++ .+.-. -.+.|||+-+--+. +-..|.+.. T Consensus 59 ~s~~~wy~Gyd~----------l~~~p~d~~~~Aef~-----wk~aa--------~~~~isg~e~l~n~g~~~~idll~~ 115 (321) T protein:vir:34 59 NSNGGWYSGYDV----------LPTAPQDVISSAEYA-----LKQYA--------VPVVISGLEMLQNSGKEAQLDLLEA 115 (321) T ss_pred CcceeEEEeeee----------eccchhhhccccccc-----hhhee--------EeeEEehhHHhhccchHHHHHHHHH Confidence 111111111111 100 01111222222 11111 23455666553221 111234444 Q ss_pred HHHHHHHHHHHHHhHHHhc-CcccccCcCCccchhhHHHHHHHh----------------hccccCccccCCCCccchHH Q lcl|Aclame:pro 188 SRRDCMDFHATEQETAIFF-GQAFMGTYNGQPLHTTQGIVDAVR----------------QYAPDNVNAMPNPTAVTYDD 250 (418) Q Consensus 188 q~~kk~~EikrdmE~a~i~-G~k~~~~s~~~~~r~t~GI~~~i~----------------~~~~~nv~~~~~~a~~te~~ 250 (418) +++.+-+.++-.++..+-. |.. -. .+++.|+=..+. .++-+.+.. .++..|-.. T Consensus 116 ~~~~ae~t~~n~l~~~l~sdGTa------~g-~~~i~GL~~lv~~~p~tGtvGGIdra~~~~WRn~~~d--~~~~~t~~t 186 (321) T protein:vir:34 116 RMNVAEATMANDISAALYGDGTA------FG-GRAINGLDGAVPVDPTVGTYGGINRALWPFWRSQVED--MAAVATINT 186 (321) T ss_pred HHHHHHHHHHhhhhHhhhccccc------cc-cchhhhhhhhcccCCCCceeccccccchhhhhhhhhh--hhhcccHHH Confidence 4444444455555555543 221 00 133444322221 111112222 223467888 Q ss_pred HHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcc-cceeeceEEEEEEcCCeEEEEEECccccccCC Q lcl|Aclame:pro 251 VVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQ-RETSYGMVFTEWKFFKGRLILKEHPLFSAIGI 329 (418) Q Consensus 251 l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~-~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~m 329 (418) +..++.++|.+.. -++..+.+++++......-+..-. .-+ |+.. +.-..|+.==.|.+ +.||.++.+.. .| T Consensus 187 l~~~m~~~w~~~~-Rg~~~PDlii~~~~~y~~y~~s~q-~~q-R~~~~~~a~~Gf~~Lky~~----~div~D~~~g~-~~ 258 (321) T protein:vir:34 187 IQPAMTKLWSRCV-RGADMPDLIMSGNDAWTTYSNSLQ-VLQ-RFTSAEEANLGFRSLKFLS----TDVVLDGGIGG-FA 258 (321) T ss_pred HHHHHHHHHHhhc-cCCCCccEEEechHHHHHHHHhhh-eee-eecccccccccceeeeeee----EEEEEeCCCCC-Cc Confidence 9999999998865 355678899999988877766322 111 2222 22234543333444 89999998766 49 Q ss_pred CCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecC Q lcl|Aclame:pro 330 SPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGL 404 (418) Q Consensus 330 p~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL 404 (418) |++.++.+|.+|+++++-..|+|. ++.-.. ++ +++-|+.-..|..-+-|-|.|+.+|+++.+- T Consensus 259 pan~~yfiNT~yl~~r~h~~~~~~--pi~p~r---~~-------~~NqdA~~q~I~~~GnL~~sn~~~~~vL~~~ 321 (321) T protein:vir:34 259 GANTMYFLNTKYLHFRPHKDRNMV--PLSPSR---RA-------AFNQDAEAQILAWAGNLTCSGAQFQGRLIAE 321 (321) T ss_pred cccceeeeecceEEEEEcCCCcee--ecCccc---cc-------ccchhHHhhhhhhhheeeeecccceeEEeeC Confidence 999999999999999999888885 222111 11 2455898899999999999999999999887 No 17 >protein:vir:8187 Length: 311 # NCBI annotation: gp7 # Family: family:all:966 # MgeID: mge:153 # MgeName: Che9d # Cross-refs: genbank:acc:NP_817980;genbank:gi:29566414;genbank:GeneID:2700968 Probab=96.90 E-value=7.7e-05 Score=43.14 Aligned_cols=286 Identities=9% Similarity=-0.051 Sum_probs=118.7 Q ss_pred EEEeecCceEEEEccccccccCceeEeccCc---------eEEEEEEecCceeEEEccccccchhhhhCCceEEEeeccc Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAF 139 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~ 139 (418) +|...++ ++..+.-+..++-+ ....+.-+.+..+++-+-.++.. ..|. T Consensus 1 mat~~~g----------g~lvP~~~~~~ii~~~~~~s~i~~~~~~i~~~~~~~~~p~~~~~~~-------a~wv------ 57 (311) T protein:vir:81 1 MVALATG----------TFQLPKHLVPGVWQKAQGQSVLARLSMAEPQEFGEQQYMTLTAPPR-------GEVV------ 57 (311) T ss_pred CceecCC----------ceEcchhHHHHHHHHHHhcchhhhhcceeecCCCceEEEEEeCCce-------eEEe------ Confidence 2222222 22222111111111 11122233334444433222211 1222 Q ss_pred ccccCCcCcccccceeccceeEEEeee----eeechhHHHHhhhc--ccchHHHHHHHHHHHHHHHHhHHHhcCcccccC Q lcl|Aclame:pro 140 EEGSQRPTARSIQPVYVPNFTQIFRNA----WALTDTARASYAEA--GYSNITESRRDCMDFHATEQETAIFFGQAFMGT 213 (418) Q Consensus 140 ~EGada~~~~~~~~~~~~N~tQIf~~~----v~VSgTa~Av~~~g--~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~ 213 (418) .||.+.+.... .+.+|--+. .-+.-|.+..+... ..+-..+-..+-...|.+.+|.++++|... + T Consensus 58 ~Eg~~~~~~~~-------~f~~v~l~~~kl~~~~~iS~ell~~~~d~~~~l~~~i~~~la~ai~~~~d~a~l~G~~~--~ 128 (311) T protein:vir:81 58 GEGAQKSESTA-------TFAPVTAIPRKVQVTQRFSQEVKWADESRQLGVLQTMADLSGVALGRALDLIGIHGINP--L 128 (311) T ss_pred ecCcccccccc-------eeeEEEEeeEEEEEeehhhHHHhhcCcccHHHHHHHHHHHHHHHHHHHHHHhhhccccC--C Confidence 36766554321 123332222 22333344332111 112234444555667899999999999631 1 Q ss_pred cCCccchhhHHHHHHHhhccccCccccCCCCccc-hHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccce Q lcl|Aclame:pro 214 YNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVT-YDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGE 292 (418) Q Consensus 214 s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~t-e~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~ 292 (418) .+.. -.||...+.. ..+....+...... ..++.++...+-..+. +...++.++....+|.++.-.+++ T Consensus 129 ~~~~----~~gi~~~~~~--~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~-----~~~~~vmn~~~~~~l~~lkd~~G~ 197 (311) T protein:vir:81 129 TGAA----LSGSPAKILD--TTNIVELTTGTSATPDLAVEAAVGLVLGDNL-----SPDGVALDNTFSFMLATQRDSQGR 197 (311) T ss_pred CCcc----cccccccccc--cceeeeecccccchHHHHHHHHHHHhhhcCC-----CceEEEEcHHHHHHHHhhhccCCC Confidence 1111 2233222111 11221112222222 3334344333322222 223366788888889887545566 Q ss_pred EEEccc------ceeeceEEEEEEcCC--eEEEEEECc-cccccCCCCCeEEEEchhhceeeeccCCCcccccccccCcc Q lcl|Aclame:pro 293 VTVTQR------ETSYGMVFTEWKFFK--GRLILKEHP-LFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGE 363 (418) Q Consensus 293 ~~~~~~------~~~~G~~v~~~~Sdf--G~v~vv~n~-~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~ 363 (418) +.+... ..-+|.-| +.+++ +......+. .....+.+.+.+++.|.+.+-+.... ++..+-+.. +.. T Consensus 198 ~l~~~~~~~~~~~tl~G~Pv--~~~~~i~~~~~~~~~~~~~~~~~~~~~~~~~gDfs~~~i~~~~--~~~~~~~~~-~~~ 272 (311) T protein:vir:81 198 KLYPELGFGTDVASFAGLNA--AVSDTVRGGPEAVTASTGVYRTTNPNVKAIAGDFSAFRWGVQV--SIPLELIEF-GDP 272 (311) T ss_pred eeecCccccCCCceecceeE--EecccccccccccccccchhcccCCccEEEEEecccEEEEEec--cceEEEecc-CCC Confidence 544321 12223322 22221 000000000 00012234456788898887666552 222222111 100 Q ss_pred ccccccccccccCccccccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 364 NKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 364 ~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) +.. + + .-..|-...+....+...+++|+|..+|++-..| T Consensus 273 ~~~--~--~-~~~~~~v~~r~~~r~d~~v~~~~a~~~l~~a~~~ 311 (311) T protein:vir:81 273 DGL--G--D-LKRQNQIAIRAEVVYGIGIMSTDAFAVVRDADES 311 (311) T ss_pred Ccc--h--h-hhhcCcEEEEEEEEeccEeecccceEEEEeeccC Confidence 000 0 0 0001344455678899999999999999998888 No 18 >protein:vir:99749 Length: 324 # NCBI annotation: head protein # Family: family:all:507 # MgeID: mge:1497 # MgeName: phiETA2 # Cross-refs: genbank:acc:YP_001004307;genbank:gi:122891761;genbank:GeneID:4712304 Probab=96.88 E-value=9.6e-05 Score=42.60 Aligned_cols=314 Identities=11% Similarity=0.031 Sum_probs=134.2 Q ss_pred eEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEecc--------- Q lcl|Aclame:pro 27 LRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEA--------- 97 (418) Q Consensus 27 ~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~--------- 97 (418) |.+.-+ .+.....|-.+..+.... .+ ..+..+ .++.++.+..+. +++ T Consensus 1 ~~k~~~----------------~~~~~~~~~~~~~~~~~~--~a----~~~~~~-~~~~~lip~~~~-~~ii~~~~~~s~ 56 (324) T protein:vir:99 1 MEQTQK----------------LKLNLQHFASNNVKPQVF--NP----DNVMMH-EKKDGTLLNDFT-TPILQEVMENSK 56 (324) T ss_pred CCCchH----------------hhHHHHHHHHHhhhhhhc--cc----cceecc-CCCcceechhHH-HHHHHHHHhhch Confidence 111111 010011111111111110 00 000000 011111121111 111 Q ss_pred CceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHh Q lcl|Aclame:pro 98 TGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASY 177 (418) Q Consensus 98 ~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~ 177 (418) -...+.+..+.+.++++-+-..+.. ..|. .||...+.....- ..+. ...++-..-+.=|.+..+ T Consensus 57 l~~~~~~~~~~~~~~~~p~~~~~~~-------a~~v------~Eg~~~~~~~~~~-~~v~--~~~~k~~~~~~iS~ell~ 120 (324) T protein:vir:99 57 IMRLGKYEPMEGTEKKFTFWADKPG-------AYWV------GEGQKIETSKATW-VNAT--MRAFKLGVILPVTKEFLN 120 (324) T ss_pred hhhhcceeeccCCceEEEEEecCcc-------eeEe------ccCccccccccce-eEEE--EeeEEEEEeehhhHHHHh Confidence 1112334445555554443222111 1222 4776666443221 1111 112222223333344443 Q ss_pred hhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHH Q lcl|Aclame:pro 178 AEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATID 257 (418) Q Consensus 178 ~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~ 257 (418) .. ..+-..|-...-...+.+.+|.++|+|.- .+.. ..|+...+. .. .....+.++.+++.++... T Consensus 121 ds-~~~l~~~i~~~l~~ai~~~~d~~~l~G~g----~~~~----~~~~~~~~~---~~---~~~~~~~~~~~~i~~~~~~ 185 (324) T protein:vir:99 121 YT-YSQFFEEMKPMIAEAFYKKFDEAGILNQG----NNPF----GKSIAQSIE---KT---NKVIKGDFTQDNIIDLEAL 185 (324) T ss_pred cc-hHHHHHHHHHHHHHHHHHHHHHHhhhcCC----CCcc----Ccccccccc---cc---ceeccccCCHHHHHHHHHh Confidence 32 22344555566667789999999998753 1211 233332221 11 1123346888999998877 Q ss_pred HHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEE Q lcl|Aclame:pro 258 AFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVV 337 (418) Q Consensus 258 ~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~ 337 (418) +-...... ..+++++.....|.++....++..+..... .+=+| +.|+.++. ...+.+.+++. T Consensus 186 l~~~~~~~-----~~~v~n~~~~~~L~~l~d~~g~~~~~~~~~---------~~l~G-~PVv~~~~---~~~~~~~~i~g 247 (324) T protein:vir:99 186 LEDDELEA-----NAFISKTQNRSLLRKIVDPETKERIYDRNS---------DTLDG-LPVVNLKS---SNLKRGELITG 247 (324) T ss_pred hhhccCCC-----CEEEEcHHHHHHHHHhhcCCCceeecCCCC---------ccccc-eeEEeecC---CCCCcceEEEE Confidence 75433222 246788888888888754555544432110 11234 23344333 23355678888 Q ss_pred chhhceeeeccCCCcccccccccCccccccccccc-cccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCC Q lcl|Aclame:pro 338 DVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYS-YGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAP 416 (418) Q Consensus 338 D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~-~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~ 416 (418) |++++.+..-. ++..+................. ..-..|....+...-+...+.|++|..+|++..... +++|.+- T Consensus 248 d~~~~~~~~~~--~~~i~~~~~~~~~~~~~~~~~~~~~f~~~~~~~r~~~r~d~~v~~~~a~~~lt~a~~~~-~~~~~~~ 324 (324) T protein:vir:99 248 DFDKLIYGIPQ--LIEYKIDETAQLSTVKNEDGTPVNLFEQDMVALRATMHVALHIADDKAFAKLVPADKKT-DSVPGEV 324 (324) T ss_pred ecccEEEEEec--CcEEEEeecccccccccccccchhhhhcCcEEEEEEEEEccEEecccceEEEEeccCCC-CCCCCCC Confidence 99887655543 3333333322211000000000 000114455566677899999999999999865541 1111111 No 19 >protein:vir:103955 Length: 324 # NCBI annotation: head protein # Family: family:all:507 # MgeID: mge:1662 # MgeName: phiNM # Cross-refs: genbank:acc:YP_873992;genbank:gi:118430767;genbank:GeneID:4525449 Probab=96.72 E-value=0.00014 Score=41.70 Aligned_cols=312 Identities=11% Similarity=0.035 Sum_probs=133.8 Q ss_pred eEeecCCcchhHHHhhhccccceeeeeeeeeeee-cccceeEEEEEeecCceEEEEccccccccCceeEeccCc------ Q lcl|Aclame:pro 27 LRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKT-MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG------ 99 (418) Q Consensus 27 ~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~-~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~------ 99 (418) |.+.-+ .....+-|... ++... ..+ ..+..+ .++.++.+..+. +++-+ T Consensus 1 ~~~~~~-----------------~~~~~~~f~~~~~~~~~--~~a----~~~~~~-~~~~~liP~~~~-~~ii~~~~~~s 55 (324) T protein:vir:10 1 MEQTQK-----------------LKLNLQHFASNNVKPQV--FNP----DNVMMH-EKKDGTLLNDFT-TPILQEVMENS 55 (324) T ss_pred CCCchH-----------------HHHHHHHHHHHhhccce--ecc----cceecc-CCCcceechhHH-HHHHHHHHhhc Confidence 111100 00000101111 11110 000 000000 011112222211 11111 Q ss_pred ---eEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHH Q lcl|Aclame:pro 100 ---ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARAS 176 (418) Q Consensus 100 ---E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av 176 (418) ....+..+.+..+++-+-..+.. ..|. .||+..+..... ...+. ...++-..-+.=|.++. T Consensus 56 ~l~~~~~~~~~~~~~~~~p~~~~~~~-------a~~v------~Eg~~~~~~~~~-~~~v~--~~~~k~~~~~~iS~ell 119 (324) T protein:vir:10 56 KIMQLGKYEPMEGTEKKFTFWADKPG-------AYWV------GEGQKIETSKAT-WVNAT--MRAFKLGVILPVTKEFL 119 (324) T ss_pred hhhhhcceeeccCCceEEEEEeCCcc-------eeEe------ccCccccccccc-eeEEE--EeeEEEEEeehhhHHHH Confidence 11234444444444433221111 1222 377666543322 11111 12222233333444444 Q ss_pred hhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHH Q lcl|Aclame:pro 177 YAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATI 256 (418) Q Consensus 177 ~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~ 256 (418) +.. ..+-..|-...-...+.+.+|.++|+|.- .+.. ..|++..+. .. .....+.++.++|.+++. T Consensus 120 ~ds-~~~l~~~i~~~l~~ai~~~~d~a~l~G~g----~~~~----~~~i~~~~~---~~---~~~~~~~~t~~~i~~~~~ 184 (324) T protein:vir:10 120 NYT-YSQFFEEMKPMIAEAFYKKFDEAGILNQG----NNPF----GKSIAQSIE---KT---NKVIKGDFTQDNIIDLEA 184 (324) T ss_pred hcc-hHHHHHHHHHHHHHHHHHHHHHHhhhcCC----CCcc----Ccccccccc---cc---ceeccccCCHHHHHHHHH Confidence 432 22334555556667789999999998753 1212 234433221 11 112335788999999988 Q ss_pred HHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEE Q lcl|Aclame:pro 257 DAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVV 336 (418) Q Consensus 257 ~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv 336 (418) .+-......+ .+++++.....|.++....+++.+..... .+=+|. .|+.++. ...+.+.+++ T Consensus 185 ~l~~~~~~~~-----~~v~n~~~~~~L~~l~d~~g~~~~~~~~~---------~~l~G~-PV~~~~~---~~~~~~~~~~ 246 (324) T protein:vir:10 185 LLEDDELEAN-----AFISKTQNRSLLRKIVDPETKERIYDRNS---------DTLDGL-PVVNLKS---SNLKRGELIT 246 (324) T ss_pred hhhhccCCCC-----EEEEcHHHHHHHHHhhccCCceeecCCCC---------ccccce-eEEeecC---CCCCcceEEE Confidence 7765332222 36678888888888754555544332110 112332 3333332 3345677888 Q ss_pred EchhhceeeeccCCCcccccccccCcccccccccc-ccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCC Q lcl|Aclame:pro 337 VDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDY-SYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTA 415 (418) Q Consensus 337 ~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~-~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~ 415 (418) .|++.+.+..- +++..+.+.............. ...-..|....+...-+...+.+++|..+|++..... ++ . T Consensus 247 gd~~~~~~~~~--~~~~i~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r~~~r~d~~v~~~~A~~~l~~a~~~~-~~---~ 320 (324) T protein:vir:10 247 GDFDKLIYGIP--QLIEYKIDETAQLSTVKNEDGTPVNLFEQDMVALRATMHVALHIADDKAFAKLVPADKKT-DS---V 320 (324) T ss_pred EecccEEEEEe--cCcEEEEeecccccccccccccchhhhhcCcEEEEEEEEEccEEecccceEEEEeccCCC-CC---C Confidence 89988765554 3333333322211000000000 0000114555566778999999999999999865441 11 2 Q ss_pred CCC Q lcl|Aclame:pro 416 PAP 418 (418) Q Consensus 416 ~~~ 418 (418) |+. T Consensus 321 ~~~ 323 (324) T protein:vir:10 321 PGE 323 (324) T ss_pred CCC Confidence 222 No 20 >protein:vir:9759 Length: 303 # NCBI annotation: putative structural protein # Family: family:all:966 # MgeID: mge:175 # MgeName: 315.3 # Cross-refs: genbank:acc:NP_795521;genbank:gi:28876283;genbank:GeneID:1257824 Probab=96.42 E-value=0.00021 Score=40.79 Aligned_cols=284 Identities=11% Similarity=-0.001 Sum_probs=118.8 Q ss_pred EEEccccccccCceeEeccC---------ceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcc Q lcl|Aclame:pro 79 LTVENSDGLTKGMIFYNEAT---------GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTAR 149 (418) Q Consensus 79 ~tV~~~~~~~~~~~~~~~~~---------~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~ 149 (418) +-+.++.++..+.-+..++- .-...+.-+.+.++++-+-..+.. ..|+ .||+..+... T Consensus 1 m~t~t~gg~liP~~~~~~ii~~l~~~s~i~~l~~~~~~~~~~~~ip~~~~~~~-------a~wv------~E~~~~~~s~ 67 (303) T protein:vir:97 1 MGTETSKASLFDKHLVSDLINKVKGHSSLAKLSSQKPIPFNGSKEFTFTLDSD-------IDVV------AENGKKTHGG 67 (303) T ss_pred CcccCCCCeEcchhHHHHHHHHHHhhchhhhhcceeecCCCceEEEEEecCcc-------eEEe------ecCccccccc Confidence 12212222222221111110 011123334444444433222211 1232 3665544332 Q ss_pred cccceeccceeEEEeeeeeec----hhHHHHhhh--cccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhH Q lcl|Aclame:pro 150 SIQPVYVPNFTQIFRNAWALT----DTARASYAE--AGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQ 223 (418) Q Consensus 150 ~~~~~~~~N~tQIf~~~v~VS----gTa~Av~~~--g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~ 223 (418) . .+.||--+.-++. =|.+.+..- -..+-.++-..+-.+.+.+.+|.++|+|.....+.+..+.. .. T Consensus 68 ~-------~f~~v~l~~~kl~~~~~iS~ell~~~~d~~~~l~~~i~~~la~a~~~~ld~a~l~G~~~~~g~~~~~~~-~~ 139 (303) T protein:vir:97 68 L-------SLEPVTIVPIKVEYGARLSDEFLYATEEEKIDILKAFNEGFAKKLARGIDLMAMHGINPRTKKASDVIG-TN 139 (303) T ss_pred c-------ceeeEEeeeEEEEEeehhhHHHhhcCccchHHHHHHHHHHHHHHHHHHHHhhhhcccccCCcccccccc-cc Confidence 1 2333333333333 333332110 11122344455555667899999999997432222222111 11 Q ss_pred HHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeec Q lcl|Aclame:pro 224 GIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYG 303 (418) Q Consensus 224 GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G 303 (418) +... ..+++.. .+.+..+.+++.+++..+-..+... ..++.++....+|.++.-.++++.+...-. .| T Consensus 140 -~~~~----~~~~~~~-~~~~~~~~~~i~~~~~~~~~~~~~~-----~~~vmn~~~~~~L~~lkd~~g~~~~~~~~~-~~ 207 (303) T protein:vir:97 140 -HFDS----KVTQVVK-FTESEDADANIEAAVNLIQGAEGVV-----TGLAMDTEFSTALAKVTNGEMGPKMYPELA-WG 207 (303) T ss_pred -cccc----ccccccc-cccccchHHHHHHHHHHHhhcCCCc-----cEEEEcHHHHHHHHHhhccCCCeEEecCcc-CC Confidence 1000 0111111 1223456777888777665433222 236678888888887754455555433211 11 Q ss_pred eEEEEEEcCCeEEEEEECccccc---cCCCCCeEEEEchhhc-eeeeccCCCcccccccccCccccccccccccccCccc Q lcl|Aclame:pro 304 MVFTEWKFFKGRLILKEHPLFSA---IGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDA 379 (418) Q Consensus 304 ~~v~~~~SdfG~v~vv~n~~l~~---~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da 379 (418) .... +=+| +.++.++.+.. ...+.+.+++.|.+.. .+... ++...+-.. .+..+... ++ .-..|- T Consensus 208 ~~~~---~l~G-~Pv~~s~~v~~~~~~~~~~~~~~~Gdf~~~~~~~~~--~~~~~~~~~-~~~~d~~~-~~---~~~~n~ 276 (303) T protein:vir:97 208 ANPD---SING-LKSSVNTTVGAGADEAESKDLVIIGDFESMFKWGYA--KQIPMEIIK-YGDPDNSG-KD---LKGYNQ 276 (303) T ss_pred CCCc---eecc-eeeEEecccCCccccCCCccEEEEeeccccEEEEEe--cCcEEEEee-ccCCCCcc-hh---hhhcCc Confidence 1111 1224 45555544321 1122345677776432 23332 222222111 11000000 00 001133 Q ss_pred cccEEEEEEEEEEecccceEEeecCcc Q lcl|Aclame:pro 380 QGGSLTSEWALELLNPQGCAVITGLQK 406 (418) Q Consensus 380 ~k~~i~~E~tLev~N~kA~a~I~gL~~ 406 (418) ..-+....+...++||+|..+|++.+- T Consensus 277 ~~~r~~~r~~~~v~~p~af~~l~~~~~ 303 (303) T protein:vir:97 277 IYLRAEAYIGWGILDAKSFARVTKGEV 303 (303) T ss_pred EEEEEEEEeccEeecccceEEeeCCCC Confidence 344557788999999999999998877 No 21 >protein:vir:9309 Length: 324 # NCBI annotation: head protein # Family: family:all:507 # MgeID: mge:165 # MgeName: phi 11 # Cross-refs: genbank:acc:NP_803287;genbank:gi:29028597;genbank:GeneID:1258044 Probab=96.35 E-value=0.00021 Score=40.73 Aligned_cols=304 Identities=12% Similarity=0.040 Sum_probs=132.4 Q ss_pred eeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEc- Q lcl|Aclame:pro 4 YAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVE- 82 (418) Q Consensus 4 ~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~- 82 (418) |+..=....|.. .|....++...- .+ ..+ +.. T Consensus 1 ~~~~~~~~~~~~---------------------------------------~f~~~~~~~~~~--~a----~~~--~~~~ 33 (324) T protein:vir:93 1 MEQTQKLKLNLQ---------------------------------------HFASNNVKPQVF--NP----DNV--MMHE 33 (324) T ss_pred CchhHHHHHHHH---------------------------------------HHHHhhhhhhhc--cc----ccc--cccC Confidence 211111111111 111111111110 00 000 000 Q ss_pred cccccccCceeEeccC---------ceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccc Q lcl|Aclame:pro 83 NSDGLTKGMIFYNEAT---------GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQP 153 (418) Q Consensus 83 ~~~~~~~~~~~~~~~~---------~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~ 153 (418) ++.++.+..+. .++- ...+.+.-+.+..+++-+-..+.. ..|. .||.+.+.... T Consensus 34 ~~~~liP~~~~-~~ii~~~~~~s~l~~l~~~~~~~~~~~~ip~~~~~~~-------a~~v------~Eg~~~~~~~~--- 96 (324) T protein:vir:93 34 KKDGTLLNDFT-TPILQEVMENSKIMQLGKYEPMEGTEKKFTFWADKPG-------AYWV------GEGQKIETSKA--- 96 (324) T ss_pred CCcceechhHH-HHHHHHHHhhchhhhhcceeeccCCceEEEEEecCcc-------eeee------cCCcccccccc--- Confidence 01111121111 1110 111233344444444332211111 1222 47766654321 Q ss_pred eeccceeEEEeeeeeechh----HHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHH Q lcl|Aclame:pro 154 VYVPNFTQIFRNAWALTDT----ARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAV 229 (418) Q Consensus 154 ~~~~N~tQIf~~~v~VSgT----a~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i 229 (418) .+.+|--+.-.+.+. .+..... ..+-..+-...-.+.+.+.+|.++|+|.- .+.. ..|++..+ T Consensus 97 ----~f~~i~~~~~k~~~~~~iS~ell~ds-~~~l~~~i~~~l~~aia~~~d~a~l~G~g----~~~~----~~~~~~~~ 163 (324) T protein:vir:93 97 ----TWVNATMRAFKLGVILPVTKEFLNYT-YSQFFEEMKPMIAEAFYKKFDEAGILNQG----NNPF----GKSIAQSI 163 (324) T ss_pred ----ceeEEEEEeEEEEEeehhhHHHHhcc-hHHHHHHHHHHHHHHHHHHHHHHHhcCCC----CCCc----Cccccccc Confidence 233443333333333 3333321 12323344444456789999999998853 2212 23343222 Q ss_pred hhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc--ceeeceEEE Q lcl|Aclame:pro 230 RQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR--ETSYGMVFT 307 (418) Q Consensus 230 ~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~--~~~~G~~v~ 307 (418) . ..+ ....+..+.+++.++...+-...... ..+++++.....|.++...+|++.+... .+-+|. T Consensus 164 ~---~~~---~~~~~~~~~~~i~~~~~~l~~~~~~~-----~~~v~n~~~~~~L~~l~d~~G~~~~~~~~~~~l~G~--- 229 (324) T protein:vir:93 164 E---KTN---KVIKGDFTQDNIIDLEALLEDDELEA-----NAFISKTQNRSLLRKIVDPETKERIYDRNSDSLDGL--- 229 (324) T ss_pred c---ccc---eeccccccHHHHHHHHHhhhhccCCC-----CEEEEcHHHHHHHHHhhCCCCCeeecCCCCCcccce--- Confidence 1 111 12234678899998888776543222 2477898888888887555565544321 112232 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccc-cccCccccccEEEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYS-YGHGVDAQGGSLTS 386 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~-~~~g~Da~k~~i~~ 386 (418) .|+.++. ..++.+.+++.|++++.+..- .++..+.+............... ..--.|...-+... T Consensus 230 ---------PVv~~~~---~~~~~~~i~~gdfs~~~~~~~--~~~~i~~~~~~~~~~~~~~~~~~~~~f~~n~~~~r~~~ 295 (324) T protein:vir:93 230 ---------PVVNLKS---SNLKRGELITGDFDKLIYGIP--QLIEYKIDETAQLSTVKNEDGTPVNLFEQDMVALRATM 295 (324) T ss_pred ---------eeEeecC---CCCCcceEEEEecceEEEEEe--cCcEEEEeecccccccccccccchhhhhcCcEEEEEEE Confidence 2333322 234667888899888755444 33333333332211110000000 00011556667788 Q ss_pred EEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 387 EWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 387 E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) -+.+.+.+++|..+|++-... +.+.| T Consensus 296 r~d~~v~~~~a~~~l~~a~~~------~~~~~ 321 (324) T protein:vir:93 296 HVALHIADDKAFAKLVPADKR------TDSVP 321 (324) T ss_pred EeccEEecccceEEEeccccc------CCCCC Confidence 999999999999999865443 22233 No 22 >protein:vir:2344 Length: 397 # NCBI annotation: gp14 # Family: family:all:507 # MgeID: mge:51 # MgeName: Bxb1 # Cross-refs: genbank:acc:NP_075281;genbank:gi:12657868;genbank:GeneID:920118 Probab=96.16 E-value=0.00079 Score=37.60 Aligned_cols=302 Identities=12% Similarity=0.006 Sum_probs=131.5 Q ss_pred cccceeEEEEEeecCceEEEEccccccccCceeEeccCc---------eEEEEEEecCceeEEEccccccchhhhhCCce Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLTVKRQTGRISAAIIAANTK 131 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~ 131 (418) |-+.-.......+.. .+..++.+..+.. .+-+ .+..+..+.+..+++-+-..++. .. T Consensus 1 ~g~~~e~~~~~~~~t------~~~~g~l~~~~~~-~ii~~l~~~s~i~~l~~~~~~~~~~~~ip~~~~~~~-------a~ 66 (397) T protein:vir:23 1 MGFSADHSQIAQTKD------TMFTGYLDPVQAK-DYFAEAEKTSIVQRVAQKIPMGATGIVIPHWTGDVS-------AQ 66 (397) T ss_pred CCcCHHHHHHhhccC------CCCccccchhHHH-HHHHHHHhccchhhhcceeeccCCceEEEEEcCCcc-------eE Confidence 111111100000000 0001112211111 1111 11223344444444433322211 12 Q ss_pred EEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccc Q lcl|Aclame:pro 132 LIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFM 211 (418) Q Consensus 132 v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~ 211 (418) |+ .||...+... +. .-..-..+++-...+.-|.+..+.. ..+-..+-.++-.+.+.+.+|.++|+|... T Consensus 67 wv------~Eg~~~~~s~--~~-f~~v~l~~~k~~~~v~iS~ell~ds-~~~l~~~i~~~l~~aia~~~d~a~l~G~gt- 135 (397) T protein:vir:23 67 WI------GEGDMKPITK--GN-MTKRDVHPAKIATIFVASAETVRAN-PANYLGTMRTKVATAIAMAFDNAALHGTNA- 135 (397) T ss_pred Ee------cCCccccccc--cc-eeEEEEeeEEEEEeehhhHHHHhcc-hHHHHHHHHHHHHHHHHHHHHHHHhhcccC- Confidence 22 3665554432 11 1111233344444455555555432 234456666677777899999999987641 Q ss_pred cCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccc Q lcl|Aclame:pro 212 GTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFG 291 (418) Q Consensus 212 ~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~ 291 (418) ... ..|+... .+. ..........+++.++..++....... ..+++++.....|.++...++ T Consensus 136 ---~~~----~~~~~~~------~~~-~~~~~~~~~~~~~~~~~~~l~~~~~~~-----a~~vmn~~~~~~L~~lkd~~G 196 (397) T protein:vir:23 136 ---PSA----FQGYLDQ------SNK-TQSISPNAYQGLGVSGLTKLVTDGKKW-----THTLLDDTVEPVLNGSVDANG 196 (397) T ss_pred ---Ccc----ccccccc------ccc-eeeecccchhHHHHHHHHhhhhcccCC-----CEEEEcHHHHHHHHHhhccCC Confidence 111 2222211 111 111233556777778777777544322 347788888888888755555 Q ss_pred eEEEcccceeeceEEEEEE-cCCeEEEEEECccccccCCCCCeE--EEEchhhceeeeccCCCcccccccccCccccccc Q lcl|Aclame:pro 292 EVTVTQRETSYGMVFTEWK-FFKGRLILKEHPLFSAIGISPGFA--VVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGA 368 (418) Q Consensus 292 ~~~~~~~~~~~G~~v~~~~-SdfG~v~vv~n~~l~~~~mp~d~~--lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~ 368 (418) ++-+.... ..+....... +=+| +.++.++ +||+++. ++-|...+-+..- ++...+.+.......-. T Consensus 197 ~~i~~~~~-~~~~~~~~~~~tl~G-~Pv~~s~-----~~~~g~~~~~~gDfs~~~i~~~--~~i~i~~~~e~~~~~~~-- 265 (397) T protein:vir:23 197 RPLFVEST-YESLTTPFREGRILG-RPTILSD-----HVAEGDVVGYAGDFSQIIWGQV--GGLSFDVTDQATLNLGS-- 265 (397) T ss_pred ceeecccc-cccccccccCceeee-eeEEEeC-----CCCCCceEEEEeecceEEEEEE--eceEEEEeeeeeeeecc-- Confidence 54433221 1111110000 0012 1334433 3566554 3346665433332 22333322222110000 Q ss_pred ccccccc----CccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 369 TDYSYGH----GVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 369 ~~~~~~~----g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) +....+ -.|-...+....+...+++++|..++..-......+++.+|+. T Consensus 266 -~~~~~~~~lf~~d~v~~ra~~r~d~~v~~~~a~~~~~~~~~~~~~~~~~~~~~ 318 (397) T protein:vir:23 266 -QESPNFVSLWQHNLVAVRVEAEYGLLINDVNAFVKLTFDPVLTTYALDLDGAS 318 (397) T ss_pred -ccccceeeeeeccceeEEEEeeeccceecccceEEEeeccccceeeecccccC Confidence 000000 0133445566788999999999999997655555555555444 No 23 >protein:vir:104085 Length: 320 # NCBI annotation: gp17 # Family: family:all:507 # MgeID: mge:1656 # MgeName: Che12 # Cross-refs: genbank:acc:YP_655596;genbank:gi:109392467;genbank:GeneID:4156953 Probab=96.04 E-value=0.00039 Score=39.29 Aligned_cols=298 Identities=10% Similarity=0.018 Sum_probs=120.5 Q ss_pred cccceeEEEEEeecCceEEEEc---cccccccCceeEeccCc---------eEEEEEEecCceeEEEccccccchhhhhC Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVE---NSDGLTKGMIFYNEATG---------ENMRLELVNGLNLTVKRQTGRISAAIIAA 128 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~---~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~tv~rg~~~tta~~~~~ 128 (418) |.-. .+...+...+... ++.++.+..+. .++-+ ....+.-+.+..+++-+-..+. T Consensus 1 ~~~~-----~~~~~~~~~~~~t~~~~~~~~ip~~~~-~~ii~~~~~~s~l~~~~~~~~~~~~~~~~p~~~~~~------- 67 (320) T protein:vir:10 1 MAAG-----TAFQVDHAQIAQTGDTMFKGYLEPEQA-KDYFAEAEKTSIVQQFAQKVPMGTTGQKIPHWIGDV------- 67 (320) T ss_pred CCCC-----ccCCHHHHHhhccccccccccccHHHH-HHHHHHHHhccchhhhcceeeccCCceEEEEEeCCc------- Confidence 1000 0000001111111 11112222211 11111 1112223334444433221111 Q ss_pred CceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCc Q lcl|Aclame:pro 129 NTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQ 208 (418) Q Consensus 129 gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~ 208 (418) ...|. .||++.|..... .. ..-..+++-...+.-|.++.+... .+-.++-..+-.+.+.+.+|.++|+|. T Consensus 68 ~a~~v------~E~~~~~~~~~~-f~--~v~~~~~k~~~~~~is~ell~ds~-~~l~~~i~~~l~~a~a~~~d~a~l~G~ 137 (320) T protein:vir:10 68 SAQWI------GEGDMKPITKGN-MT--SQNIAPHKIATIFVASAETVRANP-ANYLGTMRTKVATAFAMAFDSAALNGT 137 (320) T ss_pred ceEEe------cCCccccccccc-ee--EEEEeeEEEEEeehhhHHHHhcCh-HHHHHHHHHHHHHHHHHHHHHHhhccc Confidence 11221 377666543321 11 122344455555556666665322 344455566666888999999999887 Q ss_pred ccccCcCCccchhhHHHHHHHhhccccCcccc--CCCCccc--hHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHH Q lcl|Aclame:pro 209 AFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAM--PNPTAVT--YDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQ 284 (418) Q Consensus 209 k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~--~~~a~~t--e~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~ 284 (418) ... .+.. ..|+... .+.... ...+.++ ++.+.++...+... +.....+++++.....|. T Consensus 138 g~~-----~~~~-~~~~~~~------~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~-----~~~~~~~v~n~~~~~~L~ 200 (320) T protein:vir:10 138 DSP-----FPTY-LAQTTKS------VSLADPGGATASDLTAYDAVAVNGLSLLVNA-----KKKWTHTLLDDIVEPILN 200 (320) T ss_pred CCC-----CCcc-ccccccc------ccceecccccccccccHHHHHHHHHhhhhcc-----cCCCcEEEEcHHHHHHHH Confidence 521 1101 1111110 011000 0111111 12233333333322 222336788999999998 Q ss_pred hhhhccceEEEcccceeeceEEEEEEcCCeE---EEEEECccccccCCCCCe--EEEEchhhceeeeccCCCcccccccc Q lcl|Aclame:pro 285 DIGRFFGEVTVTQRETSYGMVFTEWKFFKGR---LILKEHPLFSAIGISPGF--AVVVDVPAVKLAYMDGRNAKVENYGQ 359 (418) Q Consensus 285 ~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~---v~vv~n~~l~~~~mp~d~--~lv~D~~~~~~~~L~~r~~~~e~laK 359 (418) ++....+++.+.......+. ..+ ..++ +.+++++ +||+++ +++.|++++-+..- .++..+.+.. T Consensus 201 ~lkd~~G~~l~~~~~~~~~~--~~~--~~~~i~g~pv~~~~-----~~~~~~~~~~~gd~~~~~~~~~--~~~~i~~~~~ 269 (320) T protein:vir:10 201 GAKDKNGRPLFIESTYTDEN--SPF--RAGRIVSRPTILSD-----HVADGTTVGYMGDFRNVIWGQV--GGLSFDVTDQ 269 (320) T ss_pred HhhccCCceeeccccccCcc--ccc--cCceeeeeeeEecC-----CCCCCceEEEEeecceEEEEEe--cCeEEEEeec Confidence 87655555444321111000 000 1122 2445553 356665 34568776644333 2232222222 Q ss_pred cCcccccccccccc-ccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCC Q lcl|Aclame:pro 360 GGGENKSGATDYSY-GHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPA 417 (418) Q Consensus 360 tG~~~~~~~~~~~~-~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~ 417 (418) ....+......... .-..|....+...-+.+.+.+|+|.++|++.. | ||| T Consensus 270 ~~~~~~~~~~~~~~~~f~~~~~~~r~~~~~d~~v~~~~a~~~l~~~~-a-------p~~ 320 (320) T protein:vir:10 270 ATLNLGTPTEPNFVSLWQHNLVAVRVEAEYAFHNNDKDAFVKLTNVV-T-------PDA 320 (320) T ss_pred ceeeeccccccccchhhhcCcEEEEEEEeeccEEecccceEEEEecc-C-------CCC Confidence 11100000000000 00013444566678899999999999998654 2 223 No 24 >protein:vir:96392 Length: 324 # NCBI annotation: ORF011 # Family: family:all:507 # MgeID: mge:1613 # MgeName: 53 # Cross-refs: genbank:acc:YP_239648;genbank:gi:66395381;genbank:GeneID:5132868 Probab=96.01 E-value=0.0008 Score=37.55 Aligned_cols=310 Identities=11% Similarity=0.005 Sum_probs=131.3 Q ss_pred ccccceeeeee-eeeeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCc---------eEEEEEEecCceeE Q lcl|Aclame:pro 44 VGSTTAKASTH-GYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLT 113 (418) Q Consensus 44 ~~~~~~~~~~~-~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~t 113 (418) ..+..-..... .|..+..+............+.. ..+.+..+. ..+-+ ..+.+..+.+.+++ T Consensus 1 ~~~~~~~~~~~~~~~~~~~~~~~~~a~~~~~~~~~-------~~~iP~~~~-~~ii~~~~~~s~l~~l~~~~~~~~~~~~ 72 (324) T protein:vir:96 1 MEQTQKLKLNLQHFASNNVKPQVFNPDNVMMHEKK-------DGTLMNEFT-TPILQEVMENSKIMQLGKYEPMEGTEKK 72 (324) T ss_pred CCcchhhhHHHHHHHHHhhhhhhhccccccccCcC-------ccccchhHH-HHHHHHHHhhchhhhhcceeeccCCceE Confidence 01111111111 11111111100000000001111 111111111 11111 11233344444444 Q ss_pred EEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccce-eEEEeeeeeechhHHHHhhhcccchHHHHHHHH Q lcl|Aclame:pro 114 VKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNF-TQIFRNAWALTDTARASYAEAGYSNITESRRDC 192 (418) Q Consensus 114 v~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~-tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk 192 (418) +-+-..+. ...|. .||+..+..... +++. ...++-..-+.-|.+..+.. ..+...+-...- T Consensus 73 ~p~~~~~~-------~a~~v------~Eg~~~~~~~~~----~~~v~~~~~k~~~~~~is~ell~ds-~~~l~~~i~~~l 134 (324) T protein:vir:96 73 FTFWADKP-------GAYWV------GEGQKIETSKAT----WVNATMRAFKLGVILPVTKEFLNYT-YSQFFEEMKPMI 134 (324) T ss_pred EEEEecCc-------ceeEe------cCCccccccccc----eeEEEEeeEEEEEeehhhHHHHhcc-hHHHHHHHHHHH Confidence 33221111 11222 477666543321 1111 12222223333344444332 223334445555 Q ss_pred HHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEE Q lcl|Aclame:pro 193 MDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRV 272 (418) Q Consensus 193 ~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~ 272 (418) .+.+.+.+|.++|+|.- .+.. -.||..... .......+..+.+++.++...+-...... .. T Consensus 135 a~ai~~~~d~a~l~G~g----~~~~----~~gi~~~~~------~~~~~~~~~~t~~~i~~~~~~l~~~~~~~-----~~ 195 (324) T protein:vir:96 135 AEAFYKKFDEAGILNQG----NNPF----GKSIAQSIE------KTNKVIKGDFTQDNIIDLEALLEDDELEA-----NA 195 (324) T ss_pred HHHHHHHHHHHHhccCC----CCCc----Ccccccccc------ccceeccccccHHHHHHHHHhhhhccCCC-----CE Confidence 67889999999998853 1212 234432211 11122335678999999887775533222 24 Q ss_pred EEeChHHHHHHHhhhhccceEEEccc--ceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC Q lcl|Aclame:pro 273 MFCDTVGMRTMQDIGRFFGEVTVTQR--ETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR 350 (418) Q Consensus 273 i~v~a~~k~~i~~~~~~~~~~~~~~~--~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r 350 (418) +++++.....|.++....+++.+... ..-+|. .|+.++. ..++.+.+++.|++++-+..- . T Consensus 196 ~vmn~~~~~~L~~l~d~~G~~~~~~~~~~~l~G~------------PV~~~~~---~~~~~~~~~~gd~~~~~~g~~--~ 258 (324) T protein:vir:96 196 FISKTQNRSLLRKIVDPETKERIYDRNSDSLDGL------------PVVNLKS---SNLKRGELITGDFDKLIYGIP--Q 258 (324) T ss_pred EEEcHHHHHHHHHhhccCCCeeecCCCCCcccce------------eeEeeCC---CCCCcceEEEEecceEEEEEe--c Confidence 67888878888887555555544321 112222 2333322 335667888889887655443 2 Q ss_pred CcccccccccCccccccccccc-cccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCC Q lcl|Aclame:pro 351 NAKVENYGQGGGENKSGATDYS-YGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAP 416 (418) Q Consensus 351 ~~~~e~laKtG~~~~~~~~~~~-~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~ 416 (418) ++..+.+............... ..-..|....+...-+...+++|+|.++|++.....+-.| -+- T Consensus 259 ~~~i~~~~~~~~~~~~~~~~~~~~~f~~d~~~~r~~~r~d~~v~~~~A~~~l~~a~~~~~~~~-~~~ 324 (324) T protein:vir:96 259 LIEYKIDETAQLSTVKNEDGTPVNLFEQDMVALRATMHVALHIADDKAFAKLVPADKRTDSVP-GEV 324 (324) T ss_pred CcEEEEeecccccccccccccchhhhhcCcEEEEEEEEEccEEecccceEEEecccccCCCCC-CCC Confidence 3333333222110000000000 0001145555667788999999999999988655422111 111 No 25 >protein:vir:78830 Length: 324 # NCBI annotation: major head protein # Family: family:all:507 # MgeID: mge:1858 # MgeName: 80alpha # Cross-refs: genbank:acc:YP_001285361;genbank:gi:148717889;genbank:GeneID:5246961 Probab=96.01 E-value=0.0008 Score=37.55 Aligned_cols=310 Identities=11% Similarity=0.005 Sum_probs=131.3 Q ss_pred ccccceeeeee-eeeeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCc---------eEEEEEEecCceeE Q lcl|Aclame:pro 44 VGSTTAKASTH-GYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLT 113 (418) Q Consensus 44 ~~~~~~~~~~~-~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~t 113 (418) ..+..-..... .|..+..+............+.. ..+.+..+. ..+-+ ..+.+..+.+.+++ T Consensus 1 ~~~~~~~~~~~~~~~~~~~~~~~~~a~~~~~~~~~-------~~~iP~~~~-~~ii~~~~~~s~l~~l~~~~~~~~~~~~ 72 (324) T protein:vir:78 1 MEQTQKLKLNLQHFASNNVKPQVFNPDNVMMHEKK-------DGTLMNEFT-TPILQEVMENSKIMQLGKYEPMEGTEKK 72 (324) T ss_pred CCcchhhhHHHHHHHHHhhhhhhhccccccccCcC-------ccccchhHH-HHHHHHHHhhchhhhhcceeeccCCceE Confidence 01111111111 11111111100000000001111 111111111 11111 11233344444444 Q ss_pred EEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccce-eEEEeeeeeechhHHHHhhhcccchHHHHHHHH Q lcl|Aclame:pro 114 VKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNF-TQIFRNAWALTDTARASYAEAGYSNITESRRDC 192 (418) Q Consensus 114 v~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~-tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk 192 (418) +-+-..+. ...|. .||+..+..... +++. ...++-..-+.-|.+..+.. ..+...+-...- T Consensus 73 ~p~~~~~~-------~a~~v------~Eg~~~~~~~~~----~~~v~~~~~k~~~~~~is~ell~ds-~~~l~~~i~~~l 134 (324) T protein:vir:78 73 FTFWADKP-------GAYWV------GEGQKIETSKAT----WVNATMRAFKLGVILPVTKEFLNYT-YSQFFEEMKPMI 134 (324) T ss_pred EEEEecCc-------ceeEe------cCCccccccccc----eeEEEEeeEEEEEeehhhHHHHhcc-hHHHHHHHHHHH Confidence 33221111 11222 477666543321 1111 12222223333344444332 223334445555 Q ss_pred HHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEE Q lcl|Aclame:pro 193 MDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRV 272 (418) Q Consensus 193 ~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~ 272 (418) .+.+.+.+|.++|+|.- .+.. -.||..... .......+..+.+++.++...+-...... .. T Consensus 135 a~ai~~~~d~a~l~G~g----~~~~----~~gi~~~~~------~~~~~~~~~~t~~~i~~~~~~l~~~~~~~-----~~ 195 (324) T protein:vir:78 135 AEAFYKKFDEAGILNQG----NNPF----GKSIAQSIE------KTNKVIKGDFTQDNIIDLEALLEDDELEA-----NA 195 (324) T ss_pred HHHHHHHHHHHHhccCC----CCCc----Ccccccccc------ccceeccccccHHHHHHHHHhhhhccCCC-----CE Confidence 67889999999998853 1212 234432211 11122335678999999887775533222 24 Q ss_pred EEeChHHHHHHHhhhhccceEEEccc--ceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC Q lcl|Aclame:pro 273 MFCDTVGMRTMQDIGRFFGEVTVTQR--ETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR 350 (418) Q Consensus 273 i~v~a~~k~~i~~~~~~~~~~~~~~~--~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r 350 (418) +++++.....|.++....+++.+... ..-+|. .|+.++. ..++.+.+++.|++++-+..- . T Consensus 196 ~vmn~~~~~~L~~l~d~~G~~~~~~~~~~~l~G~------------PV~~~~~---~~~~~~~~~~gd~~~~~~g~~--~ 258 (324) T protein:vir:78 196 FISKTQNRSLLRKIVDPETKERIYDRNSDSLDGL------------PVVNLKS---SNLKRGELITGDFDKLIYGIP--Q 258 (324) T ss_pred EEEcHHHHHHHHHhhccCCCeeecCCCCCcccce------------eeEeeCC---CCCCcceEEEEecceEEEEEe--c Confidence 67888878888887555555544321 112222 2333322 335667888889887655443 2 Q ss_pred CcccccccccCccccccccccc-cccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCC Q lcl|Aclame:pro 351 NAKVENYGQGGGENKSGATDYS-YGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAP 416 (418) Q Consensus 351 ~~~~e~laKtG~~~~~~~~~~~-~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~ 416 (418) ++..+.+............... ..-..|....+...-+...+++|+|.++|++.....+-.| -+- T Consensus 259 ~~~i~~~~~~~~~~~~~~~~~~~~~f~~d~~~~r~~~r~d~~v~~~~A~~~l~~a~~~~~~~~-~~~ 324 (324) T protein:vir:78 259 LIEYKIDETAQLSTVKNEDGTPVNLFEQDMVALRATMHVALHIADDKAFAKLVPADKRTDSVP-GEV 324 (324) T ss_pred CcEEEEeecccccccccccccchhhhhcCcEEEEEEEEEccEEecccceEEEecccccCCCCC-CCC Confidence 3333333222110000000000 0001145555667788999999999999988655422111 111 No 26 >protein:vir:94771 Length: 298 # NCBI annotation: major head protein # Family: family:all:966 # MgeID: mge:1529 # MgeName: phi LC3 # Cross-refs: genbank:acc:NP_996706;genbank:gi:45597421;genbank:GeneID:2769044 Probab=95.97 E-value=0.0012 Score=36.65 Aligned_cols=281 Identities=10% Similarity=-0.016 Sum_probs=118.2 Q ss_pred EEEccccccccCceeEeccCc---------eEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcc Q lcl|Aclame:pro 79 LTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTAR 149 (418) Q Consensus 79 ~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~ 149 (418) +++.. +...+.-+..++-+ -...+..+.+..+++-+-..+.. ..|+ .||.+.+... T Consensus 1 ma~~g--G~lip~~~~~~ii~~~~~~s~i~~~~~~~~~~~~~~~~p~~~~~~~-------a~~v------~Eg~~~~~~~ 65 (298) T protein:vir:94 1 MVLNK--GTLFDPELVTDLISKVAGKSSIARLSAQKPIPFNGEKVFTFTMDSE-------IDVV------AESGKKTHGG 65 (298) T ss_pred Ceecc--ccccChhHHHHHHHHHHhhchhhhhcceeeccCCceEEEEEecCcc-------eEEe------eCCccccccc Confidence 23321 11111111111100 11122333333344333222211 1222 3666555332 Q ss_pred cccceeccceeEEEee----eeeechhHHHHhhh--cccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhH Q lcl|Aclame:pro 150 SIQPVYVPNFTQIFRN----AWALTDTARASYAE--AGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQ 223 (418) Q Consensus 150 ~~~~~~~~N~tQIf~~----~v~VSgTa~Av~~~--g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~ 223 (418) .. +.||--+ ...+.=|.+..... -..+-..+-..+-...|.+.+|.++|+|...-.+.+... . T Consensus 66 ~~-------f~~v~l~~~k~~~~~~iS~ell~~~~~~~~~l~~~i~~~la~ai~~~~d~~~l~G~~~~~g~~~~~----~ 134 (298) T protein:vir:94 66 VT-------LAPQTMVPIKVEYGARISDEFMYASDEEKINILQAFNDGFAKKVARGIDLMAFHGVNPRLGTASAV----I 134 (298) T ss_pred cc-------eeEEEEeeeEEEEeeehhHHHhccCCccHHHHHHHHHHHHHHHHHHHHHHHhhcccccCCCccccc----c Confidence 11 2222222 22233334433211 112233445556667789999999999864222111111 1 Q ss_pred HHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeec Q lcl|Aclame:pro 224 GIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYG 303 (418) Q Consensus 224 GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G 303 (418) |+...... ..+....+.......+++.++..++-.... ....+++++.....|.++...+|++-+...... | T Consensus 135 ~~~~~~~~--~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~-----~~~~~vmn~~~~~~l~~lkd~~G~~l~~~~~~~-~ 206 (298) T protein:vir:94 135 GTNHFDSK--VTQKVEAPRGIADPNGAIENAVELLTGVDA-----DVTGIAINPSFRSALAKQKDLQGNALFPELKWG-A 206 (298) T ss_pred cccccccc--cccccccccccccHHHHHHHHHHhhhhcCC-----CccEEEEcHHHHHHHHHhhccCCCeeecCcccC-C Confidence 11111110 111222222223345566666665543322 223578898888888887555565544321110 0 Q ss_pred eEEEEEEcCCeEEEEEECcccc-ccCCCCCeEEEEchhhce-eeeccCCCcccccccccCccccccccccccccCccccc Q lcl|Aclame:pro 304 MVFTEWKFFKGRLILKEHPLFS-AIGISPGFAVVVDVPAVK-LAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQG 381 (418) Q Consensus 304 ~~v~~~~SdfG~v~vv~n~~l~-~~~mp~d~~lv~D~~~~~-~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k 381 (418) . . .+=+| +.|+.++.+. ..+.+.+.+|+-|.+.+- +..- .+...+-.. .+..+.... + .--.|... T Consensus 207 ~-~---~tl~G-~PV~~~~~v~~~~~~~~~~~~~Gdfs~~~~~~~~--~~~~~~~~~-~~~~d~~~~---~-~f~~~~v~ 274 (298) T protein:vir:94 207 T-P---DTING-LPVDVNKTVSDMSLTQRDRAIIGDFANGFKWGYA--KEVPLEVIQ-YGDPDNSGL---D-LKGYNQVY 274 (298) T ss_pred C-C---ceecc-eeeEEecccccccCCCccEEEEeeccceEEEEEe--cCceEEEee-cCCCcCcch---h-hhhcCcEE Confidence 0 0 01123 2444444332 223455678888987642 2222 222222211 110000000 0 00013333 Q ss_pred cEEEEEEEEEEecccceEEeecCc Q lcl|Aclame:pro 382 GSLTSEWALELLNPQGCAVITGLQ 405 (418) Q Consensus 382 ~~i~~E~tLev~N~kA~a~I~gL~ 405 (418) .+....+.+.+++|+|..+|++-. T Consensus 275 ~r~~~r~~~~~~~~~a~~~l~~~t 298 (298) T protein:vir:94 275 IRAELFLGWGILDATKFARVTEAN 298 (298) T ss_pred EEEEEEeccEeecccceEEEEecC Confidence 455677889999999999999988 No 27 >protein:vir:3158 Length: 321 # NCBI annotation: capsid protein gpE # Family: family:all:1377 # ACLAME annotation(s): phi:0000161 - phage head/capsid # MgeID: mge:316 # MgeName: PhiCh1 # Cross-refs: genbank:acc:NP_665929;genbank:gi:22091115;genbank:GeneID:951342 Probab=95.85 E-value=0.00083 Score=37.48 Aligned_cols=308 Identities=10% Similarity=0.013 Sum_probs=122.6 Q ss_pred eeeeeeeeecccc--eeEEEEEeecCceEEEEc--cccccccCceeEeccCceEEEEEEecCceeEEEc-cccccchhhh Q lcl|Aclame:pro 52 STHGYFSKTMVFA--SAVVTAEAAADATVLTVE--NSDGLTKGMIFYNEATGENMRLELVNGLNLTVKR-QTGRISAAII 126 (418) Q Consensus 52 ~~~~~~~~~~~~~--~~t~~a~~~a~~t~~tV~--~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~r-g~~~tta~~~ 126 (418) |.-+.|.+++... ...++.+..+.. ++|. -...+... +.....-.-.+.|.-+...+..+.+ +.++... T Consensus 1 ~~~k~~~~~l~~~~~~~~~~~~~~~~g--~~v~~~~~~~l~~~-i~e~s~~l~~i~v~~v~~~~~~i~~~~~~~~~~--- 74 (321) T protein:vir:31 1 MASRTINNDLSRITEKNALTVDDLDAG--GTLPDPLWDEFWTD-MIEETPLLDAIRTETVGAKKTRIPTLNIGERHR--- 74 (321) T ss_pred CchHHHHHHHHHHHHhccccccccCCc--ceeCHHHHHHHHHH-HHHhhhhhhhceeeeccCcceeeeeeccCCccc--- Confidence 2222333322111 011111111111 1121 00111100 0000000001122223222211111 1111110 Q ss_pred hCCceEEEeecccccccCCcCcccccceeccce---eEEEeeeeeechhHHHHhhhc-ccchHHHHHHHHHHHHHHHHhH Q lcl|Aclame:pro 127 AANTKLIVIGTAFEEGSQRPTARSIQPVYVPNF---TQIFRNAWALTDTARASYAEA-GYSNITESRRDCMDFHATEQET 202 (418) Q Consensus 127 ~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~---tQIf~~~v~VSgTa~Av~~~g-~~dela~q~~kk~~EikrdmE~ 202 (418) +. ..||.... ....+ .++.. |.-..--+.|| .+...... ..+--++-..+-.+.+.+|++. T Consensus 75 ~~----------~~e~~~~~-~~~~~--~~~~~~~~~~k~~~~~~it--~e~L~d~a~~~d~e~~i~~~ia~~~a~~~~~ 139 (321) T protein:vir:31 75 RP----------QDEGEWNE-NESDV--STGTIDISTEKATVAWDLP--REVVQENPEGEALADRILNLMTDAWSADVED 139 (321) T ss_pred cc----------cccccccc-ccccc--eeeeeeeeeEEEEeehhcc--HHHHHhhhcchhHHHHHHHHHHHHHHHHHHh Confidence 00 11221111 11111 01111 11111122232 23332221 2343344455555678999999 Q ss_pred HHhcCcccccCcCCcc-chhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHH Q lcl|Aclame:pro 203 AIFFGQAFMGTYNGQP-LHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMR 281 (418) Q Consensus 203 a~i~G~k~~~~s~~~~-~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~ 281 (418) ++++|... +.++ ...-.|++..++.... ....++..++.+.+.++...+=.. .-+..+ -+++++.+... T Consensus 140 ~~~nGd~~----~~~~~~~~n~G~l~~a~~~~~---~~~~~~~~~~~d~l~~l~~~l~~~--yr~~~~-~v~im~~~~~~ 209 (321) T protein:vir:31 140 LAANGDED----AEDSFENQNDGFITVAEGDVE---TIDAADDILDNDLVIRTIAGLDSK--YRARMN-PALIVSEDQLL 209 (321) T ss_pred heeecccc----CCCcccccchhhhhhhccccc---cccccccccCHHHHHHHHHhccHh--HhcCCC-eEEEechHHHH Confidence 99999642 1111 1234576654432211 122244567888888877654211 111112 24678877665 Q ss_pred HHHh-hhhccceEEEcccceeeceEE--EEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCccccccc Q lcl|Aclame:pro 282 TMQD-IGRFFGEVTVTQRETSYGMVF--TEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYG 358 (418) Q Consensus 282 ~i~~-~~~~~~~~~~~~~~~~~G~~v--~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~la 358 (418) .+-+ +....+. .+...+ ....+ ++=+.++..|+ ||++.+++.|+.++.+.+- ++...+.+. T Consensus 210 ~~~~~l~~~~~~--------~~~~~l~~~~~~t-l~G~pvv~~~~-----mP~~~il~t~~~nl~~~~~--~~~~~~~~~ 273 (321) T protein:vir:31 210 SYHYTLTDRDTP--------LGDNVIMGEADVN-PFSFPIIGSGL-----WPDDKAMFTDPQNLIYALY--RDLEIDVLT 273 (321) T ss_pred HHHHHHhcCCCc--------cccchhhcccccc-ccceeEEEcCC-----CCCCcEEEeccccEEEEEe--eccEEEEee Confidence 5433 2211111 111111 01123 33456677665 6889999999999976655 333333332 Q ss_pred ccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCC Q lcl|Aclame:pro 359 QGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAP 416 (418) Q Consensus 359 KtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~ 416 (418) ..... . ...+..-.-+..-+.-.+.++.|+++|+|++-..+.+-+++- T Consensus 274 ~~~~~---~-------~~~~~~~~~~~~~~~~~ve~~~a~a~~~~i~~~~~~~~~~~~ 321 (321) T protein:vir:31 274 ESDKV---S-------ERDLHARYFMRGDDDFAIENTEAVVLAEGLGDPLEHLEEETS 321 (321) T ss_pred cCccc---c-------ccceeeEeeeeeecceeEeccccEEEEecCCcchhcccCCCC Confidence 22100 0 000111112344566778899999999999765554433322 No 28 >protein:vir:96223 Length: 324 # NCBI annotation: ORF011 # Family: family:all:507 # MgeID: mge:1607 # MgeName: 69 # Cross-refs: genbank:acc:YP_239571;genbank:gi:66395304;genbank:GeneID:5132771 Probab=95.79 E-value=0.0008 Score=37.56 Aligned_cols=310 Identities=12% Similarity=0.044 Sum_probs=129.8 Q ss_pred eEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCc------- Q lcl|Aclame:pro 27 LRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG------- 99 (418) Q Consensus 27 ~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~------- 99 (418) |.+. .+.+.....|..+..+.... .+ .+...-.++.++.+..+. .++-+ T Consensus 1 ~~~~----------------~~~~~~~~~f~~~~~~~~~~--~a-----~~~~~~~~~~~lip~~~~-~~ii~~~~~~s~ 56 (324) T protein:vir:96 1 MEQT----------------QKLKLNLQHFASNNVKPQVF--NP-----DNVMMHEKKDGTLLNDFT-TPILQEVMENSK 56 (324) T ss_pred CCcc----------------hhhhHHHHHHHHhhhhhhhc--cc-----ccccccCCCcceechhHH-HHHHHHHHhhch Confidence 1111 00111111121111111110 00 000000011112222211 11111 Q ss_pred --eEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecccee-EEEeeeeeechhHHHH Q lcl|Aclame:pro 100 --ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFT-QIFRNAWALTDTARAS 176 (418) Q Consensus 100 --E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~t-QIf~~~v~VSgTa~Av 176 (418) ..+.+..+.+..+++-+-..+ + ...|. .||...+..... +++.+ -+++-..-+.=|.+.. T Consensus 57 l~~l~~~~~~~~~~~~~p~~~~~--~-----~a~~v------~Eg~~~~~~~~~----f~~v~~~~~k~~~~~~is~ell 119 (324) T protein:vir:96 57 IMQLGKYEPMEGTEKKFTFWADK--P-----GAYWV------GEGQKIETSKAT----WVNATMRAFKLGVILPVTKEFL 119 (324) T ss_pred hhhhcceeeccCCceEEEEEecC--c-----ceeee------cCCccccccccc----eeEEEEEeEEEEEeehhhHHHH Confidence 112333444444433221111 1 11222 477666543321 12221 1122222222233333 Q ss_pred hhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHH Q lcl|Aclame:pro 177 YAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATI 256 (418) Q Consensus 177 ~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~ 256 (418) ... ..+-..+-...-.+.+.+.+|.++|+|.- .+..+ .|+...+. .......+.++.+++.++.. T Consensus 120 ~ds-~~~l~~~i~~~l~~aia~~~d~~~l~G~g----~~~~~----~~~~~~~~------~~~~~~~~~~~~~~i~~~~~ 184 (324) T protein:vir:96 120 NYT-YSQFFEEMKPMIAEAFYKKFDEAGILNQG----NNPFG----KSIAQSIK------KTNKVIKGDFTQDNIIDLEA 184 (324) T ss_pred hcc-hHHHHHHHHHHHHHHHHHHHHHHhhhcCC----CCCcC----cccccccc------ccceecccccchHHHHHHHH Confidence 321 22333444555556689999999998853 12121 23332211 11112334678899999888 Q ss_pred HHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcc--cceeeceEEEEEEcCCeEEEEEECccccccCCCCCeE Q lcl|Aclame:pro 257 DAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQ--RETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFA 334 (418) Q Consensus 257 ~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~--~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~ 334 (418) ++-...... ..+++++.....|.++...++++.+.. ...-+|+- |+.++. ..++.+.+ T Consensus 185 ~i~~~~~~~-----~~~i~n~~~~~~L~~lkd~~G~~~~~~~~~~~l~G~P------------V~~~~~---~~~~~~~~ 244 (324) T protein:vir:96 185 LLEDDELEA-----NAFISKTQNRSLLRKIVDPETKERIYDRNSDSLDGLP------------VVNLKS---SNLKRGEL 244 (324) T ss_pred hhhhccCCC-----CEEEEcHHHHHHHHHhhCCCCCeeecCCCCCccccee------------eEeecC---CCCCcceE Confidence 775533222 247788888888888755556544431 11222322 232322 33566778 Q ss_pred EEEchhhceeeeccCCCcccccccccCccccccccccc-cccCccccccEEEEEEEEEEecccceEEeecCcccccccCC Q lcl|Aclame:pro 335 VVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYS-YGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYL 413 (418) Q Consensus 335 lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~-~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~ 413 (418) ++.|++++.+..- .++..+.+...+........... ..-..|....+...-+.+.+++++|..+|++-...-.- T Consensus 245 ~~gd~s~~~~~~~--~~~~i~~~~~~~~~~~~~~~~~~~~~~~~n~v~~r~~~r~d~~v~~~~a~~~l~~a~~~~~~--- 319 (324) T protein:vir:96 245 ITGDFDKLIYGIP--QLIEYKIDETAQLSTVKNEDGTPVNLFEQDMVALRATMHVALHIADDKAFAKLVPADKRTDS--- 319 (324) T ss_pred EEEecceEEEEEe--cCcEEEEeecccccccccccccchhhhhcCcEEEEEEEEeccEEecccceEEEecccccCCC--- Confidence 8899988765544 23333333222210000000000 00011445556678889999999999998866544211 Q ss_pred CCCCC Q lcl|Aclame:pro 414 TAPAP 418 (418) Q Consensus 414 ~~~~~ 418 (418) .|-. T Consensus 320 -~~~~ 323 (324) T protein:vir:96 320 -VPGE 323 (324) T ss_pred -CCCC Confidence 1111 No 29 >protein:vir:4159 Length: 315 # NCBI annotation: structural protein # Family: family:all:1377 # ACLAME annotation(s): phi:0000161 - phage head/capsid # MgeID: mge:87 # MgeName: psiM2 # Cross-refs: genbank:acc:NP_046968;genbank:gi:9630538;genbank:GeneID:1261712 Probab=95.37 E-value=0.0022 Score=35.16 Aligned_cols=299 Identities=11% Similarity=0.008 Sum_probs=116.5 Q ss_pred cccceeEEEEEeecCceEEEEccccc-cccCceeEecc---Cc--eEEE---E-EEecCceeEEEccccccchhhhhCCc Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDG-LTKGMIFYNEA---TG--ENMR---L-ELVNGLNLTVKRQTGRISAAIIAANT 130 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~-~~~~~~~~~~~---~~--E~~~---V-tav~g~~~tv~rg~~~tta~~~~~gt 130 (418) |-......--.....-..+++.+..+ +.++.....-+ .+ .++. | +...+.+..+.+ +..|. T Consensus 1 ~~~~~~~~~~~~~~~~k~~t~~d~~Gg~l~P~~~~~~i~~~~e~s~~l~~~~vi~~~~~~~~~i~~---------~g~~~ 71 (315) T protein:vir:41 1 MLTIEDIRGGKPFEIVPKIDVPDLGRGVLSVDRFGEFVKAVRDSAVIIPEARIDNALKSYEKDISR---------LSLVL 71 (315) T ss_pred CcccchhhcCChhhhhhhcCCcCCCCceechHHHHHHHHHHHhhhhhhhhceeeeccccccccccc---------cccCc Confidence 10000000000000011233333332 22222221101 00 1111 1 111111111110 00111 Q ss_pred eEEEeecccccccCCcCcccccceeccc--eeEEEeeeeeechhHHHHhhh-cccchHHHHHHHHHHHHHHHHhHHHhcC Q lcl|Aclame:pro 131 KLIVIGTAFEEGSQRPTARSIQPVYVPN--FTQIFRNAWALTDTARASYAE-AGYSNITESRRDCMDFHATEQETAIFFG 207 (418) Q Consensus 131 ~v~~~g~a~~EGada~~~~~~~~~~~~N--~tQIf~~~v~VSgTa~Av~~~-g~~dela~q~~kk~~EikrdmE~a~i~G 207 (418) .+.. .....|...+..+..|.. -.+ .|.-+.--+.| |++...-. -+.+--++-..+-.+++.+++|.+|++| T Consensus 72 ~~~~--g~~~~~~~~~~~~~~~~f-~~~~l~~~~l~~~~~i--t~elL~D~~~~~~~e~~l~~~~a~~~a~~~~~~~~nG 146 (315) T protein:vir:41 72 DVGP--GRDETGQKLAPPESTAEV-KTNTLYMREMVTKVVI--HEDAIEDNIEGKAFEQKIVTLLGEGISYVLEKYYLHG 146 (315) T ss_pred cccc--ccccccCcCCCCCCcccc-ceeeeceeeeeeeccc--cHHHHHhhhccccHHHHHHHHHHHHHHHHHHHHhhcc Confidence 1110 011112222222222211 111 12222222333 34444322 1234345555566778999999999999 Q ss_pred cccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHH---HHhcccCCCceeEEEEeChHHHHHHH Q lcl|Aclame:pro 208 QAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDA---FKWSVNVGDNTQRVMFCDTVGMRTMQ 284 (418) Q Consensus 208 ~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~---~~~g~~~~g~~~~~i~v~a~~k~~i~ 284 (418) ... ++.+...+-.|++..+....... ........++.+.|.++++.+ |.+ ++.+. .++++.....++. T Consensus 147 dg~---s~~p~~~~~~G~l~~a~~~~~~~-~~~~~a~~~~~d~l~~l~~sl~~~yr~----~~~~~-~~imn~~t~~~~r 217 (315) T protein:vir:41 147 DTS---SSDPLLRMSDGWLKLASEKLTES-DVDPEAEDWPMNLFDTMIESLPTPYRN----NLPNM-KFYVTWDIYRAYR 217 (315) T ss_pred CCc---CcCccccccccceeccccccccc-ccccccccccHHHHHHHHHhcChHHhh----cCCce-EEEEcHHHHHHHH Confidence 531 11111234567664332211111 111222345677777777643 322 12222 3556766667777 Q ss_pred hhhhccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccc Q lcl|Aclame:pro 285 DIGRFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGEN 364 (418) Q Consensus 285 ~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~ 364 (418) ++-...+++-... .-..|. -.+=+| +.|+..|.|...++|++.+++-|+.++.+..- |++..++....-. . T Consensus 218 klk~~~g~~lw~~-~~~~g~----~~tl~G-~PV~~~~~m~~~~~~~~~ilf~d~~nl~~~~~--~~i~i~~~~~a~~-~ 288 (315) T protein:vir:41 218 DALKGRETGLGDQ-ALTGAN----SILYDG-RPVQYVPALEALNDGKSRALFVVPTQLVYGFW--RNIKVVPDYDAEM-R 288 (315) T ss_pred HHhccCCCccccc-hhhcCC----Cceecc-cceEecccccccCCCCccEEEecccceEEEec--cccEEEeeecCCC-C Confidence 7643233221110 000011 112234 45567777877888999999999998755433 5555544332210 0 Q ss_pred cccccccccccCccccccEEEEEEEEEEecccceEEeec Q lcl|Aclame:pro 365 KSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITG 403 (418) Q Consensus 365 ~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~g 403 (418) +. ...-....-+.+.+.|-.+.++|.= T Consensus 289 ~~------------~~~~~~r~d~~~~~~~~~a~~~~~v 315 (315) T protein:vir:41 289 LT------------KYVASLRTDNHYEDEEGAVSATITV 315 (315) T ss_pred ce------------EEEEEEEeceeEEeccceeEeeeeC Confidence 01 0111123345556666544544433 No 30 >protein:vir:2430 Length: 318 # NCBI annotation: major head subunit # Family: family:all:507 # MgeID: mge:52 # MgeName: D29 # Cross-refs: genbank:acc:NP_046832;genbank:gi:9630400;genbank:GeneID:1261582 Probab=95.26 E-value=0.0024 Score=34.93 Aligned_cols=301 Identities=10% Similarity=0.023 Sum_probs=120.1 Q ss_pred hhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeE--------eccCceEEEEEEecCcee Q lcl|Aclame:pro 41 TSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFY--------NEATGENMRLELVNGLNL 112 (418) Q Consensus 41 ~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~--------~~~~~E~~~Vtav~g~~~ 112 (418) .+-|. . +.+....+...-+ .++.++.+..+.. ..+-.....+..+.+..+ T Consensus 1 ~~~~~------~--------~~~e~~~~~~~~~--------~~~~~~ip~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~ 58 (318) T protein:vir:24 1 MAAGT------A--------FAVDHAQIAQTGD--------TMFKGYLEPEQAKDYFAEAEKTSIVQQFAQKVPMGTTGQ 58 (318) T ss_pred CCCCC------C--------CCHHHHHhhcccC--------cccceeechhHHHHHHHHHHhhchhhhhcceeeccCCce Confidence 01110 0 0000000000000 0111111111100 000011123334444444 Q ss_pred EEEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeee----eeechhHHHHhhhcccchHHHH Q lcl|Aclame:pro 113 TVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNA----WALTDTARASYAEAGYSNITES 188 (418) Q Consensus 113 tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~----v~VSgTa~Av~~~g~~dela~q 188 (418) ++-+-..+..+ .|. .||...+.... .+.||--+. ..+.-|.+.... ...+-..+- T Consensus 59 ~ip~~~~~~~a-------~~v------~Eg~~~~~~~~-------~f~~i~~~~~k~~~~~~iS~e~l~d-s~~~~~~~i 117 (318) T protein:vir:24 59 KIPHWVGDVSA-------QWI------GEGDMKPITKG-------NMTSQTIAPHKIATIFVASAETVRA-NPANYLGTM 117 (318) T ss_pred EEEEEeCCcce-------EEe------cCCcccccccc-------ceeEEEEeeEEEEEeehhhHHHhhc-ChHHHHHHH Confidence 44433322111 222 25555443221 233332222 222334444432 223444555 Q ss_pred HHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCc Q lcl|Aclame:pro 189 RRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDN 268 (418) Q Consensus 189 ~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~ 268 (418) ...-...+.+.+|.++|+|... + .+ .|++..... .......+......+++.++...+..... T Consensus 118 ~~~l~~~~~~~~d~a~l~G~g~----~-~~----~~~~~~~~~---~~~~~~~~~~~~~~~~~~~~~~~~~~~~~----- 180 (318) T protein:vir:24 118 RTKVATAFAMAFDGAAMHGTDS----P-FP----TYIGQTTKA---ISIADTTGATTVYDQVAVNGLSLLVNDGK----- 180 (318) T ss_pred HHHHHHHHHHHHHHhhhcccCC----C-CC----ccccccccc---ccccccccccchHHHHHHHHHHhhccccC----- Confidence 5666667899999999998742 1 11 122211110 01111112223344445555555543221 Q ss_pred eeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEE--cCCeEEEEEECccccccCCCCC--eEEEEchhhcee Q lcl|Aclame:pro 269 TQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWK--FFKGRLILKEHPLFSAIGISPG--FAVVVDVPAVKL 344 (418) Q Consensus 269 ~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~--SdfG~v~vv~n~~l~~~~mp~d--~~lv~D~~~~~~ 344 (418) ....+++++.....|.++...++++.+.......+ ...+. .-+| +.++..+. +|.+ .+++.|++.+.+ T Consensus 181 ~~~~~v~n~~~~~~L~~lkd~~G~~l~~~~~~~~~--~~~~~~~~i~g-~pv~~~~~-----~~~~~~~~~~gdfs~~~~ 252 (318) T protein:vir:24 181 KWTHTLLDDITEPILNGAKDQNGRPLFIESTYGEA--ASPFRSGRIVA-RPTILSDH-----VVEGTTVGFMGDFSQLIW 252 (318) T ss_pred CCCEEEEcHHHHHHHHHhhccCCceeecCccccCc--cccccCceEEE-EeeEEeCC-----CCCCccEEEEeecceEEE Confidence 12247789888888888755555554432211111 11110 1112 24444443 3444 346668877654 Q ss_pred eeccCCCcccccccccCcccccccccc-ccccCccccccEEEEEEEEEEecccceEEeecCccccccc Q lcl|Aclame:pro 345 AYMDGRNAKVENYGQGGGENKSGATDY-SYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERV 411 (418) Q Consensus 345 ~~L~~r~~~~e~laKtG~~~~~~~~~~-~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~ 411 (418) ..- .+...+.....+.......... ...-..|...-+...-+...+++|+|.++|++..-+--+- T Consensus 253 ~~~--~~l~i~~~~~~~~~~~~~~~~~~~~~f~~~~~~~r~~~r~d~~v~~~~a~~~i~~~~a~~~~~ 318 (318) T protein:vir:24 253 GQI--GGLSFDVTDQATLNLGTVESPNFVSLWQHNLVAVRVEAEYAFHCNDAEAFVALTNVVSGGGEG 318 (318) T ss_pred EEe--cCeEEEEeeccceeccccccccchhhhhcCcEEEEEEEEEccEEecccceEEEEeeccCCCCC Confidence 433 2333333322221100000000 0000013444566788999999999999999874441111 No 31 >protein:vir:9574 Length: 300 # NCBI annotation: gp40 # Family: family:all:966 # MgeID: mge:171 # MgeName: SM1 # Cross-refs: genbank:acc:NP_862879;genbank:gi:32469471;genbank:GeneID:1461316 Probab=95.25 E-value=0.0024 Score=34.91 Aligned_cols=287 Identities=11% Similarity=0.022 Sum_probs=116.2 Q ss_pred EEEeecCceEEEEccccccccCceeEeccCce-E----EEEEEecCceeEEEccccccchhhhhCCceEEEeeccccccc Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEATGE-N----MRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGS 143 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E-~----~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGa 143 (418) +|..+.+...+ |.. + +.. .|+.. ..++ . ..+.-+.+..+++-+-..+ ....|+ .||. T Consensus 1 ma~~t~~~G~l-ip~-~-~~~-~ii~~-l~~~s~i~~l~~~~~~~~~~~~~p~~~~~-------~~a~wv------~Eg~ 62 (300) T protein:vir:95 1 MSEAQLSKGNL-FNP-E-LVT-KVINK-VKGHSSIAKLSPQKPIPFNGQREFVFDFD-------SDIDIV------AENG 62 (300) T ss_pred CcccccCCcce-ech-h-hHH-HHHHH-HHhhhhhhhhcceeeccCCceEEEEEecC-------cceEEe------eCCc Confidence 33222222221 110 0 000 01100 0000 0 1122222232332221111 112232 3665 Q ss_pred CCcCcccccceeccceeEEEeeeeee----chhHHHHhh--hcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCc Q lcl|Aclame:pro 144 QRPTARSIQPVYVPNFTQIFRNAWAL----TDTARASYA--EAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQ 217 (418) Q Consensus 144 da~~~~~~~~~~~~N~tQIf~~~v~V----SgTa~Av~~--~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~ 217 (418) +.+.... -+.||--+.-.+ .=|.+..+. ....+-..+-..+-.+.+.+.+|.++|+|.....+.+.. T Consensus 63 ~~~~s~~-------~f~~v~l~~~k~~~~~~iS~ell~~~~d~~~~l~~~i~~~l~~aia~~~d~~~l~G~~~~~g~~~~ 135 (300) T protein:vir:95 63 KKTHGGV-------SLDPVTIVPLKVEYGARVSDEFLHASEEAKVDMLTDFVEGFSKKLARGLDIMSIHGINPRTKQAST 135 (300) T ss_pred ccccccc-------cceeeEeeeEEEEEeehhhHHHhccCCCCHHHHHHHHHHHHHHHHHHHHHHhhhhcccCCCCCCcc Confidence 5543221 122322222222 222222211 112232333444456778999999999996433333322 Q ss_pred cchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcc Q lcl|Aclame:pro 218 PLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQ 297 (418) Q Consensus 218 ~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~ 297 (418) +.. .... ..............+.+++.++..++-..+.. ...++.++....+|.++...+|++.+.. T Consensus 136 ~~~----~~~~----~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~-----~~~~vmn~~~~~~L~~lkd~~G~~i~~~ 202 (300) T protein:vir:95 136 IIG----DNCF----DKKVTQTVPFKDTNPDESMEDAVGMIDGSERD-----ITGAILDPIFTTALSKMKNAEGGKLYPE 202 (300) T ss_pred ccc----cccc----ccccceeecccccchHHHHHHHHHHhhhcCCC-----ccEEEECHHHHHHHHHhhccCCCeeccC Confidence 211 1110 01111222233455667777777666433322 2246678888888988865666655432 Q ss_pred cceeeceEEEEEEcCCeEEEEEECccccc-cCCCCCeEEEEchhhc-eeeeccCCCcccccccccCcccccccccccccc Q lcl|Aclame:pro 298 RETSYGMVFTEWKFFKGRLILKEHPLFSA-IGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGGGENKSGATDYSYGH 375 (418) Q Consensus 298 ~~~~~G~~v~~~~SdfG~v~vv~n~~l~~-~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~ 375 (418) .... | . .-+=+| +.++.++.++. ..++.+.+|+-|.+.. .+..-.+-.+...+.+..-+... + .- T Consensus 203 ~~~~-~-~---~~~l~G-~Pv~~s~~v~~~~~~~~~~~~~GDf~~~~~~~~~~~~~~~v~~~~~~d~~~~------~-~f 269 (300) T protein:vir:95 203 LAWG-G-V---PDAING-LAVDKNRTVSYSQTDPKNTAIVGDFETMFKWGYAKEVPMEIIKYGDPDNSGR------D-LK 269 (300) T ss_pred cccc-C-C---Cceecc-eeeEEecCCCCCCCCCccEEEEeeccceEEEEEecccEEEEeeccCCCCcch------h-hh Confidence 1110 0 0 001123 13333333211 1233445677787643 22222222222111110000000 0 00 Q ss_pred CccccccEEEEEEEEEEecccceEEeecCcc Q lcl|Aclame:pro 376 GVDAQGGSLTSEWALELLNPQGCAVITGLQK 406 (418) Q Consensus 376 g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~ 406 (418) -.|-...+....+.+.+++|+|..+|++-.= T Consensus 270 ~~~~v~~r~~~r~d~~v~~~~a~~~l~~~~g 300 (300) T protein:vir:95 270 GYNQIYIRCEAYIGWGIMDAASFARIVKTGG 300 (300) T ss_pred hcCcEEEEEEEeecceeecccceEEEecCCC Confidence 0133444667789999999999999987744 No 32 >protein:vir:4339 Length: 395 # NCBI annotation: major head protein # Family: family:all:585 # MgeID: mge:93 # MgeName: D3 # Cross-refs: genbank:acc:NP_061502;genbank:gi:9635591;genbank:GeneID:1262860 Probab=94.91 E-value=0.0032 Score=34.25 Aligned_cols=320 Identities=10% Similarity=0.037 Sum_probs=117.6 Q ss_pred CcceeeeeccCCCh---hhhhhhh-----cccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEe Q lcl|Aclame:pro 1 MSVYAGIFNTTLNP---QELNMKS-----FAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEA 72 (418) Q Consensus 1 ~~~~~~~~~~~~~~---~~~~~~s-----~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~ 72 (418) +......-.....+ .+..+++ +...+.. .......-..++.. ...-+.+ +.++ . T Consensus 68 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~-~~~~~~~~~~~~~~-------~~~~g~~---vp~~-------~ 129 (395) T protein:vir:43 68 MLANEKRDGGEEAPKTAGQMVAESLKEQGVTSSLRG-SHRVSMPRSAITSI-------DGSGGAL---VAPD-------R 129 (395) T ss_pred HHhhhccccccchhhhHHHHHHHHHHHHHHHHHhhh-hhhhhhhhhhhccc-------CCCCccc---cchh-------h Confidence 00000000000000 0111111 1111100 00000000001000 0000100 0000 0 Q ss_pred ecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCccccc Q lcl|Aclame:pro 73 AADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQ 152 (418) Q Consensus 73 ~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~ 152 (418) ...--+ .+.....+. ..+.+..+.+..++.-+-..+.. . ..|. .||...+..... T Consensus 130 ~~~ii~-~~~~~~~l~-----------~l~~~~~~~~~~~~~~~~~~~~~-~-----a~~v------~E~~~~~~~~~~- 184 (395) T protein:vir:43 130 RPGVVA-APQRRLTIR-----------DLVAPGTTESNSVEYVRETGFVN-N-----AAPV------SEGTQKPYSDLT- 184 (395) T ss_pred HHHHHH-HHHhhhhHH-----------hhccceecCCCceEEEEEecCCC-c-----eeee------cCCccccccccc- Confidence 000000 000000000 00011111222222222111110 0 0111 355554433211 Q ss_pred ceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhc Q lcl|Aclame:pro 153 PVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQY 232 (418) Q Consensus 153 ~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~ 232 (418) ...+ ...+++-..-+.-|.+..+.. .+-.++-...-...+.+.+|.++|+|.. .+.. ..||+...... T Consensus 185 ~~~i--~~~~~k~~~~~~is~ell~d~--~~l~~~v~~~la~a~~~~~d~~~l~G~g----~~~~----~~Gi~~~~~~~ 252 (395) T protein:vir:43 185 FELE--NAPVRTIAHLFKASRQILDDA--SALQSYIDARARYGLMLVEECQLLYGNG----TGAN----LHGIIPQAQAY 252 (395) T ss_pred eeEE--EEeeeeEEEeehhhHHHHHhH--HHHHHHHHHHHHHHHHHHHHHHHHhccC----CCCc----ccccccccccc Confidence 1112 222223333333344444432 2333444555556779999999998842 2222 34565322110 Q ss_pred cccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcC Q lcl|Aclame:pro 233 APDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFF 312 (418) Q Consensus 233 ~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~Sd 312 (418) .........+....+++.+++.++-.. +.....+++++.....|.++...+|++.+... ..|. . -+= T Consensus 253 --~~~~~~~~~~~~~~~~i~~~~~~~~~~-----~~~~~~~vmn~~~~~~l~~lkd~~G~~i~~~~--~~~~-~---~~l 319 (395) T protein:vir:43 253 --APPSGVVVTAEQRIDRIRLAILQAQLA-----EFPASGIVLNPIDWALIELNKDAENRYIIGSP--QNGT-T---PTL 319 (395) T ss_pred --ccccccccccchhHHHHHHHHHhhccc-----cCCCcEEEEcHHHHHHHHHhhccCCceecccc--ccCC-C---cee Confidence 001111122233455555555444332 22223577888888888877555565544221 1111 0 122 Q ss_pred CeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEE Q lcl|Aclame:pro 313 KGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALEL 392 (418) Q Consensus 313 fG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev 392 (418) +| +.|+.+++ ||++++++.|+....+-+.+ .....+.....+.. + ..|........-+...+ T Consensus 320 ~G-~pVv~~~~-----~~~~~~~~gd~~~~~~~~~~-~~~~i~~~~~~~~~---f--------~~~~~~~r~~~r~d~~v 381 (395) T protein:vir:43 320 WR-LPVVETQA-----ITQDEFLTGAFSLGAQIFDR-MDIEVLVSTENDKD---F--------ENNMVTIRAEERLAFAV 381 (395) T ss_pred cc-eeeEEcCC-----CCCCcEEEEeccceEEEEEe-cceEEEEeccccch---h--------hcCcEEEEEEEeeccEE Confidence 56 46677654 68899999999875333331 11111111111100 0 00233344556789999 Q ss_pred ecccceEEeecCccc Q lcl|Aclame:pro 393 LNPQGCAVITGLQKA 407 (418) Q Consensus 393 ~N~kA~a~I~gL~~~ 407 (418) ++|+|+..+ .+++| T Consensus 382 ~~~~a~~~~-~~taa 395 (395) T protein:vir:43 382 YRPEAFVTG-SLTAS 395 (395) T ss_pred ecccceEEE-EeccC Confidence 999998888 55555 No 33 >protein:vir:4226 Length: 326 # NCBI annotation: observed 35.2Kd protein # Family: family:all:507 # MgeID: mge:89 # MgeName: L5 # Cross-refs: genbank:acc:NP_039681;swissprot:sw:q05223;genbank:gi:9625447;uniprot:Q05223;genbank:GeneID:2942929 Probab=94.70 E-value=0.0037 Score=33.91 Aligned_cols=308 Identities=10% Similarity=0.029 Sum_probs=121.5 Q ss_pred eEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEecc----Cc--- Q lcl|Aclame:pro 27 LRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEA----TG--- 99 (418) Q Consensus 27 ~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~----~~--- 99 (418) |..||..+-..++..-. .+ ++. ...+..++.+..+.. ++ .+ T Consensus 1 ~~~~~~r~~~~~~~~e~------~a----------------~~~---------~~~~~g~~ip~~~~~-~ii~~~~~~s~ 48 (326) T protein:vir:42 1 MAVNPDRTTPFLGVNDP------KV----------------AQT---------GDSMFEGYLEPEQAQ-DYFAEAEKISI 48 (326) T ss_pred CCCCccchhhhcCcchh------hh----------------eec---------cccCCcceechhhHH-HHHHHHHhcch Confidence 55555543332211000 00 000 000111122222111 00 00 Q ss_pred --eEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHh Q lcl|Aclame:pro 100 --ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASY 177 (418) Q Consensus 100 --E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~ 177 (418) ....+.-+.+..+++-+-..+ .....+ .||...+..... ...+ -...++-...|.-|.+..+ T Consensus 49 i~~~~~~~~~~~~~~~~p~~~~~---------~~a~~v----~Eg~~~~~~~~~-f~~i--~~~~~k~~~~v~iS~ell~ 112 (326) T protein:vir:42 49 VQQFAQKIPMGTTGQKIPHWTGD---------VSASWI----GEGDMKPITKGN-MTSQ--TIAPHKIATIFVASAETVR 112 (326) T ss_pred hhhhcceeeccCCceEEEEEeCC---------cceEEe----cCCccccccccc-eeEE--EEeeEEEEEeehhhHHHHh Confidence 112233333444443322221 111112 377666544321 1111 2233334444455555554 Q ss_pred hhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHH--HHH Q lcl|Aclame:pro 178 AEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVV--DAT 255 (418) Q Consensus 178 ~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~--d~~ 255 (418) ... .+-.+|-.++-.+.+.+.+|.++|+|.- ++ .| .||+..............+..+..+..++. ++. T Consensus 113 ~s~-~~~~~~i~~~l~~a~~~~~d~a~l~G~g----s~-~p----~gi~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 182 (326) T protein:vir:42 113 ANP-ANYLGTMRTKVATAFAMAFDNAAINGTD----SP-FP----TFLAQTTKEVSLVDPDGTGSNADLTVYDAVAVNAL 182 (326) T ss_pred cCH-HHHHHHHHHHHHHHHHHHHHHHhhcccC----CC-cc----ccccccccccceeecccccccccchhHHHHHHHHH Confidence 422 3444555555567789999999998854 22 11 122211110000001111111122222221 111 Q ss_pred HHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEE-EEEcCCeEEEEEECccccccCCCCCeE Q lcl|Aclame:pro 256 IDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFT-EWKFFKGRLILKEHPLFSAIGISPGFA 334 (418) Q Consensus 256 ~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~-~~~SdfG~v~vv~n~~l~~~~mp~d~~ 334 (418) ... .. .+.....+++++.....|.++...++++.+...... |.... ..-+-+| +.++.++. +|+++. T Consensus 183 ~~~-~~----~~~~~a~~v~n~~~~~~L~~lkd~~G~~l~~~~~~~-~~~~~~~~~~l~G-~pv~~~~~-----~~~~~~ 250 (326) T protein:vir:42 183 SLL-VN----AGKKWTHTLLDDITEPILNGAKDKSGRPLFIESTYT-EENSPFRLGRIVA-RPTILSDH-----VASGTV 250 (326) T ss_pred hhh-hh----hccCccEEEEeHHHHHHHHHhhccCCceeecccccc-CccccccCceeee-eeEEEcCC-----CCCCce Confidence 111 11 111122466888888888887544555443321111 10000 0111223 34555544 455554 Q ss_pred EE--EchhhceeeeccCCCcccccccccCccccccccccccc----cCccccccEEEEEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 335 VV--VDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYG----HGVDAQGGSLTSEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 335 lv--~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~----~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~ 408 (418) ++ -|.+.+-+..- .+...+.+......... +.... --.|-...+....+...+.+|+|.++|++...++ T Consensus 251 ~~~~Gd~s~~~~~~~--~~~~v~~~~e~~~~~~~---~~~~~~~~~~~~d~~~~r~~~~~d~~v~~~~a~~~l~~~~~~~ 325 (326) T protein:vir:42 251 VGYQGDFRQLVWGQV--GGLSFDVTDQATLNLGT---PQAPNFVSLWQHNLVAVRVEAEYAFHCNDKDAFVKLTNVDATE 325 (326) T ss_pred EEEEeecceEEEEEe--cceEEEEeecceeeecc---cccccchhhhhcCcEEEEEEEEeccEEecccceEEEeeccccC Confidence 43 36655533322 12222211111100000 00000 0013444456888899999999999999987664 Q ss_pred c Q lcl|Aclame:pro 409 E 409 (418) Q Consensus 409 ~ 409 (418) - T Consensus 326 ~ 326 (326) T protein:vir:42 326 A 326 (326) T ss_pred C Confidence 4 No 34 >protein:vir:80684 Length: 315 # NCBI annotation: gp6 # Family: family:all:966 # MgeID: mge:1884 # MgeName: PA6 # Cross-refs: genbank:acc:YP_001285582;genbank:gi:148727088;genbank:GeneID:5247055 Probab=94.63 E-value=0.003 Score=34.41 Aligned_cols=296 Identities=14% Similarity=0.077 Sum_probs=115.5 Q ss_pred EEEeecCceEEEEccccccccCceeEeccCceE----EEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccC Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEATGEN----MRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQ 144 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~----~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGad 144 (418) ++..+.+.+...|.. .+. ..|+......-. ..+.-+.+..+++-+-.++..+ .|+ .||.. T Consensus 1 Ma~~~~~~gg~~vP~--~~~-~~ii~~l~~~s~i~~l~~~i~~~~~~~~ip~~~~~~~a-------~wv------~Eg~~ 64 (315) T protein:vir:80 1 MADDFLSAGKLELPG--SMI-GAVRDRAIDSGVLAKLSPEQPTIFGPVKGAVFSGVPRA-------KIV------GEGEV 64 (315) T ss_pred CCCCcCCcCceEcch--HHH-HHHHHHHHhhchhhhhcceeecCCCceEEEEEeCCcce-------EEe------eCCcc Confidence 222222222222221 000 011110000000 1122233333333332222211 222 36655 Q ss_pred CcCcccccceeccceeEEEeeeeee----chhHHHHhhhcc--cchHHHHH-HHHHHHHHHHHhHHHhcCcccccCcCCc Q lcl|Aclame:pro 145 RPTARSIQPVYVPNFTQIFRNAWAL----TDTARASYAEAG--YSNITESR-RDCMDFHATEQETAIFFGQAFMGTYNGQ 217 (418) Q Consensus 145 a~~~~~~~~~~~~N~tQIf~~~v~V----SgTa~Av~~~g~--~dela~q~-~kk~~EikrdmE~a~i~G~k~~~~s~~~ 217 (418) .+... + -+.||--+..++ .=|.+..+.-.. .+++...+ +.-...|.+.+|.++|+|.... .+.. T Consensus 65 ~~~s~--~-----~f~~v~l~~~kl~~~~~iS~ell~~s~~~~~~~l~~~i~~~la~ai~~~~d~a~~~G~~~~--~~~~ 135 (315) T protein:vir:80 65 KPSAS--V-----DVSAFTAQPIKVVTQQRVSDEFMWADADYRLGVLQDLISPALGASIGRAVDLIAFHGIDPA--TGKA 135 (315) T ss_pred ccccc--c-----ceeeeEeeeeeEEeeehhhHHHhhcCchhHHHHHHHHHHHHHHHHHHHHHhhheeeccCCC--CCcc Confidence 54332 1 233333232223 333333322111 11233333 3445567888999999986311 1111 Q ss_pred cchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEE--- Q lcl|Aclame:pro 218 PLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVT--- 294 (418) Q Consensus 218 ~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~--- 294 (418) ..|+...+. ...... ..+..+.+++.+++..+=...... ...+++++.....|.++....++.- T Consensus 136 ----~~~~~~~~~----~~~~~~-~~~~~~~~d~~~~~~~~~~~~~~~----~~~~imn~~~~~~L~~l~~~~g~~~~g~ 202 (315) T protein:vir:80 136 ----ASAVHTSLN----KTKNIV-DATDSATADLVKAVGLIAGAGLQV----PNGVALDPAFSFALSTEVYPKGSPLAGQ 202 (315) T ss_pred ----ccccccccc----ccccee-eccccchHHHHHHHHHHhhccCcc----ceEEEEcHHHHHHHHHHhhccCCccccc Confidence 222221111 111111 112234566666665443222221 1236678888888877632222110 Q ss_pred EcccceeeceEEEEEEcCCeEEEEEECccccccC----CCCCeEEEEchhhceeeeccCCCcccccccccCccccccccc Q lcl|Aclame:pro 295 VTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIG----ISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATD 370 (418) Q Consensus 295 ~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~----mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~ 370 (418) ....+-..|. .-+=+| +.|+.++.++.-. -+...+++-|.+++.+.+. +++..+-+.... .+... + T Consensus 203 ~~~~~~~~g~----~~tl~G-~PV~~~~~~~~~~~~~~~~~~~~~~GDfs~~~~g~~--~~~~i~i~~~~~-~~~~~-~- 272 (315) T protein:vir:80 203 PMYPAAGFAG----LDNWRG-LNVGASSTVSGAPEMSPASGVKAIVGDFSRVHWGFQ--RNFPIELIEYGD-PDQTG-R- 272 (315) T ss_pred ccccccccCC----Cceecc-eeeEecCcCCcccccccccccEEEEeecccEEEEEe--cCeeEEEecccc-ccCcc-c- Confidence 0000100110 011123 2344443321100 0112356678888766665 333333221110 00000 0 Q ss_pred cccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 371 YSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 371 ~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) + .--.|....+....+.+.+++|+|..++++-...+ +++|+- T Consensus 273 -~-~~~~~~v~~r~~~r~~~~v~~~~a~~~l~~~~a~~----~~~~~~ 314 (315) T protein:vir:80 273 -D-LKGHNEVMVRAEAVLYVAIESLDSFAVVKEKAAPK----PNPPAE 314 (315) T ss_pred -c-hhhcCcEEEEEEEEecceeecccceEEEeeccCCC----CCCCCC Confidence 0 00014445566678999999999999998765543 455555 No 35 >protein:vir:99311 Length: 463 # NCBI annotation: putative capsid protein # Family: family:all:2450 # MgeID: mge:1655 # MgeName: K # Cross-refs: genbank:acc:YP_024474;genbank:gi:48696433;genbank:GeneID:2948039 Probab=94.45 E-value=0.0044 Score=33.52 Aligned_cols=324 Identities=15% Similarity=0.128 Sum_probs=138.4 Q ss_pred eeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEE-----eecCceEEE Q lcl|Aclame:pro 6 GIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAE-----AAADATVLT 80 (418) Q Consensus 6 ~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~-----~~a~~t~~t 80 (418) =-+++.+.|. .+--|.||..- -.||.+-+| ...++.-+-.++ +...-+.++ T Consensus 1 ~~~~~~~~~~-----------------~~~~~~~~~e~----~~KS~~tg~---g~~p~~q~~~~AlR~EsL~~~i~~Lt 56 (463) T protein:vir:99 1 MTIEKNLSDV-----------------QQKYADQFQED----VVKSFQTGY---GITPDTQIDAGALRREILDDQITMLT 56 (463) T ss_pred CCcccccchH-----------------HHHHHhhhhHH----HHHHhhcCC---ccCCccccCcchhhhhhhhhhhheee Confidence 0011111111 00111121100 012211111 010010000000 111112222 Q ss_pred EccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEee-----cccccccCCcCccccccee Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIG-----TAFEEGSQRPTARSIQPVY 155 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g-----~a~~EGada~~~~~~~~~~ 155 (418) ..+. ...|++.+... ...+..+..+..+ ..| ....|+..+.. . T Consensus 57 ~~~~-----~f~~~~~i~k~-------------------~a~STV~~y~~~~-~~G~~g~~~f~~E~g~~~~-------~ 104 (463) T protein:vir:99 57 WTNE-----DLIFYRDISRR-------------------PAQSTVVKYDQYL-RHGNVGHSRFVKEIGVAPV-------S 104 (463) T ss_pred eccc-----chhhhhhcCCc-------------------hhhhhhhhheeee-ccCcccccccccccccccc-------C Confidence 2221 11122222211 1112222222222 111 12346544432 2 Q ss_pred ccceeEEEeeeeeechhHHHHhhh----cccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhh Q lcl|Aclame:pro 156 VPNFTQIFRNAWALTDTARASYAE----AGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQ 231 (418) Q Consensus 156 ~~N~tQIf~~~v~VSgTa~Av~~~----g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~ 231 (418) ..||.|+-..-==++.|.+.+... +..|-++.|.++++.-+...+|++++.|-+.......+..-.-+||...|. T Consensus 105 d~~~~Rr~~~~K~l~~~~~VS~~~~l~n~~~d~~~~~~~dai~~ia~tiE~a~FyGds~l~~~~~~~gleFDGl~~lId- 183 (463) T protein:vir:99 105 DPNIRQKTVSMKYVSDTKNMSIASGLVNNIADPSQILTEDAIAVVAKTIEWASFYGDASLTSEVEGEGLEFDGLAKLID- 183 (463) T ss_pred CCceEEEEEEeeeeehhhhhhhHHHhhcccccHHHHHHHHHHHHHHHHHHHHHhhhhhccCCCcCccccchhhhhhhcC- Confidence 234544433322356666655433 234667889999999999999999999987554333333456778866553 Q ss_pred ccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccc--e--eeceEEE Q lcl|Aclame:pro 232 YAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRE--T--SYGMVFT 307 (418) Q Consensus 232 ~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~--~--~~G~~v~ 307 (418) ..|+... .|..++++.|..+-.++= . +.++..-+|.+...+..|....- .+.|+.... . ..|..+. T Consensus 184 --~enviDa-rG~~Ls~~~ln~Aa~~i~---~--~fGt~TD~~lp~~vka~f~~~~l--~~qrv~~~~N~~~~~~G~~v~ 253 (463) T protein:vir:99 184 --KNNVINA-KGNQLTEKHLNEAAVRIG---K--GFGTATDAYMPIGVHADFVNSIL--GRQMQLMQDNSGNVNTGYSVN 253 (463) T ss_pred --CCCeeec-CCCcccHHHHhhhhhhhh---c--ccCChhheecchHHHHHHHHHhc--CceEEEEcCCCCceeeeeecc Confidence 4555433 446899999887776662 1 34445567888777777775432 333333222 2 5689999 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhc--eeeeccCCCc-ccccccccCccccccccccccccCccccccEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAV--KLAYMDGRNA-KVENYGQGGGENKSGATDYSYGHGVDAQGGSL 384 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~--~~~~L~~r~~-~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i 384 (418) .|.|-.|.+.+-.+.++++ -.++|-+.- -=+|...-.. ..++-.|.++.+ ++..+.+ T Consensus 254 ~f~s~~G~I~L~~s~~m~~-------~~il~~~~~~~p~ap~~~~~tatv~~~~~~~~~~-------------~~~~a~~ 313 (463) T protein:vir:99 254 GFYSSRGFIKLHGSTVMEN-------ELILDESLQPLPNAPQPAKVTATVETKQKGAFEN-------------EEDRAGL 313 (463) T ss_pred ceeeeeeeeeeCCceecCC-------cccccchhhcCCCCccCceeEEEEeeccCCCCCC-------------cccccce Confidence 9999999999988888754 224443322 1111110000 111212222111 1122221 Q ss_pred EEEEEEEEecccceEEeecCccccc-------ccCCCCCCC Q lcl|Aclame:pro 385 TSEWALELLNPQGCAVITGLQKAKE-------RVYLTAPAP 418 (418) Q Consensus 385 ~~E~tLev~N~kA~a~I~gL~~~~~-------~~~~~~~~~ 418 (418) .|-..+.|-.+-.+-.-+-++-. +.--|.|+- T Consensus 314 --~Y~vv~~s~~geS~pS~ivtaT~a~~~~gv~l~It~~a~ 352 (463) T protein:vir:99 314 --SYKVVVNSDDAQSAPSEEVTATVSNVDDGVKLSINVNAM 352 (463) T ss_pred --EEEEEEECCCCCcccchheeeeeeeccceEEEEEEecCC Confidence 34444444333221111111100 000111211 No 36 >protein:vir:95603 Length: 463 # NCBI annotation: ORF016 # Family: family:all:2450 # MgeID: mge:1577 # MgeName: G1 # Cross-refs: genbank:acc:YP_240903;genbank:gi:66394965;genbank:GeneID:5132544 Probab=94.45 E-value=0.0044 Score=33.52 Aligned_cols=324 Identities=15% Similarity=0.128 Sum_probs=138.4 Q ss_pred eeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEE-----eecCceEEE Q lcl|Aclame:pro 6 GIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAE-----AAADATVLT 80 (418) Q Consensus 6 ~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~-----~~a~~t~~t 80 (418) =-+++.+.|. .+--|.||..- -.||.+-+| ...++.-+-.++ +...-+.++ T Consensus 1 ~~~~~~~~~~-----------------~~~~~~~~~e~----~~KS~~tg~---g~~p~~q~~~~AlR~EsL~~~i~~Lt 56 (463) T protein:vir:95 1 MTIEKNLSDV-----------------QQKYADQFQED----VVKSFQTGY---GITPDTQIDAGALRREILDDQITMLT 56 (463) T ss_pred CCcccccchH-----------------HHHHHhhhhHH----HHHHhhcCC---ccCCccccCcchhhhhhhhhhhheee Confidence 0011111111 00111121100 012211111 010010000000 111112222 Q ss_pred EccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEee-----cccccccCCcCccccccee Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIG-----TAFEEGSQRPTARSIQPVY 155 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g-----~a~~EGada~~~~~~~~~~ 155 (418) ..+. ...|++.+... ...+..+..+..+ ..| ....|+..+.. . T Consensus 57 ~~~~-----~f~~~~~i~k~-------------------~a~STV~~y~~~~-~~G~~g~~~f~~E~g~~~~-------~ 104 (463) T protein:vir:95 57 WTNE-----DLIFYRDISRR-------------------PAQSTVVKYDQYL-RHGNVGHSRFVKEIGVAPV-------S 104 (463) T ss_pred eccc-----chhhhhhcCCc-------------------hhhhhhhhheeee-ccCcccccccccccccccc-------C Confidence 2221 11122222211 1112222222222 111 12346544432 2 Q ss_pred ccceeEEEeeeeeechhHHHHhhh----cccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhh Q lcl|Aclame:pro 156 VPNFTQIFRNAWALTDTARASYAE----AGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQ 231 (418) Q Consensus 156 ~~N~tQIf~~~v~VSgTa~Av~~~----g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~ 231 (418) ..||.|+-..-==++.|.+.+... +..|-++.|.++++.-+...+|++++.|-+.......+..-.-+||...|. T Consensus 105 d~~~~Rr~~~~K~l~~~~~VS~~~~l~n~~~d~~~~~~~dai~~ia~tiE~a~FyGds~l~~~~~~~gleFDGl~~lId- 183 (463) T protein:vir:95 105 DPNIRQKTVSMKYVSDTKNMSIASGLVNNIADPSQILTEDAIAVVAKTIEWASFYGDASLTSEVEGEGLEFDGLAKLID- 183 (463) T ss_pred CCceEEEEEEeeeeehhhhhhhHHHhhcccccHHHHHHHHHHHHHHHHHHHHHhhhhhccCCCcCccccchhhhhhhcC- Confidence 234544433322356666655433 234667889999999999999999999987554333333456778866553 Q ss_pred ccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccc--e--eeceEEE Q lcl|Aclame:pro 232 YAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRE--T--SYGMVFT 307 (418) Q Consensus 232 ~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~--~--~~G~~v~ 307 (418) ..|+... .|..++++.|..+-.++= . +.++..-+|.+...+..|....- .+.|+.... . ..|..+. T Consensus 184 --~enviDa-rG~~Ls~~~ln~Aa~~i~---~--~fGt~TD~~lp~~vka~f~~~~l--~~qrv~~~~N~~~~~~G~~v~ 253 (463) T protein:vir:95 184 --KNNVINA-KGNQLTEKHLNEAAVRIG---K--GFGTATDAYMPIGVHADFVNSIL--GRQMQLMQDNSGNVNTGYSVN 253 (463) T ss_pred --CCCeeec-CCCcccHHHHhhhhhhhh---c--ccCChhheecchHHHHHHHHHhc--CceEEEEcCCCCceeeeeecc Confidence 4555433 446899999887776662 1 34445567888777777775432 333333222 2 5689999 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhc--eeeeccCCCc-ccccccccCccccccccccccccCccccccEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAV--KLAYMDGRNA-KVENYGQGGGENKSGATDYSYGHGVDAQGGSL 384 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~--~~~~L~~r~~-~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i 384 (418) .|.|-.|.+.+-.+.++++ -.++|-+.- -=+|...-.. ..++-.|.++.+ ++..+.+ T Consensus 254 ~f~s~~G~I~L~~s~~m~~-------~~il~~~~~~~p~ap~~~~~tatv~~~~~~~~~~-------------~~~~a~~ 313 (463) T protein:vir:95 254 GFYSSRGFIKLHGSTVMEN-------ELILDESLQPLPNAPQPAKVTATVETKQKGAFEN-------------EEDRAGL 313 (463) T ss_pred ceeeeeeeeeeCCceecCC-------cccccchhhcCCCCccCceeEEEEeeccCCCCCC-------------cccccce Confidence 9999999999988888754 224443322 1111110000 111212222111 1122221 Q ss_pred EEEEEEEEecccceEEeecCccccc-------ccCCCCCCC Q lcl|Aclame:pro 385 TSEWALELLNPQGCAVITGLQKAKE-------RVYLTAPAP 418 (418) Q Consensus 385 ~~E~tLev~N~kA~a~I~gL~~~~~-------~~~~~~~~~ 418 (418) .|-..+.|-.+-.+-.-+-++-. +.--|.|+- T Consensus 314 --~Y~vv~~s~~geS~pS~ivtaT~a~~~~gv~l~It~~a~ 352 (463) T protein:vir:95 314 --SYKVVVNSDDAQSAPSEEVTATVSNVDDGVKLSINVNAM 352 (463) T ss_pred --EEEEEEECCCCCcccchheeeeeeeccceEEEEEEecCC Confidence 34444444333221111111100 000111211 No 37 >protein:vir:4856 Length: 293 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:106 # MgeName: DT1 # Cross-refs: genbank:acc:NP_049396;genbank:gi:9632424;genbank:GeneID:1258532 Probab=94.39 E-value=0.0045 Score=33.42 Aligned_cols=280 Identities=13% Similarity=0.040 Sum_probs=110.5 Q ss_pred eeEEEEEeecCceEEEEccccccccCceeEeccCc---------eEEEEEEecCc--eeEEEccccccchhhhhCCceEE Q lcl|Aclame:pro 65 SAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGL--NLTVKRQTGRISAAIIAANTKLI 133 (418) Q Consensus 65 ~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~--~~tv~rg~~~tta~~~~~gt~v~ 133 (418) .....+..+.++ .++..+.-+...|-+ ....+..+.+. ++.+.+..... + ...|. T Consensus 1 ~l~~~~~~t~~~--------gg~liP~~~~~~Ii~~~~~~~~l~~~~~~~~~~~~~g~~~~~~~~~~~-~-----~a~~v 66 (293) T protein:vir:48 1 MLDSKTDHSGSD--------AGLTIPQDIRTAINTLVRQYDSLQEYVNVENVTTLTGSRVYEKWTDIT-G-----LANID 66 (293) T ss_pred CceeecccccCc--------CceEechhHHHHHHHHHHhhhhhhhhceeeeccCCcceEEEEeecCCC-c-----ceeee Confidence 111111111111 112211111111111 01112222221 12222211110 0 11222 Q ss_pred EeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccC Q lcl|Aclame:pro 134 VIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGT 213 (418) Q Consensus 134 ~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~ 213 (418) .||...+.........+. ...++-...+.=|.+..+.... +-.++-..+-.+.+.+.+++.+++|... T Consensus 67 ------~Eg~~~~~~~~~~~~~i~--l~~~k~~~~~~iS~ell~ds~~-~l~~~i~~~la~~~~~~~~~~i~~g~~~--- 134 (293) T protein:vir:48 67 ------DEAGKIADIDDPKLSLIK--YTIKRYAGISTVTNSLLADSAE-NILAWLSGWIAKKVVVTRNKAILGVVDK--- 134 (293) T ss_pred ------cCCcccccccccceeEEE--EeeeEEEEeehhhHHHHhhhhH-HHHHHHHHHHHHHHHHHHHhHHhhcccc--- Confidence 456554432111111111 1222223333334444433222 2223333334445566777777765431 Q ss_pred cCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceE Q lcl|Aclame:pro 214 YNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEV 293 (418) Q Consensus 214 s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~ 293 (418) .+ ...+..+.++|.++..++-... ..+ ..+++++.....|.++....+++ T Consensus 135 -~~------------------------~~~~~~~~d~i~~~~~~l~~~~-~~~----a~~vmn~~~~~~L~~lkd~~g~~ 184 (293) T protein:vir:48 135 -LP------------------------TKPTLTKWDDIIDLEAKVDPAI-KQT----SFFLTNTSGFTALKKVKNALGDY 184 (293) T ss_pred -cc------------------------ccccccCHHHHHHHHHhhhhhh-cCC----CEEEEcHHHHHHHHHhhccCCce Confidence 00 1224567888888776664321 111 24678888888888876556665 Q ss_pred EEcccceeeceEEEEEEcCCeE-EEEEECccccccCCCCCeEEEEchhh-ceeeeccCCCcccccccccCcccccccccc Q lcl|Aclame:pro 294 TVTQRETSYGMVFTEWKFFKGR-LILKEHPLFSAIGISPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDY 371 (418) Q Consensus 294 ~~~~~~~~~G~~v~~~~SdfG~-v~vv~n~~l~~~~mp~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~ 371 (418) .+...-.. |. -.+=+|. |.++.+..+.........+++.|+.. +.+..- .+...+.....+. .+ T Consensus 185 l~~~~~~~-~~----~~~l~G~Pv~~~~~~~~~~~~~~~~~~~~gd~~~~~~~~~~--~~~~i~~~~~~~~---~~---- 250 (293) T protein:vir:48 185 LMERDVKS-PT----GYSIAGFAVKEISDRWLPNASSGVMPLYFGDLKQAVTLFDR--QQMSLLSTNIGGG---AF---- 250 (293) T ss_pred EeecCcCC-CC----CceecceeeEEecccccCCccCCceEEEEEeccceEEEEEe--cceEEEEecccch---hh---- Confidence 44321000 00 0011232 22222333222122223466667653 222222 1221111111110 00 Q ss_pred ccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 372 SYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 372 ~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) -.|.........+...+++++|..+++.=+.+.|..-...+|- T Consensus 251 ----~~~~~~~r~~~r~d~~~~~~~a~~~l~~~~~~~~~~~~~~~~~ 293 (293) T protein:vir:48 251 ----ETDTTKVRVIDRFDVVATDTEAFVPASFKAIADQKGNIGSTAV 293 (293) T ss_pred ----hcCeEEEEEEEeeCcEEecccceEEEEeeccccCCccccccCC Confidence 0134445577888999999999999985455544444444444 No 38 >protein:vir:78523 Length: 338 # NCBI annotation: Putative head structural protein # Family: family:all:507 # MgeID: mge:1853 # MgeName: U2 # Cross-refs: genbank:acc:YP_001491585;genbank:gi:157786408;genbank:GeneID:5625675 Probab=93.70 E-value=0.0067 Score=32.51 Aligned_cols=318 Identities=12% Similarity=-0.009 Sum_probs=122.8 Q ss_pred eeeeeeecccceeEEEEEeecCceEEEEccccccccCcee----Eec----cCceEEEEEEecCceeEEEccccccchhh Q lcl|Aclame:pro 54 HGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIF----YNE----ATGENMRLELVNGLNLTVKRQTGRISAAI 125 (418) Q Consensus 54 ~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~----~~~----~~~E~~~Vtav~g~~~tv~rg~~~tta~~ 125 (418) ..|++.-- .. +...+. ....+.. +..+.+..+. ... .-.....+..+.+..+++-+-.....+.- T Consensus 1 ~~~~~e~~-~~--~~~~~~---~~~~~~~-~~~liP~~~~~~ii~~~~~~s~l~~l~~~~~~~~~~~~ip~~~~~~~a~~ 73 (338) T protein:vir:78 1 MATLNELA-PN--TAGSNH---QGRLAHV-PSDLLPKEIVGPIFDKAQESSLVLRLGENIPISYGETIIPTTVKRPEVGQ 73 (338) T ss_pred CcchHHhh-hh--hccccc---ccceecc-cccccchHHHHHHHHHHHhhchhhhhcceeeccCCceEEEEEecCcccee Confidence 22222110 00 000000 0011111 1112222111 100 00111234445555544443222211110 Q ss_pred hhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeee----chhHHHHhhhcccchHHHHHHHHHHHHHHHHh Q lcl|Aclame:pro 126 IAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWAL----TDTARASYAEAGYSNITESRRDCMDFHATEQE 201 (418) Q Consensus 126 ~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~V----SgTa~Av~~~g~~dela~q~~kk~~EikrdmE 201 (418) ...+. +.-..||.+.+.... .+.+|--+...+ .-|.+.+... ..+-..+-..+-.+.+.+.+| T Consensus 74 v~~~~-----~~~~~Eg~~~~~~~~-------~f~~v~l~~~k~~~~~~is~ell~ds-~~~~~~~i~~~la~a~~~~~d 140 (338) T protein:vir:78 74 VGVGT-----SNEQREGGTKPLSGT-------AWDTRSVAPIKLATIVTVSEEFARMN-PSGLYTKLQADLAYAIGRGID 140 (338) T ss_pred ecccc-----ccccccccccccccc-------ceeEEEEEEEEEEEeehhhHHHHhcC-HHHHHHHHHHHHHHHHHHHHH Confidence 00011 011246655543221 233333333333 3333444332 223345555666677899999 Q ss_pred HHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHH Q lcl|Aclame:pro 202 TAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMR 281 (418) Q Consensus 202 ~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~ 281 (418) .++|+|..... .. .-.||......-..+..+....+.....+++.++...+-... ......+++++.... T Consensus 141 ~~~l~G~g~~~--~~----~~~gi~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~----~~~~~~~~m~~~~~~ 210 (338) T protein:vir:78 141 LAVFHGKSPLT--GS----ALQGIDTNNVIVNTTNVDYLQTGTTPLLDRFLDGYDLVSANT----DVDFNGWAADPRYRA 210 (338) T ss_pred HHhhcccCCCc--cc----cccccccccccccccccccccccchhhHHHHHHHHHHhhhhc----cccceEEEEchHHHH Confidence 99998875211 11 122333211110111122222223345566666665554221 112335778887777 Q ss_pred HHHhhhh---ccceEEEcccceeeceEEEEEEcCCeEEEEEECccccc----cCCCCCeEEEEchhhceeeeccCCCccc Q lcl|Aclame:pro 282 TMQDIGR---FFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSA----IGISPGFAVVVDVPAVKLAYMDGRNAKV 354 (418) Q Consensus 282 ~i~~~~~---~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~----~~mp~d~~lv~D~~~~~~~~L~~r~~~~ 354 (418) .|.++.. .++++-+.... ..|.. .+=+|. .|+.++.+.. -..+...+++-|+++..+..- .+... T Consensus 211 ~L~~~~~l~d~~g~~l~~~~~-~~~~~----~~l~G~-PV~~~~~ip~~~~~~~~~~~~~~~gdfs~~~~~~~--~~~~i 282 (338) T protein:vir:78 211 RLLRSQAYRDANGNVDPTRIN-LAASA----GDLLGL-PVQFGKAVGGDLGAATDSKVRVVGGDFSQLKYGFA--DEIRV 282 (338) T ss_pred HHHHHhhhccCCCceeecccc-cCCCC----ceeeee-eEEEccccCccccccCCcccEEEEEecceEEEEee--cccEE Confidence 7665422 33443332111 00100 111232 4444443321 111223467778887655544 23322 Q ss_pred ccccccCcccccccccc-ccccCccccccEEEEEEEEEEecccceEEeecCccccccc Q lcl|Aclame:pro 355 ENYGQGGGENKSGATDY-SYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERV 411 (418) Q Consensus 355 e~laKtG~~~~~~~~~~-~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~ 411 (418) +.....+..+....... ...-..|-...+.+.-+...+.+|+|..+|++-. +|.+ T Consensus 283 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r~~~r~d~~v~~~~a~~~l~~~~--~~~~ 338 (338) T protein:vir:78 283 KMSDTATLTDNTSPTPQTVSMWQTNQIAILIEVTFGWLLGDKQAFVKFVDDE--DPDA 338 (338) T ss_pred EEeecccccccccccccchhhhhcCcEEEEEEEEeccEeecccceEEEeccc--CCCC Confidence 22222221110000000 0001114445566778899999999999988732 2222 No 39 >protein:vir:100135 Length: 418 # NCBI annotation: gp5 # Family: family:all:585 # MgeID: mge:1639 # MgeName: phi1026b # Cross-refs: genbank:acc:NP_945035;genbank:gi:38707895;genbank:GeneID:2744182 Probab=93.64 E-value=0.0069 Score=32.45 Aligned_cols=289 Identities=11% Similarity=0.011 Sum_probs=122.8 Q ss_pred Cc----ce-eeee--------------c-cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeee Q lcl|Aclame:pro 1 MS----VY-AGIF--------------N-TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKT 60 (418) Q Consensus 1 ~~----~~-~~~~--------------~-~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~ 60 (418) .+ +. .+.+ . ++.+---|.-+.++..++...+. ..+|+++.+. .++...+ T Consensus 110 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g~lvp~~~~~~ii~~~~~-~~~l~~~~~~---~~~~~~~------- 178 (418) T protein:vir:10 110 KGMDGSARKSVRVRVDRKSIMNVPATVGSGVSGSNSLVVADRQAGIIAPPQR-KMTIRDLLMP---GQTSSSS------- 178 (418) T ss_pred HHHHHHHhhhhhhhhHHHHHHHhhhhccCCCCCCccccchhHHHHHHHHHhh-hhhHHhhcce---eeccCCc------- Confidence 00 00 0000 0 00000001111111122221111 2223322111 0010000 Q ss_pred cccceeEEEEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccc Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFE 140 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~ 140 (418) .+..++++..+ ++ .|. . T Consensus 179 --------------------------------------~~~~~~~~~~~------------~a-------~~v------~ 195 (418) T protein:vir:10 179 --------------------------------------IEYTVETGFTN------------NA-------AAV------A 195 (418) T ss_pred --------------------------------------eeEEEEecCCC------------ce-------eee------c Confidence 01111111100 00 111 2 Q ss_pred cccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccch Q lcl|Aclame:pro 141 EGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLH 220 (418) Q Consensus 141 EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r 220 (418) ||...+..... -.. -....++-...+.-|.+..+.. .+-.++-...-...+.+.+|.+||+|.. ++..| T Consensus 196 E~~~~~~~~~~-f~~--v~~~~~k~~~~~~is~ell~ds--~~l~~~i~~~l~~a~~~~~d~a~l~G~g----~~~~p-- 264 (418) T protein:vir:10 196 EGAQKPTSDLK-FNL--KNQPVRTIAHLFKASRQILDDA--PALQSYIDGRARYGLQLTEEGQILKGDG----TGANI-- 264 (418) T ss_pred cCccccccccc-eee--EEEeeeeEEEeehhhHHHHHhH--HHHHHHHHHHHHHHHHHHHHHHHhccCC----CCccc-- Confidence 44443322211 111 1122223333333444444432 2444555555667789999999998843 22222 Q ss_pred hhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce Q lcl|Aclame:pro 221 TTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET 300 (418) Q Consensus 221 ~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~ 300 (418) .||+... .......+.....+.+++.+++..+...+.. ...+++++.....|.++-..+|++.+..... T Consensus 265 --~Gi~~~~----~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~-----~~~~v~n~~~~~~L~~lkd~~G~~i~~~~~~ 333 (418) T protein:vir:10 265 --LGILPQA----SAFMPSITLANATPIDKIRLALLQAVLAEFP-----ATGIVLNPIDWASIELTKDSQGRYIVGNPVN 333 (418) T ss_pred --ccccccc----ccccccccccccccHHHHHHHHHhhccccCC-----CCEEEEcHHHHHHHHHhhcCCCceecccccc Confidence 3665322 1112222233445677788877776543322 2246788888888888755556554432111 Q ss_pred eeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccc Q lcl|Aclame:pro 301 SYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQ 380 (418) Q Consensus 301 ~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~ 380 (418) |.. -+=+| +.|+.++ +||++.+++.|+++..+-+.. .+...+.....+.. + ..|.. T Consensus 334 --~~~----~~l~G-~pV~~~~-----~~p~~~~~~gd~s~~~~~~~~-~~~~i~~~~~~~~~---f--------~~~~~ 389 (418) T protein:vir:10 334 --GTT----PRLWN-LPVVETQ-----AMTANEFLVGAFSMAAQIFDR-MEIEVLLSTENVDD---F--------EKNMV 389 (418) T ss_pred --CCC----ceecc-eeeEEcC-----CCCCCcEEEeeccceEEEEEe-cceEEEEecccchh---h--------hcCce Confidence 110 12246 3666664 478899999999764222221 11111111111100 0 01334 Q ss_pred ccEEEEEEEEEEecccceEEeecCccccc Q lcl|Aclame:pro 381 GGSLTSEWALELLNPQGCAVITGLQKAKE 409 (418) Q Consensus 381 k~~i~~E~tLev~N~kA~a~I~gL~~~~~ 409 (418) ..+.+.-+...+++|+|...++--..+.- T Consensus 390 ~~r~~~~~d~~~~~~~a~~~~~~~~~~~g 418 (418) T protein:vir:10 390 SIRAEERLALAVYRPESFVTGALVEQAGG 418 (418) T ss_pred EEEEEEeeccEEecccceEEEEeccCCCC Confidence 45567789999999999999887655544 No 40 >protein:vir:96666 Length: 462 # NCBI annotation: ORF016 # Family: family:all:2450 # MgeID: mge:1623 # MgeName: Twort # Cross-refs: genbank:acc:YP_238545;genbank:gi:66391271;genbank:GeneID:5130448 Probab=93.60 E-value=0.007 Score=32.39 Aligned_cols=317 Identities=16% Similarity=0.136 Sum_probs=133.2 Q ss_pred eEeecCCcc----hhHHHhhhccccceeeeeeeeeeeecccceeEEEEE-----eecCceEEEEccccccccCceeEecc Q lcl|Aclame:pro 27 LRRVPNGSA----PLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAE-----AAADATVLTVENSDGLTKGMIFYNEA 97 (418) Q Consensus 27 ~~~~~~~~~----p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~-----~~a~~t~~tV~~~~~~~~~~~~~~~~ 97 (418) |-++-|.+. -+.++. - .-.||.+-+| ...++.-+-.++ +..+-+.++..+. ..+|++++ T Consensus 1 ~~~~~~~~~~~~~~~~~~~--e--~~~KS~~tg~---g~~p~~q~~~gAlR~esL~~~i~~Lt~~~~-----~~~~~~~i 68 (462) T protein:vir:96 1 MHKDTNLTAEQNKYADKFQ--E--EVMKSYQTGY---GITPDTQVDAGALRREILDDQITMLTWTQD-----DLIFYREI 68 (462) T ss_pred Cccccccchhhhhhhchhh--H--HHHHHHhcCC---CcCCccccccchhhhhhhhhhhheeeeccc-----chhhhhhc Confidence 111111110 011110 0 0011111111 000000000000 1111112222211 11112222 Q ss_pred CceEEEEEEecCceeEEEccccccchhhhhCCceEEEee-----cccccccCCcCcccccceeccceeEE------Eeee Q lcl|Aclame:pro 98 TGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIG-----TAFEEGSQRPTARSIQPVYVPNFTQI------FRNA 166 (418) Q Consensus 98 ~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g-----~a~~EGada~~~~~~~~~~~~N~tQI------f~~~ 166 (418) ... ...+..+..+..+ ..| ....|+..++... .||.|+ +..+ T Consensus 69 ~k~-------------------~a~sTv~~y~~~~-~~G~~g~~~f~~E~g~~~~~d-------~~~~R~~~~~k~l~~t 121 (462) T protein:vir:96 69 SRR-------------------PAQSTVQKYDVYL-RHGNVGHSRFVREVGVAPVSD-------PNIRQKTVEMKYVSDT 121 (462) T ss_pred CCc-------------------hhhhhhhhheeee-ccCccccccccccccccccCC-------CceEEEEEEEEEEeee Confidence 210 1112222222222 111 2235655443222 233332 2223 Q ss_pred eeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCcc Q lcl|Aclame:pro 167 WALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAV 246 (418) Q Consensus 167 v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~ 246 (418) -.||--+.- ..+..|-++.|.++++.-+...+|++.+.|-+.......+..-.-+||...| ...|+.... |..+ T Consensus 122 ~~vsi~~tl--~n~~~d~~~~~~~dai~~~a~tiE~a~Fygds~l~~~~~~~gleFDGl~~lI---~~~NViDar-G~~L 195 (462) T protein:vir:96 122 KNLSIASTL--VNNIQDPMQILTEDAIAVVAKTIEWASFYGDASLTADPTGQGLEFDGLAKLI---DKDNVIDAK-GESL 195 (462) T ss_pred eeechhhhh--ccchhhHHHHHHHHHHHHHHHHHHHHHhhhhcccCCCccccccchhhhhhhc---CCCceeecC-CCCc Confidence 333333332 2345667899999999999999999999998755433322235577886555 456776553 4689 Q ss_pred chHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce----eeceEEEEEEcCCeEEEEEECc Q lcl|Aclame:pro 247 TYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET----SYGMVFTEWKFFKGRLILKEHP 322 (418) Q Consensus 247 te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~----~~G~~v~~~~SdfG~v~vv~n~ 322 (418) +++.|..+...+= .+.++..-+|.+...+..|....- .+.|+....+ ..|..+..|.|-.|.+++-.+. T Consensus 196 s~~~ln~aa~~i~-----~~fGt~TD~~~p~~v~a~f~~~~l--~~qrv~~~~n~g~~~~G~~v~~f~s~~G~I~L~~s~ 268 (462) T protein:vir:96 196 TETLLNRSAVLIG-----KSFGTATDAYMPIGVHADFVNSVL--GRQMQLMQDNSGNVNAGYNVQGFYSSRGFIKLHGST 268 (462) T ss_pred cHHHHhhhhhhcc-----cccCChhheecchHHHHHHHHhhc--CceEEEEcCCCCceeeeeeccceeeeeeeeeeCCce Confidence 9999988876661 234444557777777777765422 3333333332 5688999999999999998888 Q ss_pred cccccCCCCCeEEEEchhhceeeeccCCC--cccccccccCccccccccccccccCccccccEEEEEEEEEEecccceE- Q lcl|Aclame:pro 323 LFSAIGISPGFAVVVDVPAVKLAYMDGRN--AKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCA- 399 (418) Q Consensus 323 ~l~~~~mp~d~~lv~D~~~~~~~~L~~r~--~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a- 399 (418) ++++ -+++|-+.-...-..... ...-.+++.| .+.+.. | .+||.-+|.=-.++| T Consensus 269 ~m~~-------~~i~~~~~~~~p~ap~~~~vsaTv~t~~~g-----~f~~~~-----d------~~~y~Y~V~avs~dge 325 (462) T protein:vir:96 269 VMEN-------ELILDESLQPLPNAPQPATVKATVETGKKG-----LFTDEH-----D------RAELTYKVVVNSDDAQ 325 (462) T ss_pred ecCc-------ccccccccccCCCCCCCCceeEEEEeCCCC-----CCCCcc-----C------ceeEEEEEEEECCCCc Confidence 8753 233443332111110000 0001122222 111100 1 244443333222221 Q ss_pred ---------Ee------ecCcccccccCCCCCCC Q lcl|Aclame:pro 400 ---------VI------TGLQKAKERVYLTAPAP 418 (418) Q Consensus 400 ---------~I------~gL~~~~~~~~~~~~~~ 418 (418) -+ ..|...-+.++-..|-- T Consensus 326 S~PS~~VtaTva~~~~gv~ltIt~~a~~~~~~~~ 359 (462) T protein:vir:96 326 SAPSEAVTATVNNATDGVKLEISVNAMYQQQPQF 359 (462) T ss_pred cccceeeEeeeecccccceEEEEEcCCccccceE Confidence 00 00111101111111100 No 41 >protein:vir:80835 Length: 464 # NCBI annotation: putative major capsid protein # Family: family:all:2450 # MgeID: mge:1885 # MgeName: phiEF24C # Cross-refs: genbank:acc:YP_001504125;genbank:gi:158079312;genbank:GeneID:5666484 Probab=93.03 E-value=0.0091 Score=31.78 Aligned_cols=328 Identities=15% Similarity=0.145 Sum_probs=139.5 Q ss_pred eeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEcc Q lcl|Aclame:pro 4 YAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVEN 83 (418) Q Consensus 4 ~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~ 83 (418) |.- |=|++ ..++|.-..-+-.++...+..+.+++--+-+-... +...-+.+++.+ T Consensus 1 ~~~---------~~n~~------~~~~~~~e~~~Ks~ttgy~~~p~~q~~~~AlRrEs----------L~~~i~~Lt~~~ 55 (464) T protein:vir:80 1 MTE---------KKNTE------RQLTSVQEEVIKGFTTGYGITPESQTDAAALRREF----------LDDQITMLTWAD 55 (464) T ss_pred CCc---------chhhH------hhcCcccHHHHHHHHhCCccCcccccCcchhhhhh----------hhhhhheeeecc Confidence 211 11222 12222211112223222222222221111111000 111112233332 Q ss_pred ccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEee-----cccccccCCcCcccccceeccc Q lcl|Aclame:pro 84 SDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIG-----TAFEEGSQRPTARSIQPVYVPN 158 (418) Q Consensus 84 ~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g-----~a~~EGada~~~~~~~~~~~~N 158 (418) .+ ..|++.+...- .++..+..+..+ ..| ....|+..++... .| T Consensus 56 ~~-----f~f~~di~k~~-------------------a~STV~~y~~~~-~~G~~g~~~f~~E~g~~~~~d-------~~ 103 (464) T protein:vir:80 56 GD-----LSFYRDITKRP-------------------ATSTVAKYDVYL-AHGRVGHTRFTREIGVAPISD-------PN 103 (464) T ss_pred cc-----hhhhhhcCCch-------------------hhhhhhhhheee-ccCccccccccccccccccCC-------Cc Confidence 21 12222222211 111112222211 111 2235665543222 34 Q ss_pred eeEEEeeeeeechhHHHHhh----hcccchHHHHHHHHHHHHHHHHhHHHhcCcccccC-cCCccchhhHHHHHHHhhcc Q lcl|Aclame:pro 159 FTQIFRNAWALTDTARASYA----EAGYSNITESRRDCMDFHATEQETAIFFGQAFMGT-YNGQPLHTTQGIVDAVRQYA 233 (418) Q Consensus 159 ~tQIf~~~v~VSgTa~Av~~----~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~-s~~~~~r~t~GI~~~i~~~~ 233 (418) |.|+--.-=-+|+|.+.+.. ..+.|-+..|.++++.-+...+|++.+.|-+.... ..++..-+-+||...| . T Consensus 104 ~~Rr~~~~Kfl~~~r~vsia~~lvn~~~d~~~~~~~dai~~va~tiE~a~FyGds~l~~~~~~~~gleFDGl~~lI---~ 180 (464) T protein:vir:80 104 LRQKTVNMKYVSDTKNMSIATGLVNNIEDPMRILTDDAISVVAKTIEWASFYGDSDLSENPDAGSGLEFDGLAKLI---D 180 (464) T ss_pred eEEEEEEeeeeecceeeeeehhhhcchhhHHHHHHHHHHHHHHHHHHHHHhhhccccCCCCCCccccchhhhHhhc---C Confidence 44332221123333332211 12337788999999999999999999999875432 2333445678887665 3 Q ss_pred ccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHH-HHhhhhccceEEEcccce---eeceEEEEE Q lcl|Aclame:pro 234 PDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRT-MQDIGRFFGEVTVTQRET---SYGMVFTEW 309 (418) Q Consensus 234 ~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~-i~~~~~~~~~~~~~~~~~---~~G~~v~~~ 309 (418) ..|+.... |..++++.|..+-..+= + +.+++.-+|.+...+-. ++.+.. .+.++..... ..|..+..| T Consensus 181 ~~NViDar-G~~Ls~~~ln~Aa~~i~-~----~fGt~TD~~lp~~v~a~f~n~~l~--~q~~~~~~n~~~~~~G~~v~~f 252 (464) T protein:vir:80 181 KHNVLDAK-GASLTEALLNQASVLVG-K----GYGTPTDAYMPIGVQADFVNQQLD--RQVQVISDNGQNATMGFNVKGF 252 (464) T ss_pred CCceeecC-CCCcCHHHHhhhhhhhh-c----ccCChhhcccchhHHHHHHhhhcC--ceeEEEcCCCCcceeeeecccc Confidence 56775543 45699999987776662 1 34444456777666645 477643 4555554333 448999999 Q ss_pred EcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEE Q lcl|Aclame:pro 310 KFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWA 389 (418) Q Consensus 310 ~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~t 389 (418) .|-.|.+.+-.+-+|+. .-++|++..+ +.+-+...---+..... ...++.+.. .-.-.+|- T Consensus 253 ~sa~G~i~L~~s~~m~~-------~~~ld~~~~~---~~~apaapsvt~tv~~~--------~~g~f~~~~-~~~~~~Yk 313 (464) T protein:vir:80 253 NSARGFIRLHGSTVMEL-------EQILDENRMQ---LPNAPQKATVKATLEAG--------TKGKFRDED-LTIDTEYK 313 (464) T ss_pred cccccceeccCccccCc-------cccccccccc---CCCCcCCceeEEEecCC--------cccCCcccc-ccceeEEE Confidence 99999888877766533 3345554432 11100000000000000 001111111 00111455 Q ss_pred EEEecccceEEeecCcc--------------cccccCCCCCCC Q lcl|Aclame:pro 390 LELLNPQGCAVITGLQK--------------AKERVYLTAPAP 418 (418) Q Consensus 390 Lev~N~kA~a~I~gL~~--------------~~~~~~~~~~~~ 418 (418) ..+.|-.+--++...-+ --...|...|.- T Consensus 314 v~~vn~~GeS~ps~~~~~ti~~~~~~V~l~it~~~~~~~~p~y 356 (464) T protein:vir:80 314 VVVVSDDAESAPSDVASVVIDDKKKQVKLEITINNMYQARPQY 356 (464) T ss_pred EEEECCCCccccceeeeeeecCcccEEEEEEEeCCccccccce Confidence 55555444333322111 101111111111 No 42 >protein:vir:1638 Length: 298 # NCBI annotation: Structural protein # Family: family:all:966 # MgeID: mge:33 # MgeName: r1t # Cross-refs: genbank:acc:NP_695059;genbank:gi:23455750;genbank:GeneID:955469 Probab=93.01 E-value=0.0091 Score=31.77 Aligned_cols=281 Identities=10% Similarity=-0.033 Sum_probs=111.8 Q ss_pred EccccccccCceeEeccCc---------eEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccc Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATG---------ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSI 151 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~ 151 (418) ++.+.+...+.-+..++-+ -...+.-+.+..+++-+-.++.. ..|+ .||.+.+.... T Consensus 1 ma~~gG~lvp~~~~~~ii~~~~~~s~i~~l~~~~~~~~~~~~ip~~~~~~~-------a~~v------~E~~~~~~~~~- 66 (298) T protein:vir:16 1 MVLNKGTLFDPTLVTDLISKVAGKSSIARLSAQKPIPFNGEKVFTFTMDSE-------IDVV------AESGKKTHGGV- 66 (298) T ss_pred CcccCcceechhHHHHHHHHHHhhhhhhhhcceeeccCCceEEEEEecCcc-------eEEe------cCCcccccccc- Confidence 2211111111111111111 11122233334444433222211 1222 36665553321 Q ss_pred cceeccceeEEEeeeeeec----hhHHHHhh--hcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHH Q lcl|Aclame:pro 152 QPVYVPNFTQIFRNAWALT----DTARASYA--EAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGI 225 (418) Q Consensus 152 ~~~~~~N~tQIf~~~v~VS----gTa~Av~~--~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI 225 (418) .+.||--+.-.+. =|.+.... .-..+-.++-..+-.+.+.+.+|.++++|...-.+.... .-|+ T Consensus 67 ------~f~~v~l~~~k~a~~~~iS~ell~~s~d~~~~l~~~i~~~la~ai~~~~d~~~l~G~~~~~g~~~~----~~~~ 136 (298) T protein:vir:16 67 ------TLAPQTMVPIKVEYGARISDEFMYASDEEKINILQEFNDGFAKKVARGIDLMAFHGVNPRLGTASA----VIGT 136 (298) T ss_pred ------ceeEEEEeeeeEEEeehhhHHHhhcCcccHHHHHHHHHHHHHHHHHHHHHHHhhccccCCCCcccc----cccc Confidence 1233322222222 22232211 111122334445556678899999999986421111111 1111 Q ss_pred HHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceE Q lcl|Aclame:pro 226 VDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMV 305 (418) Q Consensus 226 ~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~ 305 (418) ..... ...+............+++.++...+...... ...+++++.....|.++...+|++.+..... .|. T Consensus 137 ~~~~~--~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~-----~~~~vmn~~~~~~l~~lkd~~G~~i~~~~~~-~~~- 207 (298) T protein:vir:16 137 NHFDS--KVTQKVEAPRGIADPNGAIENAVELLTGVDAD-----VTGIAINPSFRSALAKQKDLQDNALFPELKW-GAT- 207 (298) T ss_pred ccccc--ccccccccccccccHHHHHHHHHHHhhhcCCC-----ccEEEEcHHHHHHHHHhhccCCCeeecCccc-CCC- Confidence 11000 00111111111122244566666555433222 2236678888888888755556655432211 010 Q ss_pred EEEEEcCCeEEEEEECcccc-ccCCCCCeEEEEchhhc-eeeeccCCCcccccccccCccccccccccccccCccccccE Q lcl|Aclame:pro 306 FTEWKFFKGRLILKEHPLFS-AIGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGS 383 (418) Q Consensus 306 v~~~~SdfG~v~vv~n~~l~-~~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~ 383 (418) .. +=+|. .++.+..+. ....+.+.+|+-|.+.. .+..- .+...+-.. .+..+... . ..--.|-...+ T Consensus 208 ~~---~l~G~-PV~~~~~v~~~~~~~~~~~~~GDfs~~~~~~~~--~~~~~~~~~-~~~~~~~~-~---~~f~~~~v~~r 276 (298) T protein:vir:16 208 PD---TINGL-PVDVNKTVSDMSLTQRDRAIIGDFANGFKWGYA--KEVPLEVIQ-YGDPDNSG-L---DLKGYNQVYIR 276 (298) T ss_pred Cc---eecce-eeEEecccccccCCCccEEEEeeccceEEEEEe--cCceEEEee-ccCCcCcc-h---hhhhcCcEEEE Confidence 00 11232 444444332 12234456777787653 22222 122111111 11000000 0 00001333345 Q ss_pred EEEEEEEEEecccceEEeecCc Q lcl|Aclame:pro 384 LTSEWALELLNPQGCAVITGLQ 405 (418) Q Consensus 384 i~~E~tLev~N~kA~a~I~gL~ 405 (418) ....+...+++|+|.++|++-. T Consensus 277 a~~r~d~~v~~~~a~~~l~~at 298 (298) T protein:vir:16 277 AELFLGWGILDATKFARVTEAN 298 (298) T ss_pred EEEEEccEeecccceEEEeecC Confidence 5667788999999999998887 No 43 >protein:vir:1886 Length: 385 # NCBI annotation: major capsid subunit precursor # Family: family:all:585 # MgeID: mge:41 # MgeName: HK022 # Cross-refs: genbank:acc:NP_037666;genbank:gi:9634124;genbank:GeneID:1262513 Probab=92.88 E-value=0.0096 Score=31.64 Aligned_cols=322 Identities=9% Similarity=-0.027 Sum_probs=124.7 Q ss_pred CcceeeeeccCCC---hhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCce Q lcl|Aclame:pro 1 MSVYAGIFNTTLN---PQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADAT 77 (418) Q Consensus 1 ~~~~~~~~~~~~~---~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t 77 (418) ..-.+...+.... ..+...+++...+.....+.......-.-..++.........-++.... .. T Consensus 61 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g~~i~~~~~~~ii--------~~----- 127 (385) T protein:vir:18 61 EQKLASGAENPGEKKSFSERAAEELIKSWDGKQGTFGAKTFNKSLGSDADSAGSLIQPMQIPGII--------MP----- 127 (385) T ss_pred HHHhhccccccchhhhhHHHHHHHHHHHHHHhhccchhhHHHhhhccccccCCceecchhhhHHH--------HH----- Confidence 0000000000000 0000011111111111111111111000000000000000000111100 00 Q ss_pred EEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecc Q lcl|Aclame:pro 78 VLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVP 157 (418) Q Consensus 78 ~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~ 157 (418) +...+.+.. .+.+..+.+..++.-+-..... ...|. .||...+... + .... T Consensus 128 ---~~~~~~l~~-----------~~~~~~~~~~~~~~~~~~~~~~------~a~~v------~E~~~~~~~~--~-~~~~ 178 (385) T protein:vir:18 128 ---GLRRLTIRD-----------LLAQGRTSSNALEYVREEVFTN------NADVV------AEKALKPESD--I-TFSK 178 (385) T ss_pred ---hhhccchhh-----------hcceecccCcceEEEEEecCCc------ceeee------ccCccccccc--c-ceeE Confidence 000000000 0011111122221111111000 01111 2554433222 1 1112 Q ss_pred ceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCc Q lcl|Aclame:pro 158 NFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNV 237 (418) Q Consensus 158 N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv 237 (418) ....+++-...+.-|.+..+.. .+-..+-...-...+.+.+|.++|+|.- ++.. ..||+.... ... T Consensus 179 ~~~~~~k~~~~~~is~ell~d~--~~l~~~i~~~la~a~~~~~d~~~l~G~g----~~~~----~~Gi~~~~~----~~~ 244 (385) T protein:vir:18 179 QTANVKTIAHWVQASRQVMDDA--PMLQSYINNRLMYGLALKEEGQLLNGDG----TGDN----LEGLNKVAT----AYD 244 (385) T ss_pred EEEeeeeEEEeehhhHHHHhhH--HHHHHHHHHHHHHHHHHHHHHHHHhccC----CCCc----ccccccccc----ccc Confidence 2344444444444555555432 2334555556666788999999998842 2221 456654321 111 Q ss_pred cccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEEE Q lcl|Aclame:pro 238 NAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRLI 317 (418) Q Consensus 238 ~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~ 317 (418) .........+.++|.+++.++-..... ...+++++.....|.++....|++-+.......+ -+=+| +. T Consensus 245 ~~~~~~~~~~~d~i~~~~~~l~~~~~~-----~~~~~~~~~~~~~l~~lkd~~G~~l~~~~~~~~~------~~l~G-~p 312 (385) T protein:vir:18 245 TSLNATGDTRADIIAHAIYQVTESEFS-----ASGIVLNPRDWHNIALLKDNEGRYIFGGPQAFTS------NIMWG-LP 312 (385) T ss_pred ccccccccchHHHHHHHHHhhccccCC-----CCEEEEcHHHHHHHHHhhcCCCceeccCcccCCC------ceecc-ee Confidence 222233456778888888777543322 2257788888888888755556544322111100 11156 46 Q ss_pred EEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccc Q lcl|Aclame:pro 318 LKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQG 397 (418) Q Consensus 318 vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA 397 (418) |+.++ +||++++++.|+.....-+.. -+...+.....+ + .-..|........-+...+++|+| T Consensus 313 V~~~~-----~~p~~~~~~gd~~~~~~~~~~-~~~~v~~~~~~~----------~-~~~~~~~~~~~~~r~~~~v~~~~a 375 (385) T protein:vir:18 313 VVPTK-----AQAAGTFTVGGFDMASQVWDR-MDATVEVSREDR----------D-NFVKNMLTILCEERLALAHYRPTA 375 (385) T ss_pred eEEcC-----cCCCCcEEEeecccEEEEEEe-cceEEEEecccc----------c-hhhcCcEEEEEEEeeccEEecccc Confidence 66665 468899999998753222210 111111111111 0 000123333455678899999999 Q ss_pred eEEeecCccc Q lcl|Aclame:pro 398 CAVITGLQKA 407 (418) Q Consensus 398 ~a~I~gL~~~ 407 (418) ..+++-=.-+ T Consensus 376 ~~~~~~~aa~ 385 (385) T protein:vir:18 376 IIKGTFSSGS 385 (385) T ss_pred eEEEEeccCC Confidence 9998754333 No 44 >protein:vir:191 Length: 385 # NCBI annotation: major head subunit precursor # Family: family:all:585 # MgeID: mge:6 # MgeName: HK97 # Cross-refs: genbank:acc:NP_037701;genbank:gi:9634158;genbank:GeneID:1262530 Probab=92.88 E-value=0.0096 Score=31.64 Aligned_cols=322 Identities=9% Similarity=-0.027 Sum_probs=124.7 Q ss_pred CcceeeeeccCCC---hhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCce Q lcl|Aclame:pro 1 MSVYAGIFNTTLN---PQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADAT 77 (418) Q Consensus 1 ~~~~~~~~~~~~~---~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t 77 (418) ..-.+...+.... ..+...+++...+.....+.......-.-..++.........-++.... .. T Consensus 61 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g~~i~~~~~~~ii--------~~----- 127 (385) T protein:vir:19 61 EQKLASGAENPGEKKSFSERAAEELIKSWDGKQGTFGAKTFNKSLGSDADSAGSLIQPMQIPGII--------MP----- 127 (385) T ss_pred HHHhhccccccchhhhhHHHHHHHHHHHHHHhhccchhhHHHhhhccccccCCceecchhhhHHH--------HH----- Confidence 0000000000000 0000011111111111111111111000000000000000000111100 00 Q ss_pred EEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecc Q lcl|Aclame:pro 78 VLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVP 157 (418) Q Consensus 78 ~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~ 157 (418) +...+.+.. .+.+..+.+..++.-+-..... ...|. .||...+... + .... T Consensus 128 ---~~~~~~l~~-----------~~~~~~~~~~~~~~~~~~~~~~------~a~~v------~E~~~~~~~~--~-~~~~ 178 (385) T protein:vir:19 128 ---GLRRLTIRD-----------LLAQGRTSSNALEYVREEVFTN------NADVV------AEKALKPESD--I-TFSK 178 (385) T ss_pred ---hhhccchhh-----------hcceecccCcceEEEEEecCCc------ceeee------ccCccccccc--c-ceeE Confidence 000000000 0011111122221111111000 01111 2554433222 1 1112 Q ss_pred ceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCc Q lcl|Aclame:pro 158 NFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNV 237 (418) Q Consensus 158 N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv 237 (418) ....+++-...+.-|.+..+.. .+-..+-...-...+.+.+|.++|+|.- ++.. ..||+.... ... T Consensus 179 ~~~~~~k~~~~~~is~ell~d~--~~l~~~i~~~la~a~~~~~d~~~l~G~g----~~~~----~~Gi~~~~~----~~~ 244 (385) T protein:vir:19 179 QTANVKTIAHWVQASRQVMDDA--PMLQSYINNRLMYGLALKEEGQLLNGDG----TGDN----LEGLNKVAT----AYD 244 (385) T ss_pred EEEeeeeEEEeehhhHHHHhhH--HHHHHHHHHHHHHHHHHHHHHHHHhccC----CCCc----ccccccccc----ccc Confidence 2344444444444555555432 2334555556666788999999998842 2221 456654321 111 Q ss_pred cccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEEE Q lcl|Aclame:pro 238 NAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRLI 317 (418) Q Consensus 238 ~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~ 317 (418) .........+.++|.+++.++-..... ...+++++.....|.++....|++-+.......+ -+=+| +. T Consensus 245 ~~~~~~~~~~~d~i~~~~~~l~~~~~~-----~~~~~~~~~~~~~l~~lkd~~G~~l~~~~~~~~~------~~l~G-~p 312 (385) T protein:vir:19 245 TSLNATGDTRADIIAHAIYQVTESEFS-----ASGIVLNPRDWHNIALLKDNEGRYIFGGPQAFTS------NIMWG-LP 312 (385) T ss_pred ccccccccchHHHHHHHHHhhccccCC-----CCEEEEcHHHHHHHHHhhcCCCceeccCcccCCC------ceecc-ee Confidence 222233456778888888777543322 2257788888888888755556544322111100 11156 46 Q ss_pred EEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccc Q lcl|Aclame:pro 318 LKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQG 397 (418) Q Consensus 318 vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA 397 (418) |+.++ +||++++++.|+.....-+.. -+...+.....+ + .-..|........-+...+++|+| T Consensus 313 V~~~~-----~~p~~~~~~gd~~~~~~~~~~-~~~~v~~~~~~~----------~-~~~~~~~~~~~~~r~~~~v~~~~a 375 (385) T protein:vir:19 313 VVPTK-----AQAAGTFTVGGFDMASQVWDR-MDATVEVSREDR----------D-NFVKNMLTILCEERLALAHYRPTA 375 (385) T ss_pred eEEcC-----cCCCCcEEEeecccEEEEEEe-cceEEEEecccc----------c-hhhcCcEEEEEEEeeccEEecccc Confidence 66665 468899999998753222210 111111111111 0 000123333455678899999999 Q ss_pred eEEeecCccc Q lcl|Aclame:pro 398 CAVITGLQKA 407 (418) Q Consensus 398 ~a~I~gL~~~ 407 (418) ..+++-=.-+ T Consensus 376 ~~~~~~~aa~ 385 (385) T protein:vir:19 376 IIKGTFSSGS 385 (385) T ss_pred eEEEEeccCC Confidence 9998754333 No 45 >protein:vir:100851 Length: 514 # NCBI annotation: hypothetical protein # Family: family:all:2450 # MgeID: mge:1633 # MgeName: LP65 # Cross-refs: genbank:acc:YP_164744;genbank:gi:56693157;genbank:GeneID:3197484 Probab=92.55 E-value=0.011 Score=31.33 Aligned_cols=354 Identities=12% Similarity=0.098 Sum_probs=146.8 Q ss_pred eEeecCCcchhHHHhhhccccceeeeeeee-eeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCceEEEEE Q lcl|Aclame:pro 27 LRRVPNGSAPLLAMTSVVGSTTAKASTHGY-FSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLE 105 (418) Q Consensus 27 ~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~-~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vt 105 (418) |+--- +---++.-+-+||-+.+---|.+= .-+...+. ...+.+.+++-.. +.++..-+.-++.+.-++.|+.. T Consensus 1 ~~~~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~-~~~k~a~t~gy~~----~~~~~t~gaAlR~EsLd~~l~~L 74 (514) T protein:vir:10 1 MYTQD-KTKDIMKKSFFGGDRAVAFDTNKEDILNENLPE-NVKKSAFTAGHSI----TPDTQTDGAANRIESLNRDLKVT 74 (514) T ss_pred CCccc-hhhHHHhhhhcccceeeeecCcHHHHHHHhcch-hhhhhhhcccccc----CCccccCccchhhhhhccceeEe Confidence 21111 112223333344433221111100 00001111 1111111111111 22234444444444455555554 Q ss_pred EecCceeEEEc--cccccchhhhhCCceEEEee-----cccccccCCcCcccccceeccceeEEE------eeeeeechh Q lcl|Aclame:pro 106 LVNGLNLTVKR--QTGRISAAIIAANTKLIVIG-----TAFEEGSQRPTARSIQPVYVPNFTQIF------RNAWALTDT 172 (418) Q Consensus 106 av~g~~~tv~r--g~~~tta~~~~~gt~v~~~g-----~a~~EGada~~~~~~~~~~~~N~tQIf------~~~v~VSgT 172 (418) ....+.+|.-+ ..-...+..|..+.-. ..| ....|+..+... -.||.|+- ..+..||-- T Consensus 75 t~~~~~ftf~~~i~k~~a~STV~ey~~~~-~~G~~G~~~f~~E~gi~~~~-------d~~~~rk~~~~k~l~~~~~vS~~ 146 (514) T protein:vir:10 75 TWGERDFTLYNDIAKQPVDNTVLKYTQYY-SHGRTGHSLFQPEIGIGDVN-------NPNERQRTINIKYIVDTHVTSIA 146 (514) T ss_pred eecCcchhhhhhcCCchhhHHHhhhhhhc-ccCcccccccccccccCcCC-------CcceEEEEEeeeeeeeeeeeeeh Confidence 55444333221 2222334445555433 222 223565443322 22343332 223333433 Q ss_pred HHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHH Q lcl|Aclame:pro 173 ARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVV 252 (418) Q Consensus 173 a~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~ 252 (418) +.-++ +..+-++.|.+.++.-+...+|+++++|-+.......+..-.-+||...|. ..|+... .|..++++.|. T Consensus 147 ~~l~n--~i~d~~~~~~~dai~~ia~tiE~a~FyGDs~L~s~~~~~gleFDGl~~lI~---~~NvIDa-rG~~Ls~~~ln 220 (514) T protein:vir:10 147 LQRAN--TIVDSLKVQEYAAISTVIKTDEWAMFYGDADLTSGQKGEGLQFDGLFKLIA---PENHIDL-RGGRLSPAALN 220 (514) T ss_pred hhhcc--chhhHHHHHHHHHHHHHHHHHHHHHhhhcccCCCccccCcchhhhHHHhhc---CCCeEec-CCCCccHHHHh Confidence 33332 455778899999999999999999999987543222223366889887764 5677644 44589999888 Q ss_pred HHHHHHHHhcccCCCceeEEEEeChHHHHHHH-hhhhccceEEEcccce----eeceEEEEEEcCCeEEEEEECcccccc Q lcl|Aclame:pro 253 DATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQ-DIGRFFGEVTVTQRET----SYGMVFTEWKFFKGRLILKEHPLFSAI 327 (418) Q Consensus 253 d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~-~~~~~~~~~~~~~~~~----~~G~~v~~~~SdfG~v~vv~n~~l~~~ 327 (418) .+...+=. +.+++.-+|.+...+..|. .+ ..+.|+....+ ..|..+..|.|-.|.+++-.+-+++. T Consensus 221 ~aA~~i~~-----gfGt~TD~ylp~~vka~f~~~~---~~~qRV~~~~n~~~~~~G~~v~~f~s~~G~I~L~gs~im~~- 291 (514) T protein:vir:10 221 MAARKIGE-----GFGTPTDAYMPIGIKADFVNQH---LNGQRVMLPGQTGGMTTGLDIDKFLSAHGSIRIQGSTIMDS- 291 (514) T ss_pred hhhhhhhc-----ccCChhheeCchHHHHHHhhcc---cCcceEEeecCccceeeeeeccceeEeccceeecCCeeecc- Confidence 77644422 2333444666655555443 33 24455555444 66889999999999998666555432 Q ss_pred CCCCCeEEEEchhhceeeeccCC-CcccccccccCccccccccccccccC---ccccccEEEEEEEEEEecccceE---E Q lcl|Aclame:pro 328 GISPGFAVVVDVPAVKLAYMDGR-NAKVENYGQGGGENKSGATDYSYGHG---VDAQGGSLTSEWALELLNPQGCA---V 400 (418) Q Consensus 328 ~mp~d~~lv~D~~~~~~~~L~~r-~~~~e~laKtG~~~~~~~~~~~~~~g---~Da~k~~i~~E~tLev~N~kA~a---~ 400 (418) ...|=++.+..--++-..- .....+.+ .| .++..+ ....+| -+++.|. +=.|-..+.|-.+-- . T Consensus 292 ----~n~L~~~~~~~~~Ap~~~~va~svT~~~-~g-~~~~ad--~t~~~g~~~~~~~~g~-~~sYaVv~~n~~GeS~ps~ 362 (514) T protein:vir:10 292 ----DNKLDFDRPVSPTAPTAPQLSATVTPDG-GG-LWHEAD--KTDSKGEVILNKEVGV-EQSYVAVMVSRHGDSRPSL 362 (514) T ss_pred ----cccCccCCccCCcCCCCCcceEEEecCc-cc-ccCccc--ccccccccccccccce-eEEEEEEEECCCCcccccc Confidence 1111111111101111000 00001111 11 001000 000111 0111111 113444444433221 0 Q ss_pred eecCccccc--cc---------CCCCCCC Q lcl|Aclame:pro 401 ITGLQKAKE--RV---------YLTAPAP 418 (418) Q Consensus 401 I~gL~~~~~--~~---------~~~~~~~ 418 (418) |..-+.++. ++ +...|.- T Consensus 363 ~vtaT~a~~~~~i~ltItp~~~~~~~p~y 391 (514) T protein:vir:10 363 VQTATPTKKDDAITLTITPNAMQNVIPDY 391 (514) T ss_pred eeeeeeeccCceEEEEEEeccCcccccce Confidence 111111111 11 1111100 No 46 >protein:vir:80068 Length: 301 # NCBI annotation: gp8 # Family: family:all:463 # MgeID: mge:1876 # MgeName: B054 # Cross-refs: genbank:acc:YP_001468712;genbank:gi:157325292;genbank:GeneID:5601759 Probab=92.21 E-value=0.0031 Score=34.35 Aligned_cols=274 Identities=9% Similarity=0.009 Sum_probs=117.3 Q ss_pred EEccccc-cccCceeEeccCceEE--EEEEecCceeEEEccccccchhhhhCCceE--E----Eeeccc--cccc-CCcC Q lcl|Aclame:pro 80 TVENSDG-LTKGMIFYNEATGENM--RLELVNGLNLTVKRQTGRISAAIIAANTKL--I----VIGTAF--EEGS-QRPT 147 (418) Q Consensus 80 tV~~~~~-~~~~~~~~~~~~~E~~--~Vtav~g~~~tv~rg~~~tta~~~~~gt~v--~----~~g~a~--~EGa-da~~ 147 (418) -|.++++ |..... ..++.+++ +.....+..+--.++. ..++++. + ..|.+. ..++ |.|. T Consensus 1 ~~~~~~g~f~~~~l--~~id~~v~e~~~~~l~~r~l~~v~~~-------~~~~~~~~~~~~~~~~G~~~~~~~~~~dip~ 71 (301) T protein:vir:80 1 MQGKITATIEARDL--QAIDNVIYEPKQEELTARSVFPQKFD-------VNEGAESYSFDVMTRSGAAKIIANGADDLPL 71 (301) T ss_pred CCccccchhhHHHH--HHHHHHHHHhhhhhhhhhhhcccccC-------CCCceEEEEEeeeccceeEEEecCccccccc Confidence 2222221 222111 11222221 0111111111100011 1111111 0 011111 1111 1221 Q ss_pred cccccceeccceeEEEe--eeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHH Q lcl|Aclame:pro 148 ARSIQPVYVPNFTQIFR--NAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGI 225 (418) Q Consensus 148 ~~~~~~~~~~N~tQIf~--~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI 225 (418) .... ..+. +.+|++ ..+.++--.-+.....+.+.-....+.+...+.+.+....++|.+.. ..-|+ T Consensus 72 ~~~~-~~~~--~~~i~~~~~~~~~~~~El~~a~~~g~~l~~~k~~aa~~~~~~~~n~~~f~G~~~~---------g~~GL 139 (301) T protein:vir:80 72 VDVD-MVRK--SVPIYSIGIGLSYTIQDLRAARMQGTTVDAAKATTVRRAIAEKENSIAFRGEKKY---------AIKGA 139 (301) T ss_pred cccc-ceeE--EEEEEEEEeeeeecHHHHHHHHHhCCChHHHHHHHHHHHHHHhhceEEeeecccc---------cceee Confidence 1111 1111 334444 55555544444445566665566667777888888888888886532 12333 Q ss_pred HHHHhhcc-ccCccccCCC---Cccc----hHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcc Q lcl|Aclame:pro 226 VDAVRQYA-PDNVNAMPNP---TAVT----YDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQ 297 (418) Q Consensus 226 ~~~i~~~~-~~nv~~~~~~---a~~t----e~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~ 297 (418) +..=.-.. .+.....++. +.-| .++|..++.++|..++... .+..+++++.....|+.- ++. T Consensus 140 lN~p~~~~~~~~~~~~~~~~~w~~~t~~ei~~di~~~~~~l~~~s~g~~--~p~~L~L~p~~~~~L~~~-------~~~- 209 (301) T protein:vir:80 140 FEATGIQIDVSPTTGVGNVSKWEKKTAEQIIDEIGEAHTKITVLPGYGT--ASLKLCLPPKQFELINKK-------RYS- 209 (301) T ss_pred ecCCCcccccccCcccccccccccCCHHHHHHHHHHHHHHHHHhcCcee--cccEEEecHHHHHhhhhc-------ccc- Confidence 32100000 0000000000 1112 4567777778887543332 345688898888777641 000 Q ss_pred cceeeceEE-EEEEcCCeEEEEEECccccccCC-CCCeEEEE--chhhceeeeccCCCcccccccccCcccccccccccc Q lcl|Aclame:pro 298 RETSYGMVF-TEWKFFKGRLILKEHPLFSAIGI-SPGFAVVV--DVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSY 373 (418) Q Consensus 298 ~~~~~G~~v-~~~~SdfG~v~vv~n~~l~~~~m-p~d~~lv~--D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~ 373 (418) ...|..+ +.+...+.-+.|+.-|.|...+. ..+.++++ +++++++++= .++...+.-..+. T Consensus 210 --~~~~~tvl~~l~~~~~~~~I~~~p~L~~~g~~g~~~~v~~~~~~d~~~~~v~--~~~~~~~~e~~~~----------- 274 (301) T protein:vir:80 210 --NEDSRSVLKVLQDNAWFSAIVRVPDLAGMGTAGSDSFAVIHDSNETAELIIP--MDITRHPEEYSFP----------- 274 (301) T ss_pred --CCCCeeHHHHHHHHcCcceEEEcceeccCCCCcccEEEEEecCCcEEEEEec--CceeeecceecCc----------- Confidence 1123332 33434455577888888765432 23556666 4666665543 2222222111110 Q ss_pred ccCccccccEEEEE-EEEEEecccceEEeecC Q lcl|Aclame:pro 374 GHGVDAQGGSLTSE-WALELLNPQGCAVITGL 404 (418) Q Consensus 374 ~~g~Da~k~~i~~E-~tLev~N~kA~a~I~gL 404 (418) ..+ --.+.. .+++++-|.|.+.+.|+ T Consensus 275 ----~~~-~~~~~r~~Gv~i~~P~ai~~~~GI 301 (301) T protein:vir:80 275 ----RTK-VPFEERTAGVVVRFPAAIVRVDGI 301 (301) T ss_pred ----eeE-eeeeeeeEEEEEEccceEEEEecC Confidence 000 011223 37999999999999999 No 47 >protein:vir:6242 Length: 390 # NCBI annotation: gp36 # Family: family:all:21 # MgeID: mge:131 # MgeName: phi-BT1 # Cross-refs: genbank:acc:NP_813696;swissprot:trembl:q859c1;genbank:gi:29366756;interpro:IPR006444;uniprot:Q859C1;genbank:GeneID:1258897 Probab=90.42 E-value=0.021 Score=29.79 Aligned_cols=299 Identities=12% Similarity=0.102 Sum_probs=120.7 Q ss_pred Ccceeeeec--cCCChh---hhhhhhcc-cceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeec Q lcl|Aclame:pro 1 MSVYAGIFN--TTLNPQ---ELNMKSFA-GTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAA 74 (418) Q Consensus 1 ~~~~~~~~~--~~~~~~---~~~~~s~~-~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a 74 (418) ...-.+... ++.+.. .+ |+.. .+. + + .........+ +++ + T Consensus 72 ~~~~~~~~~~~~~~~~~~~~~~--r~~~~~~~----r--~-~~~~~~~~~~----t~~---------------------~ 117 (390) T protein:vir:62 72 SGLQGSGSGAQRSADVDDDATL--RAGNLGEA----R--S-FEFAPEKRDG----TKA---------------------G 117 (390) T ss_pred hhcccccccchhhcchHHHHHH--hhhhhhhh----H--H-HHhhhhhhcc----ccc---------------------C Confidence 111111111 122221 11 1110 000 0 0 0000000000 000 0 Q ss_pred CceEEEEccccccccCceeEeccC---------ceEEEEEEe-cCceeEEEccccccchhhhhCCceEEEeecccccccC Q lcl|Aclame:pro 75 DATVLTVENSDGLTKGMIFYNEAT---------GENMRLELV-NGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQ 144 (418) Q Consensus 75 ~~t~~tV~~~~~~~~~~~~~~~~~---------~E~~~Vtav-~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGad 144 (418) + .++.+..+....+. .-+..|... ++..+.+-+-.+... ..|. .||+. T Consensus 118 ~---------g~~~~~~~~~~~i~~~~~~~~~l~~~~~~~~~~~~~~~~~p~~~~~~~-------a~wv------~E~~~ 175 (390) T protein:vir:62 118 N---------PNVLSRTLYGQLIAQAVERSAIMRGGATTFTTSDANPLDFTVITGRSS-------ASIV------GETAE 175 (390) T ss_pred C---------CccccccchHHHHHHHHhhhhhhhhcceeeecCCCceeEEEEEcCCcc-------eeee------ccccc Confidence 0 01111111100000 001112222 223333332222111 1222 46665 Q ss_pred CcCcccccceeccceeEEEeee----eeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccch Q lcl|Aclame:pro 145 RPTARSIQPVYVPNFTQIFRNA----WALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLH 220 (418) Q Consensus 145 a~~~~~~~~~~~~N~tQIf~~~----v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r 220 (418) .+.... .+.||-... .-+.=|.+....... +..++-...-...+.+.+|.+||+|. + +| T Consensus 176 ~~~~~~-------~f~~i~~~~~k~~~~~~iS~ell~ds~~-~l~~~i~~~l~~~i~~~~d~~~l~G~------G-~p-- 238 (390) T protein:vir:62 176 IPESYP-------ATAQRSMGGFKYGFASVVSYEFATDQVL-DLVGFLVSDAGPAIGDAMGRHFITGT------G-QP-- 238 (390) T ss_pred cccccc-------ceeeeEeeeeeEEeehHHHHHHHhhhhH-HHHHHHHHHHHHHHHHHHHhhhhccC------C-cc-- Confidence 544221 122332222 223335555544322 33344444445677888999999874 1 22 Q ss_pred hhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce Q lcl|Aclame:pro 221 TTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET 300 (418) Q Consensus 221 ~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~ 300 (418) .||+..... ..+....+....++.++|.++...+-.. ...+ ..+++++.....|.++...++++-+.. +- T Consensus 239 --~Gi~~~~~~--~~~~~~~~~~~~~~~~~l~~~~~~l~~~--~~~~---a~~vmn~~~~~~L~~lkd~~g~~l~~~-~~ 308 (390) T protein:vir:62 239 --RGILTDASP--ATATFLATDTDSKVSDALIDLFHEVPSA--YRAN---AKYVVNDLRAAQMRKLKDANGQYLWQS-GL 308 (390) T ss_pred --ccccccccc--cccceecccccccchHHHHHHHHhhhhh--hhcC---CEEEEchHHHHHHHHhhccCCCeeecC-Cc Confidence 255543211 1112222333467888888877665321 1112 246788888888988855556554322 21 Q ss_pred eeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccc Q lcl|Aclame:pro 301 SYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQ 380 (418) Q Consensus 301 ~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~ 380 (418) ..|. ..+=+|. .|+.++ .||++.+++-|++++.+..- .++..+.+....+ ..|.. T Consensus 309 ~~g~----~~~l~G~-Pv~~~~-----~~p~~~i~~gd~s~~~i~~~--~~~~v~~~~~~~~-------------~~~~~ 363 (390) T protein:vir:62 309 TVGA----PSLFNGK-VVETDD-----GMPADKILFADLSKYRVRFA--GSLRVDRSVDAKF-------------STDQI 363 (390) T ss_pred CCCc----cceeccc-ceEEec-----CCCCccEEEeeccceeEEee--cceEEEeeccccc-------------cCCcE Confidence 1111 0111232 334443 46888888899876433222 1222211111110 00223 Q ss_pred ccEEEEEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 381 GGSLTSEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 381 k~~i~~E~tLev~N~kA~a~I~gL~~~~ 408 (418) ....+.=+...+.+|+|..+++ ++.|. T Consensus 364 ~~~~~~r~d~~~~~~~A~~~l~-~~~~a 390 (390) T protein:vir:62 364 VYRFLQRADGLLVDARGAKVLT-VTPGA 390 (390) T ss_pred EEEEEEEeCcEeechhheEEEE-eecCC Confidence 2233444788999999988887 55554 No 48 >protein:vir:81070 Length: 390 # NCBI annotation: p09 # Family: family:all:585 # MgeID: mge:1889 # MgeName: Xop411 # Cross-refs: genbank:acc:YP_001285679;genbank:gi:148727187;genbank:GeneID:5247115 Probab=90.25 E-value=0.022 Score=29.69 Aligned_cols=316 Identities=12% Similarity=0.057 Sum_probs=122.6 Q ss_pred Cc-ceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhc---cccceeee-eeeeeeeecccceeEEEEEeecC Q lcl|Aclame:pro 1 MS-VYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVV---GSTTAKAS-THGYFSKTMVFASAVVTAEAAAD 75 (418) Q Consensus 1 ~~-~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~---~~~~~~~~-~~~~~~~~~~~~~~t~~a~~~a~ 75 (418) -. .-...........+. .+.+.......-......+.....-. .+...... .-+|....+...... T Consensus 70 ~~~~~~~~~~~~~~~~~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g~~~~~~~~~~ii~~~~~~-------- 140 (390) T protein:vir:81 70 GGDVQHVSVGDMFVASEQ-FQASAGRWNDRSARATMNIKAALNTASTDAAGSAGALTTPNRLPGFITPPDAR-------- 140 (390) T ss_pred ccccccccchhhhhhhHH-HHHHHHHHhhhhhhhhhHHHHHHHhhccccccCCcceechhhhHHHHHHHhhh-------- Confidence 00 000000000000000 00000000000000000111110000 00000000 001111111000000 Q ss_pred ceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCccccccee Q lcl|Aclame:pro 76 ATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVY 155 (418) Q Consensus 76 ~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~ 155 (418) ..+.. .+.+..+.+..++..+-...+. ...|. .||...+..... . T Consensus 141 ---------~~l~~-----------~~~~~~~~~~~~~~~~~~~~~~------~a~~v------~Eg~~~~~~~~~---~ 185 (390) T protein:vir:81 141 ---------LTVRD-----------LIGSGRTDSALIEYVQETGFVN------NAAIV------AEGALKPESSLK---F 185 (390) T ss_pred ---------hhhhh-----------hcceeeccCCceEEEEEecCCc------ceeee------cCCcccccccce---e Confidence 00000 0011111222222211111100 01111 255544432211 1 Q ss_pred ccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhcccc Q lcl|Aclame:pro 156 VPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPD 235 (418) Q Consensus 156 ~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~ 235 (418) -.-...+++-...+.-|.++..... +-..+-...-...+.+.+|.+||+|.. .+.. ..||+.... . T Consensus 186 ~~i~~~~~k~~~~~~is~ell~d~~--~~~~~i~~~l~~~~~~~~d~a~l~G~g----~~~~----~~Gi~~~~~----~ 251 (390) T protein:vir:81 186 AKKTDTTHVIAHTMKATRQILSDAP--QLASYMNNRLIRGLKVKEDAEILRGTG----ANDG----LLGLIPQAT----T 251 (390) T ss_pred eEEEEeeeEEEEeehhhHHHHHhHH--HHHHHHHHHHHHHHHHHHHHHHHhcCC----CCCc----ccceeeccc----c Confidence 1122333333333444445555432 445556666677789999999998842 2222 346653211 1 Q ss_pred CccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeE Q lcl|Aclame:pro 236 NVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGR 315 (418) Q Consensus 236 nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~ 315 (418) .......+...+.+++.+++.++...+... ..+++++.....|.++-...|++.+.......+ -+=+|. T Consensus 252 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~-----~~~v~~~~~~~~l~~lkd~~G~~l~~~~~~~~~------~~l~G~ 320 (390) T protein:vir:81 252 YAAPTTIAGATRVDQLRLAMLQASLAEYNP-----SGIVINPIDWAAIELAKDANNQYLIGNARGTLT------PTLWGL 320 (390) T ss_pred cccccccccchhHHHHHHHHHhhccccCCC-----CEEEEcHHHHHHHHHhhcCCCceeecCcccccC------ceecce Confidence 111222334556777888877776543222 246778888888888755555554432111110 012453 Q ss_pred EEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecc Q lcl|Aclame:pro 316 LILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNP 395 (418) Q Consensus 316 v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~ 395 (418) .|+.++ +||++++++.|++..-.-+.+ -+...+..... ..-..|....+.+.-+...+++| T Consensus 321 -pv~~~~-----~~p~~~~~~gd~~~~~~~~~~-~~~~v~~~~~~------------~~~~~~~v~~r~~~r~d~~v~~~ 381 (390) T protein:vir:81 321 -PVVATQ-----AMAPGEFLVGAFDLAAQIFDQ-WDARVEIGYVG------------EDFQRNMITVLAEERLALVVYRP 381 (390) T ss_pred -eeEEcC-----CCCCCcEEEEehhceEEEEEe-cceEEEEeccc------------chhhcCcEEEEEEEeeccEEecc Confidence 455553 478899999999864222220 12211111000 00001444556788899999999 Q ss_pred cceEEeecC Q lcl|Aclame:pro 396 QGCAVITGL 404 (418) Q Consensus 396 kA~a~I~gL 404 (418) +|+.+|+== T Consensus 382 ~a~v~~t~a 390 (390) T protein:vir:81 382 EALISGSFA 390 (390) T ss_pred cceEEEEeC Confidence 999887632 No 49 >protein:vir:103285 Length: 296 # NCBI annotation: hypothetical protein # Family: family:all:463 # MgeID: mge:1605 # MgeName: JK06 # Cross-refs: genbank:acc:YP_277465;genbank:gi:71834107;genbank:GeneID:3562396 Probab=89.56 E-value=0.014 Score=30.81 Aligned_cols=282 Identities=12% Similarity=0.034 Sum_probs=118.3 Q ss_pred EEEEeecCceEEEEccccccccCceeEeccCceEE--EEEEecCceeEEEccccccchhhhhCCceEEEeecccc--c-c Q lcl|Aclame:pro 68 VTAEAAADATVLTVENSDGLTKGMIFYNEATGENM--RLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFE--E-G 142 (418) Q Consensus 68 ~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~--~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~--E-G 142 (418) ++.....++.. |....+= .++..++ +...+.+-++--.++..+..+....- ...+..|.++. . + T Consensus 1 ~~~~~a~~~~~--------f~~~ql~--~id~~v~e~~~~~l~~~~~i~v~~~~~~~~~~~~~-~~~~~~G~a~~~~~~~ 69 (296) T protein:vir:10 1 MGVDKADAAGI--------WTVKQLT--ASLNKAYETEYDQNSVVNLFPVSNEIPGYAKYFEY-PVFDGVGIAQIVADYT 69 (296) T ss_pred CcccchhhhHH--------HHHHHHH--HHHHHHHhhhhcccccceecccccCCCCceeEEEe-eeeeccCceeEeCCCc Confidence 22111111111 2211110 1111111 00111111111111111111100000 00111122221 1 1 Q ss_pred cCCcCcccccceeccceeEEEeeeeeechhHHHH--hhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccch Q lcl|Aclame:pro 143 SQRPTARSIQPVYVPNFTQIFRNAWALTDTARAS--YAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLH 220 (418) Q Consensus 143 ada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av--~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r 220 (418) .|.|..... ..+. ..+|++-...++.+-+=+ ....+.+.-+...+-+...+.+.+....++|.+.. T Consensus 70 ~dip~v~~~-~~~~--~~~i~~~~~~~~~~~~El~~a~~~g~~l~~~ka~aA~~~~~~~~n~~~f~G~~~~--------- 137 (296) T protein:vir:10 70 DDLPLVDAL-ATER--QGKVFRFGNAFLISIDEIKVGQATGQSLSTRKQSLAFEAHDKLLDKLVWSGSTAH--------- 137 (296) T ss_pred cccceeecc-ceeE--EEEEEEEEeeeeecHHHHHHHHHhCCChHHHHHHHHHHHHHHhhceEEEeecccc--------- Confidence 122211111 1111 335565555555444422 33344443333444455777888888888886522 Q ss_pred hhHHHHHHHhhccccCccccCC--CCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc Q lcl|Aclame:pro 221 TTQGIVDAVRQYAPDNVNAMPN--PTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR 298 (418) Q Consensus 221 ~t~GI~~~i~~~~~~nv~~~~~--~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~ 298 (418) .+-|++.. ..-....+.++ ..+--.+|+..++..+|...... ..+..+..++.+...|+.... T Consensus 138 g~~GLlN~---p~v~~~~~~~~W~~~t~i~~Di~~~~~~l~~~s~g~--~~p~~l~L~p~~~~~L~~~~~---------- 202 (296) T protein:vir:10 138 GIPSVFDY---PNINNVVSGGSWSQPTTAVSDITSLLDIIETSTNGQ--HRATHLLLPTTARRIMQNLVP---------- 202 (296) T ss_pred cceeEeec---CCCccccccCCccCHHHHHHHHHHHHHHHHHhhCce--ecceeEEeCHHHHHHHhhccC---------- Confidence 12233311 00000111000 01123667777788888754332 234567778888887765311 Q ss_pred ceeeceE-EEEEEcCCeEEEEEECccccccCC-CCCeEEEEc--hhhceeeeccCCCcccccccccCccccccccccccc Q lcl|Aclame:pro 299 ETSYGMV-FTEWKFFKGRLILKEHPLFSAIGI-SPGFAVVVD--VPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYG 374 (418) Q Consensus 299 ~~~~G~~-v~~~~SdfG~v~vv~n~~l~~~~m-p~d~~lv~D--~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~ 374 (418) ..|.. .+.+...|.-+.|+.-|.|...+- ..+.+++++ ++++.+++= .++...+.-+.+ . T Consensus 203 --~~~~t~l~~ik~~~~~l~i~~~~~l~~a~~~g~~~~v~~~~~~~~~~~~v~--~~~~~~~~e~~~-----l------- 266 (296) T protein:vir:10 203 --GTSVSYGEFFRQNNSGVTVEFVQYLNDYNGTGTSAAIAYEKDPNNMAIEIP--EATNALPAQPKD-----L------- 266 (296) T ss_pred --CCCccHHHHHHHhcCCceEEEeeeeccCCCCcceEEEEEEcCCceEEEEcC--cceeeecccccC-----c------- Confidence 11222 234555555666777777754322 335677766 777776642 233333322111 0 Q ss_pred cCccccccEEEEEE-EEEEecccceEEeecCccc Q lcl|Aclame:pro 375 HGVDAQGGSLTSEW-ALELLNPQGCAVITGLQKA 407 (418) Q Consensus 375 ~g~Da~k~~i~~E~-tLev~N~kA~a~I~gL~~~ 407 (418) +..-.++.-+ +++++.|.|.+.+.|++=| T Consensus 267 ----~~~~~~~~~~~Gv~i~~P~ai~~~dGI~~~ 296 (296) T protein:vir:10 267 ----HFKIPVTSKATGLIVYRPLTMAVMKGITFA 296 (296) T ss_pred ----eEEEeeEeeEEEEEEECCceeEEEeeeecC Confidence 1111223334 5999999999999999999 No 50 >protein:vir:81227 Length: 413 # NCBI annotation: gp6, major capsid protein # Family: family:all:585 # MgeID: mge:1893 # MgeName: BFK20 # Cross-refs: genbank:acc:YP_001456736;genbank:gi:157168379;hssp:P49861;interpro:IPR006444;uniprot:Q9MBJ9;genbank:GeneID:5580350 Probab=88.84 E-value=0.03 Score=28.94 Aligned_cols=326 Identities=10% Similarity=0.019 Sum_probs=113.2 Q ss_pred CcceeeeeccCCChh--h---hhhhhcccceeEeecCCcchhHHHhhhccccceeeeee-eeee-eecccceeEEEEEee Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQ--E---LNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTH-GYFS-KTMVFASAVVTAEAA 73 (418) Q Consensus 1 ~~~~~~~~~~~~~~~--~---~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~-~~~~-~~~~~~~~t~~a~~~ 73 (418) ..-..-.+.+...-. + ........... .....-.+.+....++........+ ..++ +-+.. T Consensus 74 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~--~~~~~~~~~~~~~~~~~~~~~~~~vp~~~~~~ii~~---------- 141 (413) T protein:vir:81 74 YKSIGEFFAKRAGDQIKQQAGGAQLNYSVGEY--VAPRVKAASDPASTATLTDEFQGGYGTTWNRNIIYR---------- 141 (413) T ss_pred hhhhhhhhhhhhhhHHHHHHHHHHhhhhhhhh--hhhHHHhhhhhhhhcccccccccccchhhHHHHHHH---------- Confidence 000000000000000 0 00000000000 0000000111111111000000000 0000 00000 Q ss_pred cCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccc Q lcl|Aclame:pro 74 ADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQP 153 (418) Q Consensus 74 a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~ 153 (418) ......+ ...+.+..+.+..++.-+-....+ ...+..|. .||...+.... T Consensus 142 -------------~~~~~~l-----~~~~~~~~~~~~~~~~~~~~~~~~---~~~~a~~v------~Eg~~~~~~~~--- 191 (413) T protein:vir:81 142 -------------RREKLVV-----ADLMDNLTMTNTTIKYLMEKANRV---VEGGFKTV------AEGGKKPYMRF--- 191 (413) T ss_pred -------------HhhhhhH-----HhhcceeeccCCceeEEEeccccc---ccccccee------cCcccccccCc--- Confidence 0000000 011112222222222111111100 00111222 35544432221 Q ss_pred eeccceeEE----EeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHH Q lcl|Aclame:pro 154 VYVPNFTQI----FRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAV 229 (418) Q Consensus 154 ~~~~N~tQI----f~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i 229 (418) ..+.|| ++-...+.-|.+..+... ....|-..+-...+.+-+|++||+|.- .+.+ -.||+... T Consensus 192 ---~~f~~i~~~~~k~~~~~~iS~ell~ds~--~l~~~i~~~la~~~~~~~d~~~l~G~G----~~~~----~~Gi~~~~ 258 (413) T protein:vir:81 192 ---ADFDIVTESLSKIAGLTKITDEMIEDYD--FLVSYINARLLEELAIEEERQLLLGDG----TGNN----LTGLLKRD 258 (413) T ss_pred ---ccceeeEeeeeeEEEeehhhHHHHHHHH--HHHHHHHHHHHHHHHHHHHHHHhccCC----CCCc----cccccccc Confidence 112222 222222223333443322 233444445566789999999998742 2222 34554321 Q ss_pred hhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccccee-eceE-EE Q lcl|Aclame:pro 230 RQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETS-YGMV-FT 307 (418) Q Consensus 230 ~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~-~G~~-v~ 307 (418) . ... ....++....+++.+++..+-...+.. ...+++++.....|.++-..+|++.+...... .|.- .. T Consensus 259 ~----~~~-~~~~~~~~~~~~i~~~~~~~~~~~~~~----~~~~vmn~~~~~~l~~lkd~~G~~l~~~~~~~~~~~~~~~ 329 (413) T protein:vir:81 259 G----IQT-LAVSNKDELADSIYKAMTNISLATPFQ----ADALVINPLDYQELRLAKDANGQYYGGGVFQGQYGSGGIM 329 (413) T ss_pred c----ccc-ccccccchhHHHHHHHHHHhhhhccCC----CcEEEEcHHHHHHHHHhhccCCceeccccccccccccccc Confidence 1 111 111112233444445544443322211 11256777777788887655666544322111 1100 00 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC-CcccccccccCccccccccccccccCccccccEEEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR-NAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTS 386 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r-~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~ 386 (418) .-.+=+|. .|+.+ .+||++++++.|++...+-+. | ++..+.....+ +. -..|....+... T Consensus 330 ~~~~l~G~-pv~~s-----~~~~~~~~~~gd~~~~~~~~~--~~~~~v~~~~~~~----------~~-~~~~~~~~r~~~ 390 (413) T protein:vir:81 330 LDPAPWGL-RTVQS-----QVVPVGKPVVGAFRSAASVLR--KGGVRIDSTNTNV----------DD-FENNLITVRAEE 390 (413) T ss_pred cCceecce-eeEEc-----CCCCcccEEEEecccEEEEEE--ecceEEEEecccc----------ch-hhcCcEEEEEEE Confidence 00122343 45555 357889999999986422222 2 22222211111 00 001344555667 Q ss_pred EEEEEEecccceEEeecCcccccccCCCCC Q lcl|Aclame:pro 387 EWALELLNPQGCAVITGLQKAKERVYLTAP 416 (418) Q Consensus 387 E~tLev~N~kA~a~I~gL~~~~~~~~~~~~ 416 (418) .+.+.+.++.|+.+++- +++ ++| T Consensus 391 r~d~~~~~~~a~~~l~~-~~~------~~p 413 (413) T protein:vir:81 391 RVGLMVTFPEAIVQLDV-AEV------VTP 413 (413) T ss_pred eeccEEecccceEEEEe-cCC------CCC Confidence 88999999999999863 222 222 No 51 >protein:vir:96123 Length: 274 # NCBI annotation: ORF013 # Family: family:all:522 # MgeID: mge:1602 # MgeName: 37 # Cross-refs: genbank:acc:YP_240078;genbank:gi:66395742;genbank:GeneID:5133103 Probab=88.05 E-value=0.035 Score=28.58 Aligned_cols=254 Identities=15% Similarity=0.079 Sum_probs=122.6 Q ss_pred EccccccccCcee----EeccCc---eEEEEEEe----------cCceeEEEccccccchhhhhCCceEEEeecc--ccc Q lcl|Aclame:pro 81 VENSDGLTKGMIF----YNEATG---ENMRLELV----------NGLNLTVKRQTGRISAAIIAANTKLIVIGTA--FEE 141 (418) Q Consensus 81 V~~~~~~~~~~~~----~~~~~~---E~~~Vtav----------~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a--~~E 141 (418) -++...-....|+ ..-+.+ ..++...+ .|+++++-+ ++ .+|.+ ..| T Consensus 1 ma~~~T~~~d~i~Pev~s~~v~~~~~~~~~~~~~~~~~~~l~g~~G~tv~ip~--~~-------------~~g~~~~~~~ 65 (274) T protein:vir:96 1 MAQGTTKVSNLIVPEVLAPMMQAELDKKLRFAQFADIDSTLVGQPGDTLTFPA--FT-------------YSGDAQVIAE 65 (274) T ss_pred CCccccchhhhhhhHHHHHHHHHHHHhhhhhcccccccccccCCCCCEEEEEe--ec-------------cCCCccccCC Confidence 3322211111111 000000 00111111 123333211 00 01111 134 Q ss_pred ccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchh Q lcl|Aclame:pro 142 GSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHT 221 (418) Q Consensus 142 Gada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~ 221 (418) |.+.+...-......--..|+ .+.|++++-+.+. ...|.+..-..+....+.+.+++.++.--+. ++ T Consensus 66 g~~i~~~~it~~~~~~~i~~~-~~~~~i~D~~~~~---~~~d~~~~~~~~~~~~~a~~~d~~i~~~l~~-----a~---- 132 (274) T protein:vir:96 66 GEKIPVDQIGTSKREAKVRKI-GKGTELTDEAVLS---GFGDPQGEAVRQHGLAIANKVDNDVLEALKG-----AT---- 132 (274) T ss_pred CCcCchhhcccceeEEEEEee-eceeeecHHHHHh---hcchHHHHHHHHHHHHHHHHHHHHHHHHHhc-----CC---- Confidence 444332222222211133443 4667777766544 3445667767777778888998887732210 00 Q ss_pred hHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc-ce Q lcl|Aclame:pro 222 TQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR-ET 300 (418) Q Consensus 222 t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~-~~ 300 (418) ....+.+++.+.+.++.+++= .. ....++++|++.+...|-+.. ..++... +. T Consensus 133 -----------------~~~~~~~~~~d~i~dA~~~l~----d~-~~~~~~ivv~p~~~~~L~k~~----~~~f~~~~~~ 186 (274) T protein:vir:96 133 -----------------LTVEADITKLDGLQTAIDKFN----DE-DLEPMVLFVNPLDAGGLRTSA----SDNFTRPTQL 186 (274) T ss_pred -----------------CCcCcccccHHHHHHHHHHhc----cc-CCCceEEEeCHHHHHHHHhcc----cccccccccc Confidence 011223567888888887753 22 236789999999888776532 1121111 11 Q ss_pred eeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccc Q lcl|Aclame:pro 301 SYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQ 380 (418) Q Consensus 301 ~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~ 380 (418) ..+....-....|-=+.|+.++ ++|.++.+++.+..+.+. .+++...|..+..- ++.|.. T Consensus 187 g~~~~~~g~ig~~~G~~Vi~s~-----~~p~~t~~l~~~gA~~~~--~~~~~~vE~~Rd~~-------------~~~d~i 246 (274) T protein:vir:96 187 GDNIIVKGAFGEALGAVIVRSN-----KLNKGEALLAKKGAVKLI--TKRDFFLEKDRDAS-------------RKSTAL 246 (274) T ss_pred cccceeecccceecCeeEEEcC-----CCCcceEEEEeCcceeee--ecCCcccccccchh-------------hcccEE Confidence 1122222112222224677764 468899999999887654 34665555443221 223544 Q ss_pred ccEEEEEEEEEEecccceEEeecCcccccccC Q lcl|Aclame:pro 381 GGSLTSEWALELLNPQGCAVITGLQKAKERVY 412 (418) Q Consensus 381 k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~ 412 (418) .+..+ |+..+.||.+..+++- -+.++|- T Consensus 247 ~~~~~--yg~~~~~~~~vv~~t~--~~~~~~~ 274 (274) T protein:vir:96 247 YSDKH--YVAYLYDESKVVKITK--GAGDEVM 274 (274) T ss_pred EEeeE--EEEEEEcCccEEEEEc--CcccccC Confidence 44444 8999999998888763 3333443 No 52 >protein:vir:4197 Length: 314 # NCBI annotation: putative structural protein # Family: family:all:1377 # ACLAME annotation(s): phi:0000161 - phage head/capsid # MgeID: mge:88 # MgeName: psiM100 # Cross-refs: genbank:acc:NP_071822;genbank:gi:11863105;genbank:GeneID:1257607 Probab=85.26 E-value=0.054 Score=27.53 Aligned_cols=299 Identities=9% Similarity=0.023 Sum_probs=116.6 Q ss_pred cccceeEEEEEeecCceEEEEcccc-ccccCceeEec---cCceE--E-EEEEec---CceeEEEc-cccccchhhhhCC Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSD-GLTKGMIFYNE---ATGEN--M-RLELVN---GLNLTVKR-QTGRISAAIIAAN 129 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~-~~~~~~~~~~~---~~~E~--~-~Vtav~---g~~~tv~r-g~~~tta~~~~~g 129 (418) |+.-.--. .....|++.+.. ++..+.-+..- +.++. + +++-|+ ..+..+.+ +.+.+. T Consensus 1 ~~~~~~~~-----~~~k~it~~d~~gG~L~P~~~~~~i~~l~e~s~i~~~a~vi~t~~s~~~~i~~i~~g~~~------- 68 (314) T protein:vir:41 1 MDFLNKPF-----QITPKIDVPDLGKGILAVQRFGEFVREVRENSAIIKDARVLNALKSYEVDISRISLGVEL------- 68 (314) T ss_pred CchhhhHH-----HhhcccccccCCCceeChHHHHHHHHHHHhccchhhheeeecccCccceeecccccCccc------- Confidence 33322211 112235555443 33333322100 11111 1 011111 11111111 111111 Q ss_pred ceEEEeeccccc-ccCCcCcccccc-eeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcC Q lcl|Aclame:pro 130 TKLIVIGTAFEE-GSQRPTARSIQP-VYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFG 207 (418) Q Consensus 130 t~v~~~g~a~~E-Gada~~~~~~~~-~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G 207 (418) .....| |.+....+..+. ..+.=.|.-..--+.||.-.--=+. .+.+.-.+-..+-.+.+.+|+|.+|++| T Consensus 69 ------~~~~~~~~~~~~~~~~~~tf~~~~l~~~kl~~~v~is~e~L~D~a-~~~~le~~i~~~~Ae~~g~~~~~~~~nG 141 (314) T protein:vir:41 69 ------EPGRNTSGTKVAPTADEVTVSTNTLEMKELVTKVVLEDEALEDNI-EQSAFEQTITSLLASGVTYDLECFFLHA 141 (314) T ss_pred ------ccccccccCCccCCcccccccceeeeeEEEEEeecccHHHHHhhh-chhhHHHHHHHHHHHHHHHHHHHHhhcc Confidence 111112 211111111111 0011012222233455543322122 2234334555566778999999999999 Q ss_pred cccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhh Q lcl|Aclame:pro 208 QAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIG 287 (418) Q Consensus 208 ~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~ 287 (418) ..... ++.+-..+-.||+..+.. .-+...+++...+.+.|.+++..+-.. .-.++.+.+ ++++.....++.++- T Consensus 142 dg~~~-s~~~~~~~p~G~l~~a~~---~~~~~~~~~~~~~~~~~~~l~~sl~~~-yr~~~~~~~-~~m~~~t~~~~r~~l 215 (314) T protein:vir:41 142 DSSLT-TGRELYRINDGWMKLAGN---QYTDAEPEDENWPLNLFDGMMDELDTR-YLQLKPRMK-FYVSNEIYNGYRKQL 215 (314) T ss_pred ccCCc-Ccccchhcchhhhhhccc---ceeecCccccccHHHHHHHHHHhcCch-hhcCCCceE-EEecHHHHHHHHHHH Confidence 75322 122223456787643321 112233344456777777777655221 111233334 456766666666642 Q ss_pred hccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCcccccc Q lcl|Aclame:pro 288 RFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSG 367 (418) Q Consensus 288 ~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~ 367 (418) ...+.. .-+.. ..+- .-.+-+| +.|+..+.|+..++|++.+++-|+.++-+.. .++...++-+... ..+.. T Consensus 216 ~~~~~~-l~~~~-~~~~---~~~~l~G-~PV~~~~~~~~~~~~~~~i~fgd~~nlv~~~--~~~ir~~~~~~a~-~~~~~ 286 (314) T protein:vir:41 216 LVRETG-LGDSA-LIGA---TGLQYDG-IPIQYVPALDALGDDKARALLTVPTNLVYGF--WRNIRIEPKRDAA-MRRTE 286 (314) T ss_pred hccCCc-ccchh-hhCC---CCceecc-eeeEecccccccCCCCceEEEechhheEEEe--eceeEEeecccCc-CCeEE Confidence 211110 00000 0011 1111223 4677778888889999999999999985533 3555543322211 00111 Q ss_pred ccccccccCccccccEEEEE--EEEEEecccceE Q lcl|Aclame:pro 368 ATDYSYGHGVDAQGGSLTSE--WALELLNPQGCA 399 (418) Q Consensus 368 ~~~~~~~~g~Da~k~~i~~E--~tLev~N~kA~a 399 (418) ++-. +-.|. ++..| ..+.+-|+.+.| T Consensus 287 ~~~~---~r~d~---~~~~~~aa~~~~~~~~~~~ 314 (314) T protein:vir:41 287 YIAS---LRADC---NYEDENAAVAAVIDMSSGG 314 (314) T ss_pred EEEE---EEece---EEEEcCcEEEEEeeccCCC Confidence 1000 00000 11111 223333333333 No 53 >protein:vir:97053 Length: 390 # NCBI annotation: putative head protein # Family: family:all:585 # MgeID: mge:1653 # MgeName: OP1 # Cross-refs: genbank:acc:YP_453565;genbank:gi:84662600;genbank:GeneID:5142468 Probab=84.82 E-value=0.057 Score=27.38 Aligned_cols=317 Identities=10% Similarity=0.012 Sum_probs=117.9 Q ss_pred CcceeeeeccCC--ChhhhhhhhcccceeEeecCCcchhHHHhhhccccceee---ee-eeeeeeecccceeEEEEEeec Q lcl|Aclame:pro 1 MSVYAGIFNTTL--NPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKA---ST-HGYFSKTMVFASAVVTAEAAA 74 (418) Q Consensus 1 ~~~~~~~~~~~~--~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~---~~-~~~~~~~~~~~~~t~~a~~~a 74 (418) -.-...-....+ ....-..+.+.......-......+..+..-+.+....+ .. -.+..+-........ .+-. T Consensus 68 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g~lip~~~~~~ii~~~~~~~--~i~~ 145 (390) T protein:vir:97 68 GAGGDVQHVSVGDMFVASEQFQASTGRWNDRSARATMNIKAALNTASTDAAGSAGALTTPNRLPGFITPPDARL--TVRD 145 (390) T ss_pred ccccccccccchhhhhhhHHHHHHHHHhhhhhhhhhhHHHHHHHhhhcccccccccccchhhhHHHHHHHhhhh--hhHh Confidence 000000000000 000000011111111111111111111111110000000 00 011111110000000 0000 Q ss_pred CceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccce Q lcl|Aclame:pro 75 DATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPV 154 (418) Q Consensus 75 ~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~ 154 (418) -.+.+++ .+.+++.-+-...+ . ...|. .||...+..... -. T Consensus 146 ~~~~~~~--------------------------~~~~~~~~~~~~~~-~-----~a~~v------~Eg~~~~~~~~~-~~ 186 (390) T protein:vir:97 146 LIGSGRT--------------------------DSALIEYVQETGFV-N-----NAAIV------AEGALKPESSLK-FA 186 (390) T ss_pred hcceeec--------------------------cCCceEEEEEecCC-c-----ceeee------cCCccccccccc-ee Confidence 0011111 11111111100000 0 01111 255544433211 11 Q ss_pred eccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccc Q lcl|Aclame:pro 155 YVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAP 234 (418) Q Consensus 155 ~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~ 234 (418) . --..+++-..-+.-|.+.++.. .+..++-..+-...+.+.+|.+||+|. +++.. -.||+... . T Consensus 187 ~--i~~~~~k~~~~~~is~ell~ds--~~l~~~i~~~la~a~~~~~d~a~l~G~----g~~~~----p~Gi~~~~----~ 250 (390) T protein:vir:97 187 K--KTDTTHVIAHTMKATRQILSDA--PQLASYMNNRLIRGLKVKEDAEILRGT----GANDG----LLGLIPQA----T 250 (390) T ss_pred E--EEEeeeeEEEeehhhHHHHHhH--HHHHHHHHHHHHHHHHHHHHHHHhhcC----CCCcc----ccceeecc----c Confidence 1 1222333333344444555432 234455555667778999999999873 23322 23665321 1 Q ss_pred cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCe Q lcl|Aclame:pro 235 DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKG 314 (418) Q Consensus 235 ~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG 314 (418) ........++....+++.++..++-..+.. ...+++++.....|.++....|++.+.......+- +=+| T Consensus 251 ~~~~~~~~~~~~~~d~~~~~~~~~~~~~~~-----~~~~v~n~~~~~~L~~lkd~~G~~l~~~~~~~~~~------~l~G 319 (390) T protein:vir:97 251 TYAAPTTIAGATRVDQLRLAMLQASLAEYP-----ASGIVINPIDWAAIELAKDANNQYLIGNARGTLTP------TLWG 319 (390) T ss_pred cccccccccccchHHHHHHHHHhhccccCC-----CCEEEEcHHHHHHHHHhhcCCCceeecCccCCCCc------eecc Confidence 111122223345566666666555432222 22466788888888887655666544321111110 1134 Q ss_pred EEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEec Q lcl|Aclame:pro 315 RLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLN 394 (418) Q Consensus 315 ~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N 394 (418) . .|+.++ .||++++++.|++..-+-+. .-+...+...... .-..|....+...-+.+.+++ T Consensus 320 ~-pV~~~~-----~~~~~~~~~gd~~~~~~~~~-~~~~~i~~~~~~~------------~f~~~~~~~r~~~r~d~~v~~ 380 (390) T protein:vir:97 320 L-PVVATQ-----AMAPGEFLVGAFDLAAQIFD-QWDARVEIGYVND------------DFQRNMVTVLAEERLALVVYR 380 (390) T ss_pred e-eeEEcC-----CCCCCcEEEEeccceEEEEE-ecceEEEEeeccc------------ccccCcEEEEEEEeeccEEec Confidence 3 555554 46889999999975322121 0111111110000 001144455667788999999 Q ss_pred ccceEEeecCc Q lcl|Aclame:pro 395 PQGCAVITGLQ 405 (418) Q Consensus 395 ~kA~a~I~gL~ 405 (418) |+|+.+|+ |. T Consensus 381 ~~a~v~~~-~a 390 (390) T protein:vir:97 381 PEALITGS-FA 390 (390) T ss_pred cccEEEEE-eC Confidence 99997775 33 No 54 >protein:vir:10364 Length: 390 # NCBI annotation: head protein; major capsid subunit precursor # Family: family:all:585 # MgeID: mge:183 # MgeName: Xp10 # Cross-refs: genbank:acc:NP_858956;genbank:gi:32128421;genbank:GeneID:2648357 Probab=83.98 E-value=0.064 Score=27.13 Aligned_cols=318 Identities=11% Similarity=0.017 Sum_probs=125.2 Q ss_pred Ccceeeeecc----CCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCc Q lcl|Aclame:pro 1 MSVYAGIFNT----TLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADA 76 (418) Q Consensus 1 ~~~~~~~~~~----~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~ 76 (418) +.=.+..... ...+.+..+++.--. -+...-..++ .....++. .. .....+. .+ T Consensus 61 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~----------~~~~~~~~~~----~~~~~~~~--~~--~~~~~~~-~~--- 118 (390) T protein:vir:10 61 VAELEGNGAGGDVQHVSVGDLFVASEQFQ----------ASAGRWNDRS----ARATMNIK--AA--LNTASTD-AA--- 118 (390) T ss_pred HHHHHhhcccccccccchhhhhhhhHHHH----------HHHHhhhhhh----hhhhhHHH--HH--HHhhhcc-cc--- Confidence 1111111110 111111111110000 0000000000 00000000 00 0000000 00 Q ss_pred eEEEEccccccccCcee----EeccC----ceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCc Q lcl|Aclame:pro 77 TVLTVENSDGLTKGMIF----YNEAT----GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTA 148 (418) Q Consensus 77 t~~tV~~~~~~~~~~~~----~~~~~----~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~ 148 (418) .++.++.+..++ ..... ...+.+..+.+..++.-+....+.. ..|. .||...+.. T Consensus 119 -----~~~g~~~~~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~------a~~v------~Eg~~~~~~ 181 (390) T protein:vir:10 119 -----GSAGALTTPNRLPGFITQPDARLTVRDLIGSGRTDSALIEYVQETGFVNN------AAIV------AEGALKPES 181 (390) T ss_pred -----cccccccchhHHHHHHHHHHhhchhhhhcceeeccCCceEEEEEecCCcc------eeee------cCCcccccc Confidence 111112222111 10000 1122333444444444433322211 1121 366554432 Q ss_pred ccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHH Q lcl|Aclame:pro 149 RSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDA 228 (418) Q Consensus 149 ~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~ 228 (418) ... -.. -...+++-...+.-|.+..+.. .+-..+-..+-...+.+.+|.++|+|.- ++.. -.||+.. T Consensus 182 ~~~-~~~--i~~~~~k~~~~~~is~ell~d~--~~l~~~i~~~l~~~~~~~~~~~il~G~G----~~~~----p~Gi~~~ 248 (390) T protein:vir:10 182 SLK-FAK--KTDTTHVIAHTMKATRQILSDA--PQLASYMNNRLIRGLKVKEDAEILRGTG----ANDG----LLGLIPQ 248 (390) T ss_pred ccc-eeE--EEEeeEEEEEeehhhHHHHHhH--HHHHHHHHHHHHHHHHHHHHHHHhhcCC----CCcc----ccccccc Confidence 211 111 1222223233333344444432 2334455555556789999999998842 2322 2366533 Q ss_pred HhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEE Q lcl|Aclame:pro 229 VRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTE 308 (418) Q Consensus 229 i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~ 308 (418) .. .... ..........+++.+++.++-...... ..+++++.....|.++....|++.+...-...+ T Consensus 249 ~~---~~~~-~~~~~~~~~~~~~~~~~~~l~~~~~~~-----~~~v~n~~~~~~L~~lkd~~g~~l~~~~~~~~~----- 314 (390) T protein:vir:10 249 AT---TYAA-PTTIAGATRVDQLRLAMLQASLAEYPA-----SGIVINPIDWAAIELAKDANNQYLIGNARGTLT----- 314 (390) T ss_pred cc---cccc-cccccccchHHHHHHHHHhhccccCCC-----CEEEEcHHHHHHHHHhhcCCCceeecCCcCcCC----- Confidence 21 1111 122223445667777776665433221 236678887888888755555554432111100 Q ss_pred EEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEE Q lcl|Aclame:pro 309 WKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEW 388 (418) Q Consensus 309 ~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~ 388 (418) -+=+|. .|+.++ +||++++++.|++..-.-+.. -+...+...... .-..|....+....+ T Consensus 315 -~~l~G~-pv~~~~-----~~p~~~~~~gdf~~~~~~~~~-~~~~i~~~~~~~------------~~~~~~~~~r~~~r~ 374 (390) T protein:vir:10 315 -PTLWGL-PVVATQ-----AMAPGEFLVGAFDLAAQIFDQ-WDARVEIGYVND------------DFQRNMVTVLAEERL 374 (390) T ss_pred -ceecce-eeEEcC-----CCCCCcEEEEeccceEEEEEe-cceEEEEeeccc------------ccccCcEEEEEEEee Confidence 012453 555554 478899999999753211210 111111111000 001155556677889 Q ss_pred EEEEecccceEEeecCc Q lcl|Aclame:pro 389 ALELLNPQGCAVITGLQ 405 (418) Q Consensus 389 tLev~N~kA~a~I~gL~ 405 (418) ...+++|+|+.+|+= . T Consensus 375 d~~v~~~~a~~~~~~-a 390 (390) T protein:vir:10 375 ALVVYRPEALISGSF-A 390 (390) T ss_pred ccEEeccccEEEEEe-C Confidence 999999999977652 2 No 55 >protein:vir:108211 Length: 318 # NCBI annotation: gp9 # Family: family:all:6420 # MgeID: mge:2004 # MgeName: Giles # Cross-refs: genbank:acc:YP_001552338;genbank:gi:160700658;genbank:GeneID:5758931 Probab=82.45 E-value=0.077 Score=26.70 Aligned_cols=292 Identities=11% Similarity=0.061 Sum_probs=121.2 Q ss_pred cccceeEEEEEeecCceEEEEccccccccCceeEecc----Cc----e--EEEEEEecCceeEEEccccccchhhhhCCc Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEA----TG----E--NMRLELVNGLNLTVKRQTGRISAAIIAANT 130 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~----~~----E--~~~Vtav~g~~~tv~rg~~~tta~~~~~gt 130 (418) |......+++ ..+ -+|||.+- +..+.++...+ .. + ..++.+-++....-.++... ..+++ T Consensus 1 ~~~~~~i~s~-~~~--~~itv~~l--l~~P~~I~~~i~e~~~~~~iad~lf~~~~a~~~~~v~f~~~~p~-----~~~~d 70 (318) T protein:vir:10 1 MTAPTGIVSV-SDG--PAITVREL--VGNPLWIPTALKKMMVNQFISESLFRNGGANPNGVVAYNEGNPS-----FLEDD 70 (318) T ss_pred CCCCCcceee-ecC--CceehHHh--hCCchhHHHHHHHHHhccchhhhhhhcccccccceeEEEecccc-----cccCc Confidence 3333222222 222 36676631 12122221111 00 1 11232322222111111111 11111 Q ss_pred eEEEeecccccccCCcCccccc-ceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcC-- Q lcl|Aclame:pro 131 KLIVIGTAFEEGSQRPTARSIQ-PVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFG-- 207 (418) Q Consensus 131 ~v~~~g~a~~EGada~~~~~~~-~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G-- 207 (418) . ....||...|...... ..++- +.+ +-...+.=|.++. .++.++.+..+..+...-|.|..+...+.- T Consensus 71 ~-----e~VaEggEiP~~~~~~G~~~ia-~~~--K~G~~~~vS~Em~-~~n~~~~v~r~~~~l~Nti~r~~d~~a~dal~ 141 (318) T protein:vir:10 71 V-----ADVAEFGEIPVSAGARGLPRTA-FAV--KKALGVRVSKEMI-DENRVGAVNDQMLQLRNTFIRANDRSAKALLQ 141 (318) T ss_pred H-----hhccCcccccccCCCCCchhhh-hhe--hhccceeccHHHH-hhcChhHHHHHHHHHHHHHHHHHHHHHHHHHh Confidence 1 2234666655433222 22221 122 3333334444444 346667888888888888888888776531 Q ss_pred ---cccccCcCCcc--chhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhc----ccCCCceeEEEEeChH Q lcl|Aclame:pro 208 ---QAFMGTYNGQP--LHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWS----VNVGDNTQRVMFCDTV 278 (418) Q Consensus 208 ---~k~~~~s~~~~--~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g----~~~~g~~~~~i~v~a~ 278 (418) +...+.|.+-. -....|++.++. .+....-.+.... ...-|..+..|+.++. T Consensus 142 sa~t~~~~~s~~w~~~~~~~~d~~~A~e-------------------~v~~a~~~~~~a~~~~~~~~~GY~pdtIVlhP~ 202 (318) T protein:vir:10 142 SPIVPTLAVPTAWDNGGKVRTDIAIAIE-------------------QISTAAPTAYPAGVGSSDEYFGFIPDTIVMHYA 202 (318) T ss_pred ccccccccCCcCCCCcccccccchhhhh-------------------hhhhhhhhhhhhhhhhhhhccCccceeeEECHH Confidence 11111111100 000012211111 1111111111000 0112445567889988 Q ss_pred HHHHHHhhhhccceEEEcccceeeceEEEE--EEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCccccc Q lcl|Aclame:pro 279 GMRTMQDIGRFFGEVTVTQRETSYGMVFTE--WKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVEN 356 (418) Q Consensus 279 ~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~--~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~ 356 (418) ....|.+-....+-+.-.......+...+. .-+.+| ++++.+|++ |.|+++++|-..+-. +-+.|+...++ T Consensus 203 ~~~~l~~n~~~~~~y~~~a~~~~~~~~~tg~~~g~~lG-l~vi~s~~~-----p~~~alvlq~g~vG~-~~d~~pl~~t~ 275 (318) T protein:vir:10 203 LLPILMDNENFMKVYERNANYVSTAPDWTGNFPGSVMG-LNVIRSRTF-----PIDRVLIMERGTVGF-YSDTRPLQFTA 275 (318) T ss_pred HHHHHhcchhhhhhhhccchhhhhcccccccccceeec-eEEeecCcc-----CCCeeEEEecCCcce-eeccccceeee Confidence 877774321111111111111111111111 113356 899999886 679999999776641 11334444444 Q ss_pred ccccCccccccccccccccCccccccE--EEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 357 YGQGGGENKSGATDYSYGHGVDAQGGS--LTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 357 laKtG~~~~~~~~~~~~~~g~Da~k~~--i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) |.--|+ + ..|+..+.+. +.-=-++-|..|||..+|+||.+- T Consensus 276 ~~~egg-------~---~~g~~~~s~~~~~~~~~~~~V~~PkA~~~itgi~~~ 318 (318) T protein:vir:10 276 LYPEGN-------G---PNGGPTESYRADASHKRALAVDQPKAALWLTGIVTP 318 (318) T ss_pred cccCCC-------C---CCCCcchhhheehheeeeeeeeCcceeEEEeeccCC Confidence 443221 0 1112222222 222235678999999999999775 No 56 >protein:vir:9820 Length: 272 # NCBI annotation: putative major capsid/head protein # Family: family:all:522 # MgeID: mge:176 # MgeName: 315.4 # Cross-refs: genbank:acc:NP_795582;genbank:gi:28876339;genbank:GeneID:1257858 Probab=81.52 E-value=0.085 Score=26.46 Aligned_cols=265 Identities=15% Similarity=0.106 Sum_probs=120.3 Q ss_pred cccceeEEEEEeecCceEEEEccc---cccccCceeEe--ccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEe Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENS---DGLTKGMIFYN--EATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVI 135 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~---~~~~~~~~~~~--~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~ 135 (418) |..+.+++...+.- +|-+. ..+....++.. .++. ......|+++++-+-.....+. + T Consensus 1 MA~~~T~~~~~~iP-----ev~s~~v~~~~~~~~~~~~~~~~~~---~~~g~~G~tv~iP~~~~~~~a~-------~--- 62 (272) T protein:vir:98 1 MAVGTTKMAQMLDP-----EVLADMIDAEVGKAIRFAPLAEVDT---TLEGQPGTTLTVPKWDYIGDAE-------D--- 62 (272) T ss_pred CCCccccchheech-----HHHHHHHHHHHHHHhhhhccccccc---cccCCCCCEEEEEEecCCCCcc-------c--- Confidence 33322221111000 00000 00000000000 0000 0122345666554321111111 1 Q ss_pred ecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcC Q lcl|Aclame:pro 136 GTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYN 215 (418) Q Consensus 136 g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~ 215 (418) ..||.+.+..........-...+ +...+++|.-... . ...|-+++-..+....+.+.+|..++..-+. T Consensus 63 ---v~eg~~i~~~~~~~~~~~~~~~~-~~~~~~itd~~~~--~-s~~d~~~~~~~~~~~~~a~~~d~~i~~~~~~----- 130 (272) T protein:vir:98 63 ---VAEGEAIPMTQLGFKKTTMTIKK-AGKGVEITDEAIL--S-GYGDPVGQAAKQIVEAIDHKVDADVLDALSK----- 130 (272) T ss_pred ---ccCCCcccccccccceEEEEeee-eeeeeeecHHHHh--h-ccccHHHHHHHHHHHHHHHHHHHHHHHHhcc----- Confidence 23565544333222221112333 2345666654432 2 3446667777777788899999988742211 Q ss_pred CccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEE Q lcl|Aclame:pro 216 GQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTV 295 (418) Q Consensus 216 ~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~ 295 (418) + ++. .++..+.+.+.|+...+ .. .+...+++++++.....|.+.... +. T Consensus 131 a------------------~~~----~~~~~t~d~i~da~~~l-~~----~~~~~~~~vv~p~~~~~L~k~~~~----~~ 179 (272) T protein:vir:98 131 S------------------TQT----VEATATVDGVSKALDIF-ND----EDDAETVIVMNPADASTLRLDAAK----EW 179 (272) T ss_pred c------------------ccc----cccccCHHHHHHHHHHH-hc----cCCCccEEEEcHHHHHHHHHhccc----cc Confidence 0 001 12345678888876654 22 133456899999988777653210 10 Q ss_pred c-ccceeeceEEEE-EEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCcccccccccccc Q lcl|Aclame:pro 296 T-QRETSYGMVFTE-WKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSY 373 (418) Q Consensus 296 ~-~~~~~~G~~v~~-~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~ 373 (418) . ..+...+...+- +-+-.| +.|+.++. ||.++++++++..+.+.. .++...|..+... T Consensus 180 ~~~~~~~~~~~~~g~ig~i~G-~~Vi~s~~-----~p~~t~~~~~~~a~~~~~--~~~~~ve~~r~~~------------ 239 (272) T protein:vir:98 180 LGATEVGANRVVSGVYGEVLG-VQIVRSRK-----CPKGTAYMVRKGALRIML--KRNTMVETDRDIT------------ 239 (272) T ss_pred cccccccccccccccchhhcC-eeEEEcCC-----CCcceEEEEcCCeEEEEe--cCCceeeeccccc------------ Confidence 0 001111111111 112234 47777754 688999999999776544 3555555443321 Q ss_pred ccCccccccEEEEEEEEEEecccceEEeecCcccccc Q lcl|Aclame:pro 374 GHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKER 410 (418) Q Consensus 374 ~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~ 410 (418) ++.|... ...=|++.+.||.+..+++ ++.|+.. T Consensus 240 -~~~~~i~--~~~~~~~~v~~~~~vv~~t-~~~a~~~ 272 (272) T protein:vir:98 240 -KAINQIV--ANKHYGVYLYKAEKAVKIT-LKDAAKK 272 (272) T ss_pred -cceeEEE--EEEEEEEEEEcCCceEEEE-ecccccC Confidence 1223332 2233688999999888874 4444333 No 57 >protein:vir:3033 Length: 272 # NCBI annotation: major capsid protein # Family: family:all:522 # MgeID: mge:61 # MgeName: PhiNIH1.1 # Cross-refs: genbank:acc:NP_438146;genbank:gi:16271809;genbank:GeneID:929235 Probab=81.52 E-value=0.085 Score=26.46 Aligned_cols=265 Identities=15% Similarity=0.106 Sum_probs=120.3 Q ss_pred cccceeEEEEEeecCceEEEEccc---cccccCceeEe--ccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEe Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENS---DGLTKGMIFYN--EATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVI 135 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~---~~~~~~~~~~~--~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~ 135 (418) |..+.+++...+.- +|-+. ..+....++.. .++. ......|+++++-+-.....+. + T Consensus 1 MA~~~T~~~~~~iP-----ev~s~~v~~~~~~~~~~~~~~~~~~---~~~g~~G~tv~iP~~~~~~~a~-------~--- 62 (272) T protein:vir:30 1 MAVGTTKMAQMLDP-----EVLADMIDAEVGKAIRFAPLAEVDT---TLEGQPGTTLTVPKWDYIGDAE-------D--- 62 (272) T ss_pred CCCccccchheech-----HHHHHHHHHHHHHHhhhhccccccc---cccCCCCCEEEEEEecCCCCcc-------c--- Confidence 33322221111000 00000 00000000000 0000 0122345666554321111111 1 Q ss_pred ecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcC Q lcl|Aclame:pro 136 GTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYN 215 (418) Q Consensus 136 g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~ 215 (418) ..||.+.+..........-...+ +...+++|.-... . ...|-+++-..+....+.+.+|..++..-+. T Consensus 63 ---v~eg~~i~~~~~~~~~~~~~~~~-~~~~~~itd~~~~--~-s~~d~~~~~~~~~~~~~a~~~d~~i~~~~~~----- 130 (272) T protein:vir:30 63 ---VAEGEAIPMTQLGFKKTTMTIKK-AGKGVEITDEAIL--S-GYGDPVGQAAKQIVEAIDHKVDADVLDALSK----- 130 (272) T ss_pred ---ccCCCcccccccccceEEEEeee-eeeeeeecHHHHh--h-ccccHHHHHHHHHHHHHHHHHHHHHHHHhcc----- Confidence 23565544333222221112333 2345666654432 2 3446667777777788899999988742211 Q ss_pred CccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEE Q lcl|Aclame:pro 216 GQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTV 295 (418) Q Consensus 216 ~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~ 295 (418) + ++. .++..+.+.+.|+...+ .. .+...+++++++.....|.+.... +. T Consensus 131 a------------------~~~----~~~~~t~d~i~da~~~l-~~----~~~~~~~~vv~p~~~~~L~k~~~~----~~ 179 (272) T protein:vir:30 131 S------------------TQT----VEATATVDGVSKALDIF-ND----EDDAETVIVMNPADASTLRLDAAK----EW 179 (272) T ss_pred c------------------ccc----cccccCHHHHHHHHHHH-hc----cCCCccEEEEcHHHHHHHHHhccc----cc Confidence 0 001 12345678888876654 22 133456899999988777653210 10 Q ss_pred c-ccceeeceEEEE-EEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCcccccccccccc Q lcl|Aclame:pro 296 T-QRETSYGMVFTE-WKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSY 373 (418) Q Consensus 296 ~-~~~~~~G~~v~~-~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~ 373 (418) . ..+...+...+- +-+-.| +.|+.++. ||.++++++++..+.+.. .++...|..+... T Consensus 180 ~~~~~~~~~~~~~g~ig~i~G-~~Vi~s~~-----~p~~t~~~~~~~a~~~~~--~~~~~ve~~r~~~------------ 239 (272) T protein:vir:30 180 LGATEVGANRVVSGVYGEVLG-VQIVRSRK-----CPKGTAYMVRKGALRIML--KRNTMVETDRDIT------------ 239 (272) T ss_pred cccccccccccccccchhhcC-eeEEEcCC-----CCcceEEEEcCCeEEEEe--cCCceeeeccccc------------ Confidence 0 001111111111 112234 47777754 688999999999776544 3555555443321 Q ss_pred ccCccccccEEEEEEEEEEecccceEEeecCcccccc Q lcl|Aclame:pro 374 GHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKER 410 (418) Q Consensus 374 ~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~ 410 (418) ++.|... ...=|++.+.||.+..+++ ++.|+.. T Consensus 240 -~~~~~i~--~~~~~~~~v~~~~~vv~~t-~~~a~~~ 272 (272) T protein:vir:30 240 -KAINQIV--ANKHYGVYLYKAEKAVKIT-LKDAAKK 272 (272) T ss_pred -cceeEEE--EEEEEEEEEEcCCceEEEE-ecccccC Confidence 1223332 2233688999999888874 4444333 No 58 >protein:vir:8102 Length: 543 # NCBI annotation: gp6 # Family: family:all:21 # MgeID: mge:152 # MgeName: Che9c # Cross-refs: genbank:acc:NP_817683;genbank:gi:29566114;genbank:GeneID:1259308 Probab=81.04 E-value=0.089 Score=26.34 Aligned_cols=309 Identities=11% Similarity=0.017 Sum_probs=114.6 Q ss_pred Ccce--------------eeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeeccccee Q lcl|Aclame:pro 1 MSVY--------------AGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASA 66 (418) Q Consensus 1 ~~~~--------------~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~ 66 (418) +... .........+.+ .+.+. .....+ ++.+.-+++--....... T Consensus 212 ~~~~~~~~~~~~a~~~~~~~~~~~~l~~~e--~~~~~---------------~~~~~~----~t~~~gg~lip~~~~~~i 270 (543) T protein:vir:81 212 QCLATSSPAYLRAWSKMARNPHAAILTEEE--KRAIN---------------EVRAMG----LTKADGGYLVPFQLDPTV 270 (543) T ss_pred hhhhhhhhhhhhHHHHHHHhhHHHHhhhhh--hhhhh---------------hhhhcc----cccccCcccCchhhhhHH Confidence 0000 000000011110 01100 000000 000111111000000000 Q ss_pred EEEEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCc Q lcl|Aclame:pro 67 VVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRP 146 (418) Q Consensus 67 t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~ 146 (418) .... +.....+.. +..|.-..|+.. +-+...+..+ .|. .||+..+ T Consensus 271 i~~~----------~~~~~~l~~-----------~~~~~~~~g~~~-~~~~~~~~~a-------~~v------~Eg~~~~ 315 (543) T protein:vir:81 271 IITS----------NGSLNDIRR-----------FARQVVATGDVW-HGVSSAAVQW-------SWD------AEFEEVS 315 (543) T ss_pred HHHH----------Hhhhchhhh-----------hcccccCCcceE-EEEecCCcce-------eec------ccCcccc Confidence 0000 000000000 000111112111 1111111000 111 2555444 Q ss_pred CcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHH Q lcl|Aclame:pro 147 TARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIV 226 (418) Q Consensus 147 ~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~ 226 (418) ..... .-.-..-..+-..-+.-|.+..+.. .+-.++-...-...+.+.++.+||+|. |++.+ --||+ T Consensus 316 ~~~~~---~~~i~~~~~k~~~~~~is~ell~d~--~~~~~~i~~~l~~~~~~~~d~ail~G~----Gt~~~----p~Gi~ 382 (543) T protein:vir:81 316 DDSPE---FGQPEIPVKKAQGFVPISIEALQDE--ANVTETVALLFAEGKDELEAVTLTTGT----GQGNQ----PTGIV 382 (543) T ss_pred ccccc---cceeeeeeeeeEeeehhhHHHHhcc--HHHHHHHHHHHHHHHHHHHHHHHhccC----CCCcc----cccch Confidence 32211 1111122222233334444555432 355566666667778999999999884 22222 34555 Q ss_pred HHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEE Q lcl|Aclame:pro 227 DAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVF 306 (418) Q Consensus 227 ~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v 306 (418) ..... ........+...++.+++.++...+=. . +... ..+++++.....|.++...+|++.+..... |.. T Consensus 383 ~~~~~--~~~~~~~~~~~~~~~~~~~~~~~~l~~-~-~~~~---~~~v~n~~~~~~l~~lkd~~G~~l~~~~~~--g~~- 452 (543) T protein:vir:81 383 TALAG--TAAEIAPVTAETFALADVYAVYEQLAA-R-HRRQ---GAWLANNLIYNKIRQFDTQGGAGLWTTIGN--GEP- 452 (543) T ss_pred hhccc--ccccccccccccccHHHHHHHHHhhhc-c-ccCC---cEEEEcHHHHHHHHHhhcCCCceeccCcCC--CCC- Confidence 43211 111122234456788888888765521 1 1111 246788888888888755556655432111 100 Q ss_pred EEEEcCCeEEEEEECcccccc---CCCCC--eEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccc- Q lcl|Aclame:pro 307 TEWKFFKGRLILKEHPLFSAI---GISPG--FAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQ- 380 (418) Q Consensus 307 ~~~~SdfG~v~vv~n~~l~~~---~mp~d--~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~- 380 (418) .+=+|. .|+..+.++.- ...++ .+++.|++++.+..- .++..+...... .+-|.. T Consensus 453 ---~~l~G~-pv~~~~~~~~~~~~~~~~~~~~i~~gd~~~~~i~~~--~~~~i~~~~~~~-------------~~~~~~~ 513 (543) T protein:vir:81 453 ---SQLLGR-PVGEAEAMDANWNTSASADNFVLLYGNFQNYVIADR--IGMTVEFIPHLF-------------GTNRRPN 513 (543) T ss_pred ---ccccce-eeEEeccccccccccccCCcceEEEeeccceeEEee--cccEEEEecccc-------------ccchhhc Confidence 122452 44444333210 01111 255667766544322 122111111111 011222 Q ss_pred ---ccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 381 ---GGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 381 ---k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) ......-+.+.+.|++|+.+++-=..| T Consensus 514 ~~~~~~~~~r~d~~v~~~~A~~~l~~~~~a 543 (543) T protein:vir:81 514 GSRGWFAYYRMGADVVNPNAFRLLNVETAS 543 (543) T ss_pred CceEEEEEEeeccEeecccceEEEEecccC Confidence 334445589999999998777654444 No 59 >protein:vir:63741 Length: 468 # NCBI annotation: Cps # Family: family:all:2450 # MgeID: mge:1517 # MgeName: P100 # Cross-refs: genbank:gi:82547622;genbank:GeneID:3783474 Probab=80.76 E-value=0.041 Score=28.16 Aligned_cols=328 Identities=14% Similarity=0.128 Sum_probs=132.6 Q ss_pred ChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEE-----eecCceEEEEcccccc Q lcl|Aclame:pro 13 NPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAE-----AAADATVLTVENSDGL 87 (418) Q Consensus 13 ~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~-----~~a~~t~~tV~~~~~~ 87 (418) -| .-|||+. +||+..--... ...||.+-+| ...++.-+-.++ +...-+.|+..+.+ | T Consensus 1 ~~-~~~~~~~------~~~~~~~~~~e-------~~~Ks~~agy---~~~p~~q~~~~AlR~EsL~~~i~~L~~~~~~-f 62 (468) T protein:vir:63 1 MP-KNNKEEE------VKEVNLNSVQE-------DALKSFTTGY---GITPDTQTDAGALRREFLDDQISMLTWTEND-L 62 (468) T ss_pred CC-CCcchhh------ccccChhHHHH-------HHHHHHHcCc---ccCCccccCcchhhhhhhhhhhheeeecccc-h Confidence 11 2234422 23431111100 0011111111 000000000000 11111122222211 1 Q ss_pred ccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEee-----cccccccCCcCcccccceeccceeEE Q lcl|Aclame:pro 88 TKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIG-----TAFEEGSQRPTARSIQPVYVPNFTQI 162 (418) Q Consensus 88 ~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g-----~a~~EGada~~~~~~~~~~~~N~tQI 162 (418) .+++.+.... ..+..+..+..+ ..| ....|+..+......-+.+. =..-- T Consensus 63 ----~~~~di~k~~-------------------a~stv~~y~~~~-~~G~~g~~~f~~E~g~~~~~~~~~~r~~-~~~k~ 117 (468) T protein:vir:63 63 ----TFYKDIAKKP-------------------ATSTVAKYDVYM-QHGKVGHTRFTREIGVAPVSDPNIRQKT-VNMKF 117 (468) T ss_pred ----hhhhhcccch-------------------hhhhhhhheeee-ccCccccccccccccccccCCCceEEEE-EEeee Confidence 1111111110 112222222222 111 12356654432221111111 12223 Q ss_pred EeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCccccc-CcCCccchhhHHHHHHHhhccccCccccC Q lcl|Aclame:pro 163 FRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMG-TYNGQPLHTTQGIVDAVRQYAPDNVNAMP 241 (418) Q Consensus 163 f~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~-~s~~~~~r~t~GI~~~i~~~~~~nv~~~~ 241 (418) +..+..||.-+.-++. ..|-++.|.++++.-+...+|++++.|-+... ..+++.--+-+||+..+ ...|+... T Consensus 118 l~~~~~vs~~~~l~n~--i~d~~~~~~~~ai~~~a~tiE~a~FyGds~l~~s~~~~~glqfDGi~~li---~~enviDa- 191 (468) T protein:vir:63 118 ASDTKNISIAAGLVNN--IQDPMQILTDDAIVNIAKTIEWASFFGDSDLSDSPEPQAGLEFDGLAKLI---NQDNVHDA- 191 (468) T ss_pred eeeeeeehhhhhhhcc--hhhHHHHHHHHHHHHHHHHHHHHhhhcccccccCCCccccccccceeEEe---cCCceecc- Confidence 3344444555544433 44668999999999999999999999987553 22333334567776444 23466443 Q ss_pred CCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHH-HhhhhccceEEEcccc---eeeceEEEEEEcCCeEEE Q lcl|Aclame:pro 242 NPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTM-QDIGRFFGEVTVTQRE---TSYGMVFTEWKFFKGRLI 317 (418) Q Consensus 242 ~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i-~~~~~~~~~~~~~~~~---~~~G~~v~~~~SdfG~v~ 317 (418) .|..+++++|..+...+=+ +.++..-+|.+...+-.| +.... -+.++.... ...|..|..|.|..|.+. T Consensus 192 ~G~~ls~~~lneaa~~i~~-----gfG~~td~~~~~~v~a~~~~~~L~--~q~~v~~~n~~~~~~G~~v~g~~sa~G~I~ 264 (468) T protein:vir:63 192 RGASLTESLLNQAAVMISK-----GYGTPTDAYMPVGVQADFVNQQLS--KQTQLVRDNGNNVSVGFNIQGFHSARGFIK 264 (468) T ss_pred CCCccCHHHHHHHhhhccc-----cccChhhhhcchhHHhhhhhhhcC--ceEEEEcCCCCceeeeecccceecceeeee Confidence 3456899988888743322 233333466666666455 66533 444554322 355888999999999998 Q ss_pred EEECccccccCCCCCeEEEEchhhce--eeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecc Q lcl|Aclame:pro 318 LKEHPLFSAIGISPGFAVVVDVPAVK--LAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNP 395 (418) Q Consensus 318 vv~n~~l~~~~mp~d~~lv~D~~~~~--~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~ 395 (418) +..+-+|+..+++ ||+... .++-..--.......+.|.. . +.|.- .=+|-..+.|. T Consensus 265 l~gs~il~~~~~l-------~~~~~~~~~Apsp~~vsaT~~~~~~g~~-~----------~~~~a----~y~Y~v~~vs~ 322 (468) T protein:vir:63 265 LHGSTVMENEQIL-------DERILALPTAPQPAKVTATQEAGKKGQF-R----------AEDLA----AHEYKVVVSSD 322 (468) T ss_pred ecCceeeccccCC-------CcccccccccccCCccceeeecccCCcc-c----------CCCcc----eEEEEEEEECC Confidence 8777666554433 333322 11111000001111111100 0 00000 02233334343 Q ss_pred cceEEeecCccc--------------ccccCCCCCC----------C Q lcl|Aclame:pro 396 QGCAVITGLQKA--------------KERVYLTAPA----------P 418 (418) Q Consensus 396 kA~a~I~gL~~~--------------~~~~~~~~~~----------~ 418 (418) .+-.+....-++ -+.+|...|- . T Consensus 323 ~GES~pS~~vtvTVaa~~dg~~ltIt~~~~~~~~p~yv~IYR~~~gg 369 (468) T protein:vir:63 323 DAESIASEVATATVTAKDDGVKLEIELAPMYSSRPQFVSIYRKGAET 369 (468) T ss_pred CCccccccceEEEecCcccceeEEEEecCCCCCcceEEEEEEeCCCC Confidence 322222221111 0111111010 0 No 60 >protein:vir:3613 Length: 272 # NCBI annotation: MHP # Family: family:all:522 # MgeID: mge:74 # MgeName: TP901-1 # Cross-refs: genbank:acc:NP_112699;genbank:gi:13786567;genbank:GeneID:921035 Probab=74.69 E-value=0.16 Score=25.02 Aligned_cols=253 Identities=15% Similarity=0.078 Sum_probs=111.7 Q ss_pred EccccccccCce----eEeccC---ceEEEEEEecCceeEEEccccccchhhhhCCceEEE-----eecc--cccccCCc Q lcl|Aclame:pro 81 VENSDGLTKGMI----FYNEAT---GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIV-----IGTA--FEEGSQRP 146 (418) Q Consensus 81 V~~~~~~~~~~~----~~~~~~---~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a--~~EGada~ 146 (418) -++...-..+.| +..-+. .+.+++..+.-..-+. -|. .|..|.+ +|.+ ..||.+.+ T Consensus 1 ma~~~T~~~d~iiPev~~~~v~~~~~~~~~~~~~~~~~~~l-~g~---------~G~ti~iP~~~~~gda~~~~eg~~i~ 70 (272) T protein:vir:36 1 MSKQKTTLADLVNPEVLAPIVSYELNKALRFAPLAQVDTTL-QGQ---------PGNTLKFPAFTYIGDAADVAEGGEIS 70 (272) T ss_pred CCCcceehhhhhchHHHHHHHHHHHHhhhhhcccccccccc-ccC---------CCCEEEEeeeccCccccccCCCCccC Confidence 232121111111 110000 0111111110000000 011 1222222 2222 24555444 Q ss_pred CcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHH Q lcl|Aclame:pro 147 TARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIV 226 (418) Q Consensus 147 ~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~ 226 (418) ...-......--..|+ .+.|++++-+.+. ...|-+..-..+....+++.+++.++..-+.. T Consensus 71 ~~~lt~~~~~~~i~~~-~k~~~vtD~~~~~---~~~d~~~~~~~~~a~~~a~~~d~~i~~~l~~~--------------- 131 (272) T protein:vir:36 71 LDKIGTTTKSVTIKKA-AKGTEITDEAALS---GYGDPIGESNKQLGLSLANKVDDDLLSAAKTT--------------- 131 (272) T ss_pred hhhcCCcceeEeeehh-hccccccHHHHhh---ccchHHHHHHHHHHHHHHHHHHHHHHHHhccc--------------- Confidence 3332222211123343 4567777766554 33355555555666677888887776221100 Q ss_pred HHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEE Q lcl|Aclame:pro 227 DAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVF 306 (418) Q Consensus 227 ~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v 306 (418) ....++..+.+.+.++...+=+. +...++++|++.....|.+... +........-++.+ T Consensus 132 ------------~~~~~~~~~~d~i~~A~~~lgd~-----~~~~~~ivv~p~~~~~L~k~~~----~~~~~~~~~~~~~~ 190 (272) T protein:vir:36 132 ------------SQTVSTKANVDGVQAALDIFNDE-----DAQAYVLIVNPKDAAKIRKDAN----AKNIGSEVGANALI 190 (272) T ss_pred ------------cccccccccHHHHHHHHHHhhhc-----CCCceEEEEcHHHHHHHhcccc----ccccccccccccee Confidence 01122356778888877665332 2345789999998888866432 11111111112222 Q ss_pred EEEE-cCCeEEEEEECccccccCCCCCeEE----EEchhhceeeeccCCCcccccccccCccccccccccccccCccccc Q lcl|Aclame:pro 307 TEWK-FFKGRLILKEHPLFSAIGISPGFAV----VVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQG 381 (418) Q Consensus 307 ~~~~-SdfG~v~vv~n~~l~~~~mp~d~~l----v~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k 381 (418) +-.. +-.| +.|+.++. +|.+..+ ++=+.. +.+..+++...|..+..- ++.|... T Consensus 191 ~G~ig~~~G-~~Vv~s~~-----~p~~~~~~~~~~~~~gA--~~~~~~~~~~vE~~R~~~-------------~~~d~i~ 249 (272) T protein:vir:36 191 NGTYADVLG-AQIVRSKK-----LAEGSALMFKIVSNSPA--LKLVLKRGVQVETDRDIV-------------TKTTVIT 249 (272) T ss_pred eeccceecC-eeEEEeCC-----CCCCceeEEEEEecccc--eeeeecCCcccccccchh-------------hcCcEEE Confidence 2111 1134 46777644 5666553 222333 334444555555544332 2234444 Q ss_pred cEEEEEEEEEEecccceEEeecCcc Q lcl|Aclame:pro 382 GSLTSEWALELLNPQGCAVITGLQK 406 (418) Q Consensus 382 ~~i~~E~tLev~N~kA~a~I~gL~~ 406 (418) +..+ |++.+.||.+..+++-=+- T Consensus 250 ~~~~--y~~~v~~~~~vv~~t~~g~ 272 (272) T protein:vir:36 250 ADEH--YAAYLYDLTKVVNITFTGV 272 (272) T ss_pred EEEE--EEEEEEcCccEEEEeecCC Confidence 4433 8999999998888753332 No 61 >protein:vir:93742 Length: 274 # NCBI annotation: ORF013 # Family: family:all:522 # MgeID: mge:1475 # MgeName: 55 # Cross-refs: genbank:acc:YP_240459;genbank:gi:66396126;genbank:GeneID:5133511 Probab=74.08 E-value=0.16 Score=24.91 Aligned_cols=256 Identities=16% Similarity=0.099 Sum_probs=121.7 Q ss_pred EccccccccCceeEec----cC---ceEEEEEEec--CceeEEEccccccchhhhhCCceEEE-----eeccc--ccccC Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNE----AT---GENMRLELVN--GLNLTVKRQTGRISAAIIAANTKLIV-----IGTAF--EEGSQ 144 (418) Q Consensus 81 V~~~~~~~~~~~~~~~----~~---~E~~~Vtav~--g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a~--~EGad 144 (418) -++...-.-+.++--+ +. .+.+++..+. ...+ -|. .|..+.+ +|.++ .||.+ T Consensus 1 ma~~~T~~~~~iiPev~~~~v~~~~~~~~~~~~~~~~~~~l---~g~---------~G~tv~ip~~~~~g~~~~~~eg~~ 68 (274) T protein:vir:93 1 MPQGITKTSNQIIPEVLAPMMQAQLEKKLRFASFAEVDSTL---QGQ---------PGDTLTFPAFVYSGDAQVVAEGEK 68 (274) T ss_pred CCccceehhheechHHHHHHHHHHHHhhhhhcccccccccc---cCC---------CCCEEEEEeeccCCCcccccCCCc Confidence 3332221112111100 00 0111111110 0000 011 1222211 22222 34544 Q ss_pred CcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHH Q lcl|Aclame:pro 145 RPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQG 224 (418) Q Consensus 145 a~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~G 224 (418) .+..........--..| ..+.+++++-+.+. ...|-+.....+....+.+.+++.++..-+. ++ T Consensus 69 i~~~~it~~~~~~~i~~-~~~~~~i~D~~~~~---~~~d~~~~~~~~~~~~~a~~~d~~~~~~~~~-----a~------- 132 (274) T protein:vir:93 69 IPTDILETKKREAKIRK-IAKGTSITDEALLS---GYGDPQGEQVRQHGLAHANKVDNDVLEALMG-----AK------- 132 (274) T ss_pred ccccccccceeEEEeee-ecccccccHHHHHh---hccchHHHHHHHHHHHHHHHHHHHHHHHHhc-----cc------- Confidence 43332222221112334 23467777765544 3456677777777889999999888732211 00 Q ss_pred HHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc-ceeec Q lcl|Aclame:pro 225 IVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR-ETSYG 303 (418) Q Consensus 225 I~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~-~~~~G 303 (418) ..+ .+.+++.+.+.|+.+++=+ . +...++++|++.....|-+-. ..++... ...-+ T Consensus 133 ----------~~~----~~~~~~~d~i~dA~~~l~d----~-~~~~~~ivv~p~~~~~L~k~~----~~~f~~~s~~g~~ 189 (274) T protein:vir:93 133 ----------LTV----NADITKLNGLQSAIDKFND----E-DLEPMVLFINPLDAGKLRGDA----STNFTRATELGDD 189 (274) T ss_pred ----------ccc----cccccCHHHHHHHHHHhhh----c-cCCccEEEeCHHHHHHHHhhh----hhccccccccccc Confidence 001 2235678888888876532 2 235679999999887775421 1121111 11112 Q ss_pred eEEEEEE-cCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccccc Q lcl|Aclame:pro 304 MVFTEWK-FFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGG 382 (418) Q Consensus 304 ~~v~~~~-SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~ 382 (418) ....-.. +-.| +.|+.++. +|.++.+++++..+.+.. +++...|..+..- +..|...+ T Consensus 190 ~~~~G~ig~~~G-~~Vi~s~~-----~p~~t~~l~~~gai~~~~--~~~~~vE~~Rd~~-------------~~~d~i~~ 248 (274) T protein:vir:93 190 IIVKGAFGEALG-AIIVRTNK-----LEAGTAILAKKGAVKLIL--KRDFFLEVARDAS-------------TKTTALYS 248 (274) T ss_pred ceeecccceecC-eeEEEcCC-----CCcceEEEEeCCeEEEEe--cCCcccccccchh-------------hcccEEEE Confidence 2222111 1224 46777644 688999999999887543 4665566554332 12244433 Q ss_pred EEEEEEEEEEecccceEEeecCccccccc Q lcl|Aclame:pro 383 SLTSEWALELLNPQGCAVITGLQKAKERV 411 (418) Q Consensus 383 ~i~~E~tLev~N~kA~a~I~gL~~~~~~~ 411 (418) ..+ |...+.||.+..+++- ..+--+- T Consensus 249 ~~~--y~~~~~~~~~~v~~t~-~~~s~~~ 274 (274) T protein:vir:93 249 DKH--YVAYLYDESKAVKITK-GSGSLEM 274 (274) T ss_pred EEE--EEEEEEcCCceEEEee-CccccCC Confidence 333 7899999999888872 1111111 No 62 >protein:vir:78223 Length: 333 # NCBI annotation: Putative major head protein # Family: family:all:966 # MgeID: mge:1849 # MgeName: Bethlehem # Cross-refs: genbank:acc:YP_001491666;genbank:gi:157786490;genbank:GeneID:5625701 Probab=73.95 E-value=0.16 Score=24.89 Aligned_cols=314 Identities=12% Similarity=0.005 Sum_probs=118.1 Q ss_pred eeeeeeecccceeEEEEEeecCceEEEEccccccccCce----eEeccC----ceEEEEEEecCceeEEEccccccchhh Q lcl|Aclame:pro 54 HGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMI----FYNEAT----GENMRLELVNGLNLTVKRQTGRISAAI 125 (418) Q Consensus 54 ~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~----~~~~~~----~E~~~Vtav~g~~~tv~rg~~~tta~~ 125 (418) .+|+.... ...+. .......+ .....+.+..+ +..... .....+..+.+..+++-+-....++.- T Consensus 1 ~a~l~el~-~~~~~-----~~~~g~~~-~~~~~liP~~~~~~ii~~l~~~s~l~~~~~~~~~~~~~~~~p~~~~~~~a~~ 73 (333) T protein:vir:78 1 MATLNELL-PNSAG-----SNHQGRLA-HVPSDLLPKEIVGPIFDKAQESSLVLRMGEQIPISYGETIIPTTVKRPEVGQ 73 (333) T ss_pred CchhHHhh-hhccc-----ccccCcee-cCCccccchhHHHHHHHHHHhhchhhhhcceeeccCCceEEEEEeCCceeEe Confidence 22222111 00000 00000000 00011111111 110000 111234445555444443333222211 Q ss_pred hhCCceEEEeecccccccCCcCcccccceeccceeEEEee----eeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHh Q lcl|Aclame:pro 126 IAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRN----AWALTDTARASYAEAGYSNITESRRDCMDFHATEQE 201 (418) Q Consensus 126 ~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~----~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE 201 (418) +..|.. ....|+...+... .-+.||--. ...+.-|.+.++. ...+-.++-...-.+.+.+.+| T Consensus 74 v~eg~~-----~~~~e~~~~~~~~-------~~f~~i~l~~~kl~~~~~is~ell~~-s~~~~~~~i~~~la~ai~~~~d 140 (333) T protein:vir:78 74 VGVGTS-----NEQREGGLKPLSG-------TAWDTRSVSPIKLATIVTVSEEFARM-NPSGLYTKLQGDLAYAIGRGID 140 (333) T ss_pred ecCccc-----ccccccccccccc-------cceeEEEEeeEEEEEeehhhHHHHhc-CHHHHHHHHHHHHHHHHHHHHH Confidence 111111 1112333222111 122333222 2333344455433 2223445566666777899999 Q ss_pred HHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHH Q lcl|Aclame:pro 202 TAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMR 281 (418) Q Consensus 202 ~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~ 281 (418) .++|+|.-...+ ....|+.....-...++.......+..+.+++.++...+-.+. ......+++++.... T Consensus 141 ~~~l~G~g~~~~------~~~~g~~~~~~~~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~----~~~~~~~vmn~~~~~ 210 (333) T protein:vir:78 141 LAVFHGKSPLTG------SALQGIDTDNVIANTTNVDYLQETGDPLLDRLLDGYDLVSANT----DVEFNGWAVDPRFRA 210 (333) T ss_pred HHHhcccCCCCC------cccccccccccccccccccccccccchhHHHHHHHHHhhcccc----ccCceEEEEcchHHH Confidence 999987742211 1122332111000111222223334556667777665543221 112234566877666 Q ss_pred HHHhhhh---ccceEEEcccceeeceEEEEEEcCCeEEEEEECcccccc----CCCCCeEEEEchhhceeeeccCCCccc Q lcl|Aclame:pro 282 TMQDIGR---FFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAI----GISPGFAVVVDVPAVKLAYMDGRNAKV 354 (418) Q Consensus 282 ~i~~~~~---~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~----~mp~d~~lv~D~~~~~~~~L~~r~~~~ 354 (418) .|.++.. .++.+.+...-.. |. --+=+| +.|+.++++... ..+...+++.|.+...+..- .++.. T Consensus 211 ~L~~~~~~~d~~G~~i~~~~~~~-~~----~~~l~G-~Pv~~~~~i~~~~~~~~~~~~~~~~gD~~~~~~g~~--~~~~i 282 (333) T protein:vir:78 211 HLLRAQAYRDANGNVDPSRINLA-AQ----TGDVLG-LPAQFGRAVGGDLGAAVDSKTRIIGGDFSQLKFGFA--DEIRI 282 (333) T ss_pred HHHHHhhhcCCCCceeecCcccc-CC----Cceeec-eeeEEccccCCCccccCCCccEEEEEecccEEEEEe--eccEE Confidence 6655432 2334333211100 00 011223 244554433211 11223577888887654433 22222 Q ss_pred ccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCC Q lcl|Aclame:pro 355 ENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAP 416 (418) Q Consensus 355 e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~ 416 (418) +........+.... ....-..|-...+.+..+.+.+++|+|..+|++ + ++| T Consensus 283 ~~~~~~~~~~~~~~--~~~~~~~~~v~~r~~~r~d~~v~~~~a~~~l~~---~------~a~ 333 (333) T protein:vir:78 283 KMSDTATLTDSGSA--TVSMWQTNQIAILIEVTFGWLLGDKQAFVKFVD---D------EQP 333 (333) T ss_pred EEeccccccccccc--eeehhhcCcEEEEEEEEEccEEecccceEEEec---c------CCC Confidence 22111110000000 000001133444667788999999999999743 2 333 No 63 >protein:vir:94494 Length: 274 # NCBI annotation: ORF015 # Family: family:all:522 # MgeID: mge:1508 # MgeName: 88 # Cross-refs: genbank:acc:YP_240676;genbank:gi:66396348;genbank:GeneID:5133758 Probab=65.98 E-value=0.27 Score=23.66 Aligned_cols=259 Identities=15% Similarity=0.060 Sum_probs=122.4 Q ss_pred EccccccccCceeE----eccC---ceEEEEEEecCceeEEEccccccchhhhhCCceEEE-----eeccc--ccccCCc Q lcl|Aclame:pro 81 VENSDGLTKGMIFY----NEAT---GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIV-----IGTAF--EEGSQRP 146 (418) Q Consensus 81 V~~~~~~~~~~~~~----~~~~---~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a~--~EGada~ 146 (418) -++...-..+.|+- .-+. .+.++.+.+. ++-+-. ....|..+.+ +|.++ .||.+.+ T Consensus 1 ma~~~T~~~d~iiPev~~~~v~~~~~~~l~~~~~~----~~d~~l------~g~~G~tv~iP~~~~~g~a~~~~~g~~i~ 70 (274) T protein:vir:94 1 MPQGLTKTSDQIIPEVLAPMMQAQLEKKLRFASFA----EVDSTL------QGQPGDTLTFPAFVYSGDAQVVAEGEKIP 70 (274) T ss_pred CCccceehhheechHHHHHHHHHhhhhhhhhcccc----eecccc------cCCCCCEEEEeeecCCCccccccCCCccc Confidence 33222111111111 0000 0111111110 000000 0111222222 22222 3454443 Q ss_pred CcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHH Q lcl|Aclame:pro 147 TARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIV 226 (418) Q Consensus 147 ~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~ 226 (418) ...-......--..|+ .+.+++++-+.+. +..|-+.........-+.+.++..++.--+. + T Consensus 71 ~~~lt~~~~~~~i~~~-~~~~~i~D~~~~~---~~~dp~~~~~~~~a~a~a~~vd~~~~~~l~~----a----------- 131 (274) T protein:vir:94 71 TDILETKKREAKIRKI-AKGTSITDEALLS---GYGDPQGEQVRQHGLAHANKVDNDVLEALMG----A----------- 131 (274) T ss_pred ccccccceeEEEeeee-cceecccHHHHHh---ccchHHHHHHHHHHHHHHHHHHHHHHHHHhc----c----------- Confidence 3322222221223442 3567887776554 3445667777777788889999887732110 0 Q ss_pred HHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce-eeceE Q lcl|Aclame:pro 227 DAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET-SYGMV 305 (418) Q Consensus 227 ~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~-~~G~~ 305 (418) ...+ .+.+++.+.+.|+.+++=+. +...++++|++.....|-+-. ..++..... .-++. T Consensus 132 -------~~~~----~~~~~~~d~i~dA~~~l~d~-----~~~~~~ivv~p~~~~~L~k~~----~~~f~~~s~~g~~~~ 191 (274) T protein:vir:94 132 -------KLTV----NADITKLNGLQSAIDKFNDE-----DLEPMVLFVNPLDAGKLRGDA----STNFTRATELGDDII 191 (274) T ss_pred -------Cccc----cccccCHHHHHHHHHHhhcc-----CCCceEEEeCHHHHHHHHhhh----hhhccccCcccccce Confidence 0001 22457788899988775322 235689999999887775521 112111111 11111 Q ss_pred EEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEE Q lcl|Aclame:pro 306 FTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLT 385 (418) Q Consensus 306 v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~ 385 (418) ..-....|-=+.|+.++. +|.++.+++.+..+.+. .+|+...|..+..- +..|...+.. T Consensus 192 ~~G~ig~~~G~~Vi~s~~-----~p~~t~~l~~~gA~~~~--~~~~~~vE~~Rd~~-------------~~~d~i~~~~- 250 (274) T protein:vir:94 192 VKGAFGEALGAIIVRTNK-----LEAGTAILAKKGAVKLI--LKRDFFLEVARDAS-------------TKTTALYSDK- 250 (274) T ss_pred eccccceecCeeEEEcCC-----CCcceEEEEeCcceEee--ecCCceeccccchh-------------hcccEEEEEE- Confidence 111111121236777644 68899999999888753 34666666654432 2224443333 Q ss_pred EEEEEEEecccceEEeecCccccccc Q lcl|Aclame:pro 386 SEWALELLNPQGCAVITGLQKAKERV 411 (418) Q Consensus 386 ~E~tLev~N~kA~a~I~gL~~~~~~~ 411 (418) =|+..+.||.+..+++- ..|--+- T Consensus 251 -~y~~~~~~~~~vv~~t~-~~~~~~~ 274 (274) T protein:vir:94 251 -HYVAYLYDESKAVKITK-GSGSLEM 274 (274) T ss_pred -EEEEEEEcCCceEEEec-CcccccC Confidence 37889999999988872 2221111 No 64 >protein:vir:97433 Length: 274 # NCBI annotation: ORF014 # Family: family:all:522 # MgeID: mge:1676 # MgeName: 92 # Cross-refs: genbank:acc:YP_240749;genbank:gi:66396420;genbank:GeneID:5133789 Probab=65.98 E-value=0.27 Score=23.66 Aligned_cols=259 Identities=15% Similarity=0.060 Sum_probs=122.4 Q ss_pred EccccccccCceeE----eccC---ceEEEEEEecCceeEEEccccccchhhhhCCceEEE-----eeccc--ccccCCc Q lcl|Aclame:pro 81 VENSDGLTKGMIFY----NEAT---GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIV-----IGTAF--EEGSQRP 146 (418) Q Consensus 81 V~~~~~~~~~~~~~----~~~~---~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a~--~EGada~ 146 (418) -++...-..+.|+- .-+. .+.++.+.+. ++-+-. ....|..+.+ +|.++ .||.+.+ T Consensus 1 ma~~~T~~~d~iiPev~~~~v~~~~~~~l~~~~~~----~~d~~l------~g~~G~tv~iP~~~~~g~a~~~~~g~~i~ 70 (274) T protein:vir:97 1 MPQGLTKTSDQIIPEVLAPMMQAQLEKKLRFASFA----EVDSTL------QGQPGDTLTFPAFVYSGDAQVVAEGEKIP 70 (274) T ss_pred CCccceehhheechHHHHHHHHHhhhhhhhhcccc----eecccc------cCCCCCEEEEeeecCCCccccccCCCccc Confidence 33222111111111 0000 0111111110 000000 0111222222 22222 3454443 Q ss_pred CcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHH Q lcl|Aclame:pro 147 TARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIV 226 (418) Q Consensus 147 ~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~ 226 (418) ...-......--..|+ .+.+++++-+.+. +..|-+.........-+.+.++..++.--+. + T Consensus 71 ~~~lt~~~~~~~i~~~-~~~~~i~D~~~~~---~~~dp~~~~~~~~a~a~a~~vd~~~~~~l~~----a----------- 131 (274) T protein:vir:97 71 TDILETKKREAKIRKI-AKGTSITDEALLS---GYGDPQGEQVRQHGLAHANKVDNDVLEALMG----A----------- 131 (274) T ss_pred ccccccceeEEEeeee-cceecccHHHHHh---ccchHHHHHHHHHHHHHHHHHHHHHHHHHhc----c----------- Confidence 3322222221223442 3567887776554 3445667777777788889999887732110 0 Q ss_pred HHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce-eeceE Q lcl|Aclame:pro 227 DAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET-SYGMV 305 (418) Q Consensus 227 ~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~-~~G~~ 305 (418) ...+ .+.+++.+.+.|+.+++=+. +...++++|++.....|-+-. ..++..... .-++. T Consensus 132 -------~~~~----~~~~~~~d~i~dA~~~l~d~-----~~~~~~ivv~p~~~~~L~k~~----~~~f~~~s~~g~~~~ 191 (274) T protein:vir:97 132 -------KLTV----NADITKLNGLQSAIDKFNDE-----DLEPMVLFVNPLDAGKLRGDA----STNFTRATELGDDII 191 (274) T ss_pred -------Cccc----cccccCHHHHHHHHHHhhcc-----CCCceEEEeCHHHHHHHHhhh----hhhccccCcccccce Confidence 0001 22457788899988775322 235689999999887775521 112111111 11111 Q ss_pred EEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEE Q lcl|Aclame:pro 306 FTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLT 385 (418) Q Consensus 306 v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~ 385 (418) ..-....|-=+.|+.++. +|.++.+++.+..+.+. .+|+...|..+..- +..|...+.. T Consensus 192 ~~G~ig~~~G~~Vi~s~~-----~p~~t~~l~~~gA~~~~--~~~~~~vE~~Rd~~-------------~~~d~i~~~~- 250 (274) T protein:vir:97 192 VKGAFGEALGAIIVRTNK-----LEAGTAILAKKGAVKLI--LKRDFFLEVARDAS-------------TKTTALYSDK- 250 (274) T ss_pred eccccceecCeeEEEcCC-----CCcceEEEEeCcceEee--ecCCceeccccchh-------------hcccEEEEEE- Confidence 111111121236777644 68899999999888753 34666666654432 2224443333 Q ss_pred EEEEEEEecccceEEeecCccccccc Q lcl|Aclame:pro 386 SEWALELLNPQGCAVITGLQKAKERV 411 (418) Q Consensus 386 ~E~tLev~N~kA~a~I~gL~~~~~~~ 411 (418) =|+..+.||.+..+++- ..|--+- T Consensus 251 -~y~~~~~~~~~vv~~t~-~~~~~~~ 274 (274) T protein:vir:97 251 -HYVAYLYDESKAVKITK-GSGSLEM 274 (274) T ss_pred -EEEEEEEcCCceEEEec-CcccccC Confidence 37889999999988872 2221111 No 65 >protein:vir:107687 Length: 319 # NCBI annotation: hypothetical protein # Family: family:all:463 # MgeID: mge:1518 # MgeName: T1 # Cross-refs: genbank:acc:YP_003898;genbank:gi:45686314;genbank:GeneID:2773027 Probab=61.18 E-value=0.12 Score=25.63 Aligned_cols=298 Identities=12% Similarity=0.047 Sum_probs=119.5 Q ss_pred eeeeeeeee------cccceeEEEEEeecCceEEEEccccccccCceeEeccCceEE--EEEEecCceeEEEccccccch Q lcl|Aclame:pro 52 STHGYFSKT------MVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENM--RLELVNGLNLTVKRQTGRISA 123 (418) Q Consensus 52 ~~~~~~~~~------~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~--~Vtav~g~~~tv~rg~~~tta 123 (418) |+|.=|+.- ......++.-+..++..-+++ ..+= .++..++ +...+.+..+--.++..+..+ T Consensus 1 ~~~~~~~~~~~~~~~~~~~~~~~~~da~~~~g~~~~--------~ql~--~id~~v~e~~~~~l~~~~~i~v~~~~~~~~ 70 (319) T protein:vir:10 1 MTTKKFDEADKSNVEMYLIQAGVKQDAAATMGIWTA--------QELH--RIKSQSYEEDYPVGSALRVFPVTTELSPTD 70 (319) T ss_pred CCCcchhHHhhHHHHHHHhhccchhhhhhhhhhHHH--------HHHH--HHHHHHHhhhhcceechhhcccccCCCCce Confidence 555444422 111222222222222222221 1110 1121111 000111111100111111000 Q ss_pred hhhhCCceEEEeecccc--ccc-CCcCcccccceeccceeEEEeeeeeechhHH--HHhhhcccchHHHHHHHHHHHHHH Q lcl|Aclame:pro 124 AIIAANTKLIVIGTAFE--EGS-QRPTARSIQPVYVPNFTQIFRNAWALTDTAR--ASYAEAGYSNITESRRDCMDFHAT 198 (418) Q Consensus 124 ~~~~~gt~v~~~g~a~~--EGa-da~~~~~~~~~~~~N~tQIf~~~v~VSgTa~--Av~~~g~~dela~q~~kk~~Eikr 198 (418) ..+.-. ..+..|.+.. .++ |.|...... .+. ..+|++-...++.+.+ +.....+.+.-......+...+.+ T Consensus 71 ~~~~~~-~~~~~G~a~~~~d~~~dip~v~~~~-~~~--~~~i~~~~~~~~~~~~El~~a~~~g~~l~~~k~~aA~~~~~~ 146 (319) T protein:vir:10 71 KTFEYM-TFDKVGTAQIIADYTDDLPLVDALG-TSE--FGKVFRLGNAYLISIDEIKAGQATGRPLSTRKASACQLAHDQ 146 (319) T ss_pred EEEEee-eeccccceeeecCccccccceeccc-eee--EEEEEEEEeeeeecHHHHHHHHHhCCChHHHHHHHHHHHHHH Confidence 000000 0011111111 111 122111111 111 2355654444444444 333334555445555556677777 Q ss_pred HHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCcc----chHHHHHHHHHHHHhcccCCCceeEEEE Q lcl|Aclame:pro 199 EQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAV----TYDDVVDATIDAFKWSVNVGDNTQRVMF 274 (418) Q Consensus 199 dmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~----te~~l~d~~~~~~~~g~~~~g~~~~~i~ 274 (418) .+....++|.+.. ..-|++..= .....+.....+.++. -.+|+..++.++|....... .+..+. T Consensus 147 ~~n~i~f~G~~~~---------g~~GLlN~p-~~~~~~~~~~~~~~t~t~~~i~~di~~~~~~l~~~s~g~~--~p~~L~ 214 (319) T protein:vir:10 147 LVNRLVFKGSAPH---------KIVSVFNHP-NITKITSGKWIDVSTMKPETAEAELTQAIETIETITRGQH--RATNIL 214 (319) T ss_pred hhceEEEeecccc---------cceeEEeCC-CceeeecCCCCCccccCHHHHHHHHHHHHHHHHHhcCcee--eceEEE Confidence 7777788885422 123333210 0000000000011112 23567777888886543322 345677 Q ss_pred eChHHHHHHHhhhhccceEEEcccceeeceE-EEEEEcCCeEEEEEECccccccCC-CCCeEEEE--chhhceeeeccCC Q lcl|Aclame:pro 275 CDTVGMRTMQDIGRFFGEVTVTQRETSYGMV-FTEWKFFKGRLILKEHPLFSAIGI-SPGFAVVV--DVPAVKLAYMDGR 350 (418) Q Consensus 275 v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~-v~~~~SdfG~v~vv~n~~l~~~~m-p~d~~lv~--D~~~~~~~~L~~r 350 (418) +++.+...|+.... ..|.. .+.+...|--+.|+.-|.|...+- ..+.++++ |++++.+++= . T Consensus 215 L~p~~~~~L~~~~~------------~~~~t~l~~lk~~~~~l~I~~~pel~~ag~~g~~~~v~y~~~~~~~~~~v~--~ 280 (319) T protein:vir:10 215 IPPSMRKVLAIRMP------------ETTMSYLDYFKSQNSGIEIDSIAELEDIDGAGTKGVLVYEKNPMNMSIEIP--E 280 (319) T ss_pred ecHHHHHhhhcccC------------CCCeeHHHHHHHhcCCceEEEeeeecccCCCcceEEEEEecCCceEEEecC--c Confidence 89888877764211 12332 233445555567777777754332 23555655 4777766542 2 Q ss_pred CcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecC Q lcl|Aclame:pro 351 NAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGL 404 (418) Q Consensus 351 ~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL 404 (418) ++...+.-+.+. . .+-.-.-.=.+++++-|.|.+.+.|+ T Consensus 281 ~~~~~~~e~~~l---~------------~~~~~~~r~~Gv~i~~P~ai~~~dGI 319 (319) T protein:vir:10 281 AFNMLPAQPKDL---H------------FKVPCTSKCTGLTIYRPMTIVLITGV 319 (319) T ss_pred ceeeeeeeecCc---e------------EEEeeeeeeEEEEEEccceeEeeecC Confidence 333323211110 0 00000111235889999999999999 No 66 >protein:vir:100247 Length: 425 # NCBI annotation: gp76 # Family: family:all:21 # MgeID: mge:1619 # MgeName: Bcep176 # Cross-refs: genbank:acc:YP_355412;genbank:gi:77864702;genbank:GeneID:3725969 Probab=60.38 E-value=0.37 Score=22.93 Aligned_cols=311 Identities=15% Similarity=0.107 Sum_probs=113.6 Q ss_pred Ccceeeeec------cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeee------eeecccceeEE Q lcl|Aclame:pro 1 MSVYAGIFN------TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYF------SKTMVFASAVV 68 (418) Q Consensus 1 ~~~~~~~~~------~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~------~~~~~~~~~t~ 68 (418) +........ ......+. ++++-..+ +++. .-..++ .+ +...-+|+ .+.+....... T Consensus 91 ~~~~~~~~~~~~~~~~~~~~~~~-~~af~~~l----~~~e-~~~al~-~~-----t~~~gG~lvP~~~~~~ii~~~~~~s 158 (425) T protein:vir:10 91 ANIKIAAAQMGANGVKPLRDPEY-TEAFKAHV----KRGD-VQAALN-KG-----EDSEGGYLTPIEWDRTITNKLVLIS 158 (425) T ss_pred HHHHHHhhhcccccccccccHHH-HHHHHHHh----hhhh-hHHHhh-cC-----cCCCCceeccHhHHHHHHHHHHhhh Confidence 000000000 00011111 11111000 0000 000000 00 00000111 00000000000 Q ss_pred EEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCc Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTA 148 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~ 148 (418) . +-.-.+.+++.+.. ..+ . + ..+++.+ .|. .||...+.. T Consensus 159 ~--l~~l~~~~~~~~~~----~~~---------~-~------------~~~~~~a-------~wv------~E~~~~~~~ 197 (425) T protein:vir:10 159 P--MRQLCRVQPVSKAG----FSK---------L-F------------NMGGTTS-------GWV------GEASQRPQT 197 (425) T ss_pred h--hhhhceeeeccCCc----eEE---------E-E------------EcCCcce-------eee------ccccccccc Confidence 0 00000111111100 000 0 0 0011111 111 244333221 Q ss_pred ccccceeccceeEE----EeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHH Q lcl|Aclame:pro 149 RSIQPVYVPNFTQI----FRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQG 224 (418) Q Consensus 149 ~~~~~~~~~N~tQI----f~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~G 224 (418) .. ..+.|| ++-..-+.-|.+..+... .+-..+-..+-...+.+.+|.+||+|.- ++ + -.| T Consensus 198 ~~------~~f~~v~~~~~k~~~~i~iS~ell~ds~-~~l~~~i~~~la~ai~~~~d~~~l~G~G----~~-~----p~G 261 (425) T protein:vir:10 198 NA------ATFQPLSFASGEIYANPAATQQILDDAE-IDLESWLATEVQTEFAKQEGKAFLAGDG----TN-K----PNG 261 (425) T ss_pred cc------cccceeeeeheeeEeehHhHHHHHhcch-hHHHHHHHHHHHHHHHHHHHhhhhcccC----CC-C----cce Confidence 10 012222 222233344455554322 2444566666677778999999998852 11 1 124 Q ss_pred HHHHHhhcc--------ccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEc Q lcl|Aclame:pro 225 IVDAVRQYA--------PDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVT 296 (418) Q Consensus 225 I~~~i~~~~--------~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~ 296 (418) |+..+.... ..........+.++.+++.++...+-..- .++ ..+++++.....|.++...+|++-+. T Consensus 262 il~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d~l~~l~~~l~~~~--~~~---a~~vmn~~~~~~L~~lkD~~G~~l~~ 336 (425) T protein:vir:10 262 LLTYIAGGANAAKHPFGAIEVVNSGAAADITSDGIIDLVYDLPSAF--TGN---ARFAMNRNTQRQVRKLKDGQGNYLWQ 336 (425) T ss_pred eeeccccccccccccccccccccccccccccHHHHHHHHhhhhhhh--ccC---CEEEEchHHHHHHHHhhcCCCceeec Confidence 433211000 00011122334578888888876654321 111 24678888888888876556665443 Q ss_pred ccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccC Q lcl|Aclame:pro 297 QRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHG 376 (418) Q Consensus 297 ~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g 376 (418) .. -..|.. .+=+|. .|+.++.+...+-..+.+++.|++..-.-+- | ...+-+... +. . T Consensus 337 ~~-~~~g~~----~~l~G~-PV~~~~~~p~~~~~~~~i~~Gd~~~~~~i~~--~-~~~~v~~d~----------~~---~ 394 (425) T protein:vir:10 337 PS-YVAGQP----ATLAGY-PVTEVPDMPDVAANSTPILFGDFQQTYLIID--R-IGVRVLRDP----------YT---A 394 (425) T ss_pred cC-ccCCCC----ceecce-eeEEecCcCCccCCccEEEEEehhccEEEEE--e-cceEEEecc----------cc---c Confidence 21 111110 112342 4555554432222234567778875311111 1 111111100 00 0 Q ss_pred ccccccEEEEEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 377 VDAQGGSLTSEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 377 ~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~ 408 (418) .|......+.-+...+.+|+|+.+ .-++.+| T Consensus 395 ~~~~~~~~~~r~d~~v~~~~A~~~-l~~~as~ 425 (425) T protein:vir:10 395 KPYVLFYTTKRVGGGLLNPEPMRA-MKVAASE 425 (425) T ss_pred CCcEEEEEEEEeccEeecccceEE-EEeeccC Confidence 134444555568899999999955 4466666 No 67 >protein:vir:5739 Length: 366 # NCBI annotation: capsid protein # Family: family:all:21 # MgeID: mge:122 # MgeName: PY54 # Cross-refs: genbank:acc:NP_892050;genbank:gi:33770513;interpro:IPR006444;uniprot:Q7Y410;genbank:GeneID:1732928 Probab=59.57 E-value=0.39 Score=22.83 Aligned_cols=338 Identities=14% Similarity=0.092 Sum_probs=119.3 Q ss_pred CcceeeeeccCCCh----hhhhhhhcccceeEeecCCcc---hhHHHhhhcccc-ceeeeeeeeeeeecccceeEEEEEe Q lcl|Aclame:pro 1 MSVYAGIFNTTLNP----QELNMKSFAGTILRRVPNGSA---PLLAMTSVVGST-TAKASTHGYFSKTMVFASAVVTAEA 72 (418) Q Consensus 1 ~~~~~~~~~~~~~~----~~~~~~s~~~~~~~~~~~~~~---p~~~l~~~~~~~-~~~~~~~~~~~~~~~~~~~t~~a~~ 72 (418) ||-..-+=- +.+. .-..++ ...+.+.. -...|.+-.+.. .+-..-++.+.+...... +++ T Consensus 1 ~a~~~a~~~-~~~~~~~~~~~~~~-------~~~~kg~~~~~~~~a~a~~~g~~~~a~~~a~~~~~~~~~~~a--~~~-- 68 (366) T protein:vir:57 1 MAAAVAVPV-KAHSVAPGIIIKEE-------LQQYKGAGMTRMVMSIAAGKGNLADAAKFAATELGDTGLSMA--IST-- 68 (366) T ss_pred Ccccccccc-cccccccccccccc-------cccccchhHHHHHHHHHhcccchhHHHHHHHHhhcchhhhhh--ccc-- Confidence 221111100 0010 000000 00000000 011111100000 000001111211110000 000 Q ss_pred ecCceEEEEccccccccCceeEeccCc----e-EE-E--EEEe--cCceeEEEccccccchhhhhCCceEEEeecccccc Q lcl|Aclame:pro 73 AADATVLTVENSDGLTKGMIFYNEATG----E-NM-R--LELV--NGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEG 142 (418) Q Consensus 73 ~a~~t~~tV~~~~~~~~~~~~~~~~~~----E-~~-~--Vtav--~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EG 142 (418) +. +..++..+.-+..++-+ + .+ + ++.| ....+++-+-..+.. ..|. .|| T Consensus 69 -------~~-~~Gg~lvP~~~~~~ii~~l~~~s~l~~lg~~~v~~~~g~~~~p~~t~~~~-------a~wv------~E~ 127 (366) T protein:vir:57 69 -------AA-GSGGALIPQNMQNEVIELLRDRTVVRILGARSIPLPNGNLSMPRLSGGAT-------AGYV------GEG 127 (366) T ss_pred -------cc-cCCccccchhHHHHHHHHHhhhcchhhhceeeeecCCCceEEEEEeCCcc-------eeee------ccC Confidence 00 01111111111101100 0 01 0 1112 111222222111111 1122 466 Q ss_pred cCCcCcccccceeccceeEEEeeee----eechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCcc Q lcl|Aclame:pro 143 SQRPTARSIQPVYVPNFTQIFRNAW----ALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQP 218 (418) Q Consensus 143 ada~~~~~~~~~~~~N~tQIf~~~v----~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~ 218 (418) .+.+.... .+.+|--+.. .+.-|.+...... .+-.++-..+-.+.+.+.+|.+||+|.- .+.+| T Consensus 128 ~~~~~s~~-------~f~~i~~~~~k~~~~~~iS~ell~ds~-~~~~~~i~~~l~~a~~~~~d~a~l~G~G----~~~~p 195 (366) T protein:vir:57 128 KDVVATGA-------TFDDVKLSAKTMIALVPVSNQLIGRAG-FNVEQLLLGDILSAIATREDKAFLRDDG----TGDTP 195 (366) T ss_pred cccccccc-------ceeEEEEeeEEEEEeehhhHHHHhhhh-HHHHHHHHHHHHHHHHHHHHHHhhccCC----CCccc Confidence 65553221 1333333333 3334444443322 2333445566666788999999998852 22232 Q ss_pred chhhHHHHHHHhhccccCccccCCCCccchHHHH---HHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEE Q lcl|Aclame:pro 219 LHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVV---DATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTV 295 (418) Q Consensus 219 ~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~---d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~ 295 (418) .||+.... ..+......++..+.+.+. +++...+... .. ......+++++.....|.++...+|++.+ T Consensus 196 ----~Gi~~~~~---~~~~~~~~~~t~~~~~~~~~~~~~~~~~~~~~-~~-~~~~a~~vmn~~~~~~L~~lkd~~G~~l~ 266 (366) T protein:vir:57 196 ----KGMKAVAT---AANRLVAWTGTAINLTTIDEYLDSLILKHMDS-NS-NMIRCGWGLSNRTYMTLFGLRDGNGNKVY 266 (366) T ss_pred ----cceeeccc---cccceeeccccccchhhHHHHHHHHHHhhhcc-cc-ccccCEEEecHHHHHHHHhhhccCCceec Confidence 24443211 1122222223344444333 3333333211 00 11112356888888888887555566554 Q ss_pred cccceeeceEEEEEEcCCeEEEEEECcccccc-CCC--CCeEEEEchhhceeeeccCCCcccccccccCccccccccccc Q lcl|Aclame:pro 296 TQRETSYGMVFTEWKFFKGRLILKEHPLFSAI-GIS--PGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYS 372 (418) Q Consensus 296 ~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~-~mp--~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~ 372 (418) ..... | +=+| +.|+.++.+.+. +-. ...+++.|++.+-+..- .+...+.+......+-. +... T Consensus 267 ~~~~~--g-------~l~G-~Pvv~s~~ip~~~~~~~~~~~i~~gdfs~~~i~~~--~~i~i~~~~ea~~~~~~--g~~~ 332 (366) T protein:vir:57 267 PEMSQ--G-------ILKG-YPIQRTSAIPANLGDDGNESEIYFCDFNDVVIGED--GMMKVDFSTEATYKDAD--GQLV 332 (366) T ss_pred cCCCC--C-------eecc-eeeEEccccccccccCCCccEEEEEecceEEEEEe--cceEEEEeecccccccc--ccch Confidence 32111 1 0122 234444333110 000 12356667766543221 12222222221110000 0000 Q ss_pred cccCccccccEEEEEEEEEEecccceEEeecCcc Q lcl|Aclame:pro 373 YGHGVDAQGGSLTSEWALELLNPQGCAVITGLQK 406 (418) Q Consensus 373 ~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~ 406 (418) ..-..|...-+.+..+.+.+++|+|.++++|.+= T Consensus 333 ~~f~~~~~~iR~~~~~d~~v~~~~a~~~lt~~~~ 366 (366) T protein:vir:57 333 SAFARNQSLIRVVTEHDIGFRHPEGLVLGTGVIW 366 (366) T ss_pred hhhhcCceeEEeeeeeCcEeeccccEEEEecccC Confidence 0001145566777889999999999999999998 No 68 >protein:vir:4953 Length: 397 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:108 # MgeName: Sfi19 # Cross-refs: genbank:acc:NP_049929;genbank:gi:9632900;genbank:GeneID:1262076 Probab=59.53 E-value=0.39 Score=22.82 Aligned_cols=312 Identities=13% Similarity=0.023 Sum_probs=115.9 Q ss_pred Ccce-----eeeeccCCChh--hhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEee Q lcl|Aclame:pro 1 MSVY-----AGIFNTTLNPQ--ELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAA 73 (418) Q Consensus 1 ~~~~-----~~~~~~~~~~~--~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~ 73 (418) .... .......++.. ...++.+ .+..+.+... .. T Consensus 66 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~---------------~~~l~~~~~~------------~~------------ 106 (397) T protein:vir:49 66 NEVANMSEEEKKPLTKSEEEVKAGFVKDF---------------KNLVRGRYQN------------LL------------ 106 (397) T ss_pred HhhhccccccccccccchhHHHHHHHHHH---------------HHHHhcchhH------------HH------------ Confidence 0000 00000000000 0000110 0111110000 00 Q ss_pred cCceEEEEccccccccCceeEeccCc---------eEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccc Q lcl|Aclame:pro 74 ADATVLTVENSDGLTKGMIFYNEATG---------ENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEG 142 (418) Q Consensus 74 a~~t~~tV~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EG 142 (418) ...+. ......++..+.-+...|-+ ..+.+..+.+.+ +.+.+...+. ....|. .|| T Consensus 107 ~~~~~-~t~~~gg~~vP~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~------~~a~~v------~E~ 173 (397) T protein:vir:49 107 DSKTD-ASGSDAGLTIPQDIQTAIHTLVSQYDSLQEYVNVENVTTLTGSRVYEKWTDIT------GLANID------DEA 173 (397) T ss_pred HHhhc-cccccCcccccHhHHHHHHHHHHhhhhHHhhhceeecccCccceEEEeeccCC------cceeee------cCc Confidence 00000 01111222222211111111 011222332221 2222221110 001222 466 Q ss_pred cCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhh Q lcl|Aclame:pro 143 SQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTT 222 (418) Q Consensus 143 ada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t 222 (418) ++.+.........+ -..+++-...+.-|.+...... .+-..|-...-...+.+.+|.++|+|... +.. T Consensus 174 ~~~~~~~~~~~~~i--~~~~~k~~~~~~iS~ell~ds~-~~l~~~i~~~l~~~~~~~~d~ai~~G~g~----~~~----- 241 (397) T protein:vir:49 174 GKIADVDDPKLSLI--KYTIKRYAGISTVTNSLLADSA-ENILAWLSGWIAKKVVVTRNKAILEAIAA----LPT----- 241 (397) T ss_pred cccccccccceeeE--EeeeeeEEeeehhHHHHHhhhH-HHHHHHHHHHHHHHHHHHHHHHHHhhccc----ccc----- Confidence 55442111111111 2233333444444444443322 23345555666677788999999987531 111 Q ss_pred HHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceee Q lcl|Aclame:pro 223 QGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSY 302 (418) Q Consensus 223 ~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~ 302 (418) .++..+.+++.++...+-..... + ..+++++.....|.++...+|++.+...- .. T Consensus 242 -------------------~~~~~~~d~i~~~~~~l~~~~~~-~----a~~vmn~~~~~~l~~lkd~~G~~l~~~~~-~~ 296 (397) T protein:vir:49 242 -------------------KPTLTKWDDIIDLEAKVDPAIKQ-T----SFFLTNTSGFTALKKVKNALGDYLMERDV-KS 296 (397) T ss_pred -------------------ccccccHHHHHHHHHhhhhhhcC-C----CEEEEcHHHHHHHHHhhcCCCceeeccCc-CC Confidence 11234567777777666443222 1 24778888888888875555655443210 00 Q ss_pred ceEEEEEEcCCeE-EEEEECccccccCCCCCeEEEEchhh-ceeeeccCCCcccccccccCccccccccccccccCcccc Q lcl|Aclame:pro 303 GMVFTEWKFFKGR-LILKEHPLFSAIGISPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQ 380 (418) Q Consensus 303 G~~v~~~~SdfG~-v~vv~n~~l~~~~mp~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~ 380 (418) |. --+=+|. |.++.+.++.....+...+++.|+.. +.+..- .+...+.....+. .+ -.|.. T Consensus 297 ~~----~~~l~G~PV~~~~~~~~~~~~~~~~~i~~gd~~~~~~~~~~--~~~~i~~~~~~~~---~~--------~~~~~ 359 (397) T protein:vir:49 297 PT----GYSIDGFAVKEVADRWLANGTGGAMPLYFGDLKQAVTLFDR--QHMSLLSTNIGGG---AF--------ETDTT 359 (397) T ss_pred CC----CceecceeeEEecccccccccCCceeEEEeeccceEEEEee--cceEEEEeccccc---hh--------hcCce Confidence 00 0011332 22233444433333434567778764 222211 1111111111110 00 00233 Q ss_pred ccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 381 GGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 381 k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) ....+.-+...+.+|+|+.+++-=..+.++.....-|- T Consensus 360 ~~r~~~r~d~~~~~~~a~~~~~~~~~~~~~~~~~~~~~ 397 (397) T protein:vir:49 360 KVRVIDRFDVVATDTEAFVPASFKAIADQKGNLGSTAV 397 (397) T ss_pred eEEEEeeeCcEEecccceEEEEeecccCCCCCcccccC Confidence 34566678889999999988764433322221111111 No 69 >protein:vir:99920 Length: 311 # NCBI annotation: gp7 # Family: family:all:966 # MgeID: mge:1611 # MgeName: Halo # Cross-refs: genbank:acc:YP_655524;genbank:gi:109392294;genbank:GeneID:4157089 Probab=59.16 E-value=0.4 Score=22.78 Aligned_cols=288 Identities=10% Similarity=-0.022 Sum_probs=106.0 Q ss_pred EEEeecCceEEEEccccccccCceeEeccCc----eEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccC Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEATG----ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQ 144 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~----E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGad 144 (418) +|..+.+. ...|.. .+. ..|+...... ....+.-+....+++-+-.++.. ..|+ .||.. T Consensus 1 Mat~tt~~-g~~vP~--~~~-~~ii~~~~~~s~l~~~~~~i~~~~~~~~~p~~~~~~~-------a~wv------~Eg~~ 63 (311) T protein:vir:99 1 MATFGTGN-LKNLPR--NIA-DGMVKDVVQGSTVAVLSARKPQRFGNEDIITFNGRPK-------AEFV------GEGQQ 63 (311) T ss_pred CceecCCC-ceeccH--HHH-HHHHHHHHhhchhhhhcceeeccCCceEEEEEeCCce-------eEEe------ecCcc Confidence 22222111 112210 010 0111100000 01112223333333333222211 1222 46666 Q ss_pred CcCcccccceecccee-EEEeeeeeechhHHHHhh--hcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchh Q lcl|Aclame:pro 145 RPTARSIQPVYVPNFT-QIFRNAWALTDTARASYA--EAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHT 221 (418) Q Consensus 145 a~~~~~~~~~~~~N~t-QIf~~~v~VSgTa~Av~~--~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~ 221 (418) .|..... .++.+ ..++-...+.=|.+.... ....+-..+-..+-...+.+.+|.++|+|.-.. .+..+ .. T Consensus 64 ~~~~~~~----f~~v~l~~~k~~~~~~iS~ell~~~~d~~~~l~~~i~~~la~ai~~~~d~~~l~G~g~~--~g~~~-~g 136 (311) T protein:vir:99 64 KSSTTGE----FDFVTSTPKKAQVTMRFNEEVQWADEDYQLGVLQTLSEAGAEALARALDLGLYHRINPL--TGTVI-PG 136 (311) T ss_pred cccccce----eeEEEEeeEEEEEeehhhHHHhhcccccHHHHHHHHHHHHHHHHHHHHHHHhhcccCcc--cCccc-cc Confidence 5533211 11111 112222233333333321 112233455566667778999999999886411 11111 11 Q ss_pred hHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccc-- Q lcl|Aclame:pro 222 TQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRE-- 299 (418) Q Consensus 222 t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~-- 299 (418) ..++... ....+.....+.....+++.++....-..+.. .. ..-+++++.....|.++.-.+|++.+.... T Consensus 137 ~~~~~~~----~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~--~~-~~~~vmn~~~~~~L~~lkd~~G~~l~~~~~~~ 209 (311) T protein:vir:99 137 WSNYLGA----ASKRVELTADTIANPDLAIEAAVGLLVANGHP--TP-VNGLALHPSIAWGLSTARYTDGRKKFPELGLG 209 (311) T ss_pred ccccccc----ccceeeccccccchhHHHHHHHHHHHhhhccC--CC-ccEEEEcHHHHHHHHhhhccCCCeeecCcccC Confidence 1222111 11111111122222334444444433322111 11 112667888888888875555665553221 Q ss_pred ----eeeceEEEEEEcCC---------eEEEEEECccccccCCCCCeEEEEchhh-ceeeeccCCCcccccccccCcccc Q lcl|Aclame:pro 300 ----TSYGMVFTEWKFFK---------GRLILKEHPLFSAIGISPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENK 365 (418) Q Consensus 300 ----~~~G~~v~~~~Sdf---------G~v~vv~n~~l~~~~mp~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~ 365 (418) .-+|.-| +.|++ +...+... +.+.+++-|.+. +.+... ++...+-+. .+..+- T Consensus 210 ~~~~~l~G~Pv--~~s~~i~~~~~~~~~~~~~~~~--------~~~~~~~Gdf~~~~~~~~~--~~~~~~~~~-~~~~~~ 276 (311) T protein:vir:99 210 IGVSSFEGIDA--SVSDTVNGGDEADPDDEDLDAA--------RAVRGIVGDFANGIHWGVQ--RDIPVELIK-YGDPDG 276 (311) T ss_pred CCCceecceee--Eeecccccccccccccchhhcc--------CcceEEEeeccccEEEEEe--cCceEEEee-cCCCCc Confidence 2334433 33321 11111111 224566667653 333333 222111111 110000 Q ss_pred ccccccccccCccccccEEEEEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 366 SGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 366 ~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~ 408 (418) . + + .-..|-...+....+...+++| |+.++.+- +. T Consensus 277 ~--~--~-~~~~d~~~~r~~~r~d~~v~~~-~~v~~~~~--~A 311 (311) T protein:vir:99 277 Q--G--D-LKRHNQIALRLEIVYGWYVFTD-RFVVIENA--VA 311 (311) T ss_pred c--h--h-hhhcCcEEEEEEEeecceecCh-hHeeeecc--cC Confidence 0 0 0 0001334445577889999997 44444332 21 No 70 >protein:vir:80491 Length: 467 # NCBI annotation: Cps # Family: family:all:2450 # MgeID: mge:1883 # MgeName: A511 # Cross-refs: genbank:acc:YP_001468466;genbank:gi:157325041;genbank:GeneID:5601449 Probab=58.10 E-value=0.42 Score=22.65 Aligned_cols=327 Identities=14% Similarity=0.123 Sum_probs=132.8 Q ss_pred hhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEE-----eecCceEEEEccccccc Q lcl|Aclame:pro 14 PQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAE-----AAADATVLTVENSDGLT 88 (418) Q Consensus 14 ~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~-----~~a~~t~~tV~~~~~~~ 88 (418) --+-||+++- -.||. ....++ .||.+-+| ...++.-+-.++ +...-+.|+..+.+ | T Consensus 1 ~~~~~~~~~~----~~n~~--~~~e~~--------~Ks~~agy---~~~p~tq~~~~AlR~EsL~~~i~~Lt~~~~~-f- 61 (467) T protein:vir:80 1 MPKNNKEEVK----EVNLN--SVQEDA--------LKSFTTGY---GITPDTQTDAGALRREFLDDQISMLTWTEND-L- 61 (467) T ss_pred CCCcchhhhh----hcccc--cCHHHH--------HHHHHccc---ccCCccccCcchhhhhhhhhhhheeeccccc-h- Confidence 1122333221 12332 111111 12211122 000000000000 11111222222211 1 Q ss_pred cCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEee-----cccccccCCcCcccccceeccceeEEE Q lcl|Aclame:pro 89 KGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIG-----TAFEEGSQRPTARSIQPVYVPNFTQIF 163 (418) Q Consensus 89 ~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g-----~a~~EGada~~~~~~~~~~~~N~tQIf 163 (418) .+++.+..... .+..+..+..+ ..| ....|+..+......-+.+. =..--+ T Consensus 62 ---~~~~di~k~~a-------------------~stv~~y~~~~-~~G~~g~~~f~~E~g~~~~~~~~~~r~~-~~~k~l 117 (467) T protein:vir:80 62 ---TFYKDIAKKPA-------------------TSTVAKYDVYM-QHGKVGHTRFTREIGVAPVSDPNIRQKT-VNMKFA 117 (467) T ss_pred ---hhhhhcccchh-------------------hhhhhhheeee-ccCccccccccccccccccCCCceEEEE-EEeeee Confidence 12222222110 01112222211 111 12356654432221111111 122233 Q ss_pred eeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCccccc-CcCCccchhhHHHHHHHhhccccCccccCC Q lcl|Aclame:pro 164 RNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMG-TYNGQPLHTTQGIVDAVRQYAPDNVNAMPN 242 (418) Q Consensus 164 ~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~-~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~ 242 (418) ..+-.||.-+.-++. ..|-++.|.++++.-+...+|++.+.|-+... ..+++.--+-+||+..+ ...|+... . T Consensus 118 ~~~~~vs~~~~l~n~--i~d~~~~~~~~ai~~~a~tiE~a~FyGds~l~~s~~~~~glqfDGi~~li---~~enviDa-~ 191 (467) T protein:vir:80 118 SDTKNISIAAGLVNN--IQDPMQILTDDAIVNIAKTIEWASFFGDSDLSDSPEPQAGLEFDGLAKLI---NQDNVHDA-R 191 (467) T ss_pred eeeeeehhhhhhhcc--hhhHHHHHHHHHHHHHHHHHHHHhhhcccccccCCCccccccccceeEEe---cCCceecc-C Confidence 344445555544433 44668999999999999999999999987653 22333334567776444 23466443 3 Q ss_pred CCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHH-HhhhhccceEEEcccc---eeeceEEEEEEcCCeEEEE Q lcl|Aclame:pro 243 PTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTM-QDIGRFFGEVTVTQRE---TSYGMVFTEWKFFKGRLIL 318 (418) Q Consensus 243 ~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i-~~~~~~~~~~~~~~~~---~~~G~~v~~~~SdfG~v~v 318 (418) |..+++++|..+...+=+ +.++..-+|.+...+-.| +.... -+.++.... ...|..|..|.|..|.+.+ T Consensus 192 G~~ls~~~lneaa~~i~~-----gfG~~td~~~p~~v~a~~~~~~L~--~q~~v~~~n~~~~~~G~~v~g~~sa~G~I~l 264 (467) T protein:vir:80 192 GASLTESLLNQAAVMISK-----GYGTPTDAYMPVGVQADFVNQQLS--KQTQLVRDNGNNVSVGFNIQGFHSARGFIKL 264 (467) T ss_pred CCccCHHHHHHHhhhccc-----cccChhhhhcchhHHhhhhhhhcC--ceEEEEcCCCCceeeeecccceecceeeeee Confidence 456899988888743322 233333456666666455 66533 444554322 3558889999999999988 Q ss_pred EECccccccCCCCCeEEEEchhhce--eeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEeccc Q lcl|Aclame:pro 319 KEHPLFSAIGISPGFAVVVDVPAVK--LAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQ 396 (418) Q Consensus 319 v~n~~l~~~~mp~d~~lv~D~~~~~--~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~k 396 (418) ..+-+|+..+++ ||+... .++-..--.......+.|.. . +.|.- .=+|-..+.|.. T Consensus 265 ~gs~il~~~~~l-------~~~~~~~~~Apsp~~vsaT~~~~~~g~~-~----------~~~~a----~y~Y~v~~vs~~ 322 (467) T protein:vir:80 265 HGSTVMENEQIL-------DERILALPTAPQPAKVTATQEAGKKGQF-R----------AEDLA----AHEYKVVVSSDD 322 (467) T ss_pred cCceeeccccCC-------CcccccccccccCCccceeeecccCCcc-c----------CCCcc----eEEEEEEEECCC Confidence 777666554433 333322 11111000001111111100 0 00000 022333344433 Q ss_pred ceEEeecCccc--------------ccccCCCCCC----------C Q lcl|Aclame:pro 397 GCAVITGLQKA--------------KERVYLTAPA----------P 418 (418) Q Consensus 397 A~a~I~gL~~~--------------~~~~~~~~~~----------~ 418 (418) +-.+....-++ -+.+|...|- . T Consensus 323 GES~pS~~vtvTVaa~~dg~~ltIt~~~~~~~~p~yv~IYR~~~gg 368 (467) T protein:vir:80 323 AESIASEVATATVTAKDDGVKLEIELAPMYSSRPQFVSIYRKGAET 368 (467) T ss_pred CccccccceEEEecCcccceeEEEEecCCCCCcceEEEEEEeCCCC Confidence 22222221111 0111111010 0 No 71 >protein:vir:7409 Length: 408 # NCBI annotation: major structural protein # Family: family:all:21 # MgeID: mge:146 # MgeName: P335 # Cross-refs: genbank:acc:NP_839926;genbank:gi:30089896;genbank:GeneID:1260683 Probab=58.02 E-value=0.42 Score=22.64 Aligned_cols=319 Identities=14% Similarity=0.058 Sum_probs=114.9 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) ...........--..++ .+.+...+ +... -.+... ... .... .+..++... T Consensus 77 ~~~~~~~~~~~~~~~~~-~~~~~~~~-~~~~---~~~~~~-~~~-a~~~----------------------~~~~~gg~~ 127 (408) T protein:vir:74 77 EEKGPLNKSENELKDKF-VKDFVNMV-RNPM---AFLNTV-SSK-TETS----------------------GSDSAAGLT 127 (408) T ss_pred cccccccchhhhhHHHH-HHHHHHHH-hcch---hhhhhh-hhh-hhcc----------------------cccCCCcee Confidence 00000000111111122 22222211 1111 111111 110 0000 000001111 Q ss_pred EccccccccCceeEeccCc----eEEEEEEecCc--eeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccce Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATG----ENMRLELVNGL--NLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPV 154 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~----E~~~Vtav~g~--~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~ 154 (418) |. ..+. ..|+...... -.+.+..+.+. .+.+.+....... ..| ..||++.++....... T Consensus 128 vP--~~~~-~~Ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~~------~~~------v~E~~~~~~~~~~~~~ 192 (408) T protein:vir:74 128 IP--QDIR-TMINTLVRQYDSLQQYVRVESVSTSSGSRVYEKWTDVTPL------KAM------DEEDGKIPDLDNPRLT 192 (408) T ss_pred ec--hhHh-hHHHHHHhhhcchhhhcceeeccCCcceEEEEeecCCccc------ccc------ccccccccccccccee Confidence 11 0010 0111000000 01112222222 1222222111100 011 1355554422111101 Q ss_pred eccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccc Q lcl|Aclame:pro 155 YVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAP 234 (418) Q Consensus 155 ~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~ 234 (418) . --...++-...+.-|.++.+. ...+...|-...-...+.+-+|.++|+|.. ++.. T Consensus 193 ~--i~~~~~k~~~~~~iS~ell~d-s~~~l~~~i~~~l~~~~~~~~d~~il~G~G----~~~~----------------- 248 (408) T protein:vir:74 193 I--IKYLIKRYAGIITATNTLLKD-TAENILAWLSSWIAKKVVVTRNQAIIAAMG----TVPK----------------- 248 (408) T ss_pred e--EEeeeeeEEeeehhHHHHHhh-chHHHHHHHHHHHHHHHHHHHHHHHhhccc----cccc----------------- Confidence 1 112222223333344444433 222344555556666778889999998743 1111 Q ss_pred cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCe Q lcl|Aclame:pro 235 DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKG 314 (418) Q Consensus 235 ~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG 314 (418) .+...+.+++.+++...-......+ ..+++++.....|.++...+|++.+...- ..|.. . +=+| T Consensus 249 -------~~~~~~~~~i~~~~~~~l~~~~~~~----a~~v~n~~~~~~l~~lkd~~G~~l~~~~~-~~~~~-~---~l~G 312 (408) T protein:vir:74 249 -------KPTIANFDDVITMINTSVDPAIIAT----SSLLTNQSGLNKLALVKTAEGKYLLEPDP-TKPNS-Y---LIKG 312 (408) T ss_pred -------ccccccHHHHHHHHHHhhhhhhcCC----CEEEEcHHHHHHHHHhhcCCCceEeccCc-CCCCC-c---eecc Confidence 1123456677776643222221111 35778998888898875555665543211 00100 0 0133 Q ss_pred E-EEEEECccccccCCCCCeEEEEchhhc-eeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEE Q lcl|Aclame:pro 315 R-LILKEHPLFSAIGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALEL 392 (418) Q Consensus 315 ~-v~vv~n~~l~~~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev 392 (418) . |.+..+..+...+.....+++.|+... .+..- .+...+.....+.. .-.|....+++.-+...+ T Consensus 313 ~pV~~~~~~~~~~~~~~~~~i~~gd~~~~~~~~~~--~~~~i~~~~~~~~~-----------f~~~~~~~r~~~r~d~~~ 379 (408) T protein:vir:74 313 KQVIVVADRWLPNSGSTVYPLYYGDMSQAITLFDR--ENMSLLPTNIGAGA-----------FETDTTKIRVIDRFDVKA 379 (408) T ss_pred eeeEEecCcccccccCCcceEEEEehhccEEEEEe--cceEEEEeccccch-----------hhcceeeEEEEEeeCcEE Confidence 2 222223333332333345677787643 22111 12222221111100 000233334566678899 Q ss_pred ecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 393 LNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 393 ~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) .+|+|+.+++--..+ ..+++-|++ T Consensus 380 ~~~~a~~~~~~~~~~--~~~~~~~~~ 403 (408) T protein:vir:74 380 TDSEALVAGSFTAIA--DQVGNFKTT 403 (408) T ss_pred ecccceEEEEeeccc--CCCCCCCCC Confidence 999999998764333 223333444 No 72 >protein:vir:80376 Length: 435 # NCBI annotation: gp6, major capsid head protein # Family: family:all:21 # MgeID: mge:1881 # MgeName: phi644-2 # Cross-refs: genbank:acc:YP_001111085;genbank:gi:134288639;genbank:GeneID:4960624 Probab=57.84 E-value=0.43 Score=22.62 Aligned_cols=337 Identities=12% Similarity=0.062 Sum_probs=119.9 Q ss_pred Ccc--e--eeeec--------cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEE Q lcl|Aclame:pro 1 MSV--Y--AGIFN--------TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVV 68 (418) Q Consensus 1 ~~~--~--~~~~~--------~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~ 68 (418) ++. . .+... ...+-.+.....+......+.....-..... ......++....... + T Consensus 65 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~---------~~~~~~~~~~~~~~~---~ 132 (435) T protein:vir:80 65 AAVPVDPNPAAVTASAAAPVYAQPKAPEVKGAKMARMVRALAAARGDAQLAS---------KLAIERGFGEEVAMS---L 132 (435) T ss_pred hcccccchhhhhccccccccccccchhhhhHHHHHHHHHHHHhccchhHHHH---------HHHHhhhhhhhhhhh---h Confidence 111 0 01111 1111111111111111111111100000000 000000111000000 0 Q ss_pred EEEeecCceEEEEccccccccCceeEecc----CceE----EEEEEec--CceeEEEccccccchhhhhCCceEEEeecc Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEA----TGEN----MRLELVN--GLNLTVKRQTGRISAAIIAANTKLIVIGTA 138 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~----~~E~----~~Vtav~--g~~~tv~rg~~~tta~~~~~gt~v~~~g~a 138 (418) +. .+. ...++..+.-+...+ .... +.++-|. ...+.+-+-..+ + ...|. T Consensus 133 ~~-~~~--------~~gg~lvP~~~~~~ii~~l~~~~~i~~~~~~~v~~~~~~~~~p~~~~~--~-----~a~~v----- 191 (435) T protein:vir:80 133 NT-LSP--------GAGGVLVPENLSSEVIELLRPKSVVRKLGARTLPLSNGNITIPRLKGG--A-----IVGYI----- 191 (435) T ss_pred cc-cCC--------CCCccccchhHHHHHHHHHhhhchhhhccceeeecCCCceEEEEEeCC--c-----ceeee----- Confidence 00 000 011111111110000 0000 0011111 111222111111 0 11121 Q ss_pred cccccCCcCcccccceeccceeEEE----eeeeeechhHHHHhhhcc-cchHHHHHHHHHHHHHHHHhHHHhcCcccccC Q lcl|Aclame:pro 139 FEEGSQRPTARSIQPVYVPNFTQIF----RNAWALTDTARASYAEAG-YSNITESRRDCMDFHATEQETAIFFGQAFMGT 213 (418) Q Consensus 139 ~~EGada~~~~~~~~~~~~N~tQIf----~~~v~VSgTa~Av~~~g~-~dela~q~~kk~~EikrdmE~a~i~G~k~~~~ 213 (418) .||...+... + .+.+|- +-...+.-|.+.....+. .+..++-...-...+.+.+|.+||+|. | T Consensus 192 -~E~~~~~~~~--~-----~f~~i~~~~~k~~~~~~is~ell~ds~~~~~l~~~i~~~l~~a~~~~~d~a~l~G~----G 259 (435) T protein:vir:80 192 -GADTDIPTTQ--Q-----QFDDLKLTAKKMAALVPIANDLIKYAGVNPNVDQIVVGDLTAAIGAREDKAFIRDD----G 259 (435) T ss_pred -ccCccccccc--c-----ceeeEEEeeEEEEEeehhhHHHHHhhcccHHHHHHHHHHHHHHHHHHHHHHhhccC----C Confidence 3565544322 1 233333 233333344444443332 233355555566678999999999884 2 Q ss_pred cCCccchhhHHHHHHHhhccccCccccCCCC--ccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccc Q lcl|Aclame:pro 214 YNGQPLHTTQGIVDAVRQYAPDNVNAMPNPT--AVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFG 291 (418) Q Consensus 214 s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a--~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~ 291 (418) ++..| .||+... ...++.....+. .....++.+++..+...... .....+++++.....|.++...+| T Consensus 260 ~~~~p----~Gi~~~~---~~~~~~~~~~~~~~~~~~~d~~~~~~~~~~~~~~---~~~~~~vmn~~~~~~L~~lkd~~G 329 (435) T protein:vir:80 260 TANTP----KGLRFWA---LPGNVITASDGSTLQKIETDLGKAILALENADAN---LTQPGWIMAPRTFRFLEGLRDGNG 329 (435) T ss_pred CCCcc----cceeecc---cccceeecccccchhhHHHHHHHHHHHhhccccc---cccCEEEEcHHHHHHHHhhhccCC Confidence 22222 2554221 112222222211 12234455554444332111 112246678888888988765666 Q ss_pred eEEEccc--ceeeceEEEEEEcCCeEEEEEECcccccc---CCCCCeEEEEchhhceeeeccCCCcccccccccCccccc Q lcl|Aclame:pro 292 EVTVTQR--ETSYGMVFTEWKFFKGRLILKEHPLFSAI---GISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKS 366 (418) Q Consensus 292 ~~~~~~~--~~~~G~~v~~~~SdfG~v~vv~n~~l~~~---~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~ 366 (418) ++.+... ..-+|. .|+.+..+... .-....+++.|++++-+.-- .+...+.....+..+.. T Consensus 330 ~~l~~~~~~~~l~G~------------pv~~~~~~p~~~~~~~~~~~i~~gd~s~~~i~~~--~~~~i~~~~~~~~~~~~ 395 (435) T protein:vir:80 330 NKVYPELANGMLKGY------------PVGKTTQVPINLGEAGKESEIYFTDFGDVFIGEE--ETLEIDYSKEATYKDAD 395 (435) T ss_pred ceeccCCCCCeEeee------------eeEEeccccccccCCCCcceEEEEEcccEEEEee--cceEEEEeccccccccc Confidence 6554321 122232 23333222110 00112567777766432211 23333333222211000 Q ss_pred cccccccccCccccccEEEEEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 367 GATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 367 ~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~ 408 (418) .. ....--.|....+...-+.+.+.+|+|..+|+|++=.. T Consensus 396 ~~--~~~~f~~n~~~~r~~~r~d~~~~~~~a~~~l~~~~~~~ 435 (435) T protein:vir:80 396 GH--MVSAFQRDQTLIRVIAKNDFGPRHVESIAVLSGVAWGA 435 (435) T ss_pred cc--hhhhhhcCcceeeeeeeeCcEeecccceEEEeccCCCC Confidence 00 00000014455567777888999999999999997664 No 73 >protein:vir:103886 Length: 302 # NCBI annotation: putative major head subunit protein # Family: family:all:776 # MgeID: mge:1522 # MgeName: D3112 # Cross-refs: genbank:acc:NP_938242;genbank:gi:38229147;genbank:GeneID:2648201 Probab=57.09 E-value=0.38 Score=22.90 Aligned_cols=271 Identities=10% Similarity=-0.018 Sum_probs=113.5 Q ss_pred ceeEeccCceEEEEEEe-cCceeEEEccccccc----------hhhhhCCceEEEeecccccccCCcCcccccceec--- Q lcl|Aclame:pro 91 MIFYNEATGENMRLELV-NGLNLTVKRQTGRIS----------AAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYV--- 156 (418) Q Consensus 91 ~~~~~~~~~E~~~Vtav-~g~~~tv~rg~~~tt----------a~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~--- 156 (418) |++ +.+++. ++ .+-.-....||.... +......+-. .+ .++|.-+.-...+. T Consensus 1 m~i----t~~~l~--~l~~~~~~~~~~~y~~a~~~~~~~a~~~~sdf~~~~~~-~l-------g~~p~l~e~~Ge~~~~~ 66 (302) T protein:vir:10 1 MLI----NKQSLN--AAFVAIKTIFNNAFAAAPTTWQKIAMEVPSNTSSNDYK-WL-------STFPKMRRWIGAKVVKN 66 (302) T ss_pred Ccc----cHHHHH--HHHHHHHHHHHHHHHhhhhhhhceeeecCCCcceeece-ec-------CCCCCccccccceeecc Confidence 111 111110 00 000000000111100 0000000000 00 01111111000000 Q ss_pred ------cceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHh Q lcl|Aclame:pro 157 ------PNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVR 230 (418) Q Consensus 157 ------~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~ 230 (418) .---.=|.++|+||.-+-.=...|....+..++-.+..++--++=+.+|.+-....-+.+++-.. . T Consensus 67 l~~~~~~i~~~~~g~~v~i~R~~i~nDdlg~~~~~~~~~G~aaa~~~~~lv~~~L~~g~~~~~~DG~~fF~--------~ 138 (302) T protein:vir:10 67 LKAYKYVVENEDFEATVEVDRNDIEDDQIGIYSPQAKMAGYSAAQLPDELVYEAVNGAFTKPCFDGQYFID--------T 138 (302) T ss_pred ccccceeEEeecccceecccHHhhcccccchhHHHHHHHHHHHHhhHHHHHHHHHhccCCCcccCCcceec--------c Confidence 00112244555555444333445655566666666666666666666664311000011111000 0 Q ss_pred hcc--c---cCccc---cCCCCccchHH---HHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccc Q lcl|Aclame:pro 231 QYA--P---DNVNA---MPNPTAVTYDD---VVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRE 299 (418) Q Consensus 231 ~~~--~---~nv~~---~~~~a~~te~~---l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~ 299 (418) .|. . .|... ......++.+. ...++++....+|..-+..+++++|++.+.....++-. +.++ ....+ T Consensus 139 dH~~g~~~~~N~g~~~~~~~~~~l~~~~~~aa~~am~~~k~~~G~~L~i~P~~LiVp~~le~~A~~ll~-~~~~-~~g~~ 216 (302) T protein:vir:10 139 DHPVGDASVSNKGTAPLSNASQAAAKAGYGAARTAMKKFKDEEGRSLNVSPNVLLVGPALEDVAKMLLT-NPKL-ADNTP 216 (302) T ss_pred cccccccccccccchhhhhcccccchHHHHHHHHHHHHHhhhcccccccCCCEEEecchhHHHHHHHhh-cccc-CCCCc Confidence 000 0 00000 00112334333 34456666667777778889999999888777666522 2221 01111 Q ss_pred eeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccc Q lcl|Aclame:pro 300 TSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDA 379 (418) Q Consensus 300 ~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da 379 (418) |. -+|++.+|.+|+|++ +..=-|+=||..++..||+||..- +.-.+.++ +.|. T Consensus 217 Np----------~~g~~~~vv~p~L~s---~~aWyL~a~~~~i~~~~l~g~~~P-~~~~~~~~-------------~~dg 269 (302) T protein:vir:10 217 NP----------YVGTAELVVDGRIES---DTAWFLLDTTKPVKPFIFQPRKQP-EFVSQVNL-------------DSDD 269 (302) T ss_pred ce----------eccceEEEEeeccCC---CCceEEEecCCccceEEEcCcccc-EEEeccCC-------------CCCc Confidence 11 248999999999864 223445568999999999888432 11123332 1255 Q ss_pred cccEEEEEEEEEEecccceEEeecCcccccccC Q lcl|Aclame:pro 380 QGGSLTSEWALELLNPQGCAVITGLQKAKERVY 412 (418) Q Consensus 380 ~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~ 412 (418) .+..+.=.++...|--.+++-=-..=.++.++. T Consensus 270 v~~k~~~d~Gvd~R~~~G~~~wq~a~~s~g~~~ 302 (302) T protein:vir:10 270 VFNLRKLKFGAEARAAAGYGFWQLAYGSTGTGA 302 (302) T ss_pred eEEEEEEEEeeeeeeecchhhhhhhhccCccCC Confidence 666666666666665444432222222222221 No 74 >protein:vir:98566 Length: 355 # NCBI annotation: gp5 # Family: family:all:201 # MgeID: mge:1533 # MgeName: PSP3 # Cross-refs: genbank:acc:NP_958060;genbank:gi:41057357;genbank:GeneID:2744237 Probab=56.09 E-value=0.46 Score=22.41 Aligned_cols=300 Identities=13% Similarity=0.074 Sum_probs=126.8 Q ss_pred EEEE-------e----------ec--CceEEEEccccc-cccCceeEeccCceE------EEEEEecCceeEE--Ecccc Q lcl|Aclame:pro 68 VTAE-------A----------AA--DATVLTVENSDG-LTKGMIFYNEATGEN------MRLELVNGLNLTV--KRQTG 119 (418) Q Consensus 68 ~~a~-------~----------~a--~~t~~tV~~~~~-~~~~~~~~~~~~~E~------~~Vtav~g~~~tv--~rg~~ 119 (418) +... + .. ....++|+-+.. -....|.. ..|. +-|..+.|.++-+ ..... T Consensus 1 M~~~tr~~~~~y~~~~A~~ngv~~~~~~~~FsV~P~v~q~L~~~i~e---ss~FL~~INvv~V~e~~Ge~i~lgv~g~ia 77 (355) T protein:vir:98 1 MRPETRFKFNAYLTRVAELNNISTDDVSKKFTVEPSVTQTLMNTVQA---SSAFLKTINILPVAEMKGEKIGVGVTGTIA 77 (355) T ss_pred CChHHHHHHHHHHHHHHHHhCCChhHccceeecCHHHHHHHHHHHHH---HHHHhhcCceeccccceeeEeeeccCcccc Confidence 2111 0 00 001222221110 00000100 0111 1233333444322 11111 Q ss_pred ccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHH-HHHHHH Q lcl|Aclame:pro 120 RISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDC-MDFHAT 198 (418) Q Consensus 120 ~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk-~~Eikr 198 (418) ++|... ...|+.-......... .-.|+=-.--..+++-. ........+|...+... .+.+.+ T Consensus 78 grtdT~------------~~~~R~~~~~~~l~~~---~Y~c~qtn~dt~i~y~~--LD~WA~~~dF~~r~~~~i~k~~AL 140 (355) T protein:vir:98 78 STTDTS------------GDKERQTADFTALESS---KYECNQINFDFHLKYKT--LDLWARFQDFQRRIRDAIVKRQAL 140 (355) T ss_pred ccccCC------------CCCCcccccccccCCC---ccEEEEeeeeeeecHHH--HHHHhcChhHHHHHHHHHHHHHhh Confidence 111100 0001000000000000 01233222223344333 22222333566555544 456789 Q ss_pred HHhHHHhcCcccccCcCCc-cchh---hHHHHHHHhhccccCccccC-------------CCCccchHHHHHHHHHHHHh Q lcl|Aclame:pro 199 EQETAIFFGQAFMGTYNGQ-PLHT---TQGIVDAVRQYAPDNVNAMP-------------NPTAVTYDDVVDATIDAFKW 261 (418) Q Consensus 199 dmE~a~i~G~k~~~~s~~~-~~r~---t~GI~~~i~~~~~~nv~~~~-------------~~a~~te~~l~d~~~~~~~~ 261 (418) ||-.+=++|+..-..++-. .+.. =-|++-.++.+.+..+...+ -|..-++..|..++.++... T Consensus 141 D~i~IGfNG~s~A~~Td~~~nPllqDVNkGWlQ~~Re~ap~~v~~~~~~~~~~~~~~~i~~G~~gdy~NLDAlV~D~~~~ 220 (355) T protein:vir:98 141 DLIMAGFNGTTRADTSDRTKNTLLQDVAVGWLQKYRNEAPARVMSNITDADGKVVSAVIRVGKNGDYENIDALVMDATNN 220 (355) T ss_pred chhhhcccceeeeccCChhhCcCccccchhHHHHHHhcchhhhhhhhcccCccccccceeeCCCCCcccHHHHHHHHHhc Confidence 9999999999754444322 1111 23777677776655443211 12234567777777777643 Q ss_pred cccCC--CceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEc--CCeEEEEEECccccccCCCCCeEEEE Q lcl|Aclame:pro 262 SVNVG--DNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKF--FKGRLILKEHPLFSAIGISPGFAVVV 337 (418) Q Consensus 262 g~~~~--g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~S--dfG~v~vv~n~~l~~~~mp~d~~lv~ 337 (418) -...- ....=+++||.++... +....-++- ...+++.. .+.+.| -+|-+..+.-|+| |++.++|- T Consensus 221 lI~~~~~~d~dLVvivG~dLla~--k~~~l~n~~-~~ptE~~A---a~~i~s~k~iGGlpa~~~Pff-----P~~~~lVT 289 (355) T protein:vir:98 221 LIDEVYQDDPNLVAIVGRKLLAD--KYFPLVNKQ-QENSESLA---ADIIISQKRIGNLPAVRVPYF-----PANAVLVT 289 (355) T ss_pred cCChHHhcCCCEEEEEchhhhHH--HhhhHhhcc-CCcHHHHH---HHHHHHhhhhCCceeEEcccc-----CCCceEEe Confidence 22211 1112378899886542 211100110 11223222 122333 4677888888875 88999999 Q ss_pred chhhceeeeccC---CCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCC Q lcl|Aclame:pro 338 DVPAVKLAYMDG---RNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLT 414 (418) Q Consensus 338 D~~~~~~~~L~~---r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~ 414 (418) -.++|++.+..| |....++ .+. |. ++|-. ..- +-.|.+..+.|.|++++-+++..| . T Consensus 290 ~L~NLsIY~Q~gs~RR~~~d~p-~r~----ri--e~y~s-----~Ne-------~YvVEd~~~~a~ienI~~~~~~~~-~ 349 (355) T protein:vir:98 290 TLENLSIYFMDESHRRSIDENP-KKD----RV--ENYES-----MNI-------DYVVEVYAAGCLLENITLGDFTAP-A 349 (355) T ss_pred eccccEEEEecCcEEEEEEecc-ccc----cc--cchhh-----hcc-------eeeeeccccEEEeeceeeeCCCCC-c Confidence 999999999965 2221111 111 11 11110 011 223445556888999999877543 3 Q ss_pred CCCC Q lcl|Aclame:pro 415 APAP 418 (418) Q Consensus 415 ~~~~ 418 (418) +|+. T Consensus 350 ~~~~ 353 (355) T protein:vir:98 350 APES 353 (355) T ss_pred cccc Confidence 4443 No 75 >protein:vir:739 Length: 231 # NCBI annotation: major structural protein 4 # Family: family:all:522 # MgeID: mge:14 # MgeName: Tuc2009 # Cross-refs: genbank:acc:NP_108716;genbank:gi:13487838;genbank:GeneID:920884 Probab=55.90 E-value=0.47 Score=22.39 Aligned_cols=226 Identities=14% Similarity=0.003 Sum_probs=109.3 Q ss_pred EEEec-CceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhccc Q lcl|Aclame:pro 104 LELVN-GLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGY 182 (418) Q Consensus 104 Vtav~-g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~ 182 (418) --+|| |+++|+= -|.| .++.++ ||..-+....+.....-=..|+ .+.|+|++.++.+. +| T Consensus 1 ~~~~~~Gdtit~P-~~iG-da~~v~-------------eG~~i~~~~l~~t~~~atIk~~-gk~~~itD~a~l~~-~g-- 61 (231) T protein:vir:73 1 ENGINLANLCEYP-NDIG-DAADVA-------------EGGEISLDKIGTTTKSVTIKKA-AKGTEITDEAALSG-YG-- 61 (231) T ss_pred CccccCCceEEec-cccc-chhhhc-------------CCCcCChhhccccceeeeEeee-ccceeeeHHHHhhc-cC-- Confidence 12564 7888875 2322 233344 4444333222222221124665 78899999888763 22 Q ss_pred chHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhc Q lcl|Aclame:pro 183 SNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWS 262 (418) Q Consensus 183 dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g 262 (418) |-...-..+-...|++.+.+-++.-- ..++ -.....++.+.+.+++...-+ T Consensus 62 Dp~~ea~~Q~~~~iA~kvD~di~~~~-----~~a~----------------------l~~~~~~t~d~i~~A~~~fgd-- 112 (231) T protein:vir:73 62 DPIGESNKQLGLSLANKVDDDLLKAA-----KTTS----------------------QTVSTKANVDGVQAALDIFND-- 112 (231) T ss_pred chHHHHHHHHHHHHHHhhhHHHHHhh-----cccc----------------------ccccccccHHHHHHHHHHhcc-- Confidence 33333333334445555555444100 0000 001235788888888777432 Q ss_pred ccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEE----Ec Q lcl|Aclame:pro 263 VNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVV----VD 338 (418) Q Consensus 263 ~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv----~D 338 (418) . ...+++++|++...-.|-++...... ...-..++.++-..-.|-=++|+.++. +|.+..+. .- T Consensus 113 --e-~~~~~vivv~p~~~~~Lrk~~~~~~~----~~~~g~~i~~~G~iG~i~G~~Vi~S~~-----~~~~~~~~~~~i~~ 180 (231) T protein:vir:73 113 --E-DAQAYVLIVNPKDAAKIRKDANAKNI----GSEVGANALINGTYADVLGAQIVRSKK-----LAEGSALMFKIVSN 180 (231) T ss_pred --c-cccceEEEEcchHHHhhhhccchhhh----hhhhccceeeecccceEcceEEEEcCC-----CCCCceeeeeEEee Confidence 2 24567899998776666665321110 111111222222222221257777754 46666643 22 Q ss_pred hhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCcc Q lcl|Aclame:pro 339 VPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQK 406 (418) Q Consensus 339 ~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~ 406 (418) +..+ .++..|+...|.-+..- +.. |.. ..--=|...+-||....+|+-=+- T Consensus 181 ~gAl--~~~~k~~~~vEtdRd~~---~k~----------~~i--~~~~~y~v~l~~~~~vv~~t~~g~ 231 (231) T protein:vir:73 181 SPAL--KLVLKRGVQVETDRDIV---TKT----------TVI--TADEHYAAYLYDLTKVVNITFTGV 231 (231) T ss_pred ccce--eeeecccceeecccccc---ccc----------cEE--EEeEEEEEEEEcCccEEEEEeecC Confidence 4444 44444777666654332 000 111 111227889999998888743222 No 76 >protein:vir:4456 Length: 401 # NCBI annotation: Major capsid protein precursor # Family: family:all:21 # MgeID: mge:96 # MgeName: ST64B # Cross-refs: genbank:acc:NP_700379;genbank:gi:23505451;genbank:GeneID:955658 Probab=55.38 E-value=0.48 Score=22.33 Aligned_cols=305 Identities=11% Similarity=-0.007 Sum_probs=115.3 Q ss_pred Ccc----eee---eeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEee Q lcl|Aclame:pro 1 MSV----YAG---IFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAA 73 (418) Q Consensus 1 ~~~----~~~---~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~ 73 (418) ... ... .|-..|...++...+. -.+... + T Consensus 76 ~~~~~~e~~~a~~~~lr~~~~~~~~~~e~---------------~a~~~~-----------------------------~ 111 (401) T protein:vir:44 76 QNKVAAEHKDAFVGFLRKGREDGLRDLER---------------KALQVG-----------------------------T 111 (401) T ss_pred ccchhHHHHHHHHHHHhhhhhhhhHHHHH---------------HHhhcC-----------------------------C Confidence 000 000 0112333333311000 000000 0 Q ss_pred cCceEEEEcc--ccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccc Q lcl|Aclame:pro 74 ADATVLTVEN--SDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSI 151 (418) Q Consensus 74 a~~t~~tV~~--~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~ 151 (418) .++.-+.|.. ...+.....-...+ .-...+..+.+....+-+...++.+ .| ..||...+... T Consensus 112 ~~~GG~~iP~~~~~~ii~~~~~~~~l-~~~~~~~~~~~~~~~~~~~~~~~~a-------~w------v~E~~~~~~~~-- 175 (401) T protein:vir:44 112 DEDGGYAVPEELDRSILSLLKDEVVM-RQEATVITVGGSDYKKLVNLGGTAS-------GW------VGETDTRSQTA-- 175 (401) T ss_pred CCCCceeccHhHHHHHHHHHHhhhhh-hhhceeeecCCCceEEEEecCCccc-------ee------eccccccCccc-- Confidence 0000001100 00000000000000 0112233333433332222222111 12 13554332111 Q ss_pred cceeccceeEEEeeeeee----chhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHH Q lcl|Aclame:pro 152 QPVYVPNFTQIFRNAWAL----TDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVD 227 (418) Q Consensus 152 ~~~~~~N~tQIf~~~v~V----SgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~ 227 (418) ...+.||.-..-.+ .-|.+.+.-... +-..|-..+-...+.+.+|.+||+|.- ++ . ..||+. T Consensus 176 ----~~~~~~v~~~~~k~~~~~~iS~ell~ds~~-~l~~~i~~~la~ai~~~~~~~~l~G~G----~~-~----p~Gil~ 241 (401) T protein:vir:44 176 ----TSRLGLIEPFMGEIYGNPQATQKMLDDAFF-NVEAWINSELATEFAEQEEIAFTTGDG----TK-K----PKGFLA 241 (401) T ss_pred ----cccceeeeeehhheeeehhhhHHHHhcchH-HHHHHHHHHHHHHHHHHHHhhhhccCC----CC-c----cceeec Confidence 11355554433333 334444433221 323444444456678999999998753 11 1 234443 Q ss_pred HHhhccc--------cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccc Q lcl|Aclame:pro 228 AVRQYAP--------DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRE 299 (418) Q Consensus 228 ~i~~~~~--------~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~ 299 (418) ....... ......+..+.++.+++.++...+-.. ...+ ..++++......|.++.-.+|++-+... T Consensus 242 ~~~~~~~~~~~~~~~~~~~~t~~~~~~~~d~i~~~~~~l~~~--~~~~---a~~v~n~~~~~~L~~lkd~~G~~l~~~~- 315 (401) T protein:vir:44 242 YESTEESDKARAFGKLQHIVSGEATAVTADAIIKLIYTLRKA--HRTG---AKFMMNNNSLFAIRLLKDTEGNYLWRPG- 315 (401) T ss_pred cccccccccccccccccccccccccccCHHHHHHHHHhcchh--hhcC---CEEEEcHHHHHHHHHhhccCCceeecCC- Confidence 2111000 011122234467888888887655321 1111 2477888888888887555555444221 Q ss_pred eeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccc Q lcl|Aclame:pro 300 TSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDA 379 (418) Q Consensus 300 ~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da 379 (418) -..|.. .+=+|. .|+..+.+...+-....+++.|++..- ... +....+-+.. ++ . ..|. T Consensus 316 ~~~g~~----~~l~G~-PVv~~~~~p~~~~~~~~i~~Gd~~~~~-~i~--~~~~~~~~~~----------~~--~-~~~~ 374 (401) T protein:vir:44 316 LELGQP----SSLAGY-GIAENEQMPDIAADAKAIAFGNFKRGY-TIV--DRIGTRILRD----------PY--T-NKPF 374 (401) T ss_pred cCCCCC----ceecce-eeEEecCcCCccCCccEEEEeehhccE-EEE--EecceEEeee----------cc--c-cCCc Confidence 111110 011231 344444433222222346667886431 111 1111111100 00 0 0134 Q ss_pred cccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 380 QGGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 380 ~k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) ...+.+.-+...+.+++|+.+|. ++.| T Consensus 375 v~~~a~~r~d~~~~~~~a~~~l~-~~aa 401 (401) T protein:vir:44 375 VGFYTTKRTGGMLVDSQAIKLLK-IAAA 401 (401) T ss_pred EEEEEEEEeccEEecccceEEEE-eecC Confidence 44556667889999999997654 4444 No 77 >protein:vir:4997 Length: 397 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:109 # MgeName: Sfi21 # Cross-refs: genbank:acc:NP_049971;genbank:gi:9632943;genbank:GeneID:1262106 Probab=53.90 E-value=0.52 Score=22.15 Aligned_cols=317 Identities=12% Similarity=0.038 Sum_probs=115.5 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) ....... ....+..-..+........ -+.+..+.+...... ..+.. T Consensus 67 ~~~~~~~--~~~~~~~~~~~~~~~~~~~-------~~~~~l~~~~~~~~~-------------------------~~~~~ 112 (397) T protein:vir:49 67 EVANMSE--EEKKPLTKNEEEVKANFVK-------DFKNLVRGRYQNLLD-------------------------SKTDG 112 (397) T ss_pred hhhcccc--cccccccchhhHHHHHHHH-------HHHHHhhcchhhHHH-------------------------hhhcc Confidence 0000000 0001100000000000000 011111111000000 00000 Q ss_pred EccccccccCceeEeccCc---------eEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcc Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATG---------ENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTAR 149 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~---------E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~ 149 (418) .....++..+..+...+-+ ..+.|..+.+.. +.+.+... +.+. ..|. .||...++.. T Consensus 113 t~~~gg~~iP~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~-~~~~-----a~~v------~E~~~~~~~~ 180 (397) T protein:vir:49 113 SGSDAGLTIPQDIRTAINTLVRQFDSLQEYVNVENVTTLTGSRVYEKWAD-ITGL-----AKLD------DEGGQIGQND 180 (397) T ss_pred CCccCcceecHHHHHHHHHHHHhhhhHhhhcceeeccCCcceEEEEeecc-CCcc-----eeee------cccccccccc Confidence 1111112222111111111 112233444332 22222211 1111 1121 3665544322 Q ss_pred cccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHH Q lcl|Aclame:pro 150 SIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAV 229 (418) Q Consensus 150 ~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i 229 (418) ......+.=-..-+...+.|| .+...... .+-..+-...-...+.+.+|.++|+|.. .+. + T Consensus 181 ~~~~~~v~~~~~k~~~~~~iS--~ell~ds~-~~l~~~i~~~l~~~~~~~~d~ail~G~g----~~~-~----------- 241 (397) T protein:vir:49 181 DPKLSLIRYAIKRYAGISTVT--NSLLADSA-ENILAWLSGWIAKKVVVTRNKAILEAIG----TLP-N----------- 241 (397) T ss_pred ccceeeeEeeeeeeEeehhhH--HHHHhhhh-HHHHHHHHHHHHHHHHHHHHHHHHhccc----ccc-c----------- Confidence 111111111111112223333 33333222 2334555666667778899999998753 111 0 Q ss_pred hhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEE Q lcl|Aclame:pro 230 RQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEW 309 (418) Q Consensus 230 ~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~ 309 (418) .+..++.+++.++..++=.... ....+++++.....|.++...+|++.+... -..|. - T Consensus 242 ------------~~~~~~~d~i~~~~~~l~~~~~-----~~a~~v~n~~~~~~l~~lkd~~g~~l~~~~-~~~g~----~ 299 (397) T protein:vir:49 242 ------------KPTLAKWDDIIDLQAKVDPAIK-----QTSLFLTNTSGFTALKKVKNAMGDYLMERD-VKSPT----G 299 (397) T ss_pred ------------cccccCHHHHHHHHHhhhhhhc-----CCCEEEEcHHHHHHHHHhhccCCceeeccc-ccCCC----C Confidence 1224566777777665533221 123578899888899888655666544321 00010 0 Q ss_pred EcCCeE-EEEEECccccccCCCCCeEEEEchhh-ceeeeccCCCcccccccccCccccccccccccccCccccccEEEEE Q lcl|Aclame:pro 310 KFFKGR-LILKEHPLFSAIGISPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSE 387 (418) Q Consensus 310 ~SdfG~-v~vv~n~~l~~~~mp~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E 387 (418) .+=+|. |.+..+..+..-.++...+++.|+.. +.+... .+...+.....+. + + -.|....+...- T Consensus 300 ~~l~G~pV~~~~~~~~~~~~~~~~~~~~gd~~~~~~~~~~--~~~~i~~~~~~~~--~-~--------~~~~~~~~~~~r 366 (397) T protein:vir:49 300 YSIDGFVVKEISDRFLPNGTGGAMPLYFGDLKQAVTLFDR--QHLSLLSTNIGGG--A-F--------ETDTTKVRVIDR 366 (397) T ss_pred ceecceeeEEecccccccccCCceeEEEeeccceEEEEee--cccEEEEeccccc--h-h--------hcCeeeEEEEEe Confidence 111332 22222323322233344677778764 322222 1111111111110 0 0 002333345677 Q ss_pred EEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 388 WALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 388 ~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) +...+++++|+.+++--.++. ..|.+.+.- T Consensus 367 ~d~~~~~~~a~~~~~~~~~~~-~~~~~~~~~ 396 (397) T protein:vir:49 367 FDVVSTDTEAFVPASFKAIAD-QKAKLSTAG 396 (397) T ss_pred eccEEecccceEEEEeccccc-ccCcccccC Confidence 888999999999997655542 111121111 No 78 >protein:vir:485 Length: 407 # NCBI annotation: putative major capsid protein # Family: family:all:21 # MgeID: mge:11 # MgeName: P27 # Cross-refs: genbank:acc:NP_543092;swissprot:trembl:q8w627;genbank:gi:18249904;uniprot:Q8W627;genbank:GeneID:929693 Probab=52.99 E-value=0.54 Score=22.05 Aligned_cols=313 Identities=12% Similarity=0.038 Sum_probs=115.8 Q ss_pred Ccceeeeec---cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCce Q lcl|Aclame:pro 1 MSVYAGIFN---TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADAT 77 (418) Q Consensus 1 ~~~~~~~~~---~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t 77 (418) -+-....|. .+|...++...+. -.+.. .+.+.-+++- |+.. .. T Consensus 79 ~~e~~~a~~~~l~~g~~~~~~~~e~---------------~a~~~------~t~~~gG~~i----P~~~---------~~ 124 (407) T protein:vir:48 79 ASEHKEAFIGFMRKGREDGLRELER---------------KALQV------GNDEDGGYAI----PEEL---------DR 124 (407) T ss_pred hhHHHHHHHHHHhccchhhhhHHHH---------------Hhhhc------ccCCCCcccc----cHhH---------HH Confidence 000000000 1333333322111 00000 0000011110 0000 00 Q ss_pred EEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecc Q lcl|Aclame:pro 78 VLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVP 157 (418) Q Consensus 78 ~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~ 157 (418) + +- ..+.....+. -...+.-+.+..+.+-+-..++.+ .|. .||...+... .. T Consensus 125 ~--I~--~~~~~~~~l~-----~~~~~~~~~~~~~~~~~~~~~~~a-------~~v------~E~~~~~~~~------~~ 176 (407) T protein:vir:48 125 T--IL--TLLKDEVVMR-----QEATVITLGGSDYKKLVNLGGTTS-------GWV------GETDARPETA------TS 176 (407) T ss_pred H--HH--HHHHhhhhhh-----hhceeeecCCCceEEEEecCCcce-------eee------cccccccccc------cc Confidence 0 00 0000000000 000011111111111111112111 121 3554433211 12 Q ss_pred ceeEEEeeeee----echhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhcc Q lcl|Aclame:pro 158 NFTQIFRNAWA----LTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYA 233 (418) Q Consensus 158 N~tQIf~~~v~----VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~ 233 (418) .+.||--..-. +.-|.+...-.. .+-..|-..+-...+.+-+|.+||+|.- .+ + -.||+....... T Consensus 177 ~f~~i~~~~~k~~~~~~iS~ell~ds~-~~l~~~i~~~l~~~i~~~~~~a~l~G~G----~~-~----p~Gil~~~~~~~ 246 (407) T protein:vir:48 177 KLGLIEPFMGEIYGNPQATQKMLDDAF-FNVEDWINSELALEFAEQEEIAFTSGDG----SK-K----PKGFLAYESTDE 246 (407) T ss_pred cceeEEeeeeeeEeehhhHHHHHhcch-HHHHHHHHHHHHHHHHHHHHhhhhccCC----CC-c----cceeeecccccc Confidence 24444333322 334444444322 2333444455556678999999998842 11 2 225543221100 Q ss_pred ccC--------ccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceE Q lcl|Aclame:pro 234 PDN--------VNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMV 305 (418) Q Consensus 234 ~~n--------v~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~ 305 (418) .++ .......+.++.+++.++...+-...- +++ .++++......|.++.-.+|++-+... -..|.. T Consensus 247 ~~~~~~~~~~~~~~~~~~~~~~~d~i~~l~~~l~~~~~--~~a---~~v~n~~~~~~L~~lkD~~Gr~l~~~~-~~~g~~ 320 (407) T protein:vir:48 247 DDKTRAFGKLQHIASGAASGVTADAIIKLIYTLRKAHR--SGA---KFMMNNSSLFAIRLLKDNDGNYLWRPG-IELGQP 320 (407) T ss_pred cccccccccccccccccccccChHHHHHHHHhhchhhh--cCC---EEEEcHHHHHHHHHhhccCCceeeccC-cCCCCC Confidence 000 112223346788999988877654321 221 366888888888887555566544321 111110 Q ss_pred EEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhc-eeeeccCCCcccccccccCccccccccccccccCccccccEE Q lcl|Aclame:pro 306 FTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSL 384 (418) Q Consensus 306 v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i 384 (418) .+=+|. .|+.++.+..-+-....+++-|++.. .+.--.+-.+..+++.. .|...... T Consensus 321 ----~~l~G~-PV~~~~~~p~~~~~~~~i~~Gd~~~~~~i~~~~~~~i~~d~~~~-----------------~~~~~~~~ 378 (407) T protein:vir:48 321 ----SSLAGY-GIVENEQMPDIAADAKAIAFGNFKRGYTIVDRIGTRILRDPYTN-----------------KPFVGFYT 378 (407) T ss_pred ----ceecce-eeEEecCcCCccCCccEEEEEeccccEEEEEeeceEEEeecccc-----------------CCcEEEEE Confidence 011342 44555443221111234566787642 11111111111111111 13444455 Q ss_pred EEEEEEEEecccceEEeecCcccccccCCCCCC Q lcl|Aclame:pro 385 TSEWALELLNPQGCAVITGLQKAKERVYLTAPA 417 (418) Q Consensus 385 ~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~ 417 (418) +.-+...+.+++|+.++.-=..+..+.. | T Consensus 379 ~~r~d~~v~~~~a~~~l~~~aa~~~~~~----~ 407 (407) T protein:vir:48 379 TKRTGGMLVDSQAIKLMKIGAATRQKAA----A 407 (407) T ss_pred EEEeccEEecccceEEEEeeccCCCCCC----C Confidence 6678899999999977654333222211 1 No 79 >protein:vir:6061 Length: 357 # NCBI annotation: gpN # Family: family:all:201 # MgeID: mge:126 # MgeName: WPhi # Cross-refs: genbank:acc:NP_878202;genbank:gi:33438901;genbank:GeneID:1457736 Probab=51.76 E-value=0.14 Score=25.20 Aligned_cols=327 Identities=12% Similarity=0.059 Sum_probs=132.4 Q ss_pred hhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEec Q lcl|Aclame:pro 17 LNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNE 96 (418) Q Consensus 17 ~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~ 96 (418) ++++ .+..-| .-+.++-.+.|...... -++|+..-...+ ++-. . -..+++.+....++. T Consensus 1 M~~~------tr~~~~--~y~~~~A~~ngv~~~d~--~~~FsV~P~v~q-~L~~-------~-i~ess~FL~~INvv~-- 59 (357) T protein:vir:60 1 MRQE------TRFKFN--AYLSRVAELNGIDAGDV--SKKFTVEPSVTQ-TLMN-------T-MQESSDFLTRINIVP-- 59 (357) T ss_pred CChH------HHHHHH--HHHHHHHHHhCCChHHh--cceeecCHHHHH-HHHH-------H-HHHHHHHhccCCccc-- Confidence 1000 000000 11112222222111100 012221100000 0000 0 011333333333321 Q ss_pred cCceEEEEEEecCceeEE--EccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHH Q lcl|Aclame:pro 97 ATGENMRLELVNGLNLTV--KRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTAR 174 (418) Q Consensus 97 ~~~E~~~Vtav~g~~~tv--~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~ 174 (418) |..+.|.++-+ .....++|... +. -.| +-.|.. ..... .-.|+=-.--..+++-. T Consensus 60 -------V~e~~Ge~i~lg~~g~iagrtdT~---~~-~~R------~~~~~~--~l~~~---~Y~c~qTn~dt~i~Y~~- 116 (357) T protein:vir:60 60 -------VSEMKGEKIGIGVTGSIASTTDTA---GG-TER------QPKDFS--KLASN---KYECDQINFDFYIRYKT- 116 (357) T ss_pred -------cccceeeEEecccCcccccccccC---CC-CCc------cccccc--ccCCC---ccEEEEeeeeccccHHH- Confidence 33333444321 00111111100 00 000 000000 00000 01222222223333332 Q ss_pred HHhhhcccchHHHHHHH-HHHHHHHHHhHHHhcCcccccCcCCccchh----hHHHHHHHhhccccCcccc------C-- Q lcl|Aclame:pro 175 ASYAEAGYSNITESRRD-CMDFHATEQETAIFFGQAFMGTYNGQPLHT----TQGIVDAVRQYAPDNVNAM------P-- 241 (418) Q Consensus 175 Av~~~g~~dela~q~~k-k~~EikrdmE~a~i~G~k~~~~s~~~~~r~----t~GI~~~i~~~~~~nv~~~------~-- 241 (418) ........+|...+.. -.+.+.+||-.+=++|+..-..++-..-.. =-|++-.++.+.+..+... . T Consensus 117 -lD~WA~~~dF~~r~~~~i~~~~ALD~i~IGfNGts~A~~Td~~~nPllqDVN~GWlQ~~Re~ap~rVm~~~~~~~g~~~ 195 (357) T protein:vir:60 117 -LDLWARYQDFQLRVRNAIIKRQSLDLIMAGFNGVRRAETSDRSSNQMLQDVAVGWLQKYRNEAPARVMSKVTDEEGHTT 195 (357) T ss_pred -HHHHhcChhHHHHHHHHHHHHHhhccceecccceeeeccCChhhCcCccccchhHHHHHHhhchhhhhccccccCCccc Confidence 2222233456555544 345678999999999997554443221111 1277777777665544321 0 Q ss_pred -----CCCccchHHHHHHHHHHHHhcccCC--CceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEc--C Q lcl|Aclame:pro 242 -----NPTAVTYDDVVDATIDAFKWSVNVG--DNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKF--F 312 (418) Q Consensus 242 -----~~a~~te~~l~d~~~~~~~~g~~~~--g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~S--d 312 (418) -|..-++..|..++.++...-...- ....=+++||.++.. .+....-++-. ..+++.. .+.+.| - T Consensus 196 ~~~i~~G~~gdy~NLDalV~D~~~~lI~~~~~~d~dLVvivG~dLla--~k~~~l~n~~~-~pTE~~A---a~~i~s~k~ 269 (357) T protein:vir:60 196 SEVIRVGKGGDYASLDALVMDATNNLIEPWYQEDPDLVVIVGRQLLA--DKYFPIVNREQ-DNSEMLA---ADVIISQKR 269 (357) T ss_pred cceeeecCCCCcccHHHHHHHHHhccCChHHhcCCCEEEEEchhhhh--HHhhhHhhcCC-ChHHHHH---HHHHHHhhh Confidence 1122356777777777765322211 111247889988764 22111001100 1223221 223333 4 Q ss_pred CeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC---CcccccccccCccccccccccccccCccccccEEEEEEE Q lcl|Aclame:pro 313 KGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR---NAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWA 389 (418) Q Consensus 313 fG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r---~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~t 389 (418) +|-+..+.-|+| |++.++|--.++|++.|..|- ....++ .+. |.. +|-. ..- + T Consensus 270 iGGl~a~~~PfF-----P~~~llVT~L~NLsIY~Q~gs~RR~~~d~p-~r~----riE--~y~s-----~Ne-------~ 325 (357) T protein:vir:60 270 IGNLPAVRVPYF-----PADAMLITKLENLSIYYMDDSHRRVIEENP-KLD----RVE--NYES-----MNI-------D 325 (357) T ss_pred hcCcceEEcccc-----CCCceEEeeccccEEEEecCcEEEEEEecc-ccc----ccc--chhh-----hcc-------e Confidence 787888888875 889999999999999999652 221111 111 111 1100 011 2 Q ss_pred EEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 390 LELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 390 Lev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) -.|.+..+.|.|++++-+++..|...+++ T Consensus 326 YvVEd~~~~a~iE~i~~~~~~~pa~~~~~ 354 (357) T protein:vir:60 326 YVVEDYAAGCLVEKIKVGDFSTPAKATAE 354 (357) T ss_pred eeeeccccEEEeeeeeeccCcccccCCCC Confidence 23445556888999988766655444444 No 80 >protein:vir:8420 Length: 477 # NCBI annotation: gp15 # Family: family:all:21 # MgeID: mge:155 # MgeName: Omega # Cross-refs: genbank:acc:NP_818316;genbank:gi:29566752;genbank:GeneID:1260033 Probab=50.95 E-value=0.6 Score=21.82 Aligned_cols=355 Identities=10% Similarity=-0.033 Sum_probs=113.4 Q ss_pred Ccceeeeecc---------CCCh----hhhhhhhcccceeEeecCC--cchhHHHhhhccccceeeeeeeeeeee--ccc Q lcl|Aclame:pro 1 MSVYAGIFNT---------TLNP----QELNMKSFAGTILRRVPNG--SAPLLAMTSVVGSTTAKASTHGYFSKT--MVF 63 (418) Q Consensus 1 ~~~~~~~~~~---------~~~~----~~~~~~s~~~~~~~~~~~~--~~p~~~l~~~~~~~~~~~~~~~~~~~~--~~~ 63 (418) .+-..+.-+. ..++ ...+.+++...+.-..... ......+.+.. ......+++.... ... T Consensus 77 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~---~~~~~~~~~~~~~~~~~~ 153 (477) T protein:vir:84 77 IERSGKLEAETKTVRKATVEVNEALTYEKGNGQSYFRDLAMQTVGMADEPAKERLRRHM---VDVESDKEIRKIAKVGEE 153 (477) T ss_pred HHHhhcchhhhhhhcccccccccchhhhhhHHHHHHHHHHHHHhhhhhhHHHHHHHHHH---hhhhhhhhHHHHHHhhhh Confidence 0000000000 0000 0001111100000000000 00000000000 0011111111100 000 Q ss_pred ceeEEEEEeecCceEEEEccccccccCceeEeccC----ceEEEEEEecCc--eeEEEccccccchhhhhCCceEEEeec Q lcl|Aclame:pro 64 ASAVVTAEAAADATVLTVENSDGLTKGMIFYNEAT----GENMRLELVNGL--NLTVKRQTGRISAAIIAANTKLIVIGT 137 (418) Q Consensus 64 ~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~----~E~~~Vtav~g~--~~tv~rg~~~tta~~~~~gt~v~~~g~ 137 (418) .... +. .+..+..+.... +..+.++..... .-.+.+..+.+. .+++-+-..+... ..|. T Consensus 154 ~~~~-~~-~~~~gg~lv~~~---~~~~~ii~~l~~~~~i~~~~~~~~~~~~~~~~~ip~~~~~~~~------a~~~---- 218 (477) T protein:vir:84 154 YRDL-DR-NGGTGGYAVPPL---WMMNRFIELARAGRTYANLCPTEPLPGGTSSINIPKILTGTST------AIQA---- 218 (477) T ss_pred hccc-cc-cCCCcceeeccc---hhHHHHHHHhhhcchHHHhhceeeecCCcceeEEEEEecCcce------eeee---- Confidence 0000 00 000011100000 111111100000 001122223322 2332221111110 1111 Q ss_pred ccccccCCcCcccccceeccceeEEEeeeee----echhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccC Q lcl|Aclame:pro 138 AFEEGSQRPTARSIQPVYVPNFTQIFRNAWA----LTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGT 213 (418) Q Consensus 138 a~~EGada~~~~~~~~~~~~N~tQIf~~~v~----VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~ 213 (418) .||+..+.. ..|.... .+-+|--+.-. +.-|.+....... +-.+|-..+-...+.+-+|.+||+|. | T Consensus 219 --~Eg~~~~~~-~~~~s~~-~f~~i~~~~~k~~~~~~iS~ell~ds~~-~l~~~i~~~l~~~~~~~~d~~~l~G~----G 289 (477) T protein:vir:84 219 --ADNAALTAP-SAHEVDL-TDGFVQANVKTIAGQQGIAIQLLDQAAV-SVDEFVFRDLAADYANKLNVQVISGT----G 289 (477) T ss_pred --ccCcccccc-ccccccc-ceeeEEEeeeeEEeeeHHHHHHHhccch-hHHHHHHHHHHHHHHHHHHHHHhccC----C Confidence 355432221 1111111 24444433333 3345555544332 33455556666778999999999874 2 Q ss_pred cCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHH---HHHHhcccCCCceeEEEEeChHHHHHHHhhhhcc Q lcl|Aclame:pro 214 YNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATI---DAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFF 290 (418) Q Consensus 214 s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~---~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~ 290 (418) .+.+| .||+... ....+... .+..+...+..+.. ++...-..........++.++.....|.++.-.+ T Consensus 290 t~~~p----~Gi~~~~---~~~~~~~~--~~~~t~~~~~~~~~~i~~~~~~~~~~~~~~~~~~v~~~~~~~~l~~lkd~~ 360 (477) T protein:vir:84 290 SNNQV----VGVRATA---GITQVTAT--SAGSALEKHQIIYQKIADAIQRVHTSRFLEPEVIVMHPRRWASFHAIFAGD 360 (477) T ss_pred CCCcc----ceeeecc---cccccccc--ccccchhhHHHHHHHHHHHHhhccccccCCccEEEEcHHHHHHHHHhhccC Confidence 22232 3665321 11111111 11222222222221 2211110111112235667877777888875556 Q ss_pred ceEEEcccceee---ceEEEEEE-cCCeEE---EEEECccccccCCCCC--------eEEEEchhhceeeeccCCCcccc Q lcl|Aclame:pro 291 GEVTVTQRETSY---GMVFTEWK-FFKGRL---ILKEHPLFSAIGISPG--------FAVVVDVPAVKLAYMDGRNAKVE 355 (418) Q Consensus 291 ~~~~~~~~~~~~---G~~v~~~~-SdfG~v---~vv~n~~l~~~~mp~d--------~~lv~D~~~~~~~~L~~r~~~~e 355 (418) +++-+......+ +.....+. -..|++ .|+.++. ||++ .+++.|.+.+-+. T Consensus 361 G~~l~~~~~~~~~~~~~~~~~~~~~~~~~l~G~pVv~s~~-----~p~~~~~~~d~~~i~~gd~~~~~i~---------- 425 (477) T protein:vir:84 361 DRPLIVPSGPGFNNLGVLTEVASQRVVGQMHGLPVVTDPT-----LPTTLGTGTDQDVIHVLRASDLALF---------- 425 (477) T ss_pred CCeeeecCcccccccccccccccccccchhcccceEecCc-----ccccccccCCcceEEEEEeceEEEE---------- Confidence 665443222111 10000000 011222 4555543 4433 4566666554221 Q ss_pred cccccCccccccccccccccCccccccEEEEEEE-EEEecccceEEeecCcccccccC Q lcl|Aclame:pro 356 NYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWA-LELLNPQGCAVITGLQKAKERVY 412 (418) Q Consensus 356 ~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~t-Lev~N~kA~a~I~gL~~~~~~~~ 412 (418) ..|.+......++. +-+..-.++++.+. +-+|+|+|+.+|+|-.+..|+-. T Consensus 426 ---~~~~~~~~~~~~~~---~~~~~~~~v~~~~~~~~~r~~~afv~~t~~~~~~~~~~ 477 (477) T protein:vir:84 426 ---ESSVRMRALQETRA---ENLSVLLQVYGYLAFTAARFPQSVVEIGGTALTAPTFA 477 (477) T ss_pred ---eeceeEEecccccc---ccceeeeeehhhhhhhhhccccceEEeecccccccccC Confidence 11111111111111 00111223344333 46689999999999877755544 No 81 >protein:vir:1829 Length: 355 # NCBI annotation: major capsid protein # Family: family:all:201 # MgeID: mge:324 # MgeName: 186 # Cross-refs: genbank:acc:NP_052253;genbank:gi:9634060;genbank:GeneID:1262428 Probab=50.04 E-value=0.6 Score=21.79 Aligned_cols=314 Identities=13% Similarity=0.061 Sum_probs=133.3 Q ss_pred hhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEc-------------c Q lcl|Aclame:pro 17 LNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVE-------------N 83 (418) Q Consensus 17 ~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~-------------~ 83 (418) ++++ .+..-| .-+.++-.+.|..... ....++|+ + T Consensus 1 M~~~------tr~~~~--~y~~~~A~~ngv~~~~------------------------~~~~Fsv~P~v~q~L~~~i~es 48 (355) T protein:vir:18 1 MRQE------TRFKFN--AYLTQLAKLNGISVDD------------------------VSKKFTVEPSVTQTLMNTVQAS 48 (355) T ss_pred CChH------HHHHHH--HHHHHHHHHhCCChhH------------------------ccceeccCHHHHHHHHHHHHHH Confidence 1110 000000 1122222222221100 01122332 3 Q ss_pred ccccccCceeEeccCceEEEEEEecCceeEE--EccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeE Q lcl|Aclame:pro 84 SDGLTKGMIFYNEATGENMRLELVNGLNLTV--KRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQ 161 (418) Q Consensus 84 ~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv--~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQ 161 (418) ++.+....++ -|..+.|.++-+ .....++|... ...|+.-......... .-.|+ T Consensus 49 s~FL~~INvv---------~V~e~~Ge~i~lgv~g~iagrtdT~------------~~~~R~~~~~~~l~~~---~Y~c~ 104 (355) T protein:vir:18 49 SAFLQMINIL---------PVAEMKGEKIGVGVTGTIASTTDTS------------GDKERQTADFTALESN---KYECN 104 (355) T ss_pred HHHhhcCcee---------ccccceeeEEeeccCcceeeccccC------------CCCCcccccccccCCC---ccEEE Confidence 3323333332 133333444321 11111222110 0001100000000000 01222 Q ss_pred EEeeeeeechhHHHHhhhcccchHHHHHHHH-HHHHHHHHhHHHhcCcccccCcCCc-cchh---hHHHHHHHhhccccC Q lcl|Aclame:pro 162 IFRNAWALTDTARASYAEAGYSNITESRRDC-MDFHATEQETAIFFGQAFMGTYNGQ-PLHT---TQGIVDAVRQYAPDN 236 (418) Q Consensus 162 If~~~v~VSgTa~Av~~~g~~dela~q~~kk-~~EikrdmE~a~i~G~k~~~~s~~~-~~r~---t~GI~~~i~~~~~~n 236 (418) =-.--..+++-. ........+|...+... .+.+.+||-.+=++|+..-..++-. .+.. =-|++-.++.+.+.. T Consensus 105 qtn~dt~i~y~~--LD~WA~~~dF~~r~~~~i~k~~ALD~i~IGfNG~s~A~~Td~~~nPllqDVNkGWlQ~~Re~ap~r 182 (355) T protein:vir:18 105 QINFDFHLTYKR--LDLWARFQDFQRRIRDAIVQRQALDFIMAGFNGTTRADTSDRVKNPMLQDVAVGWLQKYRNEAPAR 182 (355) T ss_pred EeeeeeeecHHH--HHHHhcChhHHHHHHHHHHHHHhhchhhhcccceeeeccCChhhCcCccccchhHHHHHHhcchhh Confidence 222223344333 22222233466555544 4567899999999999754444322 1111 237777777766554 Q ss_pred ccccC-------------CCCccchHHHHHHHHHHHHhcccCC--CceeEEEEeChHHHHHHHhhhhccceEEEccccee Q lcl|Aclame:pro 237 VNAMP-------------NPTAVTYDDVVDATIDAFKWSVNVG--DNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETS 301 (418) Q Consensus 237 v~~~~-------------~~a~~te~~l~d~~~~~~~~g~~~~--g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~ 301 (418) |...+ -|..-++..|..++.++...-...- ....=+++||.++.. .+....-.+- -..+++. T Consensus 183 V~~~~~~~~~~~~~~~i~~G~~gdy~NLDAlV~d~~~~lI~~~~~~d~dLVvivG~dLla--~k~~~l~n~~-~~ptE~~ 259 (355) T protein:vir:18 183 VMSNITDADGKVVSAVIRVGKNGDYENLDALVMDGTNTLIDEIYQDDPKLVAIVGRKLLA--DKYFPLVNKQ-QENTESL 259 (355) T ss_pred hhccccccccccccceeeecCCCCcccHHHHHHHHHhccCChHHhcCCCEEEEEchhhhH--HHHhHHhhcc-CChHHHH Confidence 43211 0122356777777777775322211 111237889988654 2211100110 1123332 Q ss_pred eceEEEEEEc--CCeEEEEEECccccccCCCCCeEEEEchhhceeeeccC---CCcccccccccCccccccccccccccC Q lcl|Aclame:pro 302 YGMVFTEWKF--FKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDG---RNAKVENYGQGGGENKSGATDYSYGHG 376 (418) Q Consensus 302 ~G~~v~~~~S--dfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~---r~~~~e~laKtG~~~~~~~~~~~~~~g 376 (418) . .+.+.| -+|-+..+.-|+| |++.++|--.++|++.+..| |.+..++ .+. |. ++ T Consensus 260 A---a~~i~s~k~iGGlpa~~~Pff-----P~~~~lVT~L~NLsIY~Q~gs~RR~~~d~p-~r~----ri--e~------ 318 (355) T protein:vir:18 260 A---ADIIISQKRIGNLPAVRVPYF-----PANAVFVTTLENLSIYFMDESHRRSIDENP-KKD----RV--EN------ 318 (355) T ss_pred H---HHHHHHHHhhCCceeEEcccc-----CCCceEEeeccccEEEEecCcEEEEEEecc-ccc----cc--cc------ Confidence 2 233333 4777888888875 88999999999999999965 2221111 111 11 11 Q ss_pred ccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 377 VDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 377 ~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) ++.. - -+-.|.+..+.|.|++++-+++..|+++..- T Consensus 319 --y~s~---N-e~YvVEd~~~~a~ieni~~~~~~~~~~~~~g 354 (355) T protein:vir:18 319 --YESM---N-IDYVVEAYAAGCLLENITLGDFTAPAAPEGG 354 (355) T ss_pred --hhhh---c-ceeeeeccccEEEEeeeeecCCCCcccccCC Confidence 1100 0 1223445557888999998876544333333 No 82 >protein:vir:95318 Length: 328 # NCBI annotation: hypothetical protein # Family: family:all:1903 # MgeID: mge:1564 # MgeName: phiV10 # Cross-refs: genbank:acc:YP_512264;genbank:gi:89152431;genbank:GeneID:3952987 Probab=48.99 E-value=0.65 Score=21.60 Aligned_cols=240 Identities=11% Similarity=0.135 Sum_probs=103.7 Q ss_pred cccceeEEEEEeecCceEEEEc---cccccccCceeEe-ccCceE---EEEEEec-Cc--eeEEEccccccchhhhhCCc Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVE---NSDGLTKGMIFYN-EATGEN---MRLELVN-GL--NLTVKRQTGRISAAIIAANT 130 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~---~~~~~~~~~~~~~-~~~~E~---~~Vtav~-g~--~~tv~rg~~~tta~~~~~gt 130 (418) |.....+. -|-+.++ +.++.. ..|++. .-..|+ |....++ |. .-++. .-..+. T Consensus 1 m~~~~~~~-------~TL~e~Akr~~~d~~~-~~VIE~l~~~n~IL~~lpf~e~n~gt~~~~~v~---------~~LP~~ 63 (328) T protein:vir:95 1 MAVKGLTA-------LTLADWGKRVDPNGKV-DKIIELLGQTNPILQDMPFVEGNLPTGHRTTIR---------SGLPSA 63 (328) T ss_pred CCcccccc-------ccHHHHHhhhCcchhH-HHHHHHHhccchhHhhcceeecccCCcceeeEe---------eccCCc Confidence 22111111 1111111 111110 111110 011122 2233332 22 11111 112334 Q ss_pred eEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccc-hHHHHHHHHHHHHHHHHhHHHhcCcc Q lcl|Aclame:pro 131 KLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYS-NITESRRDCMDFHATEQETAIFFGQA 209 (418) Q Consensus 131 ~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~d-ela~q~~kk~~EikrdmE~a~i~G~k 209 (418) .+..++... .+....+.+++-.|=||.-.++|..-... ..|..+ ..+.|.+.+++-+.++++..||+|-- T Consensus 64 ~fR~lN~g~-------~~s~~tt~q~t~~l~ilgg~~eVDr~la~--~~Gn~~~~ra~q~~~~~ka~~~~~~~~~iyGds 134 (328) T protein:vir:95 64 TWRLLNYGV-------QPSKSTTVQVTDSVGMLETYAEVDKSLAD--LNGNTAEFRLSEDRAFIEAMNQQMAQTLFYGDS 134 (328) T ss_pred eeeecCCcc-------CcccceeEEEEEEEEEEecceeechHHHh--hcCCHHHHHHHHHHHHHHHHHHHHHHHHhcCCc Confidence 455443222 22233466778899999999999985543 345443 35889999999999999999999821 Q ss_pred -------------cccC---------------cCCccc-------hhhHHHHHHHhh----c---cc------------- Q lcl|Aclame:pro 210 -------------FMGT---------------YNGQPL-------HTTQGIVDAVRQ----Y---AP------------- 234 (418) Q Consensus 210 -------------~~~~---------------s~~~~~-------r~t~GI~~~i~~----~---~~------------- 234 (418) +.+. ++-+.. ..+.||+.--.+ + .+ T Consensus 135 a~~p~~F~GL~~R~~~~s~~~a~qiidaGgtg~~~TSi~~v~~g~~~~~giyPkG~~~Gl~~~d~g~~~~~~~~g~~y~~ 214 (328) T protein:vir:95 135 SVNPQQFMGLSSRYSSLSAGNAQNIIDAGGTGTDNTSIWLVVWGENTVHGIFPKGKKAGIQMEDKGQVTLEDANGGKYEG 214 (328) T ss_pred cCChhhhcchhhhcCccccccccceeecccCCCCceEEEEEEEcCCeEEEecccccccCceeeecCceeeecCCCCeeeE Confidence 1100 000000 112233210000 0 00 Q ss_pred ----------------------cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccce Q lcl|Aclame:pro 235 ----------------------DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGE 292 (418) Q Consensus 235 ----------------------~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~ 292 (418) .|.+...-+....-.++.+++-++..+= ...+....++||+.+....|.+-....++ T Consensus 215 y~~~~~w~~Gl~i~d~r~vvrI~NId~~~l~~~~~~~~l~~lm~~a~~~i-p~~~~~~~~~y~n~~v~~~L~~q~~~~~n 293 (328) T protein:vir:95 215 YRTHYKWDNGLALRDWRYVVRIANIDVSNLSEPSSAANIAKLMVKALHRI-PNRGMGRPVFYMNRTVGQALDLQSLEKTS 293 (328) T ss_pred EEEEEEeeeeeEEcCcccEEEEecCcccccccccChhhHHHHHHHHHHHh-ccCCCCcceeehhHHHHHHHHHHHhcCcc Confidence 0111000001123455666766665431 11122234689998888888764333455 Q ss_pred EEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEE Q lcl|Aclame:pro 293 VTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVV 337 (418) Q Consensus 293 ~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~ 337 (418) +++...+ ..|-.+++| +| +.|....-+.+ .+..|+ T Consensus 294 ~~~~~~~-~~g~~~t~~---~g-ipir~~dai~~-----tE~~vv 328 (328) T protein:vir:95 294 LAISVKE-TEGEWWTSF---RG-VPIRETDALLE-----TEARVV 328 (328) T ss_pred eeeeeec-cCCcceeEE---CC-eEEEEEeeeec-----CccccC Confidence 5655444 555544443 34 55544432211 122222 No 83 >protein:vir:1328 Length: 392 # NCBI annotation: gp36 # Family: family:all:21 # MgeID: mge:28 # MgeName: phi-C31 # Cross-refs: genbank:acc:NP_047927;swissprot:trembl:q9zwv6;genbank:gi:9631145;uniprot:Q9ZWV6;genbank:GeneID:2715889 Probab=48.44 E-value=0.67 Score=21.54 Aligned_cols=287 Identities=14% Similarity=0.149 Sum_probs=114.4 Q ss_pred Ccceeeeec---------------cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccce Q lcl|Aclame:pro 1 MSVYAGIFN---------------TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFAS 65 (418) Q Consensus 1 ~~~~~~~~~---------------~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~ 65 (418) ..+-+|... .++++.-+.. .+...++...+...+++.++.+ T Consensus 91 ~~~r~g~~~~~~~~~~~~~~~~~t~~~~g~~~~~-~~~~~~i~~~~~~~~~l~~~~~----------------------- 146 (392) T protein:vir:13 91 AVLRAGNLGEARSFEFAPEKRDGTKAGNPNVLSR-TLYGQLIAQAVERSAIMRGGAS----------------------- 146 (392) T ss_pred HHHhccchhhhHHHHhhhhhhcccccCCCccccc-cchHHHHHHHHhhhhhhhhcce----------------------- Confidence 000011100 0111100000 0000000000111111111100 Q ss_pred eEEEEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCC Q lcl|Aclame:pro 66 AVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQR 145 (418) Q Consensus 66 ~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada 145 (418) .+....+ ..+.+-+..+...+ .|+ .||... T Consensus 147 ------------~~~~~~~-------------------------~~~~~~~~~~~~~a-------~~v------~E~~~~ 176 (392) T protein:vir:13 147 ------------TFTTSDA-------------------------NPMDFTVITGRATA-------GIV------GETAEI 176 (392) T ss_pred ------------eeecCCC-------------------------ceeEEEEEcCCcce-------eee------cccccc Confidence 0000000 00011000010000 111 255444 Q ss_pred cCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHH Q lcl|Aclame:pro 146 PTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGI 225 (418) Q Consensus 146 ~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI 225 (418) +... +. .-..-.-.++-...+--|.+....... +-..+-...-...+.+.+|.+||+|. |++ .| .|| T Consensus 177 ~~~~--~~-f~~v~~~~~k~~~~~~iS~ell~ds~~-~l~~~i~~~l~~~i~~~~d~~~l~G~----Gt~-~p----~Gi 243 (392) T protein:vir:13 177 PESY--PA-TTQRSMGGFKYGFASVVSYEFATDQVL-DLVGFLVSDAGPAIGDAMGRHFLTGT----GTG-QP----RGI 243 (392) T ss_pred cccc--cc-eeeEEeeeeeEEeeehhHHHHHhcchH-HHHHHHHHHHHHHHHHHHHHHHhccc----CCc-cc----ccc Confidence 3321 11 101122233333334445555543222 33344445556777888999999884 222 22 266 Q ss_pred HHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceE Q lcl|Aclame:pro 226 VDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMV 305 (418) Q Consensus 226 ~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~ 305 (418) +..... .+..........++.+++.++...+-.. ..++ ..+++++.....|.++...+|++-+... ...|.. T Consensus 244 l~~~~~--~~~~~~~~~~~~~~~d~l~~~~~~l~~~--~~~~---a~~v~n~~~~~~l~~lkd~~G~~l~~~~-~~~g~~ 315 (392) T protein:vir:13 244 LTDATG--ANAAFGEADADSKVSDALIDLFHEVPSA--YRKN---AKFVVNDLRAAQMRKLKDANGQYLWQSA-LTVGAP 315 (392) T ss_pred cccccc--ccccccccccccccHHHHHHHHHhhhhh--hhcC---CEEEEcHHHHHHHHHhhccCCceeecCC-cCCCCC Confidence 533210 1111112233467788888876655321 1112 1356788888888887555565444321 111111 Q ss_pred EEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEE Q lcl|Aclame:pro 306 FTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLT 385 (418) Q Consensus 306 v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~ 385 (418) . +=+| +.|+.++ +||++.+++-|++.+.+..- ..+..+.+....+ ..|....+.+ T Consensus 316 -~---~l~G-~Pv~~~~-----~~~~~~i~~Gdf~~~~i~~~--~~~~i~~~~~~~~-------------~~~~~~~r~~ 370 (392) T protein:vir:13 316 -D---TFNG-KVVETDD-----GMPADKVLFADLSKYRVRFA--GSLRVDRSVDAKF-------------STDQIVYRFL 370 (392) T ss_pred -c---eecc-eeeEEcC-----CCCCCcEEEeeccceeEEee--cceEEEeeccccc-------------cCCcEEEEEE Confidence 0 1134 3445553 46889999999886544332 2222221111110 0133344555 Q ss_pred EEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 386 SEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 386 ~E~tLev~N~kA~a~I~gL~~~~ 408 (418) .-+...+.+|+|+.++ .++.|. T Consensus 371 ~r~d~~~~~~~A~~~~-~~~~aa 392 (392) T protein:vir:13 371 QRADGLLVDARGAKVL-TVTPAA 392 (392) T ss_pred EEeccEEecccceEEE-EeeccC Confidence 6677889999996654 456664 No 84 >protein:vir:94070 Length: 339 # NCBI annotation: putative structural protein # Family: family:all:1653 # MgeID: mge:1493 # MgeName: OP2 # Cross-refs: genbank:acc:YP_453625;genbank:gi:84662661;genbank:GeneID:5142580 Probab=45.87 E-value=0.75 Score=21.25 Aligned_cols=315 Identities=13% Similarity=0.082 Sum_probs=115.7 Q ss_pred eEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCceEEE--E Q lcl|Aclame:pro 27 LRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGENMR--L 104 (418) Q Consensus 27 ~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~--V 104 (418) |.++.. +.-+-+|=++|-. ..+-...|++..+ ...-+.++..+.... ++.+ .++.--++ .-++.++++ . T Consensus 1 ~~~~~~-~~~~~~l~~~g~~--~~~~~~~~~~~~~--~~~a~d~~~~~~~~~-~~~~-~~i~a~~~--~~i~~~vy~~~~ 71 (339) T protein:vir:94 1 MSINND-RTDIKQLEKVGII--FDGYSPKSISSEV--SAYAMDAVNLTPTLQ-TTAN-AGIPAWMT--TFVDRRVIDIQL 71 (339) T ss_pred Cceech-HHHHHHHHhhcee--eccchhhhcchhh--Hhhhccccccccccc-cccc-cchhhhhh--hhhchhheeecc Confidence 222221 3344455444432 1111122222211 111112222222111 2222 22210010 012222221 1 Q ss_pred EEecCceeEEEccccccchhhhh-CCceE----EEeecccccccCCcCcccccceecc-c--eeEEEeeeeeechhHH-- Q lcl|Aclame:pro 105 ELVNGLNLTVKRQTGRISAAIIA-ANTKL----IVIGTAFEEGSQRPTARSIQPVYVP-N--FTQIFRNAWALTDTAR-- 174 (418) Q Consensus 105 tav~g~~~tv~rg~~~tta~~~~-~gt~v----~~~g~a~~EGada~~~~~~~~~~~~-N--~tQIf~~~v~VSgTa~-- 174 (418) -......|--+ ++.. .+ ..+-. +..|.|+.=| |.. ..|.+.++ | .-||++..+..+..-+ T Consensus 72 ~~~~~~~l~pv-----~t~g-~w~~~t~~y~~~e~~G~a~~yg-d~a---d~Pl~~~~v~~~~~~v~~~~~g~~y~~~E~ 141 (339) T protein:vir:94 72 APMAAAKIFPE-----VKKG-DWTTTYGVFIIAEPVGQVATYS-DWS---ANGMSKANVNFESRQNYRYQTWTEYGDLEM 141 (339) T ss_pred cccchhhhccc-----ccCC-CCcccEEEEeeeecccceEEcc-ccc---CCCcccccceeeEEeEEEEEEEEeecHHHH Confidence 11122221100 1110 11 12222 2333444332 222 11222221 1 2244444444443322 Q ss_pred HHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhc-cccCccccCCCCccch----H Q lcl|Aclame:pro 175 ASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQY-APDNVNAMPNPTAVTY----D 249 (418) Q Consensus 175 Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~-~~~nv~~~~~~a~~te----~ 249 (418) +.....+.+.-+...+-....+.+.+.+..++|... +..-|++. .. ....+...+.=+.-|. + T Consensus 142 ~~A~~~g~~l~~~Ka~aA~~al~~~~N~i~~~Gd~~---------~~~~GLlN---~P~l~~~v~~s~~Wa~kT~~eI~~ 209 (339) T protein:vir:94 142 ATYGEAGIDYVARQEISASLVMAKFANSSYLLGVAG---------IANYGLMN---DPSLPAPVAATVNWATAAPEDIAN 209 (339) T ss_pred HHHHhhCCChHHHHHHHHHHHHHHhhceEEeeeecc---------cceEEEEe---CCCccccccCCCCcccCCHHHHHH Confidence 223334444333334444444555555666666542 12233331 10 0000110000011233 5 Q ss_pred HHHHHHHHHHHhcccCCC-ceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEE-EEEEcCCeEEEEEECcccccc Q lcl|Aclame:pro 250 DVVDATIDAFKWSVNVGD-NTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVF-TEWKFFKGRLILKEHPLFSAI 327 (418) Q Consensus 250 ~l~d~~~~~~~~g~~~~g-~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v-~~~~SdfG~v~vv~n~~l~~~ 327 (418) ||..+..++|...++... ..+-.++..+.....|+.- +.+|+.+ +.+..+|-.+.|+--|.|... T Consensus 210 Di~~~~~~l~~~s~g~~~~~~~~~L~LP~~~~~~L~~~-------------n~~~~Tvl~~lk~n~pnl~i~~~~el~~a 276 (339) T protein:vir:94 210 DVVAMVGRLISQSGGLITGQERMVMALAPSALNNVNRT-------------NNFGLSAGAKIAQTYPNIQFVAVPEFDTA 276 (339) T ss_pred HHHHHHHHHHHhcCCeeeeccCcEEEecHHHHHhcccC-------------CcCCccHHHHHHHhcCCcEEEEccccccC Confidence 566677777765532211 1223466777776666531 1223322 234444555677777777543 Q ss_pred CCCCCeEEEEc-----hhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEee Q lcl|Aclame:pro 328 GISPGFAVVVD-----VPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVIT 402 (418) Q Consensus 328 ~mp~d~~lv~D-----~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~ 402 (418) + .+++.++. ++.+++++- +++..-+.+.+.. -.+-.-+-.=++++++-|.|.+.+. T Consensus 277 ~--g~~~~~~~~~~~~~~~~~~~~p-------~~~~~lpvq~~~~----------~~~v~~~~rt~Gv~i~~P~ai~~~~ 337 (339) T protein:vir:94 277 S--GRLVQLWVPEVNGQPTGEVAFA-------EKLRSHSIERYST----------TTRQKHSGATFGAVIYQPWAVTQEL 337 (339) T ss_pred C--CceEEEEEEeccCCcceEEEcc-------hhhhccccEEcCc----------eEEecceeeeeeEEEEccceeeeee Confidence 2 24443332 223333322 2222222111110 1111122333689999999999999 Q ss_pred cC Q lcl|Aclame:pro 403 GL 404 (418) Q Consensus 403 gL 404 (418) |+ T Consensus 338 GI 339 (339) T protein:vir:94 338 GV 339 (339) T ss_pred cC Confidence 99 No 85 >protein:vir:94673 Length: 419 # NCBI annotation: major capsid protein # Family: family:all:585 # MgeID: mge:1527 # MgeName: mu1/6 # Cross-refs: genbank:acc:YP_579208;genbank:gi:93007444;genbank:GeneID:5076792 Probab=44.32 E-value=0.81 Score=21.08 Aligned_cols=320 Identities=12% Similarity=-0.023 Sum_probs=120.5 Q ss_pred Cc---ceeeeeccCCChh-hhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCc Q lcl|Aclame:pro 1 MS---VYAGIFNTTLNPQ-ELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADA 76 (418) Q Consensus 1 ~~---~~~~~~~~~~~~~-~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~ 76 (418) +. -..+... .+-.+ ++ +.+... ...+....++. .. +... T Consensus 91 ~~~~~~~~~~~~-~~~~~~~~--~~~~~~----------~~~~~~~~~~~--~~----------------------~~~~ 133 (419) T protein:vir:94 91 SDGLREYRARDK-RGQFQVEM--RDIDPN----------RLLSRDAPAGT--IT----------------------NPNV 133 (419) T ss_pred HHHHHHHHHhhh-hhhhhHHH--HHHHHH----------Hhhcccccccc--cc----------------------CCcc Confidence 00 0001100 11111 11 100000 00000000000 00 0000 Q ss_pred eEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhh-CCceEEEeecccccccCCcCccccccee Q lcl|Aclame:pro 77 TVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIA-ANTKLIVIGTAFEEGSQRPTARSIQPVY 155 (418) Q Consensus 77 t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~-~gt~v~~~g~a~~EGada~~~~~~~~~~ 155 (418) ..++-.....+.. ..-....-..++.+..+.+..++.-+....+.+.... ....|. .||+..+..... -.. T Consensus 134 ~~~p~~~~~~i~~-~~~~~~~i~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~a~~v------~Eg~~~~~~~~~-~~~ 205 (419) T protein:vir:94 134 PHLPQLVPGIVPT-TPDLPLLVADLLDQQNADYNVLEYIRDTSGTAGAGSTWNKAAVV------PEGTAKPQSTLS-FDT 205 (419) T ss_pred cccchhhhHHHHH-HHhhhhhhhhcceeeeccCCceeeeeeccccccccccCccccee------cCCccccccccc-eee Confidence 0000000000000 0000000011223334444444443333332221000 011122 466665543211 111 Q ss_pred ccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhcccc Q lcl|Aclame:pro 156 VPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPD 235 (418) Q Consensus 156 ~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~ 235 (418) + -..+++-..-+.-|.+.++.. .+-.++-...-...+.+-+|.++|+|.- ++ + .-||+.... .. T Consensus 206 i--~~~~~k~~~~~~is~ell~d~--~~l~~~i~~~la~a~~~~~d~aii~G~G----~~-~----p~Gi~~~~~---~~ 269 (419) T protein:vir:94 206 I--TTTLKTVAHWLPITRQAADDN--SQLMGYIQGRLTYGLRFLRDRQLLNGNG----ST-E----MQGILTTPG---IG 269 (419) T ss_pred E--EeeeeeEEEeehhhHHHHHhH--HHHHHHHHHHHHHHHHHHHHHHHHhccC----cc-c----ccceecccc---cc Confidence 1 122333333333444555432 2323444444677789999999998743 21 2 225543211 01 Q ss_pred CccccCC----CCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEc Q lcl|Aclame:pro 236 NVNAMPN----PTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKF 311 (418) Q Consensus 236 nv~~~~~----~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~S 311 (418) ....... ......+++.++...+-..... ...+++++.....|.++....+...+.+.+-..|.. .+ T Consensus 270 ~~~~~~~~~~~t~~~~~~~l~~~~~~~~~~~~~-----~~~~v~n~~~~~~l~~~k~~~~~~~~~~~~~~~~~~----~~ 340 (419) T protein:vir:94 270 TYQQPKPTAPATDEPPLVDIRRAKTVAEIAGFP-----PDGVVVHPQDWESIELDQAPGSGVFRVIANVQGEAT----PR 340 (419) T ss_pred cccccccccccccchhHHHHHHHHHhhhhccCC-----CCEEEEcHHHHHHHHHHhhcCCCceeecCCcccCCC----cc Confidence 1111111 1223455566665555433222 225778988888887764333332222221111111 01 Q ss_pred CCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEE Q lcl|Aclame:pro 312 FKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALE 391 (418) Q Consensus 312 dfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLe 391 (418) =+|. .|+.++ +||++.+++.|+.+..+-+.+ .++..+.....+.. -..|.....+..-+.+. T Consensus 341 l~G~-pV~~~~-----~~~~~~~~~gd~~~~~~~~~~-~~~~v~~~~~~~~~-----------~~~~~~~~r~~~r~d~~ 402 (419) T protein:vir:94 341 IWGL-NVVSTV-----AIAQGTALVGGFRQGATLWSR-QGITVLMTDSHADF-----------FTANTLVILAEFRANLA 402 (419) T ss_pred ccce-eeEEcC-----CCCCccEEEeeccceEEEEEe-cceEEEEeccccch-----------hhcCcEEEEEEEeeccE Confidence 1352 455553 468889999999875332221 12222221111100 00144455677778999 Q ss_pred EecccceEEeecCcccccccCCC Q lcl|Aclame:pro 392 LLNPQGCAVITGLQKAKERVYLT 414 (418) Q Consensus 392 v~N~kA~a~I~gL~~~~~~~~~~ 414 (418) +++|+|+.+++- +.| +| T Consensus 403 v~~~~a~~~~~~-~aa-----~~ 419 (419) T protein:vir:94 403 VYQPKAFVRVTF-AAA-----TT 419 (419) T ss_pred EeccccEEEEEe-ccC-----CC Confidence 999999988763 222 22 No 86 >protein:vir:7855 Length: 497 # NCBI annotation: gp12 # Family: family:all:585 # MgeID: mge:150 # MgeName: CJW1 # Cross-refs: genbank:acc:NP_817462;genbank:gi:29565891;genbank:GeneID:1259081 Probab=42.17 E-value=0.9 Score=20.84 Aligned_cols=329 Identities=13% Similarity=0.099 Sum_probs=109.2 Q ss_pred CcceeeeeccCCChh-hhh-----hhhcccceeEeecCCcchhHHHhhhccccceeeeeee------eeeeecccceeEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQ-ELN-----MKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHG------YFSKTMVFASAVV 68 (418) Q Consensus 1 ~~~~~~~~~~~~~~~-~~~-----~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~------~~~~~~~~~~~t~ 68 (418) ...+..-.+....+. +.. +..+.+.+. ++........+ +....+ |..+-........ T Consensus 111 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~------~~~~~~~~~~~-----~~~~gg~~vp~~~~~~ii~~~~~~~ 179 (497) T protein:vir:78 111 GTKFDVSFNVSAKAADPGTAAAELMGAFADGET------APAAIGQNPFG-----STGTFAPGILPTFLPGIVEQLFYEL 179 (497) T ss_pred hhhhhhhhhhhhhhhhhHHHHHHHHHHHhhhhh------hHHHHHhhhcc-----cCcccccccchhhhHHHHHHHHhhh Confidence 000000000000000 000 000000000 00000000000 000011 1111010000000 Q ss_pred EEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCc Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTA 148 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~ 148 (418) . |. .+ +.+.-+.+..+++-+-..++. . ..|+ .||...|.. T Consensus 180 ~-----------i~--------~l---------~~~~~~~~~~~~~~~~~~~~~-~-----a~wv------~E~~~~~~s 219 (497) T protein:vir:78 180 S-----------LA--------DL---------ISSRPVTSPNLSYLTESAAHN-N-----AAAV------AEAGTYPFS 219 (497) T ss_pred h-----------HH--------hh---------ccccccCCCceEEEEEcCCCC-c-----ceee------ccCcccccc Confidence 0 00 00 000011111122111111110 0 0121 255544432 Q ss_pred ccccceeccceeEEEeeee----eechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccc-c----CcCC--- Q lcl|Aclame:pro 149 RSIQPVYVPNFTQIFRNAW----ALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFM-G----TYNG--- 216 (418) Q Consensus 149 ~~~~~~~~~N~tQIf~~~v----~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~-~----~s~~--- 216 (418) . + .+.+|-...- -+.-|.+..+-. .+..+|-..+-...|.+.+|.+||+|.-.. + ...+ T Consensus 220 ~--~-----~f~~i~~~~~k~a~~~~iS~ell~d~--~~l~~~i~~~l~~~i~~~~d~~~l~G~G~~~p~Gil~~~~~~~ 290 (497) T protein:vir:78 220 S--E-----EFARVYEQVGKVANALTITDEGLRDA--PELFNFVQGRLLEGIQRKEEVQLLAGGGYPGVNGLLQRSTGFT 290 (497) T ss_pred c--c-----cceeeEeeeeeeEeecHhHHHHHHhH--HHHHHHHHHHHHHHHHHHHHHHhhcCCCccccccccccccccc Confidence 1 1 1233332222 223333444322 133345555566778999999999874210 0 0000 Q ss_pred -ccchhhHH-H---HHHHhhccc-cC-----------------------ccccCCCCccchHHHHHHHHHHHHhcccCCC Q lcl|Aclame:pro 217 -QPLHTTQG-I---VDAVRQYAP-DN-----------------------VNAMPNPTAVTYDDVVDATIDAFKWSVNVGD 267 (418) Q Consensus 217 -~~~r~t~G-I---~~~i~~~~~-~n-----------------------v~~~~~~a~~te~~l~d~~~~~~~~g~~~~g 267 (418) .....+.+ . ...+..... .+ ..........+..++.+.+.+++..-...++ T Consensus 291 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 370 (497) T protein:vir:78 291 ASSASSLFGATSATVSNVKFPADGTNGAFVGQDTVASLKYGRVVTGAAGSGSGVAGSYPTAAEIAENVFDAFVDIQLTLF 370 (497) T ss_pred ccccccchhhhhhhhhhhhhhcccccchhhhhhHHHHHHHHHhhhhhhhhccchhccccchhhhhhHHHHHHhhhhhhcc Confidence 00000000 0 000000000 00 0000001112222233333333322111122 Q ss_pred ceeEEEEeChHHHHHHHhhhhccceEEEcccce-eeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeee Q lcl|Aclame:pro 268 NTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET-SYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAY 346 (418) Q Consensus 268 ~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~-~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~ 346 (418) .....++.++.....|.++...+|++....... ..|.-+..-.+=+| +.|+.++ .||++.+++.|.+...+.. T Consensus 371 ~~~~~~vmn~~~~~~l~~lkd~~G~~i~~~~~~~~~~~~~~~~~~l~G-~pV~~t~-----~~~~~~~~~Gd~~~~~~~i 444 (497) T protein:vir:78 371 QTPNAVVMNPRDWELLRLTKDANGQYMGGNFFGNAYGNPVNGGKNIWG-VPVVTTP-----LIPLGTILVGHFAPSVIQT 444 (497) T ss_pred cCCCeEEEchHHHHHHHHhhcCCCceeccCcccccccccccCCceeec-eeeEecC-----CCCCCceEEeecccceEEE Confidence 222246677777777887765666655432211 11111111112345 3455553 4688888888887654433 Q ss_pred ccCCCcccccccccCccccccccccccccCccccccE----EEEEEEEEEecccceEEeecCcccccc Q lcl|Aclame:pro 347 MDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGS----LTSEWALELLNPQGCAVITGLQKAKER 410 (418) Q Consensus 347 L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~----i~~E~tLev~N~kA~a~I~gL~~~~~~ 410 (418) .+.-++..+.....+ .|+++.+ ...++.+.+++|.|+.+++--..++-. T Consensus 445 ~~r~~~~v~~~~~~~---------------~~f~~n~v~~r~~~r~~~~v~~p~A~~~l~~~~~~~~~ 497 (497) T protein:vir:78 445 ARREGVTMQMTNSNG---------------TDFVDGKVTVRAEERLGLLVYRPSAFQLIQLKKGATGS 497 (497) T ss_pred EEecccEEEeecccc---------------hhhhcCcEEEEEEEeecceeeccccEEEEEecCCccCC Confidence 321122221111111 1344444 447899999999999999875554222 No 87 >protein:vir:101650 Length: 497 # NCBI annotation: gp13 # Family: family:all:585 # MgeID: mge:1515 # MgeName: 244 # Cross-refs: genbank:acc:YP_654768;genbank:gi:109302766;genbank:GeneID:4156084 Probab=42.17 E-value=0.9 Score=20.84 Aligned_cols=329 Identities=13% Similarity=0.099 Sum_probs=109.2 Q ss_pred CcceeeeeccCCChh-hhh-----hhhcccceeEeecCCcchhHHHhhhccccceeeeeee------eeeeecccceeEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQ-ELN-----MKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHG------YFSKTMVFASAVV 68 (418) Q Consensus 1 ~~~~~~~~~~~~~~~-~~~-----~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~------~~~~~~~~~~~t~ 68 (418) ...+..-.+....+. +.. +..+.+.+. ++........+ +....+ |..+-........ T Consensus 111 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~------~~~~~~~~~~~-----~~~~gg~~vp~~~~~~ii~~~~~~~ 179 (497) T protein:vir:10 111 GTKFDVSFNVSAKAADPGTAAAELMGAFADGET------APAAIGQNPFG-----STGTFAPGILPTFLPGIVEQLFYEL 179 (497) T ss_pred hhhhhhhhhhhhhhhhhHHHHHHHHHHHhhhhh------hHHHHHhhhcc-----cCcccccccchhhhHHHHHHHHhhh Confidence 000000000000000 000 000000000 00000000000 000011 1111010000000 Q ss_pred EEEeecCceEEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCc Q lcl|Aclame:pro 69 TAEAAADATVLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTA 148 (418) Q Consensus 69 ~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~ 148 (418) . |. .+ +.+.-+.+..+++-+-..++. . ..|+ .||...|.. T Consensus 180 ~-----------i~--------~l---------~~~~~~~~~~~~~~~~~~~~~-~-----a~wv------~E~~~~~~s 219 (497) T protein:vir:10 180 S-----------LA--------DL---------ISSRPVTSPNLSYLTESAAHN-N-----AAAV------AEAGTYPFS 219 (497) T ss_pred h-----------HH--------hh---------ccccccCCCceEEEEEcCCCC-c-----ceee------ccCcccccc Confidence 0 00 00 000011111122111111110 0 0121 255544432 Q ss_pred ccccceeccceeEEEeeee----eechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccc-c----CcCC--- Q lcl|Aclame:pro 149 RSIQPVYVPNFTQIFRNAW----ALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFM-G----TYNG--- 216 (418) Q Consensus 149 ~~~~~~~~~N~tQIf~~~v----~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~-~----~s~~--- 216 (418) . + .+.+|-...- -+.-|.+..+-. .+..+|-..+-...|.+.+|.+||+|.-.. + ...+ T Consensus 220 ~--~-----~f~~i~~~~~k~a~~~~iS~ell~d~--~~l~~~i~~~l~~~i~~~~d~~~l~G~G~~~p~Gil~~~~~~~ 290 (497) T protein:vir:10 220 S--E-----EFARVYEQVGKVANALTITDEGLRDA--PELFNFVQGRLLEGIQRKEEVQLLAGGGYPGVNGLLQRSTGFT 290 (497) T ss_pred c--c-----cceeeEeeeeeeEeecHhHHHHHHhH--HHHHHHHHHHHHHHHHHHHHHHhhcCCCccccccccccccccc Confidence 1 1 1233332222 223333444322 133345555566778999999999874210 0 0000 Q ss_pred -ccchhhHH-H---HHHHhhccc-cC-----------------------ccccCCCCccchHHHHHHHHHHHHhcccCCC Q lcl|Aclame:pro 217 -QPLHTTQG-I---VDAVRQYAP-DN-----------------------VNAMPNPTAVTYDDVVDATIDAFKWSVNVGD 267 (418) Q Consensus 217 -~~~r~t~G-I---~~~i~~~~~-~n-----------------------v~~~~~~a~~te~~l~d~~~~~~~~g~~~~g 267 (418) .....+.+ . ...+..... .+ ..........+..++.+.+.+++..-...++ T Consensus 291 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 370 (497) T protein:vir:10 291 ASSASSLFGATSATVSNVKFPADGTNGAFVGQDTVASLKYGRVVTGAAGSGSGVAGSYPTAAEIAENVFDAFVDIQLTLF 370 (497) T ss_pred ccccccchhhhhhhhhhhhhhcccccchhhhhhHHHHHHHHHhhhhhhhhccchhccccchhhhhhHHHHHHhhhhhhcc Confidence 00000000 0 000000000 00 0000001112222233333333322111122 Q ss_pred ceeEEEEeChHHHHHHHhhhhccceEEEcccce-eeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeee Q lcl|Aclame:pro 268 NTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET-SYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAY 346 (418) Q Consensus 268 ~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~-~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~ 346 (418) .....++.++.....|.++...+|++....... ..|.-+..-.+=+| +.|+.++ .||++.+++.|.+...+.. T Consensus 371 ~~~~~~vmn~~~~~~l~~lkd~~G~~i~~~~~~~~~~~~~~~~~~l~G-~pV~~t~-----~~~~~~~~~Gd~~~~~~~i 444 (497) T protein:vir:10 371 QTPNAVVMNPRDWELLRLTKDANGQYMGGNFFGNAYGNPVNGGKNIWG-VPVVTTP-----LIPLGTILVGHFAPSVIQT 444 (497) T ss_pred cCCCeEEEchHHHHHHHHhhcCCCceeccCcccccccccccCCceeec-eeeEecC-----CCCCCceEEeecccceEEE Confidence 222246677777777887765666655432211 11111111112345 3455553 4688888888887654433 Q ss_pred ccCCCcccccccccCccccccccccccccCccccccE----EEEEEEEEEecccceEEeecCcccccc Q lcl|Aclame:pro 347 MDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGS----LTSEWALELLNPQGCAVITGLQKAKER 410 (418) Q Consensus 347 L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~----i~~E~tLev~N~kA~a~I~gL~~~~~~ 410 (418) .+.-++..+.....+ .|+++.+ ...++.+.+++|.|+.+++--..++-. T Consensus 445 ~~r~~~~v~~~~~~~---------------~~f~~n~v~~r~~~r~~~~v~~p~A~~~l~~~~~~~~~ 497 (497) T protein:vir:10 445 ARREGVTMQMTNSNG---------------TDFVDGKVTVRAEERLGLLVYRPSAFQLIQLKKGATGS 497 (497) T ss_pred EEecccEEEeecccc---------------hhhhcCcEEEEEEEeecceeeccccEEEEEecCCccCC Confidence 321122221111111 1344444 447899999999999999875554222 No 88 >protein:vir:100331 Length: 342 # NCBI annotation: major capsid protein N # Family: family:all:201 # MgeID: mge:1484 # MgeName: phi-MhaA1-PHL101 # Cross-refs: genbank:acc:YP_655472;genbank:gi:109289940;genbank:GeneID:4157374 Probab=39.13 E-value=0.76 Score=21.25 Aligned_cols=259 Identities=10% Similarity=0.048 Sum_probs=121.4 Q ss_pred EccccccchhhhhCCceEEEeecccccccC-----C-cCcccccce----------------ecc--ceeEEEeeeeeec Q lcl|Aclame:pro 115 KRQTGRISAAIIAANTKLIVIGTAFEEGSQ-----R-PTARSIQPV----------------YVP--NFTQIFRNAWALT 170 (418) Q Consensus 115 ~rg~~~tta~~~~~gt~v~~~g~a~~EGad-----a-~~~~~~~~~----------------~~~--N~tQIf~~~v~VS 170 (418) .|-..+.- ..+ ++..-|++-|.+ + ..+...|.+ +++ =+.|+--+.|.++ T Consensus 1 M~~~tr~~---~~~----y~~~~A~~ngv~~~~~~~~~~FsV~P~v~q~L~~~i~ess~FL~~INvv~V~e~~Ge~i~lg 73 (342) T protein:vir:10 1 MKDLTLEK---YNA----YLARQAELNNLPFNALATGIKFTVQPSVQQKLYEKVRESSDFLKSISFVFVDEQTGETLGLD 73 (342) T ss_pred CChHHHHH---HHH----HHHHHHHHhCCChhHccccceeecChHHHHHHHHHHHHHHHHhccCcccccccceeeEEecc Confidence 11111110 000 000011111211 0 012222211 111 2567777777663 Q ss_pred h------h-H------HHHhh-hc--------------------------ccchHHHHHH-HHHHHHHHHHhHHHhcCcc Q lcl|Aclame:pro 171 D------T-A------RASYA-EA--------------------------GYSNITESRR-DCMDFHATEQETAIFFGQA 209 (418) Q Consensus 171 g------T-a------~Av~~-~g--------------------------~~dela~q~~-kk~~EikrdmE~a~i~G~k 209 (418) - + . +-... .+ ...+|...+. .-.+.+.+||-.+=++|+. T Consensus 74 ~~g~iagrtdT~~~~~R~~~~~~~l~~~~Y~c~qTn~dt~i~Y~~lD~WA~~~dF~~r~~~~i~~~~ALD~i~IGfNGts 153 (342) T protein:vir:10 74 SAHTVASTTDTSGDGERKTTSIAKLVKQTYHCQQINFDTHINYKQLDMWAKFPDFQQKVANVAAKQRKRDLIMIGFNGTS 153 (342) T ss_pred cCcccccccccCCCCCcccccccccCCCccEEEEeeecccccHHHHHHHhcChhHHHHHHHHHHHHHhhccceeccccee Confidence 1 1 0 00000 00 0112333332 3345568888888889987 Q ss_pred cccCcCCccchh----hHHHHHHHhhccccCccccCC-------CCccchHHHHHHHHHHHHhcccCC--CceeEEEEeC Q lcl|Aclame:pro 210 FMGTYNGQPLHT----TQGIVDAVRQYAPDNVNAMPN-------PTAVTYDDVVDATIDAFKWSVNVG--DNTQRVMFCD 276 (418) Q Consensus 210 ~~~~s~~~~~r~----t~GI~~~i~~~~~~nv~~~~~-------~a~~te~~l~d~~~~~~~~g~~~~--g~~~~~i~v~ 276 (418) .-..++-..-.. =-|++-.++.+.+..+...+. +..-++..|..++.++...-...- ....=+++|| T Consensus 154 ~A~~Td~~~nPllqDVN~GWlQ~~Re~ap~rv~~~~~~~~~i~iG~~gdy~NLDalV~D~~~~lI~~~~~~d~dLVvivG 233 (342) T protein:vir:10 154 RAATSDRNSNPLLQDVAKGWLQKMREDAKERVMNGESTDNQVLVGKGQEYANLDALVMDATEELIDEWHRDDTDLVVITG 233 (342) T ss_pred eccCCChhhCcCccccchHHHHHHHhhhhhhhcccceeccceeecCCCCcccHHHHHHHHHhccCChHHhcCCCEEEEEc Confidence 554443221111 127777777776665543211 122366667777777764322211 1112478899 Q ss_pred hHHHHHHHhhhhccceEEEcccceeeceEEEEEEc--CCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC---C Q lcl|Aclame:pro 277 TVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKF--FKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR---N 351 (418) Q Consensus 277 a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~S--dfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r---~ 351 (418) .++.. ++......+- -..+++.. .+.+.| -+|-+..+.-|+| |++.++|--.++|++.+..|- . T Consensus 234 ~dLla--dk~~~l~n~~-~~ptE~~A---a~~i~s~k~iGGl~a~~~PfF-----P~~~ilVT~L~NLsIY~Q~gs~RR~ 302 (342) T protein:vir:10 234 RKLLA--DKYFPIVNQQ-NAPTEELA---ADIVISQKRIGGLKAVRVPFF-----PANAILITKLENLAIYVQEGTTRKH 302 (342) T ss_pred hhhhH--HHHHHHHhcC-CChHHHHH---HHHHHhhhhhcCceeEEcccc-----CCCceEEeeccccEEEEecCcEEEE Confidence 88875 3321111110 01223222 223333 4787888888875 889999999999999999652 2 Q ss_pred cccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCcccccc Q lcl|Aclame:pro 352 AKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKER 410 (418) Q Consensus 352 ~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~ 410 (418) ...++ .+. |.. |++. . --+-.|.+..+.|.|++++-++|+ T Consensus 303 ~~d~p-~r~----rie----------~y~s---~-Ne~YvVEd~~~~a~iE~i~i~~~~ 342 (342) T protein:vir:10 303 IENVP-KKD----RIE----------TYES---E-NIDYVVEDYGCAALIENITLKDKE 342 (342) T ss_pred EEecc-ccc----ccc----------chhh---h-ccceeeeccccEEEeecceecCCC Confidence 21111 111 111 1110 0 012334456678899999999888 No 89 >protein:vir:78777 Length: 358 # NCBI annotation: putative major capsid protein # Family: family:all:201 # MgeID: mge:1857 # MgeName: phiO18P # Cross-refs: genbank:acc:YP_001285647;genbank:gi:148727153;genbank:GeneID:5220125 Probab=38.38 E-value=1.1 Score=20.42 Aligned_cols=313 Identities=10% Similarity=-0.025 Sum_probs=137.8 Q ss_pred CcceeeeeccCCChh-hhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQ-ELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVL 79 (418) Q Consensus 1 ~~~~~~~~~~~~~~~-~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~ 79 (418) |+.| .+++ .. .- ...+.++-.+.|...... +..+ T Consensus 1 m~~~-------M~~~tr~------------~~--~~y~~~~A~~ngv~~~~~------------------------~~~F 35 (358) T protein:vir:78 1 MSQT-------LTVQAEQ------------RL--NKYCDALAKAYGIDISKL------------------------DKQF 35 (358) T ss_pred Cccc-------ccHHHHH------------HH--HHHHHHHHHHhCCChhHc------------------------ccee Confidence 1111 1111 00 00 012222222333211111 1223 Q ss_pred EEc-------------cccccccCceeEeccCceEEEEEEecCceeEE--EccccccchhhhhCCceEEEeecccccccC Q lcl|Aclame:pro 80 TVE-------------NSDGLTKGMIFYNEATGENMRLELVNGLNLTV--KRQTGRISAAIIAANTKLIVIGTAFEEGSQ 144 (418) Q Consensus 80 tV~-------------~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv--~rg~~~tta~~~~~gt~v~~~g~a~~EGad 144 (418) +|+ +++.+....++. |..+.|.++-+ .....++|.. + +.... .+ T Consensus 36 sv~p~v~q~L~~~i~ess~FL~~INvv~---------V~e~~Ge~v~lg~~g~iagrt~t---------r--~~~~~-~~ 94 (358) T protein:vir:78 36 SVTGPVETTLRSALLASVEFLGLITCLD---------VDQIKGQVVQVGVGQLYTGRKKG---------G--RFKGK-VG 94 (358) T ss_pred eeChHHHHHHHHHHHHHHHHhhcCcccc---------cccceeeEEeecCCcccceecCC---------C--ccccc-cc Confidence 333 333333333321 33334444322 1111222210 0 00000 00 Q ss_pred CcCcccccceeccceeEEEeeeeeechhH-HHHhhhcccchHHHHHHH-HHHHHHHHHhHHHhcCcccccCcCCccchh- Q lcl|Aclame:pro 145 RPTARSIQPVYVPNFTQIFRNAWALTDTA-RASYAEAGYSNITESRRD-CMDFHATEQETAIFFGQAFMGTYNGQPLHT- 221 (418) Q Consensus 145 a~~~~~~~~~~~~N~tQIf~~~v~VSgTa-~Av~~~g~~dela~q~~k-k~~EikrdmE~a~i~G~k~~~~s~~~~~r~- 221 (418) .....+ .-...||| ..+++.. .+=.+.+..++|.-.+.. -.+.+.+|+-.+=++|+..-..++-..-.. T Consensus 95 l~~~~Y--~c~qTn~d------t~i~Y~~lD~WA~f~~~~dF~~r~~~~i~~~~ALD~i~IGfNGts~A~~Td~~~nPll 166 (358) T protein:vir:78 95 VDGNTY--ELTETDSC------ASLDWATLCTWANAGSEGEFIKLVGEFVNKAFALDMLRVGWNGVSAADDTDPTANPLG 166 (358) T ss_pred cCCCcc--EEEEecee------eeccHHHHHHHHhCCChhHHHHHHHHHHHHHHhhccceecccceeeccCCChhhCcCc Confidence 000000 01112332 3344332 233333433456655554 456679999999999997554443221111 Q ss_pred ---hHHHHHHHhhccccCcccc---------CCCCccchHHHHHHHHHHHHhcccCC--CceeEEEEeChHHHHHH-Hhh Q lcl|Aclame:pro 222 ---TQGIVDAVRQYAPDNVNAM---------PNPTAVTYDDVVDATIDAFKWSVNVG--DNTQRVMFCDTVGMRTM-QDI 286 (418) Q Consensus 222 ---t~GI~~~i~~~~~~nv~~~---------~~~a~~te~~l~d~~~~~~~~g~~~~--g~~~~~i~v~a~~k~~i-~~~ 286 (418) =-|++-.++.+.+..+... +.++.-++..|..++.++.......- ....=+++||.++...= -++ T Consensus 167 qDVN~GWlQ~~Re~a~~~v~~~~~~~~~i~ig~g~~Gdy~NLDalV~D~~~~lI~~~~~~d~dLVvivG~dLla~k~~~l 246 (358) T protein:vir:78 167 QDVNKGWHQLAREWKGGSQIIKAAAGEKIYFDPDGKGEYKTLDEMASDLINTTIDPLFQQDPRLVVLVGTDLVAAAQAKL 246 (358) T ss_pred cccchHHHHHHHhhchhhhhccccccCceeecCCCCCccccHHHHHHHHHhccCChHHhcCCCEEEEEchhhhhHHhhhH Confidence 1277777887777665431 22233467778888888775443321 11124788998876421 111 Q ss_pred hhccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC---CcccccccccCcc Q lcl|Aclame:pro 287 GRFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR---NAKVENYGQGGGE 363 (418) Q Consensus 287 ~~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r---~~~~e~laKtG~~ 363 (418) ....+ ..+++..+ +.+..-+|-+..+.-|+| |++.++|--.++|++.+..|- ....++ .+. T Consensus 247 ~n~~~----~pTE~~Aa---~~i~k~iGGlpa~~~PfF-----P~~~ilVT~L~NLsIY~Q~gs~RR~~~d~p-~r~--- 310 (358) T protein:vir:78 247 YSEAT----KPSEQIAA---QQLAKSIAGRKAYIPPFF-----PGKRMVVTTLDNLHCYTQRGTRKRKADDNQ-DSK--- 310 (358) T ss_pred hhcCC----CcHHHHHH---HHHHHHhCCCeEEEcccc-----CCCceEEeeccccEEEEecCcEEEEEEecc-ccc--- Confidence 11111 12333222 223355888888888885 889999999999999999652 221111 111 Q ss_pred ccccccccccccCccccccEEEEEEEEEEecccceEEeecCc--ccccccCCCC-CCC Q lcl|Aclame:pro 364 NKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQ--KAKERVYLTA-PAP 418 (418) Q Consensus 364 ~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~--~~~~~~~~~~-~~~ 418 (418) |. ++ ++. .- -+-.|.+..+.|.|+++. -+++.+|+.+ ++| T Consensus 311 -ri--E~--------y~s---~N-e~YvVEd~~~~a~iE~i~v~~~~~pa~~~~~~~~ 353 (358) T protein:vir:78 311 -SF--DN--------QYW---RM-EGYALGEHKAYGGFEEADIEIGADPAVLAVEAAA 353 (358) T ss_pred -cc--cc--------hhh---hc-ceeeeeccccEEEEeeeeeeeCCCCCccccCCcc Confidence 11 11 110 00 122344556778888874 3444444443 222 No 90 >protein:vir:80930 Length: 278 # NCBI annotation: Cps # Family: family:all:522 # MgeID: mge:1886 # MgeName: A500 # Cross-refs: genbank:acc:YP_001468392;genbank:gi:157324966;genbank:GeneID:5601363 Probab=38.23 E-value=1.1 Score=20.41 Aligned_cols=262 Identities=13% Similarity=0.098 Sum_probs=111.6 Q ss_pred Eccc-ccc---ccCceeEeccC---ceEEEEEEecCceeEEEccccccchhhhhCCceEEE-----eecc--cccccCCc Q lcl|Aclame:pro 81 VENS-DGL---TKGMIFYNEAT---GENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIV-----IGTA--FEEGSQRP 146 (418) Q Consensus 81 V~~~-~~~---~~~~~~~~~~~---~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a--~~EGada~ 146 (418) -++. +.+ -.+.++...+. .+.+++..+ ..+-+-+. ...|..+.+ +|.+ ..||.+.+ T Consensus 1 Ma~~~T~~~~~iiPev~s~~v~~~~~~~~v~~~~----~~~~~~l~------g~~G~tv~ip~~~~~g~a~~~~~g~~i~ 70 (278) T protein:vir:80 1 MADLTTKLANLIDPEVMGPMISAKLPKAIKFGKI----APIDNSLE------GQPGSEITVPKYKYIGDAQDVAEGAAID 70 (278) T ss_pred CCCcceehhheecHHHHHHHHHHHHHHhhhhccc----ceeccccc------CCCCCEEEEeeeccCCcceeecCCCcCc Confidence 2221 111 11111100000 111111111 00000000 112322222 2211 23344333 Q ss_pred CcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHH Q lcl|Aclame:pro 147 TARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIV 226 (418) Q Consensus 147 ~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~ 226 (418) ...-......--..|. .+.|++++-..+. ...|.+..-......-+.+.+++.++..-+.... +.. + T Consensus 71 ~~~lt~~~~~~~i~~~-~~a~~v~D~~~~~---~~~d~~~~~~~~~a~~~a~~~d~~l~~~l~~a~~-~~~------~-- 137 (278) T protein:vir:80 71 YSALETESVKHGIKKA-GKGVKLTDESVLS---GYGDPVEEAQKQIRMAIASKVDNDILEEALTTTL-EVK------G-- 137 (278) T ss_pred ccccccceeeEeeehh-hccccccHHHHhh---ccccHHHHHHHHHHHHHHHHHHHHHHHHHhcccc-ccc------c-- Confidence 2221111111122332 3456666655443 3446677777777888899999888754331100 000 0 Q ss_pred HHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcc-cceeeceE Q lcl|Aclame:pro 227 DAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQ-RETSYGMV 305 (418) Q Consensus 227 ~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~-~~~~~G~~ 305 (418) .... .+.....+.+.|+..++ . ..+....+++++++.+...|.+... .++.. ....-|+. T Consensus 138 -------~~t~----~~~~~~~~~~~da~~~l-~---~~~~~~~~~ivv~p~~~~~L~k~~~----~~~~~~~~~g~~~~ 198 (278) T protein:vir:80 138 -------AINI----GLIDKIENTFTDAPDAI-E---DESITTTGVLFLNYKDTAKLREEAA----GSWTKASQLGDDLL 198 (278) T ss_pred -------cccc----chhhhHHHHHHHHHHhh-c---ccCCCcccEEEECHHHHHHHHhhhh----hhccccccccccce Confidence 0000 01112234445544432 2 2233344578899988777765421 11111 11111222 Q ss_pred EEEEE-cCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEE Q lcl|Aclame:pro 306 FTEWK-FFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSL 384 (418) Q Consensus 306 v~~~~-SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i 384 (418) ..-.. +-.| +.|+.++ ++|.++.+++.+..+. |..+++...|..+.. .++.|...+.. T Consensus 199 ~~G~ig~~~G-~~Vi~s~-----~~p~~t~~l~~~gAi~--~~~~~~~~vE~~Rd~-------------~~~~d~i~~~~ 257 (278) T protein:vir:80 199 VKGAFGELLG-WEIVRTK-----KLADGNALAVKAGALK--TFLKRNLLAESGRDM-------------DHKLTKFNADQ 257 (278) T ss_pred eeccceeecc-eeEEEcC-----CCCcceEEEEecccee--eeecCCcccccccch-------------hhccceeeeee Confidence 21111 1123 4677764 4678999999998665 444455555544322 12335554444 Q ss_pred EEEEEEEEecccceEEeecCcccccc Q lcl|Aclame:pro 385 TSEWALELLNPQGCAVITGLQKAKER 410 (418) Q Consensus 385 ~~E~tLev~N~kA~a~I~gL~~~~~~ 410 (418) + |+..+.||.+..+|+= ++-. T Consensus 258 ~--yg~~v~~~~~~v~it~---~a~~ 278 (278) T protein:vir:80 258 H--YAVALVDETKAVKVVP---VAGN 278 (278) T ss_pred E--EEEEEEcCcceEEEee---ccCC Confidence 4 7999999998888762 2111 No 91 >protein:vir:4830 Length: 397 # NCBI annotation: MPL-7201 # Family: family:all:21 # MgeID: mge:105 # MgeName: 7201 # Cross-refs: genbank:acc:NP_038327;genbank:gi:9634653;genbank:GeneID:1262632 Probab=37.68 E-value=1.1 Score=20.34 Aligned_cols=318 Identities=12% Similarity=0.008 Sum_probs=115.6 Q ss_pred Cccee-------eeec-------------------cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeee Q lcl|Aclame:pro 1 MSVYA-------GIFN-------------------TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTH 54 (418) Q Consensus 1 ~~~~~-------~~~~-------------------~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~ 54 (418) +.-+. ..++ ..-.|.+-..+....+.. T Consensus 39 ~~~l~~ei~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~--------------------------- 91 (397) T protein:vir:48 39 LQAIKNERDTAKMKRDMFKEQYTEARANEVVNMSEEEKKPLTKSEEEVKAGFV--------------------------- 91 (397) T ss_pred HHHHHHHHHHHHHHHHHHHHHHHHHHHhhhhhhhhhccccccchhhHHHHHHH--------------------------- Confidence 00000 0000 000000000000000000 Q ss_pred eeeeeecccceeEEEEEeecCceEEEEccccccccCceeEeccCce---------EEEEEEecCcee--EEEccccccch Q lcl|Aclame:pro 55 GYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATGE---------NMRLELVNGLNL--TVKRQTGRISA 123 (418) Q Consensus 55 ~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~E---------~~~Vtav~g~~~--tv~rg~~~tta 123 (418) ..+...+........... +. .+....++..+.-+...|-+. .+.+..+.+.+. .+.+...... T Consensus 92 ~~~~~~~~~~~~~~~~~~----~~-~t~~~gg~~iP~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~- 165 (397) T protein:vir:48 92 KDFKNLVRGRYQNLLDSK----TD-ASGSDAGLTIPQDIQTAIHTLVRQYDSLQEYVNVENVTTLTGSRVYEKWADITG- 165 (397) T ss_pred HHHHHHHhhhhhHHHHHh----hc-cCCccccccccHHHHHHHHHHHHHHHHHHhhhceeeccCCcceEEEEeecCCCc- Confidence 000011100000000000 00 011111222211111111111 111222222221 1111111100 Q ss_pred hhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHH Q lcl|Aclame:pro 124 AIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETA 203 (418) Q Consensus 124 ~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a 203 (418) ...| ..||...++.....-..+. ..+++-...+.-|.+..+.. ..+-..|-...-...+.+.+|.+ T Consensus 166 -----~a~~------v~E~~~~~~~~~~~~~~v~--~~~~k~~~~~~iS~ell~ds-~~~l~~~v~~~l~~~~~~~~d~~ 231 (397) T protein:vir:48 166 -----LAKL------DDEAGSIGTNDDPKLYPIR--YAIKRYAGISTVTNSLLADS-AENILAWLSGWIAKKVVVTRNKA 231 (397) T ss_pred -----ceee------eccccccccccccceeeEE--eeheeeeeehhhHHHHHhhc-hHHHHHHHHHHHHHHHHHHHHHH Confidence 0111 1355444322111111111 01122222223333334322 22334455556666778889999 Q ss_pred HhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHH Q lcl|Aclame:pro 204 IFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTM 283 (418) Q Consensus 204 ~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i 283 (418) +|+|... +.. .++..+.+++.++..++-..... ...+++++.....| T Consensus 232 il~G~g~----~~~------------------------~~~~~~~d~i~~~~~~l~~~~~~-----~a~~v~n~~~~~~L 278 (397) T protein:vir:48 232 ILEAIAT----LPT------------------------KPTLTKWDDIIDLQAKVDPAIKQ-----TSFFLTNTSGFTAL 278 (397) T ss_pred Hhhcccc----ccc------------------------ccccccHHHHHHHHHHhhhhhcC-----CCEEEECHHHHHHH Confidence 9987531 100 11245667788776665433221 13578899989999 Q ss_pred HhhhhccceEEEcccceeeceEEEEEEcCCeE-EEEEECccccccCCCCCeEEEEchhhc-eeeeccCCCcccccccccC Q lcl|Aclame:pro 284 QDIGRFFGEVTVTQRETSYGMVFTEWKFFKGR-LILKEHPLFSAIGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGG 361 (418) Q Consensus 284 ~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG~-v~vv~n~~l~~~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG 361 (418) .++...+|++.+...- ..|. -.+=+|. |.++.+..+.....+...+++.|++.. .+..-.+..+ +.....+ T Consensus 279 ~~lkd~~G~~i~~~~~-~~~~----~~~l~G~PV~~~~~~~~~~~~~~~~~~~~gd~~~~~~~~~~~~~~i--~~~~~~~ 351 (397) T protein:vir:48 279 KKVKNAFGDYLMERDV-KSPT----GYSIDGFAVKEVADRWLANASSGAMPLYFGDLKQAVTLFDRQQMSL--LSTNIGG 351 (397) T ss_pred HHhhcCCCceeeccCc-CCCC----CceeccceeEEecccccCCcCCCceEEEEEeccceEEEEeecceEE--EEeccch Confidence 8885555665443210 0010 0011342 333445455445556667788888743 3322211111 1111111 Q ss_pred ccccccccccccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 362 GENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 362 ~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) . . -..|......+.-+...+++|+|+.+++-=..+. .|++-|+- T Consensus 352 ~---~--------~~~~~~~~r~~~r~d~~~~~~~a~~~~~~~~~~~--~~~~~~~~ 395 (397) T protein:vir:48 352 G---A--------FETDTTKIRVIDRFDVVATDTESFVPASFKAIAD--QKGNLGST 395 (397) T ss_pred h---h--------hhcCceeEEEEeeeccEEecccceEEEEeccccc--CCCCcccc Confidence 0 0 0013344456677899999999997765433331 11222222 No 92 >protein:vir:79642 Length: 329 # NCBI annotation: HsbB # Family: family:all:463 # MgeID: mge:1872 # MgeName: TLS # Cross-refs: genbank:acc:YP_001285525;genbank:gi:148734508;genbank:GeneID:5220000 Probab=37.36 E-value=1.1 Score=20.31 Aligned_cols=295 Identities=12% Similarity=0.052 Sum_probs=116.4 Q ss_pred hccccceeeeeeeeeeeec--ccceeEEEEEeecCceEEEEccccccccCceeEeccCc-------------eEEEEE-E Q lcl|Aclame:pro 43 VVGSTTAKASTHGYFSKTM--VFASAVVTAEAAADATVLTVENSDGLTKGMIFYNEATG-------------ENMRLE-L 106 (418) Q Consensus 43 ~~~~~~~~~~~~~~~~~~~--~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~~~~-------------E~~~Vt-a 106 (418) +.|..-.+.+.+..++-.. ...+......... +.-.|....+= .++. +++-|+ . T Consensus 1 ~~~~~~~~~~~~d~~~~~~~a~~~~~~~~~~~~~--------~~~~f~~~ql~--~id~~v~e~~~~~l~~~~~i~i~~~ 70 (329) T protein:vir:79 1 MRGNIMSKEMKYDEFEANVIANHMQLRGAKNDAS--------DMGIWTSQELH--KIKAQAYEKEYPAGSALRVFPVTSE 70 (329) T ss_pred CccchhhhhhccchhhhhhHhhhcccccceeccc--------hhhHHHHHHHH--HHHHHHHhhhhcccchhhhcccccC Confidence 2232223344443333221 1111111111000 00112221100 0111 222121 1 Q ss_pred ec-CceeEEEccccccchhhhhCCceEEEeecccccc---cCCcCcccccceeccceeEEEeeeeeechhHH--HHhhhc Q lcl|Aclame:pro 107 VN-GLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEG---SQRPTARSIQPVYVPNFTQIFRNAWALTDTAR--ASYAEA 180 (418) Q Consensus 107 v~-g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EG---ada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~--Av~~~g 180 (418) ++ +......+.+. ..|.+..=| .|.|.....-... ...|++-...++.+-+ +..... T Consensus 71 ~~~~~~~~t~~~~~--------------~~G~a~~~~d~~~dip~vd~~~~~~---~~~i~~~~~~~~~~~~El~~a~~~ 133 (329) T protein:vir:79 71 LSDTDKTFEYQTFD--------------KVGHAKIIADYTDDLSTVDALMTSE---FGKVFRLGNAFLISIDEIKAGQRT 133 (329) T ss_pred CCCceeEEEeeeee--------------cceeeeeecCcccccceeeccccee---EEEEEEEEEEEEecHHHHHHHHHh Confidence 11 11111111111 111111111 1222111111111 2344444444444433 333333 Q ss_pred ccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccC-C-------CCccchHHHH Q lcl|Aclame:pro 181 GYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMP-N-------PTAVTYDDVV 252 (418) Q Consensus 181 ~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~-~-------~a~~te~~l~ 252 (418) +.+.-....+-+...+.+.+....++|.+.. ..-|++.. ..-......+ + +..--.++|. T Consensus 134 g~~l~~~k~~aA~~~~~~~~n~i~f~G~~~~---------g~~GLlN~---p~v~~~~~~~~~~~~w~~kt~~ei~~di~ 201 (329) T protein:vir:79 134 GKSLSTRKANAAQNAHDQLVNHLVFKGSKPH---------KIISVFEH---PNLTTINSAGWNNAAGTGKKPETAQDELE 201 (329) T ss_pred CCChHHHHHHHHHHHHHHhhccEEEeecccc---------cceeeecC---CCccccccCCCCCccccccCHHHHHHHHH Confidence 4454455555566677777778888885421 12333321 0000000000 0 0111346678 Q ss_pred HHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceE-EEEEEcCCeEEEEEECccccccCC-C Q lcl|Aclame:pro 253 DATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMV-FTEWKFFKGRLILKEHPLFSAIGI-S 330 (418) Q Consensus 253 d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~-v~~~~SdfG~v~vv~n~~l~~~~m-p 330 (418) +++.++|...+.. ..+..+.+++.+...|+.-.. ..|.. .+.+.-.|--+.|+.-|+|...+- . T Consensus 202 ~~~~~l~~~s~g~--~~p~~L~Lpp~~~~~L~~~~~------------~~~~tvl~~lk~~~~~l~I~~~~el~~ag~~g 267 (329) T protein:vir:79 202 QAIEKIETLTNGQ--HRANMILIPPSMRKVLMVRMP------------ETTMSYLDYFKQQNGGITIESISELEDIDGAG 267 (329) T ss_pred HHHHHHHHhcCce--ecccEEEecHHHHHHhhcccC------------CCCccHHHHHHHhCCCcEEEEcccccccCCCC Confidence 8888888765432 234567788888777754210 11222 122333344566777777755432 3 Q ss_pred CCeEEEE--chhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 331 PGFAVVV--DVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 331 ~d~~lv~--D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) .+.++++ |++++.+.+- .++...+.-+-+. ..+-.-.-.=++++++-|.|.+.+.|+--- T Consensus 268 ~~~~v~y~~~~~~~~~~vp--~~~~~l~~q~~~~---------------~~~v~~~~r~~Gv~i~~P~ai~~~dGI~~~ 329 (329) T protein:vir:79 268 TKAALVYEKDPMNMSIEIP--EAFNMLTAQPKDL---------------HFKVPCTSKCTGLTIYRPLTLVLIKGLVVG 329 (329) T ss_pred ceEEEEEecCCceEEEecC--cceeeeeceecCc---------------eEEEceeeeEEEEEEECcceeeeeeeeeeC Confidence 3666665 4555554432 2332222211110 111111222236899999999888888444 No 93 >protein:vir:94622 Length: 341 # NCBI annotation: PfWMP4_37 # Family: family:all:2203 # MgeID: mge:1525 # MgeName: Pf-WMP4 # Cross-refs: genbank:acc:YP_762667;genbank:gi:115304375;genbank:GeneID:5142322 Probab=37.32 E-value=1.1 Score=20.30 Aligned_cols=288 Identities=11% Similarity=0.015 Sum_probs=113.6 Q ss_pred cccceeEEEEEeecCc-eEE--EEccc---cccccCceeEecc-CceEEEEEEecCceeEEEccccccchhhhhCCceEE Q lcl|Aclame:pro 61 MVFASAVVTAEAAADA-TVL--TVENS---DGLTKGMIFYNEA-TGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLI 133 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~-t~~--tV~~~---~~~~~~~~~~~~~-~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~ 133 (418) |.+-.+-.-.+++.+. +.+ +|-+. ..|.+..++.+.. +.|. . ..+|+++++-+- +..++..+..|..+. T Consensus 1 ~~~~~~~~~~~~~t~~v~~fipei~s~~i~~~l~~~~v~~~~~~d~~~-~--~~~Gdtv~ip~~-g~~~~~d~~~~~~i~ 76 (341) T protein:vir:94 1 MALGNTITGPSINTQRGQQFIPEQWLSEVQMFRKAKMLDTSVVKTWGA-Q--VKKGDTFHVPRI-SELGVEDKATDVPVG 76 (341) T ss_pred CcchhhhccccccchhHHHHHHHHHHHHHHHHHHhhcchhhccccccc-c--ccCCceEEEecc-CcceeeeecCCCccc Confidence 3222222222221111 111 00010 1122222221110 1110 0 124666666542 222222232222221 Q ss_pred EeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccC Q lcl|Aclame:pro 134 VIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGT 213 (418) Q Consensus 134 ~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~ 213 (418) ..+.. .....+ ...|.-...+.|+.-.+.-. ..|..+...+.....|++.++..++.-.+.... T Consensus 77 --------~~~~~----~~~~~i-tiD~~~~~~~~i~d~d~~~~---~~d~~~~~~~~~~~aLA~~~D~~i~~~~a~~~~ 140 (341) T protein:vir:94 77 --------VQPVN----DTDFVI-TVDTDRTTAVALDDLLEIQA---SYDLRAPYLEAMGYALAKDMTGSILGLRAAVQN 140 (341) T ss_pred --------ccccc----CceEEE-EEeeeeecceeechHHHHhh---ccchHHHHHHHHHHHHHHHHHHHHHHHhhhccc Confidence 11111 011111 23344455677777666543 346667777788888999999877643321111 Q ss_pred cCCccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceE Q lcl|Aclame:pro 214 YNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEV 293 (418) Q Consensus 214 s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~ 293 (418) ... .+. ....+....+.+..++.+.+.++.+.+=++... . ..|++++++.+...|-+..+....- T Consensus 141 -~~~-----~~~------~~~~~~~~t~~~~~~~~~~i~~a~~~Lde~~VP-~--~gR~lvv~P~~~~~Ll~~~~~~~~~ 205 (341) T protein:vir:94 141 -TAS-----QNV------FSSSNGAITGNGQAFSFAVFLAARRLLLEADVP-E--EKIVLLISPGQESALFTIPQFISKD 205 (341) T ss_pred -ccc-----Ccc------ccCccccccCchhhhhHHHHHHHHHHHhhcCCC-c--cCCEEEeCHHHHHHHhhchhhhhhh Confidence 100 000 011112122233456677777776666554432 2 2378999998887774421111110 Q ss_pred EEccc-------ceeeceEEEEEEcCC---eE-----------------------------------E-EEEECcccccc Q lcl|Aclame:pro 294 TVTQR-------ETSYGMVFTEWKFFK---GR-----------------------------------L-ILKEHPLFSAI 327 (418) Q Consensus 294 ~~~~~-------~~~~G~~v~~~~Sdf---G~-----------------------------------v-~vv~n~~l~~~ 327 (418) ..... -+..| |+.|+|+- +. + -++.||+. T Consensus 206 ~~g~~~l~~G~ig~i~G--~~V~~Sn~lp~~~~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~gl~~~~~a--- 280 (341) T protein:vir:94 206 FINNAPIAQGQIGSLMG--VRVIRTSLIGNNSATGWRNGAPTIAPAEATPGFTGSRYLPKQDSFTSLPATFTGNSRP--- 280 (341) T ss_pred ccccchhheeeeeeEec--eEEEEeccccccccccccccccceecccccccccccccccccccccccEEEEEEeccc--- Confidence 00000 11223 33344431 10 0 11112110 Q ss_pred CCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 328 GISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 328 ~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) ....-++||+.+.... .+.+.--+..+...+. |...+.+ =|+-++.+|.+. .-|+++ T Consensus 281 ---v~~~k~~~~~~~~~~~-------~~~~~~~~~~~~~~~~--------~~i~~~~--~~G~~~lrp~~~---v~~~~~ 337 (341) T protein:vir:94 281 ---VHTAVMCHMDWAAAVV-------SKAPRVTQSFENREQV--------WLMVGRQ--AYGARLYRPLHA---VNIHTT 337 (341) T ss_pred ---ccceeeecchhhhccc-------cccccccccchhhhhh--------hhhhhhh--hhcccccCccee---EEEecC Confidence 1222334444332111 1222222222211122 2222222 246778888873 478888 Q ss_pred cccc Q lcl|Aclame:pro 408 KERV 411 (418) Q Consensus 408 ~~~~ 411 (418) .++| T Consensus 338 ~~~~ 341 (341) T protein:vir:94 338 GDTV 341 (341) T ss_pred cCCC Confidence 8888 No 94 >protein:vir:9410 Length: 415 # NCBI annotation: head protein # Family: family:all:21 # MgeID: mge:167 # MgeName: phi 13 # Cross-refs: genbank:acc:NP_803388;genbank:gi:29028700;genbank:GeneID:1258136 Probab=36.25 E-value=1.2 Score=20.18 Aligned_cols=324 Identities=10% Similarity=-0.010 Sum_probs=119.4 Q ss_pred Cc------ceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccc---eeeeeeeeeeeecccceeEEEEE Q lcl|Aclame:pro 1 MS------VYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTT---AKASTHGYFSKTMVFASAVVTAE 71 (418) Q Consensus 1 ~~------~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~---~~~~~~~~~~~~~~~~~~t~~a~ 71 (418) .+ -.....+.......-++. .....+.... .......-|.+.+..... T Consensus 62 ~~~~~~~~~~~~~~~~~~~~~~~~~~------------------~~~~~~~~~~~~~~~~~e~~~~~~~~~~~~~----- 118 (415) T protein:vir:94 62 KEKDGTSENNQQSVEVNEASTYRNQA------------------NINDLGISIQNTKVTSQEVRDFTEYLETRND----- 118 (415) T ss_pred HHHHHhhhhccccccccchhhHHHHH------------------HHHHHHhhhhhhhhhHHHHHHHHHHhhhhhh----- Confidence 00 000000000000000000 0000000000 000000001111100000 Q ss_pred eecCceEEEEccccccccCceeEecc-----Cc----eEEEEEEecCc--eeEEEccccccchhhhhCCceEEEeecccc Q lcl|Aclame:pro 72 AAADATVLTVENSDGLTKGMIFYNEA-----TG----ENMRLELVNGL--NLTVKRQTGRISAAIIAANTKLIVIGTAFE 140 (418) Q Consensus 72 ~~a~~t~~tV~~~~~~~~~~~~~~~~-----~~----E~~~Vtav~g~--~~tv~rg~~~tta~~~~~gt~v~~~g~a~~ 140 (418) ..+ ...+..+ .++..+.-+...+ .. ..+.+..+.+. ++.+.+...+..+. ... T Consensus 119 ~~~--~~~~~~~-g~~~iP~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~~~-------------~v~ 182 (415) T protein:vir:94 119 IQG--GSLKTDS-GFVVIPEEIVTDILKLKEVEFNLDKYVTVKRVTNGSGKYPVVRQSEVAALE-------------KVE 182 (415) T ss_pred hhh--hcccccc-ccccCcHHHHHHHHHHHHhhhhhhhhcceeeccCCceeEEEEeecCCccce-------------ecc Confidence 000 0001111 1122221111011 00 11222333322 33333322221111 113 Q ss_pred cccCCcCcccccceeccceeEEEee----eeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCC Q lcl|Aclame:pro 141 EGSQRPTARSIQPVYVPNFTQIFRN----AWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNG 216 (418) Q Consensus 141 EGada~~~~~~~~~~~~N~tQIf~~----~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~ 216 (418) ||++.+.... ..+.+|--. ..-+.-|.+...-.. .+-..|-...-...+.+.+|.++|+|... +. T Consensus 183 Eg~~~~~~~~------~~~~~i~~~~~k~~~~~~is~ell~ds~-~~~~~~i~~~l~~~~~~~~~~~il~g~g~----g~ 251 (415) T protein:vir:94 183 ELEENPELAV------KPFFQLAYDINTHRGYFRISREAIEDAK-VNVLQELKLWMARTIAATRNKAIIDVITK----GS 251 (415) T ss_pred cccccccccc------ccceeeEeeheeeeeechhhHHHHhhch-HHHHHHHHHHHHHHHHHHHHHHHhhcccc----Cc Confidence 6655543211 122333222 222233334443222 23344555566667789999999987541 11 Q ss_pred ccchhhHHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEc Q lcl|Aclame:pro 217 QPLHTTQGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVT 296 (418) Q Consensus 217 ~~~r~t~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~ 296 (418) .. .. +.... .........+..+.++|.+++..+-..... ...+++++....+|.++...+|++.+. T Consensus 252 ~~-~~---~~~~~-----~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~-----~~~~vmn~~~~~~l~~lkd~~G~~l~~ 317 (415) T protein:vir:94 252 TG-ST---SSGFE-----KEGKKLEVKKAKSLDDIKDAINLNVKPNYE-----HNVAIVSQTMFAKLDKMKDKLGNYLIQ 317 (415) T ss_pred cc-cc---ccccc-----ccccccccccccchHHHHHHHHhhhhhccC-----CCEEEEcHHHHHHHHHhhccCCCeeec Confidence 11 11 11110 011122233457788888887766443222 124778988888898875556665443 Q ss_pred cc------ceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccc Q lcl|Aclame:pro 297 QR------ETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATD 370 (418) Q Consensus 297 ~~------~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~ 370 (418) .. ..-+|.-| +..+.+..-......+++.|+...-+-+.. -+...+.. ... T Consensus 318 ~~~~~~~~~~l~G~pV------------~~~~~~~~~~~~~~~i~~gd~~~~~~~~~~-~~~~v~~~----------~~~ 374 (415) T protein:vir:94 318 PDVKEKTQQRLLGAKI------------EILPDEVLGQKGNNTLIIGNLKDAIVLFDR-SQYQASWT----------DYM 374 (415) T ss_pred cCcCCCCCceecceee------------EEecccccCCCCccEEEEEehhccEEEEee-cceEEEEe----------ccc Confidence 21 12223322 222211000000112555566543221220 01111100 000 Q ss_pred cccccCccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCC Q lcl|Aclame:pro 371 YSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPA 417 (418) Q Consensus 371 ~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~ 417 (418) .+....+.+.-+.+.+.+|+|+.+++--+++++.-.+---+ T Consensus 375 ------~~~~~~r~~~r~d~~~~~~~a~~~~~~~~~~~~~~~~~~~~ 415 (415) T protein:vir:94 375 ------HFGECLMIAVRQDCRILDYKSAIVIEYDDSERGEGDLGLEA 415 (415) T ss_pred ------cCceEEEEEEEeccEEeccccEEEEEEeccCCCCCccccCC Confidence 02334467778899999999999999666665444333333 No 95 >protein:vir:105038 Length: 428 # NCBI annotation: major capsid head protein precursor # Family: family:all:21 # MgeID: mge:1465 # MgeName: phiKO2 # Cross-refs: genbank:acc:YP_006586;genbank:gi:46402092;genbank:GeneID:2777903 Probab=34.86 E-value=1.3 Score=20.02 Aligned_cols=321 Identities=12% Similarity=0.072 Sum_probs=116.5 Q ss_pred CcceeeeeccCCChh---hhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCce Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQ---ELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADAT 77 (418) Q Consensus 1 ~~~~~~~~~~~~~~~---~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t 77 (418) +++.. ..++.. ++.+++.-++ ...+... ..+..-+++ ++......-- T Consensus 98 ~~~~~----~~~~~~~~~~~~~~~~~~~-------------~~~~~~~---~~~~~gg~l----------iP~~~~~~ii 147 (428) T protein:vir:10 98 MSIAA----AQGNLQDAAKFASDELNDQ-------------SVSMAIS---TAAGSGGVL----------IPQNIHSEVI 147 (428) T ss_pred HHHHH----hhhhHHHHHHHhhhhhhhh-------------hHhhhhc---ccccCCccc----------cchhHHHHHH Confidence 11111 122222 2221211100 0000000 000000010 0000000000 Q ss_pred EEEEccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecc Q lcl|Aclame:pro 78 VLTVENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVP 157 (418) Q Consensus 78 ~~tV~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~ 157 (418) ++ +.....+... .-.. |+.-+|+ +++-|-..+.. ..|. .||...+..... -..+ T Consensus 148 ~~-l~~~~~l~~~-------~~~~--~~~~~g~-~~~p~~~~~~~-------a~~v------~Eg~~~~~~~~~-f~~i- 201 (428) T protein:vir:10 148 EL-LRDRTIVRKL-------GARS--IPLPNGN-MSLPRLAGGAT-------ASYT------GENQDAKVSEAR-FDDV- 201 (428) T ss_pred HH-Hhhhchhhhh-------ccee--eecCCcc-eEEEEEeCCcc-------eeee------ccCccccccccc-eeeE- Confidence 00 0000000000 0000 0000111 11111111100 1111 356555432211 0111 Q ss_pred ceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCc Q lcl|Aclame:pro 158 NFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNV 237 (418) Q Consensus 158 N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv 237 (418) .....+=..-+.-|.+..... ..+-..|-...-...+.+.+|.++|+|.. ++..| .||+..... .... T Consensus 202 -~~~~~k~~~~v~is~ell~ds-~~~l~~~i~~~l~~ai~~~~d~~~l~G~G----~~~~p----~Gi~~~~~~--~~~~ 269 (428) T protein:vir:10 202 -KLTAKTMIAMVPISNALIGRA-GFNVEQLVLQDILTAISVREDKAFMRDDG----TGDTP----IGMKARATQ--WNRL 269 (428) T ss_pred -EeeeEEEEEeehhhHHHHhhh-hHHHHHHHHHHHHHHHHHHHHHHHhccCC----CCccc----ccccccccc--cccc Confidence 112222233344444444432 22334555566667789999999998743 33333 266532211 1111 Q ss_pred cccCCCCccchHHHHHHHHHHHH--hcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccc--eeeceEEEEEEcCC Q lcl|Aclame:pro 238 NAMPNPTAVTYDDVVDATIDAFK--WSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRE--TSYGMVFTEWKFFK 313 (418) Q Consensus 238 ~~~~~~a~~te~~l~d~~~~~~~--~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~--~~~G~~v~~~~Sdf 313 (418) ......+..+.+.+..++..+.. ......... ..+++++.....|.++...+|++.+.... .-+|.- T Consensus 270 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~-~~~v~n~~~~~~L~~lkd~~G~~i~~~~~~g~l~G~p-------- 340 (428) T protein:vir:10 270 LPWAADAAVNLDTIDTYLDSIILMSMDGNSNMIS-SGWGMSNRTYMKLFGLRDGNGNKVYPEMAQGMLKGYP-------- 340 (428) T ss_pred ccccccccccHHHHHHHHHHHHHhhhcccccccc-CEEEEcHHHHHHHHHhhccCCceeccCCCCCeeecee-------- Confidence 12222334444444444333321 111111112 23567888888888876556665543211 122322 Q ss_pred eEEEEEECccccc---cCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEE Q lcl|Aclame:pro 314 GRLILKEHPLFSA---IGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWAL 390 (418) Q Consensus 314 G~v~vv~n~~l~~---~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tL 390 (418) |+.+..++. .+.....+++.|++.+-+..-. +...+........+- .+.....--.|-..-+.+.-+.+ T Consensus 341 ----v~~~~~~p~~~~~~~~~~~i~~gd~s~~~i~~~~--~i~i~~~~~~~~~~~--~~~~~~~f~~~~~~~R~~~r~d~ 412 (428) T protein:vir:10 341 ----IQRTSAIPANLGEGGKESEIYFADFNDVVIGEDG--NMKVDFSKEASYIDT--DGKLVSAFSRNQSLIRVVTEHDI 412 (428) T ss_pred ----eEEeccccccccCCCccceEEEEecceEEEEEec--ceEEEeecccccccc--cccccchhhcchhheeeeeeeCc Confidence 333322211 1111235677788766544321 111121111110000 00000000014455567778888 Q ss_pred EEecccceEEeecCcc Q lcl|Aclame:pro 391 ELLNPQGCAVITGLQK 406 (418) Q Consensus 391 ev~N~kA~a~I~gL~~ 406 (418) .+.+|+|..+++|+.= T Consensus 413 ~v~~p~a~~~~t~~~~ 428 (428) T protein:vir:10 413 GFRHPEGLVLGTGVLF 428 (428) T ss_pred eeeccceEEEEeccCC Confidence 9999999999999987 No 96 >protein:vir:1433 Length: 435 # NCBI annotation: putative major capsid protein # Family: family:all:21 # MgeID: mge:30 # MgeName: phiE125 # Cross-refs: genbank:acc:NP_536362;genbank:gi:17975167;genbank:GeneID:929171 Probab=34.25 E-value=1.3 Score=19.95 Aligned_cols=350 Identities=12% Similarity=0.073 Sum_probs=118.3 Q ss_pred Cc--ceee--eeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccc--cceeeeeeeeeeeecccceeEEEEEeec Q lcl|Aclame:pro 1 MS--VYAG--IFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGS--TTAKASTHGYFSKTMVFASAVVTAEAAA 74 (418) Q Consensus 1 ~~--~~~~--~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~--~~~~~~~~~~~~~~~~~~~~t~~a~~~a 74 (418) ++ +..+ -....+.+..-. +...++. +..-..-.+..+....+. .......-.++..... ..+++ .+. T Consensus 65 ~~~~~~~~~~~~~~~~~~~~~~-~~~~~~~--~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~---~~~~~-~t~ 137 (435) T protein:vir:14 65 AAVPVDPNPTAVAAPAAAPVHA-QPKALEV--KGAKMARMVRALAAARGDAQLASKLAIERGFGEEVA---MSLNT-LSP 137 (435) T ss_pred hcccccchhhhhhhcccccccc-ccchhhh--hHHHHHHHHHHHHhhcchhhHHHHHHHhhhhhhhhh---hhccc-CCc Confidence 11 1111 001111100000 0000000 000000001111100000 0000000011110000 00000 011 Q ss_pred CceEEEEccccccccCceeEeccCceEE---EEEEe--cCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcc Q lcl|Aclame:pro 75 DATVLTVENSDGLTKGMIFYNEATGENM---RLELV--NGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTAR 149 (418) Q Consensus 75 ~~t~~tV~~~~~~~~~~~~~~~~~~E~~---~Vtav--~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~ 149 (418) ..+-..|.. .+. ..|+......-.+ .++.+ ....+++-+-..+. ...|. .||...+... T Consensus 138 ~~gg~~vP~--~~~-~~ii~~l~~~~~i~~~~~~~~~~~~~~~~~p~~~~~~-------~a~~v------~E~~~~~~~~ 201 (435) T protein:vir:14 138 GAGGVLVPE--NLS-SEVIELLRPKSVVRKLGARTLPLSNGNITIPRLKGGA-------IVGYI------GADTDIPTTQ 201 (435) T ss_pred CCCccccch--hHH-HHHHHHHhhhchhhhhcceeeecCCCceEEEEEeCCc-------ceeee------ccCccccccc Confidence 111111110 000 0011000000000 01111 11122222211111 11121 3665544322 Q ss_pred cccceeccceeEEE----eeeeeechhHHHHhhhcccchHHH-HHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHH Q lcl|Aclame:pro 150 SIQPVYVPNFTQIF----RNAWALTDTARASYAEAGYSNITE-SRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQG 224 (418) Q Consensus 150 ~~~~~~~~N~tQIf----~~~v~VSgTa~Av~~~g~~dela~-q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~G 224 (418) + .+.+|- +-...+.-|.+..+-.+..-.+.. -...-...+.+.+|.+||+|.- .+..| .| T Consensus 202 --~-----~f~~i~~~~~k~~~~~~iS~ell~ds~~~~~l~~~i~~~l~~ai~~~~d~a~l~G~G----~~~~p----~G 266 (435) T protein:vir:14 202 --Q-----QFDDLKLTAKKMAALVPIANDLIKYAGVNPNVDQIVVGDLTAAIGAREDKAFIRDDG----TANTP----KG 266 (435) T ss_pred --c-----ceeEEEeeeEEEEEeehhhHHHHHhhccCHHHHHHHHHHHHHHHHHHHHHHhhccCC----CCccc----cc Confidence 1 233333 333333444444444332212433 3444456689999999998842 22222 35 Q ss_pred HHHHHhhccccCccccCCC--CccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceee Q lcl|Aclame:pro 225 IVDAVRQYAPDNVNAMPNP--TAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSY 302 (418) Q Consensus 225 I~~~i~~~~~~nv~~~~~~--a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~ 302 (418) |+... ...++.....+ .....+++.+++..+....... ....+++++.....|.++.-.+|++.+... .. T Consensus 267 i~~~~---~~~~~~~~~~~~~~~~~~~~~~~l~~~~~~~~~~~---~~~~~v~n~~~~~~L~~lkd~~G~~l~~~~--~~ 338 (435) T protein:vir:14 267 LRFWA---LPSNVITASDASTLQKIETDLGKVILALENADANL---TQPGWIMAPRTFRFLEGLRDGNGNKVYPEL--AN 338 (435) T ss_pred eeecc---cccceeccccccchhhHHHHHHHHHHHhhhccccc---cCCEEEEcHHHHHHHHHhhccCCceeccCC--CC Confidence 54221 11222221111 1223345555554444322111 112466788888888887656666655321 11 Q ss_pred ceEEEEEEcCCeEEEEEECccccc---cCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccc Q lcl|Aclame:pro 303 GMVFTEWKFFKGRLILKEHPLFSA---IGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDA 379 (418) Q Consensus 303 G~~v~~~~SdfG~v~vv~n~~l~~---~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da 379 (418) | +=+| +.|+.++.+.. .......+++.|++.+-+.-- .+...+.....+..+- .+.....-..|. T Consensus 339 g-------~l~G-~Pv~~~~~~p~~~~~~~~~~~i~~gd~s~~~i~~~--~~~~~~~~~~~~~~~~--~~~~~~~f~~~~ 406 (435) T protein:vir:14 339 G-------MLKG-YPVGKTTQVPINLGETGKESEIYFTDFGDVFIGEE--ETLEIDYSKEATYKDA--DGHMVSAFQRDQ 406 (435) T ss_pred C-------eeec-ceeEeeccccccccCCCccceEEEeecccEEEEEe--cccEEEEecccccccc--ccchhhhhhcCh Confidence 1 1123 13333332211 011223577777776432211 1111111111111000 000000001145 Q ss_pred cccEEEEEEEEEEecccceEEeecCcccc Q lcl|Aclame:pro 380 QGGSLTSEWALELLNPQGCAVITGLQKAK 408 (418) Q Consensus 380 ~k~~i~~E~tLev~N~kA~a~I~gL~~~~ 408 (418) ..-+.+.=+.+.+.+|+|..+++|+.=-. T Consensus 407 ~~~r~~~r~d~~~~~~~a~~~l~~~~~~~ 435 (435) T protein:vir:14 407 TLIRVIAKNDFGPRHVESIAVLAGVAWGA 435 (435) T ss_pred hheeeeeeeCceeecccceEEEecCCCCC Confidence 55667788889999999999999985432 No 97 >protein:vir:96833 Length: 275 # NCBI annotation: ORF015 # Family: family:all:522 # MgeID: mge:1642 # MgeName: EW # Cross-refs: genbank:acc:YP_240157;genbank:gi:66395822;genbank:GeneID:5133174 Probab=33.32 E-value=1.4 Score=19.84 Aligned_cols=256 Identities=14% Similarity=0.061 Sum_probs=114.9 Q ss_pred Eccccc-cccCceeE----eccCc---eEEEEEEecCceeEEEccccccchhhhhCCceEEE-----eecc--cccccCC Q lcl|Aclame:pro 81 VENSDG-LTKGMIFY----NEATG---ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIV-----IGTA--FEEGSQR 145 (418) Q Consensus 81 V~~~~~-~~~~~~~~----~~~~~---E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a--~~EGada 145 (418) -+.... -..+.|+- .-+.+ +.++...+ .++-+-+. ...|..+.+ +|.+ ..||.+. T Consensus 1 ~~~~~~T~l~d~i~PEv~~~~v~~~~~~~~~~~~~----~~~~~~l~------g~~G~tv~iP~~~~ig~a~~~~~g~~i 70 (275) T protein:vir:96 1 MALENMTKLANMVNPEVLAPMMQAELDKKLKFAQF----ADIDNTLV------GQPGNTITFPAFVYSGDAKVVPEGEEI 70 (275) T ss_pred CCCcccchhhhhhchHHHHHHHHHHHHHhhhhccc----ceeccccc------CCCCCEEEeeeeccCCccccccCCCCc Confidence 333221 11111110 00000 11111111 00000000 111322222 1211 2344444 Q ss_pred cCcccccceeccceeEEE--eeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhH Q lcl|Aclame:pro 146 PTARSIQPVYVPNFTQIF--RNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQ 223 (418) Q Consensus 146 ~~~~~~~~~~~~N~tQIf--~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~ 223 (418) +...-.... .-..|. .+.|++++-+... ...|-+..-......-+.+.+++.++.--+. + T Consensus 71 ~~~~lt~~~---~~~~i~~~~~~~~i~D~~~~~---~~~d~~~~~~~~~a~~~a~~~d~~ll~~l~~-----a------- 132 (275) T protein:vir:96 71 PIDLIETKK---RQATIRKIGKGTVLTDEALLS---GYGDPKGEAVRQHGLAIANKVDNDVLEALQG-----A------- 132 (275) T ss_pred chhhcccce---eeEEeehhcccccccHHHHHh---hccchHHHHHHHHHHHHHHHHHHHHHHHHhc-----c------- Confidence 332222221 122333 4445555554433 2335566666666677888888877621110 0 Q ss_pred HHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce-ee Q lcl|Aclame:pro 224 GIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET-SY 302 (418) Q Consensus 224 GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~-~~ 302 (418) ++ ..+...++.+.+.++.+++=+ . ....++++|++.....|-+... .++..... .- T Consensus 133 -----------~~---~~~~~~~~~d~i~dA~~~lgd----~-~~~~~~ivv~p~~~~~L~k~~~----~~f~~~~~~g~ 189 (275) T protein:vir:96 133 -----------TL---KVEADITKLAGLQTAIDKFND----E-DLEPMVLFVNPLDAGKLRASAT----DNFTRATLLGD 189 (275) T ss_pred -----------cc---cccccccCHHHHHHHHHHhcc----c-cCCccEEEeCHHHHHHHHhccc----ccccccccccc Confidence 00 012235688888888877632 2 2356799999998877755321 12111111 11 Q ss_pred ceEEEE-EEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccc Q lcl|Aclame:pro 303 GMVFTE-WKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQG 381 (418) Q Consensus 303 G~~v~~-~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k 381 (418) +....- |-+-.| +.|+.++ ++|.++++++.+..+.+.. .++...|..+..- +..|... T Consensus 190 ~~~~~G~ig~~~G-~~Vi~s~-----~~p~~t~~i~~~gA~~~~~--~~~~~vE~~Rd~~-------------~~~d~i~ 248 (275) T protein:vir:96 190 NVIVKGAFGEALG-AIIVRSN-----KIKEGEAILAKRGAVKLIT--KRDFFLETERHAS-------------HKSTALF 248 (275) T ss_pred cceeccccceecC-eeEEEeC-----CCCcceEEEEeccceeeee--cCCcccccccchh-------------hcCcEEE Confidence 111111 111123 3666664 4578999999988877533 4665566554332 2224443 Q ss_pred cEEEEEEEEEEecccceEEeecCccccccc Q lcl|Aclame:pro 382 GSLTSEWALELLNPQGCAVITGLQKAKERV 411 (418) Q Consensus 382 ~~i~~E~tLev~N~kA~a~I~gL~~~~~~~ 411 (418) +..+ |+..+.||.+..+++= +++---| T Consensus 249 ~~~~--y~~~~~~~~~vv~~t~-~~~~~~~ 275 (275) T protein:vir:96 249 SDKH--YVAYLYDESKVVKITK-SASGLGV 275 (275) T ss_pred EeEE--EEEEEEcCccEEEEEe-cccccCC Confidence 3333 6889999998888741 2221112 No 98 >protein:vir:5694 Length: 357 # NCBI annotation: gpN # Family: family:all:201 # MgeID: mge:120 # MgeName: L-413C # Cross-refs: genbank:acc:NP_839853;genbank:gi:30065708;genbank:GeneID:1260602 Probab=33.06 E-value=0.53 Score=22.07 Aligned_cols=327 Identities=12% Similarity=0.052 Sum_probs=131.3 Q ss_pred hhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEec Q lcl|Aclame:pro 17 LNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNE 96 (418) Q Consensus 17 ~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~ 96 (418) ++++ .+..-| .-+.++-.+.|...... -++|+..-...+ ++-. . -..+++.+....++. T Consensus 1 M~~~------tr~~~~--~y~~~~A~~ngv~~~d~--~~~FsV~P~v~q-~L~~-------~-i~ess~FL~~INvv~-- 59 (357) T protein:vir:56 1 MRQE------TRFKFN--AYLSRVAELNGIDAGDV--SKKFTVEPSVTQ-TLMN-------T-MQESSDFLTRINIVP-- 59 (357) T ss_pred CChH------HHHHHH--HHHHHHHHHhCCChHHh--cceeecCHHHHH-HHHH-------H-HHHHHHHhccCCccc-- Confidence 1000 000000 11112222222111100 012221100000 0000 0 011333333333321 Q ss_pred cCceEEEEEEecCceeEE--EccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHH Q lcl|Aclame:pro 97 ATGENMRLELVNGLNLTV--KRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTAR 174 (418) Q Consensus 97 ~~~E~~~Vtav~g~~~tv--~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~ 174 (418) |..+.|.++-+ .....++|... +. -.| +-.|.. ..... .-.|+=-.--..+++-. T Consensus 60 -------V~e~~Ge~i~lg~~g~iagrtdT~---~~-~~R------~~~~~~--~l~~~---~Y~c~qTn~dt~i~Y~~- 116 (357) T protein:vir:56 60 -------VSEMKGEKIGIGVTGSIASTTDTA---GG-TER------QPKDFS--KLASN---KYECDQINFDFYIRYKT- 116 (357) T ss_pred -------cccceeeEEecccCccccccccCC---CC-CCc------cccccc--ccCCC---ccEEEEeeecccccHHH- Confidence 33333444322 11111111100 00 000 000000 00000 01222222223333332 Q ss_pred HHhhhcccchHHHHHHH-HHHHHHHHHhHHHhcCcccccCcCCccchh----hHHHHHHHhhccccCcccc------C-- Q lcl|Aclame:pro 175 ASYAEAGYSNITESRRD-CMDFHATEQETAIFFGQAFMGTYNGQPLHT----TQGIVDAVRQYAPDNVNAM------P-- 241 (418) Q Consensus 175 Av~~~g~~dela~q~~k-k~~EikrdmE~a~i~G~k~~~~s~~~~~r~----t~GI~~~i~~~~~~nv~~~------~-- 241 (418) ........+|...+.. -.+.+.+||-.+=++|+..-..++-..-.. =-|++-.++.+.+..+... . T Consensus 117 -lD~WA~~~dF~~r~~~~i~~~~ALD~i~IGfNGts~A~~Td~~~nPllqDVN~GWlQ~~Re~ap~rVm~~~~~~~g~~~ 195 (357) T protein:vir:56 117 -LDLWARYQDFQLRVRNAIIKRQSLDFIMAGFNGVKRAETSDRSSNPMLQDVAVGWLQKYRNEAPARVMSKVTDEEGHTT 195 (357) T ss_pred -HHHHhcChhHHHHHHHHHHHHHhhccceecccceeeeccCChhhCcCccccchhHHHHHHhhchhhhhccccccCCccc Confidence 2222233456555544 345678999999999997554443221111 1277777777665544321 0 Q ss_pred -----CCCccchHHHHHHHHHHHHhcccCC--CceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEc--C Q lcl|Aclame:pro 242 -----NPTAVTYDDVVDATIDAFKWSVNVG--DNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKF--F 312 (418) Q Consensus 242 -----~~a~~te~~l~d~~~~~~~~g~~~~--g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~S--d 312 (418) -|..-++..|..++.++...-...- ....=+++||.++.. .+....-++- ...+++.. .+.+.| - T Consensus 196 ~~~i~~G~~gdy~NLDalV~D~~~~lI~~~~~~d~dLVvivG~dLla--~k~~~l~n~~-~~pTE~~A---a~~i~s~k~ 269 (357) T protein:vir:56 196 SEVIRVGKGGDYASLDALVMDATNNLIEPWYQEDPDLVVIVGRQLLA--DKYFPIVNKE-QDNSEMLA---ADVIISQKR 269 (357) T ss_pred cceeeecCCCCcccHHHHHHHHHhccCChHHhcCCCEEEEEchhhhh--hhhhhHhhcc-CChHHHHH---HHHHHHhhh Confidence 1122356777777777765322211 111247889988764 2211100110 11223322 222333 4 Q ss_pred CeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC---CcccccccccCccccccccccccccCccccccEEEEEEE Q lcl|Aclame:pro 313 KGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR---NAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWA 389 (418) Q Consensus 313 fG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r---~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~t 389 (418) +|-+..+.-|+| |++.++|--.++|++.|..|- ....++ .+. |.. + ++.. --+ T Consensus 270 iGGl~a~~~PfF-----P~~~llVT~L~NLsIY~Q~gs~RR~~~d~p-~r~----riE--~--------y~s~----Ne~ 325 (357) T protein:vir:56 270 IGNLPAVRVPYF-----PADAMLITKLENLSIYYMDDSHRRVIEENP-KLD----RVE--N--------YESM----NID 325 (357) T ss_pred hCCceeEEcccc-----CCCceEEeeccccEEEEecCcEEEEEEecc-ccc----ccc--c--------hhhh----cce Confidence 677888888875 889999999999999999652 221111 111 111 1 1100 012 Q ss_pred EEEecccceEEeecCcccccccC-CCCCCC Q lcl|Aclame:pro 390 LELLNPQGCAVITGLQKAKERVY-LTAPAP 418 (418) Q Consensus 390 Lev~N~kA~a~I~gL~~~~~~~~-~~~~~~ 418 (418) -.|.+..+.|.|++++-+++..| ..+|.| T Consensus 326 YvVEd~~~~a~iE~i~i~~~~~~~~~~~~~ 355 (357) T protein:vir:56 326 YVVEDYAAGCLVEKIKVGDFSTPAKATEEP 355 (357) T ss_pred eeeeccccEEEeeeeeeccCCCCcccCCCC Confidence 23445556889999877754443 344555 No 99 >protein:vir:2016 Length: 357 # NCBI annotation: gpN # Family: family:all:201 # MgeID: mge:315 # MgeName: P2 # Cross-refs: genbank:acc:NP_046760;genbank:gi:9630331;genbank:GeneID:1261541 Probab=29.78 E-value=0.7 Score=21.42 Aligned_cols=327 Identities=12% Similarity=0.055 Sum_probs=129.6 Q ss_pred hhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEEEccccccccCceeEec Q lcl|Aclame:pro 17 LNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYNE 96 (418) Q Consensus 17 ~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~~ 96 (418) ++++ .+..-| .-+.++-.+.|...... -++|+..-...+ ++-. . -..+++.+....++. T Consensus 1 M~~~------tr~~~~--~y~~~~A~~ngv~~~d~--~~~FsV~P~v~q-~L~~-------~-i~ess~FL~~INvv~-- 59 (357) T protein:vir:20 1 MRQE------TRFKFN--AYLSRVAELNGIDAGDV--SKKFTVEPSVTQ-TLMN-------T-MQESSDFLTRINIVP-- 59 (357) T ss_pred CChH------HHHHHH--HHHHHHHHHhCCChHHh--cceeecCHHHHH-HHHH-------H-HHHHHHHhccCCccc-- Confidence 1000 000000 11112222222111100 012221100000 0000 0 011333333333321 Q ss_pred cCceEEEEEEecCceeEE--EccccccchhhhhCCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHH Q lcl|Aclame:pro 97 ATGENMRLELVNGLNLTV--KRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTAR 174 (418) Q Consensus 97 ~~~E~~~Vtav~g~~~tv--~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~ 174 (418) |..+.|.++-+ .....++|... +. -.| +-.|.. ..... .-.|+=-.--..+++-. T Consensus 60 -------V~e~~Ge~i~lg~~g~iagrtdT~---~~-~~R------~~~~~~--~l~~~---~Y~c~qTn~dt~i~Y~~- 116 (357) T protein:vir:20 60 -------VSEMKGEKIGIGVTGSIASTTDTA---GG-TER------QPKDFS--KLASN---KYECDQINFDFYIRYKT- 116 (357) T ss_pred -------cccceeeEEecccCccccccccCC---CC-CCc------cccccc--ccCCC---ccEEEEeeecccccHHH- Confidence 33333444321 00111111100 00 000 000000 00000 01222222223333332 Q ss_pred HHhhhcccchHHHHHHH-HHHHHHHHHhHHHhcCcccccCcCCccchh----hHHHHHHHhhccccCcccc--------- Q lcl|Aclame:pro 175 ASYAEAGYSNITESRRD-CMDFHATEQETAIFFGQAFMGTYNGQPLHT----TQGIVDAVRQYAPDNVNAM--------- 240 (418) Q Consensus 175 Av~~~g~~dela~q~~k-k~~EikrdmE~a~i~G~k~~~~s~~~~~r~----t~GI~~~i~~~~~~nv~~~--------- 240 (418) ........+|...+.. -.+.+.+||-.+=++|+..-..++-..-.. =-|++-.++.+.+..+... T Consensus 117 -lD~WA~~~dF~~r~~~~i~~~~ALD~i~IGfNGts~A~~Td~~~nPllqDVN~GWlQ~~Re~ap~rVm~~~~~~~g~~~ 195 (357) T protein:vir:20 117 -LDLWARYQDFQLRIRNAIIKRQSLDFIMAGFNGVKRAETSDRSSNPMLQDVAVGWLQKYRNEAPARVMSKVTDEEGRTT 195 (357) T ss_pred -HHHHhcChhHHHHHHHHHHHHHhhccceecccceeeeccCChhhCcCccccchhHHHHHHhhchhhhhccccccccccc Confidence 2222233456555544 345678999999999997554443221111 1277767777655544321 Q ss_pred ----CCCCccchHHHHHHHHHHHHhcccCC--CceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEc--C Q lcl|Aclame:pro 241 ----PNPTAVTYDDVVDATIDAFKWSVNVG--DNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKF--F 312 (418) Q Consensus 241 ----~~~a~~te~~l~d~~~~~~~~g~~~~--g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~S--d 312 (418) .-|..-++..|..++.++...-...- ....=+++||.++.. .+....-++- ...+++.. .+.+.| - T Consensus 196 ~~~i~~G~~gdy~NLDalV~D~~~~lI~~~~~~d~dLVvivG~dLla--~k~~~l~n~~-~~ptE~~A---a~~i~s~k~ 269 (357) T protein:vir:20 196 SEVIRVGKGGDYASLDALVMDATNNLIEPWYQEDPDLVVIVGRQLLA--DKYFPIVNKE-QDNSEMLA---ADVIISQKR 269 (357) T ss_pred cceeeecCCCCcccHHHHHHHHHhccCChHHhcCCCEEEEEchhhhh--hhhhhHhhcc-CChHHHHH---HHHHHHhhh Confidence 01112356777777777765322211 111247889988764 2211100110 11223322 222333 4 Q ss_pred CeEEEEEECccccccCCCCCeEEEEchhhceeeeccCC---CcccccccccCccccccccccccccCccccccEEEEEEE Q lcl|Aclame:pro 313 KGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGR---NAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWA 389 (418) Q Consensus 313 fG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r---~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~t 389 (418) +|-+..+.-|+| |++.++|--.++|++.+..|- ....++ .+. |.. +|-. ..- + T Consensus 270 iGGl~a~~~PfF-----P~~~ilVT~L~NLsIY~Q~gs~RR~~~d~p-~r~----riE--~y~s-----~Ne-------~ 325 (357) T protein:vir:20 270 IGNLPAVRVPYF-----PADAMLITKLENLSIYYMDDSHRRVIEENP-KLD----RVE--NYES-----MNI-------D 325 (357) T ss_pred hCCceeEEcccc-----CCCceEEeeccccEEEEecCcEEEEEEecc-ccc----ccc--chhh-----hcc-------e Confidence 677888888875 889999999999999999652 221111 111 111 1100 011 2 Q ss_pred EEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 390 LELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 390 Lev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) -.|.+..+.|.|++++-+++..|....+- T Consensus 326 YvVEd~~~~a~iE~i~~~~~~~p~~~~~~ 354 (357) T protein:vir:20 326 YVVEDYAAGCLVEKIKVGDFSTPAKATAE 354 (357) T ss_pred eeeeccccEEEeeeeeeccccCCccCCCC Confidence 23445556788999877755433322222 No 100 >protein:vir:104342 Length: 314 # NCBI annotation: hypothetical protein # Family: family:all:463 # MgeID: mge:1593 # MgeName: RTP # Cross-refs: genbank:acc:YP_398971;genbank:gi:81343955;genbank:GeneID:3778874 Probab=29.24 E-value=1.7 Score=19.35 Aligned_cols=292 Identities=13% Similarity=0.059 Sum_probs=111.9 Q ss_pred eeeeeeeee-eecccceeEEEEEeecCceEEEEccccccccCceeEe---c-cCceEEEEE-Eec-CceeEEE-cccccc Q lcl|Aclame:pro 50 KASTHGYFS-KTMVFASAVVTAEAAADATVLTVENSDGLTKGMIFYN---E-ATGENMRLE-LVN-GLNLTVK-RQTGRI 121 (418) Q Consensus 50 ~~~~~~~~~-~~~~~~~~t~~a~~~a~~t~~tV~~~~~~~~~~~~~~---~-~~~E~~~Vt-av~-g~~~tv~-rg~~~t 121 (418) -+|+++ .+ -.+.....++-.....++..+.+..-+ +....+... + ...+.+-|. .++ +.. +++ +.+. T Consensus 1 ~~~~~~-~~~~~~~~~~~~~~~~~~d~~~~fl~~ql~-~id~~v~e~~~~~~~~~~~i~v~~~~~~~~e-t~~~~~~e-- 75 (314) T protein:vir:10 1 MAIKFD-AEQAKITTHLEQMGVEKADAAGIWAVSQLT-AALNRAYEKEYAENSVVNIFPVTNEIPGHAK-YFEYPEFD-- 75 (314) T ss_pred CccchH-HHHHHHHHHHHhhcccchhhhHHHHHHHHH-HHHHHHhhhhccccccceeeccccCCCCcee-EEEeeeec-- Confidence 233333 11 111111111111111111111111000 000000000 0 011222221 111 111 111 1111 Q ss_pred chhhhhCCceEEEeecccccccCCcCcccccceecc-c--eeEEEeeeeeechhHH--HHhhhcccchHHHHHHHHHHHH Q lcl|Aclame:pro 122 SAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVP-N--FTQIFRNAWALTDTAR--ASYAEAGYSNITESRRDCMDFH 196 (418) Q Consensus 122 ta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~-N--~tQIf~~~v~VSgTa~--Av~~~g~~dela~q~~kk~~Ei 196 (418) ..|.+..=| |..+ -.|.+.++ + ..+|++-...+..+.+ +.....+.+.-.....-....+ T Consensus 76 ------------~~G~a~~~~-d~~~--dip~vd~~~~~~~~~i~~~~~~~~~~~~El~~a~~~g~~l~~~k~~aA~~~~ 140 (314) T protein:vir:10 76 ------------GVGIAQIIA-DYSD--DLPLVDAFMTEKQGKVFRFGNAFLISTDEIKAGAATGQSLSARKQALAFEAH 140 (314) T ss_pred ------------cccceeeeC-Cccc--ccceeecccceeEEEEEEEEeeEEecHHHHHHHHHhCCChHHHHHHHHHHHH Confidence 111111111 1110 01222211 1 3344554444444433 3333444453344445555666 Q ss_pred HHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccccCCCCc-----cchHHHHHHHHHHHHhcccCCCceeE Q lcl|Aclame:pro 197 ATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNAMPNPTA-----VTYDDVVDATIDAFKWSVNVGDNTQR 271 (418) Q Consensus 197 krdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~~~~~a~-----~te~~l~d~~~~~~~~g~~~~g~~~~ 271 (418) .+.+.+..++|.+.. ..-|++. . .++....+... --.+|+..++.++|..++.. ..+. T Consensus 141 ~~~~n~i~f~G~~~~---------g~~GLlN---~---p~v~~~~~~~~WaT~~ei~~Di~~~~~~l~~~s~g~--~~p~ 203 (314) T protein:vir:10 141 DNLLDKLVWSGSAPH---------GIVSVFD---Q---PNINNVVATPNWSVPQNAIDDVTAMIDAVESSTQGL--HHVT 203 (314) T ss_pred HHhhceEEEeecccc---------cceeEee---c---CCCccccCCCCcccHHHHHHHHHHHHHHHHHhcCcc--ccce Confidence 677777777775422 1223331 1 01111111111 12567788888888765432 3345 Q ss_pred EEEeChHHHHHHHhhhhccceEEEcccceeeceEE-EEEEcCCeEEEEEECccccccCCCC-CeEEEE--chhhceeeec Q lcl|Aclame:pro 272 VMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVF-TEWKFFKGRLILKEHPLFSAIGISP-GFAVVV--DVPAVKLAYM 347 (418) Q Consensus 272 ~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v-~~~~SdfG~v~vv~n~~l~~~~mp~-d~~lv~--D~~~~~~~~L 347 (418) .+.+++.+...|+.... ..|..+ +.+.-++=-+.|+.-|.|...+... +.++++ |++++.+++- T Consensus 204 ~l~Lpp~~~~~L~~~~~------------~~~~tvl~~l~~n~~~l~I~~~~el~~ag~~g~~~~v~y~~~~~~~~~~vp 271 (314) T protein:vir:10 204 DILLPASARRVMQGLVP------------QTNLSYGELFTRNNPGLTIRFLQFLDNYDGAGGKAALAFEKSPLNMSIEIP 271 (314) T ss_pred eEEecHHHHHhhccccc------------CCCccHHHHHHHhCCCcEEEEcccccccCCCcceEEEEEecCCcEEEEecC Confidence 67778887776654211 112221 1122223345666667665544322 334444 3555555432 Q ss_pred cCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 348 DGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 348 ~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) .++..-+.-+.+ . ..+-.-+-.=.+++++-|.|.+.+.|++-| T Consensus 272 --~~~~~l~~e~~~-----~----------~~~~~~~~r~~Gv~i~~P~ai~~~dGI~~~ 314 (314) T protein:vir:10 272 --EVTNVLPAQPKD-----L----------HFRYPVTSKATGLIVYRPLTMAVIKGITFA 314 (314) T ss_pred --ccceeecceecC-----c----------eEEEcceeeeEEEEEECcceeEeeeeeecC Confidence 122211111111 1 111111122247999999999999999999 No 101 >protein:vir:105334 Length: 276 # NCBI annotation: putative phage major capsid protein # Family: family:all:522 # MgeID: mge:1679 # MgeName: PH15 # Cross-refs: genbank:acc:YP_950669;genbank:gi:119967839;genbank:GeneID:4643213 Probab=28.94 E-value=1.7 Score=19.32 Aligned_cols=258 Identities=15% Similarity=0.078 Sum_probs=119.4 Q ss_pred Eccccccc----cCceeEeccCc---eEEEEEEecCceeEEEccccccchhhhhCCceEEE-----eecc--cccccCCc Q lcl|Aclame:pro 81 VENSDGLT----KGMIFYNEATG---ENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIV-----IGTA--FEEGSQRP 146 (418) Q Consensus 81 V~~~~~~~----~~~~~~~~~~~---E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a--~~EGada~ 146 (418) -++...-. .+.++..-+.+ +.++...+.-..-+.. |.. |..+.+ +|.+ ..||.+.+ T Consensus 1 Ma~~~T~l~d~i~Pev~~~~v~~~~~~~~~~~~~~~~~~~l~-g~~---------G~ti~iP~~~~igda~~~~eg~~i~ 70 (276) T protein:vir:10 1 MAQGTTTKSTQIVPEVLAPMMQAELDKKLRFAQFADIDSTLV-GQP---------GDTLTFPAFVYSGDATVVPEGQKIP 70 (276) T ss_pred CCcceeehhhhhchHHHHHHHHHHHHhhhhhcccceeccccc-CCC---------CCEEEeeeecCCCccccccCCCccC Confidence 22211111 11111100000 1111111100000000 111 222221 1222 34665544 Q ss_pred CcccccceeccceeEEE--eeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHH Q lcl|Aclame:pro 147 TARSIQPVYVPNFTQIF--RNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQG 224 (418) Q Consensus 147 ~~~~~~~~~~~N~tQIf--~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~G 224 (418) ...-.... .-..|+ .+.|++++-+... ...|-+..-......-+.+.+.+.++.--+. + T Consensus 71 ~~~lt~~~---~~a~i~~~~k~~~~tD~a~~~---~~~dp~~~~~~~~~~~~a~~~d~~~~~~l~~-----~-------- 131 (276) T protein:vir:10 71 VDKIETNR---REAKIHKIGKGTDITDEALLS---GYGDPQGEAVRQHGLAIANKVDNDVLEALRG-----T-------- 131 (276) T ss_pred ccccccce---eeEEeehccccccccHHHHHh---hccchHHHHHHHHHHHHHHHHHHHHHHHHhc-----c-------- Confidence 33322222 233333 4556666555443 3446666666667777788888776621110 0 Q ss_pred HHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcc-cceeec Q lcl|Aclame:pro 225 IVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQ-RETSYG 303 (418) Q Consensus 225 I~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~-~~~~~G 303 (418) ...+ +..+++.+.+.++.+++=+ . ....++++|++...-.|-+... .++.. ++...+ T Consensus 132 ---------~~~~----~~~~~t~d~i~~A~~~lgd----~-~~~~~~ivv~p~~~~~L~k~~~----~~f~~~s~~g~~ 189 (276) T protein:vir:10 132 ---------KLTV----SADIGTLAGLEAAIDTFDD----E-DLEPMVLFINPKDAGKLRSSAS----DNFTRATELGDN 189 (276) T ss_pred ---------cccc----cccccCHHHHHHHHHHhcc----c-cCcccEEEEcHHHHHHHHHhcc----cccccccccccc Confidence 0001 2235677877777766532 2 2356789999988777755321 11111 111111 Q ss_pred eEEE-EEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccccc Q lcl|Aclame:pro 304 MVFT-EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGG 382 (418) Q Consensus 304 ~~v~-~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~ 382 (418) +... .|-+..| +.|+.++. +|.++.+++.+..+.+.. +++...|..+..- +..|...+ T Consensus 190 ~~~~G~ig~~~G-~~Vi~s~~-----~p~~t~~l~~~gAi~~~~--~~~~~vE~dRd~~-------------~~~d~i~~ 248 (276) T protein:vir:10 190 IIVKGAFGEALG-AVIVRSKK-----LDEGEAILAKRGAVKLIT--KRDFFLETDRDPS-------------TKTTALYS 248 (276) T ss_pred ceeccccceecc-eeEEEcCC-----CCcceEEEEeccceeeee--cCCceeecccchh-------------hcccEEEE Confidence 1111 1223345 47777754 578999999998877543 4666666554332 22244333 Q ss_pred EEEEEEEEEEecccceEEeecCcccccccCCCC Q lcl|Aclame:pro 383 SLTSEWALELLNPQGCAVITGLQKAKERVYLTA 415 (418) Q Consensus 383 ~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~ 415 (418) ..+ |+..+.||.+..+|+ ++.-..|.-| T Consensus 249 ~~~--y~~~~~~~~~vv~~t---~~~~~~~~~~ 276 (276) T protein:vir:10 249 DKH--YVAYLYDESKAVKVT---KGAGTTDSGA 276 (276) T ss_pred eeE--EEEEEEcCcceEEEe---cCCcCCcCCC Confidence 333 788999999999886 4433344444 No 102 >protein:vir:1239 Length: 274 # NCBI annotation: similar to phage B1 major head protein # Family: family:all:522 # MgeID: mge:25 # MgeName: phi ETA # Cross-refs: genbank:acc:NP_510938;genbank:gi:17426272;genbank:GeneID:927376 Probab=27.21 E-value=1.9 Score=19.10 Aligned_cols=256 Identities=16% Similarity=0.106 Sum_probs=119.8 Q ss_pred EccccccccCceeEec----cC---ceEEEEEEec--CceeEEEccccccchhhhhCCceEEE-----eecc--cccccC Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNE----AT---GENMRLELVN--GLNLTVKRQTGRISAAIIAANTKLIV-----IGTA--FEEGSQ 144 (418) Q Consensus 81 V~~~~~~~~~~~~~~~----~~---~E~~~Vtav~--g~~~tv~rg~~~tta~~~~~gt~v~~-----~g~a--~~EGad 144 (418) -++...-..+.|+--. +. .+.++...+- ...+ . |. .|..|.+ +|.+ ..||.+ T Consensus 1 ma~~~T~l~d~iiPev~~~~v~~~~~~~l~~~~~~~~d~~l--~-g~---------~G~tv~iP~~~~ig~a~~~~~g~~ 68 (274) T protein:vir:12 1 MAQGLTKTSNQIIPEVLAPMMQAQLEKKLRFASFAEVDSTL--Q-GQ---------PGDTLTFPAFVYSGDAQVVAEGEK 68 (274) T ss_pred CCcceeehhhhhchHHHHHHHHHHHHhhhhhcccceecccc--c-CC---------CCCEEEEeeecCCCccccccCCCc Confidence 3332221111221100 00 0111111110 0001 0 11 2332222 1211 234444 Q ss_pred CcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHH Q lcl|Aclame:pro 145 RPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQG 224 (418) Q Consensus 145 a~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~G 224 (418) .+...-......--..|+ .+.|++++-+.+.. ..|-+.........-+.+.++..++.--+. ++ T Consensus 69 i~~~~lt~~~~~~~i~~~-~~~~~i~D~~~~~~---~~d~~~~~~~q~~~~~a~~vd~~~l~~~~~-----a~------- 132 (274) T protein:vir:12 69 IPTDILETKKREAKIRKI-AKGTSITDEALLSG---YGDPQGEQVRQHGLAHANKVDNDVLEALMG-----AK------- 132 (274) T ss_pred cchhhcccceeeEEeeee-cceeeecHHHHHhc---ccchHHHHHHHHHHHHHHHHHHHHHHHHhc-----cc------- Confidence 332222222221123442 56788887665542 345566666666677788888877632210 00 Q ss_pred HHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce-eec Q lcl|Aclame:pro 225 IVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET-SYG 303 (418) Q Consensus 225 I~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~-~~G 303 (418) ..+ ...+++.+.+.++.+++=+ . ....++++|++.....|-+... .++..... ..+ T Consensus 133 ----------~~~----~~~a~~~d~i~dA~~~lgd----~-~~~~~~ivv~p~~~~~L~k~~~----~~fv~~s~~g~~ 189 (274) T protein:vir:12 133 ----------LTV----NADITKLNGLQSAIDKFND----E-DLEPMVLFINPLDAGKLRGDAS----TNFTRATELGDD 189 (274) T ss_pred ----------ccc----cccccCHHHHHHHHHHhcc----c-cccccEEEeCHHHHHHHHhhhh----hhcccccccccc Confidence 001 1235788889998877522 2 2356799999998877765321 11111111 111 Q ss_pred eEEEE-EEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCcccccc Q lcl|Aclame:pro 304 MVFTE-WKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGG 382 (418) Q Consensus 304 ~~v~~-~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~ 382 (418) +...- |-+--| +.|+.++ .+|.++.+++-+..+.+. .+++...|..+..- ++.|...+ T Consensus 190 ~~~~G~ig~~~G-~~Vi~s~-----~~p~~t~~l~~~gA~~~~--~~~~~~vE~~Rd~~-------------~~~d~i~~ 248 (274) T protein:vir:12 190 IIVKGAFGEALG-AIIVRSN-----KLEAGTAILAKKGAVKLI--LKRDFFLEVARDAS-------------TKTTALYS 248 (274) T ss_pred ceecccceeecC-eeEEEeC-----CCCcceEEEEeccceeee--ecCCceeccccchh-------------hcccEEEe Confidence 11111 112234 4666664 468899999998877653 34666666655442 22344444 Q ss_pred EEEEEEEEEEecccceEEeecCccccccc Q lcl|Aclame:pro 383 SLTSEWALELLNPQGCAVITGLQKAKERV 411 (418) Q Consensus 383 ~i~~E~tLev~N~kA~a~I~gL~~~~~~~ 411 (418) ..+ |+..+-||.+..+|+- ..+--+- T Consensus 249 ~~~--y~~~~~~~~~vv~~t~-~~~~~~~ 274 (274) T protein:vir:12 249 DKH--YVAYLYDESKAVKITK-GSGSLEM 274 (274) T ss_pred eeE--EEEEEEcCCceEEEEc-CCccccC Confidence 433 7888999999998872 2221111 No 103 >protein:vir:107826 Length: 331 # NCBI annotation: hypothetical protein predicted by GeneMark # Family: family:all:1903 # MgeID: mge:1673 # MgeName: BIP-1 # Cross-refs: genbank:acc:NP_996627;genbank:gi:45580761;genbank:GeneID:2767902 Probab=25.18 E-value=2.1 Score=18.83 Aligned_cols=238 Identities=13% Similarity=0.048 Sum_probs=101.0 Q ss_pred cccceeEEEEEeecCceEEEEcccccc-cc-----CceeEe-ccCceEE---EEEEec---CceeEEEccccccchhhhh Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGL-TK-----GMIFYN-EATGENM---RLELVN---GLNLTVKRQTGRISAAIIA 127 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~-~~-----~~~~~~-~~~~E~~---~Vtav~---g~~~tv~rg~~~tta~~~~ 127 (418) |.....+ .+|..+.-+. .+ ..|++. .-..|++ .....| ++.-+|. + .+| T Consensus 1 m~~~~~~----------~~TL~e~Ak~~~~~~~l~~~IIE~l~~tn~IL~~lpf~e~N~~t~~~~~vr-----t---~LP 62 (331) T protein:vir:10 1 MPTLSTT----------NPTLADVAARMTPDGKIDPQIVEMLNETNEILDDMTVIEANGFTEHKTTVR-----S---GLP 62 (331) T ss_pred CCccccC----------cccHHHHHHhcCcchhHHHHHHHHHhcCchHHhhceeeeccCCccceeeEE-----e---ccC Confidence 2211111 1111111100 00 001110 0011221 111111 1121111 0 112 Q ss_pred CCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccch-HHHHHHHHHHHHHHHHhHHHhc Q lcl|Aclame:pro 128 ANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSN-ITESRRDCMDFHATEQETAIFF 206 (418) Q Consensus 128 ~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~de-la~q~~kk~~EikrdmE~a~i~ 206 (418) +..+..++ +|- .+....+.+++=.|=||.-.++|..-. .+..|...+ .+.|.+.+++-|..+++..||+ T Consensus 63 -~~~fR~lN----~g~---~~s~~tt~q~t~~l~ilgg~~eVDk~l--a~~~Gn~~~~ra~e~~~~ik~m~~~~~~~~iy 132 (331) T protein:vir:10 63 -TGTWRKLN----YGV---QPEKSRTVQVKDSMGMLETYAEVDKAL--ADLNGNSAAWRLSEDRAFIEGMNQTQATTLFY 132 (331) T ss_pred -CchhhccC----Ccc---CcccceeEEEEEEEEEeccceeechHH--HhhcCCHHHHHHHHHHHHHHHHHHHHHHHHhc Confidence 33443332 221 222333556667899999999999853 334455444 4889999999999999999999 Q ss_pred Cccccc--------------------------CcCCc--cc-------hhhHHHHHHHhh-------ccc---------- Q lcl|Aclame:pro 207 GQAFMG--------------------------TYNGQ--PL-------HTTQGIVDAVRQ-------YAP---------- 234 (418) Q Consensus 207 G~k~~~--------------------------~s~~~--~~-------r~t~GI~~~i~~-------~~~---------- 234 (418) |--..+ ++++. .+ ..+.||+.--.+ ..+ T Consensus 133 GD~a~~p~~F~GL~kR~~~~~a~~~~q~IdaGgtG~~~TSI~~v~~~~~~~~giyPkG~~~Gl~~~d~g~~~~~~~~G~~ 212 (331) T protein:vir:10 133 GDSSIDAEKFMGLTPRFNSLSAENGQNIIDAGGTGSDNASIWLTVWGPNTLHTIYPKGSQAGLQSRDLGEDTLIDAAGGR 212 (331) T ss_pred CCcccChhhhccchhhccccccccccceeecCCCCCCceEEEEEEEcCCeeEEecccccccCceEeecCceeeecCCCCe Confidence 842100 00000 00 112233210000 000 Q ss_pred -------------------------cCcccc--CCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhh Q lcl|Aclame:pro 235 -------------------------DNVNAM--PNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIG 287 (418) Q Consensus 235 -------------------------~nv~~~--~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~ 287 (418) .|.+.. ... +-+..+|.+++-++..+= .+.+....++||+.+....|.+-. T Consensus 213 y~~y~~~~~w~~Gl~i~d~r~v~ri~NIdvs~l~~~-~~~~~dl~~lm~~a~~~i-p~~~~~~~~~y~n~~v~~~L~~q~ 290 (331) T protein:vir:10 213 YQGYRTHYKWDIGLTLRDWRYVVRIANVDVSELTKN-ASAGADLIDLMTQAVELI-PNVGMGRPAFYMPRKIRSFLRRQI 290 (331) T ss_pred eeEEEEEEEeeeeeEEcCcccEEEEeccchhccCCC-cchhhhHHHHHHHHHHHh-cccCCCCeEEEechHHHHHHHHHH Confidence 011000 000 113355677776666541 112222246899999888887643 Q ss_pred hccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEE Q lcl|Aclame:pro 288 RFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVV 337 (418) Q Consensus 288 ~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~ 337 (418) ...++..+...+...|. .+|.|+-+.|....-+.+ . +..|+ T Consensus 291 ~~~~~~~~~~~~~~~g~----~~t~~~gipir~~dai~~---t--E~~Vv 331 (331) T protein:vir:10 291 TNKVAASTLTMEEIAGK----KVVAFDGIPCRRTDALLL---T--EARVV 331 (331) T ss_pred hhccceeeeeeeecCCc----ceeEECCeeEEEeeeeec---C--ccccC Confidence 22234444444455554 445566555554432211 1 22222 No 104 >protein:vir:107388 Length: 331 # NCBI annotation: Bbp17 # Family: family:all:1903 # MgeID: mge:1537 # MgeName: BPP-1 # Cross-refs: genbank:acc:NP_958686;genbank:gi:41179378;genbank:GeneID:2717182 Probab=25.18 E-value=2.1 Score=18.83 Aligned_cols=238 Identities=13% Similarity=0.048 Sum_probs=101.0 Q ss_pred cccceeEEEEEeecCceEEEEcccccc-cc-----CceeEe-ccCceEE---EEEEec---CceeEEEccccccchhhhh Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGL-TK-----GMIFYN-EATGENM---RLELVN---GLNLTVKRQTGRISAAIIA 127 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~-~~-----~~~~~~-~~~~E~~---~Vtav~---g~~~tv~rg~~~tta~~~~ 127 (418) |.....+ .+|..+.-+. .+ ..|++. .-..|++ .....| ++.-+|. + .+| T Consensus 1 m~~~~~~----------~~TL~e~Ak~~~~~~~l~~~IIE~l~~tn~IL~~lpf~e~N~~t~~~~~vr-----t---~LP 62 (331) T protein:vir:10 1 MPTLSTT----------NPTLADVAARMTPDGKIDPQIVEMLNETNEILDDMTVIEANGFTEHKTTVR-----S---GLP 62 (331) T ss_pred CCccccC----------cccHHHHHHhcCcchhHHHHHHHHHhcCchHHhhceeeeccCCccceeeEE-----e---ccC Confidence 2211111 1111111100 00 001110 0011221 111111 1121111 0 112 Q ss_pred CCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccch-HHHHHHHHHHHHHHHHhHHHhc Q lcl|Aclame:pro 128 ANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSN-ITESRRDCMDFHATEQETAIFF 206 (418) Q Consensus 128 ~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~de-la~q~~kk~~EikrdmE~a~i~ 206 (418) +..+..++ +|- .+....+.+++=.|=||.-.++|..-. .+..|...+ .+.|.+.+++-|..+++..||+ T Consensus 63 -~~~fR~lN----~g~---~~s~~tt~q~t~~l~ilgg~~eVDk~l--a~~~Gn~~~~ra~e~~~~ik~m~~~~~~~~iy 132 (331) T protein:vir:10 63 -TGTWRKLN----YGV---QPEKSRTVQVKDSMGMLETYAEVDKAL--ADLNGNSAAWRLSEDRAFIEGMNQTQATTLFY 132 (331) T ss_pred -CchhhccC----Ccc---CcccceeEEEEEEEEEeccceeechHH--HhhcCCHHHHHHHHHHHHHHHHHHHHHHHHhc Confidence 33443332 221 222333556667899999999999853 334455444 4889999999999999999999 Q ss_pred Cccccc--------------------------CcCCc--cc-------hhhHHHHHHHhh-------ccc---------- Q lcl|Aclame:pro 207 GQAFMG--------------------------TYNGQ--PL-------HTTQGIVDAVRQ-------YAP---------- 234 (418) Q Consensus 207 G~k~~~--------------------------~s~~~--~~-------r~t~GI~~~i~~-------~~~---------- 234 (418) |--..+ ++++. .+ ..+.||+.--.+ ..+ T Consensus 133 GD~a~~p~~F~GL~kR~~~~~a~~~~q~IdaGgtG~~~TSI~~v~~~~~~~~giyPkG~~~Gl~~~d~g~~~~~~~~G~~ 212 (331) T protein:vir:10 133 GDSSIDAEKFMGLTPRFNSLSAENGQNIIDAGGTGSDNASIWLTVWGPNTLHTIYPKGSQAGLQSRDLGEDTLIDAAGGR 212 (331) T ss_pred CCcccChhhhccchhhccccccccccceeecCCCCCCceEEEEEEEcCCeeEEecccccccCceEeecCceeeecCCCCe Confidence 842100 00000 00 112233210000 000 Q ss_pred -------------------------cCcccc--CCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhh Q lcl|Aclame:pro 235 -------------------------DNVNAM--PNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIG 287 (418) Q Consensus 235 -------------------------~nv~~~--~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~ 287 (418) .|.+.. ... +-+..+|.+++-++..+= .+.+....++||+.+....|.+-. T Consensus 213 y~~y~~~~~w~~Gl~i~d~r~v~ri~NIdvs~l~~~-~~~~~dl~~lm~~a~~~i-p~~~~~~~~~y~n~~v~~~L~~q~ 290 (331) T protein:vir:10 213 YQGYRTHYKWDIGLTLRDWRYVVRIANVDVSELTKN-ASAGADLIDLMTQAVELI-PNVGMGRPAFYMPRKIRSFLRRQI 290 (331) T ss_pred eeEEEEEEEeeeeeEEcCcccEEEEeccchhccCCC-cchhhhHHHHHHHHHHHh-cccCCCCeEEEechHHHHHHHHHH Confidence 011000 000 113355677776666541 112222246899999888887643 Q ss_pred hccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEE Q lcl|Aclame:pro 288 RFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVV 337 (418) Q Consensus 288 ~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~ 337 (418) ...++..+...+...|. .+|.|+-+.|....-+.+ . +..|+ T Consensus 291 ~~~~~~~~~~~~~~~g~----~~t~~~gipir~~dai~~---t--E~~Vv 331 (331) T protein:vir:10 291 TNKVAASTLTMEEIAGK----KVVAFDGIPCRRTDALLL---T--EARVV 331 (331) T ss_pred hhccceeeeeeeecCCc----ceeEECCeeEEEeeeeec---C--ccccC Confidence 22234444444455554 445566555554432211 1 22222 No 105 >protein:vir:98525 Length: 331 # NCBI annotation: hypothetical protein predicted by GeneMark # Family: family:all:1903 # MgeID: mge:1592 # MgeName: BMP-1 # Cross-refs: genbank:acc:NP_996579;genbank:gi:45569510;genbank:GeneID:2767853 Probab=25.18 E-value=2.1 Score=18.83 Aligned_cols=238 Identities=13% Similarity=0.048 Sum_probs=101.0 Q ss_pred cccceeEEEEEeecCceEEEEcccccc-cc-----CceeEe-ccCceEE---EEEEec---CceeEEEccccccchhhhh Q lcl|Aclame:pro 61 MVFASAVVTAEAAADATVLTVENSDGL-TK-----GMIFYN-EATGENM---RLELVN---GLNLTVKRQTGRISAAIIA 127 (418) Q Consensus 61 ~~~~~~t~~a~~~a~~t~~tV~~~~~~-~~-----~~~~~~-~~~~E~~---~Vtav~---g~~~tv~rg~~~tta~~~~ 127 (418) |.....+ .+|..+.-+. .+ ..|++. .-..|++ .....| ++.-+|. + .+| T Consensus 1 m~~~~~~----------~~TL~e~Ak~~~~~~~l~~~IIE~l~~tn~IL~~lpf~e~N~~t~~~~~vr-----t---~LP 62 (331) T protein:vir:98 1 MPTLSTT----------NPTLADVAARMTPDGKIDPQIVEMLNETNEILDDMTVIEANGFTEHKTTVR-----S---GLP 62 (331) T ss_pred CCccccC----------cccHHHHHHhcCcchhHHHHHHHHHhcCchHHhhceeeeccCCccceeeEE-----e---ccC Confidence 2211111 1111111100 00 001110 0011221 111111 1121111 0 112 Q ss_pred CCceEEEeecccccccCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccch-HHHHHHHHHHHHHHHHhHHHhc Q lcl|Aclame:pro 128 ANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSN-ITESRRDCMDFHATEQETAIFF 206 (418) Q Consensus 128 ~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~de-la~q~~kk~~EikrdmE~a~i~ 206 (418) +..+..++ +|- .+....+.+++=.|=||.-.++|..-. .+..|...+ .+.|.+.+++-|..+++..||+ T Consensus 63 -~~~fR~lN----~g~---~~s~~tt~q~t~~l~ilgg~~eVDk~l--a~~~Gn~~~~ra~e~~~~ik~m~~~~~~~~iy 132 (331) T protein:vir:98 63 -TGTWRKLN----YGV---QPEKSRTVQVKDSMGMLETYAEVDKAL--ADLNGNSAAWRLSEDRAFIEGMNQTQATTLFY 132 (331) T ss_pred -CchhhccC----Ccc---CcccceeEEEEEEEEEeccceeechHH--HhhcCCHHHHHHHHHHHHHHHHHHHHHHHHhc Confidence 33443332 221 222333556667899999999999853 334455444 4889999999999999999999 Q ss_pred Cccccc--------------------------CcCCc--cc-------hhhHHHHHHHhh-------ccc---------- Q lcl|Aclame:pro 207 GQAFMG--------------------------TYNGQ--PL-------HTTQGIVDAVRQ-------YAP---------- 234 (418) Q Consensus 207 G~k~~~--------------------------~s~~~--~~-------r~t~GI~~~i~~-------~~~---------- 234 (418) |--..+ ++++. .+ ..+.||+.--.+ ..+ T Consensus 133 GD~a~~p~~F~GL~kR~~~~~a~~~~q~IdaGgtG~~~TSI~~v~~~~~~~~giyPkG~~~Gl~~~d~g~~~~~~~~G~~ 212 (331) T protein:vir:98 133 GDSSIDAEKFMGLTPRFNSLSAENGQNIIDAGGTGSDNASIWLTVWGPNTLHTIYPKGSQAGLQSRDLGEDTLIDAAGGR 212 (331) T ss_pred CCcccChhhhccchhhccccccccccceeecCCCCCCceEEEEEEEcCCeeEEecccccccCceEeecCceeeecCCCCe Confidence 842100 00000 00 112233210000 000 Q ss_pred -------------------------cCcccc--CCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhh Q lcl|Aclame:pro 235 -------------------------DNVNAM--PNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIG 287 (418) Q Consensus 235 -------------------------~nv~~~--~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~ 287 (418) .|.+.. ... +-+..+|.+++-++..+= .+.+....++||+.+....|.+-. T Consensus 213 y~~y~~~~~w~~Gl~i~d~r~v~ri~NIdvs~l~~~-~~~~~dl~~lm~~a~~~i-p~~~~~~~~~y~n~~v~~~L~~q~ 290 (331) T protein:vir:98 213 YQGYRTHYKWDIGLTLRDWRYVVRIANVDVSELTKN-ASAGADLIDLMTQAVELI-PNVGMGRPAFYMPRKIRSFLRRQI 290 (331) T ss_pred eeEEEEEEEeeeeeEEcCcccEEEEeccchhccCCC-cchhhhHHHHHHHHHHHh-cccCCCCeEEEechHHHHHHHHHH Confidence 011000 000 113355677776666541 112222246899999888887643 Q ss_pred hccceEEEcccceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEE Q lcl|Aclame:pro 288 RFFGEVTVTQRETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVV 337 (418) Q Consensus 288 ~~~~~~~~~~~~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~ 337 (418) ...++..+...+...|. .+|.|+-+.|....-+.+ . +..|+ T Consensus 291 ~~~~~~~~~~~~~~~g~----~~t~~~gipir~~dai~~---t--E~~Vv 331 (331) T protein:vir:98 291 TNKVAASTLTMEEIAGK----KVVAFDGIPCRRTDALLL---T--EARVV 331 (331) T ss_pred hhccceeeeeeeecCCc----ceeEECCeeEEEeeeeec---C--ccccC Confidence 22234444444455554 445566555554432211 1 22222 No 106 >protein:vir:81160 Length: 371 # NCBI annotation: major capsid protein # Family: family:all:21 # MgeID: mge:1892 # MgeName: Geobacillus virus E2 # Cross-refs: genbank:acc:YP_001285811;genbank:gi:148747732;genbank:GeneID:5247203 Probab=23.69 E-value=2.3 Score=18.63 Aligned_cols=297 Identities=11% Similarity=0.034 Sum_probs=105.8 Q ss_pred Ccceeeeecc-CCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEE Q lcl|Aclame:pro 1 MSVYAGIFNT-TLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVL 79 (418) Q Consensus 1 ~~~~~~~~~~-~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~ 79 (418) .++....-.. .+...+-.++.+... | +.+ -. ..+ +. -+.+.+.. T Consensus 57 ~~~~~~~~~~~~~~~~~~~~~~~~~~--------------l-~~~-~~-----------~a~-------~~-~t~~~gg~ 101 (371) T protein:vir:81 57 QTIEDKEPLKPTVQVKENEVEAFVNH--------------I-RTR-FR-----------NAM-------SE-GSNQDGGY 101 (371) T ss_pred HhhccccccccchhhHHHHHHHHHHH--------------H-HHH-HH-----------Hhh-------cc-CCCccCce Confidence 1010000000 000010011111100 0 000 00 000 00 00011111 Q ss_pred EEccccccccCceeEeccCce----EEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccc Q lcl|Aclame:pro 80 TVENSDGLTKGMIFYNEATGE----NMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQP 153 (418) Q Consensus 80 tV~~~~~~~~~~~~~~~~~~E----~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~ 153 (418) .|. ..+. ..|+......- .+.+..+.+.. ..+.+...+..+ .|. .||++.++... T Consensus 102 ~vP--~~~~-~~ii~~~~~~s~i~~~~~~~~~~~~~~~~~~~~~~~~~~a-------~~v------~Eg~~~~~~~~--- 162 (371) T protein:vir:81 102 TVP--QDIQ-TRINELRESKDALQNLITVEPVTTLSGSRVFKKRSQQTGF-------VEV------AEGAAIGEKAT--- 162 (371) T ss_pred eec--HhHH-HHHHHHHHhhhhhhhhceeeeccCCceeEEEEeecCCcce-------eee------ccccccccccc--- Confidence 111 0010 01111001111 12233344433 223322222111 111 46655442211 Q ss_pred eeccceeEEEeeeeeec----hhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHH Q lcl|Aclame:pro 154 VYVPNFTQIFRNAWALT----DTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAV 229 (418) Q Consensus 154 ~~~~N~tQIf~~~v~VS----gTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i 229 (418) ..+.||--+...+. =|.+...... .+-.+|-...-...+.+.+|.++++|... +. T Consensus 163 ---~~f~~i~~~~~k~~~~~~iS~ell~ds~-~~l~~~i~~~l~~a~~~~~~~~i~~g~g~----~~------------- 221 (371) T protein:vir:81 163 ---PQFTLLQYQVKKYAGFFRVTNELLNDST-EAIVNTLVRWIGDESRVTRNGLIINVLNT----KA------------- 221 (371) T ss_pred ---cceeeEEeeeeEEEEeehhhHHHHhhhh-HHHHHHHHHHHHHHHHHHHHHHHHhhccc----cc------------- Confidence 13344433333333 2333333211 23234444444556788889999987542 11 Q ss_pred hhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc------ceeec Q lcl|Aclame:pro 230 RQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR------ETSYG 303 (418) Q Consensus 230 ~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~------~~~~G 303 (418) ..+..+.+++.+++...-......+ ..+++++.....|.++...+|++-+... ..-+| T Consensus 222 ------------~~~~~~~~~i~~~~~~~l~~~~~~~----a~~vmn~~~~~~L~~lkd~~g~~l~~~~~~~~~~~~l~G 285 (371) T protein:vir:81 222 ------------KTAIADLDGLKQIINVQLDPVFRST----SSVIVNQDAFNWLDTLKDQNGQYLLQPSISSPTGRQLLG 285 (371) T ss_pred ------------ccccccHHHHHHHHHhhcchhhhcC----CEEEEcHHHHHHHHHhhccCCCeeeecccCCCCCceecc Confidence 0112334445554432211111111 2467888778888887544555544321 12233 Q ss_pred eEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhh-ceeeeccCCCcccccccccCccccccccccccccCcccccc Q lcl|Aclame:pro 304 MVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGG 382 (418) Q Consensus 304 ~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~ 382 (418) .-| +.++.--+ ........+.+...+++-|+.. +.+..- .++..+.....+. + + ..|.... T Consensus 286 ~pV--~~~~~~~~---~~~~~~~~~~~~~~i~~Gd~~~~~~~~~~--~~~~i~~~~~~~~--~-f--------~~~~v~~ 347 (371) T protein:vir:81 286 LPV--VIVSNKVL---ANRVDGGTGAQFAPIIVGDLKEAVVMFDR--QRTEIMSSNVAMD--A-F--------ETDATLW 347 (371) T ss_pred eeE--EEeccccc---CccccccccCCcceEEEEehhceEEEEee--cceEEEEeccccc--h-h--------hcCceEE Confidence 322 33332100 0000001112234667777654 222111 1221111111110 0 0 0033444 Q ss_pred EEEEEEEEEEecccceEEeecCccc Q lcl|Aclame:pro 383 SLTSEWALELLNPQGCAVITGLQKA 407 (418) Q Consensus 383 ~i~~E~tLev~N~kA~a~I~gL~~~ 407 (418) +....+.+.+++|+|..+++ +++| T Consensus 348 ~~~~r~d~~~~~~~a~~~~~-~~~A 371 (371) T protein:vir:81 348 RAIERMDVKMRDDEAFVFGE-VQLA 371 (371) T ss_pred EEEEeeccEEecccceEEEE-EecC Confidence 56666799999999999998 8888 No 107 >protein:vir:1025 Length: 408 # NCBI annotation: capsid protein # Family: family:all:21 # MgeID: mge:20 # MgeName: bIL286 # Cross-refs: genbank:acc:NP_076679;genbank:gi:13095788;genbank:GeneID:920362 Probab=22.40 E-value=2.5 Score=18.45 Aligned_cols=318 Identities=15% Similarity=0.102 Sum_probs=114.8 Q ss_pred Ccceeeeec-cCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEE Q lcl|Aclame:pro 1 MSVYAGIFN-TTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVL 79 (418) Q Consensus 1 ~~~~~~~~~-~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~ 79 (418) -..-....+ ......+--.+.+...+. ... -.+... .. + + + .+ .+.++.-. T Consensus 75 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~--~~~--~~~~~~-~~-~---a-----------~-------~~-~t~~~gg~ 126 (408) T protein:vir:10 75 REEEKGPLNKSENELKDKFVKDFVNMVR--NPM--AFMNTV-SS-K---T-----------E-------TS-GSDSAAGL 126 (408) T ss_pred ccccccccccchhhhHHHHHHHHHHHhh--cch--hhhhhh-hh-h---h-----------h-------hc-ccccCCce Confidence 000000000 111111111122222111 111 111111 00 0 0 0 00 00001111 Q ss_pred EEccccccccCceeEeccCc----eEEEEEEecCc--eeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccc Q lcl|Aclame:pro 80 TVENSDGLTKGMIFYNEATG----ENMRLELVNGL--NLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQP 153 (418) Q Consensus 80 tV~~~~~~~~~~~~~~~~~~----E~~~Vtav~g~--~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~ 153 (418) .|. ..+. ..|+...... ..+.+..+.+. ++.+.+...++ + ...|. .||+..+.... T Consensus 127 ~vP--~~~~-~~Ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~-~-----~a~~v------~E~~~~~~~~~--- 188 (408) T protein:vir:10 127 TIP--QDIR-TMINTLVRQYDSLQQYVRVESVSTSNGSRVYEKWTDVT-P-----LTVMD------AEDGKIPDLDN--- 188 (408) T ss_pred ecc--HhHH-HHHHHHHHhhchhhhhcceeeccCCcceEEEeeccccc-c-----ceeee------cCccccccccC--- Confidence 111 0010 0111000000 01112222221 12222221111 0 11122 45655442211 Q ss_pred eeccceeEE----EeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHH Q lcl|Aclame:pro 154 VYVPNFTQI----FRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAV 229 (418) Q Consensus 154 ~~~~N~tQI----f~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i 229 (418) ..+.|| ++-...+.-|.+..+.. ..+-..+-...-...+.+.+|.+||+|... + ++ T Consensus 189 ---~~~~~i~~~~~k~~~~~~iS~ell~ds-~~~l~~~i~~~l~~~~~~~~~~~il~g~g~----~-~~----------- 248 (408) T protein:vir:10 189 ---PQLTIIKYLIKRYAGIITATNTSLKDT-AENILAWLSSWIAKKVVVTRNQAIIEVMKA----A-PK----------- 248 (408) T ss_pred ---cceeeEEeeeeeEEeeehhHHHHHhhc-hHHHHHHHHHHHHHHHHHHHHHHHhhcccc----c-cc----------- Confidence 123333 22222333344444332 223344445555566778888888877541 1 11 Q ss_pred hhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEE Q lcl|Aclame:pro 230 RQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEW 309 (418) Q Consensus 230 ~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~ 309 (418) .++..+.+++.+++..........+ ..+++++....+|.++...+|++.+...-.. |. - T Consensus 249 ------------~~~~~~~~~l~~~~~~~~~~~~~~~----a~~v~n~~~~~~l~~lkd~~G~~i~~~~~~~-~~----~ 307 (408) T protein:vir:10 249 ------------KPTIAKFDDVITMINTAVDPAIIAT----SSLLTNQSGLNKLALVKTAEGKYLLEPDPTK-PN----S 307 (408) T ss_pred ------------ccccccHHHHHHHHHHhhhhhhccC----CEEEEcHHHHHHHHHhhccCCceEeccCcCC-CC----C Confidence 1123456677776644333322222 3577898888889888655666554321110 10 0 Q ss_pred EcCCeE-EEEEECccccccCCCCCeEEEEchhhc-eeeeccCCCcccccccccCccccccccccccccCccccccEEEEE Q lcl|Aclame:pro 310 KFFKGR-LILKEHPLFSAIGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSE 387 (418) Q Consensus 310 ~SdfG~-v~vv~n~~l~~~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E 387 (418) .+=+|. |.+..+..+...+.....+++.|+... .+..- .+...+.....+.. .-.|........- T Consensus 308 ~~l~G~PV~~~~~~~~~~~~~~~~~i~~gd~~~~~~~~~~--~~~~v~~~~~~~~~-----------f~~~~~~~r~~~r 374 (408) T protein:vir:10 308 YLIKGKQVIVVADRWLPNTGSTVYPLYYGDMSQAITLFDR--ENMSLLPTNIGAGA-----------FETDTTKIRVIDR 374 (408) T ss_pred ceecceeeEEecccccCccCCCceEEEEEehhccEEEEEe--cceEEEEcccccch-----------hhcCceEEEEEEe Confidence 011342 223223333222222123566687642 22211 11111111111100 0002333345555 Q ss_pred EEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 388 WALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 388 ~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) +...+.+|+|+.+++--..+.+......|+. T Consensus 375 ~d~~v~~~~a~~~~~~~~~~~~~~~~~~~~~ 405 (408) T protein:vir:10 375 FDVKATDSEALVAGSFSAIADQVGNFKTTTS 405 (408) T ss_pred eccEEeccccEEEEEeeccccCCCCCCCCCc Confidence 8999999999988876655544433334443 No 108 >protein:vir:101607 Length: 379 # NCBI annotation: major capsid protein precursor # Family: family:all:585 # MgeID: mge:1646 # MgeName: 11b # Cross-refs: genbank:acc:YP_112497;genbank:gi:53793597;uniprot:Q5ZGF6;genbank:GeneID:3101715 Probab=22.19 E-value=2.5 Score=18.42 Aligned_cols=305 Identities=11% Similarity=-0.032 Sum_probs=101.6 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) .+......+..+....-+++.... .+.......+- -+.....+.....+-.+... .-.. . T Consensus 71 ~~~~~~~~~~~~~~~~~~~~~~~~--~~~~~~~~~~~-----~~~~~~~~~~~~~ip~~~~~------------~ii~-~ 130 (379) T protein:vir:10 71 KAKSEDKSDSLVKSITENFNDIKE--VRNGKSIQVKA-----VGDMTLPVNLTGAQPKDYNF------------DVVL-N 130 (379) T ss_pred cccccccchhHHHHHHHHHHhHHH--HHhhhhhhhhh-----hcccccCCCCccccchhhhh------------HHHH-h Confidence 111111111100000000000000 00000000000 00000000000000000000 0000 0 Q ss_pred EccccccccCceeEeccCceEEEEEEecCceeEEEccccccchhhhhCCceEEEeecccccccCCcCcccccceecccee Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATGENMRLELVNGLNLTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPVYVPNFT 160 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~E~~~Vtav~g~~~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~~~~N~t 160 (418) +.....+. -.+.+..+.+..+++-+..+.+.++.. | ..||.+.|..... ...+. . T Consensus 131 ~~~~~~i~-----------~~~~~~~~~~~~~~~~~~~~~~~~~~~-----~------v~Eg~~~~~~~~~-f~~i~--~ 185 (379) T protein:vir:10 131 PSQMLNVS-----------DIVGAVSISGGTYTFVRENGAGEGAIG-----A------QVEGATKGQKDYD-ISMID--V 185 (379) T ss_pred HHhhhhHH-----------hhceeeeccCCceEEEEeecCCCcccc-----c------ccCCccccccccc-eeeeE--e Confidence 00000000 001111122222222222111111111 1 1355554432111 11111 1 Q ss_pred EEEeeeeeechhHHHHhhhcccchHHHHHHH-HHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccccCccc Q lcl|Aclame:pro 161 QIFRNAWALTDTARASYAEAGYSNITESRRD-CMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAPDNVNA 239 (418) Q Consensus 161 QIf~~~v~VSgTa~Av~~~g~~dela~q~~k-k~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~~nv~~ 239 (418) .+++-...+.=|.+...-.. . +...+.+ -...+.+-++.+|+.|... +++ .+ . T Consensus 186 ~~~k~~~~~~iS~ell~D~~--~-l~~~i~~~la~~~~~~~~~~~~~g~~~----~~~-----~~------------~-- 239 (379) T protein:vir:10 186 NTDFIAGFTRYSKKMANNLP--F-LTSFIPNALRRDYAKAENAAFNAVLAA----NAT-----AS------------T-- 239 (379) T ss_pred eeeeEEeeehhhHHHHhhHH--H-HHHHHHHHHHHHHHHHHHHHHhccccc----ccc-----cc------------c-- Confidence 11111111122233333221 1 2222222 2234456667777765421 100 00 0 Q ss_pred cCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccce-eeceEEEEEEcCCeEEEE Q lcl|Aclame:pro 240 MPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRET-SYGMVFTEWKFFKGRLIL 318 (418) Q Consensus 240 ~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~-~~G~~v~~~~SdfG~v~v 318 (418) .+.....+.+++.+++.++-..+... ..+++++.....|.++...+|++.....-. ..|.. .+=+| +.| T Consensus 240 ~~~~~~~~~d~i~~~~~~~~~~~~~~-----~~~vmn~~~~~~l~~lkd~~G~~l~~~~~~~~~~~~----~~l~G-~pv 309 (379) T protein:vir:10 240 EIITNKNKVEMLINEIAKQENLDFPV-----TAIVLRPTDYYDILVTQKSVGAGYGLPGVVTQDNGV----LRING-IPL 309 (379) T ss_pred ccccCcccHHHHHHHHHhhhhccCCC-----CEEEEcHHHHHHHHHhhccCCceeccCCccCCCCCc----ceecc-eee Confidence 01112334566666665554332222 246678887788888765566654432111 01100 01124 355 Q ss_pred EECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEEEEEEEecccce Q lcl|Aclame:pro 319 KEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSEWALELLNPQGC 398 (418) Q Consensus 319 v~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E~tLev~N~kA~ 398 (418) +.++ +||++++++.|.+.+.+.+- ++...+.....+. .+ ..|-.......-+.+.+++|.|+ T Consensus 310 v~s~-----~~~ag~~~~gdf~~~~~~~~--~~~~i~~~~~~~~---~f--------~~~~~~~r~~~R~~~~v~~p~a~ 371 (379) T protein:vir:10 310 FRAT-----WLAANKYYVGDWTRVTKVTT--EGLSLEFSEVEGT---NF--------VKNNITARIEAQVALAVEQPAAL 371 (379) T ss_pred EecC-----CCCCCceEEeecccEEEEEE--eceEEEEeecccc---cc--------cCCcEEEEEEEEeccEEecCccE Confidence 5554 46889999999988654332 2222121111110 00 00333334446788999999998 Q ss_pred EE--eecC Q lcl|Aclame:pro 399 AV--ITGL 404 (418) Q Consensus 399 a~--I~gL 404 (418) .+ ++.+ T Consensus 372 v~~~~~~~ 379 (379) T protein:vir:10 372 IFGDFTAV 379 (379) T ss_pred EEEEecCC Confidence 77 4444 No 109 >protein:vir:107593 Length: 392 # NCBI annotation: major capsid protein, HK97 family # Family: family:all:21 # MgeID: mge:1491 # MgeName: Gamma # Cross-refs: genbank:acc:YP_338188;genbank:gi:77020144;genbank:GeneID:3703724 Probab=21.06 E-value=2.7 Score=18.25 Aligned_cols=300 Identities=11% Similarity=0.059 Sum_probs=104.9 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) -+.+..+-+..++..+ +.+..... -.. .+.. .+.++..+. T Consensus 78 ~~~~~~l~~~~~~~~~---~~~~~~~~----------~~~-~~~~--------------------------~t~~~gg~~ 117 (392) T protein:vir:10 78 DVFMKALRNKPLNAEE---REFLEDDL----------EQR-AMSG--------------------------LTGEDGGLV 117 (392) T ss_pred HHHHHHHhcccccHHH---HHHHhhhh----------hhh-hccc--------------------------cccCCCcee Confidence 1111111112222221 11111100 000 0000 000111111 Q ss_pred EccccccccCceeEeccCc----eEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccce Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATG----ENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPV 154 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~----E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~ 154 (418) |.. .+. ..|+...... -.+.+..|.+.. +.+.+...+..+ .|. .||+..+......-. T Consensus 118 vP~--~~~-~~ii~~~~~~s~l~~~~~~~~~~~~~~~~~~~~~~~~~~a-------~~v------~E~~~~~~~~~~~~~ 181 (392) T protein:vir:10 118 IPQ--DIQ-TQINELARSFDALEQYVTVEPVRTRSGSRVLEKNSDMIPF-------AEI------TEMGEIPETDNPKFS 181 (392) T ss_pred cch--hHH-HHHHHHHHhhhhhhhhceeeeccCCceeEEEEeecCCccc-------eee------cccccccccccccce Confidence 110 000 0011000000 112344444332 222222222221 121 355544321111111 Q ss_pred eccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccc Q lcl|Aclame:pro 155 YVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAP 234 (418) Q Consensus 155 ~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~ 234 (418) .+.=-..-+...+.|| .+..... ..+..++-...-...+.+.++.++++|... + + T Consensus 182 ~v~l~~~k~~~~~~iS--~ell~ds-~~~l~~~i~~~l~~~i~~~~d~~~~~g~g~----~-~----------------- 236 (392) T protein:vir:10 182 NVQYAVKDRAGILPLS--RSLLQDS-DQNILKYVTKWLGKKSKVTRNVLILGVIEK----L-T----------------- 236 (392) T ss_pred eEEeeeeeEEEeehhh--HHHHhhh-HHHHHHHHHHHHHHHHHHHHHHHHhhcccc----c-c----------------- Confidence 1110111122223333 3333321 123334444444555677788888765531 0 0 Q ss_pred cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCe Q lcl|Aclame:pro 235 DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKG 314 (418) Q Consensus 235 ~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG 314 (418) ..+..+.+++.+++..........+ ..+++++....+|.++...+|++-+...-.. |. -.+=+| T Consensus 237 -------~~~~~~~d~i~~~~~~~l~~~~~~~----a~~vm~~~~~~~L~~lkd~~G~~l~~~~~~~-~~----~~tllG 300 (392) T protein:vir:10 237 -------KQAIKSLDDIKDVLNVKLDPAISPN----AILLTNQDGFNYLDKLKDKDGKYILQSDPTQ-KN----KKLFAG 300 (392) T ss_pred -------ccCccCHHHHHHHHHHhhhhhhccC----CEEEEcHHHHHHHHHhhccCCCeEeecCccC-Cc----cccccC Confidence 1123556777776643333332222 2477888888889887555566554321100 00 001133 Q ss_pred EEEEE--ECccccccCC--CCCeEEEEchhh-ceeeeccCCCcccccccccCccccccccccccccCccccc----cEEE Q lcl|Aclame:pro 315 RLILK--EHPLFSAIGI--SPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQG----GSLT 385 (418) Q Consensus 315 ~v~vv--~n~~l~~~~m--p~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k----~~i~ 385 (418) .--++ .+..+...+. ....+++-|++. +.+..- .+...+.....+ .++.+ ...+ T Consensus 301 ~~~v~~~~~~~~~~~~~~~~~~~~~~gdfs~~~~i~~~--~~~~~~~~~~~~---------------~~f~~~~~~~r~~ 363 (392) T protein:vir:10 301 TNPVVVVSNRFLKSKGTTAKKAPLIIGDLKEAIVLFKR--EDMELASTDVGG---------------KAFTRNTLDLRAI 363 (392) T ss_pred cccEEEecccccCCCcccCCceEEEEEehhceEEEEee--cceEEEEecccc---------------chhhcCceEEEEE Confidence 21111 1221111111 112345556653 222111 111111111111 02233 3444 Q ss_pred EEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 386 SEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 386 ~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) .-+...+++++|+.+++.=.++ |...|+- T Consensus 364 ~r~d~~v~~~~a~~~l~~~~~a----~~~~~~~ 392 (392) T protein:vir:10 364 QRDDVQMWDNEAAVYGEIDLSA----PVEQPQG 392 (392) T ss_pred EeeccEEecccceEEEEecccc----cccCCCC Confidence 5578899999999998544333 3333444 No 110 >protein:vir:102082 Length: 392 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:1503 # MgeName: Fah # Cross-refs: genbank:acc:YP_512315;genbank:gi:89152484;genbank:GeneID:3953075 Probab=21.06 E-value=2.7 Score=18.25 Aligned_cols=300 Identities=11% Similarity=0.059 Sum_probs=104.9 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) -+.+..+-+..++..+ +.+..... -.. .+.. .+.++..+. T Consensus 78 ~~~~~~l~~~~~~~~~---~~~~~~~~----------~~~-~~~~--------------------------~t~~~gg~~ 117 (392) T protein:vir:10 78 DVFMKALRNKPLNAEE---REFLEDDL----------EQR-AMSG--------------------------LTGEDGGLV 117 (392) T ss_pred HHHHHHHhcccccHHH---HHHHhhhh----------hhh-hccc--------------------------cccCCCcee Confidence 1111111112222221 11111100 000 0000 000111111 Q ss_pred EccccccccCceeEeccCc----eEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccce Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATG----ENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPV 154 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~----E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~ 154 (418) |.. .+. ..|+...... -.+.+..|.+.. +.+.+...+..+ .|. .||+..+......-. T Consensus 118 vP~--~~~-~~ii~~~~~~s~l~~~~~~~~~~~~~~~~~~~~~~~~~~a-------~~v------~E~~~~~~~~~~~~~ 181 (392) T protein:vir:10 118 IPQ--DIQ-TQINELARSFDALEQYVTVEPVRTRSGSRVLEKNSDMIPF-------AEI------TEMGEIPETDNPKFS 181 (392) T ss_pred cch--hHH-HHHHHHHHhhhhhhhhceeeeccCCceeEEEEeecCCccc-------eee------cccccccccccccce Confidence 110 000 0011000000 112344444332 222222222221 121 355544321111111 Q ss_pred eccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccc Q lcl|Aclame:pro 155 YVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAP 234 (418) Q Consensus 155 ~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~ 234 (418) .+.=-..-+...+.|| .+..... ..+..++-...-...+.+.++.++++|... + + T Consensus 182 ~v~l~~~k~~~~~~iS--~ell~ds-~~~l~~~i~~~l~~~i~~~~d~~~~~g~g~----~-~----------------- 236 (392) T protein:vir:10 182 NVQYAVKDRAGILPLS--RSLLQDS-DQNILKYVTKWLGKKSKVTRNVLILGVIEK----L-T----------------- 236 (392) T ss_pred eEEeeeeeEEEeehhh--HHHHhhh-HHHHHHHHHHHHHHHHHHHHHHHHhhcccc----c-c----------------- Confidence 1110111122223333 3333321 123334444444555677788888765531 0 0 Q ss_pred cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCe Q lcl|Aclame:pro 235 DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKG 314 (418) Q Consensus 235 ~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG 314 (418) ..+..+.+++.+++..........+ ..+++++....+|.++...+|++-+...-.. |. -.+=+| T Consensus 237 -------~~~~~~~d~i~~~~~~~l~~~~~~~----a~~vm~~~~~~~L~~lkd~~G~~l~~~~~~~-~~----~~tllG 300 (392) T protein:vir:10 237 -------KQAIKSLDDIKDVLNVKLDPAISPN----AILLTNQDGFNYLDKLKDKDGKYILQSDPTQ-KN----KKLFAG 300 (392) T ss_pred -------ccCccCHHHHHHHHHHhhhhhhccC----CEEEEcHHHHHHHHHhhccCCCeEeecCccC-Cc----cccccC Confidence 1123556777776643333332222 2477888888889887555566554321100 00 001133 Q ss_pred EEEEE--ECccccccCC--CCCeEEEEchhh-ceeeeccCCCcccccccccCccccccccccccccCccccc----cEEE Q lcl|Aclame:pro 315 RLILK--EHPLFSAIGI--SPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQG----GSLT 385 (418) Q Consensus 315 ~v~vv--~n~~l~~~~m--p~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k----~~i~ 385 (418) .--++ .+..+...+. ....+++-|++. +.+..- .+...+.....+ .++.+ ...+ T Consensus 301 ~~~v~~~~~~~~~~~~~~~~~~~~~~gdfs~~~~i~~~--~~~~~~~~~~~~---------------~~f~~~~~~~r~~ 363 (392) T protein:vir:10 301 TNPVVVVSNRFLKSKGTTAKKAPLIIGDLKEAIVLFKR--EDMELASTDVGG---------------KAFTRNTLDLRAI 363 (392) T ss_pred cccEEEecccccCCCcccCCceEEEEEehhceEEEEee--cceEEEEecccc---------------chhhcCceEEEEE Confidence 21111 1221111111 112345556653 222111 111111111111 02233 3444 Q ss_pred EEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 386 SEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 386 ~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) .-+...+++++|+.+++.=.++ |...|+- T Consensus 364 ~r~d~~v~~~~a~~~l~~~~~a----~~~~~~~ 392 (392) T protein:vir:10 364 QRDDVQMWDNEAAVYGEIDLSA----PVEQPQG 392 (392) T ss_pred EeeccEEecccceEEEEecccc----cccCCCC Confidence 5578899999999998544333 3333444 No 111 >protein:vir:105004 Length: 392 # NCBI annotation: putative major capsid protein # Family: family:all:21 # MgeID: mge:1490 # MgeName: W Beta # Cross-refs: genbank:acc:YP_459969;genbank:gi:85701384;genbank:GeneID:3882145 Probab=21.06 E-value=2.7 Score=18.25 Aligned_cols=300 Identities=11% Similarity=0.059 Sum_probs=104.9 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) -+.+..+-+..++..+ +.+..... -.. .+.. .+.++..+. T Consensus 78 ~~~~~~l~~~~~~~~~---~~~~~~~~----------~~~-~~~~--------------------------~t~~~gg~~ 117 (392) T protein:vir:10 78 DVFMKALRNKPLNAEE---REFLEDDL----------EQR-AMSG--------------------------LTGEDGGLV 117 (392) T ss_pred HHHHHHHhcccccHHH---HHHHhhhh----------hhh-hccc--------------------------cccCCCcee Confidence 1111111112222221 11111100 000 0000 000111111 Q ss_pred EccccccccCceeEeccCc----eEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccce Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATG----ENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPV 154 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~----E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~ 154 (418) |.. .+. ..|+...... -.+.+..|.+.. +.+.+...+..+ .|. .||+..+......-. T Consensus 118 vP~--~~~-~~ii~~~~~~s~l~~~~~~~~~~~~~~~~~~~~~~~~~~a-------~~v------~E~~~~~~~~~~~~~ 181 (392) T protein:vir:10 118 IPQ--DIQ-TQINELARSFDALEQYVTVEPVRTRSGSRVLEKNSDMIPF-------AEI------TEMGEIPETDNPKFS 181 (392) T ss_pred cch--hHH-HHHHHHHHhhhhhhhhceeeeccCCceeEEEEeecCCccc-------eee------cccccccccccccce Confidence 110 000 0011000000 112344444332 222222222221 121 355544321111111 Q ss_pred eccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccc Q lcl|Aclame:pro 155 YVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAP 234 (418) Q Consensus 155 ~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~ 234 (418) .+.=-..-+...+.|| .+..... ..+..++-...-...+.+.++.++++|... + + T Consensus 182 ~v~l~~~k~~~~~~iS--~ell~ds-~~~l~~~i~~~l~~~i~~~~d~~~~~g~g~----~-~----------------- 236 (392) T protein:vir:10 182 NVQYAVKDRAGILPLS--RSLLQDS-DQNILKYVTKWLGKKSKVTRNVLILGVIEK----L-T----------------- 236 (392) T ss_pred eEEeeeeeEEEeehhh--HHHHhhh-HHHHHHHHHHHHHHHHHHHHHHHHhhcccc----c-c----------------- Confidence 1110111122223333 3333321 123334444444555677788888765531 0 0 Q ss_pred cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCe Q lcl|Aclame:pro 235 DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKG 314 (418) Q Consensus 235 ~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG 314 (418) ..+..+.+++.+++..........+ ..+++++....+|.++...+|++-+...-.. |. -.+=+| T Consensus 237 -------~~~~~~~d~i~~~~~~~l~~~~~~~----a~~vm~~~~~~~L~~lkd~~G~~l~~~~~~~-~~----~~tllG 300 (392) T protein:vir:10 237 -------KQAIKSLDDIKDVLNVKLDPAISPN----AILLTNQDGFNYLDKLKDKDGKYILQSDPTQ-KN----KKLFAG 300 (392) T ss_pred -------ccCccCHHHHHHHHHHhhhhhhccC----CEEEEcHHHHHHHHHhhccCCCeEeecCccC-Cc----cccccC Confidence 1123556777776643333332222 2477888888889887555566554321100 00 001133 Q ss_pred EEEEE--ECccccccCC--CCCeEEEEchhh-ceeeeccCCCcccccccccCccccccccccccccCccccc----cEEE Q lcl|Aclame:pro 315 RLILK--EHPLFSAIGI--SPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQG----GSLT 385 (418) Q Consensus 315 ~v~vv--~n~~l~~~~m--p~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k----~~i~ 385 (418) .--++ .+..+...+. ....+++-|++. +.+..- .+...+.....+ .++.+ ...+ T Consensus 301 ~~~v~~~~~~~~~~~~~~~~~~~~~~gdfs~~~~i~~~--~~~~~~~~~~~~---------------~~f~~~~~~~r~~ 363 (392) T protein:vir:10 301 TNPVVVVSNRFLKSKGTTAKKAPLIIGDLKEAIVLFKR--EDMELASTDVGG---------------KAFTRNTLDLRAI 363 (392) T ss_pred cccEEEecccccCCCcccCCceEEEEEehhceEEEEee--cceEEEEecccc---------------chhhcCceEEEEE Confidence 21111 1221111111 112345556653 222111 111111111111 02233 3444 Q ss_pred EEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 386 SEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 386 ~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) .-+...+++++|+.+++.=.++ |...|+- T Consensus 364 ~r~d~~v~~~~a~~~l~~~~~a----~~~~~~~ 392 (392) T protein:vir:10 364 QRDDVQMWDNEAAVYGEIDLSA----PVEQPQG 392 (392) T ss_pred EeeccEEecccceEEEEecccc----cccCCCC Confidence 5578899999999998544333 3333444 No 112 >protein:vir:102873 Length: 392 # NCBI annotation: major capsid protein, HK97 family # Family: family:all:21 # MgeID: mge:1492 # MgeName: Cherry # Cross-refs: genbank:acc:YP_338137;genbank:gi:77020198;genbank:GeneID:3703782 Probab=21.06 E-value=2.7 Score=18.25 Aligned_cols=300 Identities=11% Similarity=0.059 Sum_probs=104.9 Q ss_pred CcceeeeeccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEEE Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVLT 80 (418) Q Consensus 1 ~~~~~~~~~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~t 80 (418) -+.+..+-+..++..+ +.+..... -.. .+.. .+.++..+. T Consensus 78 ~~~~~~l~~~~~~~~~---~~~~~~~~----------~~~-~~~~--------------------------~t~~~gg~~ 117 (392) T protein:vir:10 78 DVFMKALRNKPLNAEE---REFLEDDL----------EQR-AMSG--------------------------LTGEDGGLV 117 (392) T ss_pred HHHHHHHhcccccHHH---HHHHhhhh----------hhh-hccc--------------------------cccCCCcee Confidence 1111111112222221 11111100 000 0000 000111111 Q ss_pred EccccccccCceeEeccCc----eEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccce Q lcl|Aclame:pro 81 VENSDGLTKGMIFYNEATG----ENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQPV 154 (418) Q Consensus 81 V~~~~~~~~~~~~~~~~~~----E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~~ 154 (418) |.. .+. ..|+...... -.+.+..|.+.. +.+.+...+..+ .|. .||+..+......-. T Consensus 118 vP~--~~~-~~ii~~~~~~s~l~~~~~~~~~~~~~~~~~~~~~~~~~~a-------~~v------~E~~~~~~~~~~~~~ 181 (392) T protein:vir:10 118 IPQ--DIQ-TQINELARSFDALEQYVTVEPVRTRSGSRVLEKNSDMIPF-------AEI------TEMGEIPETDNPKFS 181 (392) T ss_pred cch--hHH-HHHHHHHHhhhhhhhhceeeeccCCceeEEEEeecCCccc-------eee------cccccccccccccce Confidence 110 000 0011000000 112344444332 222222222221 121 355544321111111 Q ss_pred eccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhccc Q lcl|Aclame:pro 155 YVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYAP 234 (418) Q Consensus 155 ~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~~ 234 (418) .+.=-..-+...+.|| .+..... ..+..++-...-...+.+.++.++++|... + + T Consensus 182 ~v~l~~~k~~~~~~iS--~ell~ds-~~~l~~~i~~~l~~~i~~~~d~~~~~g~g~----~-~----------------- 236 (392) T protein:vir:10 182 NVQYAVKDRAGILPLS--RSLLQDS-DQNILKYVTKWLGKKSKVTRNVLILGVIEK----L-T----------------- 236 (392) T ss_pred eEEeeeeeEEEeehhh--HHHHhhh-HHHHHHHHHHHHHHHHHHHHHHHHhhcccc----c-c----------------- Confidence 1110111122223333 3333321 123334444444555677788888765531 0 0 Q ss_pred cCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEcccceeeceEEEEEEcCCe Q lcl|Aclame:pro 235 DNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQRETSYGMVFTEWKFFKG 314 (418) Q Consensus 235 ~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~~~~~G~~v~~~~SdfG 314 (418) ..+..+.+++.+++..........+ ..+++++....+|.++...+|++-+...-.. |. -.+=+| T Consensus 237 -------~~~~~~~d~i~~~~~~~l~~~~~~~----a~~vm~~~~~~~L~~lkd~~G~~l~~~~~~~-~~----~~tllG 300 (392) T protein:vir:10 237 -------KQAIKSLDDIKDVLNVKLDPAISPN----AILLTNQDGFNYLDKLKDKDGKYILQSDPTQ-KN----KKLFAG 300 (392) T ss_pred -------ccCccCHHHHHHHHHHhhhhhhccC----CEEEEcHHHHHHHHHhhccCCCeEeecCccC-Cc----cccccC Confidence 1123556777776643333332222 2477888888889887555566554321100 00 001133 Q ss_pred EEEEE--ECccccccCC--CCCeEEEEchhh-ceeeeccCCCcccccccccCccccccccccccccCccccc----cEEE Q lcl|Aclame:pro 315 RLILK--EHPLFSAIGI--SPGFAVVVDVPA-VKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQG----GSLT 385 (418) Q Consensus 315 ~v~vv--~n~~l~~~~m--p~d~~lv~D~~~-~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k----~~i~ 385 (418) .--++ .+..+...+. ....+++-|++. +.+..- .+...+.....+ .++.+ ...+ T Consensus 301 ~~~v~~~~~~~~~~~~~~~~~~~~~~gdfs~~~~i~~~--~~~~~~~~~~~~---------------~~f~~~~~~~r~~ 363 (392) T protein:vir:10 301 TNPVVVVSNRFLKSKGTTAKKAPLIIGDLKEAIVLFKR--EDMELASTDVGG---------------KAFTRNTLDLRAI 363 (392) T ss_pred cccEEEecccccCCCcccCCceEEEEEehhceEEEEee--cceEEEEecccc---------------chhhcCceEEEEE Confidence 21111 1221111111 112345556653 222111 111111111111 02233 3444 Q ss_pred EEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 386 SEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 386 ~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) .-+...+++++|+.+++.=.++ |...|+- T Consensus 364 ~r~d~~v~~~~a~~~l~~~~~a----~~~~~~~ 392 (392) T protein:vir:10 364 QRDDVQMWDNEAAVYGEIDLSA----PVEQPQG 392 (392) T ss_pred EeeccEEecccceEEEEecccc----cccCCCC Confidence 5578899999999998544333 3333444 No 113 >protein:vir:98339 Length: 415 # NCBI annotation: putative capsid protein # Family: family:all:21 # MgeID: mge:1581 # MgeName: phiPVL(108) # Cross-refs: genbank:acc:YP_918931;genbank:gi:119443693;genbank:GeneID:4594501 Probab=20.49 E-value=2.8 Score=18.16 Aligned_cols=314 Identities=12% Similarity=0.009 Sum_probs=124.8 Q ss_pred Ccceeeee-ccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEE Q lcl|Aclame:pro 1 MSVYAGIF-NTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVL 79 (418) Q Consensus 1 ~~~~~~~~-~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~ 79 (418) +..+.+-+ ...+...+. +.+...+.......+ + .++ ..++...+ T Consensus 89 ~~~~~~~~~~~~~~~~~~--~~~~~~~~~~~~~~~---------~----------------------~~~--~~~gg~~i 133 (415) T protein:vir:98 89 INDLGISIQNTKVTSQEV--RDFTEYLETRNDIQG---------G----------------------SLK--TDSGFVVI 133 (415) T ss_pred HHHHhhhhhhhhhHHHHH--HHHHHHHhhhhhhhh---------c----------------------ccc--cccccccc Confidence 11111111 122223333 444433322211100 0 000 00000111 Q ss_pred EEccccccccCceeEeccC----ceEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccc Q lcl|Aclame:pro 80 TVENSDGLTKGMIFYNEAT----GENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQP 153 (418) Q Consensus 80 tV~~~~~~~~~~~~~~~~~----~E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~ 153 (418) +.. +. ..|+..... ...+.|..+.+.. +.+.+...+..+ .| ..||++.+......- T Consensus 134 P~~----~~-~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~~-------~~------v~E~~~~~~~~~~~~ 195 (415) T protein:vir:98 134 PEE----IV-TDILKLKEVEFNLDKYVTVKRVTNGSGKYPVVRQSEVAAL-------EK------VEELEENPELAVKPF 195 (415) T ss_pred chH----HH-HHHHHHHHhhhhhhhheeeeeccCCceeEEEEeecCCccc-------ee------eccccccCcccccce Confidence 100 00 001100000 0112233333332 223322222111 11 136666553221111 Q ss_pred eeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhcc Q lcl|Aclame:pro 154 VYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYA 233 (418) Q Consensus 154 ~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~ 233 (418) ..+ -..+++-..-+.-|.+..... ..+-..+-..+-...+.+.+|.++|+|.-. +... . ++.... T Consensus 196 ~~v--~~~~~k~~~~~~iS~ell~ds-~~~l~~~i~~~l~~~~~~~~~~~il~g~g~----g~~~-~---~~~~~~---- 260 (415) T protein:vir:98 196 FQL--AYDINTHRGYFRISREAIEDA-KVNVLQELKLWMARTIAATRNKAIIDVITK----GSTG-S---TSSGFE---- 260 (415) T ss_pred eeE--EeeeeeeEeeehhhHHHHhhc-hHHHHHHHHHHHHHHHHHHHHHHHhhcccc----Cccc-c---cccccc---- Confidence 111 112222222333344444332 223344555555667789999999987631 1111 1 111110 Q ss_pred ccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc------ceeeceEEE Q lcl|Aclame:pro 234 PDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR------ETSYGMVFT 307 (418) Q Consensus 234 ~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~------~~~~G~~v~ 307 (418) .........+..+.++|.+++.++-...... ..+++++.....|.++...+|++.+... ..-+|.-| T Consensus 261 -~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~-----~~~v~n~~~~~~l~~lkd~~G~~l~~~~~~~~~~~~l~G~pV- 333 (415) T protein:vir:98 261 -KEGKKLEVKKAKSLDDIKDAINLNVKPNYEH-----NVAIVSQTMFAKLDKMKDKLGNYLIQPDVKEKTQQRLLGAKI- 333 (415) T ss_pred -ccccccccccccchhHHHHHHHhhhhhccCC-----CEEEEcHHHHHHHHHhhccCCceeeccCcCCCCCceecceee- Confidence 1112223445678888888887765432221 2477898888889887555566544321 11223222 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSE 387 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E 387 (418) +..+.+..-.-....+++.|+.....-+. ..+...+... +. .+...-+.+.- T Consensus 334 -----------~~~~~~~~~~~~~~~~~~Gd~~~~~~~~~-~~~~~v~~~~----------~~------~~~~~~~~~~r 385 (415) T protein:vir:98 334 -----------EILPDEVLGQKGNNTLIIGNLKDAIVLFD-RSQYQASWTD----------YM------HFGECLMIAVR 385 (415) T ss_pred -----------EEecccccCCCCccEEEEEehhccEEEEe-ecceEEEEec----------cc------cCceEEEEEEE Confidence 22221110000111355566654321111 0111111100 00 02223356677 Q ss_pred EEEEEecccceEEeecCcccccccCCCCCC Q lcl|Aclame:pro 388 WALELLNPQGCAVITGLQKAKERVYLTAPA 417 (418) Q Consensus 388 ~tLev~N~kA~a~I~gL~~~~~~~~~~~~~ 417 (418) +...+.+|+|+.+++--+++++.-.+---+ T Consensus 386 ~d~~v~~~~a~~~~~~~~~~~~~~~~~~~~ 415 (415) T protein:vir:98 386 QDCRILDYKSAIVIEYDDSERGEGDLGLEA 415 (415) T ss_pred eccEEeccccEEEEEEeccCCCCCccccCC Confidence 889999999999999888776655444333 No 114 >protein:vir:79987 Length: 415 # NCBI annotation: head protein # Family: family:all:21 # MgeID: mge:1875 # MgeName: tp310-3 # Cross-refs: genbank:acc:YP_001430002;genbank:gi:156604057;genbank:GeneID:5525447 Probab=20.49 E-value=2.8 Score=18.16 Aligned_cols=314 Identities=12% Similarity=0.009 Sum_probs=124.8 Q ss_pred Ccceeeee-ccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEE Q lcl|Aclame:pro 1 MSVYAGIF-NTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVL 79 (418) Q Consensus 1 ~~~~~~~~-~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~ 79 (418) +..+.+-+ ...+...+. +.+...+.......+ + .++ ..++...+ T Consensus 89 ~~~~~~~~~~~~~~~~~~--~~~~~~~~~~~~~~~---------~----------------------~~~--~~~gg~~i 133 (415) T protein:vir:79 89 INDLGISIQNTKVTSQEV--RDFTEYLETRNDIQG---------G----------------------SLK--TDSGFVVI 133 (415) T ss_pred HHHHhhhhhhhhhHHHHH--HHHHHHHhhhhhhhh---------c----------------------ccc--cccccccc Confidence 11111111 122223333 444433322211100 0 000 00000111 Q ss_pred EEccccccccCceeEeccC----ceEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccc Q lcl|Aclame:pro 80 TVENSDGLTKGMIFYNEAT----GENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQP 153 (418) Q Consensus 80 tV~~~~~~~~~~~~~~~~~----~E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~ 153 (418) +.. +. ..|+..... ...+.|..+.+.. +.+.+...+..+ .| ..||++.+......- T Consensus 134 P~~----~~-~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~~-------~~------v~E~~~~~~~~~~~~ 195 (415) T protein:vir:79 134 PEE----IV-TDILKLKEVEFNLDKYVTVKRVTNGSGKYPVVRQSEVAAL-------EK------VEELEENPELAVKPF 195 (415) T ss_pred chH----HH-HHHHHHHHhhhhhhhheeeeeccCCceeEEEEeecCCccc-------ee------eccccccCcccccce Confidence 100 00 001100000 0112233333332 223322222111 11 136666553221111 Q ss_pred eeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhcc Q lcl|Aclame:pro 154 VYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYA 233 (418) Q Consensus 154 ~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~ 233 (418) ..+ -..+++-..-+.-|.+..... ..+-..+-..+-...+.+.+|.++|+|.-. +... . ++.... T Consensus 196 ~~v--~~~~~k~~~~~~iS~ell~ds-~~~l~~~i~~~l~~~~~~~~~~~il~g~g~----g~~~-~---~~~~~~---- 260 (415) T protein:vir:79 196 FQL--AYDINTHRGYFRISREAIEDA-KVNVLQELKLWMARTIAATRNKAIIDVITK----GSTG-S---TSSGFE---- 260 (415) T ss_pred eeE--EeeeeeeEeeehhhHHHHhhc-hHHHHHHHHHHHHHHHHHHHHHHHhhcccc----Cccc-c---cccccc---- Confidence 111 112222222333344444332 223344555555667789999999987631 1111 1 111110 Q ss_pred ccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc------ceeeceEEE Q lcl|Aclame:pro 234 PDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR------ETSYGMVFT 307 (418) Q Consensus 234 ~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~------~~~~G~~v~ 307 (418) .........+..+.++|.+++.++-...... ..+++++.....|.++...+|++.+... ..-+|.-| T Consensus 261 -~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~-----~~~v~n~~~~~~l~~lkd~~G~~l~~~~~~~~~~~~l~G~pV- 333 (415) T protein:vir:79 261 -KEGKKLEVKKAKSLDDIKDAINLNVKPNYEH-----NVAIVSQTMFAKLDKMKDKLGNYLIQPDVKEKTQQRLLGAKI- 333 (415) T ss_pred -ccccccccccccchhHHHHHHHhhhhhccCC-----CEEEEcHHHHHHHHHhhccCCceeeccCcCCCCCceecceee- Confidence 1112223445678888888887765432221 2477898888889887555566544321 11223222 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSE 387 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E 387 (418) +..+.+..-.-....+++.|+.....-+. ..+...+... +. .+...-+.+.- T Consensus 334 -----------~~~~~~~~~~~~~~~~~~Gd~~~~~~~~~-~~~~~v~~~~----------~~------~~~~~~~~~~r 385 (415) T protein:vir:79 334 -----------EILPDEVLGQKGNNTLIIGNLKDAIVLFD-RSQYQASWTD----------YM------HFGECLMIAVR 385 (415) T ss_pred -----------EEecccccCCCCccEEEEEehhccEEEEe-ecceEEEEec----------cc------cCceEEEEEEE Confidence 22221110000111355566654321111 0111111100 00 02223356677 Q ss_pred EEEEEecccceEEeecCcccccccCCCCCC Q lcl|Aclame:pro 388 WALELLNPQGCAVITGLQKAKERVYLTAPA 417 (418) Q Consensus 388 ~tLev~N~kA~a~I~gL~~~~~~~~~~~~~ 417 (418) +...+.+|+|+.+++--+++++.-.+---+ T Consensus 386 ~d~~v~~~~a~~~~~~~~~~~~~~~~~~~~ 415 (415) T protein:vir:79 386 QDCRILDYKSAIVIEYDDSERGEGDLGLEA 415 (415) T ss_pred eccEEeccccEEEEEEeccCCCCCccccCC Confidence 889999999999999888776655444333 No 115 >protein:vir:81100 Length: 415 # NCBI annotation: capsid protein # Family: family:all:21 # MgeID: mge:1891 # MgeName: tp310-1 # Cross-refs: genbank:acc:YP_001429874;genbank:gi:156603927;genbank:GeneID:5525320 Probab=20.49 E-value=2.8 Score=18.16 Aligned_cols=314 Identities=12% Similarity=0.009 Sum_probs=124.8 Q ss_pred Ccceeeee-ccCCChhhhhhhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEeecCceEE Q lcl|Aclame:pro 1 MSVYAGIF-NTTLNPQELNMKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAAADATVL 79 (418) Q Consensus 1 ~~~~~~~~-~~~~~~~~~~~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~a~~t~~ 79 (418) +..+.+-+ ...+...+. +.+...+.......+ + .++ ..++...+ T Consensus 89 ~~~~~~~~~~~~~~~~~~--~~~~~~~~~~~~~~~---------~----------------------~~~--~~~gg~~i 133 (415) T protein:vir:81 89 INDLGISIQNTKVTSQEV--RDFTEYLETRNDIQG---------G----------------------SLK--TDSGFVVI 133 (415) T ss_pred HHHHhhhhhhhhhHHHHH--HHHHHHHhhhhhhhh---------c----------------------ccc--cccccccc Confidence 11111111 122223333 444433322211100 0 000 00000111 Q ss_pred EEccccccccCceeEeccC----ceEEEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccccCCcCcccccc Q lcl|Aclame:pro 80 TVENSDGLTKGMIFYNEAT----GENMRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEGSQRPTARSIQP 153 (418) Q Consensus 80 tV~~~~~~~~~~~~~~~~~----~E~~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EGada~~~~~~~~ 153 (418) +.. +. ..|+..... ...+.|..+.+.. +.+.+...+..+ .| ..||++.+......- T Consensus 134 P~~----~~-~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~~-------~~------v~E~~~~~~~~~~~~ 195 (415) T protein:vir:81 134 PEE----IV-TDILKLKEVEFNLDKYVTVKRVTNGSGKYPVVRQSEVAAL-------EK------VEELEENPELAVKPF 195 (415) T ss_pred chH----HH-HHHHHHHHhhhhhhhheeeeeccCCceeEEEEeecCCccc-------ee------eccccccCcccccce Confidence 100 00 001100000 0112233333332 223322222111 11 136666553221111 Q ss_pred eeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhhHHHHHHHhhcc Q lcl|Aclame:pro 154 VYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTTQGIVDAVRQYA 233 (418) Q Consensus 154 ~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t~GI~~~i~~~~ 233 (418) ..+ -..+++-..-+.-|.+..... ..+-..+-..+-...+.+.+|.++|+|.-. +... . ++.... T Consensus 196 ~~v--~~~~~k~~~~~~iS~ell~ds-~~~l~~~i~~~l~~~~~~~~~~~il~g~g~----g~~~-~---~~~~~~---- 260 (415) T protein:vir:81 196 FQL--AYDINTHRGYFRISREAIEDA-KVNVLQELKLWMARTIAATRNKAIIDVITK----GSTG-S---TSSGFE---- 260 (415) T ss_pred eeE--EeeeeeeEeeehhhHHHHhhc-hHHHHHHHHHHHHHHHHHHHHHHHhhcccc----Cccc-c---cccccc---- Confidence 111 112222222333344444332 223344555555667789999999987631 1111 1 111110 Q ss_pred ccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc------ceeeceEEE Q lcl|Aclame:pro 234 PDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR------ETSYGMVFT 307 (418) Q Consensus 234 ~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~------~~~~G~~v~ 307 (418) .........+..+.++|.+++.++-...... ..+++++.....|.++...+|++.+... ..-+|.-| T Consensus 261 -~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~-----~~~v~n~~~~~~l~~lkd~~G~~l~~~~~~~~~~~~l~G~pV- 333 (415) T protein:vir:81 261 -KEGKKLEVKKAKSLDDIKDAINLNVKPNYEH-----NVAIVSQTMFAKLDKMKDKLGNYLIQPDVKEKTQQRLLGAKI- 333 (415) T ss_pred -ccccccccccccchhHHHHHHHhhhhhccCC-----CEEEEcHHHHHHHHHhhccCCceeeccCcCCCCCceecceee- Confidence 1112223445678888888887765432221 2477898888889887555566544321 11223222 Q ss_pred EEEcCCeEEEEEECccccccCCCCCeEEEEchhhceeeeccCCCcccccccccCccccccccccccccCccccccEEEEE Q lcl|Aclame:pro 308 EWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAVKLAYMDGRNAKVENYGQGGGENKSGATDYSYGHGVDAQGGSLTSE 387 (418) Q Consensus 308 ~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~g~Da~k~~i~~E 387 (418) +..+.+..-.-....+++.|+.....-+. ..+...+... +. .+...-+.+.- T Consensus 334 -----------~~~~~~~~~~~~~~~~~~Gd~~~~~~~~~-~~~~~v~~~~----------~~------~~~~~~~~~~r 385 (415) T protein:vir:81 334 -----------EILPDEVLGQKGNNTLIIGNLKDAIVLFD-RSQYQASWTD----------YM------HFGECLMIAVR 385 (415) T ss_pred -----------EEecccccCCCCccEEEEEehhccEEEEe-ecceEEEEec----------cc------cCceEEEEEEE Confidence 22221110000111355566654321111 0111111100 00 02223356677 Q ss_pred EEEEEecccceEEeecCcccccccCCCCCC Q lcl|Aclame:pro 388 WALELLNPQGCAVITGLQKAKERVYLTAPA 417 (418) Q Consensus 388 ~tLev~N~kA~a~I~gL~~~~~~~~~~~~~ 417 (418) +...+.+|+|+.+++--+++++.-.+---+ T Consensus 386 ~d~~v~~~~a~~~~~~~~~~~~~~~~~~~~ 415 (415) T protein:vir:81 386 QDCRILDYKSAIVIEYDDSERGEGDLGLEA 415 (415) T ss_pred eccEEeccccEEEEEEeccCCCCCccccCC Confidence 889999999999999888776655444333 No 116 >protein:vir:3845 Length: 395 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:322 # MgeName: phi adh # Cross-refs: genbank:acc:NP_050151;swissprot:trembl:q9t1f6;genbank:gi:9633043;uniprot:Q9T1F6;genbank:GeneID:1262163 Probab=20.08 E-value=2.8 Score=18.10 Aligned_cols=327 Identities=11% Similarity=0.023 Sum_probs=106.8 Q ss_pred CcceeeeeccCCChh------hhh-hhhcccceeEeecCCcchhHHHhhhccccceeeeeeeeeeeecccceeEEEEEee Q lcl|Aclame:pro 1 MSVYAGIFNTTLNPQ------ELN-MKSFAGTILRRVPNGSAPLLAMTSVVGSTTAKASTHGYFSKTMVFASAVVTAEAA 73 (418) Q Consensus 1 ~~~~~~~~~~~~~~~------~~~-~~s~~~~~~~~~~~~~~p~~~l~~~~~~~~~~~~~~~~~~~~~~~~~~t~~a~~~ 73 (418) +.-...-++. +... ... .++.. .....++. ..+... .........-.|+.......... T Consensus 43 ~~~l~~~i~~-~~~~~~~~~~~~~~~~~~~-~~~~~~~~-~~~~~~-----~~~~~~~~~~~~~~~~~~~~~~~------ 108 (395) T protein:vir:38 43 INKLNASLKN-AKMAQELAKSAYEDARANL-NAEPVNKK-PLPVKD-----GKPDAQAMKNQFVKDFKNLVTSG------ 108 (395) T ss_pred HHHHHHHHHH-HHHHHHHHHHHHHHHHhhh-hhcccccc-ccchhh-----hhHHHHHHHHHHHHHHHHHHhhc------ Confidence 0000000000 0000 000 00000 00000000 000000 00000111111111111000000 Q ss_pred cCceEEEEccccccccCceeEeccCc----eE-----EEEEEecCce--eEEEccccccchhhhhCCceEEEeecccccc Q lcl|Aclame:pro 74 ADATVLTVENSDGLTKGMIFYNEATG----EN-----MRLELVNGLN--LTVKRQTGRISAAIIAANTKLIVIGTAFEEG 142 (418) Q Consensus 74 a~~t~~tV~~~~~~~~~~~~~~~~~~----E~-----~~Vtav~g~~--~tv~rg~~~tta~~~~~gt~v~~~g~a~~EG 142 (418) ..+..++ ++..+.-+...|-+ +. +.+..+.+.. +.+.+..... + ...|. .|| T Consensus 109 ----~~~~~~g-g~~vP~~~~~~ii~~~~~~~~l~~~~~~~~~~~~~~~~~~~~~~~~~-~-----~a~~v------~E~ 171 (395) T protein:vir:38 109 ----TTGTGNA-GLTIPEDIQLQIRTLTRSFTSLESLANVENVTTSHGSRVYEKLADIT-P-----LKDLD------DES 171 (395) T ss_pred ----cCccCCC-ceecchhHhhHHHHHHHhhcchhhhcceeeccCCcceEEEEeeccCC-c-----ccccc------ccc Confidence 0011111 12222111111111 11 1122222221 1111111110 0 01111 344 Q ss_pred cCCcCcccccceeccceeEEEeeeeeechhHHHHhhhcccchHHHHHHHHHHHHHHHHhHHHhcCcccccCcCCccchhh Q lcl|Aclame:pro 143 SQRPTARSIQPVYVPNFTQIFRNAWALTDTARASYAEAGYSNITESRRDCMDFHATEQETAIFFGQAFMGTYNGQPLHTT 222 (418) Q Consensus 143 ada~~~~~~~~~~~~N~tQIf~~~v~VSgTa~Av~~~g~~dela~q~~kk~~EikrdmE~a~i~G~k~~~~s~~~~~r~t 222 (418) ...+......-. ..-...++-..-+--|.+.++... .+-..+-...-.+.+.+.+|..+|+|... +.. + T Consensus 172 ~~~~~~~~~~f~--~v~~~~~k~~~~~~iS~ell~ds~-~~l~~~i~~~la~~~~~~~~~~il~g~g~----~~~----~ 240 (395) T protein:vir:38 172 ALIGDNDDPELT--VVKYLIHRYAGITTVTNTLLKDTV-DNIIQWLVNWAAKKDVVTRNAKILEVMGK----APK----K 240 (395) T ss_pred ccccccccccee--eEEeeeeeeEeehhhHHHHHhhhH-HHHHHHHHHHHHHHHHHHHHHHHhhcccc----ccc----c Confidence 443321110000 112222333333333444443322 23334444555566788889999987531 111 0 Q ss_pred HHHHHHHhhccccCccccCCCCccchHHHHHHHHHHHHhcccCCCceeEEEEeChHHHHHHHhhhhccceEEEccc---- Q lcl|Aclame:pro 223 QGIVDAVRQYAPDNVNAMPNPTAVTYDDVVDATIDAFKWSVNVGDNTQRVMFCDTVGMRTMQDIGRFFGEVTVTQR---- 298 (418) Q Consensus 223 ~GI~~~i~~~~~~nv~~~~~~a~~te~~l~d~~~~~~~~g~~~~g~~~~~i~v~a~~k~~i~~~~~~~~~~~~~~~---- 298 (418) ++..+.+++.+++...-......+ ..+++++.....|.++...+|++-+... T Consensus 241 --------------------~~~~~~~~i~~~~~~~l~~~~~~~----a~~v~n~~~~~~L~~lkd~~G~~l~~~~~~~~ 296 (395) T protein:vir:38 241 --------------------PTISQFDNIKDLENNTLDPAIEST----SSFITNQSGYNILSKVKDADGRYLMQPDVTSP 296 (395) T ss_pred --------------------cccccHHHHHHHHHHhhhhhhcCC----CEEEEcHHHHHHHHHhhccCCceeeccCcCCC Confidence 112344556665543222222222 2477888888888887555666544321 Q ss_pred --ceeeceEEEEEEcCCeEEEEEECccccccCCCCCeEEEEchhhc-eeeeccCCCcccccccccCcccccccccccccc Q lcl|Aclame:pro 299 --ETSYGMVFTEWKFFKGRLILKEHPLFSAIGISPGFAVVVDVPAV-KLAYMDGRNAKVENYGQGGGENKSGATDYSYGH 375 (418) Q Consensus 299 --~~~~G~~v~~~~SdfG~v~vv~n~~l~~~~mp~d~~lv~D~~~~-~~~~L~~r~~~~e~laKtG~~~~~~~~~~~~~~ 375 (418) ..-+|.-| +.++. -.+.. ......+++-|+... .+..-. +...+.....+.. + T Consensus 297 ~~~~l~G~pV--~~~~~--------~~~~~-~~~~~~i~~gd~~~~~~i~~~~--~~~i~~~~~~~~~---~-------- 352 (395) T protein:vir:38 297 DKYLIDGKPV--IRIAD--------KWLPD-VSGSHPLYFGDLKQGITLFDRQ--QMQIDTTNVGAGS---F-------- 352 (395) T ss_pred Ccceecccee--EEecc--------cccCc-CCCcceEEEEeccccEEEEEec--ceEEEEeccccch---h-------- Confidence 11223322 22221 01111 112234666677642 222211 1111111111100 0 Q ss_pred CccccccEEEEEEEEEEecccceEEeecCcccccccCCCCCCC Q lcl|Aclame:pro 376 GVDAQGGSLTSEWALELLNPQGCAVITGLQKAKERVYLTAPAP 418 (418) Q Consensus 376 g~Da~k~~i~~E~tLev~N~kA~a~I~gL~~~~~~~~~~~~~~ 418 (418) -.|....+.+..+...+.+|+|+.+|+. +++...++.|.=.- T Consensus 353 ~~~~~~~r~~~r~d~~~~~~~a~~~~~~-~~~~~~~~~~~~~~ 394 (395) T protein:vir:38 353 EHDTTKLRFIDRFDVQLIDDGAFAAASF-KTVANQAQGTAGTG 394 (395) T ss_pred hcCceEEEEEEeeccEEecccceEEEEe-ecccCCCCCccCCC Confidence 0034455677789999999999999985 44421111111111 Done!