Query lcl|Aclame:protein:vir:96490|NCBI_annot:head protein|genbank:acc:YP_238492;genbank:gi:66391768;genbank:GeneID:5176912 Match_columns 348 No_of_seqs 131 out of 320 Neff 9.2 Searched_HMMs 1612 Date Sun Dec 1 05:39:59 2013 Command /home/guerois/workspace/virfam/python/lib/hhsearch//hhsearch2 -i .//seq/seq_36 -d /home/guerois/workspace/virfam/python/profile_database/capsid_neck_tail.hhm -glob -cpu 7 -o .//seq/HHR/seq_36_vs_rec_db.hhr No Hit Prob E-value P-value Score SS Cols Query HMM Template HMM 1 protein:vir:2736 Length: 348 # 100.0 3.1E-97 2E-100 549.7 38.9 348 1-348 1-348 (348) 2 protein:vir:4902 Length: 348 # 100.0 4.7E-97 3E-100 548.7 38.5 348 1-348 1-348 (348) 3 protein:vir:96490 Length: 348 100.0 7.8E-97 5E-100 547.5 37.9 348 1-348 1-348 (348) 4 protein:vir:98480 Length: 348 100.0 5.3E-81 3.3E-84 460.7 35.0 331 1-346 1-348 (348) 5 protein:vir:106590 Length: 349 100.0 7.1E-80 4.4E-83 454.5 36.3 330 1-345 1-349 (349) 6 protein:vir:3424 Length: 341 # 100.0 2.6E-74 1.6E-77 424.0 32.4 331 5-345 1-341 (341) 7 protein:vir:393 Length: 341 # 100.0 4.7E-73 2.9E-76 417.1 34.8 328 5-345 1-341 (341) 8 protein:vir:6378 Length: 346 # 100.0 2.6E-72 1.6E-75 413.0 34.8 328 5-345 1-346 (346) 9 protein:vir:79503 Length: 409 100.0 2.3E-65 1.4E-68 374.9 29.3 337 1-348 11-403 (409) 10 protein:vir:78006 Length: 409 100.0 2.3E-65 1.4E-68 374.9 29.3 337 1-348 11-403 (409) 11 protein:vir:10324 Length: 320 100.0 2.3E-48 1.4E-51 281.8 23.8 308 17-348 1-318 (320) 12 protein:vir:95258 Length: 368 100.0 9E-41 5.6E-44 240.1 27.0 327 1-348 1-367 (368) 13 protein:vir:79078 Length: 307 99.9 1.7E-29 1.1E-32 178.3 22.5 294 1-346 1-307 (307) 14 protein:vir:107882 Length: 307 99.9 2.3E-27 1.4E-30 166.6 23.5 292 1-347 1-307 (307) 15 protein:vir:99888 Length: 309 99.9 3.4E-25 2.1E-28 154.7 18.3 295 1-347 1-309 (309) 16 protein:vir:108211 Length: 318 99.1 1.3E-11 8.2E-15 80.2 17.9 277 1-347 1-318 (318) 17 protein:vir:98819 Length: 437 99.0 2.2E-12 1.4E-15 84.5 6.7 324 1-348 1-418 (437) 18 protein:vir:105334 Length: 276 96.7 0.00038 2.4E-07 39.3 17.2 257 1-348 1-271 (276) 19 protein:vir:80930 Length: 278 96.3 0.00082 5.1E-07 37.5 17.0 262 1-348 1-278 (278) 20 protein:vir:93742 Length: 274 96.2 0.00086 5.3E-07 37.4 17.3 257 1-348 1-271 (274) 21 protein:vir:96262 Length: 274 96.1 0.00096 5.9E-07 37.1 19.2 257 1-348 1-271 (274) 22 protein:vir:95898 Length: 274 96.1 0.00096 5.9E-07 37.1 19.2 257 1-348 1-271 (274) 23 protein:vir:95107 Length: 270 96.0 0.0012 7.1E-07 36.7 16.8 254 1-348 1-267 (270) 24 protein:vir:97433 Length: 274 95.8 0.0015 9E-07 36.1 17.1 257 1-348 1-271 (274) 25 protein:vir:94494 Length: 274 95.8 0.0015 9E-07 36.1 17.1 257 1-348 1-271 (274) 26 protein:vir:1239 Length: 274 # 95.7 0.0016 9.7E-07 36.0 16.4 257 1-348 1-271 (274) 27 protein:vir:96833 Length: 275 95.2 0.0025 1.6E-06 34.8 17.5 257 1-348 3-272 (275) 28 protein:vir:3033 Length: 272 # 94.9 0.0032 2E-06 34.2 19.8 260 1-348 1-270 (272) 29 protein:vir:9820 Length: 272 # 94.9 0.0032 2E-06 34.2 19.8 260 1-348 1-270 (272) 30 protein:vir:4600 Length: 415 # 94.9 0.0033 2E-06 34.2 18.8 281 1-348 120-405 (415) 31 protein:vir:4700 Length: 415 # 94.9 0.0033 2E-06 34.2 18.8 281 1-348 120-405 (415) 32 protein:vir:96123 Length: 274 94.9 0.0033 2.1E-06 34.2 17.9 257 1-348 1-271 (274) 33 protein:vir:3613 Length: 272 # 92.6 0.011 6.7E-06 31.4 16.9 254 1-348 1-272 (272) 34 protein:vir:4339 Length: 395 # 91.7 0.015 9.1E-06 30.6 18.6 273 1-347 117-395 (395) 35 protein:vir:9410 Length: 415 # 91.6 0.015 9.4E-06 30.5 18.2 281 1-348 120-405 (415) 36 protein:vir:81100 Length: 415 88.1 0.035 2.1E-05 28.6 18.2 281 1-348 120-405 (415) 37 protein:vir:79987 Length: 415 88.1 0.035 2.1E-05 28.6 18.2 281 1-348 120-405 (415) 38 protein:vir:98339 Length: 415 88.1 0.035 2.1E-05 28.6 18.2 281 1-348 120-405 (415) 39 protein:vir:9574 Length: 300 # 87.7 0.037 2.3E-05 28.4 19.4 295 1-347 1-300 (300) 40 protein:vir:739 Length: 231 # 85.4 0.053 3.3E-05 27.6 11.5 228 23-348 1-231 (231) 41 protein:vir:94673 Length: 419 83.1 0.071 4.4E-05 26.9 19.7 280 1-348 121-418 (419) 42 protein:vir:1886 Length: 385 # 82.6 0.076 4.7E-05 26.7 19.7 272 1-348 105-385 (385) 43 protein:vir:191 Length: 385 # 82.6 0.076 4.7E-05 26.7 19.7 272 1-348 105-385 (385) 44 protein:vir:9927 Length: 295 # 79.5 0.1 6.4E-05 26.0 16.9 275 1-348 1-293 (295) 45 protein:vir:94771 Length: 298 79.2 0.11 6.6E-05 25.9 17.1 296 1-346 1-298 (298) 46 protein:vir:5255 Length: 304 # 77.6 0.12 7.7E-05 25.6 13.9 280 1-344 1-304 (304) 47 protein:vir:5974 Length: 324 # 77.3 0.13 7.9E-05 25.5 14.8 299 1-348 1-322 (324) 48 protein:vir:1638 Length: 298 # 76.9 0.13 8.1E-05 25.4 20.1 297 1-346 1-298 (298) 49 protein:vir:103285 Length: 296 70.0 0.21 0.00013 24.2 20.8 279 1-346 1-296 (296) 50 protein:vir:80446 Length: 367 59.5 0.39 0.00024 22.8 17.3 305 1-348 1-361 (367) 51 protein:vir:102944 Length: 330 58.4 0.41 0.00026 22.7 14.3 302 1-348 1-328 (330) 52 protein:vir:100135 Length: 418 57.2 0.44 0.00027 22.5 21.5 277 1-348 135-416 (418) 53 protein:vir:107687 Length: 319 52.1 0.56 0.00035 22.0 22.0 277 1-345 24-319 (319) 54 protein:vir:79928 Length: 393 51.4 0.58 0.00036 21.9 18.5 288 1-337 74-393 (393) 55 protein:vir:4953 Length: 397 # 48.6 0.66 0.00041 21.6 19.1 268 1-348 109-386 (397) 56 protein:vir:10364 Length: 390 47.0 0.71 0.00044 21.4 20.3 270 1-345 114-390 (390) 57 protein:vir:4856 Length: 293 # 46.2 0.74 0.00046 21.3 16.9 272 1-348 5-282 (293) 58 protein:vir:1268 Length: 397 # 45.8 0.76 0.00047 21.2 17.6 264 1-347 123-397 (397) 59 protein:vir:9875 Length: 296 # 45.5 0.77 0.00048 21.2 16.5 276 1-348 1-296 (296) 60 protein:vir:102655 Length: 322 45.5 0.77 0.00048 21.2 13.0 281 1-348 13-322 (322) 61 protein:vir:97053 Length: 390 43.9 0.83 0.00051 21.0 20.1 269 1-345 113-390 (390) 62 protein:vir:7771 Length: 330 # 39.0 1 0.00065 20.5 18.3 295 1-348 1-324 (330) 63 protein:vir:4997 Length: 397 # 37.5 1.1 0.00069 20.3 19.8 268 1-348 109-386 (397) 64 protein:vir:105905 Length: 304 34.8 1.3 0.00079 20.0 21.0 281 1-346 1-304 (304) 65 protein:vir:94142 Length: 304 34.8 1.3 0.00079 20.0 21.0 281 1-346 1-304 (304) 66 protein:vir:81227 Length: 413 34.7 1.3 0.00079 20.0 18.7 279 1-348 122-411 (413) 67 protein:vir:41 Length: 299 # N 31.7 1.5 0.00092 19.6 18.0 289 1-348 6-299 (299) 68 protein:vir:1583 Length: 351 # 29.3 1.7 0.001 19.4 14.4 304 1-348 1-328 (351) 69 protein:vir:104342 Length: 314 28.3 1.8 0.0011 19.2 20.2 277 1-346 21-314 (314) 70 protein:vir:78148 Length: 123 26.8 1.9 0.0012 19.0 7.8 121 200-347 1-123 (123) 71 protein:vir:94070 Length: 339 24.3 2.2 0.0014 18.7 16.3 272 1-330 46-339 (339) 72 protein:vir:99675 Length: 324 23.2 2.3 0.0015 18.6 8.9 266 34-348 1-305 (324) 73 protein:vir:4830 Length: 397 # 21.8 2.5 0.0016 18.4 20.1 268 1-348 109-386 (397) 74 protein:vir:2344 Length: 397 # 21.3 2.6 0.0016 18.3 18.7 283 1-348 10-307 (397) 75 protein:vir:2504 Length: 305 # 20.7 2.7 0.0017 18.2 12.5 287 1-338 1-305 (305) 76 protein:vir:95763 Length: 297 20.6 2.7 0.0017 18.2 19.7 280 1-348 1-297 (297) 77 protein:vir:103955 Length: 324 20.1 2.8 0.0018 18.1 20.2 281 1-348 30-316 (324) No 1 >protein:vir:2736 Length: 348 # NCBI annotation: putative structural protein # Family: family:all:1083 # MgeID: mge:58 # MgeName: O1205 # Cross-refs: genbank:acc:NP_695109;genbank:gi:23455878;genbank:GeneID:955608 Probab=100.00 E-value=3.1e-97 Score=549.69 Aligned_cols=348 Identities=93% Similarity=1.313 Sum_probs=338.6 Q ss_pred CccchhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeec Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQM 80 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~ 80 (348) ||+|.|+|++++|++++++++.+..++|+++|||.+++++++++.+++.++.+++||++++++++++..|+++++.++++ T Consensus 1 M~~i~d~f~~~~l~~~v~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~ 80 (348) T protein:vir:27 1 MGLIYDKVTASNIAGYFNALQENVSSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEMHDEQM 80 (348) T ss_pred CcchhhhcCHHHHHHHHHhccchhhhhhHhhcCCCccccceeEEEEeeccCceeEeeeecCCCCcceecccceeeeeeec Confidence 99999999999999999999988888999999999999999999999999999999999999999999999999999999 Q ss_pred cccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeeccC Q lcl|Aclame:pro 81 PFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVK 160 (348) Q Consensus 81 p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~~ 160 (348) |+|++++.++|+|++.++.+++.++++.++++.+++++|+++|.++|++|+||||+|+|++||+.++++|..++||||++ T Consensus 81 p~i~~~~~i~~~d~~~~~~~~~~~~~~~~~~~~~~i~~d~~~l~~~i~~r~E~m~~~al~~Gki~i~~~~~~~~vdfg~~ 160 (348) T protein:vir:27 81 PFFKEAMLVKENDRQQLNLVKDSGNAVLVNTIVAGIFNDNLTLVNGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVK 160 (348) T ss_pred CccccccccCHHHHHHHHHhhccCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeEEecCCeeEEEeecCC Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred ccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHHh Q lcl|Aclame:pro 161 ADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVAD 240 (348) Q Consensus 161 ~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~ 240 (348) ++|+++++++|++++|||++||++|++.++++|.+|++++||+++|++|++|++|++++++++.+.+.+++++++.+++. T Consensus 161 ~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~ii~~~~~~~~l~~~~~v~~~~~~~~~~~~~i~~~~~~~~~~~ 240 (348) T protein:vir:27 161 PDHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAVMNAKTFGLIRKAASTVKVIKPLAGDGSAVTKAELENYIAD 240 (348) T ss_pred cccceeeeeccCCCCCCHHHHHHHHHHHHHhcCCcccEEEECHHHHHHHhcCHHHHHHhcccCccccccCHHHHHHHHHh Confidence 99999999999999999999999999999989999999999999999999999999999998888889999999999999 Q ss_pred hcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCCCce Q lcl|Aclame:pro 241 NYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVN 320 (348) Q Consensus 241 ~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~ 320 (348) ++|++|++||++|+|.+|+.+++||+|+++|+|++.+|.++||+++|+.++..+.....++...+.++++++|.+.||++ T Consensus 241 ~~g~~i~~yd~~y~d~~G~~~~~~p~~~vvl~~~~~~G~~~yG~~~e~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~ 320 (348) T protein:vir:27 241 NFGVSIVLENGTYRNDKGEVSKFYPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNAEVEIVDNGIAVTTTKTTDPVN 320 (348) T ss_pred hcCceEEEEeeEEEcCCCcCcccccCCeEEEEcCCcceeEEeccCcchhhhhhccccccceeeeCCeeEEEeeecCCCce Confidence 99999999999999999999999999999999999999999999999999988888888888889999999999999999 Q ss_pred eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 321 VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 321 ~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ++++++|+|||||.+||++++||||++| T Consensus 321 ~~~~~~s~~lPv~~~~~~~~~a~Vl~~~ 348 (348) T protein:vir:27 321 VQTKVSMVALPSFERLDDVYMLTVIPAV 348 (348) T ss_pred EEEEEeeeeeccccCCCcEEEEEEecCC Confidence 9999999999999999999999999999 No 2 >protein:vir:4902 Length: 348 # NCBI annotation: gp348 # Family: family:all:1083 # MgeID: mge:107 # MgeName: Sfi11 # Cross-refs: genbank:acc:NP_056680;genbank:gi:9635015;genbank:GeneID:1262657 Probab=100.00 E-value=4.7e-97 Score=548.68 Aligned_cols=348 Identities=94% Similarity=1.319 Sum_probs=338.5 Q ss_pred CccchhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeec Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQM 80 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~ 80 (348) ||+|.|+|++++|++++++++.+..+||+++|||.+++++++++.+++.++.+++||+++++++++++.|+++++.++++ T Consensus 1 M~~l~d~f~~~~l~~~v~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~ 80 (348) T protein:vir:49 1 MGLIYDKVTASNIAGYFNALQENVDSTLGESIFPARKQLGTKLSYITGASGQSVALKAAAFDTNVTVRDRVSAEMHDEQM 80 (348) T ss_pred CcchhhhcCHHHHHHHHHhccccchhhhHhhcCCCccccCceeEEEEeecCceeeeeeecCCCCcceecccceeeeeeec Confidence 99999999999999999999988889999999999999999999999999999999999999999999999999999999 Q ss_pred cccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeeccC Q lcl|Aclame:pro 81 PFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVK 160 (348) Q Consensus 81 p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~~ 160 (348) |+|++++.++|+|++.++.+.+.++++.++.+.+++++|+++|.++|++|+||||+|+|++||+.++++|++++||||++ T Consensus 81 p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~d~~~l~~~i~~r~E~m~~qal~~Gki~i~~~g~~~~vdyg~~ 160 (348) T protein:vir:49 81 PFFKEAMLVKENDRQQLNLVKDSGNAALVNTIVAGIFNDNLTLVNGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVK 160 (348) T ss_pred CccccccccCHHHHHHHHHHhccCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhCCeEEEecCCceEEEeecCC Confidence 99999999999999999999999999999999999999999999999999999999999999999999999999999999 Q ss_pred ccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHHh Q lcl|Aclame:pro 161 ADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVAD 240 (348) Q Consensus 161 ~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~ 240 (348) ++|+++++++|+++++||++||++|++.++++|.+|++++||+++|++|++|++|++++++.+.+.+.+++++++.+++. T Consensus 161 ~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~ii~~~~~~~~l~~~~~v~~~~~~~~~~~~~i~~~~~~~~~~~ 240 (348) T protein:vir:49 161 PDHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAVMNAKTFGLIRKAASTVKVIKPLAGDGSSVTKAELDNYIAD 240 (348) T ss_pred cccceeeeeccCCCCCCHHHHHHHHHHHHHhcCCcccEEEeCHHHHHHHhcCHHHHHHhhccCcccccccHHHHHHHHHh Confidence 99999999999999999999999999999999999999999999999999999999999998888889999999999999 Q ss_pred hcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCCCce Q lcl|Aclame:pro 241 NYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVN 320 (348) Q Consensus 241 ~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~ 320 (348) ++|++|++||++|+|++|+.+++||+|+++|+|++.+|.++||+++|+.++..+...+.++...+.++++++|.+.||++ T Consensus 241 ~~g~~i~~y~~~y~d~dG~~~~~~p~~~v~l~~~~~~G~~~yg~~~e~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~ 320 (348) T protein:vir:49 241 NFGVTVVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDNGIAVTTTKTTDPVN 320 (348) T ss_pred hcCceEEEEeeEEEecCCcEeeeecCCeEEEecCCCcceeEEecChhhhhhccccccccceeecCCeEEEeeeecCCCce Confidence 99999999999999999999999999999999999999999999999999888888888888889999999999999999 Q ss_pred eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 321 VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 321 ~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ++++++|+|||||.+||++++||||++| T Consensus 321 ~~~~~~s~~lPv~~~~~~~~~a~Vl~~~ 348 (348) T protein:vir:49 321 VQTKVSMVALPSFERLDDVYMLTVIPAV 348 (348) T ss_pred EEEEEeeeccccccCCCcEEEEEEecCC Confidence 9999999999999999999999999999 No 3 >protein:vir:96490 Length: 348 # NCBI annotation: head protein # Family: family:all:1083 # MgeID: mge:1620 # MgeName: 2972 # Cross-refs: genbank:acc:YP_238492;genbank:gi:66391768;genbank:GeneID:5176912 Probab=100.00 E-value=7.8e-97 Score=547.47 Aligned_cols=348 Identities=100% Similarity=1.365 Sum_probs=338.5 Q ss_pred CccchhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeec Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQM 80 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~ 80 (348) ||+|+|+|++++|++++++++.+..+||+++|||.+++++++++.+++.++.+++||++++++++++..|+++++.++++ T Consensus 1 M~~i~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~ 80 (348) T protein:vir:96 1 MGLIYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQM 80 (348) T ss_pred CcchhhccCHHHHHHHHHhcccchhhhhhhhcCCCccccceeEEEEeecCCceeEeeeecCCCCcceecccceeeeeeec Confidence 99999999999999999999988888999999999999999999999999999999999999999999999999999999 Q ss_pred cccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeeccC Q lcl|Aclame:pro 81 PFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVK 160 (348) Q Consensus 81 p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~~ 160 (348) |+|++++.++|+|++.++.++..++++.++++.+++++|+++|.++|++|+||||+|+|++|||.+.++|.+++||||++ T Consensus 81 p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~d~~~l~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vdfg~~ 160 (348) T protein:vir:96 81 PFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVK 160 (348) T ss_pred CccccccccCHHHHHHHHhhhccCCchHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeEeecCCeeEEEeccCC Confidence 99999999999999999999988888889999999999999999999999999999999999999999999999999999 Q ss_pred ccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHHh Q lcl|Aclame:pro 161 ADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVAD 240 (348) Q Consensus 161 ~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~ 240 (348) ++|+++++++|++++|||++||++|+++++++|.+|++++||+++|++|++|++|++++++.+.+.+.+++++++.+++. T Consensus 161 ~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~i~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~ 240 (348) T protein:vir:96 161 ADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVAD 240 (348) T ss_pred cccceeeccccCCCCCCHHHHHHHHHHHHHhcCCcccEEEeCHHHHHHHhcCHHHHHHHhccCCccccccHHHHHHHHhh Confidence 99999999999999999999999999999999999999999999999999999999999998888889999999999999 Q ss_pred hcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCCCce Q lcl|Aclame:pro 241 NYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVN 320 (348) Q Consensus 241 ~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~ 320 (348) ++|++|++|+++|+|++|+.+++||+|+++|+|++.+|.++||+++|+.++..+...+.++...+.|+++++|.+.||++ T Consensus 241 ~~g~~i~~y~~~y~d~~G~~~~~~p~~~v~l~~~~~~G~~~yg~~~e~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~ 320 (348) T protein:vir:96 241 NYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVN 320 (348) T ss_pred hcCceEEEEccEEEecCCcEeccccCCeEEEEcCCCceeEEeccChhhhhhhhcccccccceecCCeeEEEeeecCCCce Confidence 99999999999999999999999999999999999999999999999999988888888888889999999999999999 Q ss_pred eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 321 VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 321 ~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ++++++|+|||||.+||++++|||||+| T Consensus 321 ~~~~~~s~plPv~~~~~~~~~a~Vl~~~ 348 (348) T protein:vir:96 321 VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) T ss_pred EEEEEeeeeeccccCCCcEEEEEEecCC Confidence 9999999999999999999999999999 No 4 >protein:vir:98480 Length: 348 # NCBI annotation: ORFp38 # Family: family:all:1083 # MgeID: mge:1589 # MgeName: VWB # Cross-refs: genbank:acc:NP_958280;genbank:gi:41057254;uniprot:Q38595;genbank:GeneID:2732864 Probab=100.00 E-value=5.3e-81 Score=460.68 Aligned_cols=331 Identities=21% Similarity=0.300 Sum_probs=299.0 Q ss_pred Cccc--hhhcCHHHHHHHHHhhcc--chhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeee Q lcl|Aclame:pro 1 MGLI--YDKVTASNIAGYFNTLQE--NVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIH 76 (348) Q Consensus 1 Ma~l--~d~f~~~~l~~~i~~~~~--~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~ 76 (348) |+.+ +|+|++++|++++++.+. +.++|++++|||.+++.+.+++.+.+.++.+++|+++++++++++..|+++++. T Consensus 1 M~~~~~~d~~~~~~l~~~i~~~~~~~~~~~~l~~~~fp~~~~~~~~~~~~~~~~~~~~~a~~~~~~~~~~~~~r~g~~~~ 80 (348) T protein:vir:98 1 MSWTLDTEFIEPTQLTGLIREALRDLQVNRFRLARWLPNVDVDDITFEFLRGGGGLAETASYRSWDTESKIGRREGLAKV 80 (348) T ss_pred CcchhhhhccCHHHHHHHHHHHhhccCcchhhHHhcCCCccccceEEEEEeccCCceeeeeeecCCCccceeecccceee Confidence 9975 589999999999998863 446799999999999999999999999999999999999999999999999999 Q ss_pred EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEe Q lcl|Aclame:pro 77 DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDID 156 (348) Q Consensus 77 ~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vD 156 (348) ++++|+|++++.++|+|+++++.. ..+++.+.+++++++|.++|++|+||||+|+|++||+++++++ ++|| T Consensus 81 ~~~~~~i~~~~~i~~~d~~~~~~~-------~~~~~~~~i~~d~~~l~~~i~~r~E~m~~qal~~Gki~~~g~~--~~vD 151 (348) T protein:vir:98 81 MGELPPISEKIPLNEYDRLRLRKL-------SRDEALPFIARDAQRLARNIGARFEVARGSALVNATVPVTELQ--QTVD 151 (348) T ss_pred eeeccccccccccCHHHHHHhcCC-------hHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhCCeEEEecCc--eEEc Confidence 999999999999999999877533 2356778999999999999999999999999999999997766 5799 Q ss_pred eccCccceeeeeecCC-CCCccHHHHHHHHHHHHHh-cCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCC--cccccHH Q lcl|Aclame:pro 157 YGVKADHKKQVSKSWA-EPGATPLADLEDAIETARE-LGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGD--GSSVTKA 232 (348) Q Consensus 157 fg~~~~~~~t~~~~W~-~~~adp~~di~~~~~~~~~-~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~--~~~~~~~ 232 (348) ||++++|++++++.|+ +++|||++||++|++.+++ .|.+|++++||+++|++|++|+++++++++.+.+ .+.++++ T Consensus 152 yg~~~~~~~t~~~~Ws~~~~adp~~di~~~~~~~~~~~G~~p~~~vm~~~~~~~l~~~~~i~~~~~~~~~~~~~~~~~~~ 231 (348) T protein:vir:98 152 FGRIGSHSVVAAVLWSVHATATPISDLESWVATYEDTNGQSPGVILMPKAAVSHMRQCEEVIRQVFPLAPSGTAPMVSVE 231 (348) T ss_pred cccCcccccccccccCCCCCCCHHHHHHHHHHHHHHccCCcceEEEeCHHHHHHHhcCHHHHHHHhccCccccccccCHH Confidence 9999999999999997 4789999999999999876 5899999999999999999999999999877543 4678999 Q ss_pred HHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCC---------ccceeEeccchhhhccccccccccceee Q lcl|Aclame:pro 233 ELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNG---------PLGNTVFGTTPEESDLFADNTVNADVEI 303 (348) Q Consensus 233 ~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~---------~~G~~~yg~~~~~~~~~~~~~~~~~~~~ 303 (348) +++.+++.+|++.|++||.+|.+ +|+.+++||+|+++|+|.+ .+|+++||+++|+.++..+.. .. T Consensus 232 ~~~~~~~~~g~~~i~~~d~~~~~-~g~~~~~~p~~~i~l~p~~~~~~~~~~~~~G~t~~G~~~e~~~~~~~~~-----~~ 305 (348) T protein:vir:98 232 QLNTVLSSMGLPPIEVYDAKVAV-DGVSTRITPANAIALLPEPGATDAAQPTELGATLLGTTAESLEDDYALA-----PG 305 (348) T ss_pred HHHHHHHhhCCeEEEEeeeEEEc-CCceeceecCCeEEEEecCCcccccccccccceecccchhhhccccccc-----ee Confidence 99999999999999999999876 6889999999999999864 379999999999887654322 23 Q ss_pred cCCceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEec Q lcl|Aclame:pro 304 VDSGIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIP 346 (348) Q Consensus 304 ~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~ 346 (348) ...|+++++|.+.||++++++++|+|||||.+||++++||||| T Consensus 306 ~~~~i~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~a~Vl~ 348 (348) T protein:vir:98 306 EQPGIVAATWKTKDPVRLWTHAAAVGIPVLREPNLTFKAQVLA 348 (348) T ss_pred ccCceeeeeeeecCCcEEEEEEeeeeeccccCCCcEEEEEEeC Confidence 4678999999999999999999999999999999999999999 No 5 >protein:vir:106590 Length: 349 # NCBI annotation: putative major head protein # Family: family:all:1083 # MgeID: mge:1598 # MgeName: Lj965 # Cross-refs: genbank:acc:NP_958585;genbank:gi:41179245;genbank:GeneID:2717126 Probab=100.00 E-value=7.1e-80 Score=454.50 Aligned_cols=330 Identities=27% Similarity=0.431 Sum_probs=293.5 Q ss_pred Ccc-------------chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcce Q lcl|Aclame:pro 1 MGL-------------IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTI 67 (348) Q Consensus 1 Ma~-------------l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~ 67 (348) |+| +.|+|++..|+++++++|. ++||+++|||.+++++++++.+++.++.+++|+++++++++++ T Consensus 1 ~~~~~~~~~~~~~~~~~~d~~~~~~l~~~~~~~~~--~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~ 78 (349) T protein:vir:10 1 MKNQKLQLDLQRFATPILDMFSQNTVLDYTRNRQY--PEMLGDTLFPAVKVPTLEVDILKAGSRVPTIASVSAFDAEAEI 78 (349) T ss_pred CCcchhhHHHHHHHHHhhcccCHHHHHHHHHhcCc--chhhHhhcCCccccccceeEEEeeccCcceeeeeecCCCCcce Confidence 443 3578999999999999874 4799999999999999999999999999999999999999999 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) ++|.+ ++.++++|++++++.++|.|+++++.. ++++..+.+.+.+++++.+|.++|++|+||||+|+|++||++++ T Consensus 79 ~~r~~-~~~~~~~p~ik~~~~i~e~dl~~~~~~---~~~~~~~~~~~~i~~d~~~l~~~i~~r~E~m~~q~l~~Gki~~~ 154 (349) T protein:vir:10 79 GTREA-SKMTAELAYVKRKMQITEEMLIKLQSP---RNTAEENYLKQYVFDDIDAMVQAVKARGEKMTMEMFATGKITDK 154 (349) T ss_pred ecccc-eeEEeeccccccccccCHHHHHHHhhc---cCcchHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhCCeeEEc Confidence 98876 577899999999999999998776644 45566678889999999999999999999999999999999998 Q ss_pred CCceeEEEeeccCccceeeee--ecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCC Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVS--KSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGD 225 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~--~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~ 225 (348) ++| ++||||++++|+++++ .+|++++|||++||++|++.+ |.+|++++||+++|++|++|++|+++++++. . T Consensus 155 ~~g--~~vD~g~~~~~~~~lt~~~~Ws~~~adpi~Di~~~~~~~---g~~p~~~vm~~~~~~~l~~~~~i~~~~~~~~-~ 228 (349) T protein:vir:10 155 KNG--IAIDYGVPKKHQETLSGTKTWDKSDASIIDNLQDWSDSL---DVTPTRALTSKKVLRILMRSTEIKEAIFGKD-T 228 (349) T ss_pred CCc--EEEecccCccceeEecCcccCCCCCCCHHHHHHHHHHHh---CCCccEEEeCHHHHHHHhcCHHHHHHhcccc-c Confidence 877 5799999999987664 579999999999999998654 8899999999999999999999999998764 4 Q ss_pred cccccHHHHHHHHHhhcCceEEEEeeEEEcCCC----cccccccCCeEEEEeCCccceeEeccchhhhccccccccccce Q lcl|Aclame:pro 226 GSSVTKAELQNYVADNYGVEIVLENGTYRNEKG----EVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADV 301 (348) Q Consensus 226 ~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g----~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~ 301 (348) ...++.++++.+++.++|++|++||++|+|.+| +++++||+|.|+|+|++.+|.++||+++++.++..|.. .. T Consensus 229 ~~~~~~~~~~~~l~~~~~~~i~~yd~~y~d~~~~~~~t~~~~~p~~~v~l~~~~~~G~~~yG~~~e~~~~~~g~~---~~ 305 (349) T protein:vir:10 229 GRVVGQADLDQWMTAQGLPIIRAYDGKYRDEDSRGNLTTNSYFPEDRIVLFNDEVPGQKIYGPTPEENRLISSNA---QV 305 (349) T ss_pred ccccCHHHHHHHHHhcCCceEEEEeeEEEeecCCCceeecccccCCeEEEecCCCceeEEeeccchhhhhccccc---ce Confidence 456788999999999999999999999998766 67899999999999999999999999999888776543 33 Q ss_pred eecCCceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEe Q lcl|Aclame:pro 302 EIVDSGIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVI 345 (348) Q Consensus 302 ~~~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~ 345 (348) ...+.+++++.|.+.||++++++++|+|||+|.+||++++|||| T Consensus 306 ~~~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~a~Vl 349 (349) T protein:vir:10 306 SNVGNIMAKIYETSEDPIGTWILASATMLPSFASADDVFQAKVL 349 (349) T ss_pred eeccceEEEeeeecCCCceEEEEEeeeeeeeecCCCcEEEEEeC Confidence 34556677777789999999999999999999999999999999 No 6 >protein:vir:3424 Length: 341 # NCBI annotation: capsid component # Family: family:all:1021 # MgeID: mge:70 # MgeName: lambda # Cross-refs: genbank:acc:NP_040587;genbank:gi:9626251;genbank:GeneID:2703482 Probab=100.00 E-value=2.6e-74 Score=423.99 Aligned_cols=331 Identities=13% Similarity=0.102 Sum_probs=284.3 Q ss_pred hhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeeccccc Q lcl|Aclame:pro 5 YDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQMPFFK 84 (348) Q Consensus 5 ~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~p~i~ 84 (348) .|+|++++|+++++++|. ..++|+++|||.+.+..++.+.++..++...+||+|++++++....|+++++.++++|+|+ T Consensus 1 ~d~f~~~~L~~~i~~~~~-~~~~l~d~~fp~~~~~~t~~v~~~~~~~~~~lap~v~~~~~~~~~~~~~~~~~~~~~p~i~ 79 (341) T protein:vir:34 1 MSMYTTAQLLAANEQKFK-FDPLFLRLFFRESYPFTTEKVYLSQIPGLVNMALYVSPIVSGEVIRSRGGSTSEFTPGYVK 79 (341) T ss_pred CCCcCHHHHHHHHHhccC-ccchhHHhcCCcccccccceEEEEEeeCCeeEEEeecCCCCcceeccCceeeeEEecCccC Confidence 799999999999999985 5689999999999888888777888888999999999999999999999999999999999 Q ss_pred cccccCHHHHHHHHhhcCc-CCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce-eEEEeeccCcc Q lcl|Aclame:pro 85 EALLVKENDRQQLNLVKDT-GNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV-NKDIDYGVKAD 162 (348) Q Consensus 85 ~~~~i~~~d~~~l~~~~~~-~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~-~~~vDfg~~~~ 162 (348) +++.++++|+++++..... +.....+++.+.+++++.++.++|++|+||||+|+|++|||.+.++|+ .++||||++++ T Consensus 80 ~~~~i~~~d~~~r~~g~~~~~~~~~~~~~~~~i~~~l~~l~~~i~~~~E~m~~qaL~~Gki~~~~~g~~~~~vDfg~~~~ 159 (341) T protein:vir:34 80 PKHEVNPQMTLRRLPDEDPQNLADPAYRRRRIIMQNMRDEELAIAQVEEMQAVSAVLKGKYTMTGEAFDPVEVDMGRSEE 159 (341) T ss_pred ccceeCHHHHHHHhhccccccCcCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCcEEEecCCccEEEEEeCCCCc Confidence 9999999998865543332 233456778889999999999999999999999999999999988776 48999999999 Q ss_pred ceeeee--ecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccccc-----HHHHH Q lcl|Aclame:pro 163 HKKQVS--KSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVT-----KAELQ 235 (348) Q Consensus 163 ~~~t~~--~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~-----~~~~~ 235 (348) |+++++ ++|+++++++.++|++|.+.+++.|.+|++++||+++|++|++|++|+++++++..+.+.+. ..+.. T Consensus 160 ~~~~~t~~~~W~~~~~~~~d~l~di~~~~~~~g~~~~~~i~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~ 239 (341) T protein:vir:34 160 NNITQSGGTEWSKRDKSTYDPTDDIEAYALNASGVVNIIVFDPKGWALFRSFKAVKEKLDTRRGSNSELETAVKDLGKAV 239 (341) T ss_pred cceEecCCccCCcCCCchHHHHHHHHHHHHhcCCceEEEEeCHHHHHHHhcCHHHHHHHhhcccccccccccccccccce Confidence 998765 57999876555555555555677899999999999999999999999999987766555443 33455 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEee- Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTK- 314 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~- 314 (348) .+++.++|++|++||++|+| +|+.+++||+|+++|+|.+.+|.++||++++.+....+. ....++++.|. T Consensus 240 ~~~~~~~g~~i~~y~~~y~d-dG~~~~~ip~~~v~l~p~g~~g~~~yg~~~d~~~~~~~~--------~~~~~~~~~~~~ 310 (341) T protein:vir:34 240 SYKGMYGDVAIVVYSGQYVE-NGVKKNFLPDNTMVLGNTQARGLRTYGCIQDADAQREGI--------NASARYPKNWVT 310 (341) T ss_pred eeeeecCCceEEEEcCEEEE-CCcEEeeecCCeEEEeeCCCcceEEEeecccccccccce--------eeeeEeeeeeee Confidence 67778899999999999997 799999999999999999999999999998766544331 12346788885 Q ss_pred cCCCceeEEeeeeeeeeeecCCCcEEEEEEe Q lcl|Aclame:pro 315 TTDPVNVQTKVSMVALPSFERLGDVYMLTVI 345 (348) Q Consensus 315 ~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~ 345 (348) +.||++++++++|+|||++.+||++++|||= T Consensus 311 ~~dp~~~~~~~~s~pLPv~~~pd~~~~a~V~ 341 (341) T protein:vir:34 311 TGDPAREFTMIQSAPLMLLADPDEFVSVQLA 341 (341) T ss_pred cCCCcEEEEEEcccceeeeeCCCcEEEEEeC Confidence 4589999999999999999999999999998 No 7 >protein:vir:393 Length: 341 # NCBI annotation: gp8 # Family: family:all:1021 # MgeID: mge:325 # MgeName: N15 # Cross-refs: genbank:acc:NP_046903;genbank:gi:9630472;genbank:GeneID:1261647 Probab=100.00 E-value=4.7e-73 Score=417.12 Aligned_cols=328 Identities=13% Similarity=0.095 Sum_probs=281.0 Q ss_pred hhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeeccccc Q lcl|Aclame:pro 5 YDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQMPFFK 84 (348) Q Consensus 5 ~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~p~i~ 84 (348) .|+|++++|+++++++|.+ .++|+++|||++++.+++.+.++..++...+||+|++++++++.+|+++++.++++|+|+ T Consensus 1 ~d~f~~~~L~~~i~~~~~~-~~~l~~~~Fp~~~~~~t~~v~~~~~~~~~~lap~v~~~~~~~~~~~~~~~~~~~~~p~i~ 79 (341) T protein:vir:39 1 MSVYTTAQLLAVNEKKFKF-DPLFLRIFFRETYPFSTEKVYLSQIPGLVNMALYVSPIVSGKVIRSRGGSTSEFTPGYVK 79 (341) T ss_pred CCccCHHHHHHHHHhhcCc-cchhHhhcCCcccccCcceEEEEEecCCceeeEEecCCCCcceecccceeeeeEeccccC Confidence 7999999999999999864 589999999999998888777888888899999999999999999999999999999999 Q ss_pred cccccCHHHHHHHHhhcCc-CCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce-eEEEeeccCcc Q lcl|Aclame:pro 85 EALLVKENDRQQLNLVKDT-GNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV-NKDIDYGVKAD 162 (348) Q Consensus 85 ~~~~i~~~d~~~l~~~~~~-~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~-~~~vDfg~~~~ 162 (348) +++.++++|+++++..... +.....++..+.++++++++.++|++|+||||+|+|++|||.++++|+ .++||||++++ T Consensus 80 ~~~~i~~~d~~~r~~g~~~~~~~~~~~~~~~~i~~~~~~l~~~i~~r~E~m~~qaL~~Gki~i~~~g~~~~~vDfg~~~~ 159 (341) T protein:vir:39 80 PKHEVNPLMTLRRLPDEDPQNLADPVYRRRRIILQNMKDEELAIAQVEEKQAVAAVLSGKYTMTGEAFEPVEVDMGRSAG 159 (341) T ss_pred cccccCHHHHHHHhhcccccccCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCceEEEcCCCcEEEEeccCCcc Confidence 9999999998765443221 233445667788999999999999999999999999999999988777 58999999999 Q ss_pred ceeeee--ecCCCCCc---cHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccccc-----HH Q lcl|Aclame:pro 163 HKKQVS--KSWAEPGA---TPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVT-----KA 232 (348) Q Consensus 163 ~~~t~~--~~W~~~~a---dp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~-----~~ 232 (348) |+++++ ..|+++++ ||++||++| +++.|.+|++++||+++|++|++|++|++++++...+.+.+. .. T Consensus 160 ~~~~lt~~~~W~~~~~~~~d~l~di~~~---~~~~g~~~~~ii~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~ 236 (341) T protein:vir:39 160 NNIVQAGAAAWSSRDKETYDPTDDIEAY---ALNASGVVNIIVFDPKGWALFRSFKAVKEKLDTRRGSNSELETALKDLG 236 (341) T ss_pred ceeEecCCccCCCCCCchHHHHHHHHHH---HHhcCCceEEEEeChHHHHHHhcCHHHHHHHhhcccccccccchhhhhh Confidence 997765 57999875 566666655 456788999999999999999999999999987665555443 23 Q ss_pred HHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEE Q lcl|Aclame:pro 233 ELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTT 312 (348) Q Consensus 233 ~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 312 (348) +...+++.++|++|++||++|+| +|+.+++||+|.++|+|.+.+|.++||++.+.+....+. ....++++. T Consensus 237 ~~~~~~~~~~g~~i~~y~~~y~d-~g~~~~~ip~~~~~l~p~~~~g~~~yg~~~d~~~~~~~~--------~~~~~~~~~ 307 (341) T protein:vir:39 237 KAVSYKGMYGDVAIVVYSGQYIE-NDVKKNYLPDLTMVLGNTQARGLRTYGCILDADAQREGI--------NASTRYPKN 307 (341) T ss_pred hHhhhhhhhcCceEEEEccEEEe-cCcEEeeecCCeEEEeeCCCcceEEEecccchhhcccce--------eeeeeeeee Confidence 45577888899999999999997 789999999999999999999999999998765543331 123468899 Q ss_pred eec-CCCceeEEeeeeeeeeeecCCCcEEEEEEe Q lcl|Aclame:pro 313 TKT-TDPVNVQTKVSMVALPSFERLGDVYMLTVI 345 (348) Q Consensus 313 ~~~-~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~ 345 (348) |.+ .||++++++++|+|||+|.+||++++|||= T Consensus 308 ~~~~~dp~~~~~~~~s~plPv~~~p~~~~~a~V~ 341 (341) T protein:vir:39 308 WVQTGDPAREFTMIQSAPLMLLADPDEFVSVKLA 341 (341) T ss_pred eeecCCCcEEEEEEeccccceeeCCCcEEEEEeC Confidence 965 599999999999999999999999999998 No 8 >protein:vir:6378 Length: 346 # NCBI annotation: capsid protein E # Family: family:all:1021 # MgeID: mge:133 # MgeName: BcepNazgul # Cross-refs: genbank:acc:NP_918991;genbank:gi:34610166;genbank:GeneID:2559600 Probab=100.00 E-value=2.6e-72 Score=413.01 Aligned_cols=328 Identities=13% Similarity=0.145 Sum_probs=285.0 Q ss_pred hhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeeccccc Q lcl|Aclame:pro 5 YDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQMPFFK 84 (348) Q Consensus 5 ~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~p~i~ 84 (348) .|+|++.+|+++++++|. .++|+++|||++.+..++.+.++..++...+||++++++++....++++++.+|++|+|+ T Consensus 1 ~d~f~~~~l~~~i~~~p~--~~~l~~~~fp~~~~~~t~~i~i~~~~g~~~la~~v~~~~~~~~~~~~g~~~~~~~~p~i~ 78 (346) T protein:vir:63 1 MEIFDTLTLAGVIQSGPA--LSMYWQGFYPNEITFDTDEILFDLVFKDKKLAPFVAPNVQGRVIAARGYTTKTFRPAYVK 78 (346) T ss_pred CCccCHHHHHHHHHhcCC--ccchhhhcCccccccccceEEEEEecCceeeeeeecCCCCcceecccceeeeEeecCccC Confidence 799999999999999873 578999999998888877777788888899999999999999999999999999999999 Q ss_pred cccccCHHHHHHHHhhcC--cCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce-eEEEeeccCc Q lcl|Aclame:pro 85 EALLVKENDRQQLNLVKD--TGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV-NKDIDYGVKA 161 (348) Q Consensus 85 ~~~~i~~~d~~~l~~~~~--~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~-~~~vDfg~~~ 161 (348) +++.++++|+++++.... .++...++++.+.+++++.+|.++|++|+||||+|+|++|++++++++. .+.||||+++ T Consensus 79 ~~~~i~~~d~~~~~~~~~~~~~~~~~~~~~~~~i~~~~~~l~~~i~~~~E~m~~~al~~gki~~~g~~~~~~~vdfg~~~ 158 (346) T protein:vir:63 79 PKDVINPNRTLKRRAGEQPIIGGMSLQERFQAVVADSQLEQRQRIENRIEWMCAMATIYGYVDVVGEAFPMQRVDFGRDP 158 (346) T ss_pred ccceeCHHHHHHHhhhhhhccCCcCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCCEEEeeCCceeEEEEeeCCCc Confidence 999999999987664332 3556677788889999999999999999999999999999999988876 5889999999 Q ss_pred cceeeee--ecCCCCCccHHHHHHHHHHHHHh-cCCeeEEEEeCHHHHHHHhcCHHHHHHhcccC-CCcccccHHHH--- Q lcl|Aclame:pro 162 DHKKQVS--KSWAEPGATPLADLEDAIETARE-LGLNPERAIMNAKTFGLIRKAASTVKAIKPLA-GDGSSVTKAEL--- 234 (348) Q Consensus 162 ~~~~t~~--~~W~~~~adp~~di~~~~~~~~~-~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~-~~~~~~~~~~~--- 234 (348) +|+++++ ..|+++++||++||++|++.+++ .|..|++++||+++|++|++|++|+++++..+ ...+.+.++.+ T Consensus 159 ~~~~~lt~~~~W~~~~adp~~di~~~~~~~~~~~g~~~~~~i~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~l~~~ 238 (346) T protein:vir:63 159 ALTVQLTGGAAWDQATSDPLGNIQTMRTTAWKKSNSTITRLTMGLDAWSLFSQKPAVVELLNLFYKGSTSDFNRSRLDDG 238 (346) T ss_pred cceeeecccccCCCCCCCHHHHHHHHHHHHHHccCCceEEEEECHHHHHHHhcCHHHHHHHhhhccccccccchhhcccc Confidence 9998754 57999999999999999999976 58899999999999999999999999997543 23333333222 Q ss_pred --H------HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCC Q lcl|Aclame:pro 235 --Q------NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDS 306 (348) Q Consensus 235 --~------~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~ 306 (348) . ..+...+|++|++|+++|+|.+|+.+++||+|+++|+|.+.+|.++||++++.... ..+. T Consensus 239 ~~~~~~~~~~~~~~~~gi~i~~y~~~y~d~~G~~~~~ip~~~v~~~p~~~~g~~~yg~~~d~~~~-----------~~~~ 307 (346) T protein:vir:63 239 SPVQYQGTIGGYNGMGTLELYTYHDTYTGDDNTEQEILGSYDVVGTGPGLQGTQCFGAIMDFKNG-----------LVPT 307 (346) T ss_pred hhhhhhhhHhhhhccCCeEEEEeccEEEcCCCceeccccCCeEEEEecCCcceEEEeeccccccC-----------cccc Confidence 1 11234578999999999999999999999999999999999999999999765431 2234 Q ss_pred ceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEe Q lcl|Aclame:pro 307 GIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVI 345 (348) Q Consensus 307 ~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~ 345 (348) .++++.|.+.||.+++++++|+|||+|.+||+++++||= T Consensus 308 ~~~~~~~~~~dp~~~~~~~~s~plPv~~~p~~~~~~~V~ 346 (346) T protein:vir:63 308 RMFPKMWEEEDPSVAMLMTQSAPLMVPAQPNASFRMTVK 346 (346) T ss_pred eeeeEEEEecCCCEEEEEEeeeccceecCCCcEEEEEeC Confidence 578999999999999999999999999999999999999 No 9 >protein:vir:79503 Length: 409 # NCBI annotation: major head protein # Family: family:all:11999 # MgeID: mge:1870 # MgeName: P74-26 # Cross-refs: genbank:acc:YP_001468058;genbank:gi:157265500;genbank:GeneID:5600620 Probab=100.00 E-value=2.3e-65 Score=374.94 Aligned_cols=337 Identities=18% Similarity=0.244 Sum_probs=258.0 Q ss_pred Cccchh-----------hcC-HHHHHHHHHhhccchhhhHHHHhCCCccccceeEEE----EEeecCceeeeeeeeCCCC Q lcl|Aclame:pro 1 MGLIYD-----------KVT-ASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSY----IKGASGQSVALKAAAFDTN 64 (348) Q Consensus 1 Ma~l~d-----------~f~-~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~----~~~~~~~~~~a~~v~~~~~ 64 (348) +|-++| .++ ...|+.+++.+|. .++|.++|||+.+++.++.+. ..+.++.+..+.++.++++ T Consensus 11 ~~~~~~~~~~~~~~~~~~~~~~~~ia~~~~~~p~--~~~L~d~~FP~~~~f~t~l~~~~~~~kg~kk~~~~~~~~~~d~~ 88 (409) T protein:vir:79 11 LARVRDPLSIGGLKFPTTKEIQEAVAAIADKFNQ--ENDLVDRFFPEDSTFASELELYLLRTQDAEQTGMTFVHQVGSTS 88 (409) T ss_pred hhhhcCcchhcceecCchHHHHHHHHHHHHhcCC--ccchhhccCCCCccccceEEEEeeeccCcccccceEeeecCCcc Confidence 111111 111 1344666666653 468999999999988876554 3455677888888999999 Q ss_pred cceecccc---eeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhc Q lcl|Aclame:pro 65 VTIRDRVS---AEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLAT 141 (348) Q Consensus 65 ~~~~~r~~---~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~ 141 (348) .++..|.+ +++.+++||+||+++.++|+|++.++. .++++..+.+.+++++|+++|.++|++|+||||+|+|++ T Consensus 89 ~pv~~r~~~~~~~~~t~epp~iK~k~~i~e~dl~~~~~---~~n~~~~~~i~~~i~~D~~~L~~~I~~R~E~Ma~q~L~t 165 (409) T protein:vir:79 89 LPVEARVAKVDLAKATWSPLAFKESRVWDEKEILYLGR---LADEVQAGVINEQIAESLTWLMARMRNRRRWLTWQVMRT 165 (409) T ss_pred ccccccceeeeeeeecccccccccccccCHHHHHHHhC---CCChhHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhC Confidence 99887764 578889999999999999999876653 456667778889999999999999999999999999999 Q ss_pred CeeeecCC------ceeEEEeeccCccceeeee--ecCCCCCccHHHHHHHHHHHHHhcC-C--eeEEEEeCHHHHHHHh Q lcl|Aclame:pro 142 GKIAFTSD------GVNKDIDYGVKADHKKQVS--KSWAEPGATPLADLEDAIETARELG-L--NPERAIMNAKTFGLIR 210 (348) Q Consensus 142 Gki~~~~~------~~~~~vDfg~~~~~~~t~~--~~W~~~~adp~~di~~~~~~~~~~G-~--~~~~~~~~~~~~~~l~ 210 (348) |||.+.++ |..++||||+|++|+++++ ..|++++|||++||++|++.+++.| . ++.+++|++++|+.++ T Consensus 166 Gki~i~g~~~~~~~g~~~~vDyg~pa~hkvtlTgt~~W~~~~AdPi~DIe~w~~~i~~~~g~~~t~~~~imt~~~~~~l~ 245 (409) T protein:vir:79 166 GRITIQPNDPYNPNGLKYVIDYGVTDIELPLPQKFDAKDGNGNSAVDPIQYFRDLIKAATYFPDRRPVAIIVGPGFDEVL 245 (409) T ss_pred CeEEEEecCCCccccceEEEecCCCcccceeecccccCCCCCCChHHHHHHHHHHHHHhcCCCCCccEEEEcHHHHHHHH Confidence 99998554 4468999999999998765 4899999999999999999997754 3 4567999999997755 Q ss_pred -cCHHHHHHhcccCCCccc----ccHHHH-----HHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEe--CCccc Q lcl|Aclame:pro 211 -KAASTVKAIKPLAGDGSS----VTKAEL-----QNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIP--NGPLG 278 (348) Q Consensus 211 -~~~~v~~~~~~~~~~~~~----~~~~~~-----~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p--~~~~G 278 (348) +|+.++++++.+++..+. +++..+ ..++....|++|++||++|+|+||+.+++||+|.++|++ .+.+| T Consensus 246 ~~n~~ik~~l~~~~~~~~~~~~~~~~~~l~~~~~ln~~~~~~GL~I~vYd~~Y~dedGt~k~~~Pd~~vvLl~ap~g~LG 325 (409) T protein:vir:79 246 ADNTFVQKYVEYEKGWVVGQNTVQPPREVYRQAALDIFKRYTGLEVMVYDKTYRDQDGSVKYWIPVGELIVLNQSTGPVG 325 (409) T ss_pred hCcHHHHHhhhcccccccccccccchhhhcchhHhHhhhhhcCceEEEEeeEEEecCCcccceecCCeEEEEcCCccccc Confidence 667788888876554432 222222 134555667999999999999999999999999999884 56799 Q ss_pred eeEeccchhhhccccccccccceeecCCceEEEEeecCCCceeEEeeeeeeeeeecCCC--cEEEEE---------E--- Q lcl|Aclame:pro 279 NTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVNVQTKVSMVALPSFERLG--DVYMLT---------V--- 344 (348) Q Consensus 279 ~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~--~~~~~~---------V--- 344 (348) +++||++.+...+.. .+...+.++.++.|.+.||..+|+.+++..|||+..+| .++... | T Consensus 326 ~T~yGa~~~~~~~~~------~v~~~g~~i~~~~~~~~dP~~~~~~~~~~~~p~l~~~~~~~~~~~~~~~~~~~~~~~~~ 399 (409) T protein:vir:79 326 RFVYTAHVAGQRNGK------VVYATGPYLTVKDHLQDDPPYYAIIAGFHGLPQLSGYNTEDFSFHRFKWLKYANNVQSY 399 (409) T ss_pred ceecccccccccchh------hhccccceeEecccccCCcceeeeecceEEeeeeecCCccceeehhhhhhhhhcchhhh Confidence 999999765443221 12234677889999999999999999999999999554 443321 1 Q ss_pred ecCC Q lcl|Aclame:pro 345 IPGV 348 (348) Q Consensus 345 ~~~~ 348 (348) ||+. T Consensus 400 ~~~~ 403 (409) T protein:vir:79 400 LPPF 403 (409) T ss_pred cCCC Confidence 1111 No 10 >protein:vir:78006 Length: 409 # NCBI annotation: major head protein # Family: family:all:11999 # MgeID: mge:1843 # MgeName: P23-45 # Cross-refs: genbank:acc:YP_001467942;genbank:gi:157265383;genbank:GeneID:5600496 Probab=100.00 E-value=2.3e-65 Score=374.94 Aligned_cols=337 Identities=18% Similarity=0.244 Sum_probs=258.0 Q ss_pred Cccchh-----------hcC-HHHHHHHHHhhccchhhhHHHHhCCCccccceeEEE----EEeecCceeeeeeeeCCCC Q lcl|Aclame:pro 1 MGLIYD-----------KVT-ASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSY----IKGASGQSVALKAAAFDTN 64 (348) Q Consensus 1 Ma~l~d-----------~f~-~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~----~~~~~~~~~~a~~v~~~~~ 64 (348) +|-++| .++ ...|+.+++.+|. .++|.++|||+.+++.++.+. ..+.++.+..+.++.++++ T Consensus 11 ~~~~~~~~~~~~~~~~~~~~~~~~ia~~~~~~p~--~~~L~d~~FP~~~~f~t~l~~~~~~~kg~kk~~~~~~~~~~d~~ 88 (409) T protein:vir:78 11 LARVRDPLSIGGLKFPTTKEIQEAVAAIADKFNQ--ENDLVDRFFPEDSTFASELELYLLRTQDAEQTGMTFVHQVGSTS 88 (409) T ss_pred hhhhcCcchhcceecCchHHHHHHHHHHHHhcCC--ccchhhccCCCCccccceEEEEeeeccCcccccceEeeecCCcc Confidence 111111 111 1344666666653 468999999999988876554 3455677888888999999 Q ss_pred cceecccc---eeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhc Q lcl|Aclame:pro 65 VTIRDRVS---AEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLAT 141 (348) Q Consensus 65 ~~~~~r~~---~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~ 141 (348) .++..|.+ +++.+++||+||+++.++|+|++.++. .++++..+.+.+++++|+++|.++|++|+||||+|+|++ T Consensus 89 ~pv~~r~~~~~~~~~t~epp~iK~k~~i~e~dl~~~~~---~~n~~~~~~i~~~i~~D~~~L~~~I~~R~E~Ma~q~L~t 165 (409) T protein:vir:78 89 LPVEARVAKVDLAKATWSPLAFKESRVWDEKEILYLGR---LADEVQAGVINEQIAESLTWLMARMRNRRRWLTWQVMRT 165 (409) T ss_pred ccccccceeeeeeeecccccccccccccCHHHHHHHhC---CCChhHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhC Confidence 99887764 578889999999999999999876653 456667778889999999999999999999999999999 Q ss_pred CeeeecCC------ceeEEEeeccCccceeeee--ecCCCCCccHHHHHHHHHHHHHhcC-C--eeEEEEeCHHHHHHHh Q lcl|Aclame:pro 142 GKIAFTSD------GVNKDIDYGVKADHKKQVS--KSWAEPGATPLADLEDAIETARELG-L--NPERAIMNAKTFGLIR 210 (348) Q Consensus 142 Gki~~~~~------~~~~~vDfg~~~~~~~t~~--~~W~~~~adp~~di~~~~~~~~~~G-~--~~~~~~~~~~~~~~l~ 210 (348) |||.+.++ |..++||||+|++|+++++ ..|++++|||++||++|++.+++.| . ++.+++|++++|+.++ T Consensus 166 Gki~i~g~~~~~~~g~~~~vDyg~pa~hkvtlTgt~~W~~~~AdPi~DIe~w~~~i~~~~g~~~t~~~~imt~~~~~~l~ 245 (409) T protein:vir:78 166 GRITIQPNDPYNPNGLKYVIDYGVTDIELPLPQKFDAKDGNGNSAVDPIQYFRDLIKAATYFPDRRPVAIIVGPGFDEVL 245 (409) T ss_pred CeEEEEecCCCccccceEEEecCCCcccceeecccccCCCCCCChHHHHHHHHHHHHHhcCCCCCccEEEEcHHHHHHHH Confidence 99998554 4468999999999998765 4899999999999999999997754 3 4567999999997755 Q ss_pred -cCHHHHHHhcccCCCccc----ccHHHH-----HHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEe--CCccc Q lcl|Aclame:pro 211 -KAASTVKAIKPLAGDGSS----VTKAEL-----QNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIP--NGPLG 278 (348) Q Consensus 211 -~~~~v~~~~~~~~~~~~~----~~~~~~-----~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p--~~~~G 278 (348) +|+.++++++.+++..+. +++..+ ..++....|++|++||++|+|+||+.+++||+|.++|++ .+.+| T Consensus 246 ~~n~~ik~~l~~~~~~~~~~~~~~~~~~l~~~~~ln~~~~~~GL~I~vYd~~Y~dedGt~k~~~Pd~~vvLl~ap~g~LG 325 (409) T protein:vir:78 246 ADNTFVQKYVEYEKGWVVGQNTVQPPREVYRQAALDIFKRYTGLEVMVYDKTYRDQDGSVKYWIPVGELIVLNQSTGPVG 325 (409) T ss_pred hCcHHHHHhhhcccccccccccccchhhhcchhHhHhhhhhcCceEEEEeeEEEecCCcccceecCCeEEEEcCCccccc Confidence 667788888876554432 222222 134555667999999999999999999999999999884 56799 Q ss_pred eeEeccchhhhccccccccccceeecCCceEEEEeecCCCceeEEeeeeeeeeeecCCC--cEEEEE---------E--- Q lcl|Aclame:pro 279 NTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVNVQTKVSMVALPSFERLG--DVYMLT---------V--- 344 (348) Q Consensus 279 ~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~--~~~~~~---------V--- 344 (348) +++||++.+...+.. .+...+.++.++.|.+.||..+|+.+++..|||+..+| .++... | T Consensus 326 ~T~yGa~~~~~~~~~------~v~~~g~~i~~~~~~~~dP~~~~~~~~~~~~p~l~~~~~~~~~~~~~~~~~~~~~~~~~ 399 (409) T protein:vir:78 326 RFVYTAHVAGQRNGK------VVYATGPYLTVKDHLQDDPPYYAIIAGFHGLPQLSGYNTEDFSFHRFKWLKYANNVQSY 399 (409) T ss_pred ceecccccccccchh------hhccccceeEecccccCCcceeeeecceEEeeeeecCCccceeehhhhhhhhhcchhhh Confidence 999999765443221 12234677889999999999999999999999999554 443321 1 Q ss_pred ecCC Q lcl|Aclame:pro 345 IPGV 348 (348) Q Consensus 345 ~~~~ 348 (348) ||+. T Consensus 400 ~~~~ 403 (409) T protein:vir:78 400 LPPF 403 (409) T ss_pred cCCC Confidence 1111 No 11 >protein:vir:10324 Length: 320 # NCBI annotation: ORF26 # Family: family:all:570 # MgeID: mge:182 # MgeName: VHML # Cross-refs: genbank:acc:NP_758919;genbank:gi:27311193;genbank:GeneID:956155 Probab=100.00 E-value=2.3e-48 Score=281.79 Aligned_cols=308 Identities=12% Similarity=0.118 Sum_probs=230.6 Q ss_pred HHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeeccccccccccCHHHHHH Q lcl|Aclame:pro 17 FNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQMPFFKEALLVKENDRQQ 96 (348) Q Consensus 17 i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~p~i~~~~~i~~~d~~~ 96 (348) |+.+|.. -..+...||+++.+.+ ..+.++...+...++|++++++++....+++.+...|++|||+++..++++|++. T Consensus 1 i~~~P~~-~g~~~glff~~~~v~T-~~V~ie~~~~~l~lip~v~rg~~g~~~~~~~~~~~~f~~p~~~~~d~i~a~eiq~ 78 (320) T protein:vir:10 1 MNLLPVN-YGDSRALFAREKKVRT-RTILVEEKNGVLTLIQSREPGSTENVAKRGKRKVRSFVIPHLPLEDVILPDEYEG 78 (320) T ss_pred CCcCCch-hhhhhhhccCCCCccc-ceEEEEEecCceeeeeccCCCCCceeecCCcceEEEEecceeccCCccCHHHHcC Confidence 7766632 2234566778776644 4466777888889999999999999999999999999999999999999999866 Q ss_pred HHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEe----eccCccceeeeeecCC Q lcl|Aclame:pro 97 LNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDID----YGVKADHKKQVSKSWA 172 (348) Q Consensus 97 l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vD----fg~~~~~~~t~~~~W~ 172 (348) ++.+ |+ ...+++.+.+.+.+..+++.+++|.||||+|||+ |+|. +.+| ++.+| ||+... +....++ T Consensus 79 ~Ra~---G~-~~~~~~~~~v~~~l~~lr~~~~~T~E~m~~~AL~-G~il-dadG-tv~~d~y~~fGi~~~---~i~~~l~ 148 (320) T protein:vir:10 79 LRGF---GT-TALAAKSELVKERXETMKSSHDITHEHLRMGAKK-GQIL-DADG-TVLYDLYAEFGITKK---TIYFGLD 148 (320) T ss_pred cccC---CC-chHHHHHHHHHHHHHHHHHHHHHHHHHHHHhhhc-CeEE-cCCC-cEEEechhhhCCccc---eeEEecC Confidence 5543 44 3456777888999999999999999999999996 9974 4444 44455 676321 1222334 Q ss_pred CCCccHHHHHHHHHHHH----HhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHHhhcCceEEE Q lcl|Aclame:pro 173 EPGATPLADLEDAIETA----RELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVADNYGVEIVL 248 (348) Q Consensus 173 ~~~adp~~di~~~~~~~----~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i~~ 248 (348) +++.|+.+.+..+.+.+ +..+.+..+++||+++|++|++|++|++++.+.......+. ......+ .++|+.|+. T Consensus 149 ~a~~dv~~~~~~~~~~i~~~l~g~~~t~v~al~g~~f~~al~~h~~Vke~y~~~~~~~~~l~-~~~~~~f-~~gGi~~~~ 226 (320) T protein:vir:10 149 NKDANVAESCRQVLRHVEDNLRGDVMKDVSVDVSEEFFDKFIKHASVKEVFLNHEAAVNRLG-GDTRKGF-KFGGLIFNE 226 (320) T ss_pred CCCccHHHHHHHHHHHHHHHhccCCCCceEEEEChHHHHHHhcCHHHHHHHHhhhhhhhhcc-ccccceE-EecCEEEEE Confidence 44556555555555444 33445567899999999999999999999876543221111 1111111 468999999 Q ss_pred EeeEEEcCCCcccccccCCeEEEEeCCccc--eeEeccchhhhccccccccccceeecCCceEEEEeecCCCceeEEeee Q lcl|Aclame:pro 249 ENGTYRNEKGEVSKFFPDGHLTLIPNGPLG--NTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVNVQTKVS 326 (348) Q Consensus 249 yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G--~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~~~~~~~ 326 (348) |+++|.|.+|+.+++||+++++|+|.+..| .++|++ ++..+.... .+..++++.|...+|.+.+++++ T Consensus 227 Y~g~~~d~~g~~~~~I~~~~~~~~p~g~~~~f~~~~ap-ad~~e~vnt---------~g~p~y~k~~~~~~~~g~~l~~q 296 (320) T protein:vir:10 227 NRARHVDEEGKETRFIKAGKGHAFPTGTTNTFFTALAP-ADFNETAGT---------LGKRYYAKMEPRRMGRGFDLHSQ 296 (320) T ss_pred cccEEEcCCCCeeEeecCCeeEEEEecCchhheeeecc-cCcHhhcCC---------cccccccccccccCCCeEEEEee Confidence 999999999999999999999999988654 556655 332221111 23468899999999999999999 Q ss_pred eeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 327 MVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 327 s~~lPv~~~~~~~~~~~V~~~~ 348 (348) |.|||++.+|+.++++++-|-- T Consensus 297 S~PLpi~~rP~~lv~~~~~a~~ 318 (320) T protein:vir:10 297 SNVLPMCCRPGVLVELDAAAQP 318 (320) T ss_pred ecccccccCcceEEEEEecCCC Confidence 9999999999999999999555 No 12 >protein:vir:95258 Length: 368 # NCBI annotation: Phage conserved protein # Family: family:all:570 # MgeID: mge:1561 # MgeName: Felix 01 # Cross-refs: genbank:acc:NP_944891;genbank:gi:38707831;genbank:GeneID:2744044 Probab=100.00 E-value=9e-41 Score=240.13 Aligned_cols=327 Identities=15% Similarity=0.126 Sum_probs=248.2 Q ss_pred Cccc--hhhcCHHHHHHHHHhhccchhhhHHHH-hCCCccccceeEEEEEeecCceeeeeeeeCCC-Ccceecccceeee Q lcl|Aclame:pro 1 MGLI--YDKVTASNIAGYFNTLQENVDSTLGES-IFPARKQLGTKLSYIKGASGQSVALKAAAFDT-NVTIRDRVSAEIH 76 (348) Q Consensus 1 Ma~l--~d~f~~~~l~~~i~~~~~~~~~~l~~~-~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~-~~~~~~r~~~~~~ 76 (348) |.++ .|.|+..+||++|+.+| ....+|.+. +|+.+.+.++. +.++...+...+.|.+++++ ++...+++..+.+ T Consensus 1 ~~d~f~~d~Fs~~~LT~ain~~p-~~p~~l~~lglF~~~~v~t~~-v~iE~~~~~l~Lvp~~~rg~~~~~~~~~~~r~~~ 78 (368) T protein:vir:95 1 MLTNSEKSRFFLADLTGEVQSIP-NTYGYISNLGLFRSAPITQTT-FLMDLTDWDVSLLDAVDRDSRKAETSAPERVRQI 78 (368) T ss_pred CcccccCCcccHHHHHHHHHhcC-CCcceecccccccCCCccceE-EEEEEEcCeEEEccccCCCCCCcccccCCceeEE Confidence 8877 47899999999999997 455566655 78777766544 44566777888999999998 5567778888899 Q ss_pred EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEe Q lcl|Aclame:pro 77 DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDID 156 (348) Q Consensus 77 ~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vD 156 (348) .|++|+|+++..|.++|++ +.+..|++.+.+++.+.+.+.+..+++.++.|+||||++||. |+|...++ .+.+| T Consensus 79 ~f~~ph~~~~d~I~a~eiQ---g~RafG~~~~l~~v~~~v~~kl~~~r~~~d~T~E~~r~gAL~-G~ilDadG--tvl~d 152 (368) T protein:vir:95 79 SFPMMYFKEVESITPDEIQ---GVRQPGTANELTTEAVVRAKKLMKIRTKFDITREFLFMQALK-GKVVDARG--TLYAD 152 (368) T ss_pred EEecceeccccccchHHHc---cccCCCChhHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhhc-CeeECCCC--cEEec Confidence 9999999999999999974 556677888888899999999999999999999999999996 99864444 33344 Q ss_pred ----eccCccceeeeeecCCCCCccHHHHHHHHHHHHHhc--C--Ce---eEEEEeCHHHHHHHhcCHHHHHHhcccCCC Q lcl|Aclame:pro 157 ----YGVKADHKKQVSKSWAEPGATPLADLEDAIETAREL--G--LN---PERAIMNAKTFGLIRKAASTVKAIKPLAGD 225 (348) Q Consensus 157 ----fg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~--G--~~---~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~ 225 (348) ||... . +..-.-++++.|+.+.+++|.+.++++ | +. ..+++||+++|++|.+|++|++++.+.... T Consensus 153 ly~eFGit~-~--~v~f~l~~~~tdv~~~~~~~~~~i~d~l~g~~~~~~~~v~alcg~~Ffd~L~~h~~Vkeay~~~~~a 229 (368) T protein:vir:95 153 LYKQFDVEK-K--TIYFDLDNPNADIDASIEELRMHMEDEAKTGTVINGEEIHVVVDRVFFSKLTKHPKIRDAYLAQQTP 229 (368) T ss_pred chhhhCCcc-c--eEEEEeCCCCcCHHHHHHHHHHHHHHhhcccccccccceEEEEChHHHHHhhcChhHHHHHHHHHhh Confidence 67632 1 233344678889999999998887642 2 22 368999999999999999999998755322 Q ss_pred cc-cccHHHH--------HHHH--HhhcCceEEEEeeEEEcCCCcccccccC-------CeEEEEeCC-------cccee Q lcl|Aclame:pro 226 GS-SVTKAEL--------QNYV--ADNYGVEIVLENGTYRNEKGEVSKFFPD-------GHLTLIPNG-------PLGNT 280 (348) Q Consensus 226 ~~-~~~~~~~--------~~~~--~~~~~~~i~~yd~~y~d~~g~~~~~~~~-------~~vv~~p~~-------~~G~~ 280 (348) .. ......+ ..-+ ..++|+.++.|.+++.+.+|+.++++++ ++..++|.+ .+..+ T Consensus 230 ~~~~~lr~~~r~g~~~~~~~~~~~F~fgGi~f~eYrg~~~~~~g~~~~~v~~d~v~I~~gea~~~P~G~~~~~~~~~F~~ 309 (368) T protein:vir:95 230 LAWQQITGSLRTGGADGVQAHMNTFYYGGVKFVQYNGKFKDKRGKVHTLVSIDSVADTVGVGHAFPNVAMLGEANNIFEV 309 (368) T ss_pred hhhhhhccccccccccccccccceeEecCEEEEEcceeecCCCcceeeeecCCceeeccCceEEEeecccccccCcceEE Confidence 11 0000011 0011 1467999999999999999998887665 567788865 45678 Q ss_pred EeccchhhhccccccccccceeecCCceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 281 VFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 281 ~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) +|+|... .+... -.+..++.+.|...++.+.++.++|.|||++.+|+.+++++.-|.- T Consensus 310 ~~aPad~-~e~vN---------t~g~p~Ya~~~~~~~~~g~~le~qSnpLpic~RP~~lv~~~~~a~~ 367 (368) T protein:vir:95 310 AYGPCPK-MGYAN---------TLGQELYVFEYEKDRDEGIDFEAHSYMLPYCTRPQLLVDVRADAKG 367 (368) T ss_pred EecCCCc-HhhcC---------CCcccccceeeeccCCCeeEEEEeecccchhcccceeEEEEecCCC Confidence 8887532 22111 1234578899999999999999999999999999999999999766 No 13 >protein:vir:79078 Length: 307 # NCBI annotation: gp8 # Family: family:all:908 # MgeID: mge:1862 # MgeName: phiE255 # Cross-refs: genbank:acc:YP_001111208;genbank:gi:134288798;genbank:GeneID:4960752 Probab=99.95 E-value=1.7e-29 Score=178.32 Aligned_cols=294 Identities=13% Similarity=0.111 Sum_probs=183.7 Q ss_pred CccchhhcCH-HHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCc-eeeeeeeeCCCCcceecccceeeeEe Q lcl|Aclame:pro 1 MGLIYDKVTA-SNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQ-SVALKAAAFDTNVTIRDRVSAEIHDE 78 (348) Q Consensus 1 Ma~l~d~f~~-~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~-~~~a~~v~~~~~~~~~~r~~~~~~~~ 78 (348) |..+...|.. +.|+.+...... ..|+.+.+||..++....+.+....+.. .+.-.-+.+++........+++...+ T Consensus 1 m~~~~~~~~~dp~LT~~A~gy~n--~~~Iad~lfP~vpV~~~~~k~~~f~~e~f~~~~t~ra~~~~~~~v~~~~~~~~~~ 78 (307) T protein:vir:79 1 MGRLSKLRIVDPVLTNLAIGYTN--AEFIGQTLMPVVEVEKEGGKIPKFGKESFRLYQTERALRAKSNRMNPEDIDSVDV 78 (307) T ss_pred CCCCCCCcccCHHHHHHHhhccc--hhhhhhhcCCcccccccccceeeeccccccccccccccCCCcceeeeeccccccc Confidence 8888766654 589999988863 4589999999998887777766543211 11001122232333333333333333 Q ss_pred eccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeec Q lcl|Aclame:pro 79 QMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYG 158 (348) Q Consensus 79 ~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg 158 (348) .+........++- +.... ..-.+.+ ..++.+.+.|.+++||||+++++++.. T Consensus 79 ~~~~~~l~~~id~------r~~~~-~~~~~~~-------~Av~~l~d~I~l~~E~~~A~l~~~~~~-------------- 130 (307) T protein:vir:79 79 NLDEHDLEYPIDY------REDQE-SAFPLEQ-------AAVQTATDAIQLRREKMIADLSQNPSS-------------- 130 (307) T ss_pred cccccchhhcccc------hhcCC-CCCCHHH-------HHHHHHHHHHHhHHHHHHHHHhccccc-------------- Confidence 2222111111110 11111 1111222 335667889999999999999987442 Q ss_pred cCccceeeeee--cCCCCCccHHHHHHHHHHHHHh-cCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 159 VKADHKKQVSK--SWAEPGATPLADLEDAIETARE-LGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 159 ~~~~~~~t~~~--~W~~~~adp~~di~~~~~~~~~-~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) ++++|++++++ +||+++|||++||++|++++++ .|.+|++++||+++|++|++|++|++++++++ .+.++++++. T Consensus 131 y~~~~k~tLsgt~~Wsd~~sDPi~di~~~~~ai~~~~g~~Pn~~vlg~~a~~~l~~h~~i~~~lk~~~--~g~it~~~la 208 (307) T protein:vir:79 131 YAAGNKKQLSATEKFTAANSDPVGVIEDGKEAIRTKIGRRPNTMVIGASAYKTLKAHPQLIEKIKYSM--KGIVTVDLLK 208 (307) T ss_pred cCCCceEEEccCcccCCCCCCcHHHHHHHHHHHHHhhCCccceEEeCHHHHHHHhcCHHHHHHhcCcc--ccccCHHHHH Confidence 36788888865 6999999999999999999975 68999999999999999999999999999865 5789999888 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCc-------cceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGP-------LGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~-------~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) ++|+ .-+|.+++++|.+.+++.+++|+++.+++.-+.. ++.-.||.|+.. . ++. T Consensus 209 ~l~~---v~~V~vg~a~y~~~~~~~~~iw~~~~~l~y~~~~~~~~~~~~~~ps~Gyt~~~---------------~-g~~ 269 (307) T protein:vir:79 209 EIFE---VENIAVGEAIYADDKDRFTDIWGANIVLAYVPLQRGGQQRTPYEPSYGYTLRK---------------K-GNP 269 (307) T ss_pred HHhC---ceeEEEeeeeeecccccchhcCCCceEEEecccccCCCCCcccccccceeEEe---------------c-Cce Confidence 8763 4469999999999999999999888776653211 222245544321 1 111 Q ss_pred EEEEeecCCCceeEEeeeeeeeeeecCCCcE-EEEEEec Q lcl|Aclame:pro 309 AVTTTKTTDPVNVQTKVSMVALPSFERLGDV-YMLTVIP 346 (348) Q Consensus 309 ~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~-~~~~V~~ 346 (348) ++....+ ++.++.+.+.-.--|++.-+++= ++..++- T Consensus 270 ~~d~~~~-~~~~~~vrv~~~~~~~i~~~~~G~li~~~v~ 307 (307) T protein:vir:79 270 VVDTRIE-DGKLELVRATDIFRPYLLGADAGYLISGING 307 (307) T ss_pred EEecccC-CCceeEEeecccccceeeccccchhhccCCC Confidence 2222222 34444444444444444433322 2222222 No 14 >protein:vir:107882 Length: 307 # NCBI annotation: gp34 # Family: family:all:908 # MgeID: mge:1565 # MgeName: BcepMu # Cross-refs: genbank:acc:YP_024707;genbank:gi:48696944;genbank:GeneID:2845970 Probab=99.93 E-value=2.3e-27 Score=166.61 Aligned_cols=292 Identities=16% Similarity=0.164 Sum_probs=180.7 Q ss_pred CccchhhcC-HHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEee Q lcl|Aclame:pro 1 MGLIYDKVT-ASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQ 79 (348) Q Consensus 1 Ma~l~d~f~-~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~ 79 (348) |..+...|. .+.|+.+...... ..|+.+.+||..++....+.+....+ ..|+-++.. +.+. .....++ T Consensus 1 m~~~~~~~~~dp~LT~~A~gy~n--~~~ia~~l~P~vpv~~~~~k~~~f~~-----eaF~~~~t~---r~~~-~~~~~v~ 69 (307) T protein:vir:10 1 MGRLSKLRIVDPVLTNLAIGYTN--AEFIGQSLMPVVEVEKEGGKIPKFGK-----ESFRLYKTE---RALR-ARSNRMN 69 (307) T ss_pred CCCCCCCcccChhHHHHHHhhcc--hhhhhhhcCCcccccccccceeeECc-----ccccchhhh---cccC-CCcceee Confidence 777766554 4689998887754 35899999999888777766655422 123322221 1111 1333445 Q ss_pred ccccccc-cccCHHHHHH---HHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 80 MPFFKEA-LLVKENDRQQ---LNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 80 ~p~i~~~-~~i~~~d~~~---l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) +.++... ..+.+.++.. .+..... .-.+. ...++.+.+.|.+++|++|++++++.. T Consensus 70 ~~~~~~~~~~~~~~~L~~~id~r~~~~~-~~~~~-------~~av~~l~d~I~l~~E~~~A~l~~~~~------------ 129 (307) T protein:vir:10 70 PEDLGSIDIVLDEHDLEYPIDYREDQES-AFPLE-------QAAVQTATEAIQLRREKMVADLAQNPN------------ 129 (307) T ss_pred cccccccccccccccccccCChhhcCCC-CCCHH-------HHHHHHHHHHHHHHHHHHHHHHhcCcc------------ Confidence 5444432 3344433211 1111111 11122 234566778999999999999987632 Q ss_pred eeccCccceeeeee--cCCCCCccHHHHHHHHHHHHHh-cCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSK--SWAEPGATPLADLEDAIETARE-LGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKA 232 (348) Q Consensus 156 Dfg~~~~~~~t~~~--~W~~~~adp~~di~~~~~~~~~-~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~ 232 (348) .++++|++++++ +||+++|||++||++|++++++ .|.+|++++||+++|++|++|++|++++++++ .+.++++ T Consensus 130 --~y~~~~k~tLsGt~~Wsd~~sDPi~di~~~~~ai~~~~g~~Pn~~vlg~~a~~al~~hp~i~e~lk~~~--~g~it~~ 205 (307) T protein:vir:10 130 --SYAGGNKKQLSATEKFTAAGSDPVGVIEDGKEAIRTKIGRRPNTMVIGASAYKTLKAHPQLIEKIKYSM--KGIVTVD 205 (307) T ss_pred --ccCCCceEEeccccccCCCCCCcHHHHHHHHHHHHhhhCCccceEEeCHHHHHHHhcCHHHHHHhCCcc--ccccCHH Confidence 246678887765 7999999999999999999975 68999999999999999999999999998764 5789999 Q ss_pred HHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCC-------ccceeEeccchhhhccccccccccceeecC Q lcl|Aclame:pro 233 ELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNG-------PLGNTVFGTTPEESDLFADNTVNADVEIVD 305 (348) Q Consensus 233 ~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~-------~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~ 305 (348) ++.++|+ .-+|.+.+++|.+.+++.+++|+++.+++..+. .++.-.||.|+... T Consensus 206 ~la~ll~---v~~i~vg~a~~~~~~~~~~~iw~~~~vl~yv~~~~~~~~~~~~epsfGyT~~~~---------------- 266 (307) T protein:vir:10 206 LLKEIFE---VENIAVGEAIYADDKDRFTDIWGANIVLAYVPLQRGGQQRTPYEPSYGYTLRKK---------------- 266 (307) T ss_pred HHHHHhC---ceeEEEeeeeeeccCCccceeCCCceEEEecccccCCCCCcccccccceeEEEc---------------- Confidence 9988863 446777788888888999999988877665321 12233566665311 Q ss_pred CceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEecC Q lcl|Aclame:pro 306 SGIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIPG 347 (348) Q Consensus 306 ~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~ 347 (348) ++.++.+..+ +-.++.+.+.-.-=|++.-+++=|.++=.-| T Consensus 267 g~~~~d~~~~-~~~~~~~r~~~~~~~~i~~~~~G~li~~~~~ 307 (307) T protein:vir:10 267 GNPVVDTRIE-DGKLELVRSTDIFRPYLLGADAGYLISGING 307 (307) T ss_pred CCeEeeceec-CCceeEEeccccccceeecccccceeccCCC Confidence 1122211111 1122222233222233333332222222222 No 15 >protein:vir:99888 Length: 309 # NCBI annotation: capsid protein # Family: family:all:908 # MgeID: mge:1480 # MgeName: B3 # Cross-refs: genbank:acc:YP_164075;genbank:gi:56692607;genbank:GeneID:3192616 Probab=99.89 E-value=3.4e-25 Score=154.75 Aligned_cols=295 Identities=15% Similarity=0.150 Sum_probs=183.3 Q ss_pred CccchhhcC-HHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCc--eeeeeeeeCCCCcceecccceeeeE Q lcl|Aclame:pro 1 MGLIYDKVT-ASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQ--SVALKAAAFDTNVTIRDRVSAEIHD 77 (348) Q Consensus 1 Ma~l~d~f~-~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~--~~~a~~v~~~~~~~~~~r~~~~~~~ 77 (348) |++= .|. .+.|+.+...... ..++.+.+||..++....+.+....+.. .+.-..+.+++......-. ..... T Consensus 1 ~~~~--~~~~dp~LT~~A~gy~n--~~~Ia~~l~P~vpV~~~~~~~~~f~~~e~F~~~~t~r~~~~~~~~v~~~-~~~~~ 75 (309) T protein:vir:99 1 MSNA--PFPIDPELTAIAIAYRN--GRMISDEVLPRVPVGKQEFKFWKYDLAQGFTVPETLVGRKSKPNEVEFS-ATDET 75 (309) T ss_pred CCCC--CcCcCHhHHHHHhhccC--hhhhhhhcCCccccCccccceeeechhhcccccchhhccCCCcceEeec-ccCce Confidence 8773 444 5689998888753 4589999999998887777766644321 1122223333222222221 11122 Q ss_pred eeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEee Q lcl|Aclame:pro 78 EQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDY 157 (348) Q Consensus 78 ~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDf 157 (348) +..---+....++-.++.+ ... +-.+ ....++.+.+.|..++|+++++.+++.. T Consensus 76 ~~~~~~~L~~~i~~~~~~~---a~~--~~d~-------~~~Av~~l~~~i~l~rE~~~A~lv~~~a-------------- 129 (309) T protein:vir:99 76 GSTEDHGLDAPVPQADIDN---APT--NYNP-------LGHATEQTTNLILLDREARTSKLVFSPN-------------- 129 (309) T ss_pred eeecccceeecCCchhhhh---ccC--CCCH-------HHHHHHHHHHHHHHHHHHHHHHHhcChh-------------- Confidence 2222222333333333221 111 1112 2233566789999999999999887532 Q ss_pred ccCccceeeeee--cCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 158 GVKADHKKQVSK--SWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 158 g~~~~~~~t~~~--~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) .++++|++++++ +|++++|||++||++|++.+ |++|++++||.++|++|++|++|++++++++.+.+.++++++. T Consensus 130 ~y~~~~k~~Lsgt~~wsd~~SDPi~~i~~~~~~~---g~~PN~~vlg~~~~~~l~~hp~i~~~ik~~~~~~g~it~~~la 206 (309) T protein:vir:99 130 SYAAGNKTTLSGADQWSDPTSNPLPVITDALDSV---ILRPNIGVLGRRTATILRRHPKIVKAYNGSLGDEGMVPMAFLQ 206 (309) T ss_pred hcCCCceEEecCccccCCCCCCcHHHHHHHHHhh---CCCcceEEechHHHHHHhhCHHHHHHhcCCCccccccCHHHHH Confidence 347789988765 69999999999999998765 8999999999999999999999999999988888899999988 Q ss_pred HHHHhhcCceEEEEeeEEE----cCCCcccccccCCeEEEEeCCccce----eEeccchhhhccccccccccceeecCCc Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYR----NEKGEVSKFFPDGHLTLIPNGPLGN----TVFGTTPEESDLFADNTVNADVEIVDSG 307 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~----d~~g~~~~~~~~~~vv~~p~~~~G~----~~yg~~~~~~~~~~~~~~~~~~~~~~~~ 307 (348) ++|+- -+|.+-++.|. ..++..+++|.++.+++.- +..+. ..||.|+.-.....| . T Consensus 207 ~l~~v---e~V~vg~a~~n~a~~g~~~~~~~iwg~~~~L~y~-~~~~~~~~~ps~G~t~~~~~r~~g-----------~- 270 (309) T protein:vir:99 207 ELLEL---DAIYIGEARLNIARPGQNPNLIRAWGPHASFIYR-DRLADTRNGTTFGLTAQWGDRVSG-----------S- 270 (309) T ss_pred HHhCc---ceEEeecceeeccccccccccccccCCcEEEEEc-CCCCCCcccccccceeecccccCC-----------c- Confidence 87632 26777666663 4567788999988765442 22233 334444332222211 1 Q ss_pred eEEEEeecCCCceeEEeeeeeeeeeecCCC-cEEEEEEecC Q lcl|Aclame:pro 308 IAVTTTKTTDPVNVQTKVSMVALPSFERLG-DVYMLTVIPG 347 (348) Q Consensus 308 ~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~-~~~~~~V~~~ 347 (348) ++...+. ...++++++.-.-=|++.-++ +.++..++|+ T Consensus 271 ~~d~~~~--~~g~~~vr~~~~~k~~i~~~d~G~li~~~va~ 309 (309) T protein:vir:99 271 IADPNIG--LRGGQRVRVGESVKELVTAPDLGFFFENAVAA 309 (309) T ss_pred eeeeeec--cCCceEEEEeccccchhcchhcchhhhhcccC Confidence 1111221 233455655544444444433 4566677888 No 16 >protein:vir:108211 Length: 318 # NCBI annotation: gp9 # Family: family:all:6420 # MgeID: mge:2004 # MgeName: Giles # Cross-refs: genbank:acc:YP_001552338;genbank:gi:160700658;genbank:GeneID:5758931 Probab=99.13 E-value=1.3e-11 Score=80.22 Aligned_cols=277 Identities=14% Similarity=0.140 Sum_probs=158.3 Q ss_pred Cc--------------cchhhcC-HHHHHHHHHhhccchhhhHHHHhCCCcc-ccceeEEEEEeecCc-eeeeeeeeCCC Q lcl|Aclame:pro 1 MG--------------LIYDKVT-ASNIAGYFNTLQENVDSTLGESIFPARK-QLGTKLSYIKGASGQ-SVALKAAAFDT 63 (348) Q Consensus 1 Ma--------------~l~d~f~-~~~l~~~i~~~~~~~~~~l~~~~Fp~~~-~~~~~~~~~~~~~~~-~~~a~~v~~~~ 63 (348) |- +++|++. |.-|-..++++.. ..|+.+.||.... +.+..+.+.+..... ..-+.-|.+++ T Consensus 1 ~~~~~~i~s~~~~~~itv~~ll~~P~~I~~~i~e~~~--~~~iad~lf~~~~a~~~~~v~f~~~~p~~~~~d~e~VaEgg 78 (318) T protein:vir:10 1 MTAPTGIVSVSDGPAITVRELVGNPLWIPTALKKMMV--NQFISESLFRNGGANPNGVVAYNEGNPSFLEDDVADVAEFG 78 (318) T ss_pred CCCCCcceeeecCCceehHHhhCCchhHHHHHHHHHh--ccchhhhhhhcccccccceeEEEecccccccCcHhhccCcc Confidence 22 3456665 4555667777764 4589999998653 344444544433211 11122345566 Q ss_pred CcceecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCe Q lcl|Aclame:pro 64 NVTIRDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGK 143 (348) Q Consensus 64 ~~~~~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gk 143 (348) +-|+..-..........=+.+.+..++.+.+.. ++- +.+.+.+.++.+.+.+..+-+++++|+.+. T Consensus 79 EiP~~~~~~G~~~ia~~~K~G~~~~vS~Em~~~-------n~~-------~~v~r~~~~l~Nti~r~~d~~a~dal~sa~ 144 (318) T protein:vir:10 79 EIPVSAGARGLPRTAFAVKKALGVRVSKEMIDE-------NRV-------GAVNDQMLQLRNTFIRANDRSAKALLQSPI 144 (318) T ss_pred cccccCCCCCchhhhhhehhccceeccHHHHhh-------cCh-------hHHHHHHHHHHHHHHHHHHHHHHHHHhccc Confidence 655555333332222223566666776544321 111 223344666778888889999999998654 Q ss_pred eeecCCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHH----------------HhcCCeeEEEEeCHHHHH Q lcl|Aclame:pro 144 IAFTSDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETA----------------RELGLNPERAIMNAKTFG 207 (348) Q Consensus 144 i~~~~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~----------------~~~G~~~~~~~~~~~~~~ 207 (348) + +++.+++.|++ ++++..|+-...+.+ .+.|+.|++|+|++..|. T Consensus 145 t------------------~~~~~s~~w~~-~~~~~~d~~~A~e~v~~a~~~~~~a~~~~~~~~~GY~pdtIVlhP~~~~ 205 (318) T protein:vir:10 145 V------------------PTLAVPTAWDN-GGKVRTDIAIAIEQISTAAPTAYPAGVGSSDEYFGFIPDTIVMHYALLP 205 (318) T ss_pred c------------------ccccCCcCCCC-cccccccchhhhhhhhhhhhhhhhhhhhhhhhccCccceeeEECHHHHH Confidence 2 44567778886 344444433332211 235899999999999999 Q ss_pred HHhcCHHHHHHhcccCCCcccccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchh Q lcl|Aclame:pro 208 LIRKAASTVKAIKPLAGDGSSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPE 287 (348) Q Consensus 208 ~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~ 287 (348) .|++|+.+++++..+..... ........+-+...|++++ ..+.+|.++++++-.+..|.+...- T Consensus 206 ~l~~n~~~~~~y~~~a~~~~-~~~~~tg~~~g~~lGl~vi------------~s~~~p~~~alvlq~g~vG~~~d~~--- 269 (318) T protein:vir:10 206 ILMDNENFMKVYERNANYVS-TAPDWTGNFPGSVMGLNVI------------RSRTFPIDRVLIMERGTVGFYSDTR--- 269 (318) T ss_pred HHhcchhhhhhhhccchhhh-hcccccccccceeeceEEe------------ecCccCCCeeEEEecCCcceeeccc--- Confidence 99999999999865532110 0000000011122344332 3467889999999999988655321 Q ss_pred hhccccccccccceeecCCceEEEEeecC--CC-----ceeEEeeeeeeeeeecCCCcEEEEEEe-cC Q lcl|Aclame:pro 288 ESDLFADNTVNADVEIVDSGIAVTTTKTT--DP-----VNVQTKVSMVALPSFERLGDVYMLTVI-PG 347 (348) Q Consensus 288 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~--dP-----~~~~~~~~s~~lPv~~~~~~~~~~~V~-~~ 347 (348) ++.++.|..+ +| ......+....-+.+.+|.+++.+|=+ .+ T Consensus 270 -------------------pl~~t~~~~egg~~~g~~~~s~~~~~~~~~~~~V~~PkA~~~itgi~~~ 318 (318) T protein:vir:10 270 -------------------PLQFTALYPEGNGPNGGPTESYRADASHKRALAVDQPKAALWLTGIVTP 318 (318) T ss_pred -------------------cceeeecccCCCCCCCCcchhhheehheeeeeeeeCcceeEEEeeccCC Confidence 2223333321 22 234555666677888899999988744 33 No 17 >protein:vir:98819 Length: 437 # NCBI annotation: hypothetical protein # Family: family:all:32561 # MgeID: mge:1530 # MgeName: Ma-LMM01 # Cross-refs: genbank:acc:YP_851100;genbank:gi:117530257;genbank:GeneID:4484483 Probab=98.95 E-value=2.2e-12 Score=84.51 Aligned_cols=324 Identities=13% Similarity=0.122 Sum_probs=184.3 Q ss_pred Cc-----cchhhcCHHHH---------------HHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeee Q lcl|Aclame:pro 1 MG-----LIYDKVTASNI---------------AGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAA 60 (348) Q Consensus 1 Ma-----~l~d~f~~~~l---------------~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~ 60 (348) |. +|+.+++++.| .+.|.... |.. -.+..||++.....-+...+...+...+-|+|. T Consensus 1 msdipspnlqalisspylvdnttfprepvytelarsilakl-pat--plsavfpdetiaeriviaehviegvntifpvve 77 (437) T protein:vir:98 1 MSDIPSPNLQALISSPYLVDNTTFPREPVYTELARSILAKL-PAT--PLSAVFPDETIAERIVIAEHVIEGVNTIFPVVE 77 (437) T ss_pred CCCCCCcchHhhhcCceeeccccCCccchHHHHHHHHHHhc-CCc--cccccccchhhhhhhhhHHHHHhhhhhhhhhhc Confidence 44 34444444332 22222111 222 246678887776655554455667777889999 Q ss_pred CCCCcceecccceeee--EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHH Q lcl|Aclame:pro 61 FDTNVTIRDRVSAEIH--DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQV 138 (348) Q Consensus 61 ~~~~~~~~~r~~~~~~--~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qa 138 (348) .+++.-+.+.+++... ++++..|+.++.++-.+++. -...|+.+++....++|.+++.++++... +-|...|+ T Consensus 78 wgapdlfvdddgytvyrqsyqplpirqsmymsyaqlnn---tvregttnerataaeqiekkltrqmqkhq--ltwnvfqa 152 (437) T protein:vir:98 78 WGAPDLFVDDDGYTVYRQSYQPLPIRQSMYMSYAQLNN---TVREGTTNERATAAEQIEKKLTRQMQKHQ--LTWNVFQA 152 (437) T ss_pred cCCcceeecCCCceeeecccCCccchhhhhhhhhhhhh---hhhccccchhhhhHHHHHHHHHHHHHhhh--hhHHHHHH Confidence 9999999998888654 68898999999888766543 33334445555666777777777766544 44555554 Q ss_pred -HhcCeeeecCCc--eeEEEeeccCccceeeeee---------------------cCCC----CCccHHHHHHHHHHH-- Q lcl|Aclame:pro 139 -LATGKIAFTSDG--VNKDIDYGVKADHKKQVSK---------------------SWAE----PGATPLADLEDAIET-- 188 (348) Q Consensus 139 -l~~Gki~~~~~~--~~~~vDfg~~~~~~~t~~~---------------------~W~~----~~adp~~di~~~~~~-- 188 (348) |+-|.|++++.. +.+..--.+|+.|.+...+ .-+- +-.||.=-|....+. T Consensus 153 ammlgginytdprsgvrvkapayiparnffnfnttqgyrgrnearlfrnlidlnaggtpssgipitdpqfalsnftrrln 232 (437) T protein:vir:98 153 AMMLGGINYTDPRSGVRVKAPAYIPARNFFNFNTTQGYRGRNEARLFRNLIDLNAGGTPSSGIPITDPQFALSNFTRRLN 232 (437) T ss_pred HHHhccccccCcccceeeecccccccccccccccccccccchHHHHHHHHhhccCCCCCcCCcccccchhhHHHHHHHHH Confidence 445899987753 3322222333333322111 0000 112332222222211 Q ss_pred --HHhcC-CeeEEEEeCHHHHHHHhcCHHHHHHhc------------------ccCCCcccccHHHHHHHHH-------- Q lcl|Aclame:pro 189 --ARELG-LNPERAIMNAKTFGLIRKAASTVKAIK------------------PLAGDGSSVTKAELQNYVA-------- 239 (348) Q Consensus 189 --~~~~G-~~~~~~~~~~~~~~~l~~~~~v~~~~~------------------~~~~~~~~~~~~~~~~~~~-------- 239 (348) .+++. ...+.+.|+++.-+.++.+++.+-+-. ++.++.+.+.+..+...++ T Consensus 233 rwfkdtnksditdmymgpemrdvilmseearlaqggiiprlgavfgdstidsngsggsfgplppgglgtgmglvlgtrge 312 (437) T protein:vir:98 233 RWFKDTNKSDITDMYMGPEMRDVILMSEEARLAQGGIIPRLGAVFGDSTIDSNGSGGSFGPLPPGGLGTGMGLVLGTRGE 312 (437) T ss_pred HHhhccccccchhhhcCccceeeeeeccchhhhhcccchhhhhhhccccccCCCCCcccCCCCccccccccceeeecccc Confidence 23332 346778888888877776666553321 1112223344444443222 Q ss_pred --hhcCceEEEEeeEEEc-CCCcccccccCCeEEEEeC-------CccceeEeccchhhhccccccccccceeecCCceE Q lcl|Aclame:pro 240 --DNYGVEIVLENGTYRN-EKGEVSKFFPDGHLTLIPN-------GPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIA 309 (348) Q Consensus 240 --~~~~~~i~~yd~~y~d-~~g~~~~~~~~~~vv~~p~-------~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~ 309 (348) ++.|+.+.+.|.-|+| .||..+++||.++++.++- ...|+++|...... +...|.. T Consensus 313 ilsiaginvhvvdtiykdpvdgvekrvwpknkivavsfrdsdgnveapgrtqycssens--------------idspglw 378 (437) T protein:vir:98 313 ILSIAGINVHVVDTIYKDPVDGVEKRVWPKNKIVAVSFRDSDGNVEAPGRTQYCSSENS--------------IDSPGLW 378 (437) T ss_pred eeEeecceeeeehhhhhcchhhhhhhcCCccceEEEEEecCCCcccCCccccccccccc--------------cCCCcce Confidence 2347888999999998 6999999999999998862 23588888543111 1123333 Q ss_pred EEEeecCCC---ceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 310 VTTTKTTDP---VNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 310 ~~~~~~~dP---~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ..+..+-.| .+..++...+.||.+..|-.+.. |++-. T Consensus 379 trtvtdvpppaapgiavqmgnaglpyfkypyrvch--vtpct 418 (437) T protein:vir:98 379 TRTVTDVPPPAAPGIAVQMGNAGLPYFKYPYRVCH--VTPCT 418 (437) T ss_pred eeeeccCCCCCCCcceEeecCCCCcccccceeeee--ecccc Confidence 333333222 46667777788999988876554 33322 No 18 >protein:vir:105334 Length: 276 # NCBI annotation: putative phage major capsid protein # Family: family:all:522 # MgeID: mge:1679 # MgeName: PH15 # Cross-refs: genbank:acc:YP_950669;genbank:gi:119967839;genbank:GeneID:4643213 Probab=96.72 E-value=0.00038 Score=39.30 Aligned_cols=257 Identities=14% Similarity=0.147 Sum_probs=120.3 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccce-- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVSA-- 73 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~~-- 73 (348) ||+ +.|++.|..+..++.+.-.. ...|...-+.+.+ +.+..|..+--|+...-+.+. +.+...+ T Consensus 1 Ma~~~T~l~d~i~Pev~~~~v~~~~~~------~~~~~~~~~~~~~---l~g~~G~ti~iP~~~~igda~~~~eg~~i~~ 71 (276) T protein:vir:10 1 MAQGTTTKSTQIVPEVLAPMMQAELDK------KLRFAQFADIDST---LVGQPGDTLTFPAFVYSGDATVVPEGQKIPV 71 (276) T ss_pred CCcceeehhhhhchHHHHHHHHHHHHh------hhhhcccceeccc---ccCCCCCEEEeeeecCCCccccccCCCccCc Confidence 995 57899999999999765321 2223322222222 234455555555544332221 1111111 Q ss_pred -----eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 74 -----EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 74 -----~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) ......+-+. .+.+...|+..++...+ .+.+-.+.+...+.++.+--++..|.++...+ T Consensus 72 ~~lt~~~~~a~i~~~--~k~~~~tD~a~~~~~~d------------p~~~~~~~~~~~~a~~~d~~~~~~l~~~~~~~-- 135 (276) T protein:vir:10 72 DKIETNRREAKIHKI--GKGTDITDEALLSGYGD------------PQGEAVRQHGLAIANKVDNDVLEALRGTKLTV-- 135 (276) T ss_pred cccccceeeEEeehc--cccccccHHHHHhhccc------------hHHHHHHHHHHHHHHHHHHHHHHHHhcccccc-- Confidence 1111122111 22333334333332221 12222333444555555555566665432211 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) +.. ..-.+.|.+....+.+.+..++.++|+++++..|++..... .+......... T Consensus 136 -----------------------~~~-~~t~d~i~~A~~~lgd~~~~~~~ivv~p~~~~~L~k~~~~~-f~~~s~~g~~~ 190 (276) T protein:vir:10 136 -----------------------SAD-IGTLAGLEAAIDTFDDEDLEPMVLFINPKDAGKLRSSASDN-FTRATELGDNI 190 (276) T ss_pred -----------------------ccc-ccCHHHHHHHHHHhccccCcccEEEEcHHHHHHHHHhcccc-ccccccccccc Confidence 110 11134455555566555667889999999999887643111 01111111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) ..+..++.+.|.+|++-+. +|+++.++...+.+|... +.. + T Consensus 191 ----~~~G~ig~~~G~~Vi~s~~------------~p~~t~~l~~~gAi~~~~-~~~----------------------~ 231 (276) T protein:vir:10 191 ----IVKGAFGEALGAVIVRSKK------------LDEGEAILAKRGAVKLIT-KRD----------------------F 231 (276) T ss_pred ----eeccccceecceeEEEcCC------------CCcceEEEEeccceeeee-cCC----------------------c Confidence 1233455566877775331 456777777665544221 111 0 Q ss_pred EEEEeecCCC--ceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDP--VNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP--~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+ +.+.|+ -.-.+.+-.+--..+.+|..+++++.-+|. T Consensus 232 ~v--E~dRd~~~~~d~i~~~~~y~~~~~~~~~vv~~t~~~~~ 271 (276) T protein:vir:10 232 FL--ETDRDPSTKTTALYSDKHYVAYLYDESKAVKVTKGAGT 271 (276) T ss_pred ee--ecccchhhcccEEEEeeEEEEEEEcCcceEEEecCCcC Confidence 01 111111 122333334445577788888888887777 No 19 >protein:vir:80930 Length: 278 # NCBI annotation: Cps # Family: family:all:522 # MgeID: mge:1886 # MgeName: A500 # Cross-refs: genbank:acc:YP_001468392;genbank:gi:157324966;genbank:GeneID:5601363 Probab=96.26 E-value=0.00082 Score=37.51 Aligned_cols=262 Identities=11% Similarity=0.068 Sum_probs=116.0 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccce-- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVSA-- 73 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~~-- 73 (348) ||+ +.++|.|..+..++.+.... ......+.. .+.+ +.+..|..+--|+...-+.+. +.+..+. T Consensus 1 Ma~~~T~~~~~iiPev~s~~v~~~~~~--~~v~~~~~~----~~~~---l~g~~G~tv~ip~~~~~g~a~~~~~g~~i~~ 71 (278) T protein:vir:80 1 MADLTTKLANLIDPEVMGPMISAKLPK--AIKFGKIAP----IDNS---LEGQPGSEITVPKYKYIGDAQDVAEGAAIDY 71 (278) T ss_pred CCCcceehhheecHHHHHHHHHHHHHH--hhhhcccce----eccc---ccCCCCCEEEEeeeccCCcceeecCCCcCcc Confidence 885 46889999999998754321 111122221 1111 123334444444443222111 1111111 Q ss_pred -----eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 74 -----EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 74 -----~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) ......+-+. .+.+..+|+..++... +.+.+-.+.+...+.+..+..++..|.+.... T Consensus 72 ~~lt~~~~~~~i~~~--~~a~~v~D~~~~~~~~------------d~~~~~~~~~a~~~a~~~d~~l~~~l~~a~~~--- 134 (278) T protein:vir:80 72 SALETESVKHGIKKA--GKGVKLTDESVLSGYG------------DPVEEAQKQIRMAIASKVDNDILEEALTTTLE--- 134 (278) T ss_pred cccccceeeEeeehh--hccccccHHHHhhccc------------cHHHHHHHHHHHHHHHHHHHHHHHHHhccccc--- Confidence 1111111111 2233333433332211 22223344455666666676777776532111 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCcc-HHHHHHHHHHHHHhcCC-eeEEEEeCHHHHHHHhcCHHHHHHhcccCCCc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGAT-PLADLEDAIETARELGL-NPERAIMNAKTFGLIRKAASTVKAIKPLAGDG 226 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~ad-p~~di~~~~~~~~~~G~-~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~ 226 (348) .+ +..+..+.+ .+..+-...+++...+. ...+++|+++++..|++++...-. ....... T Consensus 135 ----------------~~--~~~t~~~~~~~~~~~~da~~~l~~~~~~~~~~ivv~p~~~~~L~k~~~~~~~-~~~~~g~ 195 (278) T protein:vir:80 135 ----------------VK--GAINIGLIDKIENTFTDAPDAIEDESITTTGVLFLNYKDTAKLREEAAGSWT-KASQLGD 195 (278) T ss_pred ----------------cc--cccccchhhhHHHHHHHHHHhhcccCCCcccEEEECHHHHHHHHhhhhhhcc-ccccccc Confidence 11 111111111 12333344444544333 355789999999999887643211 1111111 Q ss_pred ccccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCC Q lcl|Aclame:pro 227 SSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDS 306 (348) Q Consensus 227 ~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~ 306 (348) +. ..+..++.+.|.+|++=+. +|+++.+++..+.+|... +.... T Consensus 196 ~~----~~~G~ig~~~G~~Vi~s~~------------~p~~t~~l~~~gAi~~~~-~~~~~------------------- 239 (278) T protein:vir:80 196 DL----LVKGAFGELLGWEIVRTKK------------LADGNALAVKAGALKTFL-KRNLL------------------- 239 (278) T ss_pred cc----eeeccceeecceeEEEcCC------------CCcceEEEEeccceeeee-cCCcc------------------- Confidence 11 1234455667877766332 456777777666544221 11100 Q ss_pred ceEEEEeecCCCc--eeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 307 GIAVTTTKTTDPV--NVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 307 ~~~~~~~~~~dP~--~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) + +.+.|+. .-.+.+-.+--.-+.+|.+++.++.-||- T Consensus 240 ---v--E~~Rd~~~~~d~i~~~~~yg~~v~~~~~~v~it~~a~~ 278 (278) T protein:vir:80 240 ---A--ESGRDMDHKLTKFNADQHYAVALVDETKAVKVVPVAGN 278 (278) T ss_pred ---c--ccccchhhccceeeeeeEEEEEEEcCcceEEEeeccCC Confidence 0 0111111 11222222233446789999999999999 No 20 >protein:vir:93742 Length: 274 # NCBI annotation: ORF013 # Family: family:all:522 # MgeID: mge:1475 # MgeName: 55 # Cross-refs: genbank:acc:YP_240459;genbank:gi:66396126;genbank:GeneID:5133511 Probab=96.22 E-value=0.00086 Score=37.39 Aligned_cols=257 Identities=14% Similarity=0.106 Sum_probs=117.5 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCc-ceecccce-- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNV-TIRDRVSA-- 73 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~-~~~~r~~~-- 73 (348) ||+ +.|++.|..+..++.+.... ......+.. .+.+ +.+..|..+--|+...-+.. .+.+.+.+ T Consensus 1 ma~~~T~~~~~iiPev~~~~v~~~~~~--~~~~~~~~~----~~~~---l~g~~G~tv~ip~~~~~g~~~~~~eg~~i~~ 71 (274) T protein:vir:93 1 MPQGITKTSNQIIPEVLAPMMQAQLEK--KLRFASFAE----VDST---LQGQPGDTLTFPAFVYSGDAQVVAEGEKIPT 71 (274) T ss_pred CCccceehhheechHHHHHHHHHHHHh--hhhhccccc----cccc---ccCCCCCEEEEEeeccCCCcccccCCCcccc Confidence 997 56889999999998755322 111122221 1111 12333433434444321111 11111111 Q ss_pred -----eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 74 -----EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 74 -----~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) +.....+-+. ...+...|+...+... + .+.. -.+.+..++.+..+-.++..+.+++.. T Consensus 72 ~~it~~~~~~~i~~~--~~~~~i~D~~~~~~~~---d--~~~~-------~~~~~~~~~a~~~d~~~~~~~~~a~~~--- 134 (274) T protein:vir:93 72 DILETKKREAKIRKI--AKGTSITDEALLSGYG---D--PQGE-------QVRQHGLAHANKVDNDVLEALMGAKLT--- 134 (274) T ss_pred cccccceeEEEeeee--cccccccHHHHHhhcc---c--hHHH-------HHHHHHHHHHHHHHHHHHHHHhccccc--- Confidence 1111122111 1223333333332211 1 1222 233444555566665566666433211 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) . ++++...+.|.....++.+.+..+..++|+++++..|++++...- +......... T Consensus 135 ----------------~-------~~~~~~~d~i~dA~~~l~d~~~~~~~ivv~p~~~~~L~k~~~~~f-~~~s~~g~~~ 190 (274) T protein:vir:93 135 ----------------V-------NADITKLNGLQSAIDKFNDEDLEPMVLFINPLDAGKLRGDASTNF-TRATELGDDI 190 (274) T ss_pred ----------------c-------cccccCHHHHHHHHHHhhhccCCccEEEeCHHHHHHHHhhhhhcc-cccccccccc Confidence 0 011122455555666666666678899999999999988764321 1111111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) ..+..++.+.|.+|++=+ -+|+++.++...+.+|... +...... T Consensus 191 ----~~~G~ig~~~G~~Vi~s~------------~~p~~t~~l~~~gai~~~~-~~~~~vE------------------- 234 (274) T protein:vir:93 191 ----IVKGAFGEALGAIIVRTN------------KLEAGTAILAKKGAVKLIL-KRDFFLE------------------- 234 (274) T ss_pred ----eeecccceecCeeEEEcC------------CCCcceEEEEeCCeEEEEe-cCCcccc------------------- Confidence 123345556677766522 2567888888776655322 2111100 Q ss_pred EEEEeecCCC--ceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDP--VNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP--~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+.|+ -.-.+.+-.+--.-+.+|+++++++.-++- T Consensus 235 -----~~Rd~~~~~d~i~~~~~y~~~~~~~~~~v~~t~~~~s 271 (274) T protein:vir:93 235 -----VARDASTKTTALYSDKHYVAYLYDESKAVKITKGSGS 271 (274) T ss_pred -----cccchhhcccEEEEEEEEEEEEEcCCceEEEeeCccc Confidence 00011 011222223333456678888887766666 No 21 >protein:vir:96262 Length: 274 # NCBI annotation: ORF013 # Family: family:all:522 # MgeID: mge:1612 # MgeName: ROSA # Cross-refs: genbank:acc:YP_240311;genbank:gi:66395978;genbank:GeneID:5133339 Probab=96.14 E-value=0.00096 Score=37.14 Aligned_cols=257 Identities=14% Similarity=0.140 Sum_probs=119.4 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccc--- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVS--- 72 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~--- 72 (348) ||+ +.|+|.|..+..++.+.-. ....|...-+.+.+ +.+..|..+--|+...-+... +.+... T Consensus 1 m~~~~T~l~d~i~Pev~~~~v~~~~~------~~l~~~~~~~~~~~---l~g~~G~tv~iP~~~~ig~a~~~~~g~~i~~ 71 (274) T protein:vir:96 1 MAQGMTKLTNQIVPEVLAPMMQAELE------KKLRFASFAEIDNT---LVGQPGDTLTFPAFIYSGDAKVVAEGEKIPT 71 (274) T ss_pred CCcceeehhheechHHHHHHHHHHHH------hhhhccccceeccc---ccCCCCCEEEeeeecCCCccccccCCCccch Confidence 887 6799999999999976432 12223222111222 234445555445543322211 111111 Q ss_pred --e--eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 73 --A--EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 73 --~--~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) . ......+-+. .+.+...|+..++...+ .+.+-.+.+...+.+..+-.++.++.++...+ T Consensus 72 ~~lt~~~~~~~i~~~--~~a~~i~D~~~~~~~~d------------~~~~~~~~~~~~~a~~vd~~i~~~l~~a~~~~-- 135 (274) T protein:vir:96 72 DILETKKREAKIRKI--AKGTSISDEALLSGYGD------------PQGEQVRQHGLAHANKVDDDVLEALKSAKLTV-- 135 (274) T ss_pred hhcccceeEEEeeee--ecceeehHHHHhhccch------------HHHHHHHHHHHHHHHHHHHHHHHHHhcccccc-- Confidence 1 1111122111 22344444433332221 12222333445555555555666665432111 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) + +++...+.|.+....+.+.+..+..++|+++++..|++++...-. ........ T Consensus 136 -----------------------~-~~~~~~d~i~~A~~~lgd~~~~~~~ivv~p~~~~~L~k~~~~~f~-~~s~~g~~- 189 (274) T protein:vir:96 136 -----------------------E-ADITKLTGLQTAIDKFNDEDLEPMVLFISPLDAGKLRGDATTNFT-RATELGDD- 189 (274) T ss_pred -----------------------c-ccccCHHHHHHHHHHhccccccccEEEeCHHHHHHHHhhcccccc-cccccccc- Confidence 0 011113445555555655556788999999999999887632211 11111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) -..+..++.+.|.+|++=+. +|+++.++...+.+|... +... T Consensus 190 ---~~~~G~ig~~~G~~Vi~s~~------------~~~~t~~l~~~gA~~~~~-~~~~---------------------- 231 (274) T protein:vir:96 190 ---VIVKGAFGEALGAVIVRSNK------------LEAGTAILAKKGAVKLIT-KRDF---------------------- 231 (274) T ss_pred ---ceeccccceecCeEEEEeCC------------CCCceEEEEeccceeeee-cCCc---------------------- Confidence 12244566677888775331 456666666555544211 1110 Q ss_pred EEEEeecCCCce--eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDPVN--VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP~~--~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ..+.+.||.. -.+.+--+--..+.+|.++++++.-+|- T Consensus 232 --~vE~~Rd~~~~~d~i~~~~~y~~~~~~~~~~v~~tk~~~~ 271 (274) T protein:vir:96 232 --FLETDRDPSTKTTALYSDKHYVAYLYDESKAVKITKGSGS 271 (274) T ss_pred --ccccccccccccCEEEEeEEEEEEEEcCCcEEEEEcCCcc Confidence 1111222222 2222223344566778888888877777 No 22 >protein:vir:95898 Length: 274 # NCBI annotation: ORF014 # Family: family:all:522 # MgeID: mge:1588 # MgeName: 71 # Cross-refs: genbank:acc:YP_240385;genbank:gi:66396054;genbank:GeneID:5133409 Probab=96.14 E-value=0.00096 Score=37.14 Aligned_cols=257 Identities=14% Similarity=0.140 Sum_probs=119.4 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccc--- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVS--- 72 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~--- 72 (348) ||+ +.|+|.|..+..++.+.-. ....|...-+.+.+ +.+..|..+--|+...-+... +.+... T Consensus 1 m~~~~T~l~d~i~Pev~~~~v~~~~~------~~l~~~~~~~~~~~---l~g~~G~tv~iP~~~~ig~a~~~~~g~~i~~ 71 (274) T protein:vir:95 1 MAQGMTKLTNQIVPEVLAPMMQAELE------KKLRFASFAEIDNT---LVGQPGDTLTFPAFIYSGDAKVVAEGEKIPT 71 (274) T ss_pred CCcceeehhheechHHHHHHHHHHHH------hhhhccccceeccc---ccCCCCCEEEeeeecCCCccccccCCCccch Confidence 887 6799999999999976432 12223222111222 234445555445543322211 111111 Q ss_pred --e--eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 73 --A--EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 73 --~--~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) . ......+-+. .+.+...|+..++...+ .+.+-.+.+...+.+..+-.++.++.++...+ T Consensus 72 ~~lt~~~~~~~i~~~--~~a~~i~D~~~~~~~~d------------~~~~~~~~~~~~~a~~vd~~i~~~l~~a~~~~-- 135 (274) T protein:vir:95 72 DILETKKREAKIRKI--AKGTSISDEALLSGYGD------------PQGEQVRQHGLAHANKVDDDVLEALKSAKLTV-- 135 (274) T ss_pred hhcccceeEEEeeee--ecceeehHHHHhhccch------------HHHHHHHHHHHHHHHHHHHHHHHHHhcccccc-- Confidence 1 1111122111 22344444433332221 12222333445555555555666665432111 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) + +++...+.|.+....+.+.+..+..++|+++++..|++++...-. ........ T Consensus 136 -----------------------~-~~~~~~d~i~~A~~~lgd~~~~~~~ivv~p~~~~~L~k~~~~~f~-~~s~~g~~- 189 (274) T protein:vir:95 136 -----------------------E-ADITKLTGLQTAIDKFNDEDLEPMVLFISPLDAGKLRGDATTNFT-RATELGDD- 189 (274) T ss_pred -----------------------c-ccccCHHHHHHHHHHhccccccccEEEeCHHHHHHHHhhcccccc-cccccccc- Confidence 0 011113445555555655556788999999999999887632211 11111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) -..+..++.+.|.+|++=+. +|+++.++...+.+|... +... T Consensus 190 ---~~~~G~ig~~~G~~Vi~s~~------------~~~~t~~l~~~gA~~~~~-~~~~---------------------- 231 (274) T protein:vir:95 190 ---VIVKGAFGEALGAVIVRSNK------------LEAGTAILAKKGAVKLIT-KRDF---------------------- 231 (274) T ss_pred ---ceeccccceecCeEEEEeCC------------CCCceEEEEeccceeeee-cCCc---------------------- Confidence 12244566677888775331 456666666555544211 1110 Q ss_pred EEEEeecCCCce--eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDPVN--VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP~~--~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ..+.+.||.. -.+.+--+--..+.+|.++++++.-+|- T Consensus 232 --~vE~~Rd~~~~~d~i~~~~~y~~~~~~~~~~v~~tk~~~~ 271 (274) T protein:vir:95 232 --FLETDRDPSTKTTALYSDKHYVAYLYDESKAVKITKGSGS 271 (274) T ss_pred --ccccccccccccCEEEEeEEEEEEEEcCCcEEEEEcCCcc Confidence 1111222222 2222223344566778888888877777 No 23 >protein:vir:95107 Length: 270 # NCBI annotation: ORF013 # Family: family:all:522 # MgeID: mge:1549 # MgeName: X2 # Cross-refs: genbank:acc:YP_240822;genbank:gi:66394683;genbank:GeneID:5133901 Probab=95.99 E-value=0.0012 Score=36.70 Aligned_cols=254 Identities=12% Similarity=0.065 Sum_probs=117.1 Q ss_pred Cc--cchhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eeccccee--- Q lcl|Aclame:pro 1 MG--LIYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVSAE--- 74 (348) Q Consensus 1 Ma--~l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~~~--- 74 (348) || .+.|++.|..+..|+.+.-... ..|.+--.+.. .+.+..|..+--|+...-+++. +.+..... T Consensus 1 Ma~T~~~d~I~Pev~~~~V~e~~~~~-----~~~~~~~~~d~----~L~g~~G~ti~~P~~~~igdae~~~eg~~i~~~~ 71 (270) T protein:vir:95 1 MTQTKKANLINPEVLANVVSAQMQNA-----IRFTPYAVTDD----TLVGQPGDTITRPKYAYIGAAEDLQEGVAMDTTQ 71 (270) T ss_pred CCceehhhhcchHHHHHHHHHHHHhH-----Hhhcccccccc----ccCCCCCCEEEeeeecCCCccccccCCCccchhh Confidence 99 4789999999999997653211 22333222211 1334556666666654433332 11111110 Q ss_pred ----eeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCc Q lcl|Aclame:pro 75 ----IHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDG 150 (348) Q Consensus 75 ----~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~ 150 (348) .....+-+. ...+...|+..+. ..+ +-+.+-...+...+.++.+..++.+|.+.. T Consensus 72 lt~~~~~a~i~~~--gk~~~itD~a~~~---~~~---------dp~~~~~~q~a~~~a~~~d~~li~~l~~a~------- 130 (270) T protein:vir:95 72 MSMTTTKVTVKET--GKAVEVTQTAIIT---NVN---------GTLQEASRQLAMSLADKVEIDYIAELNKSK------- 130 (270) T ss_pred cccchheeeeehh--hCcceecHHHHhh---hcc---------chHHHHHHHHHHHHHHHHHHHHHHHhcccc------- Confidence 001111111 1122222222221 111 222333444556666666666777775321 Q ss_pred eeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccccc Q lcl|Aclame:pro 151 VNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVT 230 (348) Q Consensus 151 ~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~ 230 (348) |+...+.-.++|......+.+.+..++.++|+++++..|+++..+.. ...... T Consensus 131 --------------------~~~~~~~t~~~~~dA~~~lgd~~~~~~~i~vhs~~~~~Lrk~~~~~~----~~~~~~--- 183 (270) T protein:vir:95 131 --------------------QTATVSADATGILDAIEVFNSENDEDYVLYVNPKDYNKLVKSLFKVG----GNVQDR--- 183 (270) T ss_pred --------------------cccccccCHHHHHHHHHHhccccCCCcEEEEcHHHHHHHHhhhcccc----cccccc--- Confidence 11111112345555556666666778899999999999988763321 111111 Q ss_pred HHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEE Q lcl|Aclame:pro 231 KAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAV 310 (348) Q Consensus 231 ~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~ 310 (348) ...+..++.+.|.++++-|.. .++++.++.-.+.+|... +. ++. T Consensus 184 -~~~~G~ig~~~G~~Viv~s~~-----------~~~~~~~l~~~gAi~~~~-~~----------------------~~~- 227 (270) T protein:vir:95 184 -AISKGDLVEIVGVSDIVKSKR-----------VSENTAFLQRYGAMEIVN-KK----------------------KPE- 227 (270) T ss_pred -hhcccccceecceeEEEeCCC-----------CCceeEEEEeccceeeee-cC----------------------Cce- Confidence 122334555667776643321 234555666555544211 10 000 Q ss_pred EEeecCCCcee--EEeeeeeeeeeecCCCcEEEEEEe-cCC Q lcl|Aclame:pro 311 TTTKTTDPVNV--QTKVSMVALPSFERLGDVYMLTVI-PGV 348 (348) Q Consensus 311 ~~~~~~dP~~~--~~~~~s~~lPv~~~~~~~~~~~V~-~~~ 348 (348) .+.++|+... .+.+-.+-...+.++..++++|.- ||- T Consensus 228 -vEtdRd~~~~~d~i~~~~~y~v~~~~~skvv~~t~~~a~~ 267 (270) T protein:vir:95 228 -AYTDFDILKRTHLLSTNYHYSVNLKDETGVVKVTFKPSGS 267 (270) T ss_pred -eeeccchhhcccEEEeeeEEEEEEEccceEEEEEecCCCC Confidence 1111122111 222223344556667777777664 222 No 24 >protein:vir:97433 Length: 274 # NCBI annotation: ORF014 # Family: family:all:522 # MgeID: mge:1676 # MgeName: 92 # Cross-refs: genbank:acc:YP_240749;genbank:gi:66396420;genbank:GeneID:5133789 Probab=95.79 E-value=0.0015 Score=36.14 Aligned_cols=257 Identities=15% Similarity=0.139 Sum_probs=118.2 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccce-- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVSA-- 73 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~~-- 73 (348) ||+ +.|++.|..+..++.+.... .+ .|...-+.+.+. .+..|..+--|+...-+... +.+.... T Consensus 1 ma~~~T~~~d~iiPev~~~~v~~~~~~--~l----~~~~~~~~d~~l---~g~~G~tv~iP~~~~~g~a~~~~~g~~i~~ 71 (274) T protein:vir:97 1 MPQGLTKTSDQIIPEVLAPMMQAQLEK--KL----RFASFAEVDSTL---QGQPGDTLTFPAFVYSGDAQVVAEGEKIPT 71 (274) T ss_pred CCccceehhheechHHHHHHHHHhhhh--hh----hhcccceecccc---cCCCCCEEEEeeecCCCccccccCCCcccc Confidence 997 56899999999999765421 12 222211122111 23334444445443221111 1111111 Q ss_pred -----eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 74 -----EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 74 -----~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) ......+-+. .+.+...|+..++.. ++ .+.. -.+.+..++.+..+-.++.+|.++.... T Consensus 72 ~~lt~~~~~~~i~~~--~~~~~i~D~~~~~~~---~d--p~~~-------~~~~~a~a~a~~vd~~~~~~l~~a~~~~-- 135 (274) T protein:vir:97 72 DILETKKREAKIRKI--AKGTSITDEALLSGY---GD--PQGE-------QVRQHGLAHANKVDNDVLEALMGAKLTV-- 135 (274) T ss_pred cccccceeEEEeeee--cceecccHHHHHhcc---ch--HHHH-------HHHHHHHHHHHHHHHHHHHHHhccCccc-- Confidence 1111222111 122333333333221 11 1222 2344445666666666666665432111 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) ++++...+.|......+.+.+..+..++|+++++..|++++...- +......... T Consensus 136 ------------------------~~~~~~~d~i~dA~~~l~d~~~~~~~ivv~p~~~~~L~k~~~~~f-~~~s~~g~~~ 190 (274) T protein:vir:97 136 ------------------------NADITKLNGLQSAIDKFNDEDLEPMVLFVNPLDAGKLRGDASTNF-TRATELGDDI 190 (274) T ss_pred ------------------------cccccCHHHHHHHHHHhhccCCCceEEEeCHHHHHHHHhhhhhhc-cccCcccccc Confidence 011112455656666666666678899999999999988754321 1111111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) ..+..++.+.|.+|++=+ -+|+++.+++..+.+|... +.... T Consensus 191 ----~~~G~ig~~~G~~Vi~s~------------~~p~~t~~l~~~gA~~~~~-~~~~~--------------------- 232 (274) T protein:vir:97 191 ----IVKGAFGEALGAIIVRTN------------KLEAGTAILAKKGAVKLIL-KRDFF--------------------- 232 (274) T ss_pred ----eeccccceecCeeEEEcC------------CCCcceEEEEeCcceEeee-cCCce--------------------- Confidence 123445566677776522 1467777777666655322 11100 Q ss_pred EEEEeecCCCce--eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDPVN--VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP~~--~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+.++||.. -.+.+--+--..+.+|.++++++...+- T Consensus 233 ---vE~~Rd~~~~~d~i~~~~~y~~~~~~~~~vv~~t~~~~~ 271 (274) T protein:vir:97 233 ---LEVARDASTKTTALYSDKHYVAYLYDESKAVKITKGSGS 271 (274) T ss_pred ---eccccchhhcccEEEEEEEEEEEEEcCCceEEEecCccc Confidence 011111111 1122222333456677777777766555 No 25 >protein:vir:94494 Length: 274 # NCBI annotation: ORF015 # Family: family:all:522 # MgeID: mge:1508 # MgeName: 88 # Cross-refs: genbank:acc:YP_240676;genbank:gi:66396348;genbank:GeneID:5133758 Probab=95.79 E-value=0.0015 Score=36.14 Aligned_cols=257 Identities=15% Similarity=0.139 Sum_probs=118.2 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccce-- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVSA-- 73 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~~-- 73 (348) ||+ +.|++.|..+..++.+.... .+ .|...-+.+.+. .+..|..+--|+...-+... +.+.... T Consensus 1 ma~~~T~~~d~iiPev~~~~v~~~~~~--~l----~~~~~~~~d~~l---~g~~G~tv~iP~~~~~g~a~~~~~g~~i~~ 71 (274) T protein:vir:94 1 MPQGLTKTSDQIIPEVLAPMMQAQLEK--KL----RFASFAEVDSTL---QGQPGDTLTFPAFVYSGDAQVVAEGEKIPT 71 (274) T ss_pred CCccceehhheechHHHHHHHHHhhhh--hh----hhcccceecccc---cCCCCCEEEEeeecCCCccccccCCCcccc Confidence 997 56899999999999765421 12 222211122111 23334444445443221111 1111111 Q ss_pred -----eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 74 -----EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 74 -----~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) ......+-+. .+.+...|+..++.. ++ .+.. -.+.+..++.+..+-.++.+|.++.... T Consensus 72 ~~lt~~~~~~~i~~~--~~~~~i~D~~~~~~~---~d--p~~~-------~~~~~a~a~a~~vd~~~~~~l~~a~~~~-- 135 (274) T protein:vir:94 72 DILETKKREAKIRKI--AKGTSITDEALLSGY---GD--PQGE-------QVRQHGLAHANKVDNDVLEALMGAKLTV-- 135 (274) T ss_pred cccccceeEEEeeee--cceecccHHHHHhcc---ch--HHHH-------HHHHHHHHHHHHHHHHHHHHHhccCccc-- Confidence 1111222111 122333333333221 11 1222 2344445666666666666665432111 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) ++++...+.|......+.+.+..+..++|+++++..|++++...- +......... T Consensus 136 ------------------------~~~~~~~d~i~dA~~~l~d~~~~~~~ivv~p~~~~~L~k~~~~~f-~~~s~~g~~~ 190 (274) T protein:vir:94 136 ------------------------NADITKLNGLQSAIDKFNDEDLEPMVLFVNPLDAGKLRGDASTNF-TRATELGDDI 190 (274) T ss_pred ------------------------cccccCHHHHHHHHHHhhccCCCceEEEeCHHHHHHHHhhhhhhc-cccCcccccc Confidence 011112455656666666666678899999999999988754321 1111111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) ..+..++.+.|.+|++=+ -+|+++.+++..+.+|... +.... T Consensus 191 ----~~~G~ig~~~G~~Vi~s~------------~~p~~t~~l~~~gA~~~~~-~~~~~--------------------- 232 (274) T protein:vir:94 191 ----IVKGAFGEALGAIIVRTN------------KLEAGTAILAKKGAVKLIL-KRDFF--------------------- 232 (274) T ss_pred ----eeccccceecCeeEEEcC------------CCCcceEEEEeCcceEeee-cCCce--------------------- Confidence 123445566677776522 1467777777666655322 11100 Q ss_pred EEEEeecCCCce--eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDPVN--VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP~~--~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+.++||.. -.+.+--+--..+.+|.++++++...+- T Consensus 233 ---vE~~Rd~~~~~d~i~~~~~y~~~~~~~~~vv~~t~~~~~ 271 (274) T protein:vir:94 233 ---LEVARDASTKTTALYSDKHYVAYLYDESKAVKITKGSGS 271 (274) T ss_pred ---eccccchhhcccEEEEEEEEEEEEEcCCceEEEecCccc Confidence 011111111 1122222333456677777777766555 No 26 >protein:vir:1239 Length: 274 # NCBI annotation: similar to phage B1 major head protein # Family: family:all:522 # MgeID: mge:25 # MgeName: phi ETA # Cross-refs: genbank:acc:NP_510938;genbank:gi:17426272;genbank:GeneID:927376 Probab=95.72 E-value=0.0016 Score=35.96 Aligned_cols=257 Identities=14% Similarity=0.123 Sum_probs=116.6 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccce-- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVSA-- 73 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~~-- 73 (348) ||+ +.|++.|..+..++.+... ....|...-+.+.+ +.+..|..+--|+...-+... +.+.... T Consensus 1 ma~~~T~l~d~iiPev~~~~v~~~~~------~~l~~~~~~~~d~~---l~g~~G~tv~iP~~~~ig~a~~~~~g~~i~~ 71 (274) T protein:vir:12 1 MAQGLTKTSNQIIPEVLAPMMQAQLE------KKLRFASFAEVDST---LQGQPGDTLTFPAFVYSGDAQVVAEGEKIPT 71 (274) T ss_pred CCcceeehhhhhchHHHHHHHHHHHH------hhhhhcccceeccc---ccCCCCCEEEEeeecCCCccccccCCCccch Confidence 997 5689999999999975431 12233222222222 234445555555544322221 1111111 Q ss_pred -----eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 74 -----EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 74 -----~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) +.....+-+ ..+.+...|+..++... + .+..+ .+.+...+.+..+-.++..+.++... T Consensus 72 ~~lt~~~~~~~i~~--~~~~~~i~D~~~~~~~~---d--~~~~~-------~~q~~~~~a~~vd~~~l~~~~~a~~~--- 134 (274) T protein:vir:12 72 DILETKKREAKIRK--IAKGTSITDEALLSGYG---D--PQGEQ-------VRQHGLAHANKVDNDVLEALMGAKLT--- 134 (274) T ss_pred hhcccceeeEEeee--ecceeeecHHHHHhccc---c--hHHHH-------HHHHHHHHHHHHHHHHHHHHhccccc--- Confidence 111112211 12233344443333222 1 12222 23334445555555556666433211 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) .++++...+.|-.....+.+.+..+..++|+++++..|++++... .+........ T Consensus 135 -----------------------~~~~a~~~d~i~dA~~~lgd~~~~~~~ivv~p~~~~~L~k~~~~~-fv~~s~~g~~- 189 (274) T protein:vir:12 135 -----------------------VNADITKLNGLQSAIDKFNDEDLEPMVLFINPLDAGKLRGDASTN-FTRATELGDD- 189 (274) T ss_pred -----------------------ccccccCHHHHHHHHHHhccccccccEEEeCHHHHHHHHhhhhhh-cccccccccc- Confidence 111222344455555556555557888999999999998876322 1111111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) ...+..++.+.|.+|++=| -+|.++.++...+.+|... +... T Consensus 190 ---~~~~G~ig~~~G~~Vi~s~------------~~p~~t~~l~~~gA~~~~~-~~~~---------------------- 231 (274) T protein:vir:12 190 ---IIVKGAFGEALGAIIVRSN------------KLEAGTAILAKKGAVKLIL-KRDF---------------------- 231 (274) T ss_pred ---ceecccceeecCeeEEEeC------------CCCcceEEEEeccceeeee-cCCc---------------------- Confidence 1224455666788776632 1456666666555544221 1110 Q ss_pred EEEEeecCCCce--eEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDPVN--VQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP~~--~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ..+...||.. -.+.+-.+--..+.+|..+++++.-.+- T Consensus 232 --~vE~~Rd~~~~~d~i~~~~~y~~~~~~~~~vv~~t~~~~~ 271 (274) T protein:vir:12 232 --FLEVARDASTKTTALYSDKHYVAYLYDESKAVKITKGSGS 271 (274) T ss_pred --eeccccchhhcccEEEeeeEEEEEEEcCCceEEEEcCCcc Confidence 0111111111 1222223334455677777777755444 No 27 >protein:vir:96833 Length: 275 # NCBI annotation: ORF015 # Family: family:all:522 # MgeID: mge:1642 # MgeName: EW # Cross-refs: genbank:acc:YP_240157;genbank:gi:66395822;genbank:GeneID:5133174 Probab=95.21 E-value=0.0025 Score=34.83 Aligned_cols=257 Identities=12% Similarity=0.088 Sum_probs=115.4 Q ss_pred Ccc---chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eecccce--- Q lcl|Aclame:pro 1 MGL---IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRVSA--- 73 (348) Q Consensus 1 Ma~---l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~~~--- 73 (348) |++ +.|++.|..+..++++.-. ....|...-+.+.+ +.+..|..+--|+...-+... +.+...+ T Consensus 3 ~~~~T~l~d~i~PEv~~~~v~~~~~------~~~~~~~~~~~~~~---l~g~~G~tv~iP~~~~ig~a~~~~~g~~i~~~ 73 (275) T protein:vir:96 3 LENMTKLANMVNPEVLAPMMQAELD------KKLKFAQFADIDNT---LVGQPGNTITFPAFVYSGDAKVVPEGEEIPID 73 (275) T ss_pred CcccchhhhhhchHHHHHHHHHHHH------Hhhhhcccceeccc---ccCCCCCEEEeeeeccCCccccccCCCCcchh Confidence 554 5689999999999976532 12233222222222 234445555555544322221 1111111 Q ss_pred ----eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCC Q lcl|Aclame:pro 74 ----EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSD 149 (348) Q Consensus 74 ----~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~ 149 (348) ......+-+. ...+...|+..++... +.+.+-.+.+...+.++.+--++..+.++... T Consensus 74 ~lt~~~~~~~i~~~--~~~~~i~D~~~~~~~~------------d~~~~~~~~~a~~~a~~~d~~ll~~l~~a~~~---- 135 (275) T protein:vir:96 74 LIETKKRQATIRKI--GKGTVLTDEALLSGYG------------DPKGEAVRQHGLAIANKVDNDVLEALQGATLK---- 135 (275) T ss_pred hcccceeeEEeehh--cccccccHHHHHhhcc------------chHHHHHHHHHHHHHHHHHHHHHHHHhccccc---- Confidence 1111111111 1222233332222211 22233334444555556555566666432211 Q ss_pred ceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccc Q lcl|Aclame:pro 150 GVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSV 229 (348) Q Consensus 150 ~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~ 229 (348) ... ++.-.+.|-.....+.+.+..+..++|+++++..|++++...-. ......... T Consensus 136 ---------------~~~-------~~~~~d~i~dA~~~lgd~~~~~~~ivv~p~~~~~L~k~~~~~f~-~~~~~g~~~- 191 (275) T protein:vir:96 136 ---------------VEA-------DITKLAGLQTAIDKFNDEDLEPMVLFVNPLDAGKLRASATDNFT-RATLLGDNV- 191 (275) T ss_pred ---------------ccc-------cccCHHHHHHHHHHhccccCCccEEEeCHHHHHHHHhccccccc-ccccccccc- Confidence 100 11113445555555655556788999999999999887532110 111111111 Q ss_pred cHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceE Q lcl|Aclame:pro 230 TKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIA 309 (348) Q Consensus 230 ~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~ 309 (348) ..+..++.+.|.+|++=+. +|+++.+++..+.+|... .... T Consensus 192 ---~~~G~ig~~~G~~Vi~s~~------------~p~~t~~i~~~gA~~~~~-~~~~----------------------- 232 (275) T protein:vir:96 192 ---IVKGAFGEALGAIIVRSNK------------IKEGEAILAKRGAVKLIT-KRDF----------------------- 232 (275) T ss_pred ---eeccccceecCeeEEEeCC------------CCcceEEEEeccceeeee-cCCc----------------------- Confidence 1234456667887765331 356666666555544211 1110 Q ss_pred EEEeecCCCc--eeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 310 VTTTKTTDPV--NVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 310 ~~~~~~~dP~--~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ..+.++|+. .-.+.+-.+--..+.+|.++++++..|.- T Consensus 233 -~vE~~Rd~~~~~d~i~~~~~y~~~~~~~~~vv~~t~~~~~ 272 (275) T protein:vir:96 233 -FLETERHASHKSTALFSDKHYVAYLYDESKVVKITKSASG 272 (275) T ss_pred -ccccccchhhcCcEEEEeEEEEEEEEcCccEEEEEecccc Confidence 001111111 12222223333456678888888877433 No 28 >protein:vir:3033 Length: 272 # NCBI annotation: major capsid protein # Family: family:all:522 # MgeID: mge:61 # MgeName: PhiNIH1.1 # Cross-refs: genbank:acc:NP_438146;genbank:gi:16271809;genbank:GeneID:929235 Probab=94.90 E-value=0.0032 Score=34.24 Aligned_cols=260 Identities=11% Similarity=0.090 Sum_probs=113.4 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCC-Cc---cccceeEEEEEeecCceeeeeeeeCCCCcceecccc Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFP-AR---KQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVS 72 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp-~~---~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~ 72 (348) ||+ +.++|.|..+..++.+... ....+ ..+-. .. ......+.... ... ...+..+..+...+. ..-+ T Consensus 1 MA~~~T~~~~~~iPev~s~~v~~~~~-~~~~~-~~~~~~~~~~~g~~G~tv~iP~-~~~-~~~a~~v~eg~~i~~-~~~~ 75 (272) T protein:vir:30 1 MAVGTTKMAQMLDPEVLADMIDAEVG-KAIRF-APLAEVDTTLEGQPGTTLTVPK-WDY-IGDAEDVAEGEAIPM-TQLG 75 (272) T ss_pred CCCccccchheechHHHHHHHHHHHH-HHhhh-hccccccccccCCCCCEEEEEE-ecC-CCCcccccCCCcccc-cccc Confidence 995 4578999999988865432 11111 11110 00 01111111111 111 111233333333222 2223 Q ss_pred eeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCcee Q lcl|Aclame:pro 73 AEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVN 152 (348) Q Consensus 73 ~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~ 152 (348) .......+-+++....++..+ ..+.. ......+. +.+...+.+..|..+...+.+.. T Consensus 76 ~~~~~~~~~~~~~~~~itd~~--~~~s~-----~d~~~~~~-------~~~~~~~a~~~d~~i~~~~~~a~--------- 132 (272) T protein:vir:30 76 FKKTTMTIKKAGKGVEITDEA--ILSGY-----GDPVGQAA-------KQIVEAIDHKVDADVLDALSKST--------- 132 (272) T ss_pred cceEEEEeeeeeeeeeecHHH--Hhhcc-----ccHHHHHH-------HHHHHHHHHHHHHHHHHHhcccc--------- Confidence 444444444444333443322 22211 11222222 33334444555555555553211 Q ss_pred EEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHH Q lcl|Aclame:pro 153 KDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKA 232 (348) Q Consensus 153 ~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~ 232 (348) +.++. ....++|.+....+.+.+..+..++|+++++..|++++...- .......... T Consensus 133 ----------~~~~~--------~~t~d~i~da~~~l~~~~~~~~~~vv~p~~~~~L~k~~~~~~-~~~~~~~~~~---- 189 (272) T protein:vir:30 133 ----------QTVEA--------TATVDGVSKALDIFNDEDDAETVIVMNPADASTLRLDAAKEW-LGATEVGANR---- 189 (272) T ss_pred ----------ccccc--------ccCHHHHHHHHHHHhccCCCccEEEEcHHHHHHHHHhccccc-cccccccccc---- Confidence 11111 112345556666676667778899999999999876653321 1111111111 Q ss_pred HHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEE Q lcl|Aclame:pro 233 ELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTT 312 (348) Q Consensus 233 ~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 312 (348) ..+..++.+.|+++++=+ .+|+++++++..+.++...-.. +.+.+ T Consensus 190 ~~~g~ig~i~G~~Vi~s~------------~~p~~t~~~~~~~a~~~~~~~~-----------------------~~ve~ 234 (272) T protein:vir:30 190 VVSGVYGEVLGVQIVRSR------------KCPKGTAYMVRKGALRIMLKRN-----------------------TMVET 234 (272) T ss_pred cccccchhhcCeeEEEcC------------CCCcceEEEEcCCeEEEEecCC-----------------------ceeee Confidence 112233455677665422 2467777777665443322111 11111 Q ss_pred eecCCCc--eeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 313 TKTTDPV--NVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 313 ~~~~dP~--~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) +.++. .-.+.+-.+.-.-+.+|.+++.+|+-|-- T Consensus 235 --~r~~~~~~~~i~~~~~~~~~v~~~~~vv~~t~~~a~ 270 (272) T protein:vir:30 235 --DRDITKAINQIVANKHYGVYLYKAEKAVKITLKDAA 270 (272) T ss_pred --ccccccceeEEEEEEEEEEEEEcCCceEEEEecccc Confidence 11111 12222223333445678888888887333 No 29 >protein:vir:9820 Length: 272 # NCBI annotation: putative major capsid/head protein # Family: family:all:522 # MgeID: mge:176 # MgeName: 315.4 # Cross-refs: genbank:acc:NP_795582;genbank:gi:28876339;genbank:GeneID:1257858 Probab=94.90 E-value=0.0032 Score=34.24 Aligned_cols=260 Identities=11% Similarity=0.090 Sum_probs=113.4 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCC-Cc---cccceeEEEEEeecCceeeeeeeeCCCCcceecccc Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFP-AR---KQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVS 72 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp-~~---~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~ 72 (348) ||+ +.++|.|..+..++.+... ....+ ..+-. .. ......+.... ... ...+..+..+...+. ..-+ T Consensus 1 MA~~~T~~~~~~iPev~s~~v~~~~~-~~~~~-~~~~~~~~~~~g~~G~tv~iP~-~~~-~~~a~~v~eg~~i~~-~~~~ 75 (272) T protein:vir:98 1 MAVGTTKMAQMLDPEVLADMIDAEVG-KAIRF-APLAEVDTTLEGQPGTTLTVPK-WDY-IGDAEDVAEGEAIPM-TQLG 75 (272) T ss_pred CCCccccchheechHHHHHHHHHHHH-HHhhh-hccccccccccCCCCCEEEEEE-ecC-CCCcccccCCCcccc-cccc Confidence 995 4578999999988865432 11111 11110 00 01111111111 111 111233333333222 2223 Q ss_pred eeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCcee Q lcl|Aclame:pro 73 AEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVN 152 (348) Q Consensus 73 ~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~ 152 (348) .......+-+++....++..+ ..+.. ......+. +.+...+.+..|..+...+.+.. T Consensus 76 ~~~~~~~~~~~~~~~~itd~~--~~~s~-----~d~~~~~~-------~~~~~~~a~~~d~~i~~~~~~a~--------- 132 (272) T protein:vir:98 76 FKKTTMTIKKAGKGVEITDEA--ILSGY-----GDPVGQAA-------KQIVEAIDHKVDADVLDALSKST--------- 132 (272) T ss_pred cceEEEEeeeeeeeeeecHHH--Hhhcc-----ccHHHHHH-------HHHHHHHHHHHHHHHHHHhcccc--------- Confidence 444444444444333443322 22211 11222222 33334444555555555553211 Q ss_pred EEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHH Q lcl|Aclame:pro 153 KDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKA 232 (348) Q Consensus 153 ~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~ 232 (348) +.++. ....++|.+....+.+.+..+..++|+++++..|++++...- .......... T Consensus 133 ----------~~~~~--------~~t~d~i~da~~~l~~~~~~~~~~vv~p~~~~~L~k~~~~~~-~~~~~~~~~~---- 189 (272) T protein:vir:98 133 ----------QTVEA--------TATVDGVSKALDIFNDEDDAETVIVMNPADASTLRLDAAKEW-LGATEVGANR---- 189 (272) T ss_pred ----------ccccc--------ccCHHHHHHHHHHHhccCCCccEEEEcHHHHHHHHHhccccc-cccccccccc---- Confidence 11111 112345556666676667778899999999999876653321 1111111111 Q ss_pred HHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEE Q lcl|Aclame:pro 233 ELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTT 312 (348) Q Consensus 233 ~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 312 (348) ..+..++.+.|+++++=+ .+|+++++++..+.++...-.. +.+.+ T Consensus 190 ~~~g~ig~i~G~~Vi~s~------------~~p~~t~~~~~~~a~~~~~~~~-----------------------~~ve~ 234 (272) T protein:vir:98 190 VVSGVYGEVLGVQIVRSR------------KCPKGTAYMVRKGALRIMLKRN-----------------------TMVET 234 (272) T ss_pred cccccchhhcCeeEEEcC------------CCCcceEEEEcCCeEEEEecCC-----------------------ceeee Confidence 112233455677665422 2467777777665443322111 11111 Q ss_pred eecCCCc--eeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 313 TKTTDPV--NVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 313 ~~~~dP~--~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) +.++. .-.+.+-.+.-.-+.+|.+++.+|+-|-- T Consensus 235 --~r~~~~~~~~i~~~~~~~~~v~~~~~vv~~t~~~a~ 270 (272) T protein:vir:98 235 --DRDITKAINQIVANKHYGVYLYKAEKAVKITLKDAA 270 (272) T ss_pred --ccccccceeEEEEEEEEEEEEEcCCceEEEEecccc Confidence 11111 12222223333445678888888887333 No 30 >protein:vir:4600 Length: 415 # NCBI annotation: capsid protein # Family: family:all:21 # MgeID: mge:101 # MgeName: PVL # Cross-refs: genbank:acc:NP_058445;genbank:gi:9635171;genbank:GeneID:1262708 Probab=94.89 E-value=0.0033 Score=34.22 Aligned_cols=281 Identities=11% Similarity=0.035 Sum_probs=125.7 Q ss_pred Cccch-----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGLIY-----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~l~-----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) ++... ...-|..+...|.+...... -+.+ +....++.................+.++..++..+-.+...+.. T Consensus 120 ~~~~~~t~~g~~~iP~~~~~~ii~~~~~~~-~l~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~v~Eg~~~~~~~~~~~~~ 197 (415) T protein:vir:46 120 QGGSLKTDSGFVVIPEEIVTDILKLKEVEF-NLDK-YVTVKRVTNGSGKYPVVRQSEVAALEKVEELEENPELAVKPFFQ 197 (415) T ss_pred hhccccccCCcccccHHHHHHHHHHHHhhh-hhhh-hcceeeccCCceeEEEEEecCCcceeecccccccccccccceee Confidence 11000 11223333333333332222 2323 33333333333222211112222345666666655444456777 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-.+.....++.+-+ .++. . .+...+ ...+..++.+.+|..+....-+|.-. .... T Consensus 198 v~~~~~k~~~~~~iS~ell------~ds~-~----~l~~~i---~~~l~~~i~~~~d~~il~g~g~g~~~------~~~~ 257 (415) T protein:vir:46 198 LAYDINTHRGYFRISREAI------EDAK-V----NVLQEL---KLWMARTIAATRNKAIIDVITKGSTG------STSS 257 (415) T ss_pred EEeeeeeeEeeehhhHHHH------hhch-H----HHHHHH---HHHHHHHHHHHHHHHHhhccccCCcc------cccc Confidence 7777776766666654322 1111 1 111222 34456667777776665444322210 0000 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) ........+..++...++||.+++..+...+..+..++|++..|..|+. +++.- + ...+.+...+ T Consensus 258 -------~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~v~n~~~~~~L~~---lkd~~----G-~~i~~~~~~~ 322 (415) T protein:vir:46 258 -------GFEKEGKKLEVKKAKSLDDIKDAINLNVKPNYEHNVAIVSQTMFAKLDK---MKDKL----G-NYLIQPDVKE 322 (415) T ss_pred -------ccccccceeccccccchHHHHHHHHhhhhhccCCCEEEEcHHHHHHHHH---hhccC----C-CeeeccCcCC Confidence 0011122344456677888888887777767778899999999998743 33221 1 1111111111 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|.++++.+.......|+. .++|..-.. +...+ ...++.+. |.. T Consensus 323 ~~~~~l~G~pV~~~~~~~~~~~~~~-------~~~~gd~~~-~~~~~---------------------~~~~~~v~-~~~ 372 (415) T protein:vir:46 323 KTQQRLLGAKIEILPDEVLGQKGNN-------TLIIGNLKD-AIVLF---------------------DRSQYQAS-WTD 372 (415) T ss_pred CCCccccceeeEEeccccccCCCcc-------EEEEEehhc-cEEEE---------------------eecceEEE-eec Confidence 1112345777766654321111111 122221111 00000 00111111 111 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+-.....++..+.=..+.+|++++.+++.+-+ T Consensus 373 ~~~~~~~~~~~~r~d~~v~~~~a~~~~~~~~~~ 405 (415) T protein:vir:46 373 YMHFGECLMIAVRQDCRILDYKSAIVIEYDDSE 405 (415) T ss_pred cccCceEEEEEEEeccEEeccccEEEEEeeccC Confidence 111123345556666778899999999999877 No 31 >protein:vir:4700 Length: 415 # NCBI annotation: phi PVL ORF 7 homologue # Family: family:all:21 # MgeID: mge:102 # MgeName: phiPV83 # Cross-refs: genbank:acc:NP_061632;genbank:gi:9635719;genbank:GeneID:1262976 Probab=94.89 E-value=0.0033 Score=34.22 Aligned_cols=281 Identities=11% Similarity=0.035 Sum_probs=125.7 Q ss_pred Cccch-----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGLIY-----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~l~-----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) ++... ...-|..+...|.+...... -+.+ +....++.................+.++..++..+-.+...+.. T Consensus 120 ~~~~~~t~~g~~~iP~~~~~~ii~~~~~~~-~l~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~v~Eg~~~~~~~~~~~~~ 197 (415) T protein:vir:47 120 QGGSLKTDSGFVVIPEEIVTDILKLKEVEF-NLDK-YVTVKRVTNGSGKYPVVRQSEVAALEKVEELEENPELAVKPFFQ 197 (415) T ss_pred hhccccccCCcccccHHHHHHHHHHHHhhh-hhhh-hcceeeccCCceeEEEEEecCCcceeecccccccccccccceee Confidence 11000 11223333333333332222 2323 33333333333222211112222345666666655444456777 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-.+.....++.+-+ .++. . .+...+ ...+..++.+.+|..+....-+|.-. .... T Consensus 198 v~~~~~k~~~~~~iS~ell------~ds~-~----~l~~~i---~~~l~~~i~~~~d~~il~g~g~g~~~------~~~~ 257 (415) T protein:vir:47 198 LAYDINTHRGYFRISREAI------EDAK-V----NVLQEL---KLWMARTIAATRNKAIIDVITKGSTG------STSS 257 (415) T ss_pred EEeeeeeeEeeehhhHHHH------hhch-H----HHHHHH---HHHHHHHHHHHHHHHHhhccccCCcc------cccc Confidence 7777776766666654322 1111 1 111222 34456667777776665444322210 0000 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) ........+..++...++||.+++..+...+..+..++|++..|..|+. +++.- + ...+.+...+ T Consensus 258 -------~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~v~n~~~~~~L~~---lkd~~----G-~~i~~~~~~~ 322 (415) T protein:vir:47 258 -------GFEKEGKKLEVKKAKSLDDIKDAINLNVKPNYEHNVAIVSQTMFAKLDK---MKDKL----G-NYLIQPDVKE 322 (415) T ss_pred -------ccccccceeccccccchHHHHHHHHhhhhhccCCCEEEEcHHHHHHHHH---hhccC----C-CeeeccCcCC Confidence 0011122344456677888888887777767778899999999998743 33221 1 1111111111 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|.++++.+.......|+. .++|..-.. +...+ ...++.+. |.. T Consensus 323 ~~~~~l~G~pV~~~~~~~~~~~~~~-------~~~~gd~~~-~~~~~---------------------~~~~~~v~-~~~ 372 (415) T protein:vir:47 323 KTQQRLLGAKIEILPDEVLGQKGNN-------TLIIGNLKD-AIVLF---------------------DRSQYQAS-WTD 372 (415) T ss_pred CCCccccceeeEEeccccccCCCcc-------EEEEEehhc-cEEEE---------------------eecceEEE-eec Confidence 1112345777766654321111111 122221111 00000 00111111 111 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+-.....++..+.=..+.+|++++.+++.+-+ T Consensus 373 ~~~~~~~~~~~~r~d~~v~~~~a~~~~~~~~~~ 405 (415) T protein:vir:47 373 YMHFGECLMIAVRQDCRILDYKSAIVIEYDDSE 405 (415) T ss_pred cccCceEEEEEEEeccEEeccccEEEEEeeccC Confidence 111123345556666778899999999999877 No 32 >protein:vir:96123 Length: 274 # NCBI annotation: ORF013 # Family: family:all:522 # MgeID: mge:1602 # MgeName: 37 # Cross-refs: genbank:acc:YP_240078;genbank:gi:66395742;genbank:GeneID:5133103 Probab=94.87 E-value=0.0033 Score=34.18 Aligned_cols=257 Identities=14% Similarity=0.142 Sum_probs=112.5 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eeccc---- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRV---- 71 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~---- 71 (348) ||+ +.|++.|..+..++.+... ....|...-+.+.++ .+..|..+--|+....+... +.+.. T Consensus 1 ma~~~T~~~d~i~Pev~s~~v~~~~~------~~~~~~~~~~~~~~l---~g~~G~tv~ip~~~~~g~~~~~~~g~~i~~ 71 (274) T protein:vir:96 1 MAQGTTKVSNLIVPEVLAPMMQAELD------KKLRFAQFADIDSTL---VGQPGDTLTFPAFTYSGDAQVIAEGEKIPV 71 (274) T ss_pred CCccccchhhhhhhHHHHHHHHHHHH------hhhhhcccccccccc---cCCCCCEEEEEeeccCCCccccCCCCcCch Confidence 997 5689999999999876432 122332222222221 23334444445443221111 11111 Q ss_pred ---ceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 72 ---SAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 72 ---~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) +.......+-+.+ ..+...|+...+...+ .... -...+...+.+..+-.++..|.++.. T Consensus 72 ~~it~~~~~~~i~~~~--~~~~i~D~~~~~~~~d-----~~~~-------~~~~~~~~~a~~~d~~i~~~l~~a~~---- 133 (274) T protein:vir:96 72 DQIGTSKREAKVRKIG--KGTELTDEAVLSGFGD-----PQGE-------AVRQHGLAIANKVDNDVLEALKGATL---- 133 (274) T ss_pred hhcccceeEEEEEeee--ceeeecHHHHHhhcch-----HHHH-------HHHHHHHHHHHHHHHHHHHHHhcCCC---- Confidence 1111122221212 2233334333322111 1222 23334455555666566666643211 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) ... +++.-.+.|-.....+.+.+..+..++|+++++..|++++... .+.......+. T Consensus 134 ---------------~~~-------~~~~~~d~i~dA~~~l~d~~~~~~~ivv~p~~~~~L~k~~~~~-f~~~~~~g~~~ 190 (274) T protein:vir:96 134 ---------------TVE-------ADITKLDGLQTAIDKFNDEDLEPMVLFVNPLDAGGLRTSASDN-FTRPTQLGDNI 190 (274) T ss_pred ---------------CcC-------cccccHHHHHHHHHHhcccCCCceEEEeCHHHHHHHHhccccc-ccccccccccc Confidence 100 1111134455555556555567889999999999998876321 11111111111 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCce Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGI 308 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~ 308 (348) + .+..++.+.|.+|++=+ -+|.++.+++..+.+|... +.... T Consensus 191 ~----~~g~ig~~~G~~Vi~s~------------~~p~~t~~l~~~gA~~~~~-~~~~~--------------------- 232 (274) T protein:vir:96 191 I----VKGAFGEALGAVIVRSN------------KLNKGEALLAKKGAVKLIT-KRDFF--------------------- 232 (274) T ss_pred e----eecccceecCeeEEEcC------------CCCcceEEEEeCcceeeee-cCCcc--------------------- Confidence 1 12345566787776522 1466777777666554321 21110 Q ss_pred EEEEeecCCCc--eeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 309 AVTTTKTTDPV--NVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 309 ~~~~~~~~dP~--~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) + +.+.||. .-.+.+-.+--.-+.+|.++++++.-++- T Consensus 233 -v--E~~Rd~~~~~d~i~~~~~yg~~~~~~~~vv~~t~~~~~ 271 (274) T protein:vir:96 233 -L--EKDRDASRKSTALYSDKHYVAYLYDESKVVKITKGAGD 271 (274) T ss_pred -c--ccccchhhcccEEEEeeEEEEEEEcCccEEEEEcCccc Confidence 0 0011111 11222222233344556666666555443 No 33 >protein:vir:3613 Length: 272 # NCBI annotation: MHP # Family: family:all:522 # MgeID: mge:74 # MgeName: TP901-1 # Cross-refs: genbank:acc:NP_112699;genbank:gi:13786567;genbank:GeneID:921035 Probab=92.58 E-value=0.011 Score=31.36 Aligned_cols=254 Identities=15% Similarity=0.147 Sum_probs=108.7 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcc-eeccc---- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVT-IRDRV---- 71 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~-~~~r~---- 71 (348) ||+ +.|++.|..+..++.+.-.. ...|-.--+.+.+ +.+..|..+--|+...-+++. +.+.. T Consensus 1 ma~~~T~~~d~iiPev~~~~v~~~~~~------~~~~~~~~~~~~~---l~g~~G~ti~iP~~~~~gda~~~~eg~~i~~ 71 (272) T protein:vir:36 1 MSKQKTTLADLVNPEVLAPIVSYELNK------ALRFAPLAQVDTT---LQGQPGNTLKFPAFTYIGDAADVAEGGEISL 71 (272) T ss_pred CCCcceehhhhhchHHHHHHHHHHHHh------hhhhccccccccc---cccCCCCEEEEeeeccCccccccCCCCccCh Confidence 996 67899999999998654311 1122111111111 223334444444433222211 11111 Q ss_pred ---ceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecC Q lcl|Aclame:pro 72 ---SAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTS 148 (348) Q Consensus 72 ---~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~ 148 (348) +.......+-+. .+.+...|+..++... +.+.+-.+++...+.+..+..++.++. |. T Consensus 72 ~~lt~~~~~~~i~~~--~k~~~vtD~~~~~~~~------------d~~~~~~~~~a~~~a~~~d~~i~~~l~-~~----- 131 (272) T protein:vir:36 72 DKIGTTTKSVTIKKA--AKGTEITDEAALSGYG------------DPIGESNKQLGLSLANKVDDDLLSAAK-TT----- 131 (272) T ss_pred hhcCCcceeEeeehh--hccccccHHHHhhccc------------hHHHHHHHHHHHHHHHHHHHHHHHHhc-cc----- Confidence 111112222121 2223333333332211 112222333444555556655666664 21 Q ss_pred CceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 149 DGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 149 ~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) .++.+. +.-.++|..+...+.+.+..++.++|+++++..|++++.+....... ++. . T Consensus 132 -------------~~~~~~--------~~~~d~i~~A~~~lgd~~~~~~~ivv~p~~~~~L~k~~~~~~~~~~~-~~~-~ 188 (272) T protein:vir:36 132 -------------SQTVST--------KANVDGVQAALDIFNDEDAQAYVLIVNPKDAAKIRKDANAKNIGSEV-GAN-A 188 (272) T ss_pred -------------cccccc--------cccHHHHHHHHHHhhhcCCCceEEEEcHHHHHHHhcccccccccccc-ccc-c Confidence 111111 11134556666667677777889999999999999877655442211 111 1 Q ss_pred ccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEE----EEeCCccceeEeccchhhhccccccccccceeec Q lcl|Aclame:pro 229 VTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLT----LIPNGPLGNTVFGTTPEESDLFADNTVNADVEIV 304 (348) Q Consensus 229 ~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv----~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~ 304 (348) ..+..++.+.|.+|++=+. +|.++.+ +...+.+| |+.- T Consensus 189 ----~~~G~ig~~~G~~Vv~s~~------------~p~~~~~~~~~~~~~gA~~---~~~~------------------- 230 (272) T protein:vir:36 189 ----LINGTYADVLGAQIVRSKK------------LAEGSALMFKIVSNSPALK---LVLK------------------- 230 (272) T ss_pred ----eeeeccceecCeeEEEeCC------------CCCCceeEEEEEeccccee---eeec------------------- Confidence 1122345566877765332 2223221 11122222 1100 Q ss_pred CCceEEEEeecCCCc--eeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 305 DSGIAVTTTKTTDPV--NVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 305 ~~~~~~~~~~~~dP~--~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .++- .+.+.++. .-.+.+..+--.-+.+|.++++++. +|| T Consensus 231 -~~~~--vE~~R~~~~~~d~i~~~~~y~~~v~~~~~vv~~t~-~g~ 272 (272) T protein:vir:36 231 -RGVQ--VETDRDIVTKTTVITADEHYAAYLYDLTKVVNITF-TGV 272 (272) T ss_pred -CCcc--cccccchhhcCcEEEEEEEEEEEEEcCccEEEEee-cCC Confidence 0000 01111111 1122222333355566777776653 677 No 34 >protein:vir:4339 Length: 395 # NCBI annotation: major head protein # Family: family:all:585 # MgeID: mge:93 # MgeName: D3 # Cross-refs: genbank:acc:NP_061502;genbank:gi:9635591;genbank:GeneID:1262860 Probab=91.68 E-value=0.015 Score=30.63 Aligned_cols=273 Identities=11% Similarity=0.098 Sum_probs=123.1 Q ss_pred Cccchh-hcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEee Q lcl|Aclame:pro 1 MGLIYD-KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQ 79 (348) Q Consensus 1 Ma~l~d-~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~ 79 (348) ...-.. ++.+.....++.. ..+..+ |.+ +.+..++.+....+... .+....+.++..++..+.. ...+....+. T Consensus 117 ~~~~~g~~vp~~~~~~ii~~-~~~~~~-l~~-l~~~~~~~~~~~~~~~~-~~~~~~a~~v~E~~~~~~~-~~~~~~i~~~ 191 (395) T protein:vir:43 117 IDGSGGALVAPDRRPGVVAA-PQRRLT-IRD-LVAPGTTESNSVEYVRE-TGFVNNAAPVSEGTQKPYS-DLTFELENAP 191 (395) T ss_pred cCCCCccccchhhHHHHHHH-HHhhhh-HHh-hccceecCCCceEEEEE-ecCCCceeeecCCcccccc-ccceeEEEEe Confidence 000000 1222223333333 222222 333 35544444444443332 2222345667776665544 3467777777 Q ss_pred ccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeecc Q lcl|Aclame:pro 80 MPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGV 159 (348) Q Consensus 80 ~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~ 159 (348) +-.++-...++.+ ++ + +. .. +...+ ...+.+++...+|..++ +|. +.+... -|+ T Consensus 192 ~~k~~~~~~is~e-ll--~---d~--~~----l~~~v---~~~la~a~~~~~d~~~l----~G~----g~~~~~---~Gi 245 (395) T protein:vir:43 192 VRTIAHLFKASRQ-IL--D---DA--SA----LQSYI---DARARYGLMLVEECQLL----YGN----GTGANL---HGI 245 (395) T ss_pred eeeEEEeehhhHH-HH--H---hH--HH----HHHHH---HHHHHHHHHHHHHHHHH----hcc----CCCCcc---ccc Confidence 7777766666643 22 1 11 11 11222 23345555566664433 342 111110 011 Q ss_pred Ccc-ceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHH Q lcl|Aclame:pro 160 KAD-HKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYV 238 (348) Q Consensus 160 ~~~-~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~ 238 (348) -.. ...+.+.....++.+.+++|..+...+...+..+..++|++.+|..|++ +++.- ...+.+......- T Consensus 246 ~~~~~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~vmn~~~~~~l~~---lkd~~------G~~i~~~~~~~~~ 316 (395) T protein:vir:43 246 IPQAQAYAPPSGVVVTAEQRIDRIRLAILQAQLAEFPASGIVLNPIDWALIEL---NKDAE------NRYIIGSPQNGTT 316 (395) T ss_pred cccccccccccccccccchhHHHHHHHHHhhccccCCCcEEEEcHHHHHHHHH---hhccC------CceeccccccCCC Confidence 000 0011111223334567888888877777667778889999999987743 22221 1111111111111 Q ss_pred HhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCC- Q lcl|Aclame:pro 239 ADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTD- 317 (348) Q Consensus 239 ~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d- 317 (348) ..+.|++|++.+ .+|++.+++.-... +...+ . ..++-+....+.. T Consensus 317 ~~l~G~pVv~~~------------~~~~~~~~~gd~~~-~~~~~--~-------------------~~~~~i~~~~~~~~ 362 (395) T protein:vir:43 317 PTLWRLPVVETQ------------AITQDEFLTGAFSL-GAQIF--D-------------------RMDIEVLVSTENDK 362 (395) T ss_pred ceecceeeEEcC------------CCCCCcEEEEeccc-eEEEE--E-------------------ecceEEEEeccccc Confidence 123455654432 35666666543222 11111 0 0011111111100 Q ss_pred ---CceeEEeeeeeeeeeecCCCcEEEEEEecC Q lcl|Aclame:pro 318 ---PVNVQTKVSMVALPSFERLGDVYMLTVIPG 347 (348) Q Consensus 318 ---P~~~~~~~~s~~lPv~~~~~~~~~~~V~~~ 347 (348) =......+..+.=..+.+|++++.++|.+= T Consensus 363 ~f~~~~~~~r~~~r~d~~v~~~~a~~~~~~taa 395 (395) T protein:vir:43 363 DFENNMVTIRAEERLAFAVYRPEAFVTGSLTAS 395 (395) T ss_pred hhhcCcEEEEEEEeeccEEecccceEEEEeccC Confidence 013345566677778889999999999966 No 35 >protein:vir:9410 Length: 415 # NCBI annotation: head protein # Family: family:all:21 # MgeID: mge:167 # MgeName: phi 13 # Cross-refs: genbank:acc:NP_803388;genbank:gi:29028700;genbank:GeneID:1258136 Probab=91.57 E-value=0.015 Score=30.55 Aligned_cols=281 Identities=12% Similarity=0.044 Sum_probs=117.2 Q ss_pred Cccch-----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGLIY-----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~l~-----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) .+... .+.-|.++..-|.+......+ + ..+.+..++.+...............+.++..++..+-..-..+.. T Consensus 120 ~~~~~~~~~g~~~iP~~~~~~ii~~~~~~~~-l-~~~~~~~~~~~~~~~~~~~~~~~~~~~~~v~Eg~~~~~~~~~~~~~ 197 (415) T protein:vir:94 120 QGGSLKTDSGFVVIPEEIVTDILKLKEVEFN-L-DKYVTVKRVTNGSGKYPVVRQSEVAALEKVEELEENPELAVKPFFQ 197 (415) T ss_pred hhhccccccccccCcHHHHHHHHHHHHhhhh-h-hhhcceeeccCCceeEEEEeecCCccceecccccccccccccccee Confidence 00000 011222333323222222211 2 2233333333222221111111122345565555554333345666 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-.+.....++.+ + +.++. . .+...| ...+.+++...+|..+....-+|.-..... T Consensus 198 i~~~~~k~~~~~~is~e-l-----l~ds~-~----~~~~~i---~~~l~~~~~~~~~~~il~g~g~g~~~~~~~------ 257 (415) T protein:vir:94 198 LAYDINTHRGYFRISRE-A-----IEDAK-V----NVLQEL---KLWMARTIAATRNKAIIDVITKGSTGSTSS------ 257 (415) T ss_pred eEeeheeeeeechhhHH-H-----Hhhch-H----HHHHHH---HHHHHHHHHHHHHHHHhhccccCccccccc------ Confidence 66666666555555432 1 11111 1 111222 334556667777766665443332210000 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) ........++.++...++||.++...+...+..+..++|++..|..|+. +++.-. ...+.+...+ T Consensus 258 -------~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~vmn~~~~~~l~~---lkd~~G-----~~l~~~~~~~ 322 (415) T protein:vir:94 258 -------GFEKEGKKLEVKKAKSLDDIKDAINLNVKPNYEHNVAIVSQTMFAKLDK---MKDKLG-----NYLIQPDVKE 322 (415) T ss_pred -------cccccccccccccccchHHHHHHHHhhhhhccCCCEEEEcHHHHHHHHH---hhccCC-----CeeeccCcCC Confidence 0011122344445567788888887777777778899999999998853 332211 1111111111 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|.++++.+..-....|+ ..++|..-.. +...+ . ..++-+. |.. T Consensus 323 ~~~~~l~G~pV~~~~~~~~~~~~~-------~~i~~gd~~~-~~~~~--~-------------------~~~~~v~-~~~ 372 (415) T protein:vir:94 323 KTQQRLLGAKIEILPDEVLGQKGN-------NTLIIGNLKD-AIVLF--D-------------------RSQYQAS-WTD 372 (415) T ss_pred CCCceecceeeEEecccccCCCCc-------cEEEEEehhc-cEEEE--e-------------------ecceEEE-Eec Confidence 111234567776665432111111 1122221111 00000 0 0011110 111 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ..-.....++..+.=..+.+|++++.+++.+-+ T Consensus 373 ~~~~~~~~r~~~r~d~~~~~~~a~~~~~~~~~~ 405 (415) T protein:vir:94 373 YMHFGECLMIAVRQDCRILDYKSAIVIEYDDSE 405 (415) T ss_pred cccCceEEEEEEEeccEEeccccEEEEEEeccC Confidence 111112233444444666789999999998777 No 36 >protein:vir:81100 Length: 415 # NCBI annotation: capsid protein # Family: family:all:21 # MgeID: mge:1891 # MgeName: tp310-1 # Cross-refs: genbank:acc:YP_001429874;genbank:gi:156603927;genbank:GeneID:5525320 Probab=88.08 E-value=0.035 Score=28.59 Aligned_cols=281 Identities=11% Similarity=0.031 Sum_probs=116.5 Q ss_pred Ccc-ch----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGL-IY----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~-l~----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) ++. .. .+.-|.++...|.+......+ +.+ +....++.+...............+..+..++..+-.....+.. T Consensus 120 ~~~~~~~~~gg~~iP~~~~~~ii~~~~~~~~-l~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~v~E~~~~~~~~~~~~~~ 197 (415) T protein:vir:81 120 QGGSLKTDSGFVVIPEEIVTDILKLKEVEFN-LDK-YVTVKRVTNGSGKYPVVRQSEVAALEKVEELEENPELAVKPFFQ 197 (415) T ss_pred hhccccccccccccchHHHHHHHHHHHhhhh-hhh-heeeeeccCCceeEEEEeecCCccceeeccccccCcccccceee Confidence 000 00 112223333333223222222 222 23333333222221111111222345566655555434445666 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-.++-...++.+=+ .++. .+ +...+ ...+.+++...+|..+....-+|.-. ...+ T Consensus 198 v~~~~~k~~~~~~iS~ell------~ds~-~~----l~~~i---~~~l~~~~~~~~~~~il~g~g~g~~~------~~~~ 257 (415) T protein:vir:81 198 LAYDINTHRGYFRISREAI------EDAK-VN----VLQEL---KLWMARTIAATRNKAIIDVITKGSTG------STSS 257 (415) T ss_pred EEeeeeeeEeeehhhHHHH------hhch-HH----HHHHH---HHHHHHHHHHHHHHHHhhccccCccc------cccc Confidence 6777766666555554311 1111 11 11222 23345666666766555444322210 0000 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) +........+.++...++||.+++..+...+..+..++|++++|..|+. +++. + +...+.+...+ T Consensus 258 -------~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~v~n~~~~~~l~~---lkd~----~-G~~l~~~~~~~ 322 (415) T protein:vir:81 258 -------GFEKEGKKLEVKKAKSLDDIKDAINLNVKPNYEHNVAIVSQTMFAKLDK---MKDK----L-GNYLIQPDVKE 322 (415) T ss_pred -------cccccccccccccccchhHHHHHHHhhhhhccCCCEEEEcHHHHHHHHH---hhcc----C-CceeeccCcCC Confidence 0011112334445567788888877776667778889999999987753 2222 1 11111111111 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|.++++.+.......|+. .++|..... +.+.+ + ..++-+. |.. T Consensus 323 ~~~~~l~G~pV~~~~~~~~~~~~~~-------~~~~Gd~~~-~~~~~----~-----------------~~~~~v~-~~~ 372 (415) T protein:vir:81 323 KTQQRLLGAKIEILPDEVLGQKGNN-------TLIIGNLKD-AIVLF----D-----------------RSQYQAS-WTD 372 (415) T ss_pred CCCceecceeeEEecccccCCCCcc-------EEEEEehhc-cEEEE----e-----------------ecceEEE-Eec Confidence 1112345666665553321111111 122221110 00000 0 0011111 111 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+-....+.+..+.=..+.+|++++.+++.+-+ T Consensus 373 ~~~~~~~~~~~~r~d~~v~~~~a~~~~~~~~~~ 405 (415) T protein:vir:81 373 YMHFGECLMIAVRQDCRILDYKSAIVIEYDDSE 405 (415) T ss_pred cccCceEEEEEEEeccEEeccccEEEEEEeccC Confidence 111112233444555667789999999999777 No 37 >protein:vir:79987 Length: 415 # NCBI annotation: head protein # Family: family:all:21 # MgeID: mge:1875 # MgeName: tp310-3 # Cross-refs: genbank:acc:YP_001430002;genbank:gi:156604057;genbank:GeneID:5525447 Probab=88.08 E-value=0.035 Score=28.59 Aligned_cols=281 Identities=11% Similarity=0.031 Sum_probs=116.5 Q ss_pred Ccc-ch----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGL-IY----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~-l~----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) ++. .. .+.-|.++...|.+......+ +.+ +....++.+...............+..+..++..+-.....+.. T Consensus 120 ~~~~~~~~~gg~~iP~~~~~~ii~~~~~~~~-l~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~v~E~~~~~~~~~~~~~~ 197 (415) T protein:vir:79 120 QGGSLKTDSGFVVIPEEIVTDILKLKEVEFN-LDK-YVTVKRVTNGSGKYPVVRQSEVAALEKVEELEENPELAVKPFFQ 197 (415) T ss_pred hhccccccccccccchHHHHHHHHHHHhhhh-hhh-heeeeeccCCceeEEEEeecCCccceeeccccccCcccccceee Confidence 000 00 112223333333223222222 222 23333333222221111111222345566655555434445666 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-.++-...++.+=+ .++. .+ +...+ ...+.+++...+|..+....-+|.-. ...+ T Consensus 198 v~~~~~k~~~~~~iS~ell------~ds~-~~----l~~~i---~~~l~~~~~~~~~~~il~g~g~g~~~------~~~~ 257 (415) T protein:vir:79 198 LAYDINTHRGYFRISREAI------EDAK-VN----VLQEL---KLWMARTIAATRNKAIIDVITKGSTG------STSS 257 (415) T ss_pred EEeeeeeeEeeehhhHHHH------hhch-HH----HHHHH---HHHHHHHHHHHHHHHHhhccccCccc------cccc Confidence 6777766666555554311 1111 11 11222 23345666666766555444322210 0000 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) +........+.++...++||.+++..+...+..+..++|++++|..|+. +++. + +...+.+...+ T Consensus 258 -------~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~v~n~~~~~~l~~---lkd~----~-G~~l~~~~~~~ 322 (415) T protein:vir:79 258 -------GFEKEGKKLEVKKAKSLDDIKDAINLNVKPNYEHNVAIVSQTMFAKLDK---MKDK----L-GNYLIQPDVKE 322 (415) T ss_pred -------cccccccccccccccchhHHHHHHHhhhhhccCCCEEEEcHHHHHHHHH---hhcc----C-CceeeccCcCC Confidence 0011112334445567788888877776667778889999999987753 2222 1 11111111111 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|.++++.+.......|+. .++|..... +.+.+ + ..++-+. |.. T Consensus 323 ~~~~~l~G~pV~~~~~~~~~~~~~~-------~~~~Gd~~~-~~~~~----~-----------------~~~~~v~-~~~ 372 (415) T protein:vir:79 323 KTQQRLLGAKIEILPDEVLGQKGNN-------TLIIGNLKD-AIVLF----D-----------------RSQYQAS-WTD 372 (415) T ss_pred CCCceecceeeEEecccccCCCCcc-------EEEEEehhc-cEEEE----e-----------------ecceEEE-Eec Confidence 1112345666665553321111111 122221110 00000 0 0011111 111 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+-....+.+..+.=..+.+|++++.+++.+-+ T Consensus 373 ~~~~~~~~~~~~r~d~~v~~~~a~~~~~~~~~~ 405 (415) T protein:vir:79 373 YMHFGECLMIAVRQDCRILDYKSAIVIEYDDSE 405 (415) T ss_pred cccCceEEEEEEEeccEEeccccEEEEEEeccC Confidence 111112233444555667789999999999777 No 38 >protein:vir:98339 Length: 415 # NCBI annotation: putative capsid protein # Family: family:all:21 # MgeID: mge:1581 # MgeName: phiPVL(108) # Cross-refs: genbank:acc:YP_918931;genbank:gi:119443693;genbank:GeneID:4594501 Probab=88.08 E-value=0.035 Score=28.59 Aligned_cols=281 Identities=11% Similarity=0.031 Sum_probs=116.5 Q ss_pred Ccc-ch----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGL-IY----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~-l~----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) ++. .. .+.-|.++...|.+......+ +.+ +....++.+...............+..+..++..+-.....+.. T Consensus 120 ~~~~~~~~~gg~~iP~~~~~~ii~~~~~~~~-l~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~v~E~~~~~~~~~~~~~~ 197 (415) T protein:vir:98 120 QGGSLKTDSGFVVIPEEIVTDILKLKEVEFN-LDK-YVTVKRVTNGSGKYPVVRQSEVAALEKVEELEENPELAVKPFFQ 197 (415) T ss_pred hhccccccccccccchHHHHHHHHHHHhhhh-hhh-heeeeeccCCceeEEEEeecCCccceeeccccccCcccccceee Confidence 000 00 112223333333223222222 222 23333333222221111111222345566655555434445666 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-.++-...++.+=+ .++. .+ +...+ ...+.+++...+|..+....-+|.-. ...+ T Consensus 198 v~~~~~k~~~~~~iS~ell------~ds~-~~----l~~~i---~~~l~~~~~~~~~~~il~g~g~g~~~------~~~~ 257 (415) T protein:vir:98 198 LAYDINTHRGYFRISREAI------EDAK-VN----VLQEL---KLWMARTIAATRNKAIIDVITKGSTG------STSS 257 (415) T ss_pred EEeeeeeeEeeehhhHHHH------hhch-HH----HHHHH---HHHHHHHHHHHHHHHHhhccccCccc------cccc Confidence 6777766666555554311 1111 11 11222 23345666666766555444322210 0000 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) +........+.++...++||.+++..+...+..+..++|++++|..|+. +++. + +...+.+...+ T Consensus 258 -------~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~v~n~~~~~~l~~---lkd~----~-G~~l~~~~~~~ 322 (415) T protein:vir:98 258 -------GFEKEGKKLEVKKAKSLDDIKDAINLNVKPNYEHNVAIVSQTMFAKLDK---MKDK----L-GNYLIQPDVKE 322 (415) T ss_pred -------cccccccccccccccchhHHHHHHHhhhhhccCCCEEEEcHHHHHHHHH---hhcc----C-CceeeccCcCC Confidence 0011112334445567788888877776667778889999999987753 2222 1 11111111111 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|.++++.+.......|+. .++|..... +.+.+ + ..++-+. |.. T Consensus 323 ~~~~~l~G~pV~~~~~~~~~~~~~~-------~~~~Gd~~~-~~~~~----~-----------------~~~~~v~-~~~ 372 (415) T protein:vir:98 323 KTQQRLLGAKIEILPDEVLGQKGNN-------TLIIGNLKD-AIVLF----D-----------------RSQYQAS-WTD 372 (415) T ss_pred CCCceecceeeEEecccccCCCCcc-------EEEEEehhc-cEEEE----e-----------------ecceEEE-Eec Confidence 1112345666665553321111111 122221110 00000 0 0011111 111 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+-....+.+..+.=..+.+|++++.+++.+-+ T Consensus 373 ~~~~~~~~~~~~r~d~~v~~~~a~~~~~~~~~~ 405 (415) T protein:vir:98 373 YMHFGECLMIAVRQDCRILDYKSAIVIEYDDSE 405 (415) T ss_pred cccCceEEEEEEEeccEEeccccEEEEEEeccC Confidence 111112233444555667789999999999777 No 39 >protein:vir:9574 Length: 300 # NCBI annotation: gp40 # Family: family:all:966 # MgeID: mge:171 # MgeName: SM1 # Cross-refs: genbank:acc:NP_862879;genbank:gi:32469471;genbank:GeneID:1461316 Probab=87.74 E-value=0.037 Score=28.45 Aligned_cols=295 Identities=10% Similarity=-0.006 Sum_probs=131.1 Q ss_pred Cccchh----hcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeee Q lcl|Aclame:pro 1 MGLIYD----KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIH 76 (348) Q Consensus 1 Ma~l~d----~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~ 76 (348) ||+-.+ ++.+.....++..+ .+. +.+. .+++..++.......... .+. ..|.++..+.+.+... ..+... T Consensus 1 ma~~t~~~G~lip~~~~~~ii~~l-~~~-s~i~-~l~~~~~~~~~~~~~p~~-~~~-~~a~wv~Eg~~~~~s~-~~f~~v 74 (300) T protein:vir:95 1 MSEAQLSKGNLFNPELVTKVINKV-KGH-SSIA-KLSPQKPIPFNGQREFVF-DFD-SDIDIVAENGKKTHGG-VSLDPV 74 (300) T ss_pred CcccccCCcceechhhHHHHHHHH-Hhh-hhhh-hhcceeeccCCceEEEEE-ecC-cceEEeeCCccccccc-ccceee Confidence 997532 23333333444333 222 2343 356655555444433332 222 3467888876666443 456666 Q ss_pred EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEe Q lcl|Aclame:pro 77 DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDID 156 (348) Q Consensus 77 ~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vD 156 (348) .+++-+++---.++.+ ++ +..... . -.+...+ .+++.+++.+.+|..+.. |.-.-++.+....-. T Consensus 75 ~l~~~k~~~~~~iS~e-ll-----~~~~d~-~-~~l~~~i---~~~l~~aia~~~d~~~l~----G~~~~~g~~~~~~~~ 139 (300) T protein:vir:95 75 TIVPLKVEYGARVSDE-FL-----HASEEA-K-VDMLTDF---VEGFSKKLARGLDIMSIH----GINPRTKQASTIIGD 139 (300) T ss_pred EeeeEEEEEeehhhHH-Hh-----ccCCCC-H-HHHHHHH---HHHHHHHHHHHHHHhhhh----cccCCCCCCcccccc Confidence 6666666665555543 21 111111 0 1122222 445677788888877774 321111111111000 Q ss_pred eccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccH-HHHH Q lcl|Aclame:pro 157 YGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTK-AELQ 235 (348) Q Consensus 157 fg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~-~~~~ 235 (348) -........+. ...+.++..+|.++...+...+..+...+|++.++.+|++-+ +. +...+-+ .... T Consensus 140 ~~~~~~~~~~~----~~~~~~~~~~i~~~~~~~~~~~~~~~~~vmn~~~~~~L~~lk---d~------~G~~i~~~~~~~ 206 (300) T protein:vir:95 140 NCFDKKVTQTV----PFKDTNPDESMEDAVGMIDGSERDITGAILDPIFTTALSKMK---NA------EGGKLYPELAWG 206 (300) T ss_pred cccccccceee----cccccchHHHHHHHHHHhhhcCCCccEEEECHHHHHHHHHhh---cc------CCCeeccCcccc Confidence 00111111111 112456778899988888777888888999999998774322 11 1111111 0001 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|+++++-+.- +...+..+ ..+|+.+=. ....||.--+....... +.+ ..+..+..|.+ T Consensus 207 ~~~~~l~G~Pv~~s~~v--~~~~~~~~-----~~~~~GDf~-~~~~~~~~~~~~~~v~~---~~~----~d~~~~~~f~~ 271 (300) T protein:vir:95 207 GVPDAINGLAVDKNRTV--SYSQTDPK-----NTAIVGDFE-TMFKWGYAKEVPMEIIK---YGD----PDNSGRDLKGY 271 (300) T ss_pred CCCceecceeeEEecCC--CCCCCCCc-----cEEEEeecc-ceEEEEEecccEEEEee---ccC----CCCcchhhhhc Confidence 11123456676544321 11111100 111221100 00122211000000000 000 00000111211 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPG 347 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~ 347 (348) -....++..+.=..+.+|++++++|-.|| T Consensus 272 ---~~v~~r~~~r~d~~v~~~~a~~~l~~~~g 300 (300) T protein:vir:95 272 ---NQIYIRCEAYIGWGIMDAASFARIVKTGG 300 (300) T ss_pred ---CcEEEEEEEeecceeecccceEEEecCCC Confidence 13555666666677888999999999999 No 40 >protein:vir:739 Length: 231 # NCBI annotation: major structural protein 4 # Family: family:all:522 # MgeID: mge:14 # MgeName: Tuc2009 # Cross-refs: genbank:acc:NP_108716;genbank:gi:13487838;genbank:GeneID:920884 Probab=85.39 E-value=0.053 Score=27.57 Aligned_cols=228 Identities=14% Similarity=0.098 Sum_probs=94.6 Q ss_pred chhhhHHHHh-CCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeeccccccccccCHHHHHHHHhhc Q lcl|Aclame:pro 23 NVDSTLGESI-FPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVK 101 (348) Q Consensus 23 ~~~~~l~~~~-Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~ 101 (348) .+.--.++++ || .+ .--|.-++.+.+.+...- +.++...++-+.+....++..+ .+.... T Consensus 1 ~~~~~~Gdtit~P---------~~-------iGda~~v~eG~~i~~~~l-~~t~~~atIk~~gk~~~itD~a--~l~~~g 61 (231) T protein:vir:73 1 ENGINLANLCEYP---------ND-------IGDAADVAEGGEISLDKI-GTTTKSVTIKKAAKGTEITDEA--ALSGYG 61 (231) T ss_pred CccccCCceEEec---------cc-------ccchhhhcCCCcCChhhc-cccceeeeEeeeccceeeeHHH--HhhccC Confidence 0000011110 11 00 001222333333222211 2233344444444444444333 333222 Q ss_pred CcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeeccCccceeeeeecCCCCCccHHHH Q lcl|Aclame:pro 102 DTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVKADHKKQVSKSWAEPGATPLAD 181 (348) Q Consensus 102 ~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~d 181 (348) ++ +.+....+..++.+...--++.++.+. .|+.+++.-.+. T Consensus 62 ---Dp---------~~ea~~Q~~~~iA~kvD~di~~~~~~a---------------------------~l~~~~~~t~d~ 102 (231) T protein:vir:73 62 ---DP---------IGESNKQLGLSLANKVDDDLLKAAKTT---------------------------SQTVSTKANVDG 102 (231) T ss_pred ---ch---------HHHHHHHHHHHHHHhhhHHHHHhhccc---------------------------cccccccccHHH Confidence 22 112222233344444433344444421 233334445677 Q ss_pred HHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHHhhcCceEEEEeeEEEcCCCccc Q lcl|Aclame:pro 182 LEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVS 261 (348) Q Consensus 182 i~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~ 261 (348) |....+.+.+....+..++|+++.+..|++++...+.-.. ..... ..+..++...|++|++=+ .....++... T Consensus 103 i~~A~~~fgde~~~~~vivv~p~~~~~Lrk~~~~~~~~~~--~g~~i----~~~G~iG~i~G~~Vi~S~-~~~~~~~~~~ 175 (231) T protein:vir:73 103 VQAALDIFNDEDAQAYVLIVNPKDAAKIRKDANAKNIGSE--VGANA----LINGTYADVLGAQIVRSK-KLAEGSALMF 175 (231) T ss_pred HHHHHHHhccccccceEEEEcchHHHhhhhccchhhhhhh--hccce----eeecccceEcceEEEEcC-CCCCCceeee Confidence 7777777777777889999999999999887764333111 11111 124455666787776532 1111111111 Q ss_pred ccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCCCceeEEee--eeeeeeeecCCCcE Q lcl|Aclame:pro 262 KFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVNVQTKV--SMVALPSFERLGDV 339 (348) Q Consensus 262 ~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~~~~~~--~s~~lPv~~~~~~~ 339 (348) + ++.. .+. +.+.. ..++.+- .+.|+....+.. ..+-...+.++..+ T Consensus 176 ~------~i~~-~gA---l~~~~--------------------k~~~~vE--tdRd~~~k~~~i~~~~~y~v~l~~~~~v 223 (231) T protein:vir:73 176 K------IVSN-SPA---LKLVL--------------------KRGVQVE--TDRDIVTKTTVITADEHYAAYLYDLTKV 223 (231) T ss_pred e------EEee-ccc---eeeee--------------------cccceee--ccccccccccEEEEeEEEEEEEEcCccE Confidence 1 1111 111 11110 1111121 223333333333 33445666677776 Q ss_pred EEEEEecCC Q lcl|Aclame:pro 340 YMLTVIPGV 348 (348) Q Consensus 340 ~~~~V~~~~ 348 (348) +++++ +|| T Consensus 224 v~~t~-~g~ 231 (231) T protein:vir:73 224 VNITF-TGV 231 (231) T ss_pred EEEEe-ecC Confidence 66653 677 No 41 >protein:vir:94673 Length: 419 # NCBI annotation: major capsid protein # Family: family:all:585 # MgeID: mge:1527 # MgeName: mu1/6 # Cross-refs: genbank:acc:YP_579208;genbank:gi:93007444;genbank:GeneID:5076792 Probab=83.12 E-value=0.071 Score=26.88 Aligned_cols=280 Identities=13% Similarity=0.076 Sum_probs=120.9 Q ss_pred Cccch-------hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeec------CceeeeeeeeCCCCcce Q lcl|Aclame:pro 1 MGLIY-------DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGAS------GQSVALKAAAFDTNVTI 67 (348) Q Consensus 1 Ma~l~-------d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~------~~~~~a~~v~~~~~~~~ 67 (348) +.... ....+..+...+...+.. ...+ ..++....+......+..... .....|.++..++..+. T Consensus 121 ~~~~~~~~~~~~~~~~p~~~~~~i~~~~~~-~~~i-~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~a~~v~Eg~~~~~ 198 (419) T protein:vir:94 121 RDAPAGTITNPNVPHLPQLVPGIVPTTPDL-PLLV-ADLLDQQNADYNVLEYIRDTSGTAGAGSTWNKAAVVPEGTAKPQ 198 (419) T ss_pred cccccccccCCcccccchhhhHHHHHHHhh-hhhh-hhcceeeeccCCceeeeeeccccccccccCcccceecCCccccc Confidence 11000 012233334444433321 1122 223443333332222221111 11122445555555443 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) .. ..+....+.+-.+.-.-.++.+-++ +. . .+...| ...+.+++...+|..+. +|- T Consensus 199 ~~-~~~~~i~~~~~k~~~~~~is~ell~------d~--~----~l~~~i---~~~la~a~~~~~d~aii----~G~---- 254 (419) T protein:vir:94 199 ST-LSFDTITTTLKTVAHWLPITRQAAD------DN--S----QLMGYI---QGRLTYGLRFLRDRQLL----NGN---- 254 (419) T ss_pred cc-cceeeEEeeeeeEEEeehhhHHHHH------hH--H----HHHHHH---HHHHHHHHHHHHHHHHH----hcc---- Confidence 32 3466666666666665566543221 11 1 122222 23345666666664443 331 Q ss_pred CCceeEEEeeccCccceeeeeecC-CCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCc Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVSKSW-AEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDG 226 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~~~W-~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~ 226 (348) +.+....+ +..+.....+....+ ...+...++||..++..+...+..+..++|++.+|..|++-. +. . +.. T Consensus 255 G~~~p~Gi-~~~~~~~~~~~~~~~~~~t~~~~~~~l~~~~~~~~~~~~~~~~~v~n~~~~~~l~~~k---~~---~-~~~ 326 (419) T protein:vir:94 255 GSTEMQGI-LTTPGIGTYQQPKPTAPATDEPPLVDIRRAKTVAEIAGFPPDGVVVHPQDWESIELDQ---AP---G-SGV 326 (419) T ss_pred Ccccccce-ecccccccccccccccccccchhHHHHHHHHHhhhhccCCCCEEEEcHHHHHHHHHHh---hc---C-CCc Confidence 11111111 011111112222222 223456788899998888777778889999999998764322 11 1 110 Q ss_pred ccccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCC Q lcl|Aclame:pro 227 SSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDS 306 (348) Q Consensus 227 ~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~ 306 (348) ..+.+......-..+.|.++++-+ .+|++.++|.-... + +++. ... T Consensus 327 ~~~~~~~~~~~~~~l~G~pV~~~~------------~~~~~~~~~gd~~~-~--~~~~-------------------~~~ 372 (419) T protein:vir:94 327 FRVIANVQGEATPRIWGLNVVSTV------------AIAQGTALVGGFRQ-G--ATLW-------------------SRQ 372 (419) T ss_pred eeecCCcccCCCccccceeeEEcC------------CCCCccEEEeeccc-e--EEEE-------------------Eec Confidence 011110001011123466664432 23555555542221 1 1110 001 Q ss_pred ceEEEEeecCC----CceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 307 GIAVTTTKTTD----PVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 307 ~~~~~~~~~~d----P~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ++.+..+.+.. =......+..+.=..+.+|++++++++.|=+ T Consensus 373 ~~~v~~~~~~~~~~~~~~~~~r~~~r~d~~v~~~~a~~~~~~~aa~ 418 (419) T protein:vir:94 373 GITVLMTDSHADFFTANTLVILAEFRANLAVYQPKAFVRVTFAAAT 418 (419) T ss_pred ceEEEEeccccchhhcCcEEEEEEEeeccEEeccccEEEEEeccCC Confidence 12222111110 0134455666777778889999999999888 No 42 >protein:vir:1886 Length: 385 # NCBI annotation: major capsid subunit precursor # Family: family:all:585 # MgeID: mge:41 # MgeName: HK022 # Cross-refs: genbank:acc:NP_037666;genbank:gi:9634124;genbank:GeneID:1262513 Probab=82.58 E-value=0.076 Score=26.73 Aligned_cols=272 Identities=13% Similarity=0.121 Sum_probs=125.8 Q ss_pred Cccchh----hcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeee Q lcl|Aclame:pro 1 MGLIYD----KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIH 76 (348) Q Consensus 1 Ma~l~d----~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~ 76 (348) |..-.+ ++.+.....++..+ ....+ +++ +++..++....+.... .......+.++..+...+... ..+... T Consensus 105 ~~~~~~~~g~~i~~~~~~~ii~~~-~~~~~-l~~-~~~~~~~~~~~~~~~~-~~~~~~~a~~v~E~~~~~~~~-~~~~~~ 179 (385) T protein:vir:18 105 LGSDADSAGSLIQPMQIPGIIMPG-LRRLT-IRD-LLAQGRTSSNALEYVR-EEVFTNNADVVAEKALKPESD-ITFSKQ 179 (385) T ss_pred hccccccCCceecchhhhHHHHHh-hhccc-hhh-hcceecccCcceEEEE-EecCCcceeeeccCccccccc-cceeEE Confidence 221111 12222233333332 22222 333 4555554444444333 222333556777766555444 467777 Q ss_pred EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCcee-EEE Q lcl|Aclame:pro 77 DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVN-KDI 155 (348) Q Consensus 77 ~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~-~~v 155 (348) ...+-.+.-...++.+ +++ +. .. +...+ ...+.+++...+|..++ +|- +.+.. ..| T Consensus 180 ~~~~~k~~~~~~is~e-ll~-----d~--~~----l~~~i---~~~la~a~~~~~d~~~l----~G~----g~~~~~~Gi 236 (385) T protein:vir:18 180 TANVKTIAHWVQASRQ-VMD-----DA--PM----LQSYI---NNRLMYGLALKEEGQLL----NGD----GTGDNLEGL 236 (385) T ss_pred EEeeeeEEEeehhhHH-HHh-----hH--HH----HHHHH---HHHHHHHHHHHHHHHHH----hcc----CCCCccccc Confidence 7777777766666643 211 11 11 22222 23345556666664433 442 11111 001 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) . .... +.+..++..+...+++|..+...+...+..+..++|++..|..|++ +++. ++ ..+-+.... T Consensus 237 ~-~~~~----~~~~~~~~~~~~~~d~i~~~~~~l~~~~~~~~~~~~~~~~~~~l~~---lkd~----~G--~~l~~~~~~ 302 (385) T protein:vir:18 237 N-KVAT----AYDTSLNATGDTRADIIAHAIYQVTESEFSASGIVLNPRDWHNIAL---LKDN----EG--RYIFGGPQA 302 (385) T ss_pred c-cccc----cccccccccccchHHHHHHHHHhhccccCCCCEEEEcHHHHHHHHH---hhcC----CC--ceeccCccc Confidence 0 0000 1111233344557788888887787777788899999999987753 2221 11 111100000 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|+++++.+ .+|++.++|.-... +...+ + ..++.+....+ T Consensus 303 ~~~~~l~G~pV~~~~------------~~p~~~~~~gd~~~-~~~~~----~-----------------~~~~~v~~~~~ 348 (385) T protein:vir:18 303 FTSNIMWGLPVVPTK------------AQAAGTFTVGGFDM-ASQVW----D-----------------RMDATVEVSRE 348 (385) T ss_pred CCCceecceeeEEcC------------cCCCCcEEEeeccc-EEEEE----E-----------------ecceEEEEecc Confidence 001123455554322 34666666653221 11111 0 01111111111 Q ss_pred -CCC---ceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 -TDP---VNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 -~dP---~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .++ ......+..+.=..+.+|++++++|+.+.- T Consensus 349 ~~~~~~~~~~~~~~~~r~~~~v~~~~a~~~~~~~aa~ 385 (385) T protein:vir:18 349 DRDNFVKNMLTILCEERLALAHYRPTAIIKGTFSSGS 385 (385) T ss_pred ccchhhcCcEEEEEEEeeccEEecccceEEEEeccCC Confidence 011 123445666666778899999999999877 No 43 >protein:vir:191 Length: 385 # NCBI annotation: major head subunit precursor # Family: family:all:585 # MgeID: mge:6 # MgeName: HK97 # Cross-refs: genbank:acc:NP_037701;genbank:gi:9634158;genbank:GeneID:1262530 Probab=82.58 E-value=0.076 Score=26.73 Aligned_cols=272 Identities=13% Similarity=0.121 Sum_probs=125.8 Q ss_pred Cccchh----hcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeee Q lcl|Aclame:pro 1 MGLIYD----KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIH 76 (348) Q Consensus 1 Ma~l~d----~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~ 76 (348) |..-.+ ++.+.....++..+ ....+ +++ +++..++....+.... .......+.++..+...+... ..+... T Consensus 105 ~~~~~~~~g~~i~~~~~~~ii~~~-~~~~~-l~~-~~~~~~~~~~~~~~~~-~~~~~~~a~~v~E~~~~~~~~-~~~~~~ 179 (385) T protein:vir:19 105 LGSDADSAGSLIQPMQIPGIIMPG-LRRLT-IRD-LLAQGRTSSNALEYVR-EEVFTNNADVVAEKALKPESD-ITFSKQ 179 (385) T ss_pred hccccccCCceecchhhhHHHHHh-hhccc-hhh-hcceecccCcceEEEE-EecCCcceeeeccCccccccc-cceeEE Confidence 221111 12222233333332 22222 333 4555554444444333 222333556777766555444 467777 Q ss_pred EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCcee-EEE Q lcl|Aclame:pro 77 DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVN-KDI 155 (348) Q Consensus 77 ~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~-~~v 155 (348) ...+-.+.-...++.+ +++ +. .. +...+ ...+.+++...+|..++ +|- +.+.. ..| T Consensus 180 ~~~~~k~~~~~~is~e-ll~-----d~--~~----l~~~i---~~~la~a~~~~~d~~~l----~G~----g~~~~~~Gi 236 (385) T protein:vir:19 180 TANVKTIAHWVQASRQ-VMD-----DA--PM----LQSYI---NNRLMYGLALKEEGQLL----NGD----GTGDNLEGL 236 (385) T ss_pred EEeeeeEEEeehhhHH-HHh-----hH--HH----HHHHH---HHHHHHHHHHHHHHHHH----hcc----CCCCccccc Confidence 7777777766666643 211 11 11 22222 23345556666664433 442 11111 001 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) . .... +.+..++..+...+++|..+...+...+..+..++|++..|..|++ +++. ++ ..+-+.... T Consensus 237 ~-~~~~----~~~~~~~~~~~~~~d~i~~~~~~l~~~~~~~~~~~~~~~~~~~l~~---lkd~----~G--~~l~~~~~~ 302 (385) T protein:vir:19 237 N-KVAT----AYDTSLNATGDTRADIIAHAIYQVTESEFSASGIVLNPRDWHNIAL---LKDN----EG--RYIFGGPQA 302 (385) T ss_pred c-cccc----cccccccccccchHHHHHHHHHhhccccCCCCEEEEcHHHHHHHHH---hhcC----CC--ceeccCccc Confidence 0 0000 1111233344557788888887787777788899999999987753 2221 11 111100000 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-..+.|+++++.+ .+|++.++|.-... +...+ + ..++.+....+ T Consensus 303 ~~~~~l~G~pV~~~~------------~~p~~~~~~gd~~~-~~~~~----~-----------------~~~~~v~~~~~ 348 (385) T protein:vir:19 303 FTSNIMWGLPVVPTK------------AQAAGTFTVGGFDM-ASQVW----D-----------------RMDATVEVSRE 348 (385) T ss_pred CCCceecceeeEEcC------------cCCCCcEEEeeccc-EEEEE----E-----------------ecceEEEEecc Confidence 001123455554322 34666666653221 11111 0 01111111111 Q ss_pred -CCC---ceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 -TDP---VNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 -~dP---~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .++ ......+..+.=..+.+|++++++|+.+.- T Consensus 349 ~~~~~~~~~~~~~~~~r~~~~v~~~~a~~~~~~~aa~ 385 (385) T protein:vir:19 349 DRDNFVKNMLTILCEERLALAHYRPTAIIKGTFSSGS 385 (385) T ss_pred ccchhhcCcEEEEEEEeeccEEecccceEEEEeccCC Confidence 011 123445666666778899999999999877 No 44 >protein:vir:9927 Length: 295 # NCBI annotation: hypothetical protein # Family: family:all:1178 # MgeID: mge:178 # MgeName: 315.6 # Cross-refs: genbank:acc:NP_795689;genbank:gi:28876459;genbank:GeneID:1258000 Probab=79.53 E-value=0.1 Score=25.98 Aligned_cols=275 Identities=14% Similarity=0.148 Sum_probs=128.9 Q ss_pred CccchhhcCHHHH-----HHHHHhhccchhhhHHHH-----hCCCccccce---eEEEEEeecCceeeeeeeeCCCCcce Q lcl|Aclame:pro 1 MGLIYDKVTASNI-----AGYFNTLQENVDSTLGES-----IFPARKQLGT---KLSYIKGASGQSVALKAAAFDTNVTI 67 (348) Q Consensus 1 Ma~l~d~f~~~~l-----~~~i~~~~~~~~~~l~~~-----~Fp~~~~~~~---~~~~~~~~~~~~~~a~~v~~~~~~~~ 67 (348) ||.- ++-....| ..+++.....-.. |.+. +-|-..=... +|.++ .-|.-|..+...|+ T Consensus 1 mAe~-nlt~~~dL~~~~sidfv~~f~~~i~~-L~~~Lgi~r~~p~a~G~tIt~pK~~~t-------gda~dVaEGe~Ipl 71 (295) T protein:vir:99 1 MAEK-NLNTMADLGDIKSIDFVNKFSKNIND-LLKLLGVTRRETLTNDLKIQTYKWEVT-------LDQTDPGEGETIPL 71 (295) T ss_pred CCCc-ccccHhhccCceeehhhHHhhhhHHH-HHHHhccccccccccCCeEEeeeeeee-------cccccccCCcccch Confidence 8861 23223333 2344444322222 2222 2232211111 12221 12334666666555 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) .+-..-.....++..-|..+.++.+.++. ...+. ++ .+...++..+|.+...--+..+|.+|+.+++ T Consensus 72 skvt~~~~~t~t~kikK~rK~tTdEAIql----sGygd--pv-------gead~qL~~~ia~kId~D~~~~lktat~t~t 138 (295) T protein:vir:99 72 SKVTRTKDKDYTVKWFKKRRATTAEAIAR----HGAAR--AI-------TEADKRIMRELQNGIKDAFFTFLKTKPTKVK 138 (295) T ss_pred hhheeeeeeeeEEEeeeecccccHHHHHh----cCCCc--hh-------HHHHHHHHHHHHHhhhHHHHHHhccCceeee Confidence 54332222234443333344555443321 11121 22 2233445566666666677888887776544 Q ss_pred CCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS 227 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~ 227 (348) +.+. +...+..|.. .+...+....+.+++++++=...+++++.+.-. ... T Consensus 139 g~~l------------q~a~a~~~~a------------l~~f~Ee~~~~~V~FVnP~D~a~yl~~A~~~~~------~a~ 188 (295) T protein:vir:99 139 GVGL------------QKALSASWAK------------LATFNEFEGSPLVSFVSPLDVANYLGDTKVGAD------ASN 188 (295) T ss_pred hhhH------------HHHHHHhhhh------------hhhcccccCCceEEEEehHHHHHHHhccccccc------hhh Confidence 3221 1111122221 111112222467888899888888777765210 000 Q ss_pred cccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCc Q lcl|Aclame:pro 228 SVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSG 307 (348) Q Consensus 228 ~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~ 307 (348) .+. -+++..+.|.+.++-. +-+|++++++.+.+++ ..+|-+.- ..+.. +.. ..-..+.| T Consensus 189 ~fG----~~~L~nfLG~q~II~S-----------~kv~~G~~~aT~~~Ni-~~ay~~~~-~g~l~--~~f--~~~~D~tg 247 (295) T protein:vir:99 189 VFG----MTLLKNFLGMQNVIVM-----------PSVPEGKIYSTAVENL-VFASLNVK-GGDLG--GLF--ADFTDETG 247 (295) T ss_pred hhh----hhhhhhhhccceEEEc-----------ccCCCceEEEeeccce-EEEEecCC-chhhh--hhh--hhccCccc Confidence 111 1233345566532322 3378888888888775 33443221 11110 000 00112233 Q ss_pred -eEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEE----ecCC Q lcl|Aclame:pro 308 -IAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTV----IPGV 348 (348) Q Consensus 308 -~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V----~~~~ 348 (348) |-+.+-...+.....+..-+...--|..+|+++++++ +||| T Consensus 248 lIg~~h~~~~~~~t~et~~~~~~~lfpE~~dgiv~~tI~~~~~~~~ 293 (295) T protein:vir:99 248 LIAAARNRQLSNLTYESVFFGANVLFAEIPEGVVEATIEAAAVPGI 293 (295) T ss_pred ceEEEeccccceeeehhhhHhHHHhcccccceEEEEEEecCcCCCC Confidence 3355555666677777777888888899999999999 5666 No 45 >protein:vir:94771 Length: 298 # NCBI annotation: major head protein # Family: family:all:966 # MgeID: mge:1529 # MgeName: phi LC3 # Cross-refs: genbank:acc:NP_996706;genbank:gi:45597421;genbank:GeneID:2769044 Probab=79.17 E-value=0.11 Score=25.90 Aligned_cols=296 Identities=10% Similarity=0.011 Sum_probs=124.2 Q ss_pred CccchhhcCHHHHHH-HHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEee Q lcl|Aclame:pro 1 MGLIYDKVTASNIAG-YFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQ 79 (348) Q Consensus 1 Ma~l~d~f~~~~l~~-~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~ 79 (348) |+.---.+-+.++.. +++.+. +. +.+ ..+++..++.......... .+.. .|.++..+.+.+.. ...+....++ T Consensus 1 ma~~gG~lip~~~~~~ii~~~~-~~-s~i-~~~~~~~~~~~~~~~~p~~-~~~~-~a~~v~Eg~~~~~~-~~~f~~v~l~ 74 (298) T protein:vir:94 1 MVLNKGTLFDPELVTDLISKVA-GK-SSI-ARLSAQKPIPFNGEKVFTF-TMDS-EIDVVAESGKKTHG-GVTLAPQTMV 74 (298) T ss_pred CeeccccccChhHHHHHHHHHH-hh-chh-hhhcceeeccCCceEEEEE-ecCc-ceEEeeCCcccccc-ccceeEEEEe Confidence 998655555555544 444432 22 234 3346666555444333222 2222 35778877666643 4456666666 Q ss_pred ccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeecc Q lcl|Aclame:pro 80 MPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGV 159 (348) Q Consensus 80 ~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~ 159 (348) +-+++-...++.+ + ++...... ..+...+ ..++.+++.+.+|..+.. |.-.-.+.+... .+. T Consensus 75 ~~k~~~~~~iS~e-l-----l~~~~~~~--~~l~~~i---~~~la~ai~~~~d~~~l~----G~~~~~g~~~~~---~~~ 136 (298) T protein:vir:94 75 PIKVEYGARISDE-F-----MYASDEEK--INILQAF---NDGFAKKVARGIDLMAFH----GVNPRLGTASAV---IGT 136 (298) T ss_pred eeEEEEeeehhHH-H-----hccCCccH--HHHHHHH---HHHHHHHHHHHHHHHhhc----ccccCCCccccc---ccc Confidence 6666655555443 1 11111111 1122222 344566777777766663 421111111110 111 Q ss_pred C-ccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHH Q lcl|Aclame:pro 160 K-ADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYV 238 (348) Q Consensus 160 ~-~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~ 238 (348) . ..+..+.......+..++..||.++...+...+..+...+|++.++.+|++- ++. . + .....+...+..- T Consensus 137 ~~~~~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~vmn~~~~~~l~~l---kd~---~-G-~~l~~~~~~~~~~ 208 (298) T protein:vir:94 137 NHFDSKVTQKVEAPRGIADPNGAIENAVELLTGVDADVTGIAINPSFRSALAKQ---KDL---Q-G-NALFPELKWGATP 208 (298) T ss_pred cccccccccccccccccccHHHHHHHHHHhhhhcCCCccEEEEcHHHHHHHHHh---hcc---C-C-CeeecCcccCCCC Confidence 0 1111122222344566788999999988887788888999999999887542 211 1 1 1111110001001 Q ss_pred HhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCCC Q lcl|Aclame:pro 239 ADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDP 318 (348) Q Consensus 239 ~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP 318 (348) ..+.|+++++-+. ..+..+.. ...+++.--.. + ..||.--+....... +.+ ..+.....|.+ T Consensus 209 ~tl~G~PV~~~~~-v~~~~~~~-----~~~~~~Gdfs~-~-~~~~~~~~~~~~~~~---~~~----~d~~~~~~f~~--- 270 (298) T protein:vir:94 209 DTINGLPVDVNKT-VSDMSLTQ-----RDRAIIGDFAN-G-FKWGYAKEVPLEVIQ---YGD----PDNSGLDLKGY--- 270 (298) T ss_pred ceecceeeEEecc-cccccCCC-----ccEEEEeeccc-e-EEEEEecCceEEEee---cCC----CcCcchhhhhc--- Confidence 2344666654332 11111111 11222221111 0 122211000000000 000 00000001110 Q ss_pred ceeEEeeeeeeeeeecCCCcEEEEEEec Q lcl|Aclame:pro 319 VNVQTKVSMVALPSFERLGDVYMLTVIP 346 (348) Q Consensus 319 ~~~~~~~~s~~lPv~~~~~~~~~~~V~~ 346 (348) .....++..+.=-.+.+|++++++|-.= T Consensus 271 ~~v~~r~~~r~~~~~~~~~a~~~l~~~t 298 (298) T protein:vir:94 271 NQVYIRAELFLGWGILDATKFARVTEAN 298 (298) T ss_pred CcEEEEEEEEeccEeecccceEEEEecC Confidence 0123334444444556677776664333 No 46 >protein:vir:5255 Length: 304 # NCBI annotation: hypothetical protein # Family: family:all:463 # MgeID: mge:117 # MgeName: Aaphi23 # Cross-refs: genbank:acc:NP_852760;genbank:gi:31544035;uniprot:Q7Y5U0;genbank:GeneID:2753552 Probab=77.55 E-value=0.12 Score=25.56 Aligned_cols=280 Identities=10% Similarity=0.091 Sum_probs=107.9 Q ss_pred CccchhhcCHHHHHHHHHhhcc-chhhhHHHHhCCCccccceeEEEEEe-ecCceeeee--eeeCCCCcceecccceeee Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTLQE-NVDSTLGESIFPARKQLGTKLSYIKG-ASGQSVALK--AAAFDTNVTIRDRVSAEIH 76 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~~~-~~~~~l~~~~Fp~~~~~~~~~~~~~~-~~~~~~~a~--~v~~~~~~~~~~r~~~~~~ 76 (348) |+-+ .|-..+|...-+.+-. +.+.+-+.++||....-+...+.+.. .....-.|. +++-++.....-.-.+... T Consensus 1 ~~~l--afl~~qL~~id~~vye~~~~~~~~~~lipv~t~~~~~~~~~~~~~~d~~G~a~~~~i~~~a~dip~vd~~~~~~ 78 (304) T protein:vir:52 1 MSLL--AYVKNGLTAVSKDIAETKYPEIVFPQFVYVDQQTAVGITEKLHYGADEHGSLDDGLITVGTSTLDQVEVGFTPT 78 (304) T ss_pred CchH--HHHHHHHHHHhhhhhccccccchhhhhccccCCCCcccceEEEeeeeccCcccccccCCcCCccceeeccccee Confidence 7775 3445666665444432 44566778899965422221111111 111112333 4555555544445556667 Q ss_pred EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCc---eeE Q lcl|Aclame:pro 77 DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDG---VNK 153 (348) Q Consensus 77 ~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~---~~~ 153 (348) ..++-.++..+..+-.|+.+-+.....- ++.. ..-.+++++..+ -++.+-|+. ..+ T Consensus 79 ~~~i~~~~~~~~y~~~El~~a~~~g~~l-~~~k----------a~aa~~a~~~~~----------n~v~~~Gd~~~~g~~ 137 (304) T protein:vir:52 79 RSYIVPWAKSVTWTKPELEQGKLLGLAL-NTAK----------IMALNKNAQQTL----------QKVAFLGHAKDSRLT 137 (304) T ss_pred EEEEEEEeeeeeecHHHHHHHHHhCCCc-HHHH----------HHHHHHHHHhhh----------ceEEEEeeccccceE Confidence 7777778888888877765544333211 1111 111122222222 233333321 111 Q ss_pred EEeeccCccceeee-----eecCCCCCc-cHHHHHHHHHHHHHh-cC--CeeEEEEeCHHHHHHHhcCHHHHHHhcccCC Q lcl|Aclame:pro 154 DIDYGVKADHKKQV-----SKSWAEPGA-TPLADLEDAIETARE-LG--LNPERAIMNAKTFGLIRKAASTVKAIKPLAG 224 (348) Q Consensus 154 ~vDfg~~~~~~~t~-----~~~W~~~~a-dp~~di~~~~~~~~~-~G--~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~ 224 (348) .+ +..|.-...+. .+.|.+.++ .++.||.++...+.. +| ..|++++|.+..++.|..- + ..+. T Consensus 138 Gl-lN~p~v~~~~~~~~~a~~~w~~~T~~eI~~di~~~~~~i~~~s~~~~~p~tl~Lpp~~~~~l~~~---~----~~~~ 209 (304) T protein:vir:52 138 GL-LNNKSVEVYAIKGAAQNTKVQAMDFDKAVAFFKEIFLKGMEKTKRIEAPNTFAIDSLDLAHLALV---Q----RANT 209 (304) T ss_pred EE-EeCCCcceeeecCCccCCccccCCHHHHHHHHHHHHHHHHhccCceecCceEEeCHHHHHHHhhc---c----CCCC Confidence 11 12222211111 135766554 588999998887753 55 3599999999999887320 0 0011 Q ss_pred CcccccHHHHHHHHHhhc------CceEEEEeeEEEc-CCCcccccccCCeEEEEeCCccceeEeccchhhhcccccccc Q lcl|Aclame:pro 225 DGSSVTKAELQNYVADNY------GVEIVLENGTYRN-EKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTV 297 (348) Q Consensus 225 ~~~~~~~~~~~~~~~~~~------~~~i~~yd~~y~d-~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~ 297 (348) +. -+.+++...+ .++|.....-... +.|. .+++++.-.+.. ...+- .| T Consensus 210 ~~------Tvl~~l~~n~~~~~g~~l~I~~v~~~~~~~g~~g------~~r~vvY~~d~~-~~~~~-vP----------- 264 (304) T protein:vir:52 210 DT------TALEFLTKHLSAAAGRQVAIKALPSNYGTRVTDG------KTRAMVYVNSKE-HVIFD-VP----------- 264 (304) T ss_pred Cc------hHHHHHHHhcccccCCcceEEEecccccccCCCC------ceEEEEEecChh-heEEe-cC----------- Confidence 11 1222222211 2233332111110 1110 011111111100 00000 00 Q ss_pred ccceeecCCceEEEEeecCCCceeEEeeee-eeeeeecCCCcEEEEEE Q lcl|Aclame:pro 298 NADVEIVDSGIAVTTTKTTDPVNVQTKVSM-VALPSFERLGDVYMLTV 344 (348) Q Consensus 298 ~~~~~~~~~~~~~~~~~~~dP~~~~~~~~s-~~lPv~~~~~~~~~~~V 344 (348) ...+..+ -...++.+..+-..+ ..=..+..|.+++.++= T Consensus 265 -~p~~~l~-------~q~~~~~~~~vp~~~r~gGv~v~~P~a~~y~D~ 304 (304) T protein:vir:52 265 -MSPTVLD-------AQPKGLLAFESGLRMAFGGVTFMEPDSALYVDY 304 (304) T ss_pred -ccccccc-------hhhcCCceEEecceeeeeeEEEEccceeeeecC Confidence 0000000 000000000000000 00011112222222222 No 47 >protein:vir:5974 Length: 324 # NCBI annotation: hypothetical protein # Family: family:all:1522 # MgeID: mge:125 # MgeName: SPP1 # Cross-refs: genbank:acc:NP_690674;genbank:geneid:6329212;genbank:gi:22855068;goa:Q38582;uniprot:Q38582;genbank:GeneID:955303 Probab=77.26 E-value=0.13 Score=25.50 Aligned_cols=299 Identities=10% Similarity=0.026 Sum_probs=121.5 Q ss_pred Ccc--chhhcCHHHHHHHHHhhccchhhhHHHHhC-CCccccceeEEEEEeecCceeeeee----------eeCCCCcce Q lcl|Aclame:pro 1 MGL--IYDKVTASNIAGYFNTLQENVDSTLGESIF-PARKQLGTKLSYIKGASGQSVALKA----------AAFDTNVTI 67 (348) Q Consensus 1 Ma~--l~d~f~~~~l~~~i~~~~~~~~~~l~~~~F-p~~~~~~~~~~~~~~~~~~~~~a~~----------v~~~~~~~~ 67 (348) ||. |.|+|.|..+..|+.+.......|+.+.+. |.-....+ + .....|..+..|+ +..+...+. T Consensus 1 MA~T~lsd~i~peVf~~yv~~~~~~~~~l~qSg~i~~~a~i~~~-l--~~~~~G~~i~~P~~~~l~Gd~~~v~~~~~i~~ 77 (324) T protein:vir:59 1 MAYTKISDVIVPELFNPYVINTTTQLSAFFQSGIAATDDELNAL-A--KKAGGGSTLNMPYWNDLDGDSQVLNDTDDLVP 77 (324) T ss_pred CCceeeeceechhHHHHHHHhhhHHHHHHhhcccccccHHHHHH-h--hccCCCCEEEecccccCCCcccccCCCcccch Confidence 995 679999999999997644333334333222 11100000 0 0001112222222 222222222 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) .+-...+ ....+ .+......+.|+-.+ .. +. ..+..+.++ +...+.++.+-.+..+|. |.+..+ T Consensus 78 ~~l~t~~-~~a~i--~~~~k~~~~tD~a~~---~s-g~-dp~~~i~~q-------~a~~~~~~~~~~lia~l~-g~~~~~ 141 (324) T protein:vir:59 78 QKINAGQ-DKAVL--ILRGNAWSSHDLAAT---LS-GS-DPMQAIGSR-------VAAYWAREMQKIVFAELA-GVFSND 141 (324) T ss_pred hhcccce-eeEEE--EeecCceeehhhhhh---hc-cc-hHHHHHHHH-------HHHHHHHHHHHHHHHHHH-Hhhhcc Confidence 1111111 11111 122233445554332 22 22 223333333 344555566666666663 544322 Q ss_pred CCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS 227 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~ 227 (348) .- +.|+.+.++. ++..-+. ..|....+.+-+.......++|++.++..|++... .+.+....+.. T Consensus 142 ~~-----------~~~~~dvsa~-~~~~~s~-~~l~~A~~~~GD~~~~~~~ivmhS~v~~~L~~~~l-i~~~~~s~~~~- 206 (324) T protein:vir:59 142 DM-----------KDNKLDISGT-ADGIYSA-ETFVDASYKLGDHESLLTAIGMHSATMASAVKQDL-IEFVKDSQSGI- 206 (324) T ss_pred cc-----------ccceeeeecc-ccceecH-HHHHHHHHHhCCcccCcEEEEEchHHHHHHHHhhh-hhhccccccCc- Confidence 21 1233222211 0011111 23334444454444578899999999999987753 34443332221 Q ss_pred cccHHHHHHHHHhhcCceEEEEeeE-EEcCCCcccccccCCeEEEEeCCccceeEecc--chhhhccccccc--ccccee Q lcl|Aclame:pro 228 SVTKAELQNYVADNYGVEIVLENGT-YRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGT--TPEESDLFADNT--VNADVE 302 (348) Q Consensus 228 ~~~~~~~~~~~~~~~~~~i~~yd~~-y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~--~~~~~~~~~~~~--~~~~~~ 302 (348) .++.+.|.+|++=|.- +....|+.. ..+.+++-.+.+|...=.+ ..|.+....++. .+.+.. T Consensus 207 ---------~i~~~~G~~VivdD~~p~~~~~~~~~----~y~s~l~~~GAi~~~~~~~~v~vE~dRd~~~g~~~l~~r~~ 273 (324) T protein:vir:59 207 ---------RFPTYMNKRVIVDDSMPVETLEDGTK----VFTSYLFGAGALGYAEGQPEVPTETARNALGSQDILINRKH 273 (324) T ss_pred ---------eeeeecccEEEEeCCCCccccCCCCc----eEEEEEEecCeEEEeecCCCcceecccCccccceEEEEeeE Confidence 1345567777665431 222222211 1223333333332221111 112221111111 111111 Q ss_pred ecCCceEEEEeec-----CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 303 IVDSGIAVTTTKT-----TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 303 ~~~~~~~~~~~~~-----~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .--+..-..|.+ ..|....+...+.+=.| .+++.+-++.++.-. T Consensus 274 -~~~~p~G~s~~~~~~~~~sPt~~~L~~~~NW~~v-~~~k~i~i~~~~~~~ 322 (324) T protein:vir:59 274 -FVLHPRGVKFTENAMAGTTPTDEELANGANWQRV-YDPKKIRIVQFKHRL 322 (324) T ss_pred -EEeEeeeEEecccccCCCCCChhhhcCCcccccc-cCccccceEEEEeec Confidence 111222234532 34655555555544443 346666666666555 No 48 >protein:vir:1638 Length: 298 # NCBI annotation: Structural protein # Family: family:all:966 # MgeID: mge:33 # MgeName: r1t # Cross-refs: genbank:acc:NP_695059;genbank:gi:23455750;genbank:GeneID:955469 Probab=76.86 E-value=0.13 Score=25.43 Aligned_cols=297 Identities=9% Similarity=-0.028 Sum_probs=128.4 Q ss_pred CccchhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEeec Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDEQM 80 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~~~ 80 (348) ||.---.+-++++..-|-+...+. +-+ ..+.+..++.+....... ..+. ..|.++..+.+.+... ..++...+.+ T Consensus 1 ma~~gG~lvp~~~~~~ii~~~~~~-s~i-~~l~~~~~~~~~~~~ip~-~~~~-~~a~~v~E~~~~~~~~-~~f~~v~l~~ 75 (298) T protein:vir:16 1 MVLNKGTLFDPTLVTDLISKVAGK-SSI-ARLSAQKPIPFNGEKVFT-FTMD-SEIDVVAESGKKTHGG-VTLAPQTMVP 75 (298) T ss_pred CcccCcceechhHHHHHHHHHHhh-hhh-hhhcceeeccCCceEEEE-EecC-cceEEecCCccccccc-cceeEEEEee Confidence 997655555555544333333233 233 334555544443333322 2222 2357787776666443 4567777777 Q ss_pred cccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeeccC Q lcl|Aclame:pro 81 PFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVK 160 (348) Q Consensus 81 p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~~ 160 (348) -+++-...++.+-+ +...... ..+...+ ..++.+++.+.+|..+.. |.=.-++..... .+.. T Consensus 76 ~k~a~~~~iS~ell------~~s~d~~--~~l~~~i---~~~la~ai~~~~d~~~l~----G~~~~~g~~~~~---~~~~ 137 (298) T protein:vir:16 76 IKVEYGARISDEFM------YASDEEK--INILQEF---NDGFAKKVARGIDLMAFH----GVNPRLGTASAV---IGTN 137 (298) T ss_pred eeEEEeehhhHHHh------hcCcccH--HHHHHHH---HHHHHHHHHHHHHHHhhc----cccCCCCccccc---cccc Confidence 66666655554321 1111110 1122222 344566777777766653 321111110000 0100 Q ss_pred c-cceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHH Q lcl|Aclame:pro 161 A-DHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVA 239 (348) Q Consensus 161 ~-~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~ 239 (348) . ....+........+.++..||.++...+...+..+...+|++..+..|++- ++. . +.....+...+..-+ T Consensus 138 ~~~~~~~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~vmn~~~~~~l~~l---kd~---~--G~~i~~~~~~~~~~~ 209 (298) T protein:vir:16 138 HFDSKVTQKVEAPRGIADPNGAIENAVELLTGVDADVTGIAINPSFRSALAKQ---KDL---Q--DNALFPELKWGATPD 209 (298) T ss_pred ccccccccccccccccccHHHHHHHHHHHhhhcCCCccEEEEcHHHHHHHHHh---hcc---C--CCeeecCcccCCCCc Confidence 0 111112223344556788899999988877777888899999999877542 221 1 111111111111112 Q ss_pred hhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCCCc Q lcl|Aclame:pro 240 DNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPV 319 (348) Q Consensus 240 ~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~ 319 (348) .+.|+++++-+.- .+..+.. ...+++.--.. ...||.-....-.... . ....+..+..|.+ . T Consensus 210 ~l~G~PV~~~~~v-~~~~~~~-----~~~~~~GDfs~--~~~~~~~~~~~~~~~~-----~--~~~~~~~~~~f~~---~ 271 (298) T protein:vir:16 210 TINGLPVDVNKTV-SDMSLTQ-----RDRAIIGDFAN--GFKWGYAKEVPLEVIQ-----Y--GDPDNSGLDLKGY---N 271 (298) T ss_pred eecceeeEEeccc-ccccCCC-----ccEEEEeeccc--eEEEEEecCceEEEee-----c--cCCcCcchhhhhc---C Confidence 3457777654421 1111111 11222221111 1122211000000000 0 0000000011111 1 Q ss_pred eeEEeeeeeeeeeecCCCcEEEEEEec Q lcl|Aclame:pro 320 NVQTKVSMVALPSFERLGDVYMLTVIP 346 (348) Q Consensus 320 ~~~~~~~s~~lPv~~~~~~~~~~~V~~ 346 (348) ....++..+.=..+.+|+++.++|-.= T Consensus 272 ~v~~ra~~r~d~~v~~~~a~~~l~~at 298 (298) T protein:vir:16 272 QVYIRAELFLGWGILDATKFARVTEAN 298 (298) T ss_pred cEEEEEEEEEccEeecccceEEEeecC Confidence 234445555555677777777775444 No 49 >protein:vir:103285 Length: 296 # NCBI annotation: hypothetical protein # Family: family:all:463 # MgeID: mge:1605 # MgeName: JK06 # Cross-refs: genbank:acc:YP_277465;genbank:gi:71834107;genbank:GeneID:3562396 Probab=70.01 E-value=0.21 Score=24.24 Aligned_cols=279 Identities=12% Similarity=0.118 Sum_probs=124.5 Q ss_pred Cc--cchh--hcCHHHHHHHHHhhcc-chhhhHHHHhCCCccccce--eEEEEEeecCceeeeeeeeCCCCcceecccce Q lcl|Aclame:pro 1 MG--LIYD--KVTASNIAGYFNTLQE-NVDSTLGESIFPARKQLGT--KLSYIKGASGQSVALKAAAFDTNVTIRDRVSA 73 (348) Q Consensus 1 Ma--~l~d--~f~~~~l~~~i~~~~~-~~~~~l~~~~Fp~~~~~~~--~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~ 73 (348) |- .-.+ .|...+|+..-+.+-. ..+++-..+|||....-+. +......... .-.+...+..+.........+ T Consensus 1 ~~~~~a~~~~~f~~~ql~~id~~v~e~~~~~l~~~~~i~v~~~~~~~~~~~~~~~~~~-~G~a~~~~~~~~dip~v~~~~ 79 (296) T protein:vir:10 1 MGVDKADAAGIWTVKQLTASLNKAYETEYDQNSVVNLFPVSNEIPGYAKYFEYPVFDG-VGIAQIVADYTDDLPLVDALA 79 (296) T ss_pred CcccchhhhHHHHHHHHHHHHHHHHhhhhcccccceecccccCCCCceeEEEeeeeec-cCceeEeCCCccccceeeccc Confidence 43 2222 5777777764444332 3445667788986542211 1111111111 122344444443222222334 Q ss_pred eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce-- Q lcl|Aclame:pro 74 EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV-- 151 (348) Q Consensus 74 ~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~-- 151 (348) +....++..+.....++..|+..-+..+. +-..+. .....+++..++ -++.+.|+.. T Consensus 80 ~~~~~~i~~~~~~~~~~~~El~~a~~~g~---~l~~~k--------a~aA~~~~~~~~----------n~~~f~G~~~~g 138 (296) T protein:vir:10 80 TERQGKVFRFGNAFLISIDEIKVGQATGQ---SLSTRK--------QSLAFEAHDKLL----------DKLVWSGSTAHG 138 (296) T ss_pred eeEEEEEEEEEeeeeecHHHHHHHHHhCC---ChHHHH--------HHHHHHHHHHhh----------ceEEEeeccccc Confidence 56677888888888888877654433322 111110 111112222222 1233322211 Q ss_pred eEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHh--cC-CeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 152 NKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARE--LG-LNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 152 ~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~--~G-~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) .+.+ +..|.-...+.++.|.+++ .+++||.+....++. .| ..|.+++++++.+..|.+- . .+.+ T Consensus 139 ~~GL-lN~p~v~~~~~~~~W~~~t-~i~~Di~~~~~~l~~~s~g~~~p~~l~L~p~~~~~L~~~------~--~~~~--- 205 (296) T protein:vir:10 139 IPSV-FDYPNINNVVSGGSWSQPT-TAVSDITSLLDIIETSTNGQHRATHLLLPTTARRIMQNL------V--PGTS--- 205 (296) T ss_pred ceeE-eecCCCccccccCCccCHH-HHHHHHHHHHHHHHHhhCceecceeEEeCHHHHHHHhhc------c--CCCC--- Confidence 1111 1112222344566898876 789999999887643 35 4699999999999877321 0 1111 Q ss_pred ccHHHHHHHHHhh-cCceEEEEeeEEEcCCCcccccccCCeEEEEeCCc-cceeEeccchhhhccccccccccceeecCC Q lcl|Aclame:pro 229 VTKAELQNYVADN-YGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGP-LGNTVFGTTPEESDLFADNTVNADVEIVDS 306 (348) Q Consensus 229 ~~~~~~~~~~~~~-~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~-~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~ 306 (348) ++ +.+++... .+++|.... .+....|. ..+.+++...+. ...+.. ++ T Consensus 206 ~t---~l~~ik~~~~~l~i~~~~-~l~~a~~~-----g~~~~v~~~~~~~~~~~~v----------------------~~ 254 (296) T protein:vir:10 206 VS---YGEFFRQNNSGVTVEFVQ-YLNDYNGT-----GTSAAIAYEKDPNNMAIEI----------------------PE 254 (296) T ss_pred cc---HHHHHHHhcCCceEEEee-eeccCCCC-----cceEEEEEEcCCceEEEEc----------------------Cc Confidence 11 22233332 344454322 12222211 122333332211 111111 11 Q ss_pred ceEEEEeecCCCceeEEeeeeee-eeeecCCCcEEEEEEe--c Q lcl|Aclame:pro 307 GIAVTTTKTTDPVNVQTKVSMVA-LPSFERLGDVYMLTVI--P 346 (348) Q Consensus 307 ~~~~~~~~~~dP~~~~~~~~s~~-lPv~~~~~~~~~~~V~--~ 346 (348) .+....+ +............+. =.++.+|.+++.++=+ | T Consensus 255 ~~~~~~~-e~~~l~~~~~~~~~~~Gv~i~~P~ai~~~dGI~~~ 296 (296) T protein:vir:10 255 ATNALPA-QPKDLHFKIPVTSKATGLIVYRPLTMAVMKGITFA 296 (296) T ss_pred ceeeecc-cccCceEEEeeEeeEEEEEEECCceeEEEeeeecC Confidence 1111111 222333444444443 3677788888877533 3 No 50 >protein:vir:80446 Length: 367 # NCBI annotation: BcepGomrgp07 # Family: family:all:1522 # MgeID: mge:1882 # MgeName: BcepGomr # Cross-refs: genbank:acc:YP_001210227;genbank:gi:146329919;genbank:GeneID:5123555 Probab=59.51 E-value=0.39 Score=22.82 Aligned_cols=305 Identities=10% Similarity=-0.001 Sum_probs=120.6 Q ss_pred Ccc------chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCC-cceecc--- Q lcl|Aclame:pro 1 MGL------IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTN-VTIRDR--- 70 (348) Q Consensus 1 Ma~------l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~-~~~~~r--- 70 (348) ||. |.|+|.+..+..|+.+.+.....|+.+...-.. -++...-...+..+..||...-.+ ...... T Consensus 1 M~~~~~~T~l~Dii~pEvF~~Yv~~~~~e~~~l~qSGiv~~d----~~l~~~~~~gG~~v~iPf~~~L~g~~~n~~~d~~ 76 (367) T protein:vir:80 1 MPDFNNQVRLVDAVIPEVYTSYTAIDRPELTAFFLSGAVASN----DFLSQFLSAPGRLINIPFWRDLDSLEPNYGSDNP 76 (367) T ss_pred CcchhhhhhhhhccchhhhhHHHhhhhhhhhhhhhcceeecC----HHHHHHhhcCCCEEEeeeeccCCCCccccCCCCC Confidence 995 457899999999999877544444443333211 111111123455566677755422 221111 Q ss_pred ------cceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCee Q lcl|Aclame:pro 71 ------VSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKI 144 (348) Q Consensus 71 ------~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki 144 (348) ..+++..-.-..+...+...+.|+-.+.. |. ...+.+.++ +.+... ++.+.+....| +|.+ T Consensus 77 ~~~~t~~kittg~~~a~v~~r~kaw~~~Dla~~ls----G~-dpm~~Ia~q----va~yW~---r~~q~~Lla~L-~Gvf 143 (367) T protein:vir:80 77 NVEAPIDGLGSGEMKTTKTWLNKAYGAMDLTAELA----GS-NPMTRIRNR----FGVYWT---RQWQRRIIAMA-VGVY 143 (367) T ss_pred cccccccccccchheeeeehhcccchhhhHHHHhh----Cc-hHHHHHHHH----HHHHhh---hhhHHHHHHHH-HHhh Confidence 11122222234455556677777655432 22 233333333 332222 33333333333 3665 Q ss_pred eecCCceeEEE-e--------eccCccceeeeeecCCCC--CccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCH Q lcl|Aclame:pro 145 AFTSDGVNKDI-D--------YGVKADHKKQVSKSWAEP--GATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAA 213 (348) Q Consensus 145 ~~~~~~~~~~v-D--------fg~~~~~~~t~~~~W~~~--~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~ 213 (348) ..+..+....+ + .+.-..|....++.=.++ .-++-.-+. ....+-+.+-....++|.+.++..|.+.. T Consensus 144 ~~~~a~~~~~~~~~~~~~a~~~~~~~~~~~Dis~~t~~~~~~~s~~~~~~-A~~~lGD~~~~l~~i~mHS~V~~~L~~~~ 222 (367) T protein:vir:80 144 KSNLAGNFATIKTRGRVPAEVLGTAGDMVIDISGQTNPADAVFNREAFVD-AAFTMGDHVGSIAAIAVHSMVYKRMTNND 222 (367) T ss_pred ccccccchhhhhhhhccccccccccCceeeeeeccCCCccceecHHHHHH-HHHHhccccccccEEEEchHHHHHHHhcc Confidence 44332211111 0 111233444333221111 112222222 34455445556888999999999987763 Q ss_pred HHHHHhcccCCCcccccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccch-----h- Q lcl|Aclame:pro 214 STVKAIKPLAGDGSSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTP-----E- 287 (348) Q Consensus 214 ~v~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~-----~- 287 (348) +.+.+....++.. +..+.|..+++-|.-=.+..|... .-..+++..|.+ .||-.. | T Consensus 223 -li~~i~~sd~~~~----------i~ty~G~~VIvDD~~Pv~~~~a~~----~yttYlfg~GAi---~~~~~~~~~~~E~ 284 (367) T protein:vir:80 223 -EIEFIPDSKGQLT----------IPTYMGKVVIVDDGMPVFGTGADK----TYLSILFGGAAF---GYADGAPQVPVAV 284 (367) T ss_pred -ccccccCCCCccc----------cceecceeEEEeCCCcccccCCCc----eEEEEEEeccee---eecccCCccceec Confidence 4444443332111 444557666665543111111111 122334444433 233110 1 Q ss_pred hhccccccccccceeecCCceEEEE-eecCCCceeEEeeeeeee----------------ee---e---cCCCcEEEEEE Q lcl|Aclame:pro 288 ESDLFADNTVNADVEIVDSGIAVTT-TKTTDPVNVQTKVSMVAL----------------PS---F---ERLGDVYMLTV 344 (348) Q Consensus 288 ~~~~~~~~~~~~~~~~~~~~~~~~~-~~~~dP~~~~~~~~s~~l----------------Pv---~---~~~~~~~~~~V 344 (348) ..++..+.. .+..+.+.. -.--.|.+..-...+.+- |- + .+-+.++--|- T Consensus 285 ~Rd~~~~~~-------gG~d~L~~Rr~~~~hP~G~s~~~~~v~~~~~~~~~~~~~~~~~sPt~~eLa~~~NW~~v~d~K~ 357 (367) T protein:vir:80 285 GRRELRGNG-------SGLEYILERKEWIVHPGGFNWLDADVTIPDNTGSPSGITSGPPAITLANLANPDNWERVTYRKN 357 (367) T ss_pred ccchhhhcC-------CceEEEEeeeeEEeecceeeecccccccccccccccccccccCCCChHHhcCCcccccccchhh Confidence 111111000 001111111 111223333222111110 11 1 11222222233 Q ss_pred ecCC Q lcl|Aclame:pro 345 IPGV 348 (348) Q Consensus 345 ~~~~ 348 (348) ++=| T Consensus 358 I~iv 361 (367) T protein:vir:80 358 VPMA 361 (367) T ss_pred cceE Confidence 3322 No 51 >protein:vir:102944 Length: 330 # NCBI annotation: major head protein # Family: family:all:1522 # MgeID: mge:1461 # MgeName: EJ-1 # Cross-refs: genbank:acc:NP_945286;genbank:gi:39653721;uniprot:Q708M6;genbank:GeneID:2672858 Probab=58.36 E-value=0.41 Score=22.68 Aligned_cols=302 Identities=14% Similarity=0.111 Sum_probs=118.8 Q ss_pred Ccc----chhhcCHHHHHHHHHhhccchhhhHHHHhC-CCccccceeEEEEEeecCceeeeeeeeCC-CCccee-cc--- Q lcl|Aclame:pro 1 MGL----IYDKVTASNIAGYFNTLQENVDSTLGESIF-PARKQLGTKLSYIKGASGQSVALKAAAFD-TNVTIR-DR--- 70 (348) Q Consensus 1 Ma~----l~d~f~~~~l~~~i~~~~~~~~~~l~~~~F-p~~~~~~~~~~~~~~~~~~~~~a~~v~~~-~~~~~~-~r--- 70 (348) ||+ |.|+|+|..+..|+.+.+.....|+.+..+ |.-..... +.+ .|..+..|+...- +..... +. T Consensus 1 Ma~~~T~l~d~i~pevf~~yv~~~~~~~~~l~qSG~i~~~~~i~~~----~~~-~G~~i~~P~~~~l~G~~~~~~dg~~~ 75 (330) T protein:vir:10 1 MANELTKILDTITPQQYNAYMQQYTAAKSAFVQSGIAVSDERVSKN----ITS-GGLLVNMPFWNDLTGDSEVLGNGDKA 75 (330) T ss_pred CCCCceEeeeeechhHHHHHHHHHhHHhhhhhhcccccccHHHHHH----hhc-CCCEEEecccccCCCcccccCCCccc Confidence 995 679999999999998877433334333222 22111110 011 2333444444322 111111 11 Q ss_pred ---cceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 71 ---VSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 71 ---~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) +..++..-....++..+...+.|+-.+. . +. ...+.+.+++ ...+.++.+-+....|. |.+... T Consensus 76 i~~~ki~t~~~~a~i~~~~k~~~~tD~a~~~---~-g~-dp~~~i~~q~-------a~~w~~~~q~~lla~l~-gvf~~~ 142 (330) T protein:vir:10 76 LETGKITAGADIACVLYRGRGWAANELTGVV---A-GS-DPVRAILNRI-------GAYWLREDQKALIATLN-GIFATG 142 (330) T ss_pred cchhhcccceeEEEEEeecceeeehhhhhhh---c-ch-hHHHHHHHHH-------HHHhhhhHHHHHHHHHH-hhhhhh Confidence 1112222222223333445556654332 1 22 2233333333 23334444444444443 443321 Q ss_pred CCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS 227 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~ 227 (348) .....-. +. ..+..+.++ +.+.-+. +.|....+.+-+.......++|.+.++..|+++. ..+.+.....+. T Consensus 143 ~~~~~~~--~~--~~~~~~~~~--~~a~~s~-~~l~~A~~~~GD~~~~~~~ivmhS~v~~~L~~~~-li~~~~~s~~~~- 213 (330) T protein:vir:10 143 TAGEKGA--LE--ETHVSDQSK--ASTGIDA-GMVLDAKQLLGDSADQVTAIAMHSAVYTKLQKDN-LIQYIQPTTATI- 213 (330) T ss_pred hcccchh--hh--hhheecccc--cccccCH-HHHHHHHHHhccccccceEEEEcHHHHHHHHHhh-hhhhhcccccCc- Confidence 1111000 00 011111110 0011111 2244445555555456889999999999998754 344443322211 Q ss_pred cccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeE---ec-cchhhhc-cccccc-cccce Q lcl|Aclame:pro 228 SVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTV---FG-TTPEESD-LFADNT-VNADV 301 (348) Q Consensus 228 ~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~---yg-~~~~~~~-~~~~~~-~~~~~ 301 (348) .++.+.|.+|++=|.- . .++. ..+.+++-.|.++... -+ ...|.+. +..|.. ...+. T Consensus 214 ---------~i~~~~G~~VivdD~~-p-~~~~------~yt~yl~~~GAi~~~~~~~~~~v~~EtdRd~~~g~~~l~~r~ 276 (330) T protein:vir:10 214 ---------NIPTYLGYRVIIDDGI-A-PTGD------IYTSYLFRTGSIGLNTGNPSGLTTFETSREAAKGNDMIYTRR 276 (330) T ss_pred ---------ccccccceEEEEeCCC-C-CCCC------ceeEEEEecCceeeecccCCccccccccCCccccceEEEEee Confidence 1345567666654422 1 1111 1122233232221110 00 0112221 111110 00111 Q ss_pred eecCCceEEEEeec-------CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 302 EIVDSGIAVTTTKT-------TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 302 ~~~~~~~~~~~~~~-------~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .. --+..-.+|.+ ..|....+...+.+=.|. ++..+-++.+.--. T Consensus 277 ~~-~~hp~G~s~~~~~~~~~~~sPt~~~L~~~~NW~~v~-~~k~i~iv~~~~~~ 328 (330) T protein:vir:10 277 AL-VMHPYGVKWTGAEVDAGNITPSNADLAKFKNWKRVY-EPKNIGIIALKHKI 328 (330) T ss_pred EE-EeeeeeeeecccccccCcCCcChHHhcCCcCccccc-ChhhcceEEEEEec Confidence 10 01112234432 235555555555444443 45555555555555 No 52 >protein:vir:100135 Length: 418 # NCBI annotation: gp5 # Family: family:all:585 # MgeID: mge:1639 # MgeName: phi1026b # Cross-refs: genbank:acc:NP_945035;genbank:gi:38707895;genbank:GeneID:2744182 Probab=57.22 E-value=0.44 Score=22.54 Aligned_cols=277 Identities=13% Similarity=0.118 Sum_probs=122.2 Q ss_pred Cccc----hh-hcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGLI----YD-KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~l----~d-~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) .... .. ++.+.....+++.+ ... .-+.+ +.+..++.+........ ......|.++..+++.+... ..+.. T Consensus 135 ~~~~~~~~~g~lvp~~~~~~ii~~~-~~~-~~l~~-~~~~~~~~~~~~~~~~~-~~~~~~a~~v~E~~~~~~~~-~~f~~ 209 (418) T protein:vir:10 135 TVGSGVSGSNSLVVADRQAGIIAPP-QRK-MTIRD-LLMPGQTSSSSIEYTVE-TGFTNNAAAVAEGAQKPTSD-LKFNL 209 (418) T ss_pred hccCCCCCCccccchhHHHHHHHHH-hhh-hhHHh-hcceeeccCCceeEEEE-ecCCCceeeeccCccccccc-cceee Confidence 0000 01 12222223333333 222 22333 35555554444333332 22223456777776655443 46777 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-.+.-...++.+ +.+ +. .. +...+ ...+.+++...+|..++ +|. +.+.. . T Consensus 210 v~~~~~k~~~~~~is~e-ll~-----ds--~~----l~~~i---~~~l~~a~~~~~d~a~l----~G~----g~~~~--p 264 (418) T protein:vir:10 210 KNQPVRTIAHLFKASRQ-ILD-----DA--PA----LQSYI---DGRARYGLQLTEEGQIL----KGD----GTGAN--I 264 (418) T ss_pred EEEeeeeEEEeehhhHH-HHH-----hH--HH----HHHHH---HHHHHHHHHHHHHHHHh----ccC----CCCcc--c Confidence 77777777666666543 221 11 11 22222 23344555566654333 441 11110 0 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) .|.-.... ......+.++.+.+.||..+...+...+..+..++|++.+|..|.. +++. . +..+-+.... T Consensus 265 -~Gi~~~~~-~~~~~~~~~~~~~~~~i~~~~~~~~~~~~~~~~~v~n~~~~~~L~~---lkd~---~---G~~i~~~~~~ 333 (418) T protein:vir:10 265 -LGILPQAS-AFMPSITLANATPIDKIRLALLQAVLAEFPATGIVLNPIDWASIEL---TKDS---Q---GRYIVGNPVN 333 (418) T ss_pred -cccccccc-cccccccccccccHHHHHHHHHhhccccCCCCEEEEcHHHHHHHHH---hhcC---C---Cceecccccc Confidence 01100000 0111233345567788888877777677778889999999987743 2221 1 1111111111 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) ..-+.+.|+++++.+ .+|++.+++..... +...| .-. + ............ |. T Consensus 334 ~~~~~l~G~pV~~~~------------~~p~~~~~~gd~s~-~~~~~--~~~------~--~~i~~~~~~~~~----f~- 385 (418) T protein:vir:10 334 GTTPRLWNLPVVETQ------------AMTANEFLVGAFSM-AAQIF--DRM------E--IEVLLSTENVDD----FE- 385 (418) T ss_pred CCCceecceeeEEcC------------CCCCCcEEEeeccc-eEEEE--Eec------c--eEEEEecccchh----hh- Confidence 111234466665422 34566666553221 11111 000 0 000000000000 00 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) -.....++..+.=..+.+|++++.+++.+.+ T Consensus 386 --~~~~~~r~~~~~d~~~~~~~a~~~~~~~~~~ 416 (418) T protein:vir:10 386 --KNMVSIRAEERLALAVYRPESFVTGALVEQA 416 (418) T ss_pred --cCceEEEEEEeeccEEecccceEEEEeccCC Confidence 1123444555555678889999999999888 No 53 >protein:vir:107687 Length: 319 # NCBI annotation: hypothetical protein # Family: family:all:463 # MgeID: mge:1518 # MgeName: T1 # Cross-refs: genbank:acc:YP_003898;genbank:gi:45686314;genbank:GeneID:2773027 Probab=52.13 E-value=0.56 Score=21.95 Aligned_cols=277 Identities=11% Similarity=0.072 Sum_probs=118.8 Q ss_pred Cccch---hhcCHHHHHHHHHhh-ccchhhhHHHHhCCCccccce---eEEEEEeecCceeeeeeeeCCCCcceecccce Q lcl|Aclame:pro 1 MGLIY---DKVTASNIAGYFNTL-QENVDSTLGESIFPARKQLGT---KLSYIKGASGQSVALKAAAFDTNVTIRDRVSA 73 (348) Q Consensus 1 Ma~l~---d~f~~~~l~~~i~~~-~~~~~~~l~~~~Fp~~~~~~~---~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~ 73 (348) +.+-. -+|+..+|...-+.. ..+..++-..+|||....-+. .+.+.. ... .-.+...+..+.......-.+ T Consensus 24 ~~da~~~~g~~~~~ql~~id~~v~e~~~~~l~~~~~i~v~~~~~~~~~~~~~~~-~~~-~G~a~~~~d~~~dip~v~~~~ 101 (319) T protein:vir:10 24 KQDAAATMGIWTAQELHRIKSQSYEEDYPVGSALRVFPVTTELSPTDKTFEYMT-FDK-VGTAQIIADYTDDLPLVDALG 101 (319) T ss_pred hhhhhhhhhhHHHHHHHHHHHHHHhhhhcceechhhcccccCCCCceEEEEeee-ecc-ccceeeecCccccccceeccc Confidence 11111 267776766544322 223445667889986532221 111111 111 123444555444322222344 Q ss_pred eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce-- Q lcl|Aclame:pro 74 EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV-- 151 (348) Q Consensus 74 ~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~-- 151 (348) +....+++.+...+.++..|+...+..+-.-.... .....+++...+ -++.+.|+.. T Consensus 102 ~~~~~~i~~~~~~~~~~~~El~~a~~~g~~l~~~k-----------~~aA~~~~~~~~----------n~i~f~G~~~~g 160 (319) T protein:vir:10 102 TSEFGKVFRLGNAYLISIDEIKAGQATGRPLSTRK-----------ASACQLAHDQLV----------NRLVFKGSAPHK 160 (319) T ss_pred eeeEEEEEEEEeeeeecHHHHHHHHHhCCChHHHH-----------HHHHHHHHHHhh----------ceEEEeeccccc Confidence 56677888888899999888765443332211111 111112222222 1333333211 Q ss_pred eEEEeeccCccceeeeeecCCC-CCc---cHHHHHHHHHHHHHh-c-C-CeeEEEEeCHHHHHHHhcCHHHHHHhcccCC Q lcl|Aclame:pro 152 NKDIDYGVKADHKKQVSKSWAE-PGA---TPLADLEDAIETARE-L-G-LNPERAIMNAKTFGLIRKAASTVKAIKPLAG 224 (348) Q Consensus 152 ~~~vDfg~~~~~~~t~~~~W~~-~~a---dp~~di~~~~~~~~~-~-G-~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~ 224 (348) .+.+ +..|.-...+. ..|.+ ++. .+++||.+....+.. + | ..|.+++++++.|..|..- .. T Consensus 161 ~~GL-lN~p~~~~~~~-~~~~~~~t~t~~~i~~di~~~~~~l~~~s~g~~~p~~L~L~p~~~~~L~~~----------~~ 228 (319) T protein:vir:10 161 IVSV-FNHPNITKITS-GKWIDVSTMKPETAEAELTQAIETIETITRGQHRATNILIPPSMRKVLAIR----------MP 228 (319) T ss_pred ceeE-EeCCCceeeec-CCCCCccccCHHHHHHHHHHHHHHHHHhcCceeeceEEEecHHHHHhhhcc----------cC Confidence 1111 11222222233 34433 333 467899888877653 3 5 3699999999999887321 01 Q ss_pred CcccccHHHHHHHHHhh-cCceEEEEeeEEEcCCCcccccccCCeEEEEeCCc-cceeEeccchhhhcccccccccccee Q lcl|Aclame:pro 225 DGSSVTKAELQNYVADN-YGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGP-LGNTVFGTTPEESDLFADNTVNADVE 302 (348) Q Consensus 225 ~~~~~~~~~~~~~~~~~-~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~-~G~~~yg~~~~~~~~~~~~~~~~~~~ 302 (348) +.+. .+.+++... .+++|..... +.+..|.. .+.+++...+. ......+ T Consensus 229 ~~~~----t~l~~lk~~~~~l~I~~~pe-l~~ag~~g-----~~~~v~y~~~~~~~~~~v~------------------- 279 (319) T protein:vir:10 229 ETTM----SYLDYFKSQNSGIEIDSIAE-LEDIDGAG-----TKGVLVYEKNPMNMSIEIP------------------- 279 (319) T ss_pred CCCe----eHHHHHHHhcCCceEEEeee-ecccCCCc-----ceEEEEEecCCceEEEecC------------------- Confidence 1111 122233332 2445544332 22222111 12233332211 0111110 Q ss_pred ecCCceEEEEeecCCCceeEEeeeeee-eeeecCCCcEEEEEEe Q lcl|Aclame:pro 303 IVDSGIAVTTTKTTDPVNVQTKVSMVA-LPSFERLGDVYMLTVI 345 (348) Q Consensus 303 ~~~~~~~~~~~~~~dP~~~~~~~~s~~-lPv~~~~~~~~~~~V~ 345 (348) +.+-.... +..+....+....+. =.++.+|.++..++=+ T Consensus 280 ---~~~~~~~~-e~~~l~~~~~~~~r~~Gv~i~~P~ai~~~dGI 319 (319) T protein:vir:10 280 ---EAFNMLPA-QPKDLHFKVPCTSKCTGLTIYRPMTIVLITGV 319 (319) T ss_pred ---cceeeeee-eecCceEEEeeeeeeEEEEEEccceeEeeecC Confidence 11111111 222233333333332 2556778888877766 No 54 >protein:vir:79928 Length: 393 # NCBI annotation: major head protein # Family: family:all:30335 # MgeID: mge:1874 # MgeName: 0305phi8-36 # Cross-refs: genbank:acc:YP_001429616;genbank:gi:156564106;genbank:GeneID:5525693 Probab=51.44 E-value=0.58 Score=21.88 Aligned_cols=288 Identities=10% Similarity=0.050 Sum_probs=105.0 Q ss_pred Cccch-hhcCHHHHHHHHHhhccchhhhHHHHhCCCccc-cceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEe Q lcl|Aclame:pro 1 MGLIY-DKVTASNIAGYFNTLQENVDSTLGESIFPARKQ-LGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDE 78 (348) Q Consensus 1 Ma~l~-d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~-~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~ 78 (348) |+.-. .+.=|+.|...+.+...|. ++...+|-...- .....+++... ..-|-=++.+.+-+ ..+.+-.++ T Consensus 74 mtt~~a~IliP~vis~v~~Eaaepl--~~~~kl~qk~~L~~Grsm~F~~~g---~~Ra~~IgEGgE~~---~~sld~~T~ 145 (393) T protein:vir:79 74 MATPSAQILIPRVIVGTMREAAEPL--YIGTKMLQKIRLKSGQSMIFPSIG---IMRAYDVAEGQEIP---EDSIDWQTH 145 (393) T ss_pred hcCCCcceechhhhhhhhhhcccch--hHHHHHHHHHhhhcCcceeccchh---eeeecccccccccc---ccchhhhcC Confidence 55432 3455677888888876543 566666643221 22222222111 00011112222211 111121222 Q ss_pred ecccccc-----ccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhc-CeeeecCCcee Q lcl|Aclame:pro 79 QMPFFKE-----ALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLAT-GKIAFTSDGVN 152 (348) Q Consensus 79 ~~p~i~~-----~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~-Gki~~~~~~~~ 152 (348) +-+.++. +..++.+ .+-+++ .+.+.--+....++..+..|..|...+.+ |...+++ T Consensus 146 dsv~~~~gK~G~~Ia~SqE------mIsDSg--------~Dvin~~l~aA~RaMaRkKee~a~n~fk~~ghtvfDa---- 207 (393) T protein:vir:79 146 ESPEIRVGKSGIRLRFTDE------MISDSQ--------WDLMSMMIKQAGRAMGRHKEQKAYHQFRSHGHTVFDN---- 207 (393) T ss_pred CceeEEechhhhhhhhHHH------Hhhcch--------HHHHHHHHHHHHHHHHhhhHHHHHhhhhcccceeeec---- Confidence 2222222 2222211 111111 11222223444566666677777766543 4443332 Q ss_pred EEEeeccCccceeeeee--cCCC-CCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc-- Q lcl|Aclame:pro 153 KDIDYGVKADHKKQVSK--SWAE-PGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS-- 227 (348) Q Consensus 153 ~~vDfg~~~~~~~t~~~--~W~~-~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~-- 227 (348) .++.-..-+++ .-+. .+-=-++||..+.=.+...+++|++++|++-+|+.|.+|+.+-....+--++.+ T Consensus 208 ------~st~t~ahptGr~~~~~qNGTlSleDllDm~~av~~~hyt~svi~MHPLAWnv~AKna~me~~~~na~gN~~~~ 281 (393) T protein:vir:79 208 ------YSTNKLAHTTGLDKNGVQNDTFSAEDFLDLIIAVMANEYTPSDLMMHPLAWTVFAKNELMGSLQANPYGNYPAK 281 (393) T ss_pred ------cccCccceeecCCccccccccccHHHHHHHHHHHhcccCCcceEEEcCchhhhhhhhhhhcceeeccccccCcc Confidence 11111111222 1122 222346789998878888999999999999999999999765332211111110 Q ss_pred --cccHHHHHHHHHhhc--Cc-----eEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEe--ccchh-hhcccccc Q lcl|Aclame:pro 228 --SVTKAELQNYVADNY--GV-----EIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVF--GTTPE-ESDLFADN 295 (348) Q Consensus 228 --~~~~~~~~~~~~~~~--~~-----~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~y--g~~~~-~~~~~~~~ 295 (348) .-+.....+...... .+ +|+.||.. .++| .+..+..+..|-+.- +.+.+ -+++..+. T Consensus 282 ~~~ts~algp~~i~~~~~~nlnv~~sPfvp~d~k-------~~rF----d~~~Vd~NnvgvlLV~D~i~tdq~ddk~rdi 350 (393) T protein:vir:79 282 GAPSSMALGPDSIQGRLPFNFNVNLSPFIPLDKK-------SRRF----DVYAVDRNNVGVLLVRDDLKTDQWDEKARGL 350 (393) T ss_pred ccchhhhhchhhhccccccceeEEEecccccccc-------ccee----eEEEeecCCceEEEEecCcceeccccccccc Confidence 001112222222221 11 22333322 2222 111111121121110 00000 01111110 Q ss_pred cc---ccc----eeecCCceEEEEeecCCCceeEEeeeeeeeeeecCCC Q lcl|Aclame:pro 296 TV---NAD----VEIVDSGIAVTTTKTTDPVNVQTKVSMVALPSFERLG 337 (348) Q Consensus 296 ~~---~~~----~~~~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~ 337 (348) .. ..+ +-..+.++++-+-. ..+..-..|+-+-..-| T Consensus 351 q~iKl~ERYG~gvLn~gkaiavakNI------~~~k~y~~P~~~~~~~~ 393 (393) T protein:vir:79 351 QNIKMIERYGIGILNEGKAIAVAKNI------SMDKSYAEPMLIKNVGN 393 (393) T ss_pred eeeeeeeeeceeeeeCCceEEEEecc------eeecccccchhhhccCC Confidence 00 000 00122233322110 01111112221111111 No 55 >protein:vir:4953 Length: 397 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:108 # MgeName: Sfi19 # Cross-refs: genbank:acc:NP_049929;genbank:gi:9632900;genbank:GeneID:1262076 Probab=48.59 E-value=0.66 Score=21.56 Aligned_cols=268 Identities=11% Similarity=-0.007 Sum_probs=116.8 Q ss_pred Cccch----hhcCHHHHHHHHHhhccchhhhHHHHhCCCcccc--ceeEEEEEeecCceeeeeeeeCCCCcceeccccee Q lcl|Aclame:pro 1 MGLIY----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQL--GTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAE 74 (348) Q Consensus 1 Ma~l~----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~--~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~ 74 (348) |.... .+.-|.++..-|.+......+ |.+ +....++. ..++....... ....|.++..++..+-.....+. T Consensus 109 ~~~~t~~~gg~~vP~~~~~~ii~~~~~~~~-l~~-~~~~~~~~~~~~~~~~~~~~~-~~~~a~~v~E~~~~~~~~~~~~~ 185 (397) T protein:vir:49 109 KTDASGSDAGLTIPQDIQTAIHTLVSQYDS-LQE-YVNVENVTTLTGSRVYEKWTD-ITGLANIDDEAGKIADVDDPKLS 185 (397) T ss_pred hhccccccCcccccHhHHHHHHHHHHhhhh-HHh-hhceeecccCccceEEEeecc-CCcceeeecCcccccccccccee Confidence 32211 122344444444333333222 323 23333322 22233222222 22346777777666654555677 Q ss_pred eeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEE Q lcl|Aclame:pro 75 IHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKD 154 (348) Q Consensus 75 ~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~ 154 (348) ...+.+-.+.-...++.+=+. ++ .. .+...+ ..++.+++.+.+|.......-+|+ T Consensus 186 ~i~~~~~k~~~~~~iS~ell~------ds-~~----~l~~~i---~~~l~~~~~~~~d~ai~~G~g~~~----------- 240 (397) T protein:vir:49 186 LIKYTIKRYAGISTVTNSLLA------DS-AE----NILAWL---SGWIAKKVVVTRNKAILEAIAALP----------- 240 (397) T ss_pred eEEeeeeeEEeeehhHHHHHh------hh-HH----HHHHHH---HHHHHHHHHHHHHHHHHhhccccc----------- Confidence 777777766666666543221 11 01 122222 233455666666655443221110 Q ss_pred EeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHH Q lcl|Aclame:pro 155 IDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAEL 234 (348) Q Consensus 155 vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~ 234 (348) ...+....++|.++...+...+.....++|++.+|..|++- ++. + +...+.+... T Consensus 241 -----------------~~~~~~~~d~i~~~~~~l~~~~~~~a~~vmn~~~~~~l~~l---kd~----~-G~~l~~~~~~ 295 (397) T protein:vir:49 241 -----------------TKPTLTKWDDIIDLEAKVDPAIKQTSFFLTNTSGFTALKKV---KNA----L-GDYLMERDVK 295 (397) T ss_pred -----------------cccccccHHHHHHHHHhhhhhhcCCCEEEEcHHHHHHHHHh---hcC----C-CceeeccCcC Confidence 00122345566666666655555567899999999877542 221 1 1111111111 Q ss_pred HHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEE-- Q lcl|Aclame:pro 235 QNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTT-- 312 (348) Q Consensus 235 ~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~-- 312 (348) ...-..+.|.++++.+..+.. ++.. ++..++|..... +...+ . ..++-+.. T Consensus 296 ~~~~~~l~G~PV~~~~~~~~~-~~~~----~~~~i~~gd~~~-~~~~~-~--------------------~~~~~i~~~~ 348 (397) T protein:vir:49 296 SPTGYSIDGFAVKEVADRWLA-NGTG----GAMPLYFGDLKQ-AVTLF-D--------------------RQHMSLLSTN 348 (397) T ss_pred CCCCceecceeeEEecccccc-cccC----CceeEEEeeccc-eEEEE-e--------------------ecceEEEEec Confidence 111123457777766544322 1111 111222221111 00000 0 00011100 Q ss_pred ee--cCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 313 TK--TTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 313 ~~--~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) +. ...-......+..+.=..+.+|++++++++.+-. T Consensus 349 ~~~~~~~~~~~~~r~~~r~d~~~~~~~a~~~~~~~~~~ 386 (397) T protein:vir:49 349 IGGGAFETDTTKVRVIDRFDVVATDTEAFVPASFKAIA 386 (397) T ss_pred cccchhhcCceeEEEEeeeCcEEecccceEEEEeeccc Confidence 00 0000124455666777788899999999988655 No 56 >protein:vir:10364 Length: 390 # NCBI annotation: head protein; major capsid subunit precursor # Family: family:all:585 # MgeID: mge:183 # MgeName: Xp10 # Cross-refs: genbank:acc:NP_858956;genbank:gi:32128421;genbank:GeneID:2648357 Probab=47.03 E-value=0.71 Score=21.38 Aligned_cols=270 Identities=11% Similarity=0.085 Sum_probs=123.1 Q ss_pred Cccch---h-hcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeee Q lcl|Aclame:pro 1 MGLIY---D-KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIH 76 (348) Q Consensus 1 Ma~l~---d-~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~ 76 (348) +..-. . ++-+..+..++..+ ....+ +.+ +.+..++....+.+... .+....+.++..++..+-.. ..+... T Consensus 114 ~~~~~~~~g~~~~~~~~~~ii~~~-~~~~~-l~~-~~~~~~~~~~~~~~~~~-~~~~~~a~~v~Eg~~~~~~~-~~~~~i 188 (390) T protein:vir:10 114 STDAAGSAGALTTPNRLPGFITQP-DARLT-VRD-LIGSGRTDSALIEYVQE-TGFVNNAAIVAEGALKPESS-LKFAKK 188 (390) T ss_pred hcccccccccccchhHHHHHHHHH-Hhhch-hhh-hcceeeccCCceEEEEE-ecCCcceeeecCCccccccc-cceeEE Confidence 11100 1 23333444444433 22223 333 35555544444443332 22223456777776655443 457777 Q ss_pred EeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEe Q lcl|Aclame:pro 77 DEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDID 156 (348) Q Consensus 77 ~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vD 156 (348) .+.+-.+.-...++.+ +++ +. .. +...+ ...+.+++.+.++..++ +|.-+ +.. ...+- T Consensus 189 ~~~~~k~~~~~~is~e-ll~-----d~--~~----l~~~i---~~~l~~~~~~~~~~~il----~G~G~--~~~-p~Gi~ 246 (390) T protein:vir:10 189 TDTTHVIAHTMKATRQ-ILS-----DA--PQ----LASYM---NNRLIRGLKVKEDAEIL----RGTGA--NDG-LLGLI 246 (390) T ss_pred EEeeEEEEEeehhhHH-HHH-----hH--HH----HHHHH---HHHHHHHHHHHHHHHHh----hcCCC--Ccc-ccccc Confidence 7777777766666543 211 11 11 22222 23344555566654333 34211 000 01110 Q ss_pred eccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHH Q lcl|Aclame:pro 157 YGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQN 236 (348) Q Consensus 157 fg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~ 236 (348) ..... ....-..++.+++.+|..+...+...+..+..++|++..|..|.+ +++.-. ...+.+ .... T Consensus 247 ---~~~~~--~~~~~~~~~~~~~~~~~~~~~~l~~~~~~~~~~v~n~~~~~~L~~---lkd~~g-----~~l~~~-~~~~ 312 (390) T protein:vir:10 247 ---PQATT--YAAPTTIAGATRVDQLRLAMLQASLAEYPASGIVINPIDWAAIEL---AKDANN-----QYLIGN-ARGT 312 (390) T ss_pred ---ccccc--ccccccccccchHHHHHHHHHhhccccCCCCEEEEcHHHHHHHHH---hhcCCC-----ceeecC-CcCc Confidence 00000 000112234567888888887777777778889999999987753 222211 111111 0000 Q ss_pred HHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecC Q lcl|Aclame:pro 237 YVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTT 316 (348) Q Consensus 237 ~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 316 (348) .-..+.|+++++.+ .+|++.+++.-... +...+ ...++.+....+. T Consensus 313 ~~~~l~G~pv~~~~------------~~p~~~~~~gdf~~-~~~~~---------------------~~~~~~i~~~~~~ 358 (390) T protein:vir:10 313 LTPTLWGLPVVATQ------------AMAPGEFLVGAFDL-AAQIF---------------------DQWDARVEIGYVN 358 (390) T ss_pred CCceecceeeEEcC------------CCCCCcEEEEeccc-eEEEE---------------------EecceEEEEeecc Confidence 00123466665432 24566665543221 11111 0011111111111 Q ss_pred CC---ceeEEeeeeeeeeeecCCCcEEEEEEe Q lcl|Aclame:pro 317 DP---VNVQTKVSMVALPSFERLGDVYMLTVI 345 (348) Q Consensus 317 dP---~~~~~~~~s~~lPv~~~~~~~~~~~V~ 345 (348) +. .....++..+.=..+.+|++++.+++= T Consensus 359 ~~~~~~~~~~r~~~r~d~~v~~~~a~~~~~~a 390 (390) T protein:vir:10 359 DDFQRNMVTVLAEERLALVVYRPEALISGSFA 390 (390) T ss_pred cccccCcEEEEEEEeeccEEeccccEEEEEeC Confidence 11 234555677777888999999888877 No 57 >protein:vir:4856 Length: 293 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:106 # MgeName: DT1 # Cross-refs: genbank:acc:NP_049396;genbank:gi:9632424;genbank:GeneID:1258532 Probab=46.23 E-value=0.74 Score=21.29 Aligned_cols=272 Identities=11% Similarity=-0.031 Sum_probs=118.2 Q ss_pred Cccchh----hcCHHHHHHHHHhhccchhhhHHHHhCCCccccce--eEEEEEeecCceeeeeeeeCCCCcceeccccee Q lcl|Aclame:pro 1 MGLIYD----KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGT--KLSYIKGASGQSVALKAAAFDTNVTIRDRVSAE 74 (348) Q Consensus 1 Ma~l~d----~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~--~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~ 74 (348) |+.... ++-|.++..-|.+....... +.+ +....++... ++....... ....|.++..+.+.+-.+...+. T Consensus 5 ~~~~t~~~gg~liP~~~~~~Ii~~~~~~~~-l~~-~~~~~~~~~~~g~~~~~~~~~-~~~~a~~v~Eg~~~~~~~~~~~~ 81 (293) T protein:vir:48 5 KTDHSGSDAGLTIPQDIRTAINTLVRQYDS-LQE-YVNVENVTTLTGSRVYEKWTD-ITGLANIDDEAGKIADIDDPKLS 81 (293) T ss_pred ecccccCcCceEechhHHHHHHHHHHhhhh-hhh-hceeeeccCCcceEEEEeecC-CCcceeeecCCccccccccccee Confidence 554321 34455655434333333332 333 3444333322 233332222 22346788877776655555677 Q ss_pred eeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEE Q lcl|Aclame:pro 75 IHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKD 154 (348) Q Consensus 75 ~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~ 154 (348) ...+.+-++.....++.+-++. .. .+ +...+ ..++.+++.+.++..+...+.++ T Consensus 82 ~i~l~~~k~~~~~~iS~ell~d------s~-~~----l~~~i---~~~la~~~~~~~~~~i~~g~~~~------------ 135 (293) T protein:vir:48 82 LIKYTIKRYAGISTVTNSLLAD------SA-EN----ILAWL---SGWIAKKVVVTRNKAILGVVDKL------------ 135 (293) T ss_pred EEEEeeeEEEEeehhhHHHHhh------hh-HH----HHHHH---HHHHHHHHHHHHHhHHhhccccc------------ Confidence 7777777777666665443221 11 11 11222 12233444455554443222100 Q ss_pred EeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHH Q lcl|Aclame:pro 155 IDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAEL 234 (348) Q Consensus 155 vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~ 234 (348) + ..++....+||.++...+...+......+|++.+|..|++ +++. + +.....+... T Consensus 136 -------------~---~~~~~~~~d~i~~~~~~l~~~~~~~a~~vmn~~~~~~L~~---lkd~----~-g~~l~~~~~~ 191 (293) T protein:vir:48 136 -------------P---TKPTLTKWDDIIDLEAKVDPAIKQTSFFLTNTSGFTALKK---VKNA----L-GDYLMERDVK 191 (293) T ss_pred -------------c---ccccccCHHHHHHHHHhhhhhhcCCCEEEEcHHHHHHHHH---hhcc----C-CceEeecCcC Confidence 0 1123334567777766665444455678999999987754 2222 1 1111111111 Q ss_pred HHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEee Q lcl|Aclame:pro 235 QNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTK 314 (348) Q Consensus 235 ~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 314 (348) +..-..+.|.++++.+..+....+. .+..++|..-.. +.... .-+. ..+...+. .-+.|. T Consensus 192 ~~~~~~l~G~Pv~~~~~~~~~~~~~-----~~~~~~~gd~~~-~~~~~--~~~~----------~~i~~~~~--~~~~~~ 251 (293) T protein:vir:48 192 SPTGYSIAGFAVKEISDRWLPNASS-----GVMPLYFGDLKQ-AVTLF--DRQQ----------MSLLSTNI--GGGAFE 251 (293) T ss_pred CCCCceecceeeEEecccccCCccC-----CceEEEEEeccc-eEEEE--Eecc----------eEEEEecc--cchhhh Confidence 1111234577777665544321111 011122221110 00000 0000 00000000 000011 Q ss_pred cCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 315 TTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 315 ~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) -......+..+.=..+.+++++..+++.+-+ T Consensus 252 ---~~~~~~r~~~r~d~~~~~~~a~~~l~~~~~~ 282 (293) T protein:vir:48 252 ---TDTTKVRVIDRFDVVATDTEAFVPASFKAIA 282 (293) T ss_pred ---cCeEEEEEEEeeCcEEecccceEEEEeeccc Confidence 1134455556666778899999999987655 No 58 >protein:vir:1268 Length: 397 # NCBI annotation: hypothetical protein # Family: family:all:21 # MgeID: mge:329 # MgeName: phi-105 # Cross-refs: genbank:acc:NP_690760;genbank:gi:22855000;genbank:GeneID:955203 Probab=45.83 E-value=0.76 Score=21.25 Aligned_cols=264 Identities=10% Similarity=0.029 Sum_probs=108.0 Q ss_pred Cccchh----hcCHHHHHHHHHhhccchhhhHHHHhCCCccccc--eeEEEEEeecCceeeeeeeeCCCCcceeccccee Q lcl|Aclame:pro 1 MGLIYD----KVTASNIAGYFNTLQENVDSTLGESIFPARKQLG--TKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAE 74 (348) Q Consensus 1 Ma~l~d----~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~--~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~ 74 (348) |..... ++-|.++...|-+......+ +.+ +.+...+.. .++.... .. ....|.++..++..+-.....+. T Consensus 123 ~~~~~~~~gg~lvP~~~~~~ii~~~~~~~~-l~~-~~~~~~~~~~~~~~~~~~-~~-~~~~a~~v~Eg~~~~~~~~~~~~ 198 (397) T protein:vir:12 123 MSGINDEDGGILIPEDIGRQIHEFKRQFEP-LEQ-YVTVEPVTTRSGTRLLEK-NA-DMVPFSPVEELGNLPEIDQPRFT 198 (397) T ss_pred ccccccccCcccCchhHHHHHHHhhhhhhh-HHh-hcceeeccCCceeEEEEE-ec-CCcceeeecccccccccccccce Confidence 222110 12233444333333333222 322 233333322 2222221 12 22246677777665544445666 Q ss_pred eeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEE Q lcl|Aclame:pro 75 IHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKD 154 (348) Q Consensus 75 ~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~ 154 (348) ...+.+-+++.-..++.+=+ .++. .. +...+ ...+.+++.+.+|.++....-+|+ T Consensus 199 ~v~~~~~k~~~~~~is~e~l------~ds~-~~----l~~~i---~~~l~~~~~~~~d~~il~G~g~~~----------- 253 (397) T protein:vir:12 199 KVSYSIIDYGGIMTLSNSML------NDSD-QA----IMTYV---AKWFAKKSVVTRNNLILAAIASLK----------- 253 (397) T ss_pred eEEeeheeeEeeehhhHHHH------hhch-HH----HHHHH---HHHHHHHHHHHHHHHHHhcccccc----------- Confidence 67777766666655554322 1111 11 12222 233445555666655443211110 Q ss_pred EeeccCccceeeeeecCCCCCccHHHHHHHHHH-HHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHH Q lcl|Aclame:pro 155 IDYGVKADHKKQVSKSWAEPGATPLADLEDAIE-TARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAE 233 (348) Q Consensus 155 vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~-~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~ 233 (348) | .+..-++||..... .+.........++|++..|..|+. +++. ++ .....+.. T Consensus 254 -----~-------------~g~~~~~~i~~~~~~~l~~~~~~~a~~~~n~~~~~~L~~---lkd~----~G-~~l~~~~~ 307 (397) T protein:vir:12 254 -----K-------------VDIDGLDGIKKALNVTLDPMVAPGSIVLTNQDGYDWLDT---LKDG----TG-RYLLQPDP 307 (397) T ss_pred -----c-------------cccccHHHHHHHHhhccchhhhCCCEEEEcHHHHHHHHH---hhcc----CC-ceeecccc Confidence 0 11122445555432 232222234568899999988753 2222 11 11111111 Q ss_pred HHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEe Q lcl|Aclame:pro 234 LQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTT 313 (348) Q Consensus 234 ~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 313 (348) .+..-..+.|.++++.+......+. .+..++|..... +...+ . ..++.+..- T Consensus 308 ~~g~~~~l~G~pv~~~~~~~~~~~~------~~~~~~~gd~~~-~~~~~--~-------------------~~~~~i~~~ 359 (397) T protein:vir:12 308 TNPTKKLLDGRPVVPFTNRVLKTQK------GKAPLIIGNLKE-AIVLF--D-------------------REQQSIAST 359 (397) T ss_pred cCCCCccccceeeEEecccccccCC------CccEEEEEehhc-eEEEE--e-------------------ecceEEEEe Confidence 1111123456677665432211111 111122222111 00000 0 000001000 Q ss_pred ec----CCCceeEEeeeeeeeeeecCCCcEEEEEEecC Q lcl|Aclame:pro 314 KT----TDPVNVQTKVSMVALPSFERLGDVYMLTVIPG 347 (348) Q Consensus 314 ~~----~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~ 347 (348) .+ ..-....+++..+.=..+.+|+++++++++++ T Consensus 360 ~~~~~~f~~~~~~~r~~~r~d~~~~~~~a~~~~~~t~~ 397 (397) T protein:vir:12 360 DTGAGAFETNSTKVRGIEREDVRKWDEDAVVFGQITVE 397 (397) T ss_pred ccccchhhcCceEEEEEEeeccEEecccceEEEEEeeC Confidence 00 00123455566666678889999999999999 No 59 >protein:vir:9875 Length: 296 # NCBI annotation: hypothetical protein # Family: family:all:1178 # MgeID: mge:177 # MgeName: 315.5 # Cross-refs: genbank:acc:NP_795637;genbank:gi:28876404;genbank:GeneID:1257935 Probab=45.48 E-value=0.77 Score=21.21 Aligned_cols=276 Identities=16% Similarity=0.159 Sum_probs=123.2 Q ss_pred Cccch-----hhcCHHHH-----HHHHHhhccchhhhHHHH-----hCCCccccceeEEEEEeecCceeeeeeeeCCCCc Q lcl|Aclame:pro 1 MGLIY-----DKVTASNI-----AGYFNTLQENVDSTLGES-----IFPARKQLGTKLSYIKGASGQSVALKAAAFDTNV 65 (348) Q Consensus 1 Ma~l~-----d~f~~~~l-----~~~i~~~~~~~~~~l~~~-----~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~ 65 (348) |-.-+ ++.+...| ..+++.....-.. |.+. +-|-.. +...+.+.. -....-|.-|+.+... T Consensus 1 ~~~~~~~~e~nlt~~~dl~~~~siDf~~~f~~~i~~-L~~~LGv~r~~pla~--GstIkt~k~-~~y~gda~dVaEGe~I 76 (296) T protein:vir:98 1 MVTSRTYPEENLIKSTDLKYPITIDVTNKFQENISK-LLEMLGVTRKISVSE--GMTLKTYAG-YDVTLAEGNVPEGEVI 76 (296) T ss_pred CCCccccCcCCCcchhhhhhhhhhhhHHHHhhhHHH-HHHHhhhcccccccC--CCEEeeccc-eeeeeccccccCCccc Confidence 33221 11122222 2223333222111 2222 222211 222211110 0111123345566655 Q ss_pred ceecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeee Q lcl|Aclame:pro 66 TIRDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIA 145 (348) Q Consensus 66 ~~~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~ 145 (348) |+.+-..-.....++..-|-.+.++.+-++ + +|-..+ +.+-..+|..+|.+...--+..+|.+|+-+ T Consensus 77 plskvt~~~~~t~t~~ikK~rK~tTdEAIq-l-----sGyg~a-------Vgetd~qL~~~iq~kId~d~~t~LktaT~t 143 (296) T protein:vir:98 77 PLSKVERKIHSEKKIELKKYRKATTGEDIQ-M-----YGSNEA-------VTNTDNALVRQLQKKIRTDFVTALKTGTGT 143 (296) T ss_pred chhhheeeecceEEEEeeccccccCHHHHH-h-----hcCCch-------hHHHHHHHHHHHHHhhhHHHHHHHhcccce Confidence 554433222223333333333445543321 1 111111 222344456666676666778888765421 Q ss_pred ecCCceeEEEeeccCccceeeeeecCCCCCccHHHHHH-HHH---HHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcc Q lcl|Aclame:pro 146 FTSDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLE-DAI---ETARELGLNPERAIMNAKTFGLIRKAASTVKAIKP 221 (348) Q Consensus 146 ~~~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~-~~~---~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~ 221 (348) .+.+ .....+-|. .|. +...+.+....+++++|.=...+++++.+-. T Consensus 144 -------------------~~~t------~~~lQ~Ala~~~~~l~~~feded~~~~V~FVnP~D~a~ylg~a~it~---- 194 (296) T protein:vir:98 144 -------------------QDAL------GAGLQGALASAWGKLQVLFEDYGSERAIVFANSLDVAEYIAKAGITT---- 194 (296) T ss_pred -------------------eeec------hhhHHHHHHHHhhhhhhhccccCCCceEEEEehHHHHHHhcCCccch---- Confidence 1110 001111121 122 2344445457777888877766666664310 Q ss_pred cCCCcccccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccce Q lcl|Aclame:pro 222 LAGDGSSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADV 301 (348) Q Consensus 222 ~~~~~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~ 301 (348) +. .+. -.|+..+.|.+|+. .+-+|++++++.|.+++ ..+|.+.- ..+.......+ T Consensus 195 -qt---~fG----~tyl~nfLG~~II~------------S~kV~~G~~~~T~~~Ni-~~ay~~~~-~~~l~~~f~~~--- 249 (296) T protein:vir:98 195 -QT---AFG----LTYLVDFTGTVIIS------------TNDVTKGEIWATVPENI-IFAYINPN-NSELAKEFNLY--- 249 (296) T ss_pred -hh---eec----hhhhhhccccEEEE------------cCcCCCceEEEeeecce-EEEeeccc-ccchhhhhccc--- Confidence 00 111 12233334544422 23378888999888775 34443321 11111111111 Q ss_pred eecCCc-eEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 302 EIVDSG-IAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 302 ~~~~~~-~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ..+.| |-+.+-...+.....+..-+...--|..+|+++++++.|+| T Consensus 250 -~d~tglIGv~h~~~~~~~t~eT~~~~~~~lfpE~~dgiv~~tI~~~~ 296 (296) T protein:vir:98 250 -GDPTGYIGMNHFQENTTLTIQTLLVSGMLMYPERIDGIVKVTLTPGV 296 (296) T ss_pred -cccccceEEEeccccceeeehhHhHhHHHhcccccceEEEEEecCCC Confidence 12233 33555556666777777778888889999999999999999 No 60 >protein:vir:102655 Length: 322 # NCBI annotation: Hypothetical protein # Family: family:all:6384 # MgeID: mge:1624 # MgeName: VP2 # Cross-refs: genbank:acc:YP_052979;genbank:gi:50282923;genbank:GeneID:2948122 Probab=45.46 E-value=0.77 Score=21.21 Aligned_cols=281 Identities=8% Similarity=0.042 Sum_probs=90.9 Q ss_pred CccchhhcCHHHHHHHHHhhccchhhhHHH---HhCCCccccceeEE--EEE--eecCc--e--eeeeeeeC----CCCc Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTLQENVDSTLGE---SIFPARKQLGTKLS--YIK--GASGQ--S--VALKAAAF----DTNV 65 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~~~~~~~~l~~---~~Fp~~~~~~~~~~--~~~--~~~~~--~--~~a~~v~~----~~~~ 65 (348) |+. -++..-+.+|-.+. ..++.. +|-+.....+.... .++ +.... . ..+.-..+ +.|- T Consensus 13 Ms~---~i~~~fv~qy~~~v----~~~~qq~~s~L~~tV~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d~~~dtp~ 85 (322) T protein:vir:10 13 IAG---DIDQAFVQTYETTL----RILSQQKSAKLKQYCQHKNESSESHNWETLASMDPDAVKRKRSRQQSADGTYPTPV 85 (322) T ss_pred eec---hhhhHHHHHHHHHH----HHHHHHhhhhhhcccccccccccccceeecccccccccccccccccccCcccCCCc Confidence 443 12222233333322 222211 22222211110000 000 00000 0 00000001 1111 Q ss_pred ceecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeee Q lcl|Aclame:pro 66 TIRDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIA 145 (348) Q Consensus 66 ~~~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~ 145 (348) ....+ .....-+....-...++. +.+++...+.... ..+.....+.+++++ ...+++. |-.. T Consensus 86 ~~~~~---~~r~~~~~d~~~~~~VDd--~D~~k~~~D~~~~-~~~~~a~AL~R~~D~-----------~I~~a~~-g~a~ 147 (322) T protein:vir:10 86 NNKPF---AKRRTNVDTYDTGHVVEQ--EDISQMLLDPNSA-LITSQAYAMARKTDD-----------LIIAGAW-KPAS 147 (322) T ss_pred ccccc---ceEEEeecccccceecch--HHHHHhhcCchHH-HHHHHHHHhhhHHHH-----------HHHhhhh-cccc Confidence 01111 111111111112233333 3333433333222 222222333333332 2234443 3222 Q ss_pred ecCCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCee---EEEEeCHHHHHHHhcCHHHHHHhccc Q lcl|Aclame:pro 146 FTSDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNP---ERAIMNAKTFGLIRKAASTVKAIKPL 222 (348) Q Consensus 146 ~~~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~---~~~~~~~~~~~~l~~~~~v~~~~~~~ 222 (348) ..+.|.. | ..++.+.++.+ ....-.+.|.+..+.+++..... ..++++++.|+.|+..+++.+. +.. T Consensus 148 ~~~~gt~--v--~~~ss~~i~~g-----~~g~t~~kl~~a~~~l~~~dvp~d~~R~~vv~p~~~~~LL~d~~~ts~-D~~ 217 (322) T protein:vir:10 148 IKGTGQP--V--EFLATQEIGDG-----TKPISFDYVTEITERFLENEIEPEVSKVIVIGPTQARKLLQITEATSA-DYT 217 (322) T ss_pred ccccccc--c--ccCCCcccccC-----ccchhHHHHHHHHHHHHhcCCCCCCCeEEEeCHHHHHHHhcchhhhhh-hcc Confidence 2222222 2 12233333321 12445667888888887665542 3699999999999999888654 222 Q ss_pred CCCcccccHHHHHHHHHhhcCceEEEEeeEEEcCCCccccccc--------CCeEEEEeCCccceeEeccchhhhccccc Q lcl|Aclame:pro 223 AGDGSSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFP--------DGHLTLIPNGPLGNTVFGTTPEESDLFAD 294 (348) Q Consensus 223 ~~~~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~--------~~~vv~~p~~~~G~~~yg~~~~~~~~~~~ 294 (348) +.+ .-..+...+.+.|.+++.+..- +.++.+..... ...+++.....+|.-.. T Consensus 218 ~~~-----~l~~~G~ig~~lGf~~i~s~~l--p~~~~t~~~~~~~~~~~~~~~~~~a~~k~Av~~a~~------------ 278 (322) T protein:vir:10 218 SAM-----DLQSKGIITNWMGYTWIVSTRL--DKFDPTQWGMAAEDGPQGDEIWCIAMTDMALGYHSC------------ 278 (322) T ss_pred cch-----hhhhcCeeeeeeeEEEEEeccC--CccccccccccccCCCCccceeEEEEecCceeEEEe------------ Confidence 111 1111233445668888776532 11111111000 00111222111111100 Q ss_pred cccccceeecCCceEEEEeecCCCceeE---EeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 295 NTVNADVEIVDSGIAVTTTKTTDPVNVQ---TKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 295 ~~~~~~~~~~~~~~~~~~~~~~dP~~~~---~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .-++.....+|...+ +.+....=.+..+|+.++.+...=-. T Consensus 279 -------------~dv~~~i~~~~~~~~a~~I~~~~~~Ga~ri~~~gVv~i~~~e~~ 322 (322) T protein:vir:10 279 -------------KDIWTKVAEDPSASFAWRIYSAFTADCVRVEDEHIFKLRLKNSL 322 (322) T ss_pred -------------eeeeEEeeccCCcchhhhhhhhhhhCceEeccCcEEEEEEeccC Confidence 000111111111111 11111111223344444444443112 No 61 >protein:vir:97053 Length: 390 # NCBI annotation: putative head protein # Family: family:all:585 # MgeID: mge:1653 # MgeName: OP1 # Cross-refs: genbank:acc:YP_453565;genbank:gi:84662600;genbank:GeneID:5142468 Probab=43.90 E-value=0.83 Score=21.04 Aligned_cols=269 Identities=10% Similarity=0.076 Sum_probs=117.2 Q ss_pred Ccc----chh-hcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGL----IYD-KVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~----l~d-~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) +.. -.. ++.+..+..+++.+ ....+ +.+ +.+..++.......... ......+.++..+.+.+... ..+.. T Consensus 113 ~~~~~~~~~g~lip~~~~~~ii~~~-~~~~~-i~~-~~~~~~~~~~~~~~~~~-~~~~~~a~~v~Eg~~~~~~~-~~~~~ 187 (390) T protein:vir:97 113 ASTDAAGSAGALTTPNRLPGFITPP-DARLT-VRD-LIGSGRTDSALIEYVQE-TGFVNNAAIVAEGALKPESS-LKFAK 187 (390) T ss_pred hhcccccccccccchhhhHHHHHHH-hhhhh-hHh-hcceeeccCCceEEEEE-ecCCcceeeecCCccccccc-cceeE Confidence 110 001 12222233333322 22222 333 34444444433333322 22223567777776655443 45777 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce-eEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV-NKD 154 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~-~~~ 154 (348) .++.+-.++-...++.+ +.+ +. .. +...+ ...+.+++...++..+. +|- +.+. ... T Consensus 188 i~~~~~k~~~~~~is~e-ll~-----ds--~~----l~~~i---~~~la~a~~~~~d~a~l----~G~----g~~~~p~G 244 (390) T protein:vir:97 188 KTDTTHVIAHTMKATRQ-ILS-----DA--PQ----LASYM---NNRLIRGLKVKEDAEIL----RGT----GANDGLLG 244 (390) T ss_pred EEEeeeeEEEeehhhHH-HHH-----hH--HH----HHHHH---HHHHHHHHHHHHHHHHh----hcC----CCCccccc Confidence 77777777666656543 211 11 11 22222 23345566666664333 441 1111 111 Q ss_pred EeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHH Q lcl|Aclame:pro 155 IDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAEL 234 (348) Q Consensus 155 vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~ 234 (348) |-..- ... +. .-..++.+.+++|..+...+...+..+..++|++.+|.+|.+ +++.- +.....+ .. T Consensus 245 i~~~~-~~~--~~--~~~~~~~~~~d~~~~~~~~~~~~~~~~~~~v~n~~~~~~L~~---lkd~~-----G~~l~~~-~~ 310 (390) T protein:vir:97 245 LIPQA-TTY--AA--PTTIAGATRVDQLRLAMLQASLAEYPASGIVINPIDWAAIEL---AKDAN-----NQYLIGN-AR 310 (390) T ss_pred eeecc-ccc--cc--cccccccchHHHHHHHHHhhccccCCCCEEEEcHHHHHHHHH---hhcCC-----CceeecC-cc Confidence 10000 000 00 112234556778888777777777888899999999998863 33221 1111111 00 Q ss_pred HHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEee Q lcl|Aclame:pro 235 QNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTK 314 (348) Q Consensus 235 ~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 314 (348) ...-..+.|+++++.+ .+|++.+++..... +...+. ..++.+.... T Consensus 311 ~~~~~~l~G~pV~~~~------------~~~~~~~~~gd~~~-~~~~~~---------------------~~~~~i~~~~ 356 (390) T protein:vir:97 311 GTLTPTLWGLPVVATQ------------AMAPGEFLVGAFDL-AAQIFD---------------------QWDARVEIGY 356 (390) T ss_pred CCCCceecceeeEEcC------------CCCCCcEEEEeccc-eEEEEE---------------------ecceEEEEee Confidence 1011123466665432 24566666554322 111110 0111111111 Q ss_pred cCC---CceeEEeeeeeeeeeecCCCcEEEEEEe Q lcl|Aclame:pro 315 TTD---PVNVQTKVSMVALPSFERLGDVYMLTVI 345 (348) Q Consensus 315 ~~d---P~~~~~~~~s~~lPv~~~~~~~~~~~V~ 345 (348) +.+ -.....++..+.=-.+.+|+++++++.= T Consensus 357 ~~~~f~~~~~~~r~~~r~d~~v~~~~a~v~~~~a 390 (390) T protein:vir:97 357 VNDDFQRNMVTVLAEERLALVVYRPEALITGSFA 390 (390) T ss_pred cccccccCcEEEEEEEeeccEEeccccEEEEEeC Confidence 100 1123344555555566678888777766 No 62 >protein:vir:7771 Length: 330 # NCBI annotation: gp17 # Family: family:all:507 # MgeID: mge:149 # MgeName: Bxz2 # Cross-refs: genbank:acc:NP_817605;genbank:gi:29566035;genbank:GeneID:1259229 Probab=38.97 E-value=1 Score=20.49 Aligned_cols=295 Identities=10% Similarity=0.027 Sum_probs=124.2 Q ss_pred Cccc---------h----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcce Q lcl|Aclame:pro 1 MGLI---------Y----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTI 67 (348) Q Consensus 1 Ma~l---------~----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~ 67 (348) |+.. . .++.+.....+++.+. .. +.+++ +.+..++........... +. ..|.++..+.+.+. T Consensus 1 m~~~~~~a~~~~~t~~~g~~i~~~~~~~ii~~~~-~~-s~l~~-~~~~~~~~~~~~~~p~~~-~~-~~a~~v~Eg~~~~~ 75 (330) T protein:vir:77 1 MAGSTVPSTQVALTGDFSAFLTPEQSQDYFAEIE-KT-SIVQR-IARKVPMGPTGISIPHWT-GA-VSASWTGEAERKPI 75 (330) T ss_pred CcccccchhhccccCCCcceechhHHHHHHHHHH-hc-cchhh-hcceeeccCCceEEEEEc-CC-cceeEecCCCcccc Confidence 4432 1 1222333334444332 22 22333 455555544444433222 22 23567777666654 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) .. ..+....+.+-++.-...++.+-+ .+. ..+ +...+ ...+.+++.+.+|..++ +|- T Consensus 76 ~~-~~f~~i~~~~~k~~~~~~is~ell------~ds-~~~----~~~~i---~~~l~~ai~~~~~~~~l----~G~---- 132 (330) T protein:vir:77 76 TK-GSFGKQELEPVKITTIFAESAEVV------RLN-PLN----YLNTM---RTKIAEAIALKFDAAAI----HGI---- 132 (330) T ss_pred cc-ceeeEEEEeEEEEEEeehhhHHHH------hcc-hHH----HHHHH---HHHHHHHHHHHHHHHhh----ccc---- Confidence 43 456666666666665555554321 111 111 12222 23345556666664333 342 Q ss_pred CCcee-EEEeeccCccceee--eeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCC Q lcl|Aclame:pro 148 SDGVN-KDIDYGVKADHKKQ--VSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAG 224 (348) Q Consensus 148 ~~~~~-~~vDfg~~~~~~~t--~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~ 224 (348) +.+.. ..+--+....+... .....+..+.+.+.||..+...+...+..+...+|++.+|..|++ +++.-. T Consensus 133 g~~~~~~g~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l~~~~~~~~~~~~~~~~~vmn~~~~~~l~~---lkd~~G---- 205 (330) T protein:vir:77 133 DKPSAFKGYLAETTKVVSLADTNLTTASGPQGNAYLAVNNALSLLVNSGKKWTGTLLDNVTEPILNT---AVDGNG---- 205 (330) T ss_pred CCCCccccccccccccceeecccccccccccchhHHHHHHHHHhhhhcCCCccEEEEcHHHHHHHHH---HhccCC---- Confidence 11111 11101111111111 112344456778899999888887777778889999999988754 222211 Q ss_pred CcccccHHHHH----H-HHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEecc----chhhhcccccc Q lcl|Aclame:pro 225 DGSSVTKAELQ----N-YVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGT----TPEESDLFADN 295 (348) Q Consensus 225 ~~~~~~~~~~~----~-~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~----~~~~~~~~~~~ 295 (348) .....+.... . .-..+.|+++++.+.- .+ ++.. ...++++.+-. ..++|. ..+..+. T Consensus 206 -~~l~~~~~~~~~~~~~~~~~l~G~PV~~~~~~-p~--~~~~----~~~~~~~gd~s--~~~i~~~~~~~i~~~~e---- 271 (330) T protein:vir:77 206 -RPLFVESTYTEQVGAIREGRILGRPTYVADNV-VN--GTVG----NRVVGVMGDFS--QVIWGQIGGLSFDVTDQ---- 271 (330) T ss_pred -ceeecCccccccccccCCceecceeeEEeccc-cC--CCCC----CccEEEEEecc--eEEEEEecCcEEEEeec---- Confidence 1111110000 0 0012346677655432 11 1110 01112221110 011111 0000000 Q ss_pred ccccceeecC----CceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 296 TVNADVEIVD----SGIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 296 ~~~~~~~~~~----~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+....... .+..+..|.+ ....+++..+.=..+.+|+++.+++..+.. T Consensus 272 -~~~~~~~~~~~~~~~~~~~~f~~---~~~~~r~~~r~d~~v~~~~a~~~i~~~~~~ 324 (330) T protein:vir:77 272 -ATLDFGEEQGGVWVPKLISLWQH---NMVAVRCEAEFAFMVNDKDAFVKLTDQVAG 324 (330) T ss_pred -ceeeecccccccccccccchhhc---CcEEEEEEEEeccEEecccceEEEEeccCC Confidence 000000000 0000111211 235566666766778889999999877544 No 63 >protein:vir:4997 Length: 397 # NCBI annotation: major head protein # Family: family:all:21 # MgeID: mge:109 # MgeName: Sfi21 # Cross-refs: genbank:acc:NP_049971;genbank:gi:9632943;genbank:GeneID:1262106 Probab=37.45 E-value=1.1 Score=20.32 Aligned_cols=268 Identities=11% Similarity=-0.029 Sum_probs=112.8 Q ss_pred Cccch----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccc--eeEEEEEeecCceeeeeeeeCCCCcceeccccee Q lcl|Aclame:pro 1 MGLIY----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLG--TKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAE 74 (348) Q Consensus 1 Ma~l~----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~--~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~ 74 (348) |..-. .++=|.++..-|.+......+ |++ +.+..++.. ..+.+.... .....|.++..+...+-.....+. T Consensus 109 ~~~~t~~~gg~~iP~~~~~~ii~~~~~~~~-l~~-~~~~~~~~~~~~~~~~~~~~-~~~~~a~~v~E~~~~~~~~~~~~~ 185 (397) T protein:vir:49 109 KTDGSGSDAGLTIPQDIRTAINTLVRQFDS-LQE-YVNVENVTTLTGSRVYEKWA-DITGLAKLDDEGGQIGQNDDPKLS 185 (397) T ss_pred hhccCCccCcceecHHHHHHHHHHHHhhhh-Hhh-hcceeeccCCcceEEEEeec-cCCcceeeecccccccccccccee Confidence 22110 122244444434333333332 322 222222222 222222221 122345677766665544444566 Q ss_pred eeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEE Q lcl|Aclame:pro 75 IHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKD 154 (348) Q Consensus 75 ~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~ 154 (348) ...+.+-.+.....++.+=+. +.. . .+...+ ...+..++.+.++..++ +|- +.+. T Consensus 186 ~v~~~~~k~~~~~~iS~ell~------ds~-~----~l~~~i---~~~l~~~~~~~~d~ail----~G~----g~~~--- 240 (397) T protein:vir:49 186 LIRYAIKRYAGISTVTNSLLA------DSA-E----NILAWL---SGWIAKKVVVTRNKAIL----EAI----GTLP--- 240 (397) T ss_pred eeEeeeeeeEeehhhHHHHHh------hhh-H----HHHHHH---HHHHHHHHHHHHHHHHH----hcc----cccc--- Confidence 667777666666555543211 110 0 112222 23345555556654443 331 1110 Q ss_pred EeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHH Q lcl|Aclame:pro 155 IDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAEL 234 (348) Q Consensus 155 vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~ 234 (348) + .++....+||..+...+...+..+..++|++..|..|.+ +++. + +...+.+... T Consensus 241 --------~---------~~~~~~~d~i~~~~~~l~~~~~~~a~~v~n~~~~~~l~~---lkd~----~-g~~l~~~~~~ 295 (397) T protein:vir:49 241 --------N---------KPTLAKWDDIIDLQAKVDPAIKQTSLFLTNTSGFTALKK---VKNA----M-GDYLMERDVK 295 (397) T ss_pred --------c---------cccccCHHHHHHHHHhhhhhhcCCCEEEEcHHHHHHHHH---hhcc----C-Cceeeccccc Confidence 0 112223456666666666666678889999999987754 2221 1 1111111111 Q ss_pred HHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEE--E Q lcl|Aclame:pro 235 QNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVT--T 312 (348) Q Consensus 235 ~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~--~ 312 (348) ...-..+.|.++++.+..+.. +++. ++..++|..-.. +.. ++. ..++-+. . T Consensus 296 ~g~~~~l~G~pV~~~~~~~~~-~~~~----~~~~~~~gd~~~-~~~-~~~--------------------~~~~~i~~~~ 348 (397) T protein:vir:49 296 SPTGYSIDGFVVKEISDRFLP-NGTG----GAMPLYFGDLKQ-AVT-LFD--------------------RQHLSLLSTN 348 (397) T ss_pred CCCCceecceeeEEecccccc-cccC----CceeEEEeeccc-eEE-EEe--------------------ecccEEEEec Confidence 111123456666665543321 1110 111122221110 000 000 0000000 0 Q ss_pred ee--cCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 313 TK--TTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 313 ~~--~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) +. ...-......+..+.=..+.+|++++++++.+.+ T Consensus 349 ~~~~~~~~~~~~~~~~~r~d~~~~~~~a~~~~~~~~~~ 386 (397) T protein:vir:49 349 IGGGAFETDTTKVRVIDRFDVVSTDTEAFVPASFKAIA 386 (397) T ss_pred cccchhhcCeeeEEEEEeeccEEecccceEEEEecccc Confidence 00 0001134455556666677889999999999888 No 64 >protein:vir:105905 Length: 304 # NCBI annotation: major capsid protein # Family: family:all:507 # MgeID: mge:1514 # MgeName: phiETA3 # Cross-refs: genbank:acc:YP_001004375;genbank:gi:122891830;genbank:GeneID:4712376 Probab=34.81 E-value=1.3 Score=20.02 Aligned_cols=281 Identities=9% Similarity=0.023 Sum_probs=123.2 Q ss_pred Cccch------------hhcCHHHHH-HHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcce Q lcl|Aclame:pro 1 MGLIY------------DKVTASNIA-GYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTI 67 (348) Q Consensus 1 Ma~l~------------d~f~~~~l~-~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~ 67 (348) ||.-. ...=|.++. .+++.+. ...+ +.+ +.+..++.+........ .+. ..+.+++.+++.+. T Consensus 1 ma~~~~~~~~~~~t~~gg~lip~~~~~~ii~~~~-~~~~-l~~-~~~~~~~~~~~~~ip~~-~~~-~~a~~v~E~~~~~~ 75 (304) T protein:vir:10 1 MATPTYTPGNVILSDFKNGVIPAEQGTLIMKDIM-ANSA-IMK-LAKNEPMTAQKKKFTYL-AKG-VGAYWVSETERIQT 75 (304) T ss_pred CcccccccccccccCCCceecchhHHHHHHHHHH-hccc-hhh-hcceeeccCCceEEEEE-eCC-cceEEeecCccccc Confidence 55321 112223333 3333332 2222 333 34444444333332222 222 23577777776665 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) .. ..++...+++-++.-...++.+ ++ .++. .+ +...+ ...+.+++.+.+|..+. +|.=.-. T Consensus 76 ~~-~~~~~i~~~~~k~~~~~~iS~e-ll-----~ds~-~~----l~~~i---~~~l~~~ia~~~d~~~l----~G~g~~~ 136 (304) T protein:vir:10 76 SK-PEYAQAEMEAKKIGVIIPLSKE-FL-----KWTA-KD----FFNEV---KPLIAEAFYKAFDQAVI----FGTKSPY 136 (304) T ss_pred cc-ceeeEEEEEEEEEEEeehhhHH-HH-----hcch-HH----HHHHH---HHHHHHHHHHHHHhhhe----eccCCCc Confidence 43 5677777777666666666542 21 1111 11 22222 23345566666665543 2311000 Q ss_pred CCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS 227 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~ 227 (348) ..+. .........+........+.+.++||.++...+...+..+..++|++..|..|++ +++.- ... T Consensus 137 ~~~~-----~~~~~~~~~~~~~~~~~~~~~~~~~i~~~~~~l~~~~~~~~~~v~~~~~~~~L~~---lkd~~-----G~~ 203 (304) T protein:vir:10 137 NTST-----SGKPLVEGAEEKGNVVTDTNNLYVDLSALMATIEDEELDPNGVLTTRSFRSKMRN---ALDAN-----DRP 203 (304) T ss_pred cccc-----ccccccccccccccccccccchHHHHHHHHHHhhhccCCcCEEEEcHHHHHHHHH---hhccC-----CcE Confidence 0000 0000001111222333445667899999888888777788889999999998863 33221 111 Q ss_pred cccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCc Q lcl|Aclame:pro 228 SVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSG 307 (348) Q Consensus 228 ~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~ 307 (348) .+.+. -+.+.|+++++.+.--. +. ++..++|.-... ..+|.--. ..+..... T Consensus 204 l~~~~-----~~~l~G~PV~~~~~~~~--~~------~~~~~~~gd~~~---~~~~~~~~-----------~~i~~~~e- 255 (304) T protein:vir:10 204 LFDAN-----GNEIMGLPLSYTGADVY--DK------KKSLALMGDWDY---ARYGILQG-----------IEYAISED- 255 (304) T ss_pred eecCC-----CccccceeeEEeccccc--CC------CCcEEEEEehhh---EEEEEecc-----------eEEEEeec- Confidence 11111 12345777765443211 11 111223222111 11211000 00000000 Q ss_pred eEEEEeecCCCc----------eeEEeeeeeeeeeecCCCcEEEEEEec Q lcl|Aclame:pro 308 IAVTTTKTTDPV----------NVQTKVSMVALPSFERLGDVYMLTVIP 346 (348) Q Consensus 308 ~~~~~~~~~dP~----------~~~~~~~s~~lPv~~~~~~~~~~~V~~ 346 (348) ..+......|+. ....++..+.=..+.+|++++++|..= T Consensus 256 ~~~~~~~~~~~~g~~~~~f~~~~~~~r~~~r~~~~v~~~~a~~~l~~a~ 304 (304) T protein:vir:10 256 ATLTTLQASDASGQPVSLFERDMFALRATMHIAYMNVKPEAFATLKPTE 304 (304) T ss_pred ceeeeecccccCccchhhhhcCcEEEEEEEEeccEeecccceEEEEecC Confidence 001111111111 344566666667778899998887766 No 65 >protein:vir:94142 Length: 304 # NCBI annotation: ORF013 # Family: family:all:507 # MgeID: mge:1494 # MgeName: 96 # Cross-refs: genbank:acc:YP_240234;genbank:gi:66395898;genbank:GeneID:5133311 Probab=34.81 E-value=1.3 Score=20.02 Aligned_cols=281 Identities=9% Similarity=0.023 Sum_probs=123.2 Q ss_pred Cccch------------hhcCHHHHH-HHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcce Q lcl|Aclame:pro 1 MGLIY------------DKVTASNIA-GYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTI 67 (348) Q Consensus 1 Ma~l~------------d~f~~~~l~-~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~ 67 (348) ||.-. ...=|.++. .+++.+. ...+ +.+ +.+..++.+........ .+. ..+.+++.+++.+. T Consensus 1 ma~~~~~~~~~~~t~~gg~lip~~~~~~ii~~~~-~~~~-l~~-~~~~~~~~~~~~~ip~~-~~~-~~a~~v~E~~~~~~ 75 (304) T protein:vir:94 1 MATPTYTPGNVILSDFKNGVIPAEQGTLIMKDIM-ANSA-IMK-LAKNEPMTAQKKKFTYL-AKG-VGAYWVSETERIQT 75 (304) T ss_pred CcccccccccccccCCCceecchhHHHHHHHHHH-hccc-hhh-hcceeeccCCceEEEEE-eCC-cceEEeecCccccc Confidence 55321 112223333 3333332 2222 333 34444444333332222 222 23577777776665 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) .. ..++...+++-++.-...++.+ ++ .++. .+ +...+ ...+.+++.+.+|..+. +|.=.-. T Consensus 76 ~~-~~~~~i~~~~~k~~~~~~iS~e-ll-----~ds~-~~----l~~~i---~~~l~~~ia~~~d~~~l----~G~g~~~ 136 (304) T protein:vir:94 76 SK-PEYAQAEMEAKKIGVIIPLSKE-FL-----KWTA-KD----FFNEV---KPLIAEAFYKAFDQAVI----FGTKSPY 136 (304) T ss_pred cc-ceeeEEEEEEEEEEEeehhhHH-HH-----hcch-HH----HHHHH---HHHHHHHHHHHHHhhhe----eccCCCc Confidence 43 5677777777666666666542 21 1111 11 22222 23345566666665543 2311000 Q ss_pred CCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS 227 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~ 227 (348) ..+. .........+........+.+.++||.++...+...+..+..++|++..|..|++ +++.- ... T Consensus 137 ~~~~-----~~~~~~~~~~~~~~~~~~~~~~~~~i~~~~~~l~~~~~~~~~~v~~~~~~~~L~~---lkd~~-----G~~ 203 (304) T protein:vir:94 137 NTST-----SGKPLVEGAEEKGNVVTDTNNLYVDLSALMATIEDEELDPNGVLTTRSFRSKMRN---ALDAN-----DRP 203 (304) T ss_pred cccc-----ccccccccccccccccccccchHHHHHHHHHHhhhccCCcCEEEEcHHHHHHHHH---hhccC-----CcE Confidence 0000 0000001111222333445667899999888888777788889999999998863 33221 111 Q ss_pred cccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCc Q lcl|Aclame:pro 228 SVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSG 307 (348) Q Consensus 228 ~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~ 307 (348) .+.+. -+.+.|+++++.+.--. +. ++..++|.-... ..+|.--. ..+..... T Consensus 204 l~~~~-----~~~l~G~PV~~~~~~~~--~~------~~~~~~~gd~~~---~~~~~~~~-----------~~i~~~~e- 255 (304) T protein:vir:94 204 LFDAN-----GNEIMGLPLSYTGADVY--DK------KKSLALMGDWDY---ARYGILQG-----------IEYAISED- 255 (304) T ss_pred eecCC-----CccccceeeEEeccccc--CC------CCcEEEEEehhh---EEEEEecc-----------eEEEEeec- Confidence 11111 12345777765443211 11 111223222111 11211000 00000000 Q ss_pred eEEEEeecCCCc----------eeEEeeeeeeeeeecCCCcEEEEEEec Q lcl|Aclame:pro 308 IAVTTTKTTDPV----------NVQTKVSMVALPSFERLGDVYMLTVIP 346 (348) Q Consensus 308 ~~~~~~~~~dP~----------~~~~~~~s~~lPv~~~~~~~~~~~V~~ 346 (348) ..+......|+. ....++..+.=..+.+|++++++|..= T Consensus 256 ~~~~~~~~~~~~g~~~~~f~~~~~~~r~~~r~~~~v~~~~a~~~l~~a~ 304 (304) T protein:vir:94 256 ATLTTLQASDASGQPVSLFERDMFALRATMHIAYMNVKPEAFATLKPTE 304 (304) T ss_pred ceeeeecccccCccchhhhhcCcEEEEEEEEeccEeecccceEEEEecC Confidence 001111111111 344566666667778899998887766 No 66 >protein:vir:81227 Length: 413 # NCBI annotation: gp6, major capsid protein # Family: family:all:585 # MgeID: mge:1893 # MgeName: BFK20 # Cross-refs: genbank:acc:YP_001456736;genbank:gi:157168379;hssp:P49861;interpro:IPR006444;uniprot:Q9MBJ9;genbank:GeneID:5580350 Probab=34.72 E-value=1.3 Score=20.01 Aligned_cols=279 Identities=11% Similarity=0.071 Sum_probs=113.2 Q ss_pred CccchhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEE--eecCceeeeeeeeCCCCcceecccceeeeEe Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIK--GASGQSVALKAAAFDTNVTIRDRVSAEIHDE 78 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~--~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~ 78 (348) ...-....-+.++..-|-+...... -+. .+++..++......+.. ........+.++..++..+-..-..+....+ T Consensus 122 ~~~~~~~~vp~~~~~~ii~~~~~~~-~l~-~~~~~~~~~~~~~~~~~~~~~~~~~~~a~~v~Eg~~~~~~~~~~f~~i~~ 199 (413) T protein:vir:81 122 LTDEFQGGYGTTWNRNIIYRRREKL-VVA-DLMDNLTMTNTTIKYLMEKANRVVEGGFKTVAEGGKKPYMRFADFDIVTE 199 (413) T ss_pred cccccccccchhhHHHHHHHHhhhh-hHH-hhcceeeccCCceeEEEeccccccccccceecCcccccccCcccceeeEe Confidence 0000011112223322222222222 232 34554444443333222 1111112345666665555444445666677 Q ss_pred eccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCcee-EEEee Q lcl|Aclame:pro 79 QMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVN-KDIDY 157 (348) Q Consensus 79 ~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~-~~vDf 157 (348) .+-.++-...++.+ +++ +. .. +...+ ...+..++.+.+|..++ +|. +.+.. ..| + T Consensus 200 ~~~k~~~~~~iS~e-ll~-----ds--~~----l~~~i---~~~la~~~~~~~d~~~l----~G~----G~~~~~~Gi-~ 255 (413) T protein:vir:81 200 SLSKIAGLTKITDE-MIE-----DY--DF----LVSYI---NARLLEELAIEEERQLL----LGD----GTGNNLTGL-L 255 (413) T ss_pred eeeeEEEeehhhHH-HHH-----HH--HH----HHHHH---HHHHHHHHHHHHHHHHh----ccC----CCCCccccc-c Confidence 66666666666543 211 11 11 22233 23345566666665433 342 11111 011 0 Q ss_pred ccCccceeeeeecCCCCCccHHHHHHHHHHHHH-hcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH- Q lcl|Aclame:pro 158 GVKADHKKQVSKSWAEPGATPLADLEDAIETAR-ELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ- 235 (348) Q Consensus 158 g~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~-~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~- 235 (348) .. ....+. ....+.+.+++|......+. ..++.++.++|++.+|..|++ +++.- ++..-...+...... T Consensus 256 ~~--~~~~~~---~~~~~~~~~~~i~~~~~~~~~~~~~~~~~~vmn~~~~~~l~~---lkd~~-G~~l~~~~~~~~~~~~ 326 (413) T protein:vir:81 256 KR--DGIQTL---AVSNKDELADSIYKAMTNISLATPFQADALVINPLDYQELRL---AKDAN-GQYYGGGVFQGQYGSG 326 (413) T ss_pred cc--cccccc---cccccchhHHHHHHHHHHhhhhccCCCcEEEEcHHHHHHHHH---hhccC-Cceecccccccccccc Confidence 00 001111 11123345666666655544 456777789999999987742 22221 000000000000000 Q ss_pred --HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEe Q lcl|Aclame:pro 236 --NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTT 313 (348) Q Consensus 236 --~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 313 (348) ..-....|.++++.+ .+|++.++|.-... +...+ . ..++.+..- T Consensus 327 ~~~~~~~l~G~pv~~s~------------~~~~~~~~~gd~~~-~~~~~--~-------------------~~~~~v~~~ 372 (413) T protein:vir:81 327 GIMLDPAPWGLRTVQSQ------------VVPVGKPVVGAFRS-AASVL--R-------------------KGGVRIDST 372 (413) T ss_pred ccccCceecceeeEEcC------------CCCcccEEEEeccc-EEEEE--E-------------------ecceEEEEe Confidence 000123355554322 23555555543221 11111 0 001111110 Q ss_pred ecCC----CceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 314 KTTD----PVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 314 ~~~d----P~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+.. -......+..+.=..+.+|+++.++++.+-| T Consensus 373 ~~~~~~~~~~~~~~r~~~r~d~~~~~~~a~~~l~~~~~~ 411 (413) T protein:vir:81 373 NTNVDDFENNLITVRAEERVGLMVTFPEAIVQLDVAEVV 411 (413) T ss_pred ccccchhhcCcEEEEEEEeeccEEecccceEEEEecCCC Confidence 0000 0133455555666777889999999998888 No 67 >protein:vir:41 Length: 299 # NCBI annotation: major capsid protein # Family: family:all:507 # MgeID: mge:2 # MgeName: A118 # Cross-refs: genbank:acc:NP_463467;swissprot:trembl:q9t1b7;genbank:gi:16798789;uniprot:Q9T1B7;genbank:GeneID:922353 Probab=31.67 E-value=1.5 Score=19.65 Aligned_cols=289 Identities=10% Similarity=-0.006 Sum_probs=124.8 Q ss_pred Cccc-----hhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGLI-----YDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~l-----~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) |... --++.+.....+++.+.. . +-+.+ +.+..++.......... . . ..|.++..+.+.+..+ ..++. T Consensus 6 ~~~~~~~~~~~~iP~~~~~~ii~~~~~-~-s~l~~-~~~~~~~~~~~~~~~~~-~-~-~~a~~v~E~~~~~~~~-~~f~~ 78 (299) T protein:vir:41 6 DTTTMQSAKTGSIPINISEQIITGVKN-G-SAAMK-LAKAVPMTKPEEEFTFM-S-G-VGAFWVDEAERIQTSK-PTFTK 78 (299) T ss_pred CcccccCCCceecchhHHHHHHHHHHh-c-chhhh-hceeeecCCCcEEEEEE-c-C-CceeeeecCccccccc-cceeE Confidence 2211 112333333444444332 2 22333 34444444444433322 2 1 3467888877766544 66777 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-+++-...++.+=++ ++. .+. ...+ ...+.+++.+.+|. ++.+|.-+ +... T Consensus 79 v~l~~~k~~~~~~is~ell~------ds~-~~~----~~~i---~~~l~~a~~~~~d~----a~l~G~g~----~~~~-- 134 (299) T protein:vir:41 79 AKMRSKKMGVIIPTTKENLN------YSV-TNF----FSLM---QAEIVEAFYKKFDQ----AVFTGVES----PYNW-- 134 (299) T ss_pred EEEeeEEEEEeehhhHHHHh------cCH-HHH----HHHH---HHHHHHHHHHHHHH----HHhhcccC----cccc-- Confidence 77777777777777653221 111 111 1222 23344555566653 33345321 1111 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) |.-.. .+.+.....++.+.++||.++...+...+..+...+|++..|.+|++ +++. . ......+.. . T Consensus 135 --gil~~--~~~~~~~~~~~~~~~~~l~~~~~~l~~~~~~~~~~v~n~~~~~~L~~---lkd~---~--G~~l~~~~~-~ 201 (299) T protein:vir:41 135 --NILKS--ATDASNLVEETANKYDDLNEAIGLIEAEDLEPNGIATIRKQRVKYRS---TKDG---N--GMPIFNTAT-S 201 (299) T ss_pred --ccccc--ccccceeeccccccHHHHHHHHHhhhcccCCcCEEEEcHHHHHHHHH---hhcc---C--CceeecCCc-C Confidence 11100 01111112334567888998888887778888899999999998764 2222 1 111111100 0 Q ss_pred HHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeec Q lcl|Aclame:pro 236 NYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKT 315 (348) Q Consensus 236 ~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 315 (348) .--..+.|.++++.+.. . .|+.. ..++|..... ..+|.--+ .........+........+.....|.+ T Consensus 202 ~~~~~l~G~PV~~~~~~-~--~~~~~-----~~~~~gdfs~---~~i~~~~~-~~i~~~~~~~~~~~~~~~~~~~~~~~~ 269 (299) T protein:vir:41 202 NGVDDVLGLPIAYTPKY-T--FGDKD-----ISELVGDWNQ---AYYGILRG-VEYEILTEATLTTVADETGKPLNLAER 269 (299) T ss_pred CCCceecceeeEEeccc-C--CCCCc-----eEEEEEeccc---EEEEEecC-cEEEEeecccccccccccccchhhhhc Confidence 00113446677665432 1 11110 0122221111 11111000 000000000000000000111111211 Q ss_pred CCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 316 TDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 316 ~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ....+++..+.=..+.+|+++.++|.-+.= T Consensus 270 ---~~~~~r~~~~~d~~v~~~~A~~~l~~~aa~ 299 (299) T protein:vir:41 270 ---DMAAIKATFEVGFMVVKDEAFSAVQPKAGN 299 (299) T ss_pred ---CcEEEEEEEEeccEEecccceEEEEeccCC Confidence 124455666666778889999999888666 No 68 >protein:vir:1583 Length: 351 # NCBI annotation: minor capsid protein # Family: family:all:1522 # MgeID: mge:32 # MgeName: phig1e # Cross-refs: genbank:acc:NP_695165;swissprot:trembl:o03966;genbank:gi:23455804;uniprot:O03966;genbank:GeneID:955561 Probab=29.26 E-value=1.7 Score=19.36 Aligned_cols=304 Identities=13% Similarity=0.074 Sum_probs=112.2 Q ss_pred Ccc--chhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCC-CCcc-eec-----cc Q lcl|Aclame:pro 1 MGL--IYDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFD-TNVT-IRD-----RV 71 (348) Q Consensus 1 Ma~--l~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~-~~~~-~~~-----r~ 71 (348) ||. |.|+|.|..+..|+.+.......|+.+...- ..-++...-...|..+..|+..+- .... +.+ -+ T Consensus 1 MA~T~lsd~i~PEvf~~yv~~~~~~~~~l~qSG~i~----~~~~l~~~~~~~G~~it~P~~~~l~Gd~~~~~~~~~i~~~ 76 (351) T protein:vir:15 1 MAETHLSDLIVPEVFGNYVVNQIIKTNRFVQSGILT----PDPDLGPHLLEAGTRITVPFLNDLTGDPDNWTDSDDIDVN 76 (351) T ss_pred CCceeeeeeechhHHHHHHhhhhHHhhhHhhccccc----ccHHHHHHhhcCCCEEEecccccCCCcccccCCCcccchh Confidence 996 5799999999999976432222332221111 000000000012333333443321 1111 111 11 Q ss_pred ceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce Q lcl|Aclame:pro 72 SAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV 151 (348) Q Consensus 72 ~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~ 151 (348) ..++..-.-..++..+...+.|+-.+. ..+ ..+..+.+++ ...+.++.+.+....|. |.+.... T Consensus 77 kitt~~~~a~i~~~~kg~~~tD~a~~~---sg~--dp~~~i~~q~-------a~~w~~~~q~~lla~l~-gv~~~~~--- 140 (351) T protein:vir:15 77 NLTSGKQQGIKFYQTKAYGYTDLGTMI---SGA--PVQETIGNRF-------AAFWQRADQKTLLSVLK-GVMGVTK--- 140 (351) T ss_pred eecccceeEEEEeeccceehhhhhHhh---ccc--hHHHHHHHHH-------HHHHHHHHHHHHHHHHH-HHhhchh--- Confidence 111111111222233445566654332 222 2233333333 34444555555555553 4332111 Q ss_pred eEEEeeccCccceeeeeecCCCCCccHH---HHHHHHHHHHHh-cCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc Q lcl|Aclame:pro 152 NKDIDYGVKADHKKQVSKSWAEPGATPL---ADLEDAIETARE-LGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS 227 (348) Q Consensus 152 ~~~vDfg~~~~~~~t~~~~W~~~~adp~---~di~~~~~~~~~-~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~ 227 (348) ....|....+.. ++++.. ..|......+-+ .+-....++|.+.++..|+++. ..+.+....++. T Consensus 141 -------~~~~~~~d~t~~---~~~~~~is~~~l~~A~~~~GD~~~~~~~~ivmhS~v~~~L~~~~-li~~~~~s~~~~- 208 (351) T protein:vir:15 141 -------IANSKVYDQTKV---SPSEPMFGAKGFTGAIGLMGDLQDTAFGAIAVNSATYSLMKVQG-LIETIQPQNGAT- 208 (351) T ss_pred -------hcccceeccccc---cccccccCHHHHHHHHHHhccccccceEEEEEChHHHHHHHhhh-hhhhccccccCc- Confidence 111222222111 111111 223333333423 2334788999999999998764 444444332211 Q ss_pred cccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhh-hcccccccc-ccceee-c Q lcl|Aclame:pro 228 SVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEE-SDLFADNTV-NADVEI-V 304 (348) Q Consensus 228 ~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~-~~~~~~~~~-~~~~~~-~ 304 (348) -++.+.|.+|++=|.-=.+..+... ...+.+++..+.+|..-=++..|. .++..+... ....+. . T Consensus 209 ---------~i~t~~G~~VivdD~~p~~~~~~~~---~~ytsyl~~~GAi~~~~~~~~ve~~rd~~~~~g~d~l~~r~~~ 276 (351) T protein:vir:15 209 ---------PFEAYNGLRIVLDDDIEIDLTDKTK---PVSTSYIFAPGAVRYSTNMRSTETKYDPLINGGQDVIVQKRVG 276 (351) T ss_pred ---------ccceecceEEEEcCCCccccCCCCC---ceeEEEEEecceeeeecCCcCcceeecccCCCCceEEEEeeee Confidence 1455667777664432111111000 011233443443331111111111 111111110 000000 0 Q ss_pred CCceEEEEeec-------CCCceeEEeeeeeeeeee-cCCCcEEEEEEecCC Q lcl|Aclame:pro 305 DSGIAVTTTKT-------TDPVNVQTKVSMVALPSF-ERLGDVYMLTVIPGV 348 (348) Q Consensus 305 ~~~~~~~~~~~-------~dP~~~~~~~~s~~lPv~-~~~~~~~~~~V~~~~ 348 (348) -.+..-..|.. ..|....+...+.+=.|= .++..|-++.+.--. T Consensus 277 ~~hp~G~s~~~~~~~~~~~sPt~~~L~~~~NW~~v~~~d~k~I~iv~~~~~~ 328 (351) T protein:vir:15 277 TIHVAGTSIKASFSPSKASFPTIDELAKSSTWEVVDGIDVRSIGVVAYTAQL 328 (351) T ss_pred eeeeeeeeecccccccCcCCcChHHhcCCcccccccCCCccccceEEEEEec Confidence 01122234431 124444333333333331 234444444332111 No 69 >protein:vir:104342 Length: 314 # NCBI annotation: hypothetical protein # Family: family:all:463 # MgeID: mge:1593 # MgeName: RTP # Cross-refs: genbank:acc:YP_398971;genbank:gi:81343955;genbank:GeneID:3778874 Probab=28.26 E-value=1.8 Score=19.23 Aligned_cols=277 Identities=11% Similarity=0.111 Sum_probs=118.2 Q ss_pred Cccch--hhcCHHHHHHHHHhhc-cchhhhHHHHhCCCccccce---eEEEEEeecCceeeeeeeeCCCCc-ceecccce Q lcl|Aclame:pro 1 MGLIY--DKVTASNIAGYFNTLQ-ENVDSTLGESIFPARKQLGT---KLSYIKGASGQSVALKAAAFDTNV-TIRDRVSA 73 (348) Q Consensus 1 Ma~l~--d~f~~~~l~~~i~~~~-~~~~~~l~~~~Fp~~~~~~~---~~~~~~~~~~~~~~a~~v~~~~~~-~~~~r~~~ 73 (348) .++.. -.|...+|+.+-+.+- .+.+++-..++||....-+. .+.+. ... ..-.+...+..+.. |..+ -.+ T Consensus 21 ~~~~d~~~~fl~~ql~~id~~v~e~~~~~~~~~~~i~v~~~~~~~~et~~~~-~~e-~~G~a~~~~d~~~dip~vd-~~~ 97 (314) T protein:vir:10 21 VEKADAAGIWAVSQLTAALNRAYEKEYAENSVVNIFPVTNEIPGHAKYFEYP-EFD-GVGIAQIIADYSDDLPLVD-AFM 97 (314) T ss_pred ccchhhhHHHHHHHHHHHHHHHhhhhccccccceeeccccCCCCceeEEEee-eec-cccceeeeCCcccccceee-ccc Confidence 11111 1566666665433222 13445667788886532211 11111 111 11234444444432 3333 234 Q ss_pred eeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce-- Q lcl|Aclame:pro 74 EIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV-- 151 (348) Q Consensus 74 ~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~-- 151 (348) +....++..++.....+..|+..-+..+..-... ......++++.++ -++.+.|+.. T Consensus 98 ~~~~~~i~~~~~~~~~~~~El~~a~~~g~~l~~~-----------k~~aA~~~~~~~~----------n~i~f~G~~~~g 156 (314) T protein:vir:10 98 TEKQGKVFRFGNAFLISTDEIKAGAATGQSLSAR-----------KQALAFEAHDNLL----------DKLVWSGSAPHG 156 (314) T ss_pred ceeEEEEEEEEeeEEecHHHHHHHHHhCCChHHH-----------HHHHHHHHHHHhh----------ceEEEeeccccc Confidence 5677778888889999988876544333211111 0111112222222 1233322211 Q ss_pred eEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHh-c-C-CeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccc Q lcl|Aclame:pro 152 NKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARE-L-G-LNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSS 228 (348) Q Consensus 152 ~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~-~-G-~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~ 228 (348) .+.+ +..|.-...+.++.|+.+ ..+++||.+....+.. + | ..|++++++++.+..|.+ . .. +.+ T Consensus 157 ~~GL-lN~p~v~~~~~~~~WaT~-~ei~~Di~~~~~~l~~~s~g~~~p~~l~Lpp~~~~~L~~-~-----~~--~~~--- 223 (314) T protein:vir:10 157 IVSV-FDQPNINNVVATPNWSVP-QNAIDDVTAMIDAVESSTQGLHHVTDILLPASARRVMQG-L-----VP--QTN--- 223 (314) T ss_pred ceeE-eecCCCccccCCCCcccH-HHHHHHHHHHHHHHHHhcCccccceeEEecHHHHHhhcc-c-----cc--CCC--- Confidence 1111 111211123345689633 3569999998887753 3 4 469999999999987632 0 01 111 Q ss_pred ccHHHHHHHHHhhc-CceEEEEeeEEEcCCCcccccccCCeEEEEeCCcc-ceeEeccchhhhccccccccccceeecCC Q lcl|Aclame:pro 229 VTKAELQNYVADNY-GVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPL-GNTVFGTTPEESDLFADNTVNADVEIVDS 306 (348) Q Consensus 229 ~~~~~~~~~~~~~~-~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~-G~~~yg~~~~~~~~~~~~~~~~~~~~~~~ 306 (348) + .+.+++...+ .++|....+ +....+.. .+.+++...+.. ..... ++ T Consensus 224 ~---tvl~~l~~n~~~l~I~~~~e-l~~ag~~g-----~~~~v~y~~~~~~~~~~v----------------------p~ 272 (314) T protein:vir:10 224 L---SYGELFTRNNPGLTIRFLQF-LDNYDGAG-----GKAALAFEKSPLNMSIEI----------------------PE 272 (314) T ss_pred c---cHHHHHHHhCCCcEEEEccc-ccccCCCc-----ceEEEEEecCCcEEEEec----------------------Cc Confidence 1 2334444332 344444332 22222111 122223222110 01110 01 Q ss_pred ceEEEEeecCCCceeEEeeeeee-eeeecCCCcEEEEEEe--c Q lcl|Aclame:pro 307 GIAVTTTKTTDPVNVQTKVSMVA-LPSFERLGDVYMLTVI--P 346 (348) Q Consensus 307 ~~~~~~~~~~dP~~~~~~~~s~~-lPv~~~~~~~~~~~V~--~ 346 (348) .+....+ +..+.........+. =.++.+|.++..++=+ | T Consensus 273 ~~~~l~~-e~~~~~~~~~~~~r~~Gv~i~~P~ai~~~dGI~~~ 314 (314) T protein:vir:10 273 VTNVLPA-QPKDLHFRYPVTSKATGLIVYRPLTMAVIKGITFA 314 (314) T ss_pred cceeecc-eecCceEEEcceeeeEEEEEECcceeEeeeeeecC Confidence 1111111 222233333333332 3566677777766533 3 No 70 >protein:vir:78148 Length: 123 # NCBI annotation: hypothetical protein # Family: family:all:4955 # MgeID: mge:1847 # MgeName: Min1 # Cross-refs: genbank:acc:YP_001294802;genbank:gi:149882823;genbank:GeneID:5309176 Probab=26.76 E-value=1.9 Score=19.04 Aligned_cols=121 Identities=12% Similarity=0.045 Sum_probs=71.1 Q ss_pred EeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccce Q lcl|Aclame:pro 200 IMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGN 279 (348) Q Consensus 200 ~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~ 279 (348) +++--.|++++...-.-+++-. ++.|..| -|++.+..|-.++. +.+-+|.+...++-+..+|- T Consensus 1 vvsdlqfA~~~g~~v~~~aLpR----------E~aNp~l--tG~lpV~~~GltWl-----~tpnlpg~~a~vlDst~lGg 63 (123) T protein:vir:78 1 MLSGAQFAKLIGILVDDKALPR----------EQANIVL--TGSLPVSAYGLTWV-----TSRHITGTDPWLFDVEQLGG 63 (123) T ss_pred CcchhhHHHHhcchhccccccc----------ccCCceE--ecCcceeeeceeee-----ecCCCCCCccceeehhhhcc Confidence 3344446655555444444332 2234333 24677777776654 34456666666665544443 Q ss_pred eEeccchhhhccccccccccceeecCCceEEEEeecCC--CceeEEeeeeeeeeeecCCCcEEEEEEecC Q lcl|Aclame:pro 280 TVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTD--PVNVQTKVSMVALPSFERLGDVYMLTVIPG 347 (348) Q Consensus 280 ~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d--P~~~~~~~~s~~lPv~~~~~~~~~~~V~~~ 347 (348) ++ ++.-+..+. ......|+-+|+..++. ..++-+++--.-.|++.+|-+.+.++=+-= T Consensus 64 ma-----DE~l~~Pgy-----a~~~~~Gvevkt~Red~~~nD~yriRaRRvTvpiv~EP~Agv~ltg~g~ 123 (123) T protein:vir:78 64 MA-----DEKLLSPEF-----APAGNTGVEASTERAHQGVKDGYLVRGRRNTVAVVTEPMAGVRLTGTGL 123 (123) T ss_pred cc-----ccccCCCcc-----cCCCCcceeEEeeccccCCCCceEEeeeecceeEEecCccceEEeeecC Confidence 33 333333332 22234577788887766 678888888889999999999998875433 No 71 >protein:vir:94070 Length: 339 # NCBI annotation: putative structural protein # Family: family:all:1653 # MgeID: mge:1493 # MgeName: OP2 # Cross-refs: genbank:acc:YP_453625;genbank:gi:84662661;genbank:GeneID:5142580 Probab=24.29 E-value=2.2 Score=18.71 Aligned_cols=272 Identities=8% Similarity=0.020 Sum_probs=96.0 Q ss_pred CccchhhcCHHHHHHHHHhh--ccchhhhHHHHhCCCccccce--eEEEEEeecCceeeeeeeeCCCCcceec-ccceee Q lcl|Aclame:pro 1 MGLIYDKVTASNIAGYFNTL--QENVDSTLGESIFPARKQLGT--KLSYIKGASGQSVALKAAAFDTNVTIRD-RVSAEI 75 (348) Q Consensus 1 Ma~l~d~f~~~~l~~~i~~~--~~~~~~~l~~~~Fp~~~~~~~--~~~~~~~~~~~~~~a~~v~~~~~~~~~~-r~~~~~ 75 (348) |......+=++.++.+|... ....+++-...+||..+..+. +.......... -.|...+..+.-|+.+ +..+.. T Consensus 46 ~~~~~~~~i~a~~~~~i~~~vy~~~~~~~~~~~l~pv~t~g~w~~~t~~y~~~e~~-G~a~~ygd~ad~Pl~~~~v~~~~ 124 (339) T protein:vir:94 46 LQTTANAGIPAWMTTFVDRRVIDIQLAPMAAAKIFPEVKKGDWTTTYGVFIIAEPV-GQVATYSDWSANGMSKANVNFES 124 (339) T ss_pred cccccccchhhhhhhhhchhheeecccccchhhhcccccCCCCcccEEEEeeeecc-cceEEcccccCCCcccccceeeE Confidence 11111122234566667421 113345567889998664432 11111112222 2333445444443333 222332 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce--eE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV--NK 153 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~--~~ 153 (348) +. +..+...+..+..|+.+-+..+-.- .+.+ ....+++++..+ -++.+-|+.. .+ T Consensus 125 ~~--v~~~~~g~~y~~~E~~~A~~~g~~l-~~~K----------a~aA~~al~~~~----------N~i~~~Gd~~~~~~ 181 (339) T protein:vir:94 125 RQ--NYRYQTWTEYGDLEMATYGEAGIDY-VARQ----------EISASLVMAKFA----------NSSYLLGVAGIANY 181 (339) T ss_pred Ee--EEEEEEEEeecHHHHHHHHhhCCCh-HHHH----------HHHHHHHHHHhh----------ceEEeeeecccceE Confidence 32 2233334455666654433222111 1110 111112222111 1233322211 12 Q ss_pred EEeeccCccc-eeeeeecCCCCCcc-HHHHHHHHHHHHHh-cC-C----eeEEEEeCHHHHHHHhcCHHHHHHhcccCCC Q lcl|Aclame:pro 154 DIDYGVKADH-KKQVSKSWAEPGAT-PLADLEDAIETARE-LG-L----NPERAIMNAKTFGLIRKAASTVKAIKPLAGD 225 (348) Q Consensus 154 ~vDfg~~~~~-~~t~~~~W~~~~ad-p~~di~~~~~~~~~-~G-~----~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~ 225 (348) .+ +..|.-. .++++++|.+.+.+ +++||.++...++. +| . .|.+++|.+..++.|..- +..+ T Consensus 182 GL-lN~P~l~~~v~~s~~Wa~kT~~eI~~Di~~~~~~l~~~s~g~~~~~~~~~L~LP~~~~~~L~~~---------n~~~ 251 (339) T protein:vir:94 182 GL-MNDPSLPAPVAATVNWATAAPEDIANDVVAMVGRLISQSGGLITGQERMVMALAPSALNNVNRT---------NNFG 251 (339) T ss_pred EE-EeCCCccccccCCCCcccCCHHHHHHHHHHHHHHHHHhcCCeeeeccCcEEEecHHHHHhcccC---------CcCC Confidence 21 1112211 23556789877654 68999998887753 44 2 355799999999977431 0001 Q ss_pred cccccHHHHHHHHHhh-cCceEEEEeeEEEcCCCcccccc-cC----Ce-EEEEeCCccceeEeccchhhhccccccccc Q lcl|Aclame:pro 226 GSSVTKAELQNYVADN-YGVEIVLENGTYRNEKGEVSKFF-PD----GH-LTLIPNGPLGNTVFGTTPEESDLFADNTVN 298 (348) Q Consensus 226 ~~~~~~~~~~~~~~~~-~~~~i~~yd~~y~d~~g~~~~~~-~~----~~-vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~ 298 (348) + .+.++|... -+++|+...+ +.+.+|....++ +. +. -+.+|..- +.++..+... ... T Consensus 252 ---~---Tvl~~lk~n~pnl~i~~~~e-l~~a~g~~~~~~~~~~~~~~~~~~~~p~~~---~~lpvq~~~~------~~~ 315 (339) T protein:vir:94 252 ---L---SAGAKIAQTYPNIQFVAVPE-FDTASGRLVQLWVPEVNGQPTGEVAFAEKL---RSHSIERYST------TTR 315 (339) T ss_pred ---c---cHHHHHHHhcCCcEEEEccc-cccCCCceEEEEEEeccCCcceEEEcchhh---hccccEEcCc------eEE Confidence 1 122333322 1344433221 122222211111 00 00 11112110 0111000000 000 Q ss_pred cceeecCCceEEEEeecCCCceeEEeeeeeee Q lcl|Aclame:pro 299 ADVEIVDSGIAVTTTKTTDPVNVQTKVSMVAL 330 (348) Q Consensus 299 ~~~~~~~~~~~~~~~~~~dP~~~~~~~~s~~l 330 (348) ......-.|..++. |...... ..+ T Consensus 316 v~~~~rt~Gv~i~~-----P~ai~~~---~GI 339 (339) T protein:vir:94 316 QKHSGATFGAVIYQ-----PWAVTQE---LGV 339 (339) T ss_pred ecceeeeeeEEEEc-----cceeeee---ecC Confidence 00000001111111 1111111 111 No 72 >protein:vir:99675 Length: 324 # NCBI annotation: Major capsid protein # Family: family:all:975 # MgeID: mge:1523 # MgeName: VP4 # Cross-refs: genbank:acc:YP_249589;genbank:gi:68299740;genbank:GeneID:3799990 Probab=23.19 E-value=2.3 Score=18.56 Aligned_cols=266 Identities=11% Similarity=-0.015 Sum_probs=73.1 Q ss_pred CCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee--eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHH Q lcl|Aclame:pro 34 PARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI--HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINT 111 (348) Q Consensus 34 p~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~--~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~ 111 (348) =.+...+.+-..+... ....+.+..++.+..- .+..... ..+.+=-.+-. ..--+|+.+.|+..+. +.. T Consensus 1 ~vr~i~~g~s~~~~~i--G~~~~~~~~~G~~l~~-~~~~~~~~e~~itID~~l~~-~~~VdDiD~~qa~~Dl-----r~e 71 (324) T protein:vir:99 1 MTRTITSGKSAQFPVM--GRTKARYLKQGQSLDD-GREDIKHTEKVITIDGLLTT-DVLIYDIEDAMNHYDV-----RSE 71 (324) T ss_pred CeeeeecCceEEEeee--eeeEeccccCCCCcCC-CcCCcCcccEEEEecchhhh-hhhhhhHHHHhcCccc-----hhH Confidence 0011111111111100 1122233333322110 0000000 00000000000 0011233333322221 112 Q ss_pred HHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeeccCccceeeeeecCCCCCc---cHHHHHHHHHHH Q lcl|Aclame:pro 112 IVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYGVKADHKKQVSKSWAEPGA---TPLADLEDAIET 188 (348) Q Consensus 112 ~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg~~~~~~~t~~~~W~~~~a---dp~~di~~~~~~ 188 (348) + .+++-.++.+...-.+++.+..+...-.... ..-..+......+..++.-.++.. ..++-|....+. T Consensus 72 ~-------s~~~G~aLA~~~Dq~i~~~~a~~~~~~a~~~--~~~~~~~g~~~~~~~~~~~~~~~~~~~~~~dai~~a~~~ 142 (324) T protein:vir:99 72 Y-------STQMGEALAMAADVANYAEMAKLVNSRKETT--NENIEGLGAASLVKITGKKEDPAKYGTQVIQALTYARAA 142 (324) T ss_pred H-------HHHHHHHHHHHHHHHHHHHHHHhhhcccccc--cCCcccCCccceecccccccccccCHHHHHHHHHHHHHH Confidence 2 2222333333333333333221110000000 000001111111111111122222 234556666666 Q ss_pred HHhcCCe--eEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHHHhhcCceEEEEeeEEEcCCCc------- Q lcl|Aclame:pro 189 ARELGLN--PERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYVADNYGVEIVLENGTYRNEKGE------- 259 (348) Q Consensus 189 ~~~~G~~--~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~------- 259 (348) +.+...+ ...++++++.|.+|+++..+...-.... +. ..+..++...|++|+.-+.- ....++ T Consensus 143 Lde~~VP~~gR~~vv~P~~y~~Ll~~~~~~~~~~~~~---~~----~~~G~V~~i~Gf~V~~Sn~l-p~~~~t~~~~a~~ 214 (324) T protein:vir:99 143 FAKKYIPAGDRTFYTDPDTYSAILAALMPNAANYAAL---ID----PETGNIRNVMGFEVVETPHM-TAQMVTNPTDAFD 214 (324) T ss_pred HhhcCCCCCCCEEEeChHHHHHHhhcccccccccccc---cc----eecceEEEEeceEEEecCCc-ccccccccccccc Confidence 6555543 3468999999999998877654422211 11 11223334456665543221 000000 Q ss_pred --------------cccccc--CCe-EEEEeCCccceeEeccchhhhccccccccccceeecCCceEEEEeecCCCceeE Q lcl|Aclame:pro 260 --------------VSKFFP--DGH-LTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIAVTTTKTTDPVNVQ 322 (348) Q Consensus 260 --------------~~~~~~--~~~-vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~dP~~~~ 322 (348) ..++-+ .+. .++++...+|...= ..+....|.+.+--+.+ T Consensus 215 ~~~~~~~~~~~~~~~~ky~~d~~~~~gl~~~~~a~~tv~~-----------------------~~~~~e~~~~~~~~~d~ 271 (324) T protein:vir:99 215 GTGHIFPATGDSTTTGKMTVGADNVVGLFVHRSAVATLKL-----------------------KDMALERARRPEYQADQ 271 (324) T ss_pred ccccccccccccccccccccccCceeEEEEehhheEEEee-----------------------ecceecceechhhHHHh Confidence 001111 111 11112111111100 00000000000001111 Q ss_pred EeeeeeeeeeecCCCcEEEEE--------EecCC Q lcl|Aclame:pro 323 TKVSMVALPSFERLGDVYMLT--------VIPGV 348 (348) Q Consensus 323 ~~~~s~~lPv~~~~~~~~~~~--------V~~~~ 348 (348) +.+.-.-=..+.+|+.....+ |+|+| T Consensus 272 i~~~~a~G~~~lRPe~a~~v~l~~~~~~~~~~~~ 305 (324) T protein:vir:99 272 IIAKYAMGHGGLRPEAVGAIIFEDGETPAVAPDV 305 (324) T ss_pred hhhhhhhcCcccccceEEEEEEccCccccccchh Confidence 111111112223555443333 22333 No 73 >protein:vir:4830 Length: 397 # NCBI annotation: MPL-7201 # Family: family:all:21 # MgeID: mge:105 # MgeName: 7201 # Cross-refs: genbank:acc:NP_038327;genbank:gi:9634653;genbank:GeneID:1262632 Probab=21.83 E-value=2.5 Score=18.36 Aligned_cols=268 Identities=12% Similarity=-0.038 Sum_probs=112.9 Q ss_pred Ccc--ch--hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccce--eEEEEEeecCceeeeeeeeCCCCcceeccccee Q lcl|Aclame:pro 1 MGL--IY--DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGT--KLSYIKGASGQSVALKAAAFDTNVTIRDRVSAE 74 (348) Q Consensus 1 Ma~--l~--d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~--~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~ 74 (348) |+. -. .++-|.++..-|-+......+ |.+ +.+..++.+. .+....... ....+.++..+.+.+-.....+. T Consensus 109 ~~~~t~~~gg~~iP~~~~~~ii~~~~~~~~-l~~-~~~~~~~~~~~~~~~~~~~~~-~~~~a~~v~E~~~~~~~~~~~~~ 185 (397) T protein:vir:48 109 KTDASGSDAGLTIPQDIQTAIHTLVRQYDS-LQE-YVNVENVTTLTGSRVYEKWAD-ITGLAKLDDEAGSIGTNDDPKLY 185 (397) T ss_pred hhccCCccccccccHHHHHHHHHHHHHHHH-HHh-hhceeeccCCcceEEEEeecC-CCcceeeecccccccccccccee Confidence 221 11 122234443333333322222 323 3333322222 222222111 22235667666655544455667 Q ss_pred eeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEE Q lcl|Aclame:pro 75 IHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKD 154 (348) Q Consensus 75 ~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~ 154 (348) ...+.+-.++....++.+=+. ++. .+ +...+ ...+..++...+|..++...-+|+ T Consensus 186 ~v~~~~~k~~~~~~iS~ell~------ds~-~~----l~~~v---~~~l~~~~~~~~d~~il~G~g~~~----------- 240 (397) T protein:vir:48 186 PIRYAIKRYAGISTVTNSLLA------DSA-EN----ILAWL---SGWIAKKVVVTRNKAILEAIATLP----------- 240 (397) T ss_pred eEEeeheeeeeehhhHHHHHh------hch-HH----HHHHH---HHHHHHHHHHHHHHHHhhcccccc----------- Confidence 777777666666666543221 111 11 11222 223455666666655543221110 Q ss_pred EeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHH Q lcl|Aclame:pro 155 IDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAEL 234 (348) Q Consensus 155 vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~ 234 (348) . ..+....++|.++...+...+.....++|++.+|..|++ +++. + +...+.+... T Consensus 241 ---------~--------~~~~~~~d~i~~~~~~l~~~~~~~a~~v~n~~~~~~L~~---lkd~----~-G~~i~~~~~~ 295 (397) T protein:vir:48 241 ---------T--------KPTLTKWDDIIDLQAKVDPAIKQTSFFLTNTSGFTALKK---VKNA----F-GDYLMERDVK 295 (397) T ss_pred ---------c--------ccccccHHHHHHHHHHhhhhhcCCCEEEECHHHHHHHHH---hhcC----C-CceeeccCcC Confidence 0 012233456666666665555667789999999998764 2211 1 1111111111 Q ss_pred HHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccchhhhccccccccccceeecCCceE--EEE Q lcl|Aclame:pro 235 QNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTTPEESDLFADNTVNADVEIVDSGIA--VTT 312 (348) Q Consensus 235 ~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~~~~~~~~~~~~~~~~~~~~~~~~~--~~~ 312 (348) ...-..+.|.++++.+..+....+ .++..+++..... +. .++. ..++- +.. T Consensus 296 ~~~~~~l~G~PV~~~~~~~~~~~~-----~~~~~~~~gd~~~-~~-~~~~--------------------~~~~~i~~~~ 348 (397) T protein:vir:48 296 SPTGYSIDGFAVKEVADRWLANAS-----SGAMPLYFGDLKQ-AV-TLFD--------------------RQQMSLLSTN 348 (397) T ss_pred CCCCceeccceeEEecccccCCcC-----CCceEEEEEeccc-eE-EEEe--------------------ecceEEEEec Confidence 111123457777766543321111 1112222221110 00 0000 00000 000 Q ss_pred --eecCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 313 --TKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 313 --~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) +....-......+..+.=..+.+|++++++++.+-. T Consensus 349 ~~~~~~~~~~~~~r~~~r~d~~~~~~~a~~~~~~~~~~ 386 (397) T protein:vir:48 349 IGGGAFETDTTKIRVIDRFDVVATDTESFVPASFKAIA 386 (397) T ss_pred cchhhhhcCceeEEEEeeeccEEecccceEEEEecccc Confidence 000111234445555566677889999999988766 No 74 >protein:vir:2344 Length: 397 # NCBI annotation: gp14 # Family: family:all:507 # MgeID: mge:51 # MgeName: Bxb1 # Cross-refs: genbank:acc:NP_075281;genbank:gi:12657868;genbank:GeneID:920118 Probab=21.30 E-value=2.6 Score=18.29 Aligned_cols=283 Identities=10% Similarity=0.061 Sum_probs=110.0 Q ss_pred Cccc-----hhhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceee Q lcl|Aclame:pro 1 MGLI-----YDKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEI 75 (348) Q Consensus 1 Ma~l-----~d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~ 75 (348) |+.- -.++-+.....+++.+.. . +-+++ +++..++......... .... ..+.++..+.+.+.. ...+.. T Consensus 10 ~~~~~t~~~~g~l~~~~~~~ii~~l~~-~-s~i~~-l~~~~~~~~~~~~ip~-~~~~-~~a~wv~Eg~~~~~s-~~~f~~ 83 (397) T protein:vir:23 10 IAQTKDTMFTGYLDPVQAKDYFAEAEK-T-SIVQR-VAQKIPMGATGIVIPH-WTGD-VSAQWIGEGDMKPIT-KGNMTK 83 (397) T ss_pred HhhccCCCCccccchhHHHHHHHHHHh-c-cchhh-hcceeeccCCceEEEE-EcCC-cceEEecCCcccccc-ccceeE Confidence 3322 134555555666665542 2 23444 4555555444333322 2222 346778777666654 456777 Q ss_pred eEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEE Q lcl|Aclame:pro 76 HDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDI 155 (348) Q Consensus 76 ~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~v 155 (348) ..+.+-+++-...++.+=++ +. ..+ +...+ ...+.+++.+.+|.+++ +|-= .+.... T Consensus 84 v~l~~~k~~~~v~iS~ell~------ds-~~~----l~~~i---~~~l~~aia~~~d~a~l----~G~g----t~~~~~- 140 (397) T protein:vir:23 84 RDVHPAKIATIFVASAETVR------AN-PAN----YLGTM---RTKVATAIAMAFDNAAL----HGTN----APSAFQ- 140 (397) T ss_pred EEEeeEEEEEeehhhHHHHh------cc-hHH----HHHHH---HHHHHHHHHHHHHHHHh----hccc----CCcccc- Confidence 78888777777666543221 11 111 11222 33445666777776554 2310 000000 Q ss_pred eeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHH Q lcl|Aclame:pro 156 DYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQ 235 (348) Q Consensus 156 Dfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~ 235 (348) +.... ...+..+ ++.....++......+...+......+|++..+..|++ +++.- + .....+.... T Consensus 141 --~~~~~--~~~~~~~--~~~~~~~~~~~~~~~l~~~~~~~a~~vmn~~~~~~L~~---lkd~~----G-~~i~~~~~~~ 206 (397) T protein:vir:23 141 --GYLDQ--SNKTQSI--SPNAYQGLGVSGLTKLVTDGKKWTHTLLDDTVEPVLNG---SVDAN----G-RPLFVESTYE 206 (397) T ss_pred --ccccc--ccceeee--cccchhHHHHHHHHhhhhcccCCCEEEEcHHHHHHHHH---hhccC----C-ceeecccccc Confidence 00000 0011111 12223445555555565566667789999999987764 22221 1 1111111000 Q ss_pred HH-----HHhhcCceEEEEeeEEEcCCCcccccccCCeEEE-EeCCccceeEecc----chhhhccccccccccceeecC Q lcl|Aclame:pro 236 NY-----VADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTL-IPNGPLGNTVFGT----TPEESDLFADNTVNADVEIVD 305 (348) Q Consensus 236 ~~-----~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~-~p~~~~G~~~yg~----~~~~~~~~~~~~~~~~~~~~~ 305 (348) .. -+...|+++++.+. +|++.+.+ +.+- -..+||. ..+.++.. .......+ T Consensus 207 ~~~~~~~~~tl~G~Pv~~s~~------------~~~g~~~~~~gDf--s~~~i~~~~~i~i~~~~e~-----~~~~~~~~ 267 (397) T protein:vir:23 207 SLTTPFREGRILGRPTILSDH------------VAEGDVVGYAGDF--SQIIWGQVGGLSFDVTDQA-----TLNLGSQE 267 (397) T ss_pred cccccccCceeeeeeEEEeCC------------CCCCceEEEEeec--ceEEEEEEeceEEEEeeee-----eeeecccc Confidence 00 01223444443221 23333221 1110 0111211 00000000 00000000 Q ss_pred CceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 306 SGIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 306 ~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) .+.....|.+ ....+++..+.=..+.+|+++.+++..+.. T Consensus 268 ~~~~~~lf~~---d~v~~ra~~r~d~~v~~~~a~~~~~~~~~~ 307 (397) T protein:vir:23 268 SPNFVSLWQH---NLVAVRVEAEYGLLINDVNAFVKLTFDPVL 307 (397) T ss_pred ccceeeeeec---cceeEEEEeeeccceecccceEEEeecccc Confidence 0000000110 012223333333444455555555443222 No 75 >protein:vir:2504 Length: 305 # NCBI annotation: major capsid subunit gp9 # Family: family:all:507 # MgeID: mge:53 # MgeName: TM4 # Cross-refs: genbank:acc:NP_569745;genbank:gi:18496895;genbank:GeneID:932268 Probab=20.67 E-value=2.7 Score=18.19 Aligned_cols=287 Identities=9% Similarity=-0.034 Sum_probs=100.2 Q ss_pred Cccch----hhcCHHHHHHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCccee----cccc Q lcl|Aclame:pro 1 MGLIY----DKVTASNIAGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIR----DRVS 72 (348) Q Consensus 1 Ma~l~----d~f~~~~l~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~----~r~~ 72 (348) ||.+. ..+-|.++..-|-+......+ +.+ +.+..++............ ...|.++..++..+-. .... T Consensus 1 ma~~t~~~gg~liP~~~~~~Ii~~~~~~s~-l~~-l~~~~~~~~~~~~~p~~~~--~~~a~wv~E~~~~~~~~~~~s~~~ 76 (305) T protein:vir:25 1 MADISRAEVASLIQEAYSDTLLAAAKQGST-VLS-AFQNVNMGTKTTHLPVLAT--LPEADWVGESATDPKGVKPTSKVT 76 (305) T ss_pred CCCccCCccceecCHHHHHHHHHHHHhhch-hhh-hcceeeccCCcEEEEEEeC--CcceEEeecccccccccccccccc Confidence 88875 344455564444333333333 333 4555554443333322221 2346677776554322 2345 Q ss_pred eeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCce- Q lcl|Aclame:pro 73 AEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGV- 151 (348) Q Consensus 73 ~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~- 151 (348) +....+.+-++.-...++.+-+ .++. .+ +...+ .+.+.+++.+.+|..+. +|.=. ..+. T Consensus 77 f~~i~~~~~k~~~~~~is~ell------~ds~-~~----~~~~i---~~~l~~~~a~~~d~a~~----~G~g~--~~~~~ 136 (305) T protein:vir:25 77 WANRTLVAEEIAVIIPVHENVI------DDAT-VA----VLTEV---AELGGQAIGKKLDQAVI----FGTDK--PASWV 136 (305) T ss_pred eeeEEeeeEEEEEeehhhHHHH------hcch-HH----HHHHH---HHHHHHHHHHHHhhhhe----eccCC--CCCcc Confidence 5656666666665556654321 1111 11 11222 23345556666665544 33210 0000 Q ss_pred eEE-EeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCccccc Q lcl|Aclame:pro 152 NKD-IDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVT 230 (348) Q Consensus 152 ~~~-vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~ 230 (348) ... +.......+.. .+........+.+.++......+...+..++.++|++..+..|++ +++.- ...... T Consensus 137 ~~~~~~~~~~~~~~~-~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~v~~~~~~~~l~~---lkd~~-----G~~i~~ 207 (305) T protein:vir:25 137 SPALIPAAVTAGQAV-EVVGGVANESDIVGATNRAAKAVASAGWAPDTLLSSLALRYEVAN---IRDAN-----GNPVFR 207 (305) T ss_pred ccccccccccccccc-cccccchhhhHHHHHHHHHHHhhhhcccccceeEecHHHHHHHHH---hhccC-----Cceeec Confidence 000 00110011100 111112223556666776666666667777889999999988753 22221 111111 Q ss_pred HHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccC-CeEEEEeCCccc--eeEeccchhhhccccccccccceeecCCc Q lcl|Aclame:pro 231 KAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPD-GHLTLIPNGPLG--NTVFGTTPEESDLFADNTVNADVEIVDSG 307 (348) Q Consensus 231 ~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~-~~vv~~p~~~~G--~~~yg~~~~~~~~~~~~~~~~~~~~~~~~ 307 (348) +. ...|+++++.+.--. ..++..=++.+ ..+++.-.+.+- ...++.. .+. .......+ ..- T Consensus 208 ~~-------~l~G~Pv~~~~~~~~-~~~~~~~~~gd~s~~~i~~~~~~~i~~~~~~~~---~~~---~~~~~~~~--~~~ 271 (305) T protein:vir:25 208 DD-------SFAGFRTFFNRNGAW-DADAAIEVIADSSRVKIGVRQDITVKFLDQATL---GTG---ENQINLAE--RDM 271 (305) T ss_pred CC-------cccccceEEcCccCC-CCCccEEEEEecceEEEEEecCeEEEEeeeeee---ecC---Cceeeeee--cCc Confidence 11 123444443332100 01111111111 111111100000 0000000 000 00000000 000 Q ss_pred eEEE-----EeecCCCceeEEeeeeeeeeeecCCCc Q lcl|Aclame:pro 308 IAVT-----TTKTTDPVNVQTKVSMVALPSFERLGD 338 (348) Q Consensus 308 ~~~~-----~~~~~dP~~~~~~~~s~~lPv~~~~~~ 338 (348) +.++ -|.-.+|........ .+.= ...|-+ T Consensus 272 ~~~R~~~r~~~~v~~p~a~v~~~~-~~~~-~~~pa~ 305 (305) T protein:vir:25 272 VALRLKARFAYVLGVSATAQGANK-TPVA-VVAPAA 305 (305) T ss_pred EEEEEEEeecceeeCcccEEEEcc-cccc-ccCCCC Confidence 0000 111122222211111 1110 111111 No 76 >protein:vir:95763 Length: 297 # NCBI annotation: head protein # Family: family:all:507 # MgeID: mge:1578 # MgeName: SMP # Cross-refs: genbank:acc:YP_950590;genbank:gi:119953785;genbank:GeneID:5076833 Probab=20.60 E-value=2.7 Score=18.18 Aligned_cols=280 Identities=9% Similarity=0.053 Sum_probs=122.7 Q ss_pred Cccc------------hhhcCHHHH-HHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcce Q lcl|Aclame:pro 1 MGLI------------YDKVTASNI-AGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTI 67 (348) Q Consensus 1 Ma~l------------~d~f~~~~l-~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~ 67 (348) |... ...+=|.++ .++++.+. .. +-+.+ +.+..++.......+....+ ...|.+++.+++.+. T Consensus 1 m~~~~~~~~~~~~t~~~~~lvP~~~~~~ii~~~~-~~-s~l~~-~~~~~~~~~~~~~~~~~~~~-~~~a~~v~Eg~~~~~ 76 (297) T protein:vir:95 1 MTVQTFNPENVLVSQKKDGTLHKEFTDIIMKEVA-QN-SLVMQ-LGQYQEMEGEQEKTVYVQTD-GISAYWVNETEKIKT 76 (297) T ss_pred CCccccccccccccCCCcceechhHHHHHHHHHH-hh-chhhh-hcceeecCCCccEEEEEEcC-CceeEEeecCccccc Confidence 3221 011112333 33333332 22 22333 35554443332222222222 234677887776654 Q ss_pred ecccceeeeEeeccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeec Q lcl|Aclame:pro 68 RDRVSAEIHDEQMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFT 147 (348) Q Consensus 68 ~~r~~~~~~~~~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~ 147 (348) . ...+....+++-+++--..++.+-+ .++ ..+ +...| ...+.+++.+.+|..+. +|- T Consensus 77 ~-~~~f~~v~l~~~k~~~~~~is~ell------~ds-~~~----l~~~i---~~~la~ai~~~~d~a~l----~G~---- 133 (297) T protein:vir:95 77 D-KPEVVPVTLKAHKLGIILVTSREAL------NYT-WKK----FFEDM---KPQIVEAFYKKIDEAGL----LGH---- 133 (297) T ss_pred c-ccceeEEEEeeEEEEEeehhhHHHH------hcC-HHH----HHHHH---HHHHHHHHHHHHHHHHh----ccc---- Confidence 4 3567777777776666666654322 111 111 11222 23445666677765555 342 Q ss_pred CCceeEEEeeccCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcc Q lcl|Aclame:pro 148 SDGVNKDIDYGVKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGS 227 (348) Q Consensus 148 ~~~~~~~vDfg~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~ 227 (348) +.+... +... ..+...... ++..-++||.++...+...+..+..++|+++.+..|++ +++.- + .. T Consensus 134 g~~~~~----gi~~--~~~~~~~~~-~~~~t~~~i~~~~~~l~~~~~~~~~~v~~~~~~~~L~~---l~d~~----G-~~ 198 (297) T protein:vir:95 134 DTPFAN----SVAK--AAKDANKVI-GGPINYDNILKLQDALYDADVEPNAFVSKIQNRSALRE---ARDGN----K-VS 198 (297) T ss_pred CCcccc----cccc--cccccceec-ccccCHHHHHHHHHHhhhccCCcCEEEEcHHHHHHHHH---hhccC----C-ce Confidence 111100 0000 000011111 12234678888888887777788889999999987753 22221 1 11 Q ss_pred cccHHHHHHHHHhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccc----hhhhccccccccccceee Q lcl|Aclame:pro 228 SVTKAELQNYVADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTT----PEESDLFADNTVNADVEI 303 (348) Q Consensus 228 ~~~~~~~~~~~~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~----~~~~~~~~~~~~~~~~~~ 303 (348) ...+. -+...|.+++... + ...+++.++|.-... ..||.- .+..+ ... ..... T Consensus 199 i~~~~-----~~~l~G~Pv~~~~----~------~~~~~~~~~~gd~s~---~~~~~~~~~~i~~~~-~~~----~~~~~ 255 (297) T protein:vir:95 199 IYDKA-----ANTIDGITTVDLK----S------ARFEKGDLLAGDFDN---LIYGVPYNITYKISE-EGQ----ISTIT 255 (297) T ss_pred eecCC-----CCcccceeeEeec----C------CCCCCceEEEEeccc---EEEEEecCeEEEEee-ccc----ccccc Confidence 11110 0123355543221 1 112334444443222 122210 00000 000 00000 Q ss_pred cCCceEEEEeecCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 304 VDSGIAVTTTKTTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 304 ~~~~~~~~~~~~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) ...+.....|.+ ....+++..+.=..+.+|+++.++|...+| T Consensus 256 ~~~~~~~~~~~~---~~~~~r~~~~~d~~v~~~~a~~~l~~at~~ 297 (297) T protein:vir:95 256 NADGTPINLFEQ---EMIAIRATMDIAVMITKTDAFAKLTPAERV 297 (297) T ss_pred ccCccchhhhhc---CcEEEEEEEEeccEeecccceEEEeecCCC Confidence 000111111111 134566677777888899999999999999 No 77 >protein:vir:103955 Length: 324 # NCBI annotation: head protein # Family: family:all:507 # MgeID: mge:1662 # MgeName: phiNM # Cross-refs: genbank:acc:YP_873992;genbank:gi:118430767;genbank:GeneID:4525449 Probab=20.13 E-value=2.8 Score=18.11 Aligned_cols=281 Identities=10% Similarity=0.007 Sum_probs=120.6 Q ss_pred Ccc-chhhcCHHHH-HHHHHhhccchhhhHHHHhCCCccccceeEEEEEeecCceeeeeeeeCCCCcceecccceeeeEe Q lcl|Aclame:pro 1 MGL-IYDKVTASNI-AGYFNTLQENVDSTLGESIFPARKQLGTKLSYIKGASGQSVALKAAAFDTNVTIRDRVSAEIHDE 78 (348) Q Consensus 1 Ma~-l~d~f~~~~l-~~~i~~~~~~~~~~l~~~~Fp~~~~~~~~~~~~~~~~~~~~~a~~v~~~~~~~~~~r~~~~~~~~ 78 (348) |.. -...+=|.++ ..++..+. ...+ +.+ +++..++.+..+.... ..+. ..|.+++.+.+.+... ..+....+ T Consensus 30 ~~~~~~~~liP~~~~~~ii~~~~-~~s~-l~~-~~~~~~~~~~~~~~p~-~~~~-~~a~~v~Eg~~~~~~~-~~~~~v~~ 103 (324) T protein:vir:10 30 MMHEKKDGTLLNDFTTPILQEVM-ENSK-IMQ-LGKYEPMEGTEKKFTF-WADK-PGAYWVGEGQKIETSK-ATWVNATM 103 (324) T ss_pred eccCCCcceechhHHHHHHHHHH-hhch-hhh-hcceeeccCCceEEEE-EeCC-cceeEeccCccccccc-cceeEEEE Confidence 211 1111222333 33333332 2222 333 3555554444444333 2222 3467788877766544 46677777 Q ss_pred eccccccccccCHHHHHHHHhhcCcCCHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHhcCeeeecCCceeEEEeec Q lcl|Aclame:pro 79 QMPFFKEALLVKENDRQQLNLVKDTGNEALINTIVAGIFNDDVTLINGARARLEAMRMQVLATGKIAFTSDGVNKDIDYG 158 (348) Q Consensus 79 ~~p~i~~~~~i~~~d~~~l~~~~~~~~~~~~~~~~~~i~~~~~~~~~~i~~r~E~m~~qal~~Gki~~~~~~~~~~vDfg 158 (348) .+-++.--..++.+-+ .+. ..+ +...+ ...+.+++.+.+|..+. .|.-+-..+ ..+ T Consensus 104 ~~~k~~~~~~iS~ell------~ds-~~~----l~~~i---~~~l~~ai~~~~d~a~l----~G~g~~~~~---~~i--- 159 (324) T protein:vir:10 104 RAFKLGVILPVTKEFL------NYT-YSQ----FFEEM---KPMIAEAFYKKFDEAGI----LNQGNNPFG---KSI--- 159 (324) T ss_pred eeEEEEEeehhhHHHH------hcc-hHH----HHHHH---HHHHHHHHHHHHHHHhh----hcCCCCccC---ccc--- Confidence 7766666556654322 111 111 11222 33445666666665443 232110000 000 Q ss_pred cCccceeeeeecCCCCCccHHHHHHHHHHHHHhcCCeeEEEEeCHHHHHHHhcCHHHHHHhcccCCCcccccHHHHHHHH Q lcl|Aclame:pro 159 VKADHKKQVSKSWAEPGATPLADLEDAIETARELGLNPERAIMNAKTFGLIRKAASTVKAIKPLAGDGSSVTKAELQNYV 238 (348) Q Consensus 159 ~~~~~~~t~~~~W~~~~adp~~di~~~~~~~~~~G~~~~~~~~~~~~~~~l~~~~~v~~~~~~~~~~~~~~~~~~~~~~~ 238 (348) .+.. .......++....+||.++...+...+..+..++|++.+|..|++ +++.- +. ..+....- T Consensus 160 ---~~~~-~~~~~~~~~~~t~~~i~~~~~~l~~~~~~~~~~v~n~~~~~~L~~---l~d~~----g~-~~~~~~~~---- 223 (324) T protein:vir:10 160 ---AQSI-EKTNKVIKGDFTQDNIIDLEALLEDDELEANAFISKTQNRSLLRK---IVDPE----TK-ERIYDRNS---- 223 (324) T ss_pred ---cccc-cccceeccccCCHHHHHHHHHhhhhccCCCCEEEEcHHHHHHHHH---hhccC----Cc-eeecCCCC---- Confidence 0000 111222344567888998888887777778889999999997753 22221 11 11111000 Q ss_pred HhhcCceEEEEeeEEEcCCCcccccccCCeEEEEeCCccceeEeccc----hhhhccccccccccceeecCCceEEEEee Q lcl|Aclame:pro 239 ADNYGVEIVLENGTYRNEKGEVSKFFPDGHLTLIPNGPLGNTVFGTT----PEESDLFADNTVNADVEIVDSGIAVTTTK 314 (348) Q Consensus 239 ~~~~~~~i~~yd~~y~d~~g~~~~~~~~~~vv~~p~~~~G~~~yg~~----~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 314 (348) ..+.|.+++..+.. + .+++.+++..... ..+|.- .+.++... ........+.....|. T Consensus 224 ~~l~G~PV~~~~~~----~------~~~~~~~~gd~~~---~~~~~~~~~~i~~~~~~~-----~~~~~~~~~~~~~~~~ 285 (324) T protein:vir:10 224 DTLDGLPVVNLKSS----N------LKRGELITGDFDK---LIYGIPQLIEYKIDETAQ-----LSTVKNEDGTPVNLFE 285 (324) T ss_pred ccccceeEEeecCC----C------CCcceEEEEeccc---EEEEEecCcEEEEeeccc-----ccccccccccchhhhh Confidence 12345666443211 1 1223344433221 222210 00000000 0000000000011111 Q ss_pred cCCCceeEEeeeeeeeeeecCCCcEEEEEEecCC Q lcl|Aclame:pro 315 TTDPVNVQTKVSMVALPSFERLGDVYMLTVIPGV 348 (348) Q Consensus 315 ~~dP~~~~~~~~s~~lPv~~~~~~~~~~~V~~~~ 348 (348) + ....+++..+.=..+.+|+++.+++....+ T Consensus 286 ~---~~~~~r~~~r~d~~v~~~~A~~~l~~a~~~ 316 (324) T protein:vir:10 286 Q---DMVALRATMHVALHIADDKAFAKLVPADKK 316 (324) T ss_pred c---CcEEEEEEEEEccEEecccceEEEEeccCC Confidence 1 134455566666677789999998776444 Done!