2
!"#$" "& "'() *"$#+, "& -)" *.--)*"+&,* !"#$ !()/+)*0 1),-.) 2+$.* -&(&)* ,(( 3456478 *"$#+,* *)9)/"):; 38 <'()* = 64>> /&?(9)") -),&?)*; <'()0 1),-.) 2+$.* "'() @ -&(&)* ,(( 345@ABB *"$#+,* *)9)/"):; 3@ABB !"$#+,* = @AB7 /&?(9)") -),&?)*; <'()0 1),-.) 2+$.* "'() A 3457C6 *"$#+,* *)9)/"):; 37C6 !"$#+,* = 7A7 /&?(9)") -),&?)*; <'()0 1),-.) 2+$.* "'() A <D#+9#,:5@>>B@5BC 345@ *"$#+,* *)9)/"):; 3@ !"$#+, = A /&?(9)") -),&?)*; < 1 + " -./.01 2345-6.-7 18 390/5%. 39 -.,40: EF/9.:) (#$"+#99' *)G.),/): -),&?)* H.?( "& *"$#+, +, "#F&,&?'0 !"#$"0 IIII IIII 08//.01389 ;.,4 <& #:: ?&,"D "& *)#$/DJ *)) K:2#,/) !)#$/D L("+&,*0 M&,"D N#,-) -,<=/. /80,1389 !"" !#$%&'() +(#,( !)-.&""( !./0%("&( 1()-"(2$/3 1$"&4$ 1%(4&" 1%&0&/3 5&%-&) 6/"()2/ 1%.)$& 1.%7&)( 8(/, 9(#:,2&( 93&"$ 93&)( 9,",#:&( 9,#,%,/ 9,,7 6/"()2/ :8-1 -./.01389 !"" >.#() ?,/@.&0, ?,./$ A)7),B) !"#$%" '"()*+ !)#$/D T&$ 2+$.* -),&?+/ *)G.),/)* #,: $)9#"): +,T&$?#"+&,R I&. /#, *)#$/D T&$ "D) UD&9) 2+$.* T#?+9' &$ *)#$/D T&$ *()/+T+): -),.*J *()/+)* )"/R I&. /#, #9*& T+,: '&.$ *"$#+, &$ -),&?) $)/&$: +T '&. D#2) +"* +,T&$?#"+&,J *./D #* *"$#+, ,#?)J #//)**+&,R V&?) W),&?) !)#$/D !"#$%" !EKNSV 1K<K KXKYIZE [ \]!QKY]ZE ^LN_`EXSV \]NQ! OKM]Y]E! VLME !"#$ &'($)* $'+#$,'- ./ 0',"1'&2 !"#$%& ($)*"$)# 34&56(74,0 89 5'$ 5(0' : &"$+'- ;7 <5')4'& =(1': <+$(4, =(1': >',?(,@ A))'&&4", (&)',-4,067 +),-.#/ !"**)01, 233 *4 54$6)01 !"* !#7" !"#$%& +480.4#3 !"#$%" '"()*+ ,"-./0 94:$ !"."%*"3 ;*"<,= >? )*"<, ,"."%*"3 @ +","."%* 2.. <'6')+ (66 ./ 0',"1'& !*$#)0 A#<" !-"%)", A#<" !"D:"0%" E"01*& +#*" F4,* B"0C#06 F4,* (4:0*$/ G4. H/-" 3BC!99DBB8E. 
3',0#' F4$#& B B999 G,@,"H, D=IAD C(6(7&4( 0',"14) J=A 3K=LDBI?JI?M3DLB./EIB999 3',0#' F4$#& B B999 N#1(, N"1" &(54',& ?$(O46 0',"14) J=A 3K=LDBIPQI?M3DL..ERISRRR 3',0#' F4$#& B SRRR N#1(, N"1" &(54',& P"6"1;4( 0',"14) J=A 3K=LDBI=MI?M3DLB.VVIB999 3',0#' F4$#& B WXU899E9 S9/BR B999 N#1(, N"1" &(54',& =4)($(0#( 0',"14) J=A 3K=LDBI=MI?M3DLB.VEIB999 3',0#' F4$#& B WXU899ES S9ER9 B999 N#1(, N"1" &(54',& =4)($(0#( 0',"14) J=A I:0 20#./,), N"1' >',"1' <'($)* J'&#6+& ;3"0*)J/ !)<).#$ !"D:"0%", KCE2!HL 20#./M" !"D:"0%" N#$)#*)40 K!AOL 2.)10 !"D:"0%", KG!2L G"*#3#*#P3$)7"0 (4<-#$#*)7" 20#./,), H44. B"0"$#*" O&/.41"0"*)% H$"" <KAJPN 3AYA A=AZ![K \ LM<GAZM[K ]QJ^?K=PN LMJG< WACMZMK< NQCK !" ,$7+,D/ R$,$ 0,$U"+*/.E /$.$7#$D C,+T /$-,7A ,$/*.#/ #$%&' )*+&*$,*) - ./012' /. )*+&*$,*) %0/3#4*4 - 86-."26$D ZHL)H H."26$D ZHL)H F$V*/ !.*/#-. ! """ $%&' ()'%*+,- """ )*+&*$,* '5%* - F*7.$+#"D$ $&16*0 /. 70/&%) , 328&* '90*)9/84 )A$ ![U-.*$ #A,$/A+.D "/ */$D -/ #A$ :;<=:>:0,+5-5."#E .$U$. C+, #A$ ."\$."A++D #A-# #A$ 0+/"#"+6 "/ D"CC$,$6# -T+62 #A$ 2,+*0/ /"T0.E 5E 7A-67$N ]6#$, #A,$/A+.D U-.*$: ?N?^ ,?@A=@>B ,CB;D )BE>B@FB 7D?>G=@H !"#$%$#$&%'()"* ,-./$'$#()" 0*$123(3 4--1 T$#-[!H)L R".. -..+R */$,/ +C #A$ U",*/[+,"$6#$D R$5/"#$/ #+ $-/".E 0$,C+,T #A$", +R6 7*/#+T"_$D 7+T0-,-#"U$ 2$6+T"7/ -6-.E/$/ "6 -6 -*#+T-#$D C-/A"+6 R"#A T"6"T-. T-6*-. T-6"0*.-#"+6N 8/"62 T$#-[!H)L= */$, 7-6 0$,C+,T - /#-#"/#"7-. -6-.E/"/ +6 /$3*$67$/ -//"26$D #+ D"CC$,$6# 2,+*0/ "6 +,D$, #+ D$#$,T"6$ ,$/"D*$/ #A-# /"26"C"7-6#.E 7+,,$.-#$ R"#A +6$ +, T+,$ T$#-D-#- C"$.D/N !"#$% '( )*#$+,*- ./0 1 +$23,+$4 5,$64 J+T$ S$6+T$ L$-,7A ($/*.#/ W$#-D-#-[D,"U$6 !+T0-,-#"U$ H6-.E/"/ )++. C+, L$3*$67$/ IT$#-[!H)LM !"#$%$%&%'#( L]H(!J 9H)H HFHX`Y] a &GL8HXGY] 4;(b1]F!J &G(8L ZHWGXG]L J;W] ViPR is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. 
HHSN272200900041C and is a collaboration between Northrop Grumman Health IT, University of Texas Southwestern Medical Center and Vecna Technologies. Comments, questions, suggestions? Contact us at [email protected] What is Meta-CATS? A unique comparative genomics analysis tool in ViPR to identify nucleotide/amino acid positions that significantly differ between two or more groups of virus sequences. How does Meta-CATS work? It runs a multiple sequence alignment, a chi-square test to identify positions that significantly differ from the random distribution of residues between all metadata groups, and a Pearson's chi-square test to identify the specific pairs of groups that contribute to the observed statistical difference. How to use Meta-CATS? Input nucleotide/amino acid sequences to Meta-CATS Divide sequences into two or more groups based on metadata (phenotype) Run Meta-CATS Option 1: Search for sequences and then input sequences to Meta-CATS http://www.viprbrc.org/ Freely available Integrated datasets Bioinformatics tool suite 1 2 3 Select sequences and add them to a working set for future analysis. You’ll need to register for a Workbench account to use this feature. Select display fields Custom-sort records Click to view details of the record 4 Let ViPR automatically group sequences by host, country, year, viral species, or virus type. On the ViPR homepage, choose a virus family to start. 1. Identify sequences to include in the Meta-CATS analysis: mouse-over the “Search Data” tab and click “Genomes” or “Genes & Proteins”. For this example, we will use genome sequences. 2. Select search criteria on the Genome Search page and click the “Search” button to run your query. 3. Select sequences from the search result page by clicking the checkboxes. Mouse-over the yellow “Run Analysis” button, and click “Metadata-driven Comparative Analysis Tool”. 
If you want to include sequences that are not in this search result, select desired sequences and click “Add to Working Set”, then add additional sequences to the same working set. Click the “Workbench” tab, find the working set you saved and click the icon next to it. On the working set details page, mouse-over “Run Analysis” and click “Metadata-driven Comparative Analysis Tool”. 4. On the next page, choose the number of groups. If you want to group your sequences by host, country, year, viral species, or virus type, you can use ViPR’s auto grouping feature by clicking the “Auto Grouping” drop-down menu and following the prompts. Otherwise, you can group sequences manually on the next page. Adjust the C-value threshold if needed. Then click “Continue”.

ViPR meta-CATS handout v.1.3 · 2 !"#$%&'()$("*('&+ %%!.*/#-.! '()$("*(&%3#(&&+!"#$%"!"#$%&'()$("*('&+!"#$%&'!"#$%&' %%!.*/#-. (!"#$%"!"##$%&'&(#)*+,-&.%/!"#"$%&"'()*+,-"#"&./'0$""

  • Upload
    others

  • View
    20

  • Download
    0

Embed Size (px)

Citation preview

Page 1: ViPR meta-CATS handout v.1.3 · 2 !"#$%&'()$("*('&+ %%!.*/#-.! '()$("*(&%3#(&&+!"#$%"!"#$%&'()$("*('&+!"#$%&'!"#$%&' %%!.*/#-. (!"#$%"!"##$%&'&(#)*+,-&.%/!"#"$%&"'()*+,-"#"&./'0$""

!"#$"%"&%"'()%*"$#+,%"&%-)"%*.--)*"+&,* !"#$

%&'&(&)*+,((

% !()/+)*0 1),-.)%2+$.* -&(&)*+,((3456478%*"$#+,*%*)9)/"):; 38%<'()*%=%64>>%/&?(9)")%-),&?)*;

% <'()0 1),-.)%2+$.*%"'()%@ -&(&)*+,((345@ABB%*"$#+,*%*)9)/"):; 3@ABB%!"$#+,*%=%@AB7%/&?(9)")%-),&?)*;

% <'()0 1),-.)%2+$.*%"'()%A -&(&)*+,((3457C6%*"$#+,*%*)9)/"):; 37C6%!"$#+,*%=%7A7%/&?(9)")%-),&?)*;

% <'()0 1),-.)%2+$.*%"'()%A<D#+9#,:5@>>B@5BC

-&(&)*+,((345@%*"$#+,*%*)9)/"):;

3@%!"$#+,%=%A%/&?(9)")%-),&?)*;

% < 1 % + %" %6 - ( *+,((

-./.01+2345-6.-7+18+390/5%.+39+-.,40:EF/9.:)%(#$"+#99'%*)G.),/):%-),&?)*

H.?(%"&%*"$#+,%+,%"#F&,&?'0 !"#$"0 IIII

%E,:0 IIII

08//.01389;.,4

<&%#::%?&,"D%"&*)#$/DJ%*))K:2#,/)%!)#$/DL("+&,*0%M&,"DN#,-)

-,<=/.+/80,1389!""!#$%&'()*+(#,(!)-.&""(!./0%("&(1()-"(2$/31$"&4$1%(4&"1%&0&/3*5&%-&)*6/"()2/1%.)$&1.%7&)(*8(/,9(#:,2&(93&"$93&)(9,",#:&(9,#,%,/9,,7*6/"()2/9,0$*;<6=,&%$9,0$*2<6=,&%$9 :

:8-1+-./.01389!"">.#()?,/@.&0,?,./$A)7),B)

:>'*+?&@A&B%%K99%%M#9)%%O)?#9)

O$&?

<&

:>'*+,C&+4D@C&

C%&#(%DC%,:(:"$*E%&#(%DC%,:(:"$*/$',)2(%D+$',)2(%D

3##"@&+-*D*"'

:8-1+,1143E51.-

'$""*/.E$%)(0()0/$%.#E"(/#(

-D#$(&+->"B)&

F,)$9GHIG*J9GHIG*KL

=D''DC&+:F'*>BG

-,<=/.+,1143E51.-

;MFK;MFN;MFI;MFO

2FB"'+1G$&

2$(03),0*7),B)%$',=$%D

%F'&D'&+0>"B'&

2345-+,1143E51.-

-"H#F''F>@+-F*&+,"*I>B'

P%Q*)%/&??#%"&%*)(#$#")%?.9"+(9)%),"$+)*REF0%M/E9$&'J%H&$-)

-D#$(&+0>((&)*F>@+,"*I>B'

P%Q*)%/&??#%"&%*)(#$#")%?.9"+(9)%),"$+)*REF0%S&?#/DJ%H#$?#,

;MF8P!?MC;56*F6/#Q;5M69!RC

0>I>B*+6-*"AG7+=>$"(D*F>@

3-8/,1389+.2.91

!"#$%"&'"()*+&!)#$/D%T&$%2+$.*%-),&?+/%*)G.),/)*%#,:%$)9#"):%+,T&$?#"+&,R%I&.%/#,%*)#$/D%T&$%"D)%UD&9)%2+$.*%T#?+9'%&$%*)#$/D%T&$%*()/+T+):%-),.*J%*()/+)*%)"/R%I&.%/#,%#9*&%T+,:%'&.$%*"$#+,%&$-),&?)%$)/&$:%+T%'&.%D#2)%+"*%+,T&$?#"+&,J%*./D%#*%*"$#+,%,#?)J%#//)**+&,R

V&?)% %W),&?)%!)#$/D

!"#$%"!EKNSV%1K<K KXKYIZE%[%\]!QKY]ZE ^LN_`EXSV \]NQ!%OKM]Y]E! VLME

Ka&."%Q* K,,&.,/)?),"* Y+,b* N)*&.$/)* !.((&$" !+-,%L."

I&.%#$)%9&--):%+,%#*%'.,RcD#,-d."*&."DU)*")$,R):.

!"#$%&'()*+,-.&/()(0(%-&(.1&2.(34%"%&5-%+$#6-&7!"'58&9&:3(;";"#<<< *))=>??@@@<;"=#0#6<+#,?0#6?;"=#A,-.+B-A%-(#6*<1+CB-)*+1DE*+<<<

F&+G&H I?FF?FF&FF>JF&2K

!"#$%&'($)*%$'+#$,'-%./%0',"1'&2 !"#$%&'($)*"$)# 34&56(74,0%89%5'$%5(0'%:%&"$+'-%;7%<5')4'&%=(1':%<+$(4,%=(1':%>',?(,@

A))'&&4",%(&)',-4,067

+),-.#/'!"**)01,

'233'*4'54$6)01'!"*' '!#7"'!"#$%&' '+480.4#3'

!"#$%"&'"()*+&,"-./0

94:$'!"."%*"3';*"<,='>?')*"<,',"."%*"3'''@''+","."%*'2..

% <'6')+%(66%./%0',"1'&

!*$#)0'A#<" !-"%)",'A#<" B"0C#06'2%%",,)40 !"D:"0%"'E"01*& +#*" F4,* B"0C#06'F4,* (4:0*$/ G4.'H/-"

3BC!99DBB8E. 3',0#'%F4$#&%B B999 G,@,"H, D=IAD C(6(7&4( 0',"14)%J=A

3K=LDBI?JI?M3DLB./EIB999 3',0#'%F4$#&%B B999 N#1(, N"1"%&(54',& ?$(O46 0',"14)%J=A

3K=LDBIPQI?M3DL..ERISRRR 3',0#'%F4$#&%B >TUEU88. S9EB8 SRRR N#1(, N"1"%&(54',& P"6"1;4( 0',"14)%J=A

3K=LDBI=MI?M3DLB.VVIB999 3',0#'%F4$#&%B WXU899E9 S9/BR B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLB.VEIB999 3',0#'%F4$#&%B WXU899ES S9ER9 B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLB.EBIB999 3',0#'%F4$#&%B WX/VV/V8 S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLB.E.IB999 3',0#'%F4$#&%B WX/VV/98 S9EER B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLB.EVIB999 3',0#'%F4$#&%B WX/VV/VV S9EEV B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBE8/IB999 3',0#'%F4$#&%B WXU89SS/ S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBE8UIB999 3',0#'%F4$#&%B WXU89SSU S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBE8RIB999 3',0#'%F4$#&%B WXU899EB S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBEE9IB999 3',0#'%F4$#&%B WXU899E. S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBEEBIB999 3',0#'%F4$#&%B WXU89SSR S9E/U B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBEE.IB999 3',0#'%F4$#&%B WXU899EV S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBEEVIB999 3',0#'%F4$#&%B WXU899E8 S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBEE8IB999 3',0#'%F4$#&%B WXU899EE S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBEEEIB999 3',0#'%F4$#&%B WXU/.U9U S9/VS B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBEU.ISRRR 3',0#'%F4$#&%B >TSRRUR8 S9E/U SRRR N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBRB.IB999 3',0#'%F4$#&%B WXURUV// S9E/U B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBI=MI?M3DLBRBVIB999 3',0#'%F4$#&%B WXURUV/U S9E/R B999 N#1(, N"1"%&(54',& =4)($(0#( 0',"14)%J=A

3K=LDBIG<I?M3DLS9VUISRRR 3',0#'%F4$#&%B KGVUB88/ S9E.R SRRR N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVB8ISRRR 3',0#'%F4$#&%B KGE//SVB S9E/U SRRR N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVBEISRRR 3',0#'%F4$#&%B KGE//SV. S9E/U SRRR N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVB/ISRRR 3',0#'%F4$#&%B KGE//SVV S9E/U SRRR N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVBUISRRR 3',0#'%F4$#&%B KGE//SV8 S9E/U SRRR N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVESIB999 3',0#'%F4$#&%B KGEU/BBB S9E/U B999 N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVEBIB999 3',0#'%F4$#&%B KGEU/BB. S9E/U B999 N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVE.IB999 3',0#'%F4$#&%B KGEU/BBV S9E/U B999 N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DLSVEVIB999 3',0#'%F4$#&%B KGEU/BB8 S9E/U B999 N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DL8RUISRRR 3',0#'%F4$#&%B KGVUB/BR S9E/U SRRR N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBIG<I?M3DL8RRISRRR 3',0#'%F4$#&%B KGVUB/.9 S9EBR SRRR N#1(, N"1"%&(54',& G<A 0',"14)%J=A

3K=LDBILKI?M3DLBRVBIB999 3',0#'%F4$#&%B WXURUVEE S9E/R B999 N#1(, N"1"%&(54',& L','O#'6( 0',"14)%J=A

3WV9V 3',0#'%F4$#&%B WCBS9BS/ S9EU8 SRRR N#1(, N"1"%&(54',& L4'+%=(1 0',"14)%J=A

3(@%A$%SVS9ER 3',0#'%F4$#&%B KWS98.UR S9/B. SRRR G,@,"H, D=IAD <','0(6 0',"14)%J=A

3(@%A$%SVS9/9 3',0#'%F4$#&%B KWS98.R9 S9/S/ SRRR G,@,"H, D=IAD <','0(6 0',"14)%J=A

I:0'20#./,),

N"1'% %>',"1'%<'($)*% %J'&#6+&

';3"0*)J/'!)<).#$'!"D:"0%",'KCE2!HL'

'20#./M"'!"D:"0%"'N#$)#*)40'K!AOL'

'2.)10'!"D:"0%",'KG!2L'

'G"*#3#*#P3$)7"0'(4<-#$#*)7"'20#./,),'H44.'

'B"0"$#*"'O&/.41"0"*)%'H$""'

!"#$%"<KAJPN%3AYA A=AZ![K%\%LM<GAZM[K ]QJ^?K=PN LMJG<%WACMZMK< NQCK

A;"#+%G& A,,"#,)'1',+& Z4,@& J'&"#$)'& <#55"$+ <40,%Q#+

!"#%($'%6"00'-%4,%(&%7#,2O*(,0_#+&"#+*H'&+'$,2'-#

!"#$%&'()*+,-.&/()(0(%-&(.1&2.(34%"%&5-%+$#6-&7!"'58&9&:3(;";"#<<< *))=>??@@@<;"=#0#6<+#,?0#6?;"=#A,-.+B-A%-(#6*<1+

C&+D&E CF?CE?CC&CF>GG&2H

!"#$%&"'( )*#+,"-./ ($0+,#%-%1*2 ($3*$/#%4$5%),-"6"62 !+6#-7#%8/ ($.$-/$%9-#$:%;7#%<=%>?@@

This project is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. HHSN272200900041C and is a collaboration between Northrop Grumman Health IT, University of Texas Southwestern Medical Center and Vecna Technologies. Virus images courtesy of CDC Public Health Image Library, Wellcome Images, U.S. Department of Veterans Affairs, Science of the Invisible and ViralZone, Swiss Institute of Bioinformatics.

!"%,$7+,D/%R$,$%0,$U"+*/.E%/$.$7#$D%C,+T%/$-,7A%,$/*.#/

#$%&'()*+&*$,*)(-

./012'(/.()*+&*$,*)(%0/3#4*4((-%%86-."26$D%ZHL)H%%H."26$D%ZHL)H%%F$V*/%%!.*/#-.

!

"""#$%&'#()'%*+,-#"""

)*+&*$,*('5%*((-F*7.$+#"D$

$&16*0(/.(70/&%)

C VALUE THRESHOLD: The C-value threshold is used as the maximum probability level for the likelihood that the position is different among the groups simply by chance.

Enter threshold value: 0.05

,?@A=@>B,CB;D

)BE>B@FB(7D?>G=@H

Metadata-driven Comparative Analysis Tool: meta-CATS will allow users of the virus-oriented websites to easily perform their own customized comparative genomics analyses in an automated fashion with minimal manual manipulation.

Using meta-CATS, users can perform a statistical analysis on sequences assigned to different groups in order to determine residues that significantly correlate with one or more metadata fields.

!"#$%&'(&)*#$+,*-&./0&1&+$23,+$4&5,$64&&

J+T$% %S$6+T$%L$-,7A% %($/*.#/% %W$#-D-#-[D,"U$6%!+T0-,-#"U$%H6-.E/"/%)++.%C+,%L$3*$67$/%IT$#-[!H)LM

!"#$%$%&%'#(L]H(!J%9H)H HFHX`Y]%a%&GL8HXGY] 4;(b1]F!J &G(8L%ZHWGXG]L J;W]

H5+*#%8/ H66+*67$T$6#/ X"6\/ ($/+*,7$/ L*00+,# L"26%;*#

+̀*%-,$%.+22$D%"6%-/%E*6N_A-62c*#/+*#AR$/#$,6N$D*

!"#$%&'()*+,-.&/()(0(%-&(.1&2.(34%"%&5-%+$#6-&7!"'58&9&:3(;";"#<<< *))=>??@@@<;"=#91-;<+#,?0#6?A,6<1+BA-)*+1C5$.:#+A/()(D"%)E<<<

F&+G&F FH?I?FF&FH>JK&2L

ViPR is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. HHSN272200900041C and is a collaboration between Northrop Grumman Health IT, University of Texas Southwestern Medical Center and Vecna Technologies. Comments, questions, suggestions? Contact us at [email protected]

What is Meta-CATS? A unique comparative genomics analysis tool in ViPR to identify nucleotide/amino acid positions that significantly differ between two or more groups of virus sequences.

How does Meta-CATS work? It runs a multiple sequence alignment, a chi-square test to identify positions that significantly differ from the random distribution of residues between all metadata groups, and a Pearson's chi-square test to identify the specific pairs of groups that contribute to the observed statistical difference.

How to use Meta-CATS? • Input nucleotide/amino acid sequences to Meta-CATS • Divide sequences into two or more groups based on metadata (phenotype) • Run Meta-CATS

Option 1: Search for sequences and then input sequences to Meta-CATS

http://www.viprbrc.org/

Freely available Integrated datasets Bioinformatics tool suite

1 2

3

Select sequences and add them to a working set for future analysis.

You’ll need to register for a Workbench account to use this feature.

• Select display fields • Custom-sort records

Click to view details of the record

4

Let ViPR automatically group sequences by host, country, year, viral species, or virus type.

On the ViPR homepage, choose a virus family to start.

1. Identify sequences to include in the Meta-CATS analysis: mouse-over the “Search Data” tab and click “Genomes” or “Genes & Proteins”. For this example, we will use genome sequences.

2. Select search criteria on the Genome Search page and click the “Search” button to run your query.

3. Select sequences from the search result page by clicking the checkboxes. Mouse-over the yellow “Run Analysis” button, and click “Metadata-driven Comparative Analysis Tool”. If you want to include sequences that are not in this search result, select desired sequences and click “Add to Working Set”, then add additional sequences to the same working set. Click the “Workbench” tab, find the working set you saved and click the icon next to it. On the working set details page, mouse-over “Run Analysis” and click “Metadata-driven Comparative Analysis Tool”.

4. On the next page, choose the number of groups. If you want to group your sequences by host, country, year, viral species, or virus type, you can use ViPR’s auto grouping feature by clicking the “Auto Grouping” drop-down menu and following the prompts. Otherwise, you can group sequences manually on the next page. Adjust the C-value threshold if needed. Then click “Continue”.

Page 2: ViPR meta-CATS handout v.1.3 · 2 !"#$%&'()$("*('&+ %%!.*/#-.! '()$("*(&%3#(&&+!"#$%"!"#$%&'()$("*('&+!"#$%&'!"#$%&' %%!.*/#-. (!"#$%"!"##$%&'&(#)*+,-&.%/!"#"$%&"'()*+,-"#"&./'0$""

2

!"#$%&"'( )*#+,"-./ ($0+,#%-%1*2 ($3*$/#%4$5%),-"6"62 !+6#-7#%8/ ($.$-/$%9-#$:%;$0%<=>%?@<<

)A"/%0,+B$7#%"/%C*6D$D%5E%#A$%F-#"+6-.%G6/#"#*#$%+C%H..$,2E%-6D%G6C$7#"+*/%9"/$-/$/%IFGJ%K%9JJ;L%*6D$,%!+6#,-7#%F+M%JJ;F?N??@@O@@@P<!%-6D%"/%-%7+..-5+,-#"+6%5$#Q$$6%F+,#A,+0R,*SS-6%J$-.#A%G)>%86"T$,/"#E%+C%)$U-/%;+*#AQ$/#$,6%V$D"7-.%!$6#$,%-6D%&$76-%)$7A6+.+2"$/M%&",*/%"S-2$/%7+*,#$/E%+C%!9!%'*5."7%J$-.#A%GS-2$%W"5,-,E>%4$..7+S$%GS-2$/>%8M;M9$0-,#S$6#%+C%&$#$,-6/%HCC-",/%>%;7"$67$%+C%#A$%G6T"/"5.$%-6D%&",-.X+6$>%;Q"//%G6/#"#*#$%+C%1"+"6C+,S-#"7/M

80.+-D%-%C".$%7+6#-"6"62%SE%/$3*$67$/

'-/#$%/$3*$67$

8/$%Q+,Y"62%/$#M

!"#$%&'()$("*('&+;$3*$67$/%7-6%-./+%5$%/$.$7#$D%C,+S% %+,%-%Q+,Y"62%/$#%"6%E+*,Q+,Y5$67AM

,-./0%&-,&'()$("*('&#.-1!2(2&&+%%86-."26$D%ZH;)H%%H."26$D%ZH;)H%%F$U*/%%!.*/#-.

!

'()$("*(&%3#(&&+%%F*7.$+#"D$%%HS"6+%H7"D%I',+#$"6L

"$/4(.&-,&5.-$#'

*&106$(&%7.('7-62)A$%![T-.*$%#A,$/A+.D%"/%*/$D%-/%#A$%89:;8<8%0,+5-5."#E%.$T$.%C+,%#A$%."Y$."A++D#A-#%#A$%0+/"#"+6%"/%D"CC$,$6#%-S+62%#A$%2,+*0/%/"S0.E%5E%7A-67$M

\6#$,%#A,$/A+.D%T-.*$:%%% @M@=

*=>?;><@*A@9B

'@C<@>D@&5B=<E;>F

!"#$%$#$&%'()"*+,-./$'$#()"+0*$123(3+4--1+S$#-[!H);%Q"..%-..+Q%*/$,/%+C%#A$%T",*/[+,"$6#$D%Q$5/"#$/%#+%$-/".E%0$,C+,S%#A$",%+Q6%7*/#+S"]$D%7+S0-,-#"T$%2$6+S"7/%-6-.E/$/%"6%-6%-*#+S-#$D%C-/A"+6%Q"#A%S"6"S-.%S-6*-.S-6"0*.-#"+6M

8/"62%S$#-[!H);>%*/$,%7-6%0$,C+,S%-%/#-#"/#"7-.%-6-.E/"/%+6%/$3*$67$/%-//"26$D%#+%D"CC$,$6#%2,+*0/%"6%+,D$,%#+%D$#$,S"6$%,$/"D*$/%#A-#%/"26"C"7-6#.E%7+,,$.-#$%Q"#A%+6$%+,%S+,$S$#-D-#-%C"$.D/M

!"#$%&'(&)*#$+,*-&./0&1&+$23,+$4&5,$64&&

J+S$% %V$#-D-#-[D,"T$6%!+S0-,-#"T$%H6-.E/"/%)++.%C+,%;$3*$67$/%IS$#-[!H);L

!"#$%";\H(!J%9H)H HFHW^X\%_%&G;8HWGX\ 4`(a1\F!J &G(8;%ZHVGWG\; J`V\

HFHW^X\%_%&G;8HWGX\

GD$6#"CE%;"S".-,%;$3*$67$/%I1WH;)L

H."26%;$3*$67$/%IV;HL

&"/*-."]$%H."26$D%;$3*$67$/

GD$6#"CE%;A+,#%'$0#"D$/%"6%',+#$"6/

R$6+S$%H66+#-#+,%IRH)8L

H6-.E]$%;$3*$67$%&-,"-#"+6%I;F'L

V$#-D-#-%;$3*$67$%H6-.E/"/

R$6$,-#$%'AE.+2$6$#"7%),$$

JG;)`(^

($#,"$T$%-6%H6-.E/"/

($#,"$T$%-%9+Q6.+-D

+̂*,%H6-.E/"/%J"/#+,E

H5+*#%8/ H66+*67$S$6#/ W"6Y/ ($/+*,7$/ ;*00+,# 4+,Y5$67A%;"26%G6

)A$%V$#-D-#-[D,"T$6%!+S0-,-#"T$%H6-.E/"/%)++.%C+,%;$3*$67$/%IS$#-[!H);L%-..+Q/*/$,/%#+%$-/".E%0$,C+,S%-%7*/#+S"]$D%-*#+S-#$D%7+S0-,-#"T$%-6-.E/"/%#+%"D$6#"CE0+/"#"+6/%"6%#A$%/$3*$67$%#A-#%/"26"C"7-6#.E%D"CC$,%5$#Q$$6%2,+*0/%+C%/$3*$67$/M

!"#$%&'()*+,-.&/()(0(%-&(.1&2.(34%"%&5-%+$#6-&7!"'58&9&:3(;";"#<<< *))=>??@@@<;"=#0#6<+#,?0#6?A,6<1+BA-)*+1CD*+@E3-(.F.=$)'(,<<<

G&+H&G GI?GJ?GG&GI>KK&2L

!"#$%&"'( )*#+,"-./ ($0+,#%-%1*2 ($3*$/#%4$5%),-"6"62 !+6#-7#%8/ ($.$-/$%9-#$:%;$0%<=>%?@<<

)A"/%0,+B$7#%"/%C*6D$D%5E%#A$%F-#"+6-.%G6/#"#*#$%+C%H..$,2E%-6D%G6C$7#"+*/%9"/$-/$/%IFGJ%K%9JJ;L%*6D$,%!+6#,-7#%F+M%JJ;F?N??@@O@@@P<!%-6D%"/%-%7+..-5+,-#"+6%5$#Q$$6%F+,#A,+0R,*SS-6%J$-.#A%G)>%86"T$,/"#E%+C%)$U-/%;+*#AQ$/#$,6%V$D"7-.%!$6#$,%-6D%&$76-%)$7A6+.+2"$/M%&",*/%"S-2$/%7+*,#$/E%+C%!9!%'*5."7%J$-.#A%GS-2$%W"5,-,E>%4$..7+S$%GS-2$/>%8M;M9$0-,#S$6#%+C%&$#$,-6/%HCC-",/%>%;7"$67$%+C%#A$%G6T"/"5.$%-6D%&",-.X+6$>%;Q"//%G6/#"#*#$%+C%1"+"6C+,S-#"7/M

Upload a file containing my sequences

Paste sequence

Use working set.

INPUT SEQUENCES: Sequences can also be selected from search results or a working set in your workbench.

Z".$%'-#A:!"#$%&'

The minimum number of sequences is 2.

;$3*$67$%H//"26S$6#%#+%R,+*0/:!"#$%&'

,-.&/&012345678179:7&,;'%;&<427=&>-1&0/>&1?2-/@&/&A:6B&C-.&D26ED26DF<427&3-&/13-0/34:/22>&/664G9&678179:76&3-&G.-1?6A&(/:H&.-I&6H-12@&J7-<&<-.0/3&K678179:7!LM=KG.-1?&NMA

,OPQ;%&O,&'()$("*('&#POR!L(L&&+%%86-."26$D%ZH;)H%%H."26$D%ZH;)H%%F$U*/%%!.*/#-.

(

'()$("*(&%S#(&&+%%F*7.$+#"D$%%HS"6+%H7"D%I',+#$"6L

"$QT(P&O,&UPO$#'

*&R;V$(&%WP('WOVL)A$%![T-.*$%#A,$/A+.D%"/%*/$D%-/%#A$%0/D4010%0,+5-5."#E%.$T$.%C+,%#A$%."Y$."A++D#A-#%#A$%0+/"#"+6%"/%D"CC$,$6#%-S+62%#A$%2,+*0/%/"S0.E%5E%7A-67$M

\6#$,%#A,$/A+.D%T-.*$:%%% @M@=

*-934917*27/.

'78179:7&U.-1?49G

!"#$%$#$&%'()"*+,-./$'$#()"+0*$123(3+4--1+S$#-[!H);%Q"..%-..+Q%*/$,/%+C%#A$%T",*/[+,"$6#$D%Q$5/"#$/%#+%$-/".E%0$,C+,S%#A$",%+Q6%7*/#+S"]$D%7+S0-,-#"T$%2$6+S"7/%-6-.E/$/%"6%-6%-*#+S-#$D%C-/A"+6%Q"#A%S"6"S-.%S-6*-.S-6"0*.-#"+6M

8/"62%S$#-[!H);>%*/$,%7-6%0$,C+,S%-%/#-#"/#"7-.%-6-.E/"/%+6%/$3*$67$/%-//"26$D%#+%D"CC$,$6#%2,+*0/%"6%+,D$,%#+%D$#$,S"6$%,$/"D*$/%#A-#%/"26"C"7-6#.E%7+,,$.-#$%Q"#A%+6$%+,%S+,$S$#-D-#-%C"$.D/M

!"#$%&'(&)*#$+,*-&./0&1&+$23,+$4&5,$64&&

J+S$% %V$#-D-#-[D,"T$6%!+S0-,-#"T$%H6-.E/"/%)++.%C+,%;$3*$67$/%IS$#-[!H);L

!"#$%";\H(!J%9H)H HFHW^X\%_%&G;8HWGX\ 4`(a1\F!J &G(8;%ZHVGWG\; J`V\

H5+*#%8/ H66+*67$S$6#/ W"6Y/ ($/+*,7$/ ;*00+,# ;"26%`*#

+̂*%-,$%.+22$D%"6%-/%E*6M]A-62b*#/+*#AQ$/#$,6M$D*

!"#$%&'()*+,-.&/()(0(%-&(.1&2.(34%"%&5-%+$#6-&7!"'58&9&:3(;";"#<<< *))=>??@@@<;"=#0#6<+#,?0#6?A,6<1+BA-)*+1CD*+@E3-(.F.=$)'(,<<<

G&+H&G I?JI?GG&K>LG&'M

!"#$%&"'( )*#+,"-./ ($0+,#%-%1*2 ($3*$/#%4$5%),-"6"62 !+6#-7#%8/ ($.$-/$%9-#$:%;*.%<=>%?@<<

)A"/%0,+B$7#%"/%C*6D$D%5E%#A$%F-#"+6-.%G6/#"#*#$%+C%H..$,2E%-6D%G6C$7#"+*/%9"/$-/$/%IFGJ%K%9JJLM%*6D$,%!+6#,-7#%F+N%JJLF?O??@@P@@@Q<!%-6D%"/%-%7+..-5+,-#"+6%5$#R$$6%F+,#A,+0S,*TT-6%J$-.#A%G)>%86"U$,/"#E%+C%)$V-/%L+*#AR$/#$,6%W$D"7-.%!$6#$,%-6D%&$76-%)$7A6+.+2"$/N%&",*/%"T-2$/%7+*,#$/E%+C%!9!%'*5."7%J$-.#A%GT-2$%X"5,-,E>%4$..7+T$%GT-2$/>%8NLN9$0-,#T$6#%+C%&$#$,-6/%HCC-",/%>%L7"$67$%+C%#A$%G6U"/"5.$%-6D%&",-.Y+6$>%LR"//%G6/#"#*#$%+C%1"+"6C+,T-#"7/N

80.+-D%-%C".$%7+6#-"6"62%TE%/$3*$67$/%"6%ZHL)H %+,%'AE."0C+,T-#N

'-/#$%/$3*$67$%"6%ZHL)H %+,%'AE."0%C+,T-#N9$C."6$%"6%E+*,%ZHL)H%C".$%R"..%5$%*/$D%#+%.-5$.%#A$%D"/0.-E

8/$%R+,["62%/$#N

!"##$%&'&(#)*+,-&.%/

0122&3242150674

%\*"7[%),$$%!*/#+T%),$$%IG%R-6#%#+%/$#%TE%+R6%0-,-T$#$,/M

.28924!2&0:;2&&<

%F*7.$+#"D$%HT"6+%H7"D%I',+#$"6M

.791!2&7=&.28924!2.&07&>2&545?:@2A&&<L$3*$67$/%7-6%-./+%5$%/$.$7#$D%C,+T%/$-,7A%,$/*.#/%+,%-%R+,["62%/$#%"6%E+*,R+,[5$67AN

?5>2?6439$C."6$%"6%E+*,%ZHL)H%C".$%R"..%5$%*/$D%#+%.-5$.%#A$%D"/0.-E

=71B50&7=&.28924!2.&;17C6A2A&&<

%86-."26$D%ZHL)H%H."26$D%ZHL)H%'AE."0%I"6#$,.$-U$DM

>D+EF&0)%%!E%')

!"#"$%&"'()*+,-"#"&./'0$""')A$%]\*"7[%),$$]%+0#"+6%*/$/%#A$%Z-/#W^%_%% `N%%%)A"/%-.2+,"#AT%*/$/%-%C-/#>%D"/#-67$a5-/$D-00,+-7A%-6D%"/%2++D%C+,%2$6$,-#"62%#,$$/%C,+T%D-#-/$#/%7+6#-"6"62%<M%T+,$%#A-6%<>@@@%/$3*$67$/%+C%/A+,#%+,%T$D"*T%.$62#A%/$3*$67$/>%?M%T+,$%#A-6%<@@%U$,E%.+62%/$3*$67$/>+,%bM%#+%,$7+6/#,*7#%-%]3*"7[%-6D%D",#E]%#,$$N)A$%]!*/#+T%),$$]%+0#"+6%"67+,0+,-#$/%'AEWX%_%%% %%`%#+%"6C$,%-%T+,$%$U+.*#"+6-,".Ea-77*,-#$%0AE.+2$6$#"7%#+0+.+2E5E%-00.E"62%-%/*5/#"#*#"+6%T+D$.%#+%#A$%6*7.$+#"D$%/$3*$67$/N%)A"/%-.2+,"#AT%"/%5$/#%-00."$D%#+%D-#-/$#/%7+6#-"6"62%<M%C$R$,%#A-6%<@@%U$,E%.+62%/$3*$67$/>%?M%5$#R$$6%<@@%-6D<>@@@%/T-..%+,%T$D"*T%.$62#A%/$3*$67$/N%%I!"#$%&'(&)*#$+,*-&./

J+T$% %S$6$,-#$%'AE.+2$6$#"7%),$$

!"#$%$%&%'#(L^H(!J%9H)H

H5+*#%8/ H66+*67$T$6#/ X"6[/ ($/+*,7$/ L*00+,# L"26%c*#

d+*%-,$%.+22$D%"6%-/%E*6NeA-62f*#/+*#AR$/#$,6N$D*

!',G%E .%E%G/

1),,2"'3,$4.#-'5"&

4'H% 0IJ% 4DHK%)&#L.%MD%,G%$

A'/%

9$62*$?g2$6+T$gA*T-6a<PPPa?@@@

S$6+T$ b? @=K@hK?@<<%b:bO'W

9^F&<aQgPPa@@gA*T-6gS$6+T$/ S$6+T$ =? @iK?QK?@<<%<@:QbHW

A$0-#"#"/%7 S$6+T$ < @bK?PK?@<<%<<:<@HW

!"#$%&'()*+,-.&/()(0(%-&(.1&2.(34%"%&5-%+$#6-&7!"'58&9&:3(;";"#<<< *))=>??@@@<;"=#0#6<+#,?0#6?)#--<1+AB-)*+1CD*+@E3-(.F.=$)'(,-<<<

G&+H&G I?GG?GG&GJ>JI&'K

Option 2: Use a working set or upload your own sequences and then run Meta-CATS

1. Mouse-over the “Analyze & Visualize” tab and click “Metadata Sequence Analysis”.

2. On the Meta-CATS tool landing page, input your sequences using one of the three options:

2.1 Upload a sequence file and a sequence assignment file.

2.2 Paste sequences in FASTA format.

2.3 Use one or more working sets from your Workbench.

3. Choose the format of sequences provided and sequence type.

4. Choose the number of groups. Adjust the C-value threshold if needed. Then click “Continue”.

2

2.1

Three options to input sequences

2.3

Divide sequences into groups based on metadata (phenotype) and run Meta-CATS

Choose the format of sequences

http://www.viprbrc.org/

Freely available Integrated datasets Bioinformatics tool suite

ViPR is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. HHSN272200900041C and is a collaboration between Northrop Grumman Health IT, University of Texas Southwestern Medical Center and Vecna Technologies. Comments, questions, suggestions? Contact us at [email protected]

1

!"#$%&"'( )*#+,"-./ ($0+,#%-%1*2 ($3*$/#%4$5%),-"6"62 !+6#-7#%8/ ($.$-/$%9-#$:%;*.%<=>%?@<<

)A"/%0,+B$7#%"/%C*6D$D%5E%#A$%F-#"+6-.%G6/#"#*#$%+C%H..$,2E%-6D%G6C$7#"+*/%9"/$-/$/%IFGJ%K%9JJLM%*6D$,%!+6#,-7#%F+N%JJLF?O??@@P@@@Q<!%-6D%"/%-%7+..-5+,-#"+6%5$#R$$6%F+,#A,+0S,*TT-6%J$-.#A%G)>%86"U$,/"#E%+C%)$V-/%L+*#AR$/#$,6%W$D"7-.%!$6#$,%-6D%&$76-%)$7A6+.+2"$/N%&",*/%"T-2$/%7+*,#$/E%+C%!9!%'*5."7%J$-.#A%GT-2$%X"5,-,E>%4$..7+T$%GT-2$/>%8NLN9$0-,#T$6#%+C%&$#$,-6/%HCC-",/%>%L7"$67$%+C%#A$%G6U"/"5.$%-6D%&",-.Y+6$>%LR"//%G6/#"#*#$%+C%1"+"6C+,T-#"7/N

80.+-D%-%C".$%7+6#-"6"62%TE%/$3*$67$/%"6%ZHL)H %+,%'AE."0C+,T-#N

'-/#$%/$3*$67$%"6%ZHL)H %+,%'AE."0%C+,T-#N9$C."6$%"6%E+*,%ZHL)H%C".$%R"..%5$%*/$D%#+%.-5$.%#A$%D"/0.-E

8/$%R+,["62%/$#N

!"##$%#&#"'!()&

%\*"7[%),$$%!*/#+T%),$$%IG%R-6#%#+%/$#%TE%+R6%0-,-T$#$,/M

*#+,#&-#$!./#$$0

%F*7.$+#"D$%HT"6+%H7"D%I',+#$"6M

*),"-#$)1$*#+,#&-#*$!)$2#$'&'3.4#5$$0L$3*$67$/%7-6%-./+%5$%/$.$7#$D%C,+T%/$-,7A%,$/*.#/%+,%-%R+,["62%/$#%"6%E+*,R+,[5$67AN

!"#$%&'())*+,-."/0123$450"65781.62749:;<+=>?=>@4<;+A*B=+))),C6#DEF5$+,GH2D$G63/0IJIIIKIJIKILLJLLLKIKKKIKJLIIKJLJIIJKLIKLLJLIIJIKLLLLLLKILLIKIKIKJIKILJLJLKILKIILIIJJIIJKIIIIIIKKJKIKIIKLIJKJJLLLJIILILKJLKIIIJKJKIKIKIIIJJKJKLKLJIIJLKLKJIIJIKJLKIJIIIKIKILLJLJI

%

3'2#3(&%9$C."6$%"6%E+*,%ZHL)H%C".$%R"..%5$%*/$D%#+%.-5$.%#A$%D"/0.-E

1)"6'!$)1$*#+,#&-#*$/")7(5#5$$0

%86-."26$D%ZHL)H%H."26$D%ZHL)H%'AE."0%I"6#$,.$-U$DM

!"##$'3%)"(!86

%'J]WX%(H^WX

(*6%',+#)$/#%C+,%,$7+TT$6D-#"+6%+C%$U+.*#"+6-,E%T+D$.#A-#%5$/#%C"#/%TE%D-#-

G%[6+R%RA"7A%$U+.*#"+6-,E%T+D$.%G%R-6#%#+%*/$N

!"#

/9:;:9<=:>$(>?@9=@>< @N@

&ABCD9$:E$F@<DG:9=DH < %G6#$2$,%C,+T%<%#+%?@%+,%*/$%D$C-*.#%U-.*$

*I@;D$;@9@BD<D9 <N@ %'+/"#"U$%,$-.%U-.*$%+,%*/$%D$C-*.#%U-.*$

)A<G9:A;$J:;<=:>@KL

/'"'6#!#"*$1)"$/8.3)%#&#!(-$'&'3.*(*

EVOLUTIONARY MODEL (Substitution DNA)

All models are optimized using the maximum likelihood criterion. We have set default values for 1-7 parameters for each model.

Real value between 0.00 and 1.00 or use default value. The models implemented here allow you to specify that a proportion of the sites never vary.

%'66'$"'!#$7'"('!()&

Specify the defline of the uploaded/pasted sequences to build the tree

Build Tree Clear

Generate Phylogenetic Tree The "Quick Tree" option uses the FastME [Desper, R., Gascuel, O. (2002) Journal of Computational Biology 19(5), pp. 687-705]. This algorithm uses a fast, distance-based approach and is good for generating trees from datasets containing 1) more than 1,000 sequences of short or medium length sequences, 2) more than 100 very long sequences, or 3) to reconstruct a "quick and dirty" tree. The "Custom Tree" option incorporates PhyML [Guindon, S. and Gascuel, O., (2003) Syst Biol. 52: 696-704] to infer a more evolutionarily-accurate phylogenetic topology by applying a substitution model to the nucleotide sequences. This algorithm is best applied to datasets containing 1) fewer than 100 very long sequences, 2) between 100 and 1,000 small or medium length sequences. (SOP) Note: An asterisk (*) = required field

Home   Generate Phylogenetic Tree

!"#$%$%&%'#(LbH(!J%9H)H HFHX]Yb%i%&GL8HXGYb 4d(j1bF!J &G(8L%ZHWGXGbL JdWb

About Us Announcements Links Resources Support Sign Out

]+*%-,$%.+22$D%"6%-/%E*6N_A-62k*#/+*#AR$/#$,6N$D*

Virus Pathogen Database and Analysis Resource (ViPR) - Flaviviri... http://www.viprbrc.org/brc/tree.do?method=ShowCleanInputPage...

G&+H&G I?GG?GG&GJ>KL&'M

2.2

Loading Virus Pathogen Database and Analysis Resource (ViPR)...

;%.0()%-6 <+."*%#4, 60="*.(#(>+' 60?+0,.(@02(<*#%&%&' ;"&.#7.(A, 6040#,0(1#.0B(C+4(DEF(GHDD

</%,(=*"I07.(%,(J+&$0$(25(./0(K#.%"&#4(L&,.%.+.0("J(3440*'5(#&$(L&J07.%"+,(1%,0#,0,(8KLM(N(1MMO9(+&$0*(;"&.*#7.(K":(MMOKGPGGHHQHHHRD;(#&$(%,(#(7"44#2"*#.%"&(20.S00&(K"*./*"=T*+UU#&(M0#4./(L<F(A&%V0*,%.5("J(<0W#,(O"+./S0,.0*&(X0$%7#4(;0&.0*(#&$()07&#(<07/&"4"'%0,:()%*+,(%U#'0,(7"+*.0,5("J(;1;(-+24%7(M0#4./(LU#'0(!%2*#*5F(@0447"U0(LU#'0,F(A:O:10=#*.U0&.("J()0.0*#&,(3JJ#%*,(F(O7%0&70("J(./0(L&V%,%240(#&$()%*#4Y"&0F(OS%,,(L&,.%.+.0("J(>%"%&J"*U#.%7,:

3$$(Z(60U"V0

3$$(Z(60U"V0

!"#$%&'(

)*+,-.+/0-12-/3453,$3/T0&2#&[(#770,,%"&B\A]PPDR^(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)DRG]NDQQQ(Z(1#.0BDQQQ(Z(;"+&.*5BAO3(Z(M",.BM+U#&T0&2#&[(#770,,%"&B\A]EPGGG(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)DR]DNGHHH(Z(1#.0BGHHH(Z(;"+&.*5BAO3(Z(M",.BM+U#&T0&2#&[(#770,,%"&B\AREGPGQ(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)`QENDQQQ(Z(1#.0BDQQQ(Z(;"+&.*5BAO3(Z(M",.BM+U#&T0&2#&[(#770,,%"&B\A]PPDRR(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)DRGPNDQQQ(Z(1#.0BDQQQ(Z(;"+&.*5BAO3(Z(M",.BM+U#&T0&2#&[(#770,,%"&B\A]EPGG^(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)DR]GNGHHH(Z(1#.0BGHHH(Z(;"+&.*5BAO3(Z(M",.BM+U#&T0&2#&[(#770,,%"&B\AREGP^H(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)`QQNDQQQ(Z(1#.0BDQQQ(Z(;"+&.*5BAO3(Z(M",.BM+U#&

.+/0-12-/3453,$3/-6!157-8

T0&2#&[(#770,,%"&B\A]PPDRG(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)DRG`NDQQQ(Z(1#.0BDQQQ(Z(;"+&.*5BAO3(Z(M",.BM+U#&T0&2#&[(#770,,%"&B\A]PPDR`(Z(O.*#%&(&#U0B1\K)_GNAON>L1_)DRGENDQQQ(Z(1#.0BDQQQ(Z(;"+&.*5BAO3(Z(M",.BM+U#&T0&2#&[(#770,,%"&BaCPRRPR`(Z(O.*#%&(&#U0B1\K)_GNKLN>L1_)G^]GNGHHH(Z(1#.0BGHHH(Z(;"+&.*5BK%7#*#'+#(Z(M",.BM+U#&T0&2#&[(#770,,%"&BaCE`HH]`(Z(O.*#%&(&#U0B1\K)_GNKLN>L1_)G]]RNGHHH(Z(1#.0BGHHH(Z(;"+&.*5BK%7#*#'+#(Z(M",.BM+U#&T0&2#&[(#770,,%"&BaCEQERPP(Z(O.*#%&(&#U0B1\K)_GNKLN>L1_)GQG^NGHHH(Z(1#.0BGHHH(Z(;"+&.*5BK%7#*#'+#(Z(M",.BM+U#&T0&2#&[(#770,,%"&BTbDQQEQ`(Z(O.*#%&(&#U0B1\K)_GNKLN>L1_)G]E^NDQQQ(Z(1#.0BDQQQ(Z(;"+&.*5BK%7#*#'+#(Z(M",.BM+U#&

.+/0-12-/3453,$3/-6!157-9

Metadata-driven Comparative Genomics Analysis Tool - Setup Subset: Double click on the Genomes to select them, then add them to their groups by clicking on "Add". "Remove" will send the selected Genomes back to the main list. You can also drag the genomes to their groups.

Home   Metadata-Driven Comparative Genomics Analysis

!"#$%$%&%'#(O\36;M(13<3 3K3!dY\(e()LOA3!LY\ @f6g>\K;M )L6AO(a3XL!L\O MfX\

About Us Announcements Links Resources Support Sign Out

d"+(#*0(4"''0$(%&(#,(5+&:h/#&'i+.,"+./S0,.0*&:0$+

Virus Pathogen Database and Analysis Resource (ViPR) - Flaviviri... http://www.viprbrc.org/brc/mgc.do

B&+C&B D?BE?BB&BE>FD&'G

3

Double click the desired strains, and then click “Add” to add

them to a group.

4

5

!"#$%&"'( )*#+,"-./ ($0+,#%-%1*2 ($3*$/#%4$5%),-"6"62 !+6#-7#%8/ ($.$-/$%9-#$:%;$0%<=>%?@<<

This project is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. HHSN272200900041C and is a collaboration between Northrop Grumman Health IT, University of Texas Southwestern Medical Center and Vecna Technologies. Virus images courtesy of CDC Public Health Image Library, Wellcome Images, U.S. Department of Veterans Affairs, Science of the Invisible and ViralZone, Swiss Institute of Bioinformatics.

%

9$62*$?Y#Q+Y7.-D$/ !"#$%&'%(')*+$,-.

E*6MZA-62[*#/+*#AQ$/#$,6M$D* /$01$2&%3'&454-"&4',

Processing... Data is still processing. Results will be shown when ready.

6789:6%3;<=:/GC%E+*%D+%6+#%Q-6#%#+%Q-"#%C+,%#A$%,$/*.#/>%*/$%E+*,%#"7\$#%6*S5$,%I%VR]^=_@?=O^=^P`%L%#+%7+S$%5-7\%#+%#A$%($#,"$T$%($/*.#/%5E%)"7\$#%F*S5$,%0-2$%-#%-%.-#$,%#"S$-6D%,$#,"$T$%E+*,%,$/*.#/M

SAVE ANALYSIS TO WORKBENCH: Enter the name you want to use and click Save to Workbench if you want to save the analysis when the results are ready.

NOTIFICATION OF COMPLETION: Enter your email and click Request Notification if you want to receive a notification when the results are ready.

Home   My Workbench   Working...   Metadata-driven Comparative Analysis Tool for Sequences (meta-CATS)   Processing...

!"#$%$%&%'#(;aH(!J%9H)H HFHWbXa%c%&G;8HWGXa 4d(e1aF!J &G(8;%fHVGWGa; JdVa

About Us Announcements Links Resources Support Sign Out

b+*%-,$%.+22$D%"6%-/%E*6MZA-62[*#/+*#AQ$/#$,6M$D*

Virus Pathogen Database and Analysis Resource (ViPR) - Flaviviri... http://www.viprbrc.org/brc/mgc.do

B&+C&B BD?E?BB&E>EF&'G

6

!"#$%&'()*+#+%,-$(#)+

Analysis Detail - Dengue2-human-1999-2000-two-clades

Download Input   Generate Phylogenetic Tree   Show P-values Bar Plot

9*+#8#+#,8:';*"(<61=#:#+';*(!"#$%&'&(>*=6:+(?@'7A*+B(9CD2E2FGE/4H/FFI

The Metadata-driven Comparative Analysis Tool consists of three parts: a multiple sequence alignment (using MUSCLE), a chi-square goodness of fit test to identify positions

(columns) of the multiple sequence alignment that significantly differ from the expected (random) distribution of residues between all metadata groups, and a Pearson's

chi-square test to identify the specific pairs of metadata groups that contribute to the observed statistical difference.

I"#-$J$/*$0/*#$;*/915$'*#$+-639(#($+-$&"#$'-'345+5B$&"#$.),'39#$7*/0$&"#$K//(-#55$/7$L+&$&#5&$E+33$+(#-&+74$6/390-5$"',+-;$5+;-+7+6'-&$,'*+'&+/-$D#&E##-$'33$;*/915B$E"+3#$&"#

Pearson's test will identify the specific pair(s) of groups that make the column significant (i.e. if those groups were not included in the analysis, the column would no longer be

identified as significant).

>6#;+?2(4-%3.."'-++%.@%A#$%9-+$%B-+2)$

!"#*#$'*#$NOP$1/5+&+/-5$&"'&$"',#$'$5+;-+7+6'-&$-/-)*'-(/0$(+5&*+D9&+/-$D#&E##-$&"#$51#6+7+#($;*/915H

5.+#$#.' >6#;+?2(4-%<()2- >;C()2- ,-74--%A4--".D

QQ RJHSJT PHPPTSJU U

VQ RNHTTT PHPPQRUQ J

NPJ JPHVVN SHQJU@)T J

NTS JPHVVU SHQNU@)T J

JRU RSHOT JHRVV@)U J

JNP VHOUN PHPNRST J

JJN NNHOJV UHSPN@)Q J

JVO NOHSJQ OHJTQ@)O J

URO JPHVVU SHQNU@)T J

UUP JPHVVU SHQNU@)T J

UTJ JPHVVU SHQNU@)T J

QNU NOHSJQ OHJTQ@)O J

QSU JPHVVU SHQNU@)T J

QVJ JPHVVU SHQNU@)T J

TPU JPHVVU SHQNU@)T J

TNN NOHONT THPUV@)O J

STV RSHVSU NHTQQ@)U J

SSU RQHONR PHPPRJQO J

SVP RSHVSU NHTQQ@)U J

VPN NOHOQT OHVUO@)O J

VNO JPHVVN SHQJU@)T J

VTT NOHONT THPUV@)O J

RPJR RVHROR NHQJN@)U J

RRNR NJHJOV JHJSN@)Q J

RRJO JPHVVN SHQJU@)T J

RNQP RQHTUJ PHPPRNS J

RNON RQHONR PHPPRJQO J

RNTT JPHVVU SHQNU@)T J

RJRN JPHVVU SHQNU@)T J

RJNJ JPHVVU SHQNU@)T J

RJVR JPHVVU SHQNU@)T J

RUPO NOHONT THPUV@)O J

RUOJ NNHOJV UHSPN@)Q J

RQJQ NOHONT THPUV@)O J

Home   My Workbench   Analysis (Dengue2-human-1999-2000-two-clades)

!"#$%$%&%'#(>@2Y.W$X2!2 2Z2?[\@$]$^_>=2?_\@ I`[email protected] ^_Y=>$L2%_?_@> W`%@

About Us Announcements Links Resources Support Sign Out

[/9$'*#$3/;;#($+-$'5$49-Hc"'-;d9&5/9&"E#5&#*-H#(9

!"#$%&'()*+,-.&/()(0(%-&(.1&2.(34%"%&5-%+$#6-&7!"'58&9&:3(;";"#<<< *))=>??@@@<;"=#0#6<+#,?0#6?A,6<1+B(.(34%"%C1DEEFGHI)"6J-)K$A<<<

E&+L&EH M?NH?EE&EE>NF&2O

7

5. Divide sequences into groups based on scientific knowledge: double click the desired sequences and then click “Add” to add them to their respective groups. When finished, click “Run”.

6. The analysis may take a few minutes to run. While the analysis is running, you can choose to save the analysis (upon completion) to your Workbench by entering a name for the analysis and then clicking the “Save to Workbench” button. Then you can move to other parts of the ViPR site, and retrieve the analysis results later from your Workbench.

7. The Meta-CATS report includes: • Chi-square Goodness of fit test result:

positions that have significant non-random distribution between the specified groups.

• Pearson’s Chi-square Pairwise Comparison Report: positions that significantly differ between the groups.

• Save the analysis to your Workbench if needed. You can also share the analysis with collaborators.