Multiple Sequence Alignment (MSA) · 2020-04-20 · Freely available Integrated datasets...
Transcript of Multiple Sequence Alignment (MSA) · 2020-04-20 · Freely available Integrated datasets...
http://www.fludb.org/
Freely available Integrated datasets Bioinformatics tool suite Platform for influenza data submission
IRD is funded by the National Institute of Allergy and Infectious Diseases (NIH/DHHS) under Contract No. HHSN266200400041C and is a collaboration between Northrop Grumman Health IT, University of Texas Southwestern Medical Center , Vecna Technologies, SAGE Analytica and Los Alamos National Laboratory. Comments, questions, suggestions? Contact us at [email protected]
Multiple Sequence Alignment (MSA)
Option 1: Search for sequences and then align sequences
Choose sequences for alignment Run the alignment
Customize the alignment based on
your need
!"#$%&'( )*#+,"-./ 0.+//-,1%+2%)$,3/ '$4+,#%-%5*6 '$7*$/#%8$9%),-":":6 !+:#-;#%</ '$.$-/$%(-#$=%>*.%?@A%BC??
)D"/%4,+E$;#%"/%2*:F$F%91%#D$%G-#"+:-.%&:/#"#*#$%+2%H..$,61%-:F%&:2$;#"+*/%("/$-/$/%IG&J%K%(JJLM%*:F$,%!+:#,-;#%G+N%JJLGBOOBCCPCCCP?!%-:F%"/%-%;+..-9+,-#"+:%9$#Q$$:%G+,#D,+40,*33-:%J$-.#D%&)A%<:"R$,/"#1%+2%)$S-/%L+*#DQ$/#$,:%T$F";-.%!$:#$,%A%U$;:-%)$;D:+.+6"$/A%LH0V%H:-.1#";-%-:F%W+/%H.-3+/%G-#"+:-.%W-9+,-#+,1N
!"#"$#%$&'#(&)%L$63$:#%K%G*;.$+#"F$
%X,+#$":
%L#,-":
*+&(,$#-.'H
5
!
,(/$#-.'
Y%</$%;+33-%#+%/$4-,-#$%3*.#"4.$$:#,"$/N%VS=%J?G?A%JZA%J[GBN
,#&"+)$)"0'
Y%</$%;+33-%#+%/$4-,-#$%3*.#"4.$$:#,"$/NVS=%HK;D";\$:K&/,-$.K?C]]KBCC@AHK;D";\$:KW-+/K?OKBCC@N
!+34.$#$%0$:+3$%^:.1^:.1%":;.*F$%/$63$:#/%Q"#D%D"6DF$6,$$%+2%/"3".-,"#1%#+%BCC_4J?G?%/$7*$:;$/%IL^XM
,'1'2#$,'30')#,!""#$%&''$%&#($%!)$*!+$,%-$,!.$/%0$,1
!"#'$&")3'`,+3=% aaaa )+=% aaaa)+%-FF%3+:#D%#+%/$-,;DA%/$$HFR-:;$%^4#"+:/=%T+:#D%'-:6$
4%,#!""!2345&"67$8"9:4;<":=<<>4=:32<>?6@?6;<A>3B$:4>C523D65;<5>8<DD<>*6DA<*E;45F4GF4D@<$:4>/EAHD4>I>=<D%3H
3'%3&".4+2$3&%(.+)3!""!JD3B4!A34CED6K<,6D>=$!;<D3B4IB<45341 =$! 3
2%()#&-!J@=453A>45!"@<D34!D@<5>354!EA>D4"34!EA>D34!L<DG43M45&4=D435& " N =
"!*")2'!$%.#+%),,567892:567
!"#$%!&%'()(*+%,-)+"#)(%&.%/('()(*+0%1+.)2*)"*3%45"6/&7'8%&.%1,/2*)"*3%49:*;<8%LD+Q%H..
!"#$%&'()%*+%,"%-#%*+%./#0*L$-,;D%2+,%":2.*$:b-%/$7*$:;$/A%4,+#$":/A%-:F%/#,-":/%*/":6%#Q+%#14$/%+2%/$-,;D$/N%</$%#D$%-FR-:;$F%/$-,;D%#+%-..+Q%1+*%#+%,$2":$%1+*,%/$-,;D%Q"#D%#D$%3+,$%2":$%6,-":$F%/$-,;DA-:F%1+*%;-:%4";\%1+*,%R"$Q":6%+4#"+:/N
J+3$% %G*;.$+#"F$%L$7*$:;$%L$-,;D
LVH'!J%(H)H HGHWacV%d%U&L<HW&cV 8^'e5VG!J L<5T&)%(H)H J^TV
f<&!e%LVH'!J
f*";\%L$-,;D
LVH'!J%`^'%^'%`&G(
G*;.$+#"F$%L$7*$:;$/
X,+#$":%L$7*$:;$/
L#,-":%(-#-
&33*:$%V4"#+4$/
[(%X,+#$":%L#,*;#*,$/
XD$:+#14$%!D-,-;#$,"/#";/
H:"3-.%L*,R$"..-:;$%(-#-
!+34-,$%L*9#14$/%":%L*,R$"..-:;$
L*33-,1%+2%HR"-:%L*,R$"..-:;$
J*3-:%L*,R$"..-:;$%L#*F"$/
L$7*$:;$%`$-#*,$%U-,"-:#%)14$/
X!'%X,"3$,%X,+9$%(-#-
W-9+,-#+,1%VS4$,"3$:#/%I9$#-M
U",*/%XD$:+#14$%L*93"//"+:/%I9$#-M
8J^%&:2.*$:b-%U-;;":$%L#,-":/
LVH'!J%J&L)^'a
'$#,"$R$%-%(+Q:.+-F
a+*,%L$-,;D%J"/#+,1
H9+*#%</ !+33*:"#1 H::+*:;$3$:#/ W":\/ '$/+*,;$/ L*44+,# L"6:%^*#
a+*%-,$%.+66$F%":%-/%1*:NbD-:6g*#/+*#DQ$/#$,:N$F*
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1$2#$"+$'1$&*+, ,..34556667!#8/79*:5/*+5;"!#$"%&<)$2#$"+$<)$&*+,<)$:=$".<8;)777
>'9?'> @5AB5>>'C4A>'DE
1
!"#$%&'( )*#+,"-./ 0.+//-,1%+2%)$,3/ '$4+,#%-%5*6 '$7*$/#%8$9%),-":":6 !+:#-;#%</ '$.$-/$%(-#$=%>*.%?@A%BC??
)D"/%4,+E$;#%"/%2*:F$F%91%#D$%G-#"+:-.%&:/#"#*#$%+2%H..$,61%-:F%&:2$;#"+*/%("/$-/$/%IG&J%K%(JJLM%*:F$,%!+:#,-;#%G+N%JJLGBOOBCCPCCCP?!%-:F%"/%-%;+..-9+,-#"+:%9$#Q$$:%G+,#D,+40,*33-:%J$-.#D%&)A%<:"R$,/"#1%+2%)$S-/%L+*#DQ$/#$,:%T$F";-.%!$:#$,%A%U$;:-%)$;D:+.+6"$/A%LH0V%H:-.1#";-%-:F%W+/%H.-3+/%G-#"+:-.%W-9+,-#+,1N
!"#"$#%$&'#(&)%L$63$:#%K%G*;.$+#"F$
%X,+#$":
%L#,-":
*+&(,$#-.'H
5
!
,(/$#-.'J?G?
Y%</$%;+33-%#+%/$4-,-#$%3*.#"4.$$:#,"$/N%VS=%J?G?A%JZA%J[GBN
,#&"+)$)"0'
Y%</$%;+33-%#+%/$4-,-#$%3*.#"4.$$:#,"$/NVS=%HK;D";\$:K&/,-$.K?C]]KBCC@AHK;D";\$:KW-+/K?OKBCC@N
!+34.$#$%0$:+3$%^:.1^:.1%":;.*F$%/$63$:#/%Q"#D%D"6DF$6,$$%+2%/"3".-,"#1%#+%BCC_4J?G?%/$7*$:;$/%IL^XM
,'1'2#$,'30')#,!""#$%&''$%&#($%!)$*!+$,%-$,!.$/%0$,1
!"#'$&")3'`,+3=% aaaa )+=% aaaa)+%-FF%3+:#D%#+%/$-,;DA%/$$HFR-:;$%^4#"+:/=%T+:#D%'-:6$
4%,#2345678978:5;63<$2=6>?43@8?:5?6A5@@56*8@;5*B:=?C=DC=@95$2=6/B;E@=6F6G5@%3E=%"=65=B$%3E=H=<<88?$789H5=;;8@6=?615=$/=::="1I3?5
3'%3&".4+2$3&%(.+)3!""!J@3<=!;3=>B@8K5,8@6G$!:5@3<=F<5=?3=1 G$! 3
2%()#&-L=:=3<=/5M3<8/8?6;5@@=6,3<=@=9B=%=?=:=%B5@68$H3<8N@3?3O=O$=?O$N8D=98P1!
"!*")2'!$%.#+%),,567892:567
!"#$%!&%'()(*+%,-)+"#)(%&.%/('()(*+0%1+.)2*)"*3%45"6/&7'8%&.%1,/2*)"*3%49:*;<8%LD+Q%H..
!"#$%&'()%*+%,"%-#%*+%./#0*L$-,;D%2+,%":2.*$:b-%/$7*$:;$/A%4,+#$":/A%-:F%/#,-":/%*/":6%#Q+%#14$/%+2%/$-,;D$/N%</$%#D$%-FR-:;$F%/$-,;D%#+%-..+Q%1+*%#+%,$2":$%1+*,%/$-,;D%Q"#D%#D$%3+,$%2":$%6,-":$F%/$-,;DA-:F%1+*%;-:%4";\%1+*,%R"$Q":6%+4#"+:/N
J+3$% %G*;.$+#"F$%L$7*$:;$%L$-,;D
LVH'!J%(H)H HGHWacV%d%U&L<HW&cV 8^'e5VG!J L<5T&)%(H)H J^TV
H9+*#%</ !+33*:"#1 H::+*:;$3$:#/ W":\/ '$/+*,;$/ L*44+,# L"6:%^*#
a+*%-,$%.+66$F%":%-/%1*:NbD-:6f*#/+*#DQ$/#$,:N$F*
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1$2#$"+$'1$&*+, ,..34556667!#8/79*:5/*+5;"!#$"%&<)$2#$"+$<)$&*+,<)$:=$".<8;)777
>'9?'> @5AB5>>'>A4>@'CD
2
1. Identify sequences to align: mouse-over the “Search Data” tab and click “Nucleotide Sequences” or “Protein Sequences”. For this example, we will use nucleotide sequences.
2. Select search criteria on the Nucleotide Sequence Search page and click the “Search” button to run your query.
3. Select sequences from the search result page by clicking the checkboxes. Mouse-over the yellow “Run Analysis” button and click “Align Sequences (MSA)”. If you want to include sequences that are not in this search result or to use the sequences to do further analysis, select the desired sequences and click “Add to Working Set”. Then add other sequences to the same working set later by repeating the process. Click the “Workbench” tab and find the working set you saved. Click
next to it to view the details of the working set. Then mouse-over the yellow “Run Analysis” button and click “Align Sequences (MSA).
!"#$%&'($)*%$'+#$,'-%./0%&'12',+&3 !"#$%&'($)*"$)# 45&67(85,1%9:%6'$%6(1'+),-.#/'!"**)01,
'233'*4'54$6)01'!"*' '!#7"'!"#$%&' '+480.4#3'
9 % : % ; % < % = % > % ? % @"A*'B % ;(1'<% = %">%=.
!"#$%&'()%*+%,"%-#%*+%./#0*1%2"$'2
C4D$'!"."%*"3'E*"F,G'>'')*"F,',"."%*"3'''H''+","."%*'2..
% ?'7')+%(77%./0%&'12',+&
!"1F"0*I$4*")0@#F"
!"JD"0%"2%%",,)40
+#*"K4,*
!-"%)",(4D0*$/
L.D!"#,40
!*$#)0'@#F"
0 @A B:0.9C =/DC ?E5,' B?A FGHAF IAH&E5,'HJ/H=/DCK@=G=L
0 @A M!:J9::J =/CC ?E5,' B?A FGHAF IAH&E5,'HA$5N",(H=0.H=/CCK@=G=L
0 @A M!:.J:C: G" /:: @=G= :JH:/HJ::O I?E5,' B?A :9F:O AH&E5,'HA$P(,&(&H:://DHJ::O
0 @A M!:.J:C0 G" ..D @=G= :JHJDHJ::O I?E5,' B?A :9F:O AH&E5,'HA$P(,&(&H:://.HJ::O
0 @A M!:.JD9/%I G" /:J @=G= :=HD=HJ::C I?E5,' B?A :OF:C AH&E5,'HA$P(,&(&H:=0O:HJ::C
0 @A M!:0:0O: G" /:= @=G= J::. ?E5,' B?A FGHAF IAH&E5,'HA$P(,&(&HODO:CFDHJ::.K@=G=L
0 @A M!:J.C.: !'& =CDJ @=G= =//= ?E5,' B?A FGHAF IAH&E5,'HM(75>"$,5(HQ/::=C:CH=//=K@=G=L
0 @A M!:.J=C=%I G" .9/ @=G= :9HD=HJ::O I?E5,' B?A :9F:O AH&E5,'HM"7"$(-"H:==9=HJ::O
0 @A M!:.=O.9 G" ./9 @=G= :JHJ0HJ::0 I?E5,' B?A :DF:0 AH&E5,'HR'"$15(H::J9JHJ::0
0 @A M!:.=C:C%I G" ... @=G= :9H:0HJ::0 ?E5,' B?A :DF:0 AH&E5,'HR'"$15(H::J/CHJ::0
0 @A M!:.J:C= G" /:0 @=G= :JH=:HJ::O ?E5,' B?A :9F:O AH&E5,'HR'"$15(H:://9HJ::O
0 @A STOD.J/. G" =C=D @=G= J::9 ?E5,' B?A FGHAF IAH&E5,'HUVH::O.9HJ::9K@=G=L
0 @A RB/.0D/O G" =C:= @=G= =JHJ/HJ::/ ?E5,' B?A :/F=: IAH&E5,'HUVH=:F::=99:HJ::/K@=G=L
0 @A RB/.0D// G" =C:= @=G= =JHJ:HJ::/ ?E5,' B?A :/F=: IAH&E5,'HUVH=:F::=99=F=HJ::/K@=G=L
0 @A RB/.00:J G" =C:= @=G= =JHJ:HJ::/ ?E5,' B?A :/F=: IAH&E5,'HUVH=:F::=99=FJHJ::/K@=G=L
0 @A @WJ=/O=. G" =C:= @=G= :JHJDHJ:=: ?E5,' B?A :/F=: IAH&E5,'HUVH=JOO:HJ:=:K@=G=L
0 @A @WJ=/ODD G" =C:= @=G= :DH=.HJ:=: ?E5,' B?A :/F=: IAH&E5,'HUVH=CD=9F=HJ:=:K@=G=L
0 @A @WJ=/ODO G" =C:= @=G= :DH=.HJ:=: ?E5,' B?A :/F=: IAH&E5,'HUVH=CD=9FDHJ:=:K@=G=L
0 @A @XJ/=9DC G" =C:= @=G= :9H=.HJ:=: ?E5,' B?A :/F=: IAH&E5,'HUVHJ9D//FJHJ:=:K@=G=L
0 @A @XJ/=90: G" =C:= @=G= :9H=.HJ:=: ?E5,' B?A :/F=: IAH&E5,'HUVHJ9D//FDHJ:=:K@=G=L
0 @A @XJ/=90D G" =C:= @=G= :9H=.HJ:=: ?E5,' B?A :/F=: IAH&E5,'HUVHJ9D//F0HJ:=:K@=G=L
0 @A @XJ/=90O G" =C:= @=G= :OH:JHJ:=: ?E5,' B?A FGHAF IAH&E5,'HUVHJC0.OF=HJ:=:K@=G=L
0 @A @XJ/=90/ G" =C:= @=G= :OH:JHJ:=: ?E5,' B?A FGHAF IAH&E5,'HUVHJC0.OFJHJ:=:K@=G=L
0 @A RB0.:/JJ G" =C:= @=G= ==H==HJ::/ ?E5,' B?A :/F=: IAH&E5,'HUVHDJ/C0HJ::/K@=G=L
MD0'20#./,),
@"2'% %G#)7'"+5-'%?'Y#',)'%?'($)*% %Z'+&
'E3"0*)N/'!)F).#$'!"JD"0%",'OPQ2!RS'
'2.)10'!"JD"0%",'OT!2S'
'U),D#.)V"'2.)10"3'!"JD"0%",'
'W"0"$#*"'I&/.41"0"*)%'R$""'
'20#./V"'!"JD"0%"'U#$)#*)40'O!@IS'
?[AZM@%4AQA AGAV!\[%]%^U?BAVU\[ _`Zab[GM@ ?BbWUQ%4AQA @`W[
Ac"#+%B& M"22#,5+8 A,,"#,)'2',+& V5,P& Z'&"#$)'& ?#66"$+ ?51,%`#+
!"#%($'%7"11'-%5,%(&%8#,3N*(,1d#+&"#+*E'&+'$,3'-#
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1#+2$3.45$'6$7#$"+$'6$&*+,'($)#2.) ,..89::;;;<!#5/<3*=:/*+:4"!#$"%&>)$7#$"+$>)$&*+,>)$=?$".>54)<<<
@'3A'B C:BD:@@'@B9ED'FG
3
Click to view details of
the record
• Select display fields • Custom-sort records
Select sequences and add them to a working set for future analysis. You’ll need to register a Workbench account
to use this feature.
Cite IRD Tutorials Glossary of Terms Report a Bug Request Web Training Contact Us Release Date: Jul 18, 2011
This project is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. HHSN266200400041C and is a collaboration between NorthropGrumman Health IT, University of Texas Southwestern Medical Center , Vecna Technologies, SAGE Analytica and Los Alamos National Laboratory.
2 records were previously selected from search results
INPUT SEQUENCESHTML
SELECT OUTPUT FORMATAligned
SELECT OUTPUT ORDER
RunClear
Align Sequences (MSA) IRD uses the MUSCLE (Multiple Sequence Comparison by Log-Expectation) algorithm to align the sequences you select from a search result or a working set on yourworkbench or that you provide in an uploaded file.
Home Nucleotide Sequence Search Results Align Sequences (MSA)
SEARCH DATA ANALYZE & VISUALIZE WORKBENCH SUBMIT DATA HOME
About Us Community Announcements Links Resources Support Sign Out
You are logged in as [email protected]
Inuenza Research Database - MUSCLE Multiple Sequence Alig... http://www.udb.org/brc/msa.do
1 of 1 8/1/11 4:27 PM
5
!"#$%&'( )*#+,"-./ 0.+//-,1%+2%)$,3/ '$4+,#%-%5*6 '$7*$/#%8$9%),-":":6 !+:#-;#%</ '$.$-/$%(-#$=%>+?%@A%BCDD
)E"/%4,+F$;#%"/%2*:G$G%91%#E$%>-#"+:-.%&:/#"#*#$%+2%H..$,61%-:G%&:2$;#"+*/%("/$-/$/%I>&J%K%(JJLM%*:G$,%!+:#,-;#%>+N%JJL>BOOBCCPCCCPD!%-:G%"/%-%;+..-9+,-#"+:%9$#Q$$:%>+,#E,+40,*33-:%J$-.#E%&)A%<:"?$,/"#1%+2%)$R-/%L+*#EQ$/#$,:%S$G";-.%!$:#$,%A%T$;:-%)$;E:+.+6"$/A%LH0U%H:-.1#";-%-:G%V+/%H.-3+/%>-#"+:-.%V-9+,-#+,1N
%
W5B%4+/#%BCCX%SLH !"#$%&'%(')*+$,-.
1*:NYE-:6Z*#/+*#EQ$/#$,:N$G* /$01$2&%3'&454-"&4',
!"#$%&&'()***(-#-%"/%/#"..%4,+;$//":6N%'$/*.#/%Q"..%9$%/E+Q:%QE$:%,$-G1N
6789:6%3;<=:/&2%1+*%G+%:+#%Q-:#%#+%Q-"#%2+,%#E$%,$/*.#/A%*/$%1+*,%#";[$#%:*39$,%I%SL\]@^OOB]^D]_@%M%#+%;+3$%9-;[%#+%#E$%'$#,"$?$%'$/*.#/%91%)";[$#%>*39$,%4-6$%-#%-%.-#$,%#"3$-:G%,$#,"$?$%1+*,%,$/*.#/N
!>?:%>3>@A!7!%6B%(B/9=:38CU:#$,%#E$%:-3$%1+*%Q-:#%#+%*/$%-:G%;.";[%!"#$%&'%(')*+$,-.%"2%1+*%Q-:#%#+%/-?$%#E$%-:-.1/"/%QE$:%#E$%,$/*.#/%-,$%,$-G1N
3B67D78>67B3%BD%8B<E@:67B3U:#$,%1+*,%$3-".%-:G%;.";[%/$01$2&%3'&454-"&4',%"2%1+*%Q-:#%#+%,$;$"?$%-%:+#"2";-#"+:%QE$:%#E$%,$/*.#/%-,$%,$-G1N
J+3$% %S1%8+,[9$:;E% %8+,[":6NNN% %H."6:%L$7*$:;$/%ISLHM% %W,+;$//":6NNN
LUH'!J%(H)H H>HV`aU%b%T&L<HV&aU 8c'd5U>!J L<5S&)%(H)H JcSU
H9+*#%</ !+33*:"#1 H::+*:;$3$:#/ V":[/ '$/+*,;$/ L*44+,# L"6:%c*#
+̀*%-,$%.+66$G%":%-/%1*:NYE-:6Z*#/+*#EQ$/#$,:N$G*
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1223'($)#3.) ,..45667778!#9/82*:6/*+6;)&892
<'2='< <>6><6<<'<>5?@'AB
6
4
4. A “Select Sequence Type” lightbox will pop-up. Select the appropriate sequence type and click “Continue”.
5. On the next page, select output format and output order. Then click “Run”.
6. If you have a large amount of input to align, the analysis may take a few minutes to run. While the analysis is running, you can choose to save it (upon completion) to your Workbench by entering a name for the analysis and then clicking the “Save to Workbench” button. Then you can move to other parts of the IRD site, and retrieve the alignment later from your Workbench.
2
!"#$%&'( )*#+,"-./ 0.+//-,1%+2%)$,3/ '$4+,#%-%5*6 '$7*$/#%8$9%),-":":6 !+:#-;#%</ '$.$-/$%(-#$=%>+?%@A%BCDD
)E"/%4,+F$;#%"/%2*:G$G%91%#E$%>-#"+:-.%&:/#"#*#$%+2%H..$,61%-:G%&:2$;#"+*/%("/$-/$/%I>&J%K%(JJLM%*:G$,%!+:#,-;#%>+N%JJL>BOOBCCPCCCPD!%-:G%"/%-%;+..-9+,-#"+:%9$#Q$$:%>+,#E,+40,*33-:%J$-.#E%&)A%<:"?$,/"#1%+2%)$R-/%L+*#EQ$/#$,:%S$G";-.%!$:#$,%A%T$;:-%)$;E:+.+6"$/A%LH0U%H:-.1#";-%-:G%V+/%H.-3+/%>-#"+:-.%V-9+,-#+,1N
!"#$%&'()'*%+"%,-%. /012,)3"%,45'678% 9*%:#%,; /*%+"%,-%'<5$%3 *;&5=,'!5#%
'*5>%'9,537.=.' '?%,%&5;%'@A73(:%,%;=-'6&%%'
B=C%'*%+"%,-%'D%5;"&%.
*%3%-;'5'E5;%:(&7!""#$%&'$()(*+(,-(.!"&(/0&%',1+,-&%',0")&/+-&+/0"
*%3%-;'5')%5;"&%F'E((&C=,5;%.'A=:A3=:A;%C'(,'53=:,#%,;'=,'C5&G'$3"%F
*%+%",-%'D%5;"&% D%5;"&%'!5#% @(.=;=(,.
&:2.*$:W-%HXY5BXLZD &:2.*$:W-%HXY5BX;E-":XDI[\@M D][\@
&:2.*$:W-%HXY5BXLZB &:2.*$:W-%HXY5BX-.4E-]E$."RXDIDCM D]DC
&:2.*$:W-%HXY5BXLZ^ &:2.*$:W-%HXY5BX-.4E-]E$."RXDPI@M DP]BB
&:2.*$:W-%HXY5BXLZP &:2.*$:W-%HXY5BX-.4E-]E$."RXB[I[M B[]^^
& 2. %H Y5B LZ\ & 2. %H Y5B . E E ." O@DI^M O@D O@^
!"#$%&"'()*&"+,(-).(/$(,0(#
*HIJH!EH'2!DKLM962K!
B2?B<2?B6'*HIJH!EH'DH96JLH*
%
J+3$% %S1%8+,_9$:;E% %8+,_":6NNN% %H."6:%L$7*NNN% %'$/*.#/% %T"/*-."W$%H."6:$G%L$7*$:;$/% %'$/*.#/
LUH'!J%(H)H H>HV`aU%b%T&L<HV&aU 8c'd5U>!J L<5S&)%(H)H JcSU
H9+*#%</ !+33*:"#1 H::+*:;$3$:#/ V":_/ '$/+*,;$/ L*44+,# L"6:%c*#
+̀*%-,$%.+66$G%":%-/%1*:NWE-:6e*#/+*#EQ$/#$,:N$G*
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1&234$5 ,..67885559!#:/9;*<8/*+8=&2>4$59:;?:$+;*&.;*@4"!#$"%&AB$.,;999
C';D'C CE8EC8CC'F7GC'HI
!"#$%!&'#()*+*! !,-.'(-#/!0123!
!"#$%&'%()*'+,-(
!"#$%&''()*+,-./*0+123./4*'#*566#7777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@A@@B!A9)<<==C@?D;":=EF)>;9=G99
A9'H5$%&()*)/+,3*'*566IJAIE'K77777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9'H5$I'()*)/+,3*5*566IJAIE'K77777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9'H5$'%()*D,./4L3*'*566IJAIE'K777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M$%$H6'()*N3./4O,*5*566H777777777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M$%$#P%()*N3./4O,*'*566H777777777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
)Q$#55P5()*?+./4+.3*'*566#77777777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
!"&%I%'6()*R+3/.*D!6'*566#77777777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:SI$''5#()*D,./4TU/4*6'*566#777777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M66&I&5()*)/+,3*@5*566#777777777777777777777777777777777888888888888888888888888888888888B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#H$$()*</TU/1O3.*I%$A*566#7777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#HP5()*</TU/1O3.*I#6A*566#7777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#HI5()*</TU/1O3.*I%&A*566#7777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#HH#()*</TU/1O3.*I$#A*566#7777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#HHI()*</TU/1O3.*I%#A*566#7777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#HH$()*</TU/1O3.*I%IA*566#7777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#&66()*</TU/1O3.*I$#VA*566#777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$5#P()*</TU/1O3.*R!RIP$*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$$#&()*</TU/1O3.*R!R#5I>*566#7777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$5&I()*</TU/1O3.*R!RIP#*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$%P5()*</TU/1O3.*R!RIPP*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$5HH()*</TU/1O3.*R!RIPI*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$$H#()*</TU/1O3.*R!RIPPE*566#7777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$$%#()*</TU/1O3.*R!R#5I*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$5P%()*</TU/1O3.*R!RIPH*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A"#I5#%6()*AU/47=U/4*#&$'*56'6JAIE'K777777777777777777777888888888888888888888888888888888888888888888888888888888888
A9''$IP&()*B31W/.-*M@%'$'5<<*566&JAIE'K7777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9''$IP6()*B31W/.-*M@%'%P$<<*566&JAIE'K7777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9''$I$5()*B31W/.-*M@%'56%)*566HJAIE'K77777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9''$I&5()*B31W/.-*AE%'%&&9'*566HJAIE'K7777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9''$#6#()*B31W/.-*M@%'$'%<<*566&JAIE'K7777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9''$II6()*B31W/.-*M@%'5%P*566HJAIE'K777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
D"5%5$$'()*B31W/.-*AE'*566H7777777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9''$IH$()*B31W/.-*M@%'%'5<<*566HJAIE'K7777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
A9''$II&()*B31W/.-*M@%'5$$<<*566HJAIE'K7777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9?<<==C@?D;":=EF)>;9=G99
A9''$I##()*B31W/.-*M@%'5$$<<<*566HJAIE'K777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9?<<==C@?D;":=EF)>;9=G99
A9''$I%$()*B31W/.-*M@%6&I6*566IJAIE'K777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M5#%P&&()*+,-./*R+3/.*D!65*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@R:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$##%'()*</TU/1O3.*#*566I7777777777777777777777777777778888888888888888;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$$56()*</TU/1O3.*R!R#5$*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$$5&()*</TU/1O3.*R!R#5$:*566#7777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
:M'$#&'#()*</TU/1O3.*I#PA*566#7777777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$$6$()*</TU/1O3.*R!R#5%*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'$$'5()*</TU/1O3.*R!R#5%:*566#7777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'P%H%()*</TU/1O3.*R!R'6%';:5*566H77777777777777777777788888888888888888889?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'P%$P()*</TU/1O3.*R!R'6%'*566H77777777777777777777777788888888888888888889?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'P%#I()*</TU/1O3.*R!R'6%'@5*566H777777777777777777777788888888888888888889?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'P%IH()*</TU/1O3.*R!R'6%'@*566H7777777777777777777777788888888888888888889?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'P%&'()*</TU/1O3.*R!R'6%5*566H77777777777777777777777788888888888888888889?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'P%&P()*</TU/1O3.*R!R'6%5E*566H7777777777777777777777788888888888888888889?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'P%PH()*</TU/1O3.*R!R'6%5@*566H7777777777777777777777788888888888888888889?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'H#%I()*</TU/1O3.*R!RP%&*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'H#$%()*</TU/1O3.*R!RP%&:*566#7777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
RC6'H#&I()*</TU/1O3.*R!R&&H*566#77777777777777777777777778888888889:;<=:>;!>9?"?;@;:<>@=@@B!A9)<<==C@?D;":=EF)>;9=G99
45'!&'#()*+*
!"#$% %&'%(")*+$,-.% %(")*/,0111% %23/0,%4$56$,-$7%8&429% %:$763;7
!6+*5#(+7%!&(+8'%/!"%95%':%*!
!;%'%<#=%!>?)(-8%'%=+:!1<%%!
!2%=#/#=#@/<+$%'!A-BC#<#=+$%!&'#()*+*!1--(!
4<2:=!%>2?2 2@2ABC<%D%EF4G2AFC< (H:IJ<@=! 4GJ&F?%>2?2 !H&<
2+"6;%G7 ="##6,/;' 2,,"6,-$#$,;7 A/,*7 :$7"6)-$7 46KK"); 4/0,%H6;
B"6%L)$%3"00$M%/,%L7%'6,1N.L,0O6;7"6;.P$7;$),1$M6
:6,%23/0,#$,;%E/$P$)%P/;.%;.$%&42%)$763;
!"!#$"%&'($)$&*+,'-&.&/&)$'0'123456'1#7.897$'3$:#$"+$';78<=== ,..9>??@@@=!#A/=B*<?/*+?C)&=ABDA$+B*&.B*E8"!#$"%&FC$.,BAE($===
G'BH'IJ GJ?JG?GG'GJ>KK'L1
http://www.fludb.org/
Freely available Integrated datasets Bioinformatics tool suite Platform for influenza data submission
IRD is funded by the National Institute of Allergy and Infectious Diseases (NIH/DHHS) under Contract No. HHSN266200400041C and is a collaboration between Northrop Grumman Health IT, University of Texas Southwestern Medical Center , Vecna Technologies, SAGE Analytica and Los Alamos National Laboratory. Comments, questions, suggestions? Contact us at [email protected]
Option 2: Align sequences from a working set or your own sequences
!"#$%&'( )*#+,"-./ 0.+//-,1%+2%)$,3/ '$4+,#%-%5*6 '$7*$/#%8$9%),-":":6 !+:#-;#%</ '$.$-/$%(-#$=%>*.%?@A%BC??
)D"/%4,+E$;#%"/%2*:F$F%91%#D$%G-#"+:-.%&:/#"#*#$%+2%H..$,61%-:F%&:2$;#"+*/%("/$-/$/%IG&J%K%(JJLM%*:F$,%!+:#,-;#%G+N%JJLGBOOBCCPCCCP?!%-:F%"/%-%;+..-9+,-#"+:%9$#Q$$:%G+,#D,+40,*33-:%J$-.#D%&)A%<:"R$,/"#1%+2%)$S-/%L+*#DQ$/#$,:%T$F";-.%!$:#$,%A%U$;:-%)$;D:+.+6"$/A%LH0V%H:-.1#";-%-:F%W+/%H.-3+/%G-#"+:-.%W-9+,-#+,1N
<4.+-F%-%2".$%;+:#-":":6%31%/$7*$:;$/%":%XHL)H %+,%YD1."42+,3-#N
Y-/#$%/$7*$:;$%":%XHL)H %+,%YD1."4%2+,3-#N($2.":$%":%1+*,%XHL)H%2".$%Q"..%9$%*/$F%#+%.-9$.%#D$%F"/4.-1
</$%Q+,Z":6%/$#N
!"##$%&'&(#)*+,-&.%/
0122&3242150674%[*";Z%),$$%IW$#%&'(%/$#%-..%4-,-3$#$,/%\%R"$Q%-..%4-,-3$#$,/M%!*/#+3%),$$%I&%Q-:#%#+%/$#%31%+Q:%4-,-3$#$,/M
.28924!2&0:;2&%G*;.$+#"F$%H3":+%H;"F%IY,+#$":M
.791!2&7<&.28924!2.&07&=2&545>:?2@&L$7*$:;$/%;-:%-./+%9$%/$.$;#$F%2,+3%/$-,;D%,$/*.#/%+,%-%Q+,Z":6%/$#%":%1+*,Q+,Z9$:;DN
>5=2>643($2.":$%":%1+*,%XHL)H%2".$%Q"..%9$%*/$F%#+%.-9$.%#D$%F"/4.-1
<71A50&7<&.28924!2.&;17B6@2@&&C%<:-."6:$F%XHL)H%H."6:$F%XHL)H%YD1."4%I":#$,.$-R$FM
=D+EF&0)%%!E%')
!"#"$%&"'()*+,-"#"&./'0$""'&'(%*/$/%YD1TW%]%%0*":F+:A%LN%-:F%0-/;*$.A%^NA%IBCC_M%L1/#%5"+.N%`B=%OaO\bCP %%c%#+%":2$,%4D1.+6$:"$/%9-/$F%+:%:*;.$+#"F$%/$7*$:;$/N%HFF"#"+:-..1A%&'(%4,+R"F$/%/$R$,-.+4#"+:/%#+%F"/4.-1%-%6$:$,-#$F%#,$$N%%IL^YM!"#$%&'(&)*#$+,*-&./0&1&+$23,+$4&5,$64&&
J+3$% %0$:$,-#$%YD1.+6$:$#";%),$$
LVH'!J%(H)H HGHWdeV%f%U&L<HW&eV 8^'g5VG!J L<5T&)%(H)H J^TV
HGHWdeV%f%U&L<HW&eV
&F$:#"21%L"3".-,%L$7*$:;$/%I5WHL)M
H."6:%L$7*$:;$/%ITLHM
&F$:#"21%LD+,#%Y$4#"F$/%":%Y,+#$":/
&F$:#"21%Y+":#%T*#-#"+:/%":%Y,+#$":/
0$:$,-#$%YD1.+6$:$#";%),$$
U"/*-."h$%H."6:$F%L$7*$:;$/
H::+#-#$%G*;.$+#"F$%L$7*$:;$/
H:-.1h$%L$7*$:;$%U-,"-#"+:%ILGYM
J&L)^'d
'$#,"$R$%-:%H:-.1/"/
'$#,"$R$%-%(+Q:.+-F
'$#,"$R$%-:%H::+#-#"+:
d+*,%H:-.1/"/%J"/#+,1
H9+*#%</ !+33*:"#1 H::+*:;$3$:#/ W":Z/ '$/+*,;$/ L*44+,# L"6:%^*#
d+*%-,$%.+66$F%":%-/%1*:NhD-:6i*#/+*#DQ$/#$,:N$F*
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1,2345$"$.6+'7*$$ ,..89::;;;<!#=/<4*5:/*+:.*$$<=4>?$.,4=@A,4;B3$&"!"8#.1&5$C<<<
D'4E'D F:GH:DD'DD9IF'JK
1
Loading Influenza Research Database...
Cite IRD Tutorials Glossary of Terms Report a Bug Request Web Training Contact Us Release Date: Jul 18, 2011
This project is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. HHSN266200400041C and is a collaboration between NorthropGrumman Health IT, University of Texas Southwestern Medical Center , Vecna Technologies, SAGE Analytica and Los Alamos National Laboratory.
Upload a file containing my sequences in FASTA format.
Paste sequence in FASTA format.
Use working set.
INPUT SEQUENCESSequences can also be selected from search results or a working set in yourworkbench.
File Path:Browse�…
The minimum number of sequences is 2.
HTML
SELECT OUTPUT FORMATAligned
SELECT OUTPUT ORDER
RunClear
Align Sequences (MSA) IRD uses the MUSCLE (Multiple Sequence Comparison by Log-Expectation) algorithm to align the sequences you select from a search result or a working set on yourworkbench or that you provide in an uploaded file.
Home Align Sequences (MSA)
SEARCH DATA ANALYZE & VISUALIZE WORKBENCH SUBMIT DATA HOME
About Us Community Announcements Links Resources Support Sign Out
You are logged in as [email protected]
Inuenza Research Database - MUSCLE Multiple Sequence Alig... http://www.udb.org/brc/msa.do?method=ShowCleanInputPage&...
1 of 1 8/1/11 3:10 PM
2
2.1
Three options to input sequences
Visualize and Customize the Alignment
!"#$%&'()&*+,-&.#(/-0-#123(4#5#6#0-777
8%5-()/4 9,5"1%#+0 :+"00#1;("*(9-1<0 /-="15(#(>,' /-?,-05(@-6(91#%&%&' 8"&5#25(A0 /-+-#0-(4#5-B(C,+(DEF(GHDD
93%0(=1"I-25(%0(*,&$-$(6;(53-(J#5%"&#+()&05%5,5-("*(K++-1';(#&$()&*-25%",0(4%0-#0-0(LJ)M(N(4MMOP(,&$-1(8"&51#25(J"7(MMOJGQQGHHRHHHRD8(#&$(%0(#(2"++#6"1#5%"&(6-5S--&(J"1531"=:1,<<#&(M-#+53()9F(A&%T-10%5;("*(9-U#0(O",53S-05-1&(V-$%2#+(8-&5-1(F(W-2&#(9-23&"+"'%-0F(OK:X(K&#+;5%2#(#&$(!"0(K+#<"0(J#5%"&#+(!#6"1#5"1;7
A=+"#$(#(*%+-(2"&5#%&%&'(<;(0-?,-&2-0(%&(*"1<#57
Y#05-(0-?,-&2-(%&(ZKO9K4-*+%&-(%&(;",1(ZKO9K(*%+-(S%++(6-(,0-$(5"(+#6-+(53-($%0=+#;
A0-(S"1[%&'(0-57
!"##$%&'&(#)*+,-&.%/
0122&3242150674
(\,%2[(91--(L!-5()/4(0-5(#++(=#1#<-5-10(](T%-S(#++(=#1#<-5-10P(8,05"<(91--(L)(S#&5(5"(0-5(<;("S&(=#1#<-5-10P
.28924!2&0:;2&&<
(J,2+-"5%$-(K<%&"(K2%$(LY1"5-%&P
.791!2&7=&.28924!2.&07&>2&545?:@2A&O-?,-&2-0(2#&(#+0"(6-(0-+-25-$(*1"<(S"1[6-&237
?5>2?6434-*+%&-(%&(;",1(ZKO9K(*%+-(S%++(6-(,0-$(5"(+#6-+(53-($%0=+#;
=71B50&7=&.28924!2.&;17C6A2A&
(A&#+%'&-$(ZKO9K(K+%'&-$(ZKO9K(Y3;+%=(L%&5-1+-#T-$P
>D+EF&0)%%!E%')
!"#"$%&"'()*+,-"#"&./'0$""')/4(,0-0(Y3;V!(^((:,%&$"&F(O7(#&$(:#02,-+F(_7F(LGHH`P(O;05(>%"+7(aGB(QbQ]cHR ((d(5"(%&*-1(=3;+"'-&%-0(6#0-$("&(&,2+-"5%$-(0-?,-&2-07(K$$%5%"&#++;F()/4(=1"T%$-0(0-T-1#+"=5%"&0(5"($%0=+#;(#('-&-1#5-$(51--7((LO_YP!"#$%&'(&)*#$+,*-&./0&1&+$23,+$4&5,$64&&
M"<-( (:-&-1#5-(Y3;+"'-&-5%2(91--
OXK/8M(4K9K KJK!efX(g(W)OAK!)fX @_/h>XJ8M OA>V)9(4K9K M_VX
K6",5(A0 8"<<,&%5; K&&",&2-<-&50 !%&[0 /-0",12-0 O,=="15 O%'&(_,5
e",(#1-(+"''-$(%&(#0(;,&7.3#&'i,50",53S-05-1&7-$,
!',G%E .%E%G/
1),,2"'3,$4.#-'5"&
4'H% 0IJ% 4DHK%)&#L&.%MD%,G%$ A'/%
K,051#+%#(MK(Hc(g(Hb O-'<-&5 `Q HQNH`NGHDD(QBRH(YV
2#+%*"1&%#(0S%&-(*+, O-'<-&5 R HaN`DNGHDD(GBGD(YV
MDJD(JK(O",53(K*1%2# O-'<-&5 DR HaNHQNGHDD(aBRb(YV
Y-153]MK O-'<-&5 DR HcNDaNGHDD(DB`R(YV
@M_(T#22%&-(051#%&0(](MK O-'<-&5 DG HaN`DNGHDD(`BRa(YV
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1,2345$"$.6+'7*$$ ,..89::;;;<!#=/<4*5:/*+:.*$$<=4>?$.,4=@A,4;B3$&"!"8#.1&5$C<<<
D'4E'D F:GH:DD'DI9ID'JK
2.3
Loading Influenza Research Database...
Cite IRD Tutorials Glossary of Terms Report a Bug Request Web Training Contact Us Release Date: Jul 18, 2011
This project is funded by the National Institute of Allergy and Infectious Diseases (NIH / DHHS) under Contract No. HHSN266200400041C and is a collaboration between NorthropGrumman Health IT, University of Texas Southwestern Medical Center , Vecna Technologies, SAGE Analytica and Los Alamos National Laboratory.
Upload a file containing my sequences in FASTA format.
Paste sequence in FASTA format.
Use working set.
INPUT SEQUENCESSequences can also be selected from search results or a working set in your workbench.
>gb:HM628693|Organism:Influenza A virus A/Acre/15093/2010|Segment:4|Subtype:H3N2|Host:HumanATGAAGACTATCATTGCTTTGAGCTACATTCTATGTCTGGTTTTCGCTCAAAAACTTCCTGGAAATGACAACAGCACGGCAACGCTGTGCCTTGGGCACCATGCAGTACCAAACGGGACGATAGTGAAAACAATCACGAATGACCAAATTGAAGTTACTTATGCTACTGAGCTGGTTCAGAGTTCCTCAACAGGTGAAATATGCGACAGTCCCCATCAGATCCTTGATGGAAAAAACTGCACACTAATAGATGCTCTATTGGGAGACCCTCAGTGTGATGGCTTCCAAAATAAGAAATGGGACCTTTTTGTTGAACGCAGCAAAGCCTACAGCAACTGTTACCCTTATGATGTGCCGGATTATGCCTCCCTTAGGTCACTAGTTGCCTCATCCGGCACACTTGAGTTTAACAATGAAAGC
The minimum number of sequences is 2.Defline in your FASTA file will be used to label the display
HTML
SELECT OUTPUT FORMATAligned
SELECT OUTPUT ORDER
RunClear
Align Sequences (MSA) IRD uses the MUSCLE (Multiple Sequence Comparison by Log-Expectation) algorithm to align the sequences you select from a search result or a working set on yourworkbench or that you provide in an uploaded file.
Home Align Sequences (MSA)
SEARCH DATA ANALYZE & VISUALIZE WORKBENCH SUBMIT DATA HOME
About Us Community Announcements Links Resources Support Sign Out
You are logged in as [email protected]
Inuenza Research Database - MUSCLE Multiple Sequence Alig... http://www.udb.org/brc/msa.do?method=ShowCleanInputPage&...
1 of 1 8/1/11 4:10 PM
2.2
!"#$%&'( )*#+,"-./ 0.+//-,1%+2%)$,3/ '$4+,#%-%5*6 '$7*$/#%8$9%),-":":6 !+:#-;#%</ '$.$-/$%(-#$=%>+?%@A%BCDD
)E"/%4,+F$;#%"/%2*:G$G%91%#E$%>-#"+:-.%&:/#"#*#$%+2%H..$,61%-:G%&:2$;#"+*/%("/$-/$/%I>&J%K%(JJLM%*:G$,%!+:#,-;#%>+N%JJL>BOOBCCPCCCPD!%-:G%"/%-%;+..-9+,-#"+:%9$#Q$$:%>+,#E,+40,*33-:%J$-.#E%&)A%<:"?$,/"#1%+2%)$R-/%L+*#EQ$/#$,:%S$G";-.%!$:#$,%A%T$;:-%)$;E:+.+6"$/A%LH0U%H:-.1#";-%-:G%V+/%H.-3+/%>-#"+:-.%V-9+,-#+,1N
%
W5B%4+/#%BCCX%SLH !"#$%&'%(')*+$,-.
1*:NYE-:6Z*#/+*#EQ$/#$,:N$G* /$01$2&%3'&454-"&4',
!"#$%&&'()***(-#-%"/%/#"..%4,+;$//":6N%'$/*.#/%Q"..%9$%/E+Q:%QE$:%,$-G1N
6789:6%3;<=:/&2%1+*%G+%:+#%Q-:#%#+%Q-"#%2+,%#E$%,$/*.#/A%*/$%1+*,%#";[$#%:*39$,%I%SL\]@^OOB]^D]_@%M%#+%;+3$%9-;[%#+%#E$%'$#,"$?$%'$/*.#/%91%)";[$#%>*39$,%4-6$%-#%-%.-#$,%#"3$-:G%,$#,"$?$%1+*,%,$/*.#/N
!>?:%>3>@A!7!%6B%(B/9=:38CU:#$,%#E$%:-3$%1+*%Q-:#%#+%*/$%-:G%;.";[%!"#$%&'%(')*+$,-.%"2%1+*%Q-:#%#+%/-?$%#E$%-:-.1/"/%QE$:%#E$%,$/*.#/%-,$%,$-G1N
3B67D78>67B3%BD%8B<E@:67B3U:#$,%1+*,%$3-".%-:G%;.";[%/$01$2&%3'&454-"&4',%"2%1+*%Q-:#%#+%,$;$"?$%-%:+#"2";-#"+:%QE$:%#E$%,$/*.#/%-,$%,$-G1N
J+3$% %S1%8+,[9$:;E% %8+,[":6NNN% %H."6:%L$7*$:;$/%ISLHM% %W,+;$//":6NNN
LUH'!J%(H)H H>HV`aU%b%T&L<HV&aU 8c'd5U>!J L<5S&)%(H)H JcSU
H9+*#%</ !+33*:"#1 H::+*:;$3$:#/ V":[/ '$/+*,;$/ L*44+,# L"6:%c*#
+̀*%-,$%.+66$G%":%-/%1*:NYE-:6Z*#/+*#EQ$/#$,:N$G*
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1223'($)#3.) ,..45667778!#9/82*:6/*+6;)&892
<'2='< <>6><6<<'<>5?@'AB
3
1. Mouse-over the “Analyze & Visualize” tab and click “Align Sequences (MSA)”.
2. On the MSA landing page, use one of the three options to input sequences:
2.1 Upload a file containing sequences in FASTA format. 2.2 Paste sequences in FASTA format. 2.3 Use a working set from your Workbench.
Select output format and order. Then click “Run”. 3. If you have a large amount of input, the analysis may
take a few minutes to run. While the analysis is running, you can choose to save it (upon completion) to your Workbench by entering a name for the analysis and then clicking the “Save to Workbench” button. Then you can move to other parts of the IRD site, and retrieve the alignment later from your Workbench.
1. After the alignment analysis is finished, mouse-over “Run Analysis” and click “Visualize Aligned Sequences”.
2. On the next page, you will have the option to customize the sequence labels by selecting the “Custom” radio button in the “Label sequence by” section. Click “Run” to load the alignment visualization window.
3. In the alignment visualization window, many customization options exist: • Rename a sequence label: Right-click a strain name in the alignment,
mouse-over the sequence name in pop-up menu, click “Edit Name/Description”, modify the name and click “Accept”.
• Highlight IRD-defined Sequence Features on the alignment: • Add your own sequence feature to the alignment: Click and drag a desired
region of sequence alignment, right-click the selected region, mouse-over “Selection” and click “Create Sequence Feature”.
• Color alignment based on sequence identity cutoff: Click the “Colour” pulldown menu and then the “Above Identity Threshold” option. Using sliding bar to adjust color display.
• Manually adjust the alignment: Click a sequence and then use ç èon the keyboard to adjust the alignment.
4. Export the alignment from the “File” menu.
1
!"#$%&'( )*#+,"-./ 0.+//-,1%+2%)$,3/ '$4+,#%-%5*6 '$7*$/#%8$9%),-":":6 !+:#-;#%</ '$.$-/$%(-#$=%>+?%@A%BCDD
)E"/%4,+F$;#%"/%2*:G$G%91%#E$%>-#"+:-.%&:/#"#*#$%+2%H..$,61%-:G%&:2$;#"+*/%("/$-/$/%I>&J%K%(JJLM%*:G$,%!+:#,-;#%>+N%JJL>BOOBCCPCCCPD!%-:G%"/%-%;+..-9+,-#"+:%9$#Q$$:%>+,#E,+40,*33-:%J$-.#E%&)A%<:"?$,/"#1%+2%)$R-/%L+*#EQ$/#$,:%S$G";-.%!$:#$,%A%T$;:-%)$;E:+.+6"$/A%LH0U%H:-.1#";-%-:G%V+/%H.-3+/%>-#"+:-.%V-9+,-#+,1N
>*39$,%+2%L$7*$:;$/ DOW
L$7*$:;$%)14$ 4,+#$":
&:2.*$:X-%)14$ H
L$63$:# D
!"#$"%&"'(%)*+,-.(*%
!"#$"%&"')(/."+%UR;.*G$%I2-./$M%9-G%4,$Y-."6:$G%/$7*$:;$%2,+3%Z-.?"$Q
G"/4.-1
/-0"/'!"#$"%&"'01%L#,-":%>-3$%H;;$//"+:%>*39$,%!*/#+3
%%%% %L#,-":%>-3$%%%% %H;;$//"+:%>*39$,%%%% %)14$%%%% %L*9)14$%%%% %(-#$%%%% %L$-/+:%%%% %!+*:#,1%%%% %J+/#%L4$;"$/%%%% %BCC@%4JD>DY."[$
+23
!"#$%&"'()*&"+,(-).(/$(,0(#)1$#234"'%2"3,</$%#E$%Z-.T"$Q %":#$,-;#"?$%-."6:3$:#%?"$Q$,%#+%?"/*-."X$%:*;.$+#"G$%+,%-3":+%-;"G%/$7*$:;$/%4,+?"G$GN%&2%1+*%4,+?"G$%*:-."6:$G%/$7*$:;$/A%&'(%Q"..%2",/#%-."6:%1+*,%/$7*$:;$/*/":6%#E$%S<L!VU%-.6+,"#E3N%IL\]M!"#$%&'(&)*#$+,*-&./0&1&+$23,+$4&5,$64&&
J+3$% %S1%8+,[9$:;E% %8+,[":6NNN% %H."6:%L$7*NNN% %'$/*.#/% %T"/*-."X$%H."6:$G%L$7*$:;$/
LUH'!J%(H)H H>HV^_U%`%T&L<HV&_U 8\'a5U>!J L<5S&)%(H)H J\SU
H9+*#%</ !+33*:"#1 H::+*:;$3$:#/ V":[/ '$/+*,;$/ L*44+,# L"6:%\*#
+̂*%-,$%.+66$G%":%-/%1*:NXE-:6b*#/+*#EQ$/#$,:N$G*
!"!#$"%&'($)$&*+,'-&.&/&)$'0'1&234$5 ,..67885559!#:/9;*<8/*+8=&2>4$59:;?.4+@$.A#B/$*CDEFGGGHIJI999
K';L'K KG8GK8KK'KK7MK'ND
2
Select and highlight IRD-defined Sequence
Features on the alignment
Export the alignment
Add your own sequence feature on
the alignment
Rename a sequence label
3