Pattern Recognition Methods for the Prediction of Chemical Structures of Fungal Secondary Metabolites
Total Page:16
File Type:pdf, Size:1020Kb
Pattern recognition methods for the prediction of chemical structures of fungal secondary metabolites

Dissertation

To fulfill the Requirements for the Degree of
„doctor rerum naturalium" (Dr. rer. nat.)

Submitted to the Council of the Faculty of Biological Sciences of the Friedrich Schiller University Jena

by Sagar Changdev Gore (Master of Science)
born on [day and month unrecoverable: overwritten by an e-mail-protection artifact in the source] 1991 in Khatav, India

Reviewers:

Prof. Dr. Dirk Hoffmeister
Pharmaceutical Microbiology
Friedrich Schiller University, Jena.

Prof. Dr. Stefan Schuster
Department of Bioinformatics
Friedrich Schiller University, Jena.

Jun-Prof. Dr. Panagiotis L. Kastritis
Group Leader and Head of Cryo-Electron Microscopy
Martin-Luther-Universität Halle-Wittenberg, Biozentrum, Halle (Saale).

Date of doctoral defense: June 16, 2020.

Summary 8
Zusammenfassung 10
Table of Contents
1. Introduction 15
1.1 Why is there a need for new drugs? 16
1.1.1 Antibiotic resistance 16
1.2 Natural products-based drug discovery 16
1.3 Fungi – a source of novel natural products 18
1.4 Why are fungal natural products not studied well? 20
1.5 Non-ribosomal peptide synthetases (NRPS) 21
1.6 Adenylation domains 22
1.7 Substrate specificity of A-domains 24
1.8 Condensation domains 27
1.9 Encoding of small molecules 28
1.9.1 Molecular representation 28
1.9.2 Molecular descriptors 29
1.9.3 Molecular fingerprints 29
1.9.4 Molecular similarity 30
1.10 Computational methods for A-domain substrate specificity predictions 31
1.10.1 SANDPUMA: an ensemble classifier 31
1.10.2 Limitations and drawbacks of the previously developed tools 33
1.11 Machine learning 33
1.11.1 Artificial neural networks 34
1.11.2 Evaluation of predictor performance 36
2. Methods 40
2.1 A-domain substrate specificity data 40
2.2 Phylogenetic analysis 40
2.2.1 Phylogenetic analysis of fungal A-domain sequences 40
2.2.2 Extraction of C-domains and phylogenetic analysis 41
2.3 Clustering of bacterial and fungal A-domain NRPS codes 41
2.4 Clustering of non-ribosomal peptide monomers 41
2.5 Development of NN-based A-domain substrate specificity classifier (NNassc) 42
2.5.1 Dataset preparation for NNassc 42
2.5.2 Preprocessing 43
2.5.2.1 Encoding of NRPS code residues 43
2.5.2.2 Encoding of substrates 44
2.5.3 Parameter optimization and training NNassc 44
2.5.4 Matching of predicted bit vector with substrates from training dataset 45
2.5.5 Validation and benchmarking 46
2.5.5.1 Internal validation dataset 46
2.5.5.2 External validation dataset 46
3. Results and discussion 49
3.1 Phylogenetic analysis of fungal A-domains 49
3.1.1 A-domains activating uncommon non-proteogenic substrates 49
3.1.2 ACVS synthetase 49
3.1.3 PKS-NRPS hybrids 49
3.2 Cluster analysis of NRPS code residues 53
3.2.1 Similarity/differences between fungal and bacterial NRPS codes 53
3.3 Phylogenetic relationships among fungal C-domains 56
3.4 Clustering of NRP monomers and A-domain substrates 57
3.4.1 Modifications 57
3.4.2 A-domain substrates and NRPS code similarity 59
3.5 Substrate specificity prediction using NNassc 60
3.5.1 Predictions – internal validation dataset 61
3.5.2 Predictions - external validation dataset 61
3.5.3 Structural insights into substrate specificity prediction 63
3.5.4 Prediction of substrate bit vectors 63
3.5.5 Inclusion of more training data 64
3.5.6 Extraction of correct NRPS code residues 64
4. Conclusions 66
5. References 68
Appendix 75
Acknowledgement 82
Curriculum Vitae 84
List of publications 86
Declaration: Selbstständigkeitserklärung 88

Summary
Non-Ribosomal Peptide Synthetases (NRPS) are mega synthetases that are predominantly found in bacteria and fungi. They produce small peptides that serve numerous biological functions and crucial ecological roles. NRPSs are organized into different modules, each responsible for processing (substrate activation or chemical modifications) and incorporation of single substrate monomers. A single module of NRPS has three domains such as Adenylation (A), Condensation (C), and Thiolation (T). Substrate selection and their activation by adenylation is a key step in the non-ribosomal peptide (NRPs) biosynthesis. A-domains catalyze ATP dependent activation of substrates harboring carboxy terminus. A-domain substrates include not only natural amino acids (D and L forms) but also non-proteinogenic amino acids. The inclusion of non-proteinogenic amino acid increases the structural and chemical diversity of biosynthesized peptides. C-domains have also been reported to show moderate specificity towards a substrate that is activated by an A-domain. Norine database has listed 543 monomers (247 NRPS specific) in their repository, these monomers are extracted from the complete chemical structures of characterized NRPs. As the substrate repertoire is large and specificity rules for fungi are not established well, there is a difficulty in predicting substrates for fungal A-domains. In bacteria, ten amino acid residues were established as "NRPS code", which determine specificity of A-domains. These residues were identified by mutagenesis studies done with a phenylalanine binding A-domain. To study relationships between fungal A-domains and their specificity, I ran the cluster analysis of
NRPS code residues. Fungal A-domain sequences with known substrates and corresponding NRPS code residues were obtained from the NRPSpredictor2 dataset (released in 2011). This dataset was expanded by adding manually curated sequences that were published after 2011. NRPSpredictor2 is an A-domain substrate specificity classifier, which uses support vector machine models for the prediction. NRPS code residues were encoded by physicochemical properties essential for binding small molecules and these residues were clustered by their similarity. Cluster analysis showed similar NRPS codes for α-amino adipic acid, phenylalanine, and tryptophan, etc. between bacteria and fungi. Fungal NRPS codes for substrates such as tyrosine, serine, and proline, did not cluster together with bacteria, which indicates an independent evolution of substrate specificity in fungi. This emphasizes the pressing need for the development of a fungus-specific prediction tool. Currently available A-domain sequence-based specificity prediction tools accurately identify substrates for bacteria but fail to provide correct predictions for fungi. SANDPUMA, an ensemble classifier for A-domain substrate specificity prediction, developed in 2017, uses only 90 fungal sequences (complete dataset – 928 sequences) but does not give accurate substrate predictions for fungal sequences. I present here a novel approach for fungal A-domain substrate specificity prediction, which is based on a neural network (NN). I developed the NN-based A-domain substrate specificity classifier (NNassc) using Keras with TensorFlow backend using Python scripting language. It was trained solely using fungal NRPS codes and combines physicochemical and structural features for specificity predictions. Internal and external validation datasets of experimentally verified NRPS
codes were used to assess the performance of NNassc. NNassc predictions were compared with SANDPUMA using these two validation datasets. As opposed to earlier sequence-based prediction tools, our approach involves the prediction of substrate substructures rather than mere substrate classes. NNassc identifies correct substrates within the top three or five predictions in all cases except for phenylalanine, while SANDPUMA works only with alanine or tyrosine NRPS codes. The substrate is encoded as a Morgan fingerprint bit vector, such that each bit encodes certain molecular property or a substructure. Prediction of substructures has an advantage that the novel (not part of the training dataset) substrates could also be predicted that harbor these substructures. In the case of NNassc, comparisons of predicted fingerprint bit-vectors were done only with training dataset substrates, although a larger database (e.g. Norine database) of probable substrates could be used in difficult cases. In the future, A-domain substrate specificity predictions could be improved by including more NRPS codes for each substrate and structural information about specific binding interactions.

Zusammenfassung

Nicht-Ribosomale Peptidsynthesen (NRPS) sind Megasynthetasen, die überwiegend in Bakterien