From f825160f8cb5ef10302dd6811895cea894ac43a6 Mon Sep 17 00:00:00 2001 From: ens-ftricomi Date: Thu, 28 Sep 2023 10:06:57 +0000 Subject: [PATCH] deploy: c2af524323397f177a093f8a789394d484e9ca4e --- .buildinfo | 4 + .doctrees/cmsearch.doctree | Bin 0 -> 2512 bytes .doctrees/cpg.doctree | Bin 0 -> 2482 bytes .doctrees/dust.doctree | Bin 0 -> 3032 bytes .doctrees/environment.pickle | Bin 0 -> 112556 bytes .doctrees/eponine.doctree | Bin 0 -> 2502 bytes .doctrees/genblast.doctree | Bin 0 -> 2507 bytes .doctrees/index.doctree | Bin 0 -> 7631 bytes .doctrees/install.doctree | Bin 0 -> 10317 bytes .doctrees/license.doctree | Bin 0 -> 48845 bytes .doctrees/minimap.doctree | Bin 0 -> 2506 bytes .doctrees/red.doctree | Bin 0 -> 2482 bytes .doctrees/repeatmasker.doctree | Bin 0 -> 3052 bytes .doctrees/scallop.doctree | Bin 0 -> 2502 bytes .doctrees/star.doctree | Bin 0 -> 2487 bytes .doctrees/stringtie.doctree | Bin 0 -> 2512 bytes .doctrees/trf.doctree | Bin 0 -> 2482 bytes .doctrees/trnascan.doctree | Bin 0 -> 3042 bytes .nojekyll | 0 .../anno/protein_annotation/genblast.html | 603 ++++++++++++ .../tools/anno/repeat_annotation/dust.html | 310 ++++++ .../tools/anno/repeat_annotation/red.html | 272 +++++ .../anno/repeat_annotation/repeatmasker.html | 369 +++++++ .../tools/anno/repeat_annotation/trf.html | 398 ++++++++ .../anno/simple_feature_annotation/cpg.html | 363 +++++++ .../simple_feature_annotation/eponine.html | 348 +++++++ .../anno/snc_rna_annotation/trnascan.html | 399 ++++++++ .../transcriptomic_annotation/minimap.html | 365 +++++++ .../transcriptomic_annotation/scallop.html | 305 ++++++ .../anno/transcriptomic_annotation/star.html | 720 ++++++++++++++ .../transcriptomic_annotation/stringtie.html | 256 +++++ _modules/index.html | 117 +++ _sources/cmsearch.rst.txt | 8 + _sources/cpg.rst.txt | 8 + _sources/dust.rst.txt | 8 + _sources/eponine.rst.txt | 8 + _sources/genblast.rst.txt | 8 + _sources/index.rst.txt | 58 ++ _sources/install.rst.txt | 54 + _sources/license.rst.txt | 203 ++++ _sources/minimap.rst.txt | 8 + _sources/red.rst.txt | 8 + _sources/repeatmasker.rst.txt | 8 + _sources/scallop.rst.txt | 8 + _sources/star.rst.txt | 8 + _sources/stringtie.rst.txt | 8 + _sources/trf.rst.txt | 8 + _sources/trnascan.rst.txt | 8 + _static/agogo.css | 555 +++++++++++ _static/basic.css | 925 ++++++++++++++++++ _static/bgfooter.png | Bin 0 -> 276 bytes _static/bgtop.png | Bin 0 -> 266 bytes _static/doctools.js | 156 +++ _static/documentation_options.js | 13 + _static/file.png | Bin 0 -> 286 bytes _static/language_data.js | 199 ++++ _static/minus.png | Bin 0 -> 90 bytes _static/plus.png | Bin 0 -> 90 bytes _static/pygments.css | 84 ++ _static/searchtools.js | 574 +++++++++++ _static/sphinx_highlight.js | 154 +++ cpg.html | 95 ++ dust.html | 95 ++ eponine.html | 95 ++ genblast.html | 95 ++ genindex.html | 94 ++ index.html | 122 +++ install.html | 143 +++ license.html | 280 ++++++ minimap.html | 95 ++ objects.inv | Bin 0 -> 462 bytes py-modindex.html | 185 ++++ red.html | 95 ++ repeatmasker.html | 95 ++ scallop.html | 95 ++ search.html | 123 +++ searchindex.js | 1 + star.html | 95 ++ stringtie.html | 95 ++ trf.html | 95 ++ trnascan.html | 95 ++ 81 files changed, 9996 insertions(+) create mode 100644 .buildinfo create mode 100644 .doctrees/cmsearch.doctree create mode 100644 .doctrees/cpg.doctree create mode 100644 .doctrees/dust.doctree create mode 100644 .doctrees/environment.pickle create mode 100644 .doctrees/eponine.doctree create mode 100644 .doctrees/genblast.doctree create mode 100644 .doctrees/index.doctree create mode 100644 .doctrees/install.doctree create mode 100644 .doctrees/license.doctree create mode 100644 .doctrees/minimap.doctree create mode 100644 .doctrees/red.doctree create mode 100644 .doctrees/repeatmasker.doctree create mode 100644 .doctrees/scallop.doctree create mode 100644 .doctrees/star.doctree create mode 100644 .doctrees/stringtie.doctree create mode 100644 .doctrees/trf.doctree create mode 100644 .doctrees/trnascan.doctree create mode 100644 .nojekyll create mode 100644 _modules/ensembl/tools/anno/protein_annotation/genblast.html create mode 100644 _modules/ensembl/tools/anno/repeat_annotation/dust.html create mode 100644 _modules/ensembl/tools/anno/repeat_annotation/red.html create mode 100644 _modules/ensembl/tools/anno/repeat_annotation/repeatmasker.html create mode 100644 _modules/ensembl/tools/anno/repeat_annotation/trf.html create mode 100644 _modules/ensembl/tools/anno/simple_feature_annotation/cpg.html create mode 100644 _modules/ensembl/tools/anno/simple_feature_annotation/eponine.html create mode 100644 _modules/ensembl/tools/anno/snc_rna_annotation/trnascan.html create mode 100644 _modules/ensembl/tools/anno/transcriptomic_annotation/minimap.html create mode 100644 _modules/ensembl/tools/anno/transcriptomic_annotation/scallop.html create mode 100644 _modules/ensembl/tools/anno/transcriptomic_annotation/star.html create mode 100644 _modules/ensembl/tools/anno/transcriptomic_annotation/stringtie.html create mode 100644 _modules/index.html create mode 100644 _sources/cmsearch.rst.txt create mode 100644 _sources/cpg.rst.txt create mode 100644 _sources/dust.rst.txt create mode 100644 _sources/eponine.rst.txt create mode 100644 _sources/genblast.rst.txt create mode 100644 _sources/index.rst.txt create mode 100644 _sources/install.rst.txt create mode 100644 _sources/license.rst.txt create mode 100644 _sources/minimap.rst.txt create mode 100644 _sources/red.rst.txt create mode 100644 _sources/repeatmasker.rst.txt create mode 100644 _sources/scallop.rst.txt create mode 100644 _sources/star.rst.txt create mode 100644 _sources/stringtie.rst.txt create mode 100644 _sources/trf.rst.txt create mode 100644 _sources/trnascan.rst.txt create mode 100644 _static/agogo.css create mode 100644 _static/basic.css create mode 100644 _static/bgfooter.png create mode 100644 _static/bgtop.png create mode 100644 _static/doctools.js create mode 100644 _static/documentation_options.js create mode 100644 _static/file.png create mode 100644 _static/language_data.js create mode 100644 _static/minus.png create mode 100644 _static/plus.png create mode 100644 _static/pygments.css create mode 100644 _static/searchtools.js create mode 100644 _static/sphinx_highlight.js create mode 100644 cpg.html create mode 100644 dust.html create mode 100644 eponine.html create mode 100644 genblast.html create mode 100644 genindex.html create mode 100644 index.html create mode 100644 install.html create mode 100644 license.html create mode 100644 minimap.html create mode 100644 objects.inv create mode 100644 py-modindex.html create mode 100644 red.html create mode 100644 repeatmasker.html create mode 100644 scallop.html create mode 100644 search.html create mode 100644 searchindex.js create mode 100644 star.html create mode 100644 stringtie.html create mode 100644 trf.html create mode 100644 trnascan.html diff --git a/.buildinfo b/.buildinfo new file mode 100644 index 0000000..99ec388 --- /dev/null +++ b/.buildinfo @@ -0,0 +1,4 @@ +# Sphinx build info version 1 +# This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. +config: 6ef85c61a07ec8e9f0ed07676e851c59 +tags: 645f666f9bcd5a90fca523b33c5a78b7 diff --git a/.doctrees/cmsearch.doctree b/.doctrees/cmsearch.doctree new file mode 100644 index 0000000000000000000000000000000000000000..64ac9e2e433ca87ddb4027a649a947e0872cb35f GIT binary patch literal 2512 zcmai0OK)5?6mFBwOeUF3l0Fbp8%Tvpsc2?U#R9QmQFc+YK)|lDJlDQsE57!{_H8DM zNU*3xB=2f|690?O_m#Hno-8IVcf;A!%S8c zT>JPbzWOU($8W;e(o1J5oADU#K_e4VG0Sy)AHy`Md#T*4y+3k1^U~=4x)_L|7`=~T z90p!`#n(>4@!P_2YBO>2&ag`Hlb>7fw6@XSd+;k?rFi~N{bOtb9+nj0`6!OUnDqIG z?J#W9I1dk$)I6S73mSH*_f{?{kMvWz+mgAI+9*@hIe_>cXj(L1JFF^ig$2znEYFip z6-J&e(@_)$;;ER3XJT6%ho9!ZId0uNhm*_{a^9ur=3F~oEYvC0+RPEBn>X>zv$iTT z>yX74XIqF+slHs-3ERlhT@{<*q5@z#C6hJi8ZmI~~p-R>|M}FwH8P+C=)M zOgf}#PS|nWd#RV8oy_FS_VhQCu)p({O6hoR?HI1l3`*W6NXY=pol z+UsdiLfC5@5_q|QxZ8@ARgm_*$w+EzI)&o_BD7aAJj{*p+IYTpcy>SRC%WsZAgkQi zA_AE@G`b{cb($gvlTRCjD_$eyQhGr;a=~MJp=H~7m{?vK>xtqYILfybb_G?vI0#34 zB~dj`edRi(K^QQ;sFrXyy`)y7YS6Hp7C^=*f5uZ%@$WE|8Z{zZXNEy5hH>Td(;rTq z#P_qihlE>eED=;Q#VsnHLd|>(2Ti5dtPE-^Am_%(h6(XLOdF%O0d!ZN-96a284gnd zAes}Xk3vE*>?^956Vi!YvY?1PO-A@!cwf37=X1br zR$h5w^vu}hJccJpvkm~7#Pb5}@o2{m@Y5IHeUExhZJuqIPspwLuRHUYRGRpD!R<_P zpVvMx{d3_91!rSV7Z@StMLgRH#~@@u`q}IgAg)Xdxe15vN_)B@LN0~EFUb2qnZ)~v zD=4Pyj|xNWP^d?>+=xV(jJBmc&ICm~XnZqlsB&FG+`gzvxJYkc{j#-7;0Ek5nbbKr z&~1f>X-~Lnv7sl6L|$cRGm7a|x`^ORvEU5zdxa1L=N?X;WYD@Gyr5DMJlAQ<)?pvD z4=%{6@@A*qgl(=rq}MI%G`j@D3o1&@B!z3_FovDf? UiY!yNc3IkO?HWk0b+wrN2c9_Z9{>OV literal 0 HcmV?d00001 diff --git a/.doctrees/cpg.doctree b/.doctrees/cpg.doctree new file mode 100644 index 0000000000000000000000000000000000000000..dc27bf3a96b1d0becad202da0f5c491e01a8491b GIT binary patch literal 2482 zcmaJ@O>Y}F5KZjJvTRwl^HBsy+&U=IG-xapK@UYQJ)}SnMtmrWo*EF;k`f7V$t^!( z`4FHz1gHVt!v2Q-%|7m~)|L)6V0dRZoOv_zX6QeA|NJ|+Q~$(6R|%085s;-^2gfoXlcy>jnYzRXbm$MR!pVD3~DpnMX?aX`8( z#CF_i!C%CCN@|`i!j#56>b;fI;E{Ara$7Q&6Y3X=ItL}bdzzNb*DedyjWDIf!tzYsbr}I-^>fbpc@Aqyaf8s`=PD zWbyg=7I2C$08Tsun8!FdE9+97t+H!MMa7pW@AKB?w6Qtew0QxWmjEoj5qki--2fG@ zHUq7kiS|NQKJh9(^pae7;W^TD_%GdM8QNrKe>DVZRAO z;ClgauN8w;kPf^lNN!<1MYtYt*{c-q&y4Zfcz)~f{BAtRgw~-X%bBrdf@b8voQf2t z%yZ)4@=2rNiq{%)DZL;oA|YaXp=H)Z99mu(>xts;If}Lw_XJg)*o((}DN!p=eQ+zI zUhFYG4ReGWT~e!2D_B@gOK1itdckv2>F+p_x(c3fT^I(d6bHf2&b~i$65mhP4+*!{ zSR$xqid)n0ZJ_-q? zc%Z1B2Ri2{H-o%|wG$s$UKq;=;}yt(FcQqTh&zSRGvtVJNCtZHnOr8Z6Gt?7LvB=Y zOM+1cER+@LScj_C3JJnlO;vVySZiuN=ic9_D#rseWLaiD9r0yl94EJL))Xl`c`u!8 z_<2Z}babk6A}z}PY8o(ELnPzC|7M~=nbwTVq-s{sXZZ_39JhHvqP^K0L%;X2pF0u! zJkBEp+UPl0sAMU9dVBODjw)Ue6oq3Di@IRLteH|^&yx`!3-2rU!(;-r8&_9e7(F(2 zK1uOWwyXibl6YRCJs$1Yh5qdMx8I?jBReZL+-J>=`>$5+F{w23b;0deazCqMVCE;n zmkPlKo=!1B%!_os8&5#Ul614#B|u!28FC$u+?DopNrapWgZJt+hQ9yGogHdMJTA#N{1g%J6btKY7630#9crjU9D4y?Aq{k$h! zm~Pm~GLu&s+Kgg;fffmzDW{xaey;#QaPAT0Q30z3;U$%d;6cv2wT6A%KB*w9nl(G^ zI&O3QKEGsfx7j5aUQkhLCNUhIcxvYyy9tlNF+hP@9xD~JVfo$qfNi&?ZQeGh;ceCl zJ9&igEJEMU%H~_V784f-S>dlLApDTT>uV>T;qOEYT|BtmtorsrA<^<29v&M_p2?M6 z1M{|~u>*KCx11W)^}jZKxS{N<2WuV&tEly*`)mHOTdmK_{L!Yb_5=?ZHb!AW-Ulh} z7e*-*7CGR_=)Y<8pOE~=^b6RJe?Blr_;fA_&>(!;vN71 literal 0 HcmV?d00001 diff --git a/.doctrees/dust.doctree b/.doctrees/dust.doctree new file mode 100644 index 0000000000000000000000000000000000000000..e27f1d6f2fa6ab70cb0c775724416b989c2eb197 GIT binary patch literal 3032 zcmbtW+iP4!7;lqolFemv=>@S(nHoH=Mkb zLqQ)32Ij5fpCf|!>WlaX`I~b~cER?+g^)AfeDhs@-{q&yuYYY`DSv*)6pYJRpJbU- z88yMLXDW3$l{UNykA4oX!b9KH(^(TCQaK zoOReLTYDK;*LN(pf?m4ucb_?9pA$2s`tZ5RoS=u#YW<{?QomgJmd>I@?|$$)R7S5B z1SZVAy%k02^F<>gE1MQ@wdT^@rbU>w{`A8fQDb@S| z#+pH8>jMS8?W**az}X?xueF*DsqHXFaS~4;NV< zfb|jVXCJW**u7lY%^okRZDg|gK^sl>*k8ArNFz$^Nukw5Q&UB=W0fT$9AEJp4G+z5 zbWz_`-%Fj2xk}p1Y&DcBLw?;*Yq^{NpL@~t5^!U!q@^+oe)T&d98%LDmhB9EcR~?s zVwDa!WCWSDBrkB-tkfisJ;iaOJ~}OM+O{f9Vn*XF)OBE&J_~+-tdy0?(o2`eSN(QG zyL5Rn8!Md$P0TbdS1+eFY4il8m| z4Ms$J?D#!8<2xB0xe3(uPKlO?6*x2{IVfEOJ*Cm9@Qd$pSvZ?enW_w2 z!FQb zZ_i&Wy!5-#0l>>J#7DrP;I{>l6GtW#;m&YgLQnG7G)MB)_a>TmdjvlBVo3ouasm_zo^u_Lof))vaLQ#lm8L+KL84=hX zE5pCXtS!vb!2o2_FU~Aevaj@H5d4kESsDP&#L^t;u}H@{=tuWI{si&t>2bOsK2k2k zf7pmerILtOOoTqCc3kQ}%@3H(1(bCy8KHzS%fj)xKL8-}q^-@?fy5LMA?JSAoJmV& z3F8wc@CWd&2o-U^WpaWl`_ZAO4FYwoJXgm=sFc*9JxCdWJxF|2Y>09hLcE^30xIGN zEC*ZN1kQmTm2x=-2AZz0ANz!HqXj;mNAL@~Plq2O)JtS6?Sd$H3W#(l{#Rub&+vcIn!`|7~2O4jsCij!-Z=7;P~T!Px&VsXgFDg6i7e|IC;v@JNCCL$T3NT!$V`urWs+{R~b{WZ4#Uon+` zu=gMH7N>j{4f<)-CeW!+PgI}Kas&E1`pOR2V>hDz85G}X=krQLI`aPgmoJ9j48M*Y zCN7qk+|8~DQHbGhkXvtr?Plfo+X>Pjp#dxZDUPKzu&8V@7{Osx#ynko_pT8Z(8-P+pbx@jQ_l?ZY7s5T^zMb7xL9| zsc4sK4R7;(^?V_FB=YE;jlFMfTxtw^*Q6_z#+WylEoW*~+s@{z4R5S1-o2o#GYpB)pQN@8zEj%m(bfT@ERZ+57YHp83he*XQWj=bnC@px;hhY_(I;E z&Xluu!}bO$)v{w}&|DmE-fFy^D+8^Y3_kD8+80L4RbXHMeX_^PM56v^5uMKvRo}< zfEm|1R&s0kTD^wpT%W5I3#kb-SFaWt-YvOWt>WIZf4_lZbShuV)h9;tW&erHGst0s z&Q{8;Pfq4967?%btHjghD$rG}XKMATovmRO8m>23OuIF^ni8C?%9pbCMc}Sj&dQ&u zOu1Mrmr|9g&8E&Zyj=#tsjNMjt`};la)mR)86Ni57eQ}!b);O)k`C9W3zb}Y!p6wb z7{P{m3B8PH9k($HgkH=P>RCH@fXkhU91$+m}Mb<_CJ^ko;A|m zX43+TF$zOat5ZIOpUKsW6YgjhY_oRs@HjZ9T;*gB3T|sTn|!k>Jyo76gN(w5u~Ds= zC}(FT%jDplN7L0b5R%*9%#>V62IBwQ<=S zn3xJ$yY05S@efi$dzzSP#%`YIrdy5w=aEsc@2}bku!NQ1s36u zL?&#~NB%HP`!Wz7k+Y>CZ#6)vgP7Rf78HBM}w4FBNK&k27-R@L>^M3 zG{us-xB5c5PzPvW$lP8G@fzr$#@JgMxffx?m+^~1@*#7 z@&@$YZKSn)w+=exzbn`+rOBN;pQ?g*FO5FsmtA@alIxOb*qXAz_!n!bbfHk5PEFRI zd~zmLtENjXC`;thtT$llaA@8QkwS>IG6)}&nJJ`Q7dV?0aB?pLjSHsMuy2u#=1K0w zxtD0sCL?9-5~c#k2Se3slOr!1ar59gzMZ>2cU0?c&X+{cMa7i2;?`UJ;jj0FX%))P zN968wHj4q3gh=pa6-<+}3FT$eDl0%z*MV5#Dk#`mD`!&W32L(xUaIE9q8powQf>~I z)AmV!*>W+R_a|---Y$Y_%e4|DND6}41{@hXn^zV`XMa7(M0I zW@K0-DM(r9!~*qVFx#L9g8(zDTf#b_dQqGn${iNc^fvi=ATnMXaGqC_%w`2sshADQbS7 zuS)q^C7(Gz)0mY?8_j(xKUJbqJE!k%k3YtYO+kE`!qqB;{At@}gc1Z1{(?rYK=&M9 zu4s8f?vjGOrRk{&= z=8bj!8{mB(gM+n#n}Si5pPca@t>dE%h^-2hVO|}qL+z#@W1y4$)?8q|_Cy_28qCMm z$g@=12-|C(I1KwtCS`lH+*lH7$gK5+jYz8%P8yRuV{i1)6e`;OBLgoe*4NfrRUxXB$-qX9OF`~JZaM%-k?I?mv3j1O2(r}h z%r)Asj)IS|&@nK!QO zK`e~&PvRArWPU@rnQ`}`F43He4dhlc`JVF!=_I)Un2yg?-?{#3i+C$q}gZz zEytAc3dDL6+SCHV;e)YLzzCoFi&HF3YmlJYw2qIUfK#vnNLMpCTADHt1&D0uziXyU z3)oqrK${bQLPOU8yIbL*<)i)JUG)!`3IUm+f+}rOpcFzjq3HLgM$ufZ*D7_|T)s)T zN=!mCJY8R6MGeyl#t&@vV3u^^RS#2vnx(t9V$?D(YX=6_KsFl`n2`#?A__ner``Ia z%)nNF;PzDMm}#MHo;3m|GHbaza(8MQHwe18=8z?a7yzX*>>07_oP&_p(auD(!%l?S zLuW=q3*ug!q5#1|LrpMsYB>kePUM64a^K03$(BYPH)|L27pkKrySBenDegCQ@4a)s z?Y?9`@IO*47Dh6J4V4X|#1LVN5zA2sXrtei5t-EDD_%E@Wy zz2eBpgU3$Xd+_k#(?`a~U)9i_cZ9F%f)AdVG@KUOPaGUO`q06nc<;oCdkcBG%KUfM z8y7%nib~5{Q^~@B#zcZ3G4!01JFj#(sP&9w7W-(kK7yYVbS07xV~~>TwS;m*|0=>S z1u<8s7fV2s)G>|*)`8C;3nN;eU#oA_%9VnB!7e};h?&Us+?dwbt~HvZZnW8mLS8{v ztCVfi7p07H92PLOJj-&qTwW{f)JhSN9~c_a$QA=17ygFZNVjlFmCwT~01E(qMmUnH z=Q6phzO{iax{wSFbzjG)#q@cQj?y(9 zF!-wsKe(x~%>}I&Y*mNqQFI&5q%Y8OmE05B!&b1Vc-vZV;AX!p;@i`=cKRi)`6qDU zg`lgmlHLY0-8=jyO7QgAwRFA!uR`62f45(nsg|+24;&Q11hI>nKmJTEjj8hnZhhs* z8;4%>xDkRIq)N%22I^r^c`NHBIJ;FqZj&;4S_19Nre*y|$fRkr?2Tz{sWEsFE`0bM zYPDcJyD5{(XH#%ji&H>3^Wq6TS zLNdVDK0u{Xpf7(d*BAMcY<;YurvNK>tXwx3A20o0Rc?CJa#gsnQ{tF|BoXj$%z%12 zSp4tGR4QsEHf zQ}g+zW=F#tGL?;CLSDxL2-dk>#X5nF2TRBu;81Y1U8ukwC}oXz5G#LgZBQZ(g>AvD zUlDf2m}9S4wv2|z_OKW`Ui2i1w|bRb8i6-FsJ1(-X1ep87~b;R!)hDDYPz-x8i@3B zeu6&PEVig%2St~IBivsL-q;+rg*U`W7L-L=tJ+0~kwp2f@Lk>F@&)>A(8RT2m14dG zv!+@Myj?-12=ZK*56YGBmH60;z^Kk{I#T??O<@ma4Z9^eS_?Zzm2kM%hqY;f(+>w3 zLU#(pN;qGUi3qBxfAU<|*3Pgk89o*pYI<+lUw5nfC-SBJxjc8A!&f303)sv(*b!(}>=%eI?9q{2A)`R90XjB=zLZ`=uNZy8@=!>13l&tnO0XY0!u@U77)D>n zN=d4=SS*HxRI~m%%eUa4fCWUZ38Bzs!Ddq+UUqSOn>W^*00xSf&{93;XcM0t31?*Mn26rGKGFp0W#BDVAS)>9>PhDBe;CJjs!Sn~!Y&udkf zq9b2CLq2MR^Zj0mQGw+A3hWalnj4~RslbAz%~2>TC!W_Z<|sM8Mrq2u|P)h z`K!Y1!E+3ht8lu(ef!Z03Mb350o??Indu!tMXoW-KAF!&_4{1PFb!hmYVo)0Xww&3v|2 z2BZ(JmG=yw`shY^WFXc@mOL`((MLP^2w`7Yy}gdNo1=r%=Qqil1||CFd3>~n1K0Z@ z-eXlp-3+wq!|VBQ0JzZG=ks>Gk8XW-1D+vn$43xxCDH_l67)E?pn^lhIK#XUAI@H0 zhy~|XUO0T`MZ9p-&OTl^SZ9P6j?o$Ag~N09^TGi+xADSpIJfh{5jc17La?1Xc_GBk zi+LfO&P#9swdY1SjhhYes%yX<%`}c*R+2^D_jW@3_m8(e~rH5#_<*2j>KEKDr+2H+0;KcjV~m@a%)*U&J6>C z)!J6$_$%t(cC%)pVFtd}4IqTbZH+z0&H;A%5z%76g2V+0*){IS(P$d>Hd5Bn!2p%V zh&^uwmUP|**<-}IIIWQ?D{1_4g@xUEI5z0S$9^twJnQYqpw@Y8VZ+Y?Ga<{E2`Vga zeFb3^w2Wmvr%iSNZ)+L$lJc35)%*4s#3#*M(#McRf$8Wpu$pNK!*;`_i{yD-TejPs~E zm`fvuQGCB}_IW#H$pAS3p9u6gc5*24vl#xiXsm!Ay+qed?wZ_3XT1&nmJDVO8>6|W z5fj6Jgp?nVQ1{kA28v0@i4xYlGB7gsh3VYt)xw@v2F7f?Ba2=c_*WP7j%<2m;G1vJ zJF@DPftUS)-jQ9e41DFc^^PoiW#C^{|E{!2w!Jd&v)Ae!S@+7orD44z`(7E?@-n?6 z3tt&{%~8E08($fC`eD5zD_=Zx5{1JLlhHz^Vt1jz>&8O zj_HDLF?s8Zr2*G{4S~xVO#!+^#cRmj?`-@iW02Pv!x)?WHd=RbxJbbU>?F}Yl`c%D zXWRx9mC7Y*0F`bc#6&`g_z`&{!cHWV2rQ9MBKA0tcX&HfjHuz>7ikE7AqJY{Y_ipE z-Kb(gQ=!hDx5>x?a0%9*95NNDL?U81Ca`;LH9f5gm%4jRCWp{#IQii96T;<6+a1-{ zb8qzDa%KQt&U2o`57zE)zz+iNWV1U~#oK+Ta@0C0Az+EP%hglWf^N8y2JtNKLR8;rOyDSfWVi)RuF+Qidgl&jRTz+ceQ zmGFj+Gq5%nn02VQG#r@-_jBHiUYsA}<&C_&jTi0NJFq{8IQRV;<-VUT`gr7X)Pu4g zaJ%~z@%saF;q7Sc_zFPoyaRuc4Sxc^0Btv_jA$s`h(BW8drLbFsp7mltZ8Y@M0i5l zd5_loDfy{8@5OKKjXD?(Avzf6XZWBUJn=r`?FPa4(uB9&-?O8*f*C0BjG_tLk8qfVTolW%a`v zXBto>r*6z!YYcv@zH!6I2iQ18#{I7|hNp;LeCuFt#eL^(U|=F?f~8<3co}Pq*54Y$ z9)^X`of|038MLM{A5S)_XO;o$Y94#n>l1%ZLYKroWsa$>RS7~rsij~z(y7XwKqzVF zwHOeT!WL|N06}7y`-Q8#RpM*Lur?Z>18P7*6*+3^G{j~jHutjgFdBiDx*@K(QsSRT z!MK5c7N+lN!b-2_CTvK>G@Q3eV+g!GiIPMU&gVH%8@1i02n6qjctPT2Z!@74KQ@rS zptXkcdIJ8mw+$Oc@IApD5)tlWx!o9MXl6iGy&Bb>hU5WUM&kX$ z%Ej9xPlPO~v%^OfeC?1er?72;T8QpPj20uA!Z&4_5k7Gt@8%h!gtoA$rT#@-FyYaF zADW^(vYt*T0HYj@nWu?`o%lKh9D2;Tk75-{PD`-0GIKhBIIRUX@J`=MmI`K?07I?K+=9 zoU?rHoM1yIc^Q-Y2XVdZJj%bZrp7{ajdB5q5)%MxSvCxf=Z?bKLn!TpexyQ?1GP@e z6E;`$sfu|#Mr)J7&1&3GL*V%UAL`%EFA$oa!^QR1@-cletRw}quE=QIv4$uG*V_;X z1<@dAZ$ri`1!yix4;yF+`}Gv?=o77X4o0v$Q=BLlf*5D1x;^nQsJ%AU;#$8~d1-5` zeXi_e(Xu1imMMW;1_Ncvby9c3$zXWiz#(({PK;mdo{iAQU;#vTyAlfqh!KH|_;&J5 z?D4wbvCQ2%-^Iw-WxO?*B_A6W2vt#iLanC@=w3~hgz<5yUBM5<3%nZ-V;O!@R`he5 zB$qkTd21VkMAhe>m6&_61$N;tSRtZ1X@ev*`COXQ=)KUwxGvGEcW<{AM(BZPr_#L} zSw|fnomm=@7rHPwh^HvVoEPyyJLu*@TWD}d6aN9TN6YD#@q2uk^DFWbwJDrm#iKFj z{c@%C;Cu)dLtA1aIKL)kACc>?%k?+p`cYh+-{j?ExEx>Zd|ZD%fuAwwlXCqnxqgZT zzJ_)_&AV03XQb$}a{U~xzVdZ`8#kgKo!{YKU*P3;gJ-|TzkZ*WFY@vSyr}YX{t$mt z*E#^G7Uk{s&)E;yG8dt19 z{sun~!Qa-O@959p>d$xe=XTQ9C@!w^58;zge6z?Q$GOh`(DLu;&p+b_UHpswd|!W- zqaq$&qd%+kX8=DKz#9H6bJpU=S%-^CN@o-P#4B$=126_>@Ks|VAA{vsT(%8sWqf#7 zO;1(Rm0Y}@cikB-xh(9V+f|wZ7WOSI*>)Oj`0FbXW^+}H$+1TXbD!kcBWz1nN@wsF z0AG1<%gGyfLv80u`^jxS`7SvtU zTKVTlUq6FOpq2R~)XFS!$Zm_QmFE$4#MduDl~(K;B(Dm%KBp6Gn2=qa9zHoUJ1WX57Y-BxhS= z51u)8=!iuZqy=9nJjwWe)6QCq7DI)+YjLy0g2%`TKQys|v@_+>AYyydRqhR2!IyFt zzR$%c5V?G1bPx$9Byc0EYa!|MAmSj=w<+0YJ&ek52wHcH-ewIGsv%P}wD;wMGv&Hf zOwU*dkg^bera%e2_(lYuodX#3j2N^$qH%2>@Sye4!ADI4@ZdvdEUYk29~?V#?8vzF;A!j7gJXw}ojLa481C-34vsx)9X~d9 zc%NlsUhS#{?>Kko2_V9b3J5YEMJ5p?2_Ge#b54eY1y1HO7?FOgWlb^Uia8Q2ejJ*2 zB_9(&%MQvHCmP2VnQzl#eC4}DhWHM4i430&GK{(pR;_|SUy%F2nWiGRNHMId_G{3D z`XZL`FR}9YS8j)Quv>d95@04K&nAfcm1r~KXZQXvx@#TZQHI21YA%uM`>YH$7b(;y zW(GCxU<48idv@Grupm_KujZ|ByJA_lTeshF&mAwh=gzwL)@qyD&q^1`%DwM{4IG5%yWoA6C9bUst`5g`yXF;t|(%Enj0mt-77OeAmL~J|> zYXa^h@kl1hV#}Bzwi+SuUN%!60ZeeOg@9h$iirUHB>)!zJ_v3Zc9Q!@YYyr65ctF> zI->A#Y%q8BaWLV|&~1rUBLm#iVkRaJ@k>|>8}!ya*nhm|aT7@@O4NFVxqH>)$QCD` z7mF!2S+9y3kJw@4W27V)6hi}?T_^~vndshtvxaq!2g6>mS192-iu{8K=z|G%YM2E^ z@?l#Sfrb|WYuv2#_RI-?Fe7v|%UAy~|FUzE9Y-f^eH0OKAWyXevdxy>u(wj+MYtG3 zC=p*=%Z?C!+eGHXqhyR!XJP`y$#HbIu1@GWFau! zv7)E@EKM8MPu!vb0G~R;5kRVve)J6r#P5oi#3hC6t#rD?VOHGsTX9Z&1piQyh zL8#I(&6>HApJE`UbagJDMHD3d+F)7>9<0$Xg(VIPVOiW>a?7OxzQ*EwOam_`vrLD&2F-oV{dtZP|-wG6A z`Q>tbVM#W_gmiCJAx5?DBTRi#TA`f(`9!M`Ie(W=wd*G8h-1}+Ep2Gh-$-OmmlQt9 zEynA4n^da8?eZ__DrxW81G($U~ z>%10kbSZK_iC5c_WJ~&+L*)KG;h0n8A}l@-xlV!ALnIjHX%e2(OKUpY}x8AC@eriI|{p7XY+3t3~4(GGYx*b+XlO(unj81G>=q!31$I{?dU67 zmZYy}nb6m2?I})O!)!gm6pKn-FF=Yv>&xajvJ{P*XGUP9^O_6N17qX7?2$?W=Jx?->(xjRpt!s zZ*LcrZbJS~x2Ovvm`yJ*<_5F<99lW7Zcp>~B2o91GTz!%c3p=WA3S zw?8DP?}d>7KkS3xOV3O$aJA?Hyt7wg>y=rKdjXoNr9B*x(<aZr;;y5VjXPQsdIVd=oo|_4ckt9PZ2sbSEm^h1 zHeLM1xG3(qD#py0&n3n--$HvX^Cfh*emc>r^C>=%0dIk3>wLiLPiwr6e(D<=V!S9e zsIMft@6VvVlxQ_FDDK+I&c|xA{S(_R^VW}!TKKqCHu~-fEUeD=H@sDFcrw37u%BT} zj=u`fx>GHvmM{Xig#XzaI#{xdiD;3g5aE?M&uvZJ$iSvy2&WKKCojb2;2#p$YCi{m zkDAFPaxl=AD{{wdM}<_iyVdZ$YoQRa5gTR}$)+Y|n|?OYC$U>C0FGUJx4F z+6-+R*j?>_ZL_P1|J^BrI)E-hL@pJbv|BTVp9Fkokx0BeX8r3&^X{h3EDiRH0D$z&}bjn7S6 zLRyHUDzXm7(k*1~>$LwtLFz&#+cX&ZD+f435qb|hX|>z(BR-9!k`#91|*Q=_hTGOjNc>4WevRXNjjbw zeaP)QQ4%H8hXelhVeg1?{mShI8jM9~Xmb+1acEDsgLWYl;In&kU(PLP-@CU1MxS$3 z&Ad-6x8VIleZXLVzl1nw9$iuxw5kzvK8K=Ug7Al;z_|WR7(xj3H*wd3hetc& zVZYf|1z2gvu6|9#=``T(LsaLxhq{){T)K979bgg$&V z9K5ix`mpH!$GXVy;*fl%9V82xTc2fP-6*#PsUqiC24Q5)%9bcty2_B6B znPksIVH?i;5@Bn@nFj8boY{8T`@xxelrujfcw5NqEsQf40;=;cR~*Yn{Mj}8{!R9O z+`EBU@7$5JX54(l6->8aK71UrR{o_Q)Nb$~M62Q2g;oUJ%)H0DH$y%j^jc2;d=Jaj=aP41c@rNPbU zV_|_eO*FV60cMEPR_nP<_vOooiY-{TkKQ$U_lw%g`Hk_40YZgnl7%t6y(j@tV085Z zZ#OI6Zdqi!ErfTyHKbULk6(@aIurQ}+$bh1F|(Nahb6&bU}kR}Q6yfHIXGgddD9jt zkbNdj%HwEBOc-mIes<2d0ExL6$bp@UlZ}SkPD)DFM2vH?Fh(B_^^rb8(Q-P`YRCr1 zUx{OtvF*up2x=QB%tdnPu!xUG>JZXlqH!2 zm?07&OBTYu&JnhBKQBjd0lFXH-^XxiVu3kk?v@rTfWy{#>Xgao;5MxrOu0$n!1C_c z0aTNe0?eB#A5ZIMOp*nYrE~N<$Mz6+QaWeD^~ZEmMYA2oG+VqVMvhN&GWw+2LKbW! zS`De^_&y9Op^Cj7hvh>`e3OYxyG840zV<+UBC+YxrcP`y?@M&sSKb;?-ii+mgGt0C zoxK5{U%_yhpq`yMrGWP+c!<W~HN9>EyD*4lYaMm!;v$(&%Mra8??dm4+h0(E_a6I_yCf9|EkzMhLKb z36lVu;a>vmd-<0D`(^$mz{)~NfE9a@z&g~*iyUli0#)0^Tqlj1a9ttm|uLUy1 z(A|o^`jy9SN21m4!{N*a*^zKKoY|p%uyvBwR!`N5`@qhAb?>re@gUE^NKUGK)~j&> z9!^01XWgwy zhL}sr9LN%bs9YUNf|N+)#Vk=UrEy}cg*5dzIy3*ICX)d;Oy`oUUdtit3%WyIWW0qe zQLJQW%6Kn~srurZCZOJ$(LdB6}PVPi9sc_f@*x-KMRt69S@ zx$On0fWC03x52cuQm-MR5MTo1AXDUK@|#0@6F7|#X~1woXuRnNgl2Y;acv0UCsk_* ze^rO}M(GPw&oAjNY4Cd8yPE|Uf(hQ0Qe1#y<|?8`0|#tpG+&v_We}?ML#gzH3Lj1wrFa=ql+h;0i zg#*x1&>(0PvxLJ!>Uws9WMlHh!GjY#b+H-ZbP3CMjsnQ97lig@HD9!Gct;7q3h@W$ zHE5a`3`w38%vO2GUk!t+Ie+hK57{x^EC4q+rU74qrlP z_BY^1IkISH^Jz;C;xOd!2r>vZF}b7_1YxQ~VXnZCypbl#K(EBDxH3a2rn9z%qu28V zNwe3KG!KY(g~TwgN-t>+I22MCIzHr7fdOtdc{Z~6gXD-~shFHlCY;nmIQjlC2-lo- zOW6jg3=&2)lhW!SQe%LuFM>-7<>|d<?O*S_caB$Wvi4^D% zs=ji}BpwJD!pxomj2TWc z(l~^GWD*lpLZw+_DM&LM2^5zAjd8YvIiw*D8oC!Jju#3ug1!1gF<&FU04*w7(GW>U z0G8~WhSH@MC?EnKGLK%ngj-XqP6Al3d0?=g4CJ_OrR*1Ne?0!f-!NzIj_d#A$DPF;s|R|#}xU<7D~wn7+H_B zAQ}HSFr;HG)Wvj&578G~7=ep36YJ%=3$EmuQRU0&2*a%MB%HudcQX=Th{a#95;pr;Nu*T zNp>+x-j47*u_^pnEzjUA)R~b<#3F+OU~F9|OBP(V5HfK=)9A7*e_ey>;2$0w*(|n< zJjR*XcoAp=DdK!NnDW6BfU3$7=rxT~4MkQ+lG2t?h}dG0n5#`95;G8(97gqu-o

z8JUh#m@-U^!RhF8ZZ3vR&Sa1*41L38qJT|$!MzqvfaVY*a|LS|)09iYilOl(WFd>w z@+1sv&L)nTuZIi{&LZ zoWLHa1VIL)Auy^TgYwmoh4cj(hi1z*b^{QihF2Uc)BZGZ@2lHU>)0gOj*ZZfm9HWD zwm(`N$CIDZ&eKycb6gAw;tI3FrTB2DXw<;1mR)y5FhuCh;c$8n>P|BuwOh~EIKqMr zD~%!?Sn}mKLBM-)SvsevqE0d(Gfy>_wx$sjs998o)5H)Ia#afUxv&+@!(`S$shNJ4 z4fsnvBawUyKa^!+n1m*eI#ehJIafjxz%hg;hsIMxeF_WEiKdvP4@s{FUp#7^hGlFr zpJR?jMGP|Icp#&aA_WpnNK|?t#3EdPye6>%2xu(=jWSrSjp{H?CA&K6^B14Uv5A<8 zr`*#{CQ)RX)rTO#&`%MkaLbSihniGt9Fm~cSq7#SHdv$a;PtKa+vV>EhRz9XL zk71Qy(-_p5Q4u=+YZ_cMlX^HgFDJINw~0t^>hEB8I#O_`Ca;WrOq)q@i8ZG z+Xc!DlOTc;q+Eqiq&XwA=C|MQa25QN=^hAvT8W@S+Gkp%d}35 z*Y6>~3`Q8?=VYe}GiNP$0cr&F=eJ|}M%O%~TUKyHvQLDq@JR83iM6wS8{{KQvdCM7 zUm%Cg6WF9}5$U(l8lQrr0l zXd?J-J&k6#ER0c-=rh6*^GN~P$xvcYy-oSv&Q>&1t_Eai`bqnimlZmMRD(8=nDj;d zClvSxhb3%57zr{pn51fUgtR2bIgrOe%GDxQp*%XlPFF{*GZ+;on3BkE#^5zFwW8d0 zeM$>Zv?SaPp|6(aLj(}RG$MO+F>ykT(NNsudMpZ>m4*?2LSv~@e z*qJT1K{#H{aq~_HEtP1_yQs+~7Nz+)>LMJHjbK zoD&Quqyom+XwHY-3)~!Y^kv9-vK2-l92Z!j?HxUY8?4U0Fw-1?!U^=N)dkY>?K2qp zE#?pd(7}fmg4#b!4L|@RB&_eF?GR0)e0i)~BNBtH3BmzSr7l7#`KM$pOAR1<7RA4hq03SQ0|MKwuBW&)vcMJs!P75X|X2 zv?z@CEaZ;xFdYgVY!)bbWa$y*5t)xk>&&q;Cywlcg)ugQ7=zO|ZS=^=BV%XwStpO2 zKJ>uBu`>tnJ9gsOnMZ|G?mu>B?8x}IbwADuI>-i29XySbpdLDL@U(U6q0^@x96zF( zk&9>-?tO?D`22C!rJENgJ5ZLjbHVx*d|zS5CWBAc!aev3<*GowX5)qzv&7-!2Ss~PlKs~cVViKhf$QV_u`Zl zifQb~3Vs96hcr>2_oS#{Rp;DXF61X<*G<5h;;LSK^nPc6H&Y{3wmn=*gkVhgqwa*5 zAUGw9)2C`%>PW`q$~?;!rwWm9;y5rW2O~2m3h@L>d!0JMZp0(o5YZEv5*|N8n%&7yR{%QM@>IDDuO_@!Y-5^xW)OLm3NXQmELI@yvHt;gd>!Igq>=Jt7ala6+?uB(IwBfWYq_ zwGL)@2pU<;m!1UopxGY+BoUf_B*$akuoLbtYVjJ!AFv|cY%-5fNEgOFbsWH=%jC*j zlVTdg|0fs}ts%}}*iw@?NDR1!&=T0>ST=#Z0-rb7!^kl>azR{n5n(dQXy{#C5hPMG zWVm(J1xA}WyB}4=8}5?ZkUT?_i>PFn0kT{$>UGq50O1!{d9V`$2$3WREQhUz!;)AE ztQv?A2z-$?TnU&>DUQ&8OnDeeLxGg;aFDEDT^dpH*C7QOMerhRL85{fXj+LDBSH;6 zCKVruGr)z#IVplh!5f!GymU?px1c5#I&EB*ZgTlS60L}4PFs}m$sDDr#QL$`6WDazgI|FHaQ6##8 z&z*2t8IM|z;H`qoO&6_A&l&yWe4qX^P9KN^l96U68O>OHa!Lv1j=v!YcvSmQLJ2%< z!{u8;Q2Q|UvhWp6Arc3xD#8)285P3LoLV|{($@rjSZi}S=Lh0Kru&%BunUP&-rI4z@r(!~ zi7?pU!>gv;3^&dbgz5vNIT+@x9SiY&NjoSO^1Wi1`sbx+&cro`xllOLg?-@>3C6~U zG%qBKlKgR{hGy@T2HSp>I-LA0_3VFKw`^HFNVhK$x*|IR^9mvoaOtqc-s5p+A$L&PoC^(9xWDRDM0EZjD+9Od$oo6jA_+ESumL?%2? z;&hbH;(@k9TnINYt*mTeAVotEBmNAtdxRxu&mp#<31$pEU)TipA`Ck&6I#XBE;zV$ zD7j3HjhyQfjvVH^37ALU!C3vsTFxgoE+Jwd6T1tm?NdxG-KPBrsKrck9qh~WE~9Dt z6iQ10K%$iOL~_2UdQ2ScP_Xg@Z?&99u0Wy`97u~n_R(tuEtZx-1Oh84v>m7+t;Dub z2E%O>v=q3Wxgr-hJB^)1eR{cj44frGLRJ(Lp)<`Hi<<36$gH5%H!m$`8(3BaW`OedA5UsCDjsWC|A`Bag$LO*kt3!(V(IJKA) zwr~BG3^hA-yG@3QY6hoJ0(iPUq!TH>B=EjNc1B*#?FPMwy&i)P;7)j?} zOMm2&Upa{;L#o{AF#i4)SsI>EzjBPL&i=lxF_K^>m~3g^K;z(_3;PCfvGK{p6dSkB zDK^||AU2k^Fpw!|5DT59EsR9;@nGE1zqEw`4^}^Ne8lDZzXB7&aEh{F8`+*TpqBO$ zCFhTBVuk_CK$C2)Cj81B?j>R>f?ZL}!{E|>BKAN1*l?hhTgmodu+_%B;^)eKBBpi> zR$e?!#3&{?u8_aDm>IFNINEy-rg$(;7YUfKQYgI(<_lLuW%%D{ z;%kRFQ!fQsmavW6W!@zTsUe-p*CNT)7nX`mQCZ?cYkyka*{7B!X7E{@n3$kinhYe2 zd^RT|w#)X9iz#pqtHAv`k(LYj4xm$k`ztWu1A*IRmbGVF+V&^88k0`IMC>KA8l1vC zrd7i-zUiYtiBanyr&@Fo)>T3^^F3z|+0=STrIzV6j~a~mxOGgIXxn^`jO|V)Q9}!O z+HD3k`MLw))7gMP}7Pay~K#froc&zn0fPzH(cwzI#y#LOmB z;u142G4peRnFC(t2aHP$9Hcs3V&EkPer_;uY%#E5a1mqMkLzM!E&5p4X-J(e28MCY zQjbYl#q$6=s>$a7KWir$Srd8W=)-8|tqAk;>32jhy5R7hI~QyBiCCKkG-npp;eMoG z?KuDHa37Mdid{;(HTZY{%c0IQueQp9DCeipzivJOlrSx0;*w4zgH0!?Lg&i4%J!3U zV-l_o_nK`rKm|UKldS{hBWq4x8<1ZFcVVhkKQ5!|JgX)-hpY?7BuVT7ldSffVb#o8 zki^AWczRVVZv0%ft!K=PvWZ+Yw`xBUtC}9V&8jMk`yNxO8bn5BaY6Z1drhXQUkGbv zOi0xv+q9x%%7ADlRW7ob5{hYux=N!eazu}~6kk1NPwhE% zD)$t{c=g@=n!FTGqtb*ceL$PY-^vVUgKU6OrnT#y$e$x=YP{2?Z^0tMH%wUypGP!f zDmf5d5dSkX$!{u3IO^uZPQkl!A6zE?%z?ZpT5tlHX{tJB!WpJ&QTdkLx_&)%#NB zP9>GZMzUuI^U}=$2%TEq!Sp1_BKu5qAM`H7@yv7?BazdKNg^2~k+H=hk+UnXr5#LD z7e`j~uwrUu@65ki3X>SLJyfCHN~yKY4f|j)Aff~bpIyF$o>Dfzj<{!+Py&jHhZ{MI zDFP-{1WYcP2;lB_*XOZB?fI^}13h^Ldh!bNziMfgok)VbO}#LThhqp{K19!=Ob8by-sNFn_tq% z3q91#moNsWO}{Bh_I0>bNR1;iX{wy}*Verq^|rKG(b;B2T+J*YpU3MxV>?B0 z@$hdJQ#@RXGTlOWyVC%f4}ovTd4@C&2f}xSumht(*PWjc$o;+On}~5)=mCL<6sPkt zneA1BiaRkSvf4tB0gq#F3w_XJL&&kOx^G!svADgyXn~G)734I zBxm|?=x9Gq9PQ6>qkTAQG+@)D+}*r{EjXTn)2DeF*l2((k!ed9;-Lx&48`Qd7Z+1r zcq%WxuxRq)$O;^U)XOovVjs!pW{BmRuI70d<-X7$GDm8+JcBo|J>gCW>UDYmZ?C8C z_T}hZ7>zxgyW59DcO%CEc6;J(pN`uN#70ua9$uob9u9Y2qA<;PlGIBNJZGp1n+9@p zIQIri0cm>cf+{cs@smXPnEIY`q+CKFzej-Jfo* zhs`mIVK+yccXh6LTT9|&OSFv?oA%%mZD*(Rg~GnU=NxSZq%CXfC3=P&T%zZxa``z+ z&oNKP_ZQQ0`f0VC{&~?XryqfKIhe`VIQ1T9BR`U^G6CQWRrSHFeujovqZ2SI@&%l? zJZe3XgSQOn^ulnT(v&1k6_t(GS_DPY%yI2BL`liB^KQq520a2g{%uyb)*HI54N4_wZ>CNHTyYCV7$1AJ+!(Ru-5|gs$8K5h=2qCd!njY;CI>lE2hC=jjwIqH0xqPX0uCmW zPZuq5KhexHIG6+uaN;&T3e~!~av^Iqr(R4~iv`%q&}WxG<2K9^Q8IFOi720CsTp_S>{_>o`EPzv4Uui=qc8by77`&O(SOeU z4D4gnU(S=5Kj#?!ZVLL_tGSI6?s)I|BV&iH2k*De965b*+&YMxLl2G}K6d8VgJa_{ z)}Fg&%<#K?G4cI=#dn+Gy!7CyQy9^)v-i+mp&DL784C0jG<-5c!>CpRW&}q;HkHANGVIwZ zVzv?dq~XCDj-}P|b|LHHP}xiY7AuV-YoeOYoVQ^`4n1{gh=F{CbOt374<&e}`6vFf z{NxO6pnM6|Y*7r+QET{cxpYf#T#(q!euFpdwX8FkHwmzJbLBcLIE0b~ePf@Ivm0?A z%PAYQV%?ciEq&2sxPNd@%3gF#6`RIN8|7dg>BS^XP`tzwxG@ zyqb6&xQKE)clP?r?{RbHHH)cNKCF7>WVhzbEzm@{9nK5!nEJth(tOXg5kLUY*Fb1~ZY7V=_DE8B~Sy^qJVazZ$Jzhq30Y>cuCfi-i$^K+)vJ)nl_o7^_ zR=H>Y{^{xI(X?2eqvh(<{(>I8;qE_i?9h?1@gpOc=(g(IyS4L1f;rnc5VHlHw-N_W zf)&9*R2vIwG=|ODeqhsEU9~6c)qFz$Gs~16fLXEmqv)fnb<`s(6N2Y6+TfeJZLmp_ znFd=+va`2C89!7KFJjexqMlcup)5aO(sA>-ke(Jd-&ECxT_`@vFhb5PPuAcJ#Cd4& zz*h4Ub=r<~ICAwcD8ow@_&r(ywkWdR4M{-BP@lp{EE5VhIyerGb3}XucC=fuGx^DU z1|up>)nVUSQ)PIDOSI~d#KC-sBHm?eP8Rbu<85vlPJG#Q_9f3A3i}_G^NgY~#-_i} z4>mQ7*~C?!iweDk_$o|;OKVvu4$oUWGjO%VDdN{t!Ve*#a%j#ydb=*0> zip!Yuez`ut2Oq-4tk&NwPk&9WACc>?%k?+p`cYh+-{j?ExEx>Zd|ZD%fuAwwlXCqn zxqgZTE1cKzXO;75{rQX(eO9iY!}YTBFs`|O>-;u;oX_*}JG^{>m){MZ{T~1NeO|uE z%OCLadR%f(JAa6uvE1%4=Rfh@b6(A|Yw4~9`Ine-ti6UmmJauCt?VEu}`!oEN+c73<3rtHFrw@_kR3>~Q(W-Z7f394#_gCvB zEI9VlF}U9@xpr})Fp@5n%JCay8F2TjDA-@rVUJc_*v_)-X(3d+J*L_nBghpC?2N<` z6*LL9pgL2_5}C>BbBH^lNyVKa%=vphXa`wbqB^m5LvbffEQz~r#GRn-sup+OBYpi7 zE`hk?lTh5T$RWc$yW)=A0AYR|WkB!ZZZ~oXcOdE7SBnX`q4fYtgz^pet6xIy#zd>$ zfo_EyRy6YnxZSAInQUXtF2ouU6Gf488z1y0)})CgvDS@P6VzSRV(l){*PXZoVvSEi zvBn~YEcWb*HSz_-+D-itYd4*?D|Wh8OuOgdewg2q>!5y2(4~kp5p<8@uYL)-*Ckr@ z9_U`sg~Ojm;@yPpj{sGjiN4q?UC2P=P>O7*3 zd;w86)E`lI?f994r#p~ybJU9oxfL6HuKoW3XTOBp_lbJZ_1da;Z?_8xoY+#GN5Wmp zI-Q9(soI5X<0zuzaW)fey~#FdVoA1jBijUZSG8>0N&4D`OCa0$B$RC|a>!-Ru52S; zK(<}qAKCW2afEG@rfPY+0|7T*<(QN^Ky-;bx*LD>OUk_>(W-Z(dnsoIK98t-9s^qh zL!HUHuznXpkEn_w%{j>jy$L;OVoB(ABlHAySGCX^Cw-m5B@lXi5(+&QIb^zLSLl&1 zAoQN!AECGV%<20(5O?jX#RT0Oh$0bm7w}iV1l>%c)$TXIYSqbkMBHvv=}fq>W*1_O zh>4=exxxp%i8X0rNvw4v)&zA|wOD%x>FdXE3B($ogkp_F4q5Ek6>H=Rh_xH~Bi5|i z>9K=wJ(Whrk8~j3=C2+Ta~~nfM9h5vfAveueK^soceq=7u2wCjIrw>Go#odXaqZ4z zUi6JFWFN5=#hddvKIl#MNfS%5uN&DXsJp6V-|vyWeg~I8_VGz5`&i_V?-p71J)0X} zf5$QQNmzv&U*AEi5ZB3#uLJYR-39G?_1v0DZQb_zKBu`~+g=<#w!O$fi?r<}O((a# zk}4u8KfV~7T}x-vHJmkMQ{PVF;;qc)GquJ$CG^-^UE}_%E8nBCdCM|*_k+WDbb!!%F`EO*VfvC5@qdhGbd z`8&Su;HhKQxLvDPBrO1wKVkb;x=8v`28n(Ka_Y^LfVxi_Z=+iHmD0Vc+pM0-zvE(<6*&(s( zmNtn^H-I?L>J=rT)sesv))8NX4}C&Y=7XzRN1-_%X;)AKZ+KhyT|QDGrg)y%R5e}6 z!B}b)&E_P&-|os*`Ys?}n6>JyVY(Wu{0oiC;V0TO-aMqCL}p49741gOGe%YT#rA(E zmKJ0gnuOqyaqN zWL}59dYsH%-8KOB}aPQ^^6&H^Chasci;gN6!5!qd=K8xpLgp| z>{DOWq%u#J`Q|JyZ{y|d(hx4lG4SL3`zLsLCoZ#2L$2?V>$`Eqr|3`1&3kZlev+4; z;)So&)m?uRoL}4cOtk+8b&zfCr!EO#>#-7iQnsWav1-h~689B+cCkpo+jcXuPqS-$ zHJ%+YT{qcHpX!}FKGAIxAy+H%li4=rq7pL@a<$H%5@{DrgiySz+kqI_A`5|bT+-Gu z?^?EW>I3>;eIhXqZ$4@B&)uRhls5lUnwUe{v}4h(5xM@frb=Rph&Xrd+1wwaw+VIL zhMP@(ChfF|FRw$-y_&$%L>GwcTG@@8^ieTa;42pmhih;4^HnvP@OMw|_DFwsyUj>H*Dc0E?tg8!O(c=tg(e7< z$u5DSizY%Swo4OjrGB?lzy4S|SO445VL!Yrtz=bff1!!jyl&?#oc7snn@A$Oi#ZFY zT~$vPO@vVVW48*>*bw4ET(Aw%Ej6{=yZKz72#G_P&tCX+xAPv7&L_KVBAm33b=!oQ zG}*0s#wKk68(-h;(^PVR^G)S{?-q&SRDQeLCc>%wZ{0Rwrc$>0p0TOyY}atlmi|a~ zj%~hKybgW!YIk9&b*7XP1an=rE|fi=(AEG{fY z=f)s}W`=m~DWgC8I_v455B7SIW;D^czKa_L$A*0}j7(Twd?rmiE zuAKn{6F3S4aYy=SGCvi0v>CN(I7T34&YogD0puJu`mS(i#>2&Sz0Euw#7))8sj59u z&lj>1$iy0NM@@qM4yhX4)x8Z2O>HO@7>4XJdgTsjm! zsZV$VVp-Ga%0Ud%5iI_Fw~+;g!oSm zR;O_9yk1^S$(5fyjX96w?^!2}D|U7>@`G3=?(LdUg3Z%0F=&ZmwD`3tFl(Pcl ztiU)cAkGSevjX63U1mM^72-s@citv&Dm7fgRNi5kdFa-JfxLBI}}5b~SeVRJD9@MneLf zLm0C+fcNbx!tuOS*vLjRZ*5GxwSkW>%2{m|K+JGMK<}{S|2}ksSTuRv`9<7#>vfyL ziZ-y?wRw(Q!}(Q#s>NID#-)aJ3MYG*USnN3AJ*|~i|vI3oglE2+!mrj#&3}DmWK21 z@V4{sr3u^-3Ihu6*s^IJcguJx42jYC`_;>qy`>>j=B+}QBG`i*wPLphL|2bQ2f$=Jo<-k(lFDb2MT|X z`nk`cUoyne15ciM%{5=US3x;?;LX30`qp)c;gE{ zp`oWo4>)V@-t{ovBhMT?aQ?#obU%PQvJT4r+a2Hf@i%E0D#~_`Jo*m2M@Bk&;E5mp z$6Y`9a~h6%^g#ajS8td^O|lhg-jLdL@e?>;qVBCmrhUk(hPTcTR=t)7xoo~4BA@c{ zp;G>d!}?VY$l~n{$h>Sp^g+Y<91!hoIE<6E3gvW`Z@5Z)-qtdXj_lM*lbS Ci*IxQ literal 0 HcmV?d00001 diff --git a/.doctrees/eponine.doctree b/.doctrees/eponine.doctree new file mode 100644 index 0000000000000000000000000000000000000000..b1f7732ed25ce03ab85d9c2e01fdc1882b3b140d GIT binary patch literal 2502 zcmai0O>Y}F5KZjJvTRwl^HCIt-8v}JG-xapK@UZ*X-`IcD2kpM5Y&aBGxKKXKYRcDJGfW>#6wpJsh4BQm^O^N6nB{^ zLdmsHpVG^}(ued-99VkgOt1w{@g6J+Ar-S+r*|oivbmSajobTu#|tlw?yifT*b)7A zNep7oORxBylX&uTWwg}%?5$xz@w1=W;IwwpUVHE>UuHP}WBoBTaCa&Sa6XCSI3Qg% zVmt1%NnFMU3Nh1Vn9{gMy|;22Jd)4JZcFBJV*Nr<=b*%QPt&sb+GU}-6{fUUSU$@( zA@)6;=c6PJ#Zxg9Ct_Qi#y1mTNVSK z0^bXWd#xC(f^^_bL2^6uDZ=%D%U-AWaAu6x#`8Oe7x&{qCb3)dw1j4Wq8B_TmHv(+sjJ`#*M(uQN^ubU?EHswC-HrE9#kE6!vEr8Y4ll6m*oAD?o0D3ur`Y0rn z;(?-i9_XB-+zj#-R#ALpd0{Lgj8`BB!bmXVGVT;c&yXX^AsOh&XL6auP8`wT4Y^gt zEeS>)uuxW{V;!nmDWm+>bld4%qpXDzEaopyGiS}l14E^56&hA9; z^Ei(bXrt#~p^~Na>Fv>rII4I>P!x_qEb4*{vt~+xJx@mbTzFr(A14#2-MG5;!sxNF z^GS+NvSkebmc;WC?eS>GF7)Tmzxy8b9NAg1;XZ3_-G9Auk4dGOuM2L+lKWX512aDn zzElV{@N|k1VqT<+-FON@mZY1_E&<}I%#fRS@SyR{u%XIz32}Q7Dul={U;Uo7OW+3VF@@AKaA36+9_Bsa z!gRwr>$4a;xX2W-1FZS&4S4R5nf z*vTV=CldO8RyN<_wV1d#$O?a50pW)vUf($J41XtL=;FcMX4SV33W=8I@bK7Z@=UJm z8kl!AjUB+Fx#iTTuK%^^;|*nJJy`QNSVgTbJzVpT-D-Va=1(?#wI_JUurUe~@;*p$ zzc5Onu*d;VM*mH#|Agc}reDB*{3C)n!oLm<{cZwwi(^f_->K`C?Mq##z%oVVxm$ZI O@3wXgqo#Ali%*>gg|Lpzq@8Dkj6AxV_q+X6GW7;t8Qru;x z2qo7(eM&F?N*~fUabW3{Gr<--#e1+QgjCFOo!+H5%I01wH*W9u9WT5zdUaj&#E$5{ zOJWdvUV6pvoW#?gxt=QO{MlQ>g5qay+UT_Q(cXLTD_>?j|7ZR&HGp?23V1$=<2WFz ze8hI#Y16oj50unAU4|)*d(?X?r@%Dbt_D1v9NrW zZ9?pOI?qQ*9EvAmD4vRKaT?!Dgem#N2CccBTp7EVaP4?GRp(S|vn~Lvn=~LN^R_f& z>yXM97h3=;z63(?42Vv<?wV@$yzx|}i+gdev*8S4$noySQ4wtJ6jJ z41ww8S9DS?>UOL754;HE3p@k`BI`*p8DWA zqh9PWJ`Hn(8(mSWQ7c$jPD^M8D0;zjQt9tFlDZ0>a9tP%s}u*p&(421cM{)E*AEG| z)>tB_W{O+XIYTXciialnbuYcz3n;m9vf)Df9!HJSTL9hFr|SnBH{(%G0Q7PK^-)MD z#REn4JkU8uxf$dw?4$V5^1@g~7_UGMgppvzW!x!@o*_q+Lo(2l&*UqV4W3!}%z z&L=58&XzR*SQ5`mw8x_zyU?FM|L%L#b7W`5hWo6!b^mqe9+OHlUl-htCHJ#B24;RD ze5nv@;OP`2#JorsyYUo+EXis%R|ybTWrp0uBX_MmT@oSZLg5$WeV|O{{m_*ZQ}#!| zP&*XrVJ$ZzQKq16X-^A5fd`Fmh7DD&ONiTxP$5Kq{_01qT>>{?k13>{fdk!EILUj$ zh3ST!EHinPq0K1f2WgSOnR3b*=Jy&91m_+>9v84$5MENL2wv*ETWi?I?OO}7s#&ws zZsIoA@AJbJcbi>;;RO|?W)j2UiKlkXv77KR90L@n<*`yh85V+UBW)8s26r zVJD9eUP%p4GK^L{Ybh73jyVd%<%pY(1YESTxVPg~~2>(4e^t%bTS{!TY{gt|I*}l|;3M^A(p1ZZj O@@{L_Kz^gcbo?K61?>I+ literal 0 HcmV?d00001 diff --git a/.doctrees/index.doctree b/.doctrees/index.doctree new file mode 100644 index 0000000000000000000000000000000000000000..800b59ee506723aa854735ee03a899b412790e2a GIT binary patch literal 7631 zcmeHM>uMy&71mxx(zI?Xd3POS%PFsKTC*D2>%`cK<3w4@SYCTJtYka>vGn$I*G%YDGrE4Mr`?ae~m{GE?(TXs138lI-K`>QA$uWE-j(TSFP9vCT6z zgB`YTJtyWtb_a{gv_Ek@*(wOk*`a^rylDI=Jv%eA&pAs3XYE@DdpCAj*Y!AaT$#jf zCr!A+hHfIT!If+n#sk(3V+O9=#0>+>V{U*6-=dKb^PUwuZqQ?P7>#4MClVG810GA^ zMlHj5)3tdZK{5>-9_veYBFo0z#mY7I4mN`nyWV=1Z4g&iilr-8zhjKUl=;?}1!2Nc zNnC>|%`YF>JW9X}ZuTS3wE~-$j91iK#(M>Uu#;HWYiT}N*ww5Q7cna_42D0EB+>TP z)^Ip%S(?jM827fk{0(yJO$e*Kzq<)e4dd;=<5IGizn{7>9@rT(D*_+3)qylUYsg4y zy_jPy35m~P3<(CkYfOgSWN5|QsLOmJppq-Rw7vl%vI2HxXP@ouUtvGk+27m0X1u$1 z@cON{57@gqw{P#X5B7HV*{$2`#;x|Ndk1^B+8DjYcG~Z;n|tk7uQ3k2LJNEp#l$-p zbV+pFX&I$Sl$VpvNf|QYw%c`WyeR0UR*$n@c#p>csXXGb?@Cgh1Z$4rxxSldyO1?~ z7Zh8Wn7fmSraFJXM`Y1oTOvH>YfJoJSmK8np{bgU;DkU|u_!y1GOVNkK&hejoa;!y zs+zMsOG@A|zBdBP&%ez(X*3yhEPD|1uHMre`QEk!d;p^7$DbSTO#!NR-6Vv(JjK?EkaPg<84|&5FQ zlOjw#2SCg`4qgm93^ZO71jQl1|85f63BdF&FfrzK;@;y0qOATuzAU#;*vT_6P4OT? zzjz4f`7r+1@&8TyKZgIu#S^J`GB+sklsG4z78~N~&5KZcQ#E1U2tZaOs{8?Fu(Sg! zf*L}P4P4khf%59~Y<~R)?%&SIw#C(UdIBfJ#f!!550QD(G0nxCByEL3jR!GHw{C#N zM&c$OuPv$h8_+zQQkI-eCMHbXIz3ZwftfdIqFD!1FI7I#y&{gpb556C*W;Q8JDIo9E~PwSZ5gDoCkd zr@zq4$eIFtrE@@|9tYOV6;H~D2VR)qqu}KZG`*_6_f=JQjGFkdPFZ&a;zL`Xc7=Ju z!4QdFO{cjpK|}>(R=AFXD&tTs6?CeJ`5^T> z92szSb4D53pJf<$W9&6htW4O`!}1342NKh73UxgOG5vblbks^AkszG!Kp_&*-+9n%~U+TdbKV(d+gSJiw;q2}@b zI{r-?Vt6WN|L3&E>cXg;9X48b^M9Z0=7%*m7r(4=Uia=7A>@CYba~wcY4hLixA`yF z^yi7%$dLY8im_CK9|DuVKn?xHGcz+sH8Gj0lrfotK1xy(ee^F95goz5DAb-(CH+-U zIq9v(Xr=!s&V4z>R8OcY<|T2tzkDAS>bjx*#wqrnsGg zE~?oa1v7Q#86B)YE6|@jRAXk^nVeQ@a5h3~R6WjSf!0=;09UKjcPO#kD$`ynVpW(#hSKu!pi{FFCWWt`Yh7n9fuWS&Zz$OO>}l6hs> zNJ1o;dAuz4=IsxK#<@TW!@u4B)YqgfTLMrh@_xX{sM#u#jJa;1monG>Tywdl)St2Afpf(kiZN zP&^-JYORZ+3{5#+TfBKjEm59~guon8i!j5?GIbRrvuH$0kbF3w;U1^fq%^77XqGiL zZY&NIMK>NF^C*lFJo!Bip`BHRu)J#6P^*08LRM%zrLx@APz{H7(jKl`rks(IY0%}C zkC`SEV{>{GQpsgEh|0YJF;DibVhSsfpnrMt**9GMCq2y-$q_z?}G4Hw3%}sR0MDLSw zG(4o>a;|g;IM*T`BjEzNPy^AWVw+j!x9T!|!zF0HP)-XC6Ez1aUqD(~4Pm0I4vsz@b10J_ro^lrTdVra?qz=^uIYw_~WC}FvJ!;rfzbGWrUz9#tJm&i;{8~a# z59o0|G`-Na^3p-A+X9^h8;Z~U4N}%3#OXmAA@QdlB6KBC-~h@7%uu~N0fse#3Ym7M z_PIWK%(%?Ty^%UugA6u<8pDALkHLcAsQV7pB^$d2CP(?`nfQ5v;8nA|S`_OrRi*p-n1X2~KvkFxDkcJLwRU7S@BCpJ)VkGx z>RW0WVt$S$^Y0t|pTWudAJE5->0^YCR5fV_mAg77=skye{V){|q2Hqqh&S|Z@oB1- z>MGTDETJye_D^P%&yeSq`|`)sXYze$W5NXdPUuxuqPJe0nyhv=k5Fuux9US{N9Y5D z*?nW{HF(mk5b{jr|4i>x(EmsMvpbJqe zEz2>Qm3}!piE@pyHCKz~3l2-4<96h(jn?L+&WA&2CyE?zY$`Vs*m zmNRG0oH_HIGiT1>_bP8+oIN1_#8l{W+uf`imgRaD3llMBd1l;YZj`*0%)Obsp3I7B zU~Gh59GEN-2S8zR+pz-XCO6PIN%WEJg!PQUsOfe4#`DTc@u33;RvFVG&a~x~>r0mw zwU+HL&9cKNu$ytjEN#P%I0)=e+wg)lt>pz8q_QL1a}7tcT{LtJdaDJjZ3LF>wl&l9 zdx72Nk>+ip8Ez0AjGxzFfbc&5~3zS=Y?m zw`x5v*1ASdbG=B5Ly{UoNqO0($@~byVCJsx*oJE|C3w!gUVAxX;58!yw1$*Z^IB4r zY$DBwYBddiJc|6s8jX#Ojk+PFtb0Mb;iPK_8_z;n%d3m?khE5N-gQ_QY5{vSwgW7% z+0zUka+pRF+H{N!jkMMd82TcQU0+&R#@kcc!t%@7 zm8Ip&=QW0X#V)W-KOos5piQb{R=uVmp(dw2r_Bg`X4);=#ERT@Y_yry_SRY8(w6%y z=-MG|UI@{wnqznENa7+a?RUnpp77Bd39pJH*V!f^`g0`0Vm?RW{{xA)67r^E#D@{W zyYh*!X^5H;WezZuuJ*8Pg>b84)O3t6gg?gbifeS!Ut?D67cWi2TnkuB(o{FQ&SN3m z2VC?R85#@LSrUuU$Y|4ugxB~^3Y}jrX8IDsA!YC0(9NT5dm8rN1iyIA@N!~g?MtFsfkTuStvl7{n!%AJ^ z{)MYc+A51;pR5|5OY)U=o!ap9o+PPqXR*dd_!)kfpIzp2%W>1-_uv5I_rV7|fdA9@ z{{sHMcq57V!@L3V^C>x><#Si2A^5rU%qxVwpc=%)wbbp>;T9^P`Wp)|F78i^Cre`7 zE%i4N89|#Br!cRGiF#erGtE4f3b5PqL^V#G~RUi^)hT-$_ zhRiIu+G2_UjrIn|r@7|EboiN0Os8)q!n7EMw9w4WT{LsUPSck&+GyyjH14 zw%^lhvrz1YZ8Q;cH7&q&P9U7TxbIU4NJaJRcjxAk5kH3~0 z&a}8|2lh#!+c(O(g`HJ%&6MR{{7i&Y7I1vKNF|AWRF-IWa}-D9u8EzPi4m+K4(vqC z?@N&q^0xq%H?YayQMwctw0-VJzoqRcVgcQq7LcPjUkQJQ{LfW^P*x!~xpFWQby^&( zmo(V7r)*D$rYz)saQg0@yx%5>;==8~Tk>A6q#vkFH4uFFLPUi*X7ZL{)ToFX5n|GY z#nv0#UT1pO2qP8{(zRKHm;>!vGeBU?=TgNNR`9;Eg6VD2mGt#N8FBoF`I27v->g8H z!LdP^N+SKXEYh8gU^^@RWAW`Fu)n9ab94Bh&m1ldWe$6Ceqz8vw##4G$4-6Okz82E zAEb5gpG%VKrQEB#nm1o}v&~sJ*`ne&1p3@Uh$i;ushw1uI zm{v@7g|8w=c7SiGZxFtn@q-5rlo3qA4LJ3_Z5j@xr?AYweJYeLDwHCVQUH`*hJga; z2$r=0uPiQq7F;FMS!ijZ%&kCHXC68&gR2DXZ{*P4-%=Ey$4gU|X8hW~jCY1}A0r_7 z%n(S1$jULxHTL0nZs?6k*P?C%qEC_ny#vkLfVr{~a!6 z+ryIG`HPV>a8Ja+d8x%PyCP5kBriEo=N>n@vDGXorl3$XqEs1IgdS$RReU^F}@ct*}3IoVsXxNYXjlBlWM>zjJ|$f|N?!qMsDQ0}q|oNce4#n2DRk z6k;q?Ff2^9+*V3id`SU213F=A4}ec*IC>8EQ)G^FT@N%Dy8ivXbWLFYT|PpB{Y>2K zypARncBgmf(#>K5X^jxcgsxGmZNo-2?^L3eS_&!un$Ni(M4W}RA7bP%0RK}yLk95O zy?^HypzXXzk6+TLkto>3HT^DaZ2CDQrK| zJ(}rwE|WE$J0yVA4NIGEQmupqHf@~YG}=wuXx8?{t4Jp8Zyept_cua?!TTFUK~H*w zeXggyl7ghC6te){89){#gIyCq{6YSZ7^M`v>xIc}Q9(5g<$x_QrmASj(7QlmA|^R% zrViCjb#l1Kg_5Uwh-@NFv65pifL?YgeTn&!QyFOA!>PcIOAPNfe0x5mygw=p*8BjQ zENL%@N|RLEs{?s&`ZSemghyNX0uY~m4o6am1q#n=$lkqM*>nzQaRq&vkHC)mJg&Y%wh5z z(Wy$WtKt-9%m!rDDl9%=z84^s&ej=}c1YB?;pDFsG0iq@=n56vI8;OxQL$JvZezMh zl&Go93yOdlU9?o8bd%Adfayuw_2WoKs^6muL?Wtj)S7>EKD6=sRDY+=g1`%O4p=!X zfSyTI6J@F?R5ALwR3w)~oF3>IV9|LM79u87zJ&~G^r`-ifx+S!tpNxNIaK7xO5IUq znb5ceyF7$%D#Tql*Sx^eE#?Csn8pS;mc@waxh*Uc8nG=PR0W)qMjUy1(IgI0+2^Pg zcYQqv9uzAZY+x=xMwb{)$rcG|+Ww-+4_Rz^Ix32wI)<~z3mM8z#Yl+~lwH>C&`u#b zrQ@Rk`UU|D$)p@r1_9%mz+ys}Kw8cNYBDmNKB|!Q%ainrYFjLzq9JyexLMfpaeRD| zzXGDuWK}?p+XfJ2@jrR)*jX{@Gry<<(PAd3rD;HRG7fRCx{RYatfv8&{L&&3Cx}uC z07@N29&Aq}3#rVXfB3>zq0h;nWe%{XmV$kL*N3qh1lctf)NK~Ej29LT<1Bi`` zCalPccyeV-oCYSldTyS1IY3Wqxm)5`*h3VssplS>%B&tieAZL^)HVeFmD^f*M1e^YGlpl0|k{~7<7f7CfaQT}mytkC0G zdi;hSzoy4O>G2PGJV~P;$0HV1;!k%+d9uhEwj}p0?%d|@-sT_QmTYfJmbWFlEy-$2 zve}CHeW+(ksrdO+q$eTLO^Eap{t^FUD$fK>E9H5Leo1*KCy~lSHxVh1JmF(;w2VHf zy`yIKMGYZ7Z6PP4=u*9xTT(iFssOZho1T*cT9V#9(3n$K`#4tBta8xtKK?i_f`|^N z6N9|69vseafu7k%2E3!BSM=xdVZ(*}S ziJQr=hhkM%wHD`e_B}&!Dar1-(_;P^>~TQGprugNX0pI$Mnfr$zAMWu-BPtagj|0C zO7;rzDB^epbRQC$_6P+gnSQ!8`^rl0Y_CubjPoTSL_&nZ7Kp6fsw a+<02*Cj)QOhbT3RPNvL>Q;>yP_J05@svGP2zn#C%`P}JW`}1#{l7F%XD$p@dmJ8c5#`tyEQ>QiuZp%}SAye&T6~&;g z^K|{Gb?3+2e(FYt&eKml^|6|lB!g!*Hum@T>#n?052LP~FW#utY9FaPmsQ8_`{Ykt zuhksKSuq2zII-sjfzwlN-$^iGqM}~xxc#=%3j1ySiqi=rCymv*6RANIwo~EsI>+II zZ9mpDCxCA3v^kk-JIzC9R|`e#d<26>VcPYaPdZ@-KYToAByI$vFd74?6%Gy~zw0GV zxDT>B00si#Cx?!kCSDl%KP8h99AZ#?Jn`Jb!F1io#asQZJY>+fQ>(5UI9oF4*z{?i zcnQ$Tae+F9u=4|ZP>(Z*nA*VQs~B@&Qcy67!eHHj1lu2hz`9N(cs1>}@meeF^};@f zF|RoLe&Xpt^i*}{S-e5?25B@1A;|?9bKVL^R?HA9!qeDU_1E-!;l7I2!K?^8;q*S( z%fHv1By?IX_{--AguX6VM^4Y}yIn=gz!~GT?TXc0q2Bb$vkCuTVpJ62UAaru>bW;LelKkMz{nLf6<+%NR*(w%uxL&{ zOq{^)`3c?y%i^$;>{Euci2)1RAh%U28HEVwyO2Sx(jC8>MsgEO2$VGkSDH5<3gZyF z{X-2Wh@S=``<*E4LAF|++Xt{B{0USmCOUdxpd?oU^Rwf)jwXqWwGNV(@FI{E)SwRo z0M~Xx0n4D)1;+t8E{`B7lrq@e(qAVJ^%Yp{F(s!dr{rmiLNP7G z+wWWGwQy@%8B}_18&=_#>j!Q#u=-3s8;JnnV-Yd%6_7(!Tq0Z;DWDGDpmiNqN|Odp zVph-*?u>pw7|u}%C*NO%;Hm?+H^7{D3sxB-tl#2en}dOZSRX)3f^dJ$D8gkG`M1E6 zTgo93;t?v4(;R&=-i}6^QOwe22|wVg;I$}5Qavga>rTuauh+cDsxk!n+l;(2NbZxsf<4^Lb?1% z2qeMNy0emFv%-NGX)(Yub`=t*0+`+?gf(4vK=!7Kh=JM?kpz8U)$1V!(SE_9oC`c! zUUK4)Hc4FQf~YyvX2jH1>@3F_9UWK~(7-SGkk&3lHcl{9$tjYyw1x{9!~?&ThG`6~?77iR+A&0z7%5`t!a8cS$PHpUCDs_=mM0-z z5Xo45Hiaw!cZf)cm{Pk|2A(C=f?;{O?tGe|Gs%A`55@I}s_yKj+D97$HZgy&DpaQV_?aj7ZH*~UHln^ zhi;G@UhG5)zkCE+x55^Uu@-onO$0h8qv^GI4IYOtVa7Rbw!)4;Fi4wt5oCiX4gwc) zoL>Q`+Bt%}W^lTpQiha=*ttcQaCOW?f&(UC0%1z=2H5e@5<9L!GQpTTmKUqwpBg}8 zVh4e~(K3mrO*LW78E6zsyh5}LHhC_h7zSU$6iH6Q4gzb5j8y;=8q0rSA;O4}0oahM zwhm9_Y2#hBa8U$xieu+<2ZMn5T-XQ4MZ}SNS)fo;@R2O*XRUlegoURieJ{*kA37Pw zZsd#Fbs|_3m=3yjSg_5 zFpe(@g$R8sOc~ke-;i$C2~b>0{e&0>3Q-zOIHCq?#|Z-78?~j!nkxDv12Sq0lG>U< za6^YhA&MqOp!~k3J`-E2MbK7Z*p_yfFds!PTweu~u6vo%Yz>3RpJ)0l$4 zk`9y0EjOZ^AZ|w)3+7d4Xd(-on3gIRS4spkVX84jR|YA~*(%K$sRU}nkW3yeWyA!U zuvBrfxLUf>=a}*)c!IKB9+83xVkjZX5sV_k8R428!Inj#^%ft=(k4M-RZwgqF)l(W z$Op`yAqd`u!nQ;Hrkf^qq@UKKhyjD0oOk5+uAV@#%}(5Q-&NEA2`C>MGJcVWjcic=^c;uZLx zXGGCy0~`ZgLEM5WIW{GFPiCV*mp4abTKpO1XS7`7_?^OH(7kmFhgC)GQ}6+~7@B!p z8+kcJK}dVhF%bi0s8~5FC|DvEM35k?fenw^7b#0f!leom~*gojqVh z2GbH%=vrc})N*xx$_P-rB+3p&t(M_K2@s<+VtaJ%YRpw(?y)pOPVLI!cq84;gGBGw-v`)?c_y98~pMW(p! zywpb(ITk;z4lqRvOMSqN;e0W@z)hUXFT>84>OMsjdUTaG+ADlTc>QUCCu(U^P&2 z3S*8csf6)b$}I!T6x#dinjy$$h0yIHffczvGzuVD50)gb_NsMX&VYYNr+(&1rCrEp+O50XiNp+ z(Pc|JN1j|;O|eD=jFg1gz)~{cpw16qnH1F}=5+87c;pqtfv9^N<}#iG2^o~cP>Kr7 zWQ=AD!z5Dxl%`s=Ua-fgGmFJ0H$xe}?XVI;Byx5^HZ-h1xKOMA{Mo7b*w?(A)E?K)SkIhU^NT;AT>zOsW~&pMksuR70f z?_5SK0?7fM&{-7E5oC*LLbi-_x6O#cRL^vFK<$vFC-H1FI#?{w&2~|y>;ist!tN_1ALo5y8XiT-m6jve0Fu3p*Q(w@W z4_YHsC>R9n6Lp9J>e@Po#v3pAZW9$&O4v5TatE;qd=OrG`H&$}ZL*IM=T+^_xt1UJO<8plu)56Z zb&cLm26$Tur4o?@?bVq0Ya=*f{PAp47!-g4V4rr|nu~4^%grN&Yrblis*6SIcz_Ji zR0Tl-#59P)b>$ptZmOGHUTW(R$s&%#A|W7#=%Wmy3&~)v@L85PwGk;8C**_p<8`Vn zO(DQXYOh&WGLIZXM5x4)3G22N9?EP0a&qKu7^13)sujoB=VBF1-e3SqkdeIs%stjW zP>xSgpu&5IQ9Eg0w_yn7>A4^_2wgdXPN7-%=Hhjk26{>rLqI5OjE{xYxrxzsATJ`j zZLH0Krv`g;9zfwlW_d|oHTXclKUsG+TP)~Np{(^Jc$-DERg(Ev&`+c)dPwMV>xehU z!Xp|jEO@O;5WtA8<%P^iAwp9B6AFsgkYX@msg4r+0HY_Pts_XO zZ$cOtT8SEypoShDO%JSTAw$rQV}(`wt-?2f7NB@ffEwpCPwM06KY{o{hF+@ty!dRmG^lZg0w`K|fj27b(v(bB@pqp$-vJ zbVPtUxighH>O;p@K|4mVwFQ#_Vu2)0F0v_v2P<#9DJzSJc9`EA|0M8HV#G4~okJ=m zs-8AItvjoi!~T=`IyOPzOm^7E*MJm$OKl)Vd<>2wyv`w@|G{mL$hugLAT|d|5Ff%C zABaWQ;AywL|>#y7QWV3$s|vBJ0qv*J{QLSieqCMkQ+9dAaEDb5{94-lDhmsT!Cm2{5%< z2jiw@%#spUP{0lP35Yt)n=wH)JyP}Bt7d?(DOI|1tu%iMk}0C>+@_`Q1r+3VcDF8~ z7qM0|>EAK21Z~0Oz`!&x)$%|L?6Q$l0TnPUKL9?DN52b(zFbFU+*_~h!dZ~`HZ7th z<8O&J(42)}zu!$EQgGQY=Mrp|13%d1S`jG6B>4h}7#&_N~-|{xni4WYiaYwnrSCJD`pz%C?x`$G}#EJR$D3e zPL8x6aj+@cXmxBN;LP1ai$IJ$x7Gy0uW0n9Yu2eP+C95q>#R^Um`fsTZA`#u2;6mfhQzf(=^J)(y^<9TZqtvF4+~` zhA|E(!%s$448f0Rk(F-PJo2K>$rXfpCZIXCKbB6v)b~q2&(-27n`4dLfwR(`%LrYy zo{e_Kt}t^QQ(8$y5z*YXEw*MLSF6K}o z4PPd-zn)O`|}6U?G_7U9&K-K{jD3%9n8@Ro$OX)MGOG2b+OtwjUDC}!3Q!FAoHsr7_9S_`GC z#F#mfBpD6qG3~72N8V#SXD=(1XWB+qlMsDOf8FSv&d!(Pcblq=UM%vG#&mf}InOwU zJmWRw8O4mh^zO+KEWW?|tv(xZGm4?^<>aJ6#mbslmnTnrFO2p0;m{~uId^hBFMl`Q~6D*~4 zmOgfzAfb0g$__kC(oYn0=rQX@ukQuc7QX7O*|q-Rs@7*W-o7e;HJGrHUqtDFY~-44>@ISb!+m%3q(IYTq?Rwcoo#>KT^ge+VM$%$8J_GKNm^@(lsrJvEpTuYPxS zUVUJUSO4^$F6mef{|h**D;ASD{9Y(tmE_{9v&)4uCKvzy|EU&c#pFLACahpkNGcY9 zrLbxVWl~|Rc1INfOH%V^vrEkrRjIlDH;j_2wV#RQsAXBPN+u(5@1nAzQH$$;rvv3G zz!fc77L4_$w0AroL%ofJf`>YJ<$7Q2^w3o)DW{TOVHAJS1i}nMhmse5;W>4 zC$Xu5HPAl;^+V`VR=^{Sb2Wrnt^!G`wqAZJdPPAdSr)65C#PHm0xR}zyUHNF zU1Up{!cGRW??|b>>PMvd z#g1M2Lj?pysLLL|JLCLYGmart{?@pN!OZS|t0%E3<&9;+qWdrAq(F15RJgV5R;SCw zuSC0I^F_TLgYW&h*~2_LFVb#9Yb0+gZS6Guwu=kzxoCKnZ|mU9zTqO054*eNWR4ju z$HYbNws;a-Et(nT-DgpfZ+vd38ByLmL4Vmd%_fV6kR>k8w8P?}+bdc?4JD?LW7>f7 z-il0uxk=328!L*P5m_$nRXE9d9JQ+=rq`Rzjen_4^R?i9iVJV1$fd9G58(L~MA@1! z69=@F9UWySMGim@Il1ml;vch(;>cI`7^d>oeaZM1duO30QQkw58i*=|+0ppO4HPBA zSS@`7^pEf5$id`O*?SwwBJ%v`T#@H%h&(qW^7LM^>tS}oiF|=9Ylxc8v^Vycr8+M7 zs+6y?pZvd_&x*$X^)v-@o|}s~p8<0&PnQ}nRtOjksUaY~ubFsZEw;k{g zhS^=K_z|Za{bOy&4VLx*fhnIA?aMa-lH}}*ofEXIYfo3#wq9UKcAm=gwk;==wD-$% zY44l4?i{U^)Uojnu-jRp6P_Gp4 zP06yWTOiiZol8}(ZV{*(Ij1@UYP40F9&_3Qpmt8+^e3vA-W3{Dlr=0lE`Elip9pcW zS>*BOK2>wBuPqtb$8lJ993!pCUGfhd<98zeiZzYDp38QB9=7{0@aF6dYY*eClQ{bA zB+h+1nM2=B;KaA8U3_RsB>5P*)OAz0HfKp2z0fd1n?j%ec`kjo1db*w9hx-n zxr8TlC}GtGUS0~;0w-TC1xs5HmHUn7?ihJO&00=WWy#u{sk$^)F#ol8jj<}#KK^Si zfBUQOxBoepzx`8)@uFw9mbOfs>)_VKPiLdRx#?1pVfb*K_EM7XSV=A_2@k<6 z&%Wu*ZzHlfk2hzp41OMOEqrKqUL}Aaj(viFo3}Z!o1fqCSazJMI_GiS^!%KsIB^=M zML*6_w3u^@Bi#+P{UuDb2gl4G{>7Om{jt)0uxm1mv3t!pptI-B@$>B`RK z?Y-?QJG(~Fj(?^IlUS#oJxuxv_U7Zs-vvlNuzB?=pxVCv3>`lU8{8;PcL|Q3o6dXU z-k2xZ`eruw`vof3=0fFb29>(~e)Kw5lJ=&A9}$I|qbr4ye7k~LGsMBd5!zAFiK06n zaaIL8O&H*Hd=<1~oKe>b!Wi4Dp$VrMxviTDr*f{m@#YGfpaQprJMxOqim{Lsd;HEJ z>nwhsdt1n{$8~4*a@c<|KS)+Kowfr$zUDZ4(j;?`;BbgA4KSZ7=EgP;1gTV-lzrB@ zX<~fXPuzoiXXOqsk_}JYr0%?eSAsai1`|?xLD(suIk+`>3PEHmaAWLG;P&t!zX?}y zEAj{SlxBNgCm_+KBObymkkn$nvNDL+%hX0Ye^;&W`+oviY!ItSDxfJh_OWBWp^e|t zCqa{Nf?Cns?nW)ozopRcP>qoOVaf0JGQVx)@vrY7o3SSH#+%&6eIC{R*5`iny`S#;J?5=@AABCqSG?heFNK4{$nScI^V%W)dEI$U zY#}nc!iveE(63v6JP+*#6!9e;##T%G5C75Hq?T6cMslplBazX7?GeFo(Ts&LeZ^0g34PTO2 za{bXf07LZ5YmmCP6X=3rzc3fW{;V3LWZ&l{$>5odjs5-ox;t=No~nmYcO%eSr^g#F zY+u^i+1p$+l&#c1 z2)+Cbynnmm+((UG{w1CtPVv0eV>~~q$JajspYc*ZP>5wB_1P5X)=Id>&=#QvSMUON zpNnIY+koP*lk8)oQDmK~wI zMiKJ(E*_|s-|<_(sNYQycRAef29Ta=%kYmTdBVn51(fWnBoli54|~D^&WqHn4LA2WaxU| z4RwEF^wN{KwD!7Wr!~BOkIo>)8Qy)IcH#>p6gFFG=&fhpp5V-i7%37ySZJXCt&7Fz zc!>G4(@B`P!SMN0SLq><*RlBrzmI6+GpLu{AXV}33qxbq9^A>!brnwDa?wzL_s_MFxM2^O-T*)D*V8mG z_D%e(nV)GC;MW65*lIM9yzwrkJB>&>Ivi$?biy!!FI1(Q&)=0j5aZx$e5lnpVEQ)1 zl?yR;=N>e48kNKt@=<+71*(U^;s$e>hU8NK88ey}m|)3;^N1<`xV4gD_8__mMn^d8PPwABFe zfoXgp?3q^B?*L6u#BW1FOm@Ldldw@-%I@|dR1dV%-k^~S9tbNJn8!x=T$rqT zP_Bqbll{e|L9Eht*f{7>q#jZS1Jnf?Os#_C^t%v5 zG5y0AA9^yoFi?XAh=N5aM07;vJg+oez)t1JzLQ}_j2H!%B_K+@oG(3dwSo!iGzxQ%S!eMqk?zvF3 z&!*7p7=-#Z`K^C8g0STp(muvDIJX7HYkdQig@kzfW;(zW7XV%2C!oK!18+fk!WL^f zg<*JvrUKt^Ri5*EaLt&^)!KNkSS83zuc_Kl;X{DnVM|&}@;;Q8+?x&6bN!%!tq*Bl z1?-18GL3Gmf{r$8Z)NwW{;lCo+RX0L<^=i+QS`AZACx0$BwSR4d4k|P44@!d39Kr{ zz+xGVcJ|1~Rr$PumoZu=|G|LHZ_DFnc~Sp;+%IfnxSVdsoV&>p}3zweBol>h($ literal 0 HcmV?d00001 diff --git a/.doctrees/minimap.doctree b/.doctrees/minimap.doctree new file mode 100644 index 0000000000000000000000000000000000000000..ea4bd5fa44aa588bef06d7ad6e7cffda0c3c95c6 GIT binary patch literal 2506 zcmai0OK%%D5KipKvTRwl^C$`=ZXE<^8Z?#)qlco`^k&3|qUfmsK`kkf5SQHY5zB`F z?IA!7@D}#>^sn{f?rLr6QUiu}hV!0pX8dRGpMMAU>YsS%Dk1f9Oc~RLahKvQGes!5 z_UUta{a5;!zKsJ*ubc_C;3?jNL?NVNmh1FB#ZeabQn_)f-*>$5(&$cI^u&(nzfWQi zdtQ3Q@4Up5cT&reR_CYh3=4{%{@i+}wT)Kq!LNLo(GwoKrR9B@>T z!jyS_985lKI9&0XL$0J3WCbgDY!zCZUB;p1m9d^E{(+-tTX9cN)sek;%$E|i^3(^n z66(bsTkVYNohFopY##Pw~(Mziy>hTLC0DUN%gK-{Yt;dK_1XHvhGsm<2>@PBpgsx- zrFfvIo(DSTC^rMWg>@7kSzZ{+2;&vN0XGuJxQsi6(KF2Sxr?ocvy34Jm=ouvMR>|Gh|t2JRR|6WgI7WHEW0zo_vr_ zHuyXwOgcJMIgvKX{%RU9Swke_fd6K!0hv~e%%o}-(iiy)P8_#+XQI8?8biPLv9~)C z_&m-d1=#30P^e@neR_BFDvl~%5fp`E5R1BC!_1jd#GWT3ekr`K+)tAU*lt{1dtvn0 z*!d*ICt0!%0FuP>67BJ5$1eD1FTei*^&Ht*v0*-QZq0wQGLK268Lta&$CCS5?E^DE z5x!J#Ht=+c5n^7Xi`{qvK$fJN%`O4rs*I4Ec;v3Nr%NK_TqyhkybqMgxF5QbV#@vq z7;1+?J*w%3B+3-DE$vAmDB?lmn_)wh>k>kH5h}RI*RQ^5?Gm^FdQ2hp3>a8#g@<`h zxG>$2!_@ks*^#ocC?V0ZyVshPxZc;cy@bL=KuhGPT;XnCwuz=q{3_7U4|joVy0uwiZ1 z5j%N=a3sO+XJ+#)&c(#VL1y^t3K4!x;{3*m=lDAjLl+P3HmlY?C?r~*-NRzT$uqf< zYr?$CY2*+*np;kd>iS=cKHgw<(t|aNgO%4>>EW7v>{jdZGJmpZt9`*C!^S8~$onA0 z{lX}P!XgKpjQ-n}{~5`DO1}X8_*VpTgnu3!`rSC}7RMTUzhl=e+n2gffn|uybGPY}F5KZjJvTRwl^HBsy+&T!-G-xapK@UYQJ+wC?J_JQi4G3yUiG;Z1mLIWv z2+$q^)BtZ`e?$LfA9q)4ONSaTyfYlmyqS43^q;+d{vF(@f8wF5gw)G1WlS5!U5dNR z6rtqWr_brtU+H7|CJrpUbSBt>r+5bzg^-F_uG9MzN7>v<<;Ly(zT<_LMt9dmPwa^P z`y>Xj=cQNt)=7N)je`y2L`g(ii-miR_q5O~Kr_{jQsVG4CB#z^NbXkb) zxYL5ai1(D#JY9q-jeFF4E2qID>73-YWG*MvFBEkSN__V;Et{`h7OERzN{fZ%vuqP$ z-_vSil(?pn(Pi)Yd+sUP|iwW0`ms52{wKnSlz`98Ta$-3fTZb&Z zJl_IN@fE;{X8`jUCue0{sDCi@&3#huZ`!o4$tq#gG^{0O0t|8TPA2m4$P@YVahxw z4lbWG8m@S)A(zq%vLX^9wijAvUBsc~m9d^E{(+-tTX9cN)rq}$%$E|i^3(^nGU~-1 zTuu5?d{Os(9Gbi!=bp4QUYmFs> zYNohFoio(Jr+8?BU-#0hy`*@uakAk;{2oV*(;EP*t54StHg3kFoB-(M1nQ%ZP>KhN z>Up4Zj&d`|TUa~sf#rp5<783gE!pC1`({m%!jliu$%dbY zgh@xIDksvS?60N)lQl##4*YK>8kA|x$V{qc1$~jf5X5nt7bM!7y)pEAAN#oz!O!D7 zQlO2VgM~_#(xW9O3; zA7#rL04#~;CEDZBj$P=_UVQgG>N&ErV#9sb+_?XGBgDK&=ezL)ge*xnn_U9LRhc2z@yK0iPnSfk{JjB2);GU%C42YL~z@*kcN*XW+nUE8Nd}!iDLE zoh&nXm7&cj<`-y@z?pK&8Rqv25CrEQK^_&bS`c1RsR$nAyjyG7$L*5}vZ`6L)2`z- z*B|mr7I&Lng5d=frDhVt;fbeq&as>DC>#S6sO7OzK^vCet&iAtYue^*gBspuov@Qf z2+tz){j6-h#TzkkagY`Mssh4~NxZps;u-!<#L&fq+s&$P9~2TT&*9;*(d3z2*)=e4 zYZ^O%M{~=mQC=wtGdcRZGE!&s6P=RHN%yYN)Sl(^z L8pv;Sn2!GgH1FbL literal 0 HcmV?d00001 diff --git a/.doctrees/repeatmasker.doctree b/.doctrees/repeatmasker.doctree new file mode 100644 index 0000000000000000000000000000000000000000..1cf46e0c4cdab1fc66caa06adb82b1f229db2be0 GIT binary patch literal 3052 zcmbtWYinFZ7;c+vlFemv=>@S(O_16an_Ve>kb+@cI==}WG#C!Az+H~#R1<&3(F+9@*!&vjZzcJO&^0WIa!ZYNdy!XXUN?In@g=;CT3skI>DyQ64U zeXXTMet8(tWNO$r@)Um6(Mh}te4F3poBSSM;`{!~0oNHDm_jLL24~t#2TWO(jpPwk zN?$#|SUaeU9GJNf^^Ju)_m6MDVEzuQ~Kj6X10>nqC5MY_xJrrNOU!LuG+9H3;V0L*Jb+ z#GN{A0uCufmL1J<95yO71hS_%uGh!HNSwBuPDspdyoI_B>@w%U?~S!~N;@`pd3@b( zMf9s8BeStKSpcPH0jiuNI*UbRA@XiTVUm>;awZ%n4aT6ceo%vM=r@sFZ5)y8lp$z0 z{5q$yJ$C#qn+e3qQCHZ8spC5-8x<3%>zz@f5G!yPMl(>l2ztVzQ{gAy6DltpVJgun zxPtE%ZhZ97krnv9clDAmW3(Zhs#G$AI7d?x7yPy^+*K)^QcCdq3pWcQ_;~Kpl|-vC zd_*`z3V5=ym<7J#d$e$xT$20^0Yq)3MV6Bmb%<(75CEJ}R7Qc@C8fl3%>5-Px2#At znPm}AJ8YI~%gFr85+aEsr^1Q~pW7rAmX2g}q_%RksRmTmCY-Ure^uImOwC5dLRQ`B zPW*xr%S>#dNN<#uBHtTm=Is&q+>Ip#*r*9mC`Be*c)s({_i~mK1cjjxlQLkNkusvN zJywQ)i#wOwXM+LAwx6Fnu2o-~$sqXKk+U=aoW!vV>2XNM8t6w4KKKyv?3r=0AU;wq z#lP2xN2St;SImdLU~XLMK+O-h%OsR_9UY;BQpdybn%@T?Gt$;(>j1HNM978TvFFOs z8R25WCH?^3WvL_XH*H2yW#1PlYKuVKEYH=ENS)9+wEGFCum_2+iVaaNLx|VYB8Q4N z63anXH-QVFM<+s!fq|wg?8QD|i_rp~$Rc>9rd27%;WQ1vOg3UE>h~NbaK;>z+)ltX zB`l*t5=`&dTT8Qd>-h_?%5l}xF8mTxr*X*nwW^n(cmYMBQi0-d#8ES0=uMaoyD$pS za%ic5O&UkqOLV&{)N1U33~A%`uo6oM6BG2+NUXm3Q$Dc18wu__hlMW#e|lm0A^s2e zruAF%$tquOB?2jr>LIbB#F}jQDl_LP6(5X8a?NopY!Vjvjta3H z_3XJttu)lj;Z^TXkHFK#Lpm`u=X2No?XTlnbx@$YnFz%Lr}cs5m>K<0ZclgK$Wm`h z81uhZV}8i*$AzffFBXSY(!sb8i8yxdpH0ftmt3bCxO)+!I$}Q-R=r7;rPl^%y*TDErJENB)+L8NjKRp?K zHT)uWnYd_TdN;c#L?Mp9KyJMuw%e88Yo|zqh7yz;ExD}U4WSZQq_JO2V(G4@anRK> KA!f1|_5TKKmb1P9 literal 0 HcmV?d00001 diff --git a/.doctrees/scallop.doctree b/.doctrees/scallop.doctree new file mode 100644 index 0000000000000000000000000000000000000000..501d6f994b2ac7fe0f752591fe2e0526fd94876b GIT binary patch literal 2502 zcmai0O>Y}F5KZjJvTRwl^HCIt-8v}JG-xapK@UZ*>CK1_ZP8N$f?84{AuhS)M=T!# zw1)sSz+2c~(?8e8-PPLCr3MV|42LssX5I|_XYZeX2lwiqc<3r2^>R!Z(}r=E;x02q zD7p6OQ+oMV`jEbf152-*3AW%V-h)LUq+*uq^e)9wHuqAwaeKe-c;Thd-F49uJEH$C zi9zgn=@q|o5>I|9s8Xgnduv!w{OqSTIIUf@*B<=Jml@9gSbt0n+?|R7oKNC74oH`c z*p54G5|{CTlA5Q>Fr{&idT-@4cqE^b-ImPd#QKGz&OwRqo~C8sj7Xa2x8jus$6lQE4 zGWp_S3s}XM04SaT&`EoGUe;whUuD^pjf$^O?&o*x&KkS3O}iJcdkOI3Td@bw+YM;( zYBS)g5-AQQ-tdQm%UE$;mjDXjpug`FYd>KOmZDcvYZ)PCTKSJDfzA{8RG7h0BG#-Zhvv7RXYo}*}6aZgayiM@EtmlCz|)CadR z>ct-8(=bQ4(G|5CwStA^w1j4Wq8B_TmHv(+sjJ`#*M(uQN^ubU?EHswC-HrE9#kE6!vEr8Y4ll6m*oAD?o0D3ur`Y0rn z;(?-i9_XB-+zj#-R#ALpd0{Lgj8`BB!bmXVGVT;c&yXX^AsOh&XL6auP8`wT4Y^gt zEeS>)uuxW{V;!nmDWm+>bld4%qpXDzEaopyGiS}l14E^56&hA9; z^Ei(bXrt#~p^~Na>Fv>rII4I>P!x_qEb4*{vt~+xJx@mbTzFr(A14#2-MG5;!sxNF z^GS+NvSkebmc;WC?eS>GF7)Tmzxy8b9NAg1;XZ3_-G9Auk4dGOuM2L+lKWX512aDn zzElV{@N|k1VqT<+-FON@mZY1_E&<}I%#fRSq%?ir|sXyS0XW+&;4)tC}@C z?Ivz>{XV~Haktqe7+z3OY9=upo_K2K9J>h*!!baCS{^GEv|;%T`+#k?rfuFisNrqa z2|Ia&@I*r2&&uXoycQD|2U+2-D zT?6y3rm+KfG`E}@)%CwNeY~OUtOsiz2dk*{rH5<&v0JUr%lyfvul58F88${?Lf!`{ z?iWTW6c#z)$>_gn^`DUZ$MiGUkAFlkNBGylq2EowZgH%s_d9jnvVExw6G(fa!RrbD literal 0 HcmV?d00001 diff --git a/.doctrees/star.doctree b/.doctrees/star.doctree new file mode 100644 index 0000000000000000000000000000000000000000..22a4124de5c680cce8fd271f37e661f2dd5b82a0 GIT binary patch literal 2487 zcmaJ@OK%%D5Kin!vTRwl^C%i5ZXE<^8Z?%QpogNT7VXW54{6X-1A4h_;&3FvAAdv~FnB_XYi(#C^y;N?}=novvyfnH~7d_DzgLhF3 zL(faE_>GtF@YlCLy*YVpSgH8QFO6qf={Gue-ttw7<^M!K#yZe`K@paZ;wTJBmxtI6 z{U-eLa7Rha<9RuwVV8Pu<*f8bJEgfTnM)}RGDV#O6W={e^ZILtmBlqNquJ8(d6Fr^ zz|%!~isC>#5+m_gY>VUY<5ZZOPi?6+x6=z_ms74C&u8kCYHijD1nZ`CkW=TWomhu7 zzBt=LpyEqJC!Qdhhw14wuc~$0=2usXil->?vsUP&7CPA!dJdr%h*^9ib`k4#9jkb` z>8iCR8ilTc;$^t+E!9p{eo0}?!g5zvu;-1ZDxTd6yR8goAj{Bk+_Ssf+0q?s|yJUdC{DZj9H)^Ba$6x5IuywJvkAnj4!(aK;YcDM)7W zG%OA#AJrVLc*P+X(hJgJ2_74T23+T1WO-q%CyKx4DB4!o6;yR(FC6ieM6EparE7(H zp~v{FT)^GG!8j;`{OXBjMH> zO9a(Saf>>qP%|IHfhqmEm0o2fhU1Nw4HM$`Fs_YW2hgfMUVqro42LNJz{?5LMsLjrJCQ#-c9i6F^NE79tod!(S2+26$zaD8orV%4^sp>8CS^9z#$8B1YXm7H{(C5c?G zkJ3m1HhKXRDw#_kUmrdXaPHycK?bQM;W?Fx;3}uxT7`Yo+*N>8&Fh_Z z6}Gv4pN?7Bsdov67f_U%NeqW4xE2eJ-Gr-fgrEQ|kCh78uyndUVB4*6>+=RStj#;3 zpGF9m5&S`7*5Bfln7S}b41ZZ5!Vgirx^m(P{!Ycnh5eh&sgBbQQ zqZA5@9B?uQKR5hONd9Ad1N7tn56lt%V{qtq?XX)MYwW#_UA1ga>P(d^L1dA-wae0O MYt}%z(dBINA0C?IC;$Ke literal 0 HcmV?d00001 diff --git a/.doctrees/stringtie.doctree b/.doctrees/stringtie.doctree new file mode 100644 index 0000000000000000000000000000000000000000..771b04c88fe2e9daf7e0078173302b1a12345a01 GIT binary patch literal 2512 zcmai0O>Y}F5KZjJvTRwl^HCH?oH_{7G-xapK@UZ*ZBIsgXp5d25Y&aBGxKKXKYRcDJGfK-#6wpJsh4BQm^O^N6nB{^ zLdmsHpVF(p(ued_99VkkOt1w{@eV8sAr-S+r*|oivbmSajobTu#|tlw?yifT*b)7A zNep7oORxB?llb%(Z>64l$xq)J78F1Iu?Vb(03<#I1@m zwhp;GJ>LRa@dY4?XMpsyJ3lMy;+?HBZHh<5bCmtXn&oL@dAe!&5|*!!g7{kO0s3|W zUA*25x^gMn3td6Q>-f-Hs-3EXlggU8<*q4c&l^uwI=>V5RyLeL3_0H2I4Xk8?IK-s zhAU0eq`2$2_aF)gdYqxxjGI}bJ=ZM7o!_Vm=+26=;_xC4<{agw-q-|zQ8d@nvVySR zgdy;~fVkI+!74}x-V`J^HJ>6}54h}AiuY&6cx^ntb$EU^9%Q=fP?F`$*fK#g%3Y~Q zVahy34lW-z8m@S)A(zq%vZ59uwijBiUBsc~m9d^E{+^>~TX9cN)rq}$%$E|i^3(^n zGU~-1Tuu5?d{Os(zGbi!=Wc`qE zYmFs>YNohFoio(Jr+8?BU-#0hy`*@uakAk;{2oV*(;EP*t54PsHg3kFoB-(M1nQ%Z zP>KhN>Up4Zj&d`|TUbi*f#rp5<783gE!pC1`({m%!jt#X z$%dbYgh@xIDksvS?60N)lQl##4*YNC8kA|x$V{qcDSei|5X5nt7bn`Ay)pEAAKSYV z!O!D7QlJgCuD}SC(xwOSH$M9lOw zMEFu6*uc{%Mu>Tl&UfPp2w9SDHoF9ft1?5b^M2?`iYfae zV5l7m^`Mp;ktkEpwzMaOpumI1H^YW1*CoX5MW_%Wzk&73)-Hi-u*Vcq&%lAzR=A({ zgbULRJ6UG(Dnpx5%x}^nfivZlGtBQ5APCMqf;=iite#w`^bPLIsv7GSA)G PV|ll=YaqYTVLJW~5ufk1 literal 0 HcmV?d00001 diff --git a/.doctrees/trf.doctree b/.doctrees/trf.doctree new file mode 100644 index 0000000000000000000000000000000000000000..6635d44c6e456cf5912e00c7d05b57c8fd2f3829 GIT binary patch literal 2482 zcmaJ@O>Y}F5KZjJvTRwl^HBsy+`1^zG-xapK@UYQJ+$b>hz~)~Qv-rpaz#R1a?6ic zJ_KkF0cwD^u)m>yvyZzg+0vl~4DSqwGjC?z4E<;CpMM8;nxA;+Y9aMvOc~RLahKvQ zGexMl_UTi4@mKngzKH`%FP#at;3?jLMIoeOmh1E`#Zfl*Qn_(=zwdbArO~VFq9=Al z|6LM;*z?jWe(NMYe*5Ov)7ORt#ZQ0f0@LPtcjew&zQ|Di$MR!pVeZrvpnMX?aX?mC zi0!!3fxn3Nl+-+3gei@C)O#zZ!6WIMfbpc@Aqy;(gwj5iB zEIvQq0#5M-z=eA$ZEa3BZJxvC1pte0#U6lew?M_q z%|J_MqPwsvpLiJ`dP}uaO;}P}Gqc>aT};@;ARGl(I_yBkMEu(>&8)r#R# z)3zk;I_|yHGf?n2LvJ`$TBAMJEXAGQs0!%Cl9b}`A`WI8#iicZ1c6bs($lJju-}Fu z@I8mP*NMR@NC(~&B)2f1B3uu+>{W{QOJlq?p5Hn=zZ(xSp>?RpqBOQj(2N|IQv@kT=~r59vLBt+~kbj-SlL(6MpJyHBUN71(8o}g+a_Tn*LNYu(xAKcQY z7ki9P!wlg@m(*(13Ko{r3Yr0mUhte$`a6!Ku7f9B7ly$q#X<1p*$-z<;`{0PA>q~< zO9a(Saf>=E(8~$bMb*O5ikRY7ZRAq;Uji%vq?){Cbc04dc7FFic5nt5CadP`+Ly^Lh_tMFh zpNE7=N2e+$(xL1xrvZ~SL^2NiZzmd*>C8weRl9;d%U=lMxXlX^?akg8`n`|+yb{6B z<2+KJjh=ypN>?=+B;g_dV)4vSqR1K5K5=f4y{%Nu`;ub8g3y`?86FnV$$> zDFhpMI>iVvFVgvLJOLpqvYO3R0>sssA=mN9U1?7jM97&?_yu|IDU*3WbQQ&v{Sh$K z4uyKq$gN0}DQH*PlR{A7LF3zDLzSBn;`Th$2$5g8=I!d1z%|%o3aLwQV7V3U=RM)V zbi+uATT2er z!YGBpA_qJf{hvGiCnWzdy#f32&j;oR|1LQ6yA8Nn9Bb@S(-6FLucC%7^kb+3DA`-d}wdjjwm_289XV^J2$C)|F z=Aobu1q1We@y`)K{0l_z-|;u+mSn*yxDayYn{U4B@4Nia`T4JnOXbgR+nftEKcH!< zbjob-YpG6(j42o1ga`q8~P`_WbEOA1s z_BrqH6~6j1@UHJT;UqhEG;l=Av znZ1%z80iAv^#h3g_?aat8OQBd86=UkxsdGk*3x^;?rB@NIsRZ}MAwiSPTTL#{J6G=);k43D*$4Vkhm8_NMz zN?$y{SUaqY96F-ob)#f?y2KWJmhANp&~P-SJQp5#VP4YO5DJ5D<)!{H^r z-te##$0F*x?0ZRJV#Y|DpUs9+<;kyE=A2Md;B+^dUIK4ov~oiZs<`ZqQ07}mSPB}?*7K_P3v zd!ihj6E3D);t$|mmOA2o(`FP^_I-h(wg}YK@?0H>)CsLayPt3hdyx35*bwD1gm^tG za;S)-upDr86F3EWbRyIQ7-+h}UhEUL7%%XNEP_{RT9slPOS1sXWMh`1eotTmXUsv# z^#oiq!ZIo(!PJhuwKRLTp1T06oK!vS)Gsl06vvxit9l8F7f=)`6(|lz95qvh-h|<> z3!?xnhn5Q1q;Z(NLbtm>tp*;*kTz)#E3t$yD?wk4#Oj+r;zR4Zk>E~pSokXNN2iwG z!T%xOw0`S+vdY(6i9pJudPuA&u_hb7%FOeWiVwykx!G9DHvc8-wFP3!-Mt{O+h{Ex z?Ol+M-fCQI=GPZx)i)Sq=opDEVm}CeBhgYKu<||D zjta39_3Vj7tu)lL;Z^TV_rcS}Lpn7y=jX2dyD#E8)i2Q9OoU?JY2CLRGvgqXYtxOl zvebJL#{BQqm>==maTRK}i^U-yr}S@N|FsyyrY$MpG?iqGBAK1H>$87b>efGf>#s5X zf6J*ngvEc_x47lIXwi?WMuA?1iel!7l{?TM(ObUH9~NWwk74nhc0w;ltRwT^K6yU+ zYV>97F>%4f>~3~Wh(Z*9f!umCY1s + + + + + + ensembl.tools.anno.protein_annotation.genblast — ensembl-anno 0.1 documentation + + + + + + + + + +

+ +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.protein_annotation.genblast

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+GenBlast identifies homologous gene sequences in genomic databases.
+One of the key features of GenBlast is its flexibility to handle
+comparative genomics tasks and accurately identify homologs even when
+the sequences have undergone significant evolutionary changes.
+This capability makes it a valuable resource for researchers studying gene
+evolution, gene families, and gene function across diverse species.
+
+GenBlast has been widely used in various genomic analyses and is available as
+a standalone command-line tool or as part of different bioinformatics pipelines.
+Researchers in the field of comparative genomics and gene function analysis
+often rely on GenBlast to perform sensitive homology searches and obtain
+valuable insights into the evolutionary relationships and functional conservation
+of genes in different organisms.
+
+
+She, R., Chu, J.S., Uyar, B., Wang, J., Wang, K., and Chen, N. (2011).
+GenBlastA: enabling BLAST to identify homologous gene sequences.
+Genome Res., 21(5): 936-949.
+"""
+__all__ = ["run_genblast"]
+
+import logging
+import logging.config
+import multiprocessing
+import os
+from pathlib import Path
+import random
+import re
+import shutil
+import signal
+import subprocess
+from typing import List
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+)
+
+logger = logging.getLogger(__name__)
+
+
+
+[docs] +def run_genblast(#pylint:disable=dangerous-default-value + masked_genome: Path, + output_dir: Path, + protein_dataset: Path, + max_intron_length: int, + genblast_timeout_secs: int = 10800, + genblast_bin: Path = Path("genblast"), + convert2blastmask_bin: Path = Path("convert2blastmask"), + makeblastdb_bin: Path = Path("makeblastdb"), + num_threads: int = 1, + protein_set: str = ["uniprot", "orthodb"], +) -> None: + """ + Executes GenBlast on genomic slices + Args: + masked_genome : Masked genome file path. + output_dir: Working directory path. + protein_dataset: Protein dataset (Uniprot/OrthoDb) path. + genblast_timeout_secs: Time for timeout (sec). + max_intron_length: Maximum intron length. + genblast_bin : Software path. + convert2blastmask_bin: Software path. + makeblastdb_bin : Software path. + genblast_timeout: seconds + num_threads: int, number of threads. + """ + + check_exe(genblast_bin) + check_exe(convert2blastmask_bin) + check_exe(makeblastdb_bin) + if protein_set == "uniprot": + genblast_dir = create_dir(output_dir, "uniprot_output") + elif protein_set == "orthodb": + genblast_dir = create_dir(output_dir, "orthodb_output") + output_file = genblast_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "transcript") + if transcript_count > 0: + logger.info("Genblast gtf file exists, skipping analysis") + return + logging.info(Path(f"{output_dir}/alignscore.txt")) + if not Path(f"{genblast_dir}/alignscore.txt").exists(): + # Get the repo directory + repo_root_dir = Path(__file__).parents[6] + shutil.copy(Path(f"{repo_root_dir}/data/alignscore.txt"), genblast_dir) + + if not masked_genome.exists(): + raise IOError(f"Masked genome file does not exist: {masked_genome}") + if not protein_dataset.exists(): + raise IOError(f"Protein file does not exist: {protein_dataset}") + asnb_file = Path(f"{masked_genome}.asnb") + if asnb_file.exists(): + logger.info("Found an existing asnb, so will skip convert2blastmask") + else: + _run_convert2blastmask(convert2blastmask_bin, masked_genome, asnb_file) + _run_makeblastdb(makeblastdb_bin, masked_genome, asnb_file) + batched_protein_files = _split_protein_file( + protein_dataset, genblast_dir, num_threads + ) + pool = multiprocessing.Pool(num_threads) # pylint:disable=consider-using-with + for batched_protein_file in batched_protein_files: + pool.apply_async( + _multiprocess_genblast, + args=( + batched_protein_file, + masked_genome, + genblast_bin, + genblast_timeout_secs, + max_intron_length, + ), + ) + pool.close() + pool.join() + _generate_genblast_gtf(genblast_dir) + for i in range(0, 10): + shutil.rmtree(genblast_dir / f"bin_{i}") + logger.info("Completed running GenBlast")
+ + + +def _multiprocess_genblast( + protein_file: Path, + masked_genome: Path, + genblast_bin: Path, + genblast_timeout: int, + max_intron_length: int, +): + """ + Executes GenBlast on genomic slice + Args: + protein_file: Path of a single batched file. + masked_genome : Masked genome file path. + genblast_bin : Software path. + genblast_timeout_secs: Time for timeout (sec). + max_intron_length: Maximum intron length. + Command line options: + -P Search program used to produce HSPs, + can be either "blast" or "wublast", default is "blast", + optional + -p specifies the program option of genBlast: genblasta or genblastg + -q List of query sequences to blast, must be in fasta format, + required + -t The target database of genomic sequences in fasta format, + required + -g parameter for blast: Perform gapped alignment (T/F) + [default: F], optional + -d parameter for genBlast: maximum allowed distance between HSPs + within the same gene, a non-negative integer [default: 100000], + optional + -r parameter for genBlast: number of ranks in the output, + a positive integer, optional + -e parameter for blast: The e-value, [default: 1e-2], + optional + -c parameter for genBlast: minimum percentage of query gene + coverage in the output, between 0 and 1 (e.g. for 50% + gene coverage, use "0.5"), optional + -W parameter for blast: Set word size, 0 means using blast default [default: 0], + optional + -scodon The number of base pairs to search for start codon within the region of HSP + group (inside the first HSP). If not specified, default is 15. + -i parameter for genBlastG: minimum intron length, optional. + If not specified, the default value is 15. + -x parameter for genBlastG: minimum internal exon length, optional. + If not specified, default is 20. + -n parameter for genBlastG: maximum number of splice sites per region, optional. + If not specified, default is 20. + -gff output options: turn on GFF output + -o output filename, optional. If not specified, the output + will be the same as the query filename with ".gblast" + extension. + -pid turn on final alignment PID computation (global alignment between predicted + gene and query) in output. + -softmask With this option NCBI blast will create a masking library, + you need to use it when blasting against a whole genome + """ + logger.info("Running GenBlast on : %s", protein_file) + + genblast_cmd = [ + str(genblast_bin), + "-p", + "genblastg", + "-q", + str(protein_file), + "-t", + str(masked_genome), + "-g", + "T", + "-pid", + "-r", + "1", + "-P", + "blast", + "-gff", + "-e", + "1e-1", + "-c", + "0.8", + "-W", + "3", + "-softmask", + "-scodon", + "50", + "-i", + "30", + "-x", + "10", + "-n", + "30", + "-d", + str(max_intron_length), + "-o", + str(protein_file), + ] + + logger.info(" ".join(genblast_cmd)) + # Using the child process termination as described here: + # https://alexandra-zaharia.github.io/posts/kill-subprocess + # -and-its-children-on-timeout-python/ + try: + p = subprocess.Popen(# pylint:disable=consider-using-with + genblast_cmd, start_new_session=True + ) + p.wait(timeout=genblast_timeout) + except subprocess.TimeoutExpired: + logger.error("Timeout reached for file: %s \n", protein_file) + subprocess.run(# pylint:disable=subprocess-run-check + ["touch", (Path(f"{protein_file}.except"))] + ) + os.killpg(os.getpgid(p.pid), signal.SIGTERM) + + +def _generate_genblast_gtf(genblast_dir: Path) -> None: + """ + Collect output from geneblast and create the final gtf file + genblast_dir: Working directory path. + """ + logging.info("AAAAA _generate_genblast_gtf") + output_file = genblast_dir / "annotation.gtf" + with open(output_file, "w+", encoding="utf8") as file_out: + genblast_extension = "_1.1c_2.3_s1_0_16_1" + for path in genblast_dir.rglob("*"): + # for root, dirs, files in os.walk(genblast_dir): + # for genblast_file in files: + # genblast_file = os.path.join(root, genblast_file) + if path.is_file() and path.suffix == ".gff": + gtf_string = _convert_genblast_gff_to_gtf(path) + file_out.write(gtf_string) + elif path.is_file() and path.suffix in ( + ".fa.blast", + ".fa.blast.report", + genblast_extension, + ): + path.unlink() + + +def _split_protein_file( + protein_dataset: Path, output_dir: Path, batch_size: int = 20 +) -> List: + """ + The protein dataset file is splitted by a number of sequence equals to the batch_size + in batch files stored in 10 output directories. + protein_dataset : Path for the protein dataset. + output_dir : Output directory path. + batch_size : Size of the batch, it needs to be equals to the number of threads + to parallelise the sequence processing for each file. + """ + batched_protein_files = [] + + for i in range(0, 10): + create_dir(output_dir, (f"bin_{i}")) + with open(protein_dataset,"r", encoding="utf8") as file_in: + seq_count = 0 + batch_count = 0 + current_record = "" + initial_seq = True + for line in file_in: + match = re.search(r">(.+)$", line) + # match header and is not first sequence, if the number of stored sequences in each file equals + # the number of batch_size, a new file will be created and the current_record reset + if match and not initial_seq and seq_count % batch_size == 0: + bin_num = random.randint(0, 9) + batch_file = output_dir / f"bin_{bin_num}" / f"{batch_count}.fa" + with batch_file.open("w+") as file_out: + file_out.write(current_record) + batch_count += 1 + seq_count += 1 + current_record = line + batched_protein_files.append(batch_file) + # match header and is the first sequence + elif match: + current_record += line + initial_seq = False + seq_count += 1 + # other lines + else: + current_record += line + + if current_record: + bin_num = random.randint(0, 9) + batch_file = output_dir / f"bin_{bin_num}" / f"{batch_count}.fa" + with batch_file.open("w+") as file_out: + file_out.write(current_record) + batched_protein_files.append(batch_file) + return batched_protein_files + + +def _run_convert2blastmask( + convert2blastmask_bin: Path, masked_genome: Path, asnb_file: Path +) -> None: + """ + Convert masking information in lower-case masked FASTA input to file + formats suitable for makeblastdb. + convert2blastmask_bin : Software path. + masked_genome: Path of masked genome file. + asnb_file: Path of assembly file. + """ + logger.info("Running convert2blastmask prior to GenBlast:") + cmd = [ + str(convert2blastmask_bin), + "-in", + str(masked_genome), + "-parse_seqids", + "-masking_algorithm", # mask_program_name + "other", + "-masking_options", # mask_program_options + '"REpeatDetector, default"', + "-outfmt", # output_format + "maskinfo_asn1_bin", + "-out", + str(asnb_file), + ] + logger.info(" ".join(cmd)) + subprocess.run(cmd, check=True) + logger.info("Completed running convert2blastmask") + + +def _run_makeblastdb(makeblastdb_bin: Path, masked_genome: Path, asnb_file: Path) -> None: + """ + Application to create BLAST databases. + makeblastdb_bin : Software path. + masked_genome: Path of masked genome file. + asnb_file: Path of assembly file. + """ + logger.info("Running makeblastdb prior to GenBlast") + subprocess.run( # pylint:disable=subprocess-run-check + [ + str(makeblastdb_bin), + "-in", + str(masked_genome), + "-dbtype", # molecule_type + "nucl", + "-parse_seqids", + "-mask_data", + str(asnb_file), + "-max_file_sz", # number_of_bytes + "10000000000", + ] + ) + logger.info("Completed running makeblastdb") + + +def _convert_genblast_gff_to_gtf(gff_file: Path) -> str: + """ + Convert the content of gtf file in gff format + gff_file: Path for the gff file + """ + gtf_string = "" + with open(gff_file, "r", encoding="utf8") as file_in: + for line in file_in: + results = line.split() + if len(results) == 9: + results[2] = "exon" if results[2] == "coding_exon" else results[2] + attributes = _set_genblast_attributes(str(results[8]), str(results[2])) + results[8] = attributes + converted_line = "\t".join(results) + gtf_string += converted_line + "\n" + return gtf_string + + +def _set_genblast_attributes(attributes: str, feature_type: str) -> str: + """ + Given the list of attributes in the genblast output, + define the new attributes for the gtf file. + attributes: GenBlast attribute list + feature_type: transcript or exon + Example genBlast output #pylint: disable=line-too-long, trailing-whitespace + 1 genBlastG transcript 131128674 131137049 252.729 - . ID=259447-R1-1-A1;Name=259447;PID=84.65;Coverage=94.22;Note=PID:84.65-Cover:94.22 + 1 genBlastG coding_exon 131137031 131137049 . - . ID=259447-R1-1-A1-E1;Parent=259447-R1-1-A1 + 1 genBlastG coding_exon 131136260 131136333 . - . ID=259447-R1-1-A1-E2;Parent=259447-R1-1-A1 + 1 genBlastG coding_exon 131128674 131130245 . - . ID=259447-R1-1-A1-E3;Parent=259447-R1-1-A1 + """ + converted_attributes = "" + split_attributes = attributes.split(";") + if feature_type == "transcript": + match = re.search(r"Name\=(.+)$", split_attributes[1]) + assert match + name = match.group(1) + converted_attributes = f'gene_id "{name}"; transcript_id "{name}";' + elif feature_type == "exon": + match = re.search(r"\-E(\d+);Parent\=(.+)\-R\d+\-\d+\-", attributes) + assert match + exon_rank = match.group(1) + name = match.group(2) + converted_attributes = ( + f'gene_id "{name}"; transcript_id "{name}"; exon_number "{exon_rank}";' + ) + + return converted_attributes + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run TRF.""" + + masked_genome_file = argschema.fields.InputFile( + required=True, description="Masked genome file path" + ) + output_dir = argschema.fields.OutputDir( + required=True, description="Output directory path" + ) + protein_file = argschema.fields.String( + required=True, description="Path for the protein dataset" + ) + genblast_timeout_secs = argschema.fields.Integer( + required=False, default=10800, description="Genblast timeout period" + ) + max_intron_length = argschema.fields.Integer( + required=True, description="Maximum intron length" + ) + genblast_bin = argschema.fields.String( + required=False, + default="genblast", + description="Genblast executable path", + ) + convert2blastmask_bin = argschema.fields.String( + required=False, + default="convert2blastmask", + description="convert2blastmask executable path", + ) + makeblastdb_bin = argschema.fields.String( + required=False, default="makeblastdb", description="makeblastdb executable path" + ) + num_threads = argschema.fields.Integer( + required=False, default=1, description="Number of threads" + ) + protein_set = argschema.fields.String( + required=True, + description="Protein set [uniprot,orthodb]", + validate=lambda x: x in ["uniprot", "orthodb"], + ) + + +def main() -> None: + """Genblast's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "genblast.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_genblast( + Path(mod.args["masked_genome_file"]), + Path(mod.args["output_dir"]), + Path(mod.args["protein_file"]), + mod.args["max_intron_length"], + mod.args["genblast_timeout_secs"], + Path(mod.args["genblast_bin"]), + Path(mod.args["convert2blastmask_bin"]), + Path(mod.args["makeblastdb_bin"]), + mod.args["num_threads"], + mod.args["protein_set"], + ) + + +if __name__ == "__main__": + main() +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/repeat_annotation/dust.html b/_modules/ensembl/tools/anno/repeat_annotation/dust.html new file mode 100644 index 0000000..3a8cf2c --- /dev/null +++ b/_modules/ensembl/tools/anno/repeat_annotation/dust.html @@ -0,0 +1,310 @@ + + + + + + + ensembl.tools.anno.repeat_annotation.dust — ensembl-anno 0.1 documentation + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.repeat_annotation.dust

+# See the NOTICE file distributed with this work for additional information #pylint: disable=missing-module-docstring
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+DustMasker is a program that identifies and masks out low complexity
+parts of a genome using a new and improved DUST algorithm.
+
+Morgulis A, Gertz EM, Schaffer AA, Agarwala R. A Fast and Symmetric
+DUST Implementation to Mask Low-Complexity DNA Sequences.
+"""
+__all__ = ["run_dust"]
+
+import logging
+import logging.config
+import multiprocessing
+import os
+from os import PathLike
+from pathlib import Path
+import re
+import subprocess
+import tempfile
+from typing import List
+import argschema
+
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+    get_seq_region_length,
+    get_slice_id,
+    slice_output_to_gtf,
+    get_sequence,
+)
+
+logger = logging.getLogger(__name__)
+
+
+
+[docs] +def run_dust( + genome_file: PathLike, + output_dir: Path, + dust_bin: Path = Path("dustmasker"), + num_threads: int = 1, +) -> None: + """ + Run Dust on genomic slices with mutiprocessing + Args: + genome_file : Genome file path. + output_dir : Working directory path. + dust_bin : Dust software path. + num_threads: Number of threads. + """ + + check_exe(dust_bin) + dust_dir = create_dir(output_dir, "dust_output") + os.chdir(str(dust_dir)) + output_file = dust_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "repeat") + if transcript_count > 0: + logger.info("Dust gtf file exists, skipping analysis") + return + logger.info("Creating list of genomic slices") + seq_region_to_length = get_seq_region_length(genome_file, 5000) + slice_ids_per_region = get_slice_id( + seq_region_to_length, slice_size=1000000, overlap=0, min_length=5000 + ) + dust_cmd = [dust_bin, "-in"] + pool = multiprocessing.Pool(num_threads) # pylint: disable=consider-using-with + for slice_id in slice_ids_per_region: + pool.apply_async( + _multiprocess_dust, + args=( + dust_cmd, + slice_id, + dust_dir, + genome_file, + ), + ) + pool.close() + pool.join() + slice_output_to_gtf(dust_dir, "repeat_id", "dust", True, ".dust.gtf") + for gtf_file in dust_dir.glob("*.dust.gtf"): + gtf_file.unlink()
+ + + +def _multiprocess_dust( # pylint: disable=too-many-locals + dust_cmd: List[str], + slice_id: List[str], + dust_dir: Path, + genome_file: Path, +) -> None: + """ + Run Dust on multiprocess on genomic slices + Args: + dust_cmd: Dust command to execute. + slice_id: List of slice IDs. + dust_dir : Dust output directory path. + genome_file : Genome file. + """ + region_name, start, end = slice_id + logger.info( + "Processing slice to find low complexity regions with Dust: %s:%s:%s", + region_name, + start, + end, + ) + seq = get_sequence(region_name, int(start), int(end), 1, genome_file, dust_dir) + slice_name = f"{region_name}.rs{start}.re{end}" + with tempfile.TemporaryDirectory(dir=dust_dir) as tmpdirname: + slice_file = dust_dir / tmpdirname / f"{slice_name}.fa" + with open(slice_file, "w+", encoding="utf8") as region_out: + region_out.write(f">{region_name}\n{seq}\n") + region_results = dust_dir / f"{slice_name}.dust.gtf" + output_file = Path(f"{slice_file}.dust") + dust_cmd.append(str(slice_file)) + logger.info("dust_cmd: %s", dust_cmd) + with open(output_file, "w+", encoding="utf8") as dust_out: + subprocess.run(dust_cmd, stdout=dust_out, check=True) + _create_dust_gtf(output_file, region_results, region_name) + slice_file.unlink() + output_file.unlink() + + +def _create_dust_gtf( + output_file: Path, + region_results: Path, + region_name: str, +) -> None: + """ + Read the fasta file and save the content in gtf format + All the genomic slices are collected in a single gtf output + Args: + output_file : GTF file with final results. + region_results : GTF file with the results per region. + region_name :Coordinates of genomic slice. + """ + with open(output_file, "r", encoding="utf8") as dust_in, open( + region_results, "w+", encoding="utf8" + ) as dust_out: + repeat_count = 1 + for line in dust_in: + result_match = re.search(r"(\d+)\ - (\d+)", line) + if result_match: + start = int(result_match.group(1)) + 1 + end = int(result_match.group(2)) + 1 + gtf_line = ( + f"{region_name}\tDust\trepeat\t{start}\t" + f'{end}\t.\t+\t.\trepeat_id "{repeat_count}";\n' + ) + dust_out.write(gtf_line) + repeat_count += 1 + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run DustMasker.""" + + genome_file = argschema.fields.InputFile( + required=True, description="Genome file path" + ) + output_dir = argschema.fields.OutputDir( + required=True, description="Output directory path" + ) + dust_bin = argschema.fields.String( + required=False, + default="dustmasker", + description="Dust executable path", + ) + num_threads = argschema.fields.Integer( + required=False, default=1, description="Number of threads" + ) + + +def main() -> None: + """Dust's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "dust.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_dust( + mod.args["genome_file"], + mod.args["output_dir"], + mod.args["dust_bin"], + mod.args["num_threads"], + ) + + +if __name__ == "__main__": + main() +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/repeat_annotation/red.html b/_modules/ensembl/tools/anno/repeat_annotation/red.html new file mode 100644 index 0000000..61a905f --- /dev/null +++ b/_modules/ensembl/tools/anno/repeat_annotation/red.html @@ -0,0 +1,272 @@ + + + + + + + ensembl.tools.anno.repeat_annotation.red — ensembl-anno 0.1 documentation + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.repeat_annotation.red

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+Red is the first repeat-detection tool capable of labeling its training data
+and training itself automatically on an entire genome.
+Girgis, H.Z. Red: an intelligent, rapid, accurate tool for detecting repeats
+de-novo on the genomic scale. BMC Bioinformatics 16, 227 (2015).
+https://doi.org/10.1186/s12859-015-0654-5
+"""
+__all__ = ["run_red"]
+
+import logging
+import logging.config
+from os import PathLike
+from pathlib import Path
+import re
+import subprocess
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+)
+
+logger = logging.getLogger(__name__)
+
+
+
+[docs] +def run_red(genome_file: Path, output_dir: Path, red_bin: Path = Path("Red"),) -> str: + """ + Run Red on genome file + + Args: + genome_file : Genome file path. + output_dir : Working directory path. + red_bin : Red software path. + + Return: + masked genome file + """ + check_exe(red_bin) + red_dir = create_dir(output_dir, "red_output") + red_mask_dir = create_dir(red_dir, "mask_output") + red_repeat_dir = create_dir(red_dir, "repeat_output") + red_genome_dir = create_dir(red_dir, "genome_dir") + + sym_link_genome_cmd = "ln -s " + str(genome_file) + " " + str(red_genome_dir) + genome_file_name = genome_file.name + red_genome_file = red_genome_dir / genome_file_name + genome_file_stem = genome_file.stem + masked_genome_file = red_mask_dir / f"{genome_file_stem}.msk" + repeat_coords_file = red_repeat_dir / f"{genome_file_stem}.rpt" + output_file = red_dir / "annotation.gtf" + + if masked_genome_file.exists(): + logger.warning( + "Masked Genome file already found on the path to the Red mask output dir. \ + Will not create a new file" + ) + # _create_red_gtf(repeat_coords_file, output_file) + return str(masked_genome_file) + if red_genome_file.exists(): + logger.warning( + "Unmasked genome file already found on the path to the Red genome dir, \ + will not create a sym link" + ) + + else: + logger.info( + "Preparing to sym link the genome file to the Red genome dir. Cmd\n %s", + sym_link_genome_cmd, + ) + # subprocess.run(["ln", "-s", genome_file, red_genome_dir]) + red_genome_file.symlink_to(genome_file) + try: + if red_genome_file.exists(): + logger.info("Running Red") + subprocess.run( + [ + red_bin, + "-gnm", + red_genome_dir, + "-msk", + red_mask_dir, + "-rpt", + red_repeat_dir, + ], + check=True, + ) + except: + logger.error( + "Could not find the genome file in the Red genome dir or sym link \ + to the original file. Path expected:\n%s", + genome_file, + ) + _create_red_gtf(repeat_coords_file, output_file) + return str(masked_genome_file)
+ + + +def _create_red_gtf(repeat_coords_file: Path, output_file: Path): + """ + Create Red gtf file from masked genome file + + Args: + repeat_coords_file: Coordinates for repeats. + output_file : GTF file with the final results. + """ + with open(repeat_coords_file, "r", encoding="utf8") as red_in, open( + output_file, "w+", encoding="utf8" + ) as red_out: + for repeat_id, line in enumerate(red_in, start=1): + result_match = re.search(r"^\>(.+)\:(\d+)\-(\d+)", line) + if result_match: + region_name = result_match.group(1) + # Note that Red is 0-based, so add 1 + start = int(result_match.group(2)) + 1 + end = int(result_match.group(3)) + 1 + gtf_line = ( + f"{region_name}\tRed\trepeat\t{start}\t" + f'{end}\t.\t+\t.\trepeat_id "{repeat_id}";\n' + ) + red_out.write(gtf_line) + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run Red.""" + + genome_file = argschema.fields.InputFile( + required=True, description="Genome file path" + ) + output_dir = argschema.fields.OutputDir( + required=True, description="Output directory path" + ) + red_bin = argschema.fields.String( + required=False, default="Red", description="Red executable path", + ) + + +def main() -> None: + """Red's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "red.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_red( + Path(mod.args["genome_file"]), mod.args["output_dir"], mod.args["red_bin"], + ) + + +if __name__ == "__main__": + main() +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/repeat_annotation/repeatmasker.html b/_modules/ensembl/tools/anno/repeat_annotation/repeatmasker.html new file mode 100644 index 0000000..0aa3ca3 --- /dev/null +++ b/_modules/ensembl/tools/anno/repeat_annotation/repeatmasker.html @@ -0,0 +1,369 @@ + + + + + + + ensembl.tools.anno.repeat_annotation.repeatmasker — ensembl-anno 0.1 documentation + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.repeat_annotation.repeatmasker

+# See the NOTICE file distributed with this work for additional information #pylint: disable=missing-module-docstring
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+    RepeatMasker is a program that screens DNA sequences for interspersed
+    repeats and low complexity DNA sequences.
+    Smit, AFA, Hubley, R & Green, P. RepeatMasker Open-4.0
+"""
+
+__all__ = ["run_repeatmasker"]
+
+import json
+import logging
+import logging.config
+import multiprocessing
+import os
+from os import PathLike
+from pathlib import Path
+import re
+import subprocess
+from typing import List
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+    get_seq_region_length,
+    get_slice_id,
+    slice_output_to_gtf,
+    get_sequence,
+)
+logger = logging.getLogger('__name__')
+
+
+
+[docs] +def run_repeatmasker( + genome_file: PathLike, + output_dir: Path, + repeatmasker_bin: Path = Path("RepeatMasker"), + library: str = "", + repeatmasker_engine: str = "rmblast", + species: str = "", + num_threads: int = 1, +) -> None: + + """ + Executes RepeatMasker on the genome slices and stores the final annotation.gtf in repeatmasker_output + Args: + genome_file : Genome file path. + repeatmasker_path : RepeatMasker executable path. + library : Custom repeat library. + species :Species name. + output_dir : Output directory path. + num_threads: Number of threads. + + """ + check_exe(repeatmasker_bin) + repeatmasker_dir = create_dir(output_dir, "repeatmasker_output") + + output_file = repeatmasker_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "repeat") + if transcript_count > 0: + logger.info("Repeatmasker gtf file exists") + return + logger.info("Creating list of genomic slices") + seq_region_to_length = get_seq_region_length(genome_file, 5000) + slice_ids_per_region = get_slice_id( + seq_region_to_length, slice_size=1000000, overlap=0, min_length=5000 + ) + repeatmasker_cmd = [ + str(repeatmasker_bin), + "-nolow",#does not display simple repeats or low_complexity DNA in the annotation + "-engine", + repeatmasker_engine, + "-dir", + str(repeatmasker_dir), + ] + if not library: + if not species: + species = "homo" + repeatmasker_cmd.extend(["-species", species]) + else: + repeatmasker_cmd.extend(["-lib", library]) + logger.info(f"Running RepeatMasker {repeatmasker_cmd}") + pool = multiprocessing.Pool(num_threads) # pylint: disable=consider-using-with + for slice_id in slice_ids_per_region: + pool.apply_async( + _multiprocess_repeatmasker, + args=( + repeatmasker_cmd, + slice_id, + genome_file, + repeatmasker_dir, + ), + ) + pool.close() + pool.join() + slice_output_to_gtf(repeatmasker_dir, "repeat_id", "repeatmask", True, ".rm.gtf") + for gtf_file in repeatmasker_dir.glob("*.rm.gtf"): + gtf_file.unlink()
+ + +def _multiprocess_repeatmasker( # pylint: disable=too-many-locals + repeatmasker_cmd: List[str], + slice_id: List[str], + genome_file: Path, + repeatmasker_dir: Path, +) -> None: + """ + Run Repeatmasker on genomic slice + + Args: + repeatmasker_cmd: RepeatMasker command to execute. + slice_id: Slice ID to run RepeatMasker on. + genome_file : Genome file path. + repeatmasker_dir : RepeatMasker output directory path. + """ + + region_name, start, end = slice_id + logger.info( + "Processing slice to find repeats with RepeatMasker: %s:%s:%s", + region_name, + start, + end, + ) + seq = get_sequence( + region_name, int(start), int(end), 1, genome_file, repeatmasker_dir + ) + slice_file_name = f"{region_name}.rs{start}.re{end}" + region_file = repeatmasker_dir / f"{slice_file_name}.fa" + with open(region_file, "w+", encoding="utf8") as region_fasta_out: + region_fasta_out.write(f">{region_name}\n{seq}\n") + region_results_file = Path(f"{region_file}.rm.gtf") + output_file = Path(f"{region_file}.out") + masked_file = Path(f"{region_file}.masked") + tbl_file = Path(f"{region_file}.tbl") + log_file = Path(f"{region_file}.log") + cat_file = Path(f"{region_file}.cat") + repeatmasker_cmd = repeatmasker_cmd.copy() + repeatmasker_cmd.append(str(region_file)) + logger.info(repeatmasker_cmd) + subprocess.run(repeatmasker_cmd, check=True) + _create_repeatmasker_gtf(output_file, region_results_file, region_name) + output_file.unlink() + region_file.unlink() + masked_file.unlink(missing_ok=True) + tbl_file.unlink(missing_ok=True) + log_file.unlink(missing_ok=True) + cat_file.unlink(missing_ok=True) + + +def _create_repeatmasker_gtf( # pylint: disable=too-many-locals + output_file: Path, + region_results_file: Path, + region_name: str, +) -> None: + """ + Read the fasta file and save the content in gtf format + + All the genomic slices are collected in a single gtf output with the following format: + SW perc perc perc query position in query matching repeat position in repeat + score div. del. ins. sequence begin end (left) repeat class/family begin end (left) ID + Args: + output_file : GTF file with final results. + region_results_file_path : GTF file with results per region. + region_name : Coordinates of genomic slice. + """ + with open(output_file, "r", encoding="utf8") as repeatmasker_in, open( + region_results_file, "w+", encoding="utf8" + ) as repeatmasker_out: + repeat_count = 1 + for line in repeatmasker_in: + result_match = re.search(r"^\s*\d+\s+", line) + if result_match: + results = line.split() + if results[-1] == "*": + results.pop() + if len(results) != 15: + continue + score = results[0] + start = results[5] + end = results[6] + strand = results[8] + repeat_name = results[9] + repeat_class = results[10] + if strand == "+": + repeat_start = results[11] + repeat_end = results[12] + else: + repeat_start = results[13] + repeat_end = results[12] + strand = "-" + gtf_line = ( + f"{region_name}\tRepeatMasker\trepeat\t{start}\t{end}\t.\t" + f"{strand}\t.\trepeat_id{repeat_count}; " + f'repeat_name "{repeat_name}"; repeat_class "{repeat_class}"; ' + f'repeat_start "{repeat_start}"; ' + f'repeat_end "{repeat_end}"; score "{score}";\n' + ) + repeatmasker_out.write(gtf_line) + repeat_count += 1 + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run RepeatMasker.""" + + genome_file = argschema.fields.InputFile( + required= True, description= "Genome file path" + ) + output_dir = argschema.fields.OutputDir( + required= True, description= "Output directory path" + ) + repeatmasker_bin = argschema.fields.String( + required= False, default= "RepeatMasker", + description = "RepeatMasker executable path", + + ) + library = argschema.fields.String( + required= False, default= "", description= "Custom repeat library" + ) + repeatmasker_engine = argschema.fields.String( + required= False, default= "rmblast", description= "RepeatMasker engine" + ) + species = argschema.fields.String( + required= False, + default="homo", + description="Species name (used if no library is provided)" + ) + num_threads = argschema.fields.Integer( + required= False, default= 1, description= "Number of threads" + ) + + +def main() -> None: + """RepeatMasker's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") /"repeatmasking.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig(loginipath, defaults={"logfilename": str(log_file_path)}, disable_existing_loggers=False,) + run_repeatmasker( + mod.args["genome_file"], + mod.args["output_dir"], + mod.args["repeatmasker_bin"], + mod.args["library"], + mod.args["repeatmasker_engine"], + mod.args["species"], + mod.args["num_threads"], + ) + +if __name__ == "__main__": + main() + +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/repeat_annotation/trf.html b/_modules/ensembl/tools/anno/repeat_annotation/trf.html new file mode 100644 index 0000000..187602c --- /dev/null +++ b/_modules/ensembl/tools/anno/repeat_annotation/trf.html @@ -0,0 +1,398 @@ + + + + + + + ensembl.tools.anno.repeat_annotation.trf — ensembl-anno 0.1 documentation + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.repeat_annotation.trf

+# See the NOTICE file distributed with this work for additional information #pylint: disable=missing-module-docstring
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+    Tandem Repeats Finder is a program to locate and display tandem repeats in DNA sequences.
+    Benson G. Tandem repeats finder: a program to analyze DNA sequences.
+    Nucleic Acids Res. 1999; 27(2):573–580. doi:10.1093/nar/27.2.573
+"""
+__all__ = ["run_trf"]
+
+import logging
+import logging.config
+import multiprocessing
+import os
+from os import PathLike
+from pathlib import Path
+import re
+import subprocess
+import tempfile
+from typing import List
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+    get_seq_region_length,
+    get_slice_id,
+    slice_output_to_gtf,
+    get_sequence,
+)
+
+logger = logging.getLogger(__name__)
+
+
+
+[docs] +def run_trf( + genome_file: PathLike, + output_dir: Path, + num_threads: int = 1, + trf_bin: Path = Path("trf"), + match_score: int = 2, + mismatch_score: int = 5, + delta: int = 7, + pm: int = 80, + pi: int = 10, + minscore: int = 40, + maxperiod: int = 500, +) -> None: + """ + Executes TRF on genomic slices + Args: + genome_file : Genome file path. + output_dir : working directory path. + num_threads: int, number of threads. + trf_bin : TRF software path. + match_score : Matching weight. + mismatch_score : Mismatching penalty. + delta : Indel penalty. + pm : Match probability (whole number). + pi : Indel probability (whole number). + minscore : Minimum alignment score to report. + maxperiod : Maximum period size to report. + """ + check_exe(trf_bin) + trf_dir = create_dir(output_dir, "trf_output") + os.chdir(str(trf_dir)) + output_file = trf_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "repeat") + if transcript_count > 0: + logger.info("Trf gtf file exists, skipping analysis") + return + logger.info("Creating list of genomic slices") + seq_region_to_length = get_seq_region_length(genome_file, 5000) + slice_ids_per_region = get_slice_id( + seq_region_to_length, slice_size=1000000, overlap=0, min_length=5000 + ) + trf_output_extension = ( + f".{match_score}.{mismatch_score}.{delta}." + f"{pm}.{pi}.{minscore}.{maxperiod}.dat" + ) + trf_cmd = [ + trf_bin, + None, + str(match_score), + str(mismatch_score), + str(delta), + str(pm), + str(pi), + str(minscore), + str(maxperiod), + "-d", + "-h", + ] + logger.info("Running TRF") + pool = multiprocessing.Pool(num_threads)#pylint:disable=consider-using-with + for slice_id in slice_ids_per_region: + pool.apply_async( + _multiprocess_trf, + args=( + trf_cmd, + slice_id, + trf_dir, + trf_output_extension, + genome_file, + ), + ) + pool.close() + pool.join() + slice_output_to_gtf(trf_dir, "repeat_id", "trf", True, ".trf.gtf") + for gtf_file in trf_dir.glob("*.trf.gtf"): + gtf_file.unlink()
+ + + +def _multiprocess_trf( + trf_cmd: List[str], + slice_id: List[str], + trf_dir: Path, + trf_output_extension: Path, + genome_file:Path, +) -> None: + """ + Run TRF on multiprocess on genomic slices + Args: + trf_cmd: TRF command to execute. + slice_id: Slice Id to run TRF on. + trf_dir : TRF output dir. + trf_output_extension: TRF file output extension. + genome_file : Genome file. + """ + region_name, start, end = slice_id + logger.info( + "Processing slice to find tandem repeats with TRF:%s:%s:%s", + region_name, + start, + end, + ) + seq = get_sequence(region_name, int(start), int(end), 1, genome_file, trf_dir) + slice_name = f"{region_name}.rs{start}.re{end}" + with tempfile.TemporaryDirectory(dir=trf_dir) as tmpdirname: + slice_file = trf_dir / tmpdirname / f"{slice_name}.fa" + with open(slice_file, "w+", encoding="utf8") as region_out: + region_out.write(f">{region_name}\n{seq}\n") + region_results = trf_dir / f"{slice_name}.trf.gtf" + # TRF writes to the current dir, so swtich to the output dir for it + # os.chdir(str(trf_output_dir)) + output_file = Path(f"{slice_file}{trf_output_extension}") + trf_cmd = trf_cmd.copy() + trf_cmd[1] = str(slice_file) + logger.info("trf_cmd: %s", trf_cmd) + # with open(trf_output_file_path, "w+") as trf_out: + subprocess.run(trf_cmd, cwd=trf_dir / tmpdirname)#pylint:disable=subprocess-run-check + _create_trf_gtf(output_file, region_results, region_name) + slice_file.unlink() + output_file.unlink() + + +def _create_trf_gtf( + output_file: Path, + region_results: Path, + region_name: str, +) -> None: + """ + Read the fasta file and save the content in gtf format + + TRF output format: + cols 1+2: Indices of the repeat relative to the start of the sequence + col 3: Period size of the repeat + col 4: Number of copies aligned with the consensus pattern + col 5: Size of consensus pattern (may differ slightly from the period size) + col 6: Percent of matches between adjacent copies overall + col 7: Percent of indels between adjacent copies overall + col 8: Alignment score + cols 9-12: Percent composition for each of the four nucleotides + col 13: Entropy measure based on percent composition + col 14: Consensus sequence + col 15: Repeat sequence + Args: + output_file : GTF file with final results. + region_results : GTF file with results per region. + region_name : Coordinates of genomic slice. + """ + with open(output_file, "r", encoding="utf8") as trf_in, open( + region_results, "w+", encoding="utf8" + ) as trf_out: + repeat_count = 1 + for line in trf_in: + result_match = re.search(r"^\d+", line) + if result_match: + results = line.split() + if len(results) != 15: + continue + start = results[0] + end = results[1] + period = float(results[2]) + copy_number = float(results[3]) + percent_matches = float(results[5]) + score = float(results[7]) + repeat_consensus = results[13] + if ( # pylint: disable=too-many-boolean-expressions + score < 50 + and percent_matches >= 80 + and copy_number > 2 + and period < 10 + ) or (copy_number >= 2 and percent_matches >= 70 and score >= 50): + gtf_line = ( + f"{region_name}\tTRF\trepeat\t{start}\t{end}\t.\t+\t.\t" + f'repeat_id "{repeat_count}"; score "{score}"; ' + f'repeat_consensus "{repeat_consensus}";\n' + ) + trf_out.write(gtf_line) + repeat_count += 1 + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run TRF.""" + + genome_file = argschema.fields.InputFile( + required=True, description="Genome file path" + ) + output_dir = argschema.fields.OutputDir( + required=True, description="Output directory path" + ) + trf_bin = argschema.fields.String( + required=False, + default="trf", + description="TRF executable path", + ) + match_score = argschema.fields.Integer( + required=False, default=2, description="Matching weight" + ) + mismatch_score = argschema.fields.Integer( + required=False, default=5, description="Mismatching penalty" + ) + delta = argschema.fields.Integer( + required=False, default=7, description="Indel penalty" + ) + pm = argschema.fields.Integer( + required=False, default=80, description="Match probability" + ) + pi = argschema.fields.Integer( + required=False, default=10, description="Indel probability" + ) + minscore = argschema.fields.Integer( + required=False, default=40, description="Minimum alignment score to report" + ) + maxperiod = argschema.fields.Integer( + required=False, default=500, description="Maximum period size to report" + ) + num_threads = argschema.fields.Integer( + required=False, default=1, description="Number of threads" + ) + + +def main() -> None: + """TRF's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "trf.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_trf( + mod.args["genome_file"], + mod.args["output_dir"], + mod.args["num_threads"], + mod.args["trf_bin"], + mod.args["match_score"], + mod.args["mismatch_score"], + mod.args["delta"], + mod.args["pm"], + mod.args["pi"], + mod.args["minscore"], + mod.args["maxperiod"], + ) + + +if __name__ == "__main__": + main() +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/simple_feature_annotation/cpg.html b/_modules/ensembl/tools/anno/simple_feature_annotation/cpg.html new file mode 100644 index 0000000..015bc80 --- /dev/null +++ b/_modules/ensembl/tools/anno/simple_feature_annotation/cpg.html @@ -0,0 +1,363 @@ + + + + + + + ensembl.tools.anno.simple_feature_annotation.cpg — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.simple_feature_annotation.cpg

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+Set of discriminant functions that can recognize structural and compositional features
+such as CpG islands, promoter regions and first splice-donor sites.
+Davuluri RV, Grosse I, Zhang MQ: Computational identification of promoters and
+first exons in the human genome. Nat Genet. 2001, 29(4):412-417. [PMID: 11726928]
+"""
+__all__ = ["run_cpg"]
+import logging
+import logging.config
+import multiprocessing
+from os import PathLike
+from pathlib import Path
+import re
+import subprocess
+from tempfile import TemporaryDirectory
+from typing import List,Union
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+    get_seq_region_length,
+    get_slice_id,
+    slice_output_to_gtf,
+    get_sequence,
+)
+
+logger = logging.getLogger(__name__)
+
+
+
+[docs] +def run_cpg( + genome_file: PathLike, + output_dir: Path, + cpg_bin: Path = Path("cpg_lh"), + cpg_min_length: int = 400, + cpg_min_gc_content: int = 50, + cpg_min_oe: float = 0.6, + num_threads: int = 1, +) -> None: + """ + Run CpG islands on genomic slices + Args: + genome_file : Genome file path. + output_dir : Working directory path + cpg_bin : CpG software path. + cpg_min_length : Min length of CpG islands + cpg_min_gc_content : Min GC frequency percentage + cpg_min_oe : Min ratio of the observed to expected number of CpG (CpGo/e) + num_threads: int, number of threads. + """ + + check_exe(cpg_bin) + cpg_dir = create_dir(output_dir, "cpg_output") + output_file = cpg_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "simple_feature") + if transcript_count > 0: + logger.info("Cpg gtf file exists") + return + logger.info("Creating list of genomic slices") + seq_region_to_length = get_seq_region_length(genome_file, 5000) + slice_ids_per_region = get_slice_id( + seq_region_to_length, slice_size=1000000, overlap=0, min_length=5000 + ) + logger.info("Running CpG") + pool = multiprocessing.Pool(int(num_threads)) # pylint:disable=consider-using-with + for slice_id in slice_ids_per_region: + pool.apply_async( + _multiprocess_cpg, + args=( + cpg_bin, + slice_id, + genome_file, + cpg_dir, + cpg_min_length, + cpg_min_gc_content, + cpg_min_oe, + ), + ) + + pool.close() + pool.join() + slice_output_to_gtf(cpg_dir, "feature_id", "cpg", True, ".cpg.gtf") + for gtf_file in cpg_dir.glob("*.cpg.gtf"): + gtf_file.unlink()
+ + + +def _multiprocess_cpg( + cpg_bin: Path, + slice_id: List[str], + genome_file: Path, + cpg_dir: Path, + cpg_min_length: int = 400, + cpg_min_gc_content: int = 50, + cpg_min_oe: float = 0.6, +) -> None: + """ + Annotation of CpG islands on multiprocess on genomic slices + Args: + cpg_bin: CpG software path. + slice_id: Slice id to run CpG on. + genome_file : Genome file. + cpg_dir : Output dir. + cpg_min_length : Min length of CpG islands + cpg_min_gc_content : Min GC frequency percentage + cpg_min_oe : Min ratio of the observed to expected number of CpG (CpGo/e) + """ + region_name, start, end = slice_id + logger.info( + "Processing slice to find CpG islands with cpg_lh: %s:%s:%s", + region_name, + start, + end, + ) + seq = get_sequence(region_name, int(start), int(end), 1, genome_file, cpg_dir) + slice_name = f"{region_name}.rs{start}.re{end}" + #with TemporaryDirectory(dir=cpg_dir) as tmpdirname: + slice_file = cpg_dir / f"{slice_name}.fa" + with open(slice_file, "w+", encoding="utf8") as region_out: + region_out.write(f">{region_name}\n{seq}\n") + region_results = cpg_dir / f"{slice_file}.cpg.gtf" + output_file = Path(f"{slice_file}.cpg") + cpg_cmd = [str(cpg_bin), str(slice_file)] + with open(output_file, "w+", encoding="utf8") as cpg_out: + subprocess.run(cpg_cmd, stdout=cpg_out, check=True) + _create_cpg_gtf( + output_file, + region_results, + region_name, + cpg_min_length, + cpg_min_gc_content, + cpg_min_oe, + ) + slice_file.unlink() + output_file.unlink() + + +def _create_cpg_gtf( + output_file: Path, + region_results: Path, + region_name: str, + cpg_min_length: int = 400, + cpg_min_gc_content: int = 50, + cpg_min_oe: float = 0.6, +) -> None: + """ + Read the fasta file and save the content in gtf format + All the genomic slices are collected in a single gtf output + Args: + output_file : GTF file with final results. + region_results : GTF file with the results per region. + region_name :Coordinates of genomic slice. + cpg_dir : Output dir. + cpg_min_length : Min length of CpG islands + cpg_min_gc_content : Min GC frequency percentage + cpg_min_oe : Min ratio of the observed to expected number of CpG (CpGo/e) + """ + with open(output_file, "r", encoding="utf8") as cpg_in, open(region_results, "w+", encoding="utf8") as cpg_out: + feature_count = 1 + for line in cpg_in: + result_match = re.search(r"^" + region_name, line) + if result_match: + results = line.split() + start = int(results[1]) + end = int(results[2]) + length = end - start + 1 + score = float(results[3]) + gc_content = float(results[6]) + oe_score_str = results[7] + oe_score: Union[float, int] + if oe_score_str in ("-", "inf"): + oe_score=0 + else: + oe_score=float(oe_score_str) + if ( + int(length) >= int(cpg_min_length) + and gc_content >= int(cpg_min_gc_content) + and oe_score >= float(cpg_min_oe) + ): + gtf_line = ( + f"{region_name}\tCpG\tsimple_feature\t{start}\t" + f'{end}\t.\t+\t.\tfeature_id "{feature_count}"; score "{score}";\n' + ) + cpg_out.write(gtf_line) + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run CpG software.""" + + genome_file = argschema.fields.InputFile( + required=True, description="Genome file path" + ) + output_dir = argschema.fields.OutputDir( + required=True, description="Output directory path" + ) + cpg_bin = argschema.fields.String( + required=False, + default="cpg_lh", + description="CpG executable path", + ) + cpg_min_length = argschema.fields.Integer( + required=False, + default="400", + description="Min length of CpG islands", + ) + cpg_min_gc_content = argschema.fields.Integer( + required=False, + default="50", + description="Min GC frequency percentage", + ) + cpg_min_oe = argschema.fields.Float( + required=False, + default="0.6", + description="Min ratio of the observed to expected number of CpG (CpGo/e)", + ) + num_threads = argschema.fields.Integer( + required=False, default=1, description="Number of threads" + ) + + +def main() -> None: + """CpG's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "cpg.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_cpg( + mod.args["genome_file"], + mod.args["output_dir"], + mod.args["cpg_bin"], + mod.args["cpg_min_length"], + mod.args["cpg_min_gc_content"], + mod.args["cpg_min_oe"], + mod.args["num_threads"], + ) +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/simple_feature_annotation/eponine.html b/_modules/ensembl/tools/anno/simple_feature_annotation/eponine.html new file mode 100644 index 0000000..23a3e09 --- /dev/null +++ b/_modules/ensembl/tools/anno/simple_feature_annotation/eponine.html @@ -0,0 +1,348 @@ + + + + + + + ensembl.tools.anno.simple_feature_annotation.eponine — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.simple_feature_annotation.eponine

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+Eponine is a probabilistic method for detecting transcription start sites (TSS)
+in mammalian genomic sequence, with good specificity and excellent positional accuracy.
+Down TA, Hubbard TJ. Computational detection and location of transcription start sites
+in mammalian genomic DNA. Genome Res. 2002 Mar;12(3):458-61. doi: 10.1101/gr.216102.
+PMID: 11875034; PMCID: PMC155284.
+"""
+__all__ = ["run_eponine"]
+
+import logging
+import logging.config
+import multiprocessing
+import os
+from os import PathLike
+from pathlib import Path
+import re
+import subprocess
+from tempfile import TemporaryDirectory
+from typing import List
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    check_file,
+    create_dir,
+    check_gtf_content,
+    get_sequence,
+    get_seq_region_length,
+    get_slice_id,
+    slice_output_to_gtf,
+)
+
+logger = logging.getLogger("__name__")
+
+
+
+[docs] +def run_eponine( + genome_file: PathLike, + output_dir: Path, + num_threads: int = 1, + java_bin: Path = Path("java"), + eponine_bin: Path = Path( + "/hps/software/users/ensembl/ensw/C8-MAR21-sandybridge/linuxbrew/opt/eponine/libexec/eponine-scan.jar" + ), + eponine_threshold: float = 0.999, +) -> None: + """ + Run Eponine on genomic slices + Args: + genome_file : Genome file path. + output_dir : Working directory path. + java_bin : Java path. + eponine_bin : Eponine software path + num_threads: Number of threads. + """ + check_file(eponine_bin) + check_exe(java_bin) + eponine_dir = create_dir(output_dir, "eponine_output") + # os.chdir(str(eponine_dir)) + output_file = eponine_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "simple_feature") + if transcript_count > 0: + logger.info("Eponine gtf file exists, skipping analysis") + return + logger.info("Creating list of genomic slices") + seq_region_to_length = get_seq_region_length(genome_file, 5000) + slice_ids_per_region = get_slice_id( + seq_region_to_length, slice_size=1000000, overlap=0, min_length=5000 + ) + + eponine_cmd = [ + str(java_bin), + "-jar", + str(eponine_bin), + "-threshold", + str(eponine_threshold), + "-seq", + ] + logger.info("Running Eponine") + pool = multiprocessing.Pool(int(num_threads)) # pylint:disable=consider-using-with + for slice_id in slice_ids_per_region: + pool.apply_async( + _multiprocess_eponine, + args=( + eponine_cmd, + slice_id, + eponine_dir, + Path(genome_file), + ), + ) + pool.close() + pool.join() + slice_output_to_gtf(eponine_dir, "feature_id", "eponine", True, ".epo.gtf") + for gtf_file in eponine_dir.glob("*.epo.gtf"): + gtf_file.unlink()
+ + + +def _multiprocess_eponine( + eponine_cmd: List[str], + slice_id: List[str], + eponine_dir: Path, + genome_file: Path, +) -> None: + """ + Run Eponine on multiprocess on genomic slices + Args: + eponine_cmd: Eponine command to execute. + slice_id: List of slice IDs. + eponine_dir : Eponine output directory path. + genome_file : Genome file. + """ + region_name, start, end = slice_id + logger.info( + "Processing slice to find transcription start sites with Eponine: %s:%s:%s", + region_name, + start, + end, + ) + seq = get_sequence(region_name, int(start), int(end), 1, genome_file, eponine_dir) + slice_name = f"{region_name}.rs{start}.re{end}" + #with tempfile.TemporaryDirectory(dir=eponine_dir) as tmpdirname: + slice_file = eponine_dir / f"{slice_name}.fa" + with open(slice_file, "w+", encoding="utf8") as region_out: + region_out.write(f">{region_name}\n{seq}\n") + region_results = eponine_dir / f"{slice_name}.epo.gtf" + output_file = Path(f"{slice_file}.epo") + eponine_cmd = eponine_cmd.copy() + eponine_cmd.append(str(slice_file)) + logging.info(eponine_cmd) + with open(output_file, "w+", encoding="utf8") as eponine_out: + subprocess.run(eponine_cmd, stdout=eponine_out, check=True) + _create_eponine_gtf(output_file, region_results, region_name) + slice_file.unlink() + output_file.unlink() + + +def _create_eponine_gtf( + output_file: Path, + region_results: Path, + region_name: str, +) -> None: + """ + Read the fasta file and save the content in gtf format + All the genomic slices are collected in a single gtf output + Args: + output_file: GTF file with final results. + region_results: GTF file with the results per region. + region_name: Coordinates of genomic slice. + """ + with open(output_file, "r", encoding="utf8") as eponine_in, open( + region_results, "w+", encoding="utf8" + ) as eponine_out: + feature_count = 1 + for line in eponine_in: + result_match = re.search(r"^" + region_name, line) + if result_match: + results = line.split() + start = int(results[3]) + end = int(results[4]) + score = float(results[5]) + strand = results[6] + logging.info(results) + # There's a one base offset on the reverse strand + if strand == "-": + start -= 1 + end -= 1 + + gtf_line = ( + f"{region_name}\tEponine\tsimple_feature\t" + f"{start}\t{end}\t.\t{strand}\t.\t" + f'feature_id "{feature_count}"; score "{score}";\n' + ) + eponine_out.write(gtf_line) + feature_count += 1 + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run Eponine.""" + + genome_file = argschema.fields.InputFile( + required=True, description="Genome file path" + ) + output_dir = argschema.fields.OutputDir( + required=True, description="Output directory path" + ) + num_threads = argschema.fields.Integer( + required=False, default=1, description="Number of threads" + ) + java_bin = argschema.fields.String( + required=False, + default="java", + description="Java executable path", + ) + eponine_bin = argschema.fields.String( + required=False, + default="/hps/software/users/ensembl/ensw/C8-MAR21-sandybridge/linuxbrew/opt/eponine/libexec/eponine-scan.jar", # pylint:disable=line-too-long + description="Java executable path", + ) + eponine_threashold = argschema.fields.Float( + required=False, default=0.999, description="Eponine threashold" + ) + + +def main() -> None: + """Eponine's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "eponine.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_eponine( + mod.args["genome_file"], + mod.args["output_dir"], + mod.args["num_threads"], + Path(mod.args["java_bin"]), + Path(mod.args["eponine_bin"]), + mod.args["eponine_threashold"], + ) + + +if __name__ == "__main__": + main() +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/snc_rna_annotation/trnascan.html b/_modules/ensembl/tools/anno/snc_rna_annotation/trnascan.html new file mode 100644 index 0000000..fe91f78 --- /dev/null +++ b/_modules/ensembl/tools/anno/snc_rna_annotation/trnascan.html @@ -0,0 +1,399 @@ + + + + + + + ensembl.tools.anno.snc_rna_annotation.trnascan — ensembl-anno 0.1 documentation + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.snc_rna_annotation.trnascan

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""
+tRNAscan-SE identifies 99-100% of transfer RNA genes in DNA sequence while
+giving less than one false positive per 15 gigabases.
+Lowe TM, Eddy SR: tRNAscan-SE: a program for improved detection of transfer
+RNA genes in genomic sequence.
+Nucleic Acids Res. 1997, 25(5):955-64. [PMID: 9023104]
+"""
+__all__ = ["run_trnascan"]
+
+import logging
+import logging.config
+import multiprocessing
+from os import PathLike
+from pathlib import Path
+import re
+import subprocess
+from typing import List
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    check_file,
+    create_dir,
+    check_gtf_content,
+    get_seq_region_length,
+    get_slice_id,
+    slice_output_to_gtf,
+    get_sequence,
+)
+
+logger = logging.getLogger(__name__)
+
+
+
+[docs] +def run_trnascan( + genome_file: PathLike, + output_dir: Path, + trnascan_bin: Path = Path("tRNAscan-SE"), + trnascan_filter: Path = Path("EukHighConfidenceFilter"), + num_threads: int = 1, +) -> None: + """ + Executes tRNAscan-SE on genomic slices + Args: + genome_file : Genome file path. + trnascan_bin : tRNAscan-SE software path. + trnascan_filter : tRNAscan-SE filter set path. + output_dir : working directory path. + num_threads: int, number of threads. + """ + check_exe(trnascan_bin) + check_file(trnascan_filter) + trnascan_dir = create_dir(output_dir, "trnascan_output") + output_file = trnascan_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "transcript") + if transcript_count > 0: + logger.info("Trnascan gtf file exists, skipping analysis") + return + logger.info("Creating list of genomic slices") + seq_region_to_length = get_seq_region_length(genome_file, 5000) + slice_ids_per_region = get_slice_id(seq_region_to_length, 1000000, 0, 5000) + trnascan_cmd = [ + str(trnascan_bin), + None, + "-o", + None, + "-f", + None, + "-H", # show both primary and secondary structure components to covariance model bit scores + "-q", # quiet mode + "--detail", + "-Q", + ] + logger.info("Running tRNAscan-SE") + pool = multiprocessing.Pool(num_threads) # pylint: disable=consider-using-with + for slice_id in slice_ids_per_region: + pool.apply_async( + _multiprocess_trnascan, + args=( + trnascan_cmd, + slice_id, + genome_file, + trnascan_filter, + trnascan_dir, + ), + ) + + pool.close() + pool.join() + slice_output_to_gtf( + output_dir=trnascan_dir, unique_ids=True, file_extension=".trna.gtf" + ) + for gtf_file in trnascan_dir.glob("*.trna.gtf"): + gtf_file.unlink()
+ + + +def _multiprocess_trnascan( + trnascan_cmd: List[str], + slice_id: List[str], + genome_file: Path, + trnascan_filter: Path, + trnascan_dir: Path, +) -> None: + """ + Run tRNAscan-SE on multiprocess on genomic slices + Args: + trnascan_cmd: tRNAscan-SE command to execute. + slice_id: Slice Id to run tRNAscan-SE on. + genome_file : Genome file. + trnascan_dir : tRNAscan-SE output dir. + trnascan_filter: tRNAscan-SE filter set. + """ + region_name, start, end = slice_id + logger.info( + "Processing slice to find tRNAs using tRNAscan-SE:%s:%s:%s", + region_name, + start, + end, + ) + seq = get_sequence(region_name, int(start), int(end), 1, genome_file, trnascan_dir) + slice_name = f"{region_name}.rs{start}.re{end}" + slice_file = trnascan_dir / f"{slice_name}.fa" + with open(slice_file, "w+", encoding="utf8") as region_out: + region_out.write(f">{region_name}\n{seq}\n") + # trnscan output + region_results = trnascan_dir / f"{slice_name}.trna.gtf" + output_file = Path(f"{slice_file}.trna") + ss_output_file = Path(f"{output_file}.ss") + # filtering + filter_prefix_file = f"{slice_name}.filt" + filter_output_file = trnascan_dir / f"{filter_prefix_file}.out" + filter_log_file = trnascan_dir / f"{filter_prefix_file}.log" + filter_ss_file = trnascan_dir / f"{filter_prefix_file}.ss" + # trnascan_cmd = generic_trnascan_cmd.copy() + trnascan_cmd[1], trnascan_cmd[3], trnascan_cmd[5] = ( + str(slice_file), + str(output_file), + str(ss_output_file), + ) + logger.info("tRNAscan-SE command: %s", " ".join(trnascan_cmd)) + subprocess.run(trnascan_cmd, check=True) + # If the trnascan output is empty there is no need to go on with filtering + if output_file.stat().st_size == 0: + output_file.unlink() + slice_file.unlink() + ss_output_file.unlink(missing_ok=True) + return + + filter_cmd = [ + str(trnascan_filter), + "--result", # tRNAscan-SE output file used as input + str(output_file), + "--ss", # tRNAscan-SE secondary structure file used as input + str(ss_output_file), + "--output", + str(trnascan_dir), + "--prefix", + str(filter_prefix_file), + ] + logger.info( + "tRNAscan-SE filter command: %s", " ".join(str(item) for item in filter_cmd) + ) + subprocess.run(filter_cmd)#pylint:disable=subprocess-run-check + _create_trnascan_gtf(region_results, filter_output_file, region_name) + output_file.unlink(missing_ok=True) + slice_file.unlink(missing_ok=True) + ss_output_file.unlink(missing_ok=True) + Path(filter_prefix_file).unlink(missing_ok=True) + filter_log_file.unlink(missing_ok=True) + filter_ss_file.unlink(missing_ok=True) + filter_output_file.unlink(missing_ok=True) + + +def _create_trnascan_gtf( + region_results: Path, filter_output_file: Path, region_name: str +) -> None: + """ + Read the fasta file and save the content in gtf format + All the genomic slices are collected in a single gtf output + Args: + region_results : GTF file with the results per region. + filter_file : GTF file with the filtered results per region. + region_name :Coordinates of genomic slice. + + tRNAscan-SE output format: + col0: GtRNAdb Gene Symbol - gene ID in corresponding genome + col1: tRNAscan-SE ID - tRNA ID in tRNAscan-SE prediction results + col2-3: Locus - Genomic coordinates of predicted gene + col4: Isotype (from Anticodon) - tRNA isotype determined by anticodon + col5: Anticodon - anticodon of predicted tRNA gene + col6-7: Intron boundaries + col8: General tRNA Model Score - covariance model bit score from tRNAscan-SE results + col9: Best Isotype Model - best matching (highest scoring) isotype determined + by isotype-specific covariance model classification + col10-11-12: Anticodon and Isotype Model Agreement - consistency between anticodon + from predicted gene sequence and best isotype model + col13: Features - special gene features that may include gene set categorization, + number of introns, possible pseudogenes, possible truncation, or base-pair mismatches + """ + with open(filter_output_file, "r", encoding="utf8") as trna_in, open( + region_results, "w+", encoding="utf8" + ) as trna_out: + gene_counter = 1 + for line in trna_in: + result_match = re.search(r"^" + region_name, line) + if result_match: + results = line.split() + start = int(results[2]) + end = int(results[3]) + strand = "+" + if start > end: + strand = "-" + start, end = end, start + biotype = ( + "tRNA" + if re.search(r"high confidence set", line) + else "tRNA_pseudogene" + ) + transcript_string = ( + f"{region_name}\ttRNAscan\ttranscript\t{start}\t{end}\t.\t" + f'{strand}\t.\tgene_id "{gene_counter}"; transcript_id ' + f'"{gene_counter}"; biotype "{biotype}";\n' + ) + exon_string = ( + f"{region_name}\ttRNAscan\texon\t{start}\t{end}\t.\t" + f'{strand}\t.\tgene_id "{gene_counter}"; transcript_id ' + f'"{gene_counter}"; exon_number "1"; biotype "{biotype}";\n' + ) + trna_out.write(transcript_string) + trna_out.write(exon_string) + trna_out.flush() + gene_counter += 1 + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run tRNAscan-SE.""" + + genome_file = argschema.fields.InputFile( + required=True, description="Genome file path" + ) + trnascan_bin = argschema.fields.String( + required=False, + default="tRNAscan-SE", + description="tRNAscan-SE executable path", + ) + trnascan_filter = argschema.fields.String( + required=False, + default="/hps/software/users/ensembl/ensw/C8-MAR21-sandybridge/linuxbrew/bin/EukHighConfidenceFilter", + description="tRNAscan-SE filter path", + ) + output_dir = argschema.fields.OutputDir( + required=True, description="Output directory path" + ) + num_threads = argschema.fields.Integer( + required=False, default=1, description="Number of threads" + ) + + +def main() -> None: + """tRNAscan-SE's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "trnascan.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_trnascan( + mod.args["genome_file"], + mod.args["output_dir"], + mod.args["trnascan_bin"], + Path(mod.args["trnascan_filter"]), + mod.args["num_threads"], + ) + + +if __name__ == "__main__": + main() +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/transcriptomic_annotation/minimap.html b/_modules/ensembl/tools/anno/transcriptomic_annotation/minimap.html new file mode 100644 index 0000000..190d992 --- /dev/null +++ b/_modules/ensembl/tools/anno/transcriptomic_annotation/minimap.html @@ -0,0 +1,365 @@ + + + + + + + ensembl.tools.anno.transcriptomic_annotation.minimap — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.transcriptomic_annotation.minimap

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Minimap2 is a pairwise sequence alignment algorithm designed for efficiently comparing nucleotide sequences.
+The algorithm uses a versatile indexing strategy to quickly find approximate matches between sequences, 
+allowing it to efficiently align long sequences against reference genomes or other sequences.
+
+Li, H. (2018). Minimap2: pairwise alignment for nucleotide sequences. Bioinformatics, 34(18), 3094-3100.
+"""
+
+__all__ = ["run_minimap2"]
+import logging
+import logging.config
+from pathlib import Path
+import subprocess
+from typing import List
+import argschema
+
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+)
+
+
+
+[docs] +def run_minimap2( + output_dir: Path, + long_read_fastq_dir: Path, + genome_file: Path, + minimap2_bin: Path = Path("minimap2"), + paftools_bin: Path = Path("paftools.js"), + max_intron_length: int = 100000, + num_threads: int = 1, +) -> None: + """ + Run Minimap2 to align long read data against genome file. + Default Minimap set for PacBio data. + Args: + output_dir : Working directory path. + long_read_fastq_dir : Long read directory path. + genome_file : Genome file path. + minimap2_bin : Software path. + paftools_bin : Software path. + max_intron_length : The maximum intron size for alignments. Defaults to 100000. + num_threads : Number of available threads. + """ + check_exe(minimap2_bin) + check_exe(paftools_bin) + minimap2_dir = create_dir(output_dir, "minimap2_output") + + logging.info("Skip analysis if the gtf file already exists") + output_file = minimap2_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "transcript") + if transcript_count > 0: + logging.info("Minimap2 gtf file exists, skipping analysis") + return + minimap2_index_file = minimap2_dir / f"{genome_file.name}.mmi" + # minimap2_hints_file = minimap2_dir /"minimap2_hints.gff" + file_types = ("*.fastq", "*.fq") + fastq_file_list = [ + path for file_type in file_types for path in Path(long_read_fastq_dir).rglob(file_type) + ] + if len(fastq_file_list) == 0: + raise IndexError(f"The list of fastq files is empty. Fastq dir:\n{long_read_fastq_dir}") + + if not minimap2_index_file.exists(): + logging.info("Did not find an index file for minimap2. Will create now") + try: + subprocess.run( # pylint:disable=subprocess-run-check + [ + minimap2_bin, + "-t", + str(num_threads), + "-d", + str(minimap2_index_file), + genome_file, + ] + ) + except subprocess.CalledProcessError as e: + logging.error("An error occurred while creating minimap2 index: %s", e) + except OSError as e: + logging.error("An OS error occurred: %s", e) + + logging.info("Running minimap2 on the files in the long read fastq dir") + for fastq_file in fastq_file_list: + sam_file = minimap2_dir / f"{fastq_file.name}.sam" + bed_file = minimap2_dir / f"{fastq_file.name}.bed" + logging.info("Processing %s", fastq_file) + with open(bed_file, "w+", encoding="utf8") as bed_file_out: + subprocess.run( # pylint:disable=subprocess-run-check + [ + minimap2_bin, + "-G", + str(max_intron_length), + "-t", + str(num_threads), + "--cs", + "--secondary=no", + "-ax", + "splice", + "-u", + "b", + minimap2_index_file, + fastq_file, + "-o", + sam_file, + ] + ) + logging.info("Creating bed file from SAM") + subprocess.run( + [paftools_bin, "splice2bed", sam_file], stdout=bed_file_out + ) # pylint:disable=subprocess-run-check + + bed_to_gtf(minimap2_dir) + + logging.info("Completed running minimap2")
+ + + +def bed_to_gtf(output_dir: Path) -> None: + """ + Convert bed file into gtf file + Args: + output_dir : Working directory path. + """ + gtf_file_path = output_dir / "annotation.gtf" + with open(gtf_file_path, "w+", encoding="utf8") as gtf_out: + gene_id = 1 + for bed_file in output_dir.glob("*.bed"): + logging.info("Converting bed to GTF: %s", str(bed_file)) + with open(bed_file, "r", encoding="utf8") as bed_in: + for line in bed_in: + elements = line.rstrip().split("\t") + seq_region_name = elements[0] + offset = int(elements[1]) + strand = elements[5] + # sizes of individual block of exons + block_sizes = [size for size in elements[10].split(",") if size] + block_starts = [size for size in elements[11].split(",") if size] + exons = bed_block_to_exons(block_sizes, block_starts, offset) + transcript_start = None + transcript_end = None + exon_records = [] + for i, exon_coords in enumerate(exons): + if transcript_start is None or exon_coords[0] < transcript_start: + transcript_start = exon_coords[0] + + if transcript_end is None or exon_coords[1] > transcript_end: + transcript_end = exon_coords[1] + + exon_line = ( + f"{seq_region_name}\tminimap\texon\t{exon_coords[0]}\t" + f"{exon_coords[1]}\t.\t{strand}\t.\t" + f'gene_id "minimap_{gene_id}"; transcript_id "minimap_{gene_id}"; ' + f'exon_number "{i+ 1}";\n' + ) + exon_records.append(exon_line) + transcript_line = ( + f"{seq_region_name}\tminimap\ttranscript\t{transcript_start}\t" + f"{transcript_end}\t.\t{strand}\t.\t" + f'gene_id "minimap_{gene_id}"; transcript_id "minimap_{gene_id}"\n' + ) + gtf_out.write(transcript_line) + for exon_line in exon_records: + gtf_out.write(exon_line) + gene_id += 1 + + +def bed_block_to_exons(block_sizes: List, block_starts: List, offset: int) -> List: + """ + Extract exon size and start from exon feature block + Args: + block_sizes : Block feature size. + block_starts : Block feature starts. + offset : Feature offset. + + Returns: + List of exon coordinates + """ + exons = [] + for i, _ in enumerate(block_sizes): + block_start = offset + int(block_starts[i]) + 1 + block_end = block_start + int(block_sizes[i]) - 1 + if block_end < block_start: + logging.warning("Warning: block end is less than block start, skipping exon") + continue + exon_coords = [str(block_start), str(block_end)] + exons.append(exon_coords) + return exons + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run Minimap2 software.""" + + output_dir = argschema.fields.OutputDir(required=True, description="Output directory path") + long_read_fastq_dir = argschema.fields.String( + required=True, + description="Long read directory path", + ) + genome_file = argschema.fields.InputFile(required=True, description="Genome file path") + minimap2_bin = argschema.fields.String( + required=False, + default="minimap2", + description="Minimap2 software path", + ) + paftools_bin = argschema.fields.String( + required=False, + default="paftools.js", + description="Paftools software path", + ) + max_intron_length = argschema.fields.Integer( + required=False, + default="100000", + description="The maximum intron length.", + ) + max_intron_length = argschema.fields.Integer( + required=False, + default="100000", + description="The maximum intron size for alignments.", + ) + num_threads = argschema.fields.Integer(required=False, default=1, description="Number of threads") + + +def main() -> None: + """Minimap2's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "minimap.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_minimap2( + mod.args["output_dir"], + mod.args["long_read_fastq_dir"], + mod.args["genome_file"], + mod.args["minimap2_bin"], + mod.args["paftools_bin"], + mod.args["max_intron_length"], + mod.args["num_threads"], + ) +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/transcriptomic_annotation/scallop.html b/_modules/ensembl/tools/anno/transcriptomic_annotation/scallop.html new file mode 100644 index 0000000..44ae968 --- /dev/null +++ b/_modules/ensembl/tools/anno/transcriptomic_annotation/scallop.html @@ -0,0 +1,305 @@ + + + + + + + ensembl.tools.anno.transcriptomic_annotation.scallop — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.transcriptomic_annotation.scallop

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Scallop is a high-performance tool designed for the accurate and efficient quantification 
+of transcriptome assembly. 
+It's capable of handling large-scale transcriptomic data while providing precise estimates 
+of transcript abundances.
+Scallop's algorithmic approach allows it to efficiently reconstruct transcript structures 
+and quantify their expression levels, making it a valuable resource for studying gene 
+expression and transcriptome analysis.
+
+Shao M, Kingsford C. Accurate assembly of transcripts through phase-preserving graph 
+decomposition. Nat Biotechnol.
+2017 Dec;35(12):1167-1169. doi: 10.1038/nbt.4020. Epub 2017 Nov 13. PMID: 29131147; PMCID: PMC5722698.
+"""
+
+__all__ = ["run_scallop"]
+import logging
+import logging.config
+from pathlib import Path
+import re
+import subprocess
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+)
+
+
+
+[docs] +def run_scallop( + output_dir: Path, + scallop_bin: Path = Path("scallop"), + prlimit_bin: Path = Path("prlimit"), + stringtie_bin: Path = Path("stringtie"), + memory_limit: int = 40 * 1024**3, +) -> None: + """ + Run Scallop assembler on short read data after STAR alignment. + + Args: + output_dir : Working directory path. + scallop_bin : Software path. + prlimit_bin : Software path. + stringtie_bin : Software path. + memory_limit : Memory limit Scallop command Defaults to 40*1024**3. + """ + check_exe(scallop_bin) + check_exe(stringtie_bin) + scallop_dir = create_dir(output_dir, "scallop_output") + logging.info("Skip analysis if the gtf file already exists") + output_file = scallop_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "transcript") + if transcript_count > 0: + logging.info("Scallop gtf file exists, skipping analysis") + return + + star_dir = output_dir / "star_output" + + if star_dir.exists() and len(list(star_dir.glob("*.bam"))) != 0: + for sorted_bam_file in star_dir.glob("*.bam"): + transcript_file_name = re.sub(".bam", ".scallop.gtf", sorted_bam_file.name) + transcript_file = scallop_dir / transcript_file_name + if transcript_file.exists(): + logging.info( + "Found an existing stringtie gtf file, will not overwrite. \ + File found: %s", + transcript_file, + ) + else: + logging.info("Running Scallop on: %s", sorted_bam_file.name) + try: + scallop_cmd = [ + scallop_bin, + "-i", + sorted_bam_file, + "-o", + transcript_file, + "--min_flank_length", + "10", + ] + if memory_limit is not None: + scallop_cmd = prlimit_command(prlimit_bin, scallop_cmd, memory_limit) + subprocess.check_output(scallop_cmd, stderr=subprocess.STDOUT, universal_newlines=True) + # This combines the standard output and error streams into a single + # string and ensures that the output is in text mode + + except subprocess.CalledProcessError as ex: + logging.error("Error occurred while running Scallop:") + logging.error("Command: %s\n", " ".join(scallop_cmd)) + logging.error("Return code: %s\n", str(ex.returncode)) + logging.error("Output and error messages: %s\n", ex.output) + else: + raise IndexError(f"The list of sorted bam files is empty, Star output dir: {star_dir}") + + # Now need to merge + logging.info("Merge Scaalop's output.") + scallop_merge(scallop_dir, stringtie_bin)
+ + + +def scallop_merge(scallop_dir: Path, stringtie_bin: Path = Path("stringtie")) -> None: + """ + Merge Scallop result in a single gtf file + + scallop_dir : Input directory's path. + stringtie_bin : Software path. + """ + scallop_input_to_file = scallop_dir / "scallop_assemblies.txt" + scallop_merge_output_file = scallop_dir / "annotation.gtf" + with open(scallop_input_to_file, "w+", encoding="utf8") as gtf_list_out: + for gtf_file in scallop_dir.glob("*.scallop.gtf"): + transcript_count = check_gtf_content(gtf_file, "transcript") + if transcript_count > 0: + gtf_list_out.write(gtf_file + "\n") + else: + logging.warning("Warning, skipping file with no transcripts. Path:%s\n", gtf_file) + + try: + subprocess.check_output( + [ + stringtie_bin, + "--merge", + "-o", + scallop_merge_output_file, + scallop_input_to_file, + ], + stderr=subprocess.STDOUT, + text=True, + ) + + except subprocess.CalledProcessError as e: + print("StringTie execution failed with an error:%s", e.output) + + +def prlimit_command(prlimit_bin, command_list, virtual_memory_limit) -> list: + """ + Prepend memory limiting arguments to a command list to be run with subprocess. + + This method uses the `prlimit` program to set the memory limit. + + The `virtual_memory_limit` size is in bytes. + + prlimit arguments: + -v, --as[=limits] + Address space limit. + """ + return [str(prlimit_bin), f"-v{virtual_memory_limit}"] + command_list + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run StringTie software.""" + + output_dir = argschema.fields.OutputDir(required=True, description="Output directory path") + scallop_bin = argschema.fields.String( + required=False, + default="scallop", + description="Scallop software path", + ) + prlimit_bin = argschema.fields.String( + required=False, + default="prlimit", + description="Prlimit software path", + ) + memory_limit = argschema.fields.Integer( + required=False, default=40 * 1024**3, description="Memory's limit for Scallop command" + ) + + +def main() -> None: + """Scallop's entry-point. :no-index:""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "scallop.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_scallop( + mod.args["output_dir"], mod.args["scallop_bin"], mod.args["prlimit_bin"], mod.args["memory_limit"] + ) +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/transcriptomic_annotation/star.html b/_modules/ensembl/tools/anno/transcriptomic_annotation/star.html new file mode 100644 index 0000000..df38ad2 --- /dev/null +++ b/_modules/ensembl/tools/anno/transcriptomic_annotation/star.html @@ -0,0 +1,720 @@ + + + + + + + ensembl.tools.anno.transcriptomic_annotation.star — ensembl-anno 0.1 documentation + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.transcriptomic_annotation.star

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+The STAR (Spliced Transcripts Alignment to a Reference) alignment tool is widely used
+in genomics research for aligning RNA-seq data to a reference genome.
+Dobin A, Davis CA, Schlesinger F, et al. STAR: ultrafast universal RNA-seq aligner.
+Bioinformatics. 2013;29(1):15-21. doi:10.1093/bioinformatics/bts635
+"""
+
+__all__ = ["run_star", "subsample_transcriptomic_data"]
+import logging
+import logging.config
+import gzip
+import math
+import multiprocessing
+from pathlib import Path
+import random
+import re
+import shutil
+import subprocess
+from typing import List
+import argschema
+
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+    get_seq_region_length,
+)
+
+
+
+[docs] +def run_star( + genome_file: Path, + output_dir: Path, + short_read_fastq_dir: Path, + delete_pre_trim_fastq: bool = False, + trim_fastq: bool = False, + max_reads_per_sample: int = 0, + max_intron_length: int = 100000, + num_threads: int = 1, + star_bin: Path = Path("star"), + samtools_bin: Path = Path("samtools"), + trim_galore_bin: Path = Path("trim_galore"), +) -> None: + """ + Run STAR alignment on list of short read data. + + Args: + genome_file : Genome file path. + output_dir : Working directory path. + short_read_fastq_dir : Short read directory path. + delete_pre_trim_fastq : Delete the original fastq files after trimming. Defaults to False. + trim_fastq : Trim short read files using TrimGalore. Defaults to False. + max_reads_per_sample : Max number of reads per sample. Defaults to 0 (unlimited). + max_intron_length : The maximum intron size for alignments. Defaults to 100000. + num_threads : Number of available threads. + star_bin : Software path. + samtools_bin : Software path. + trim_galore_bin : Software path. + + """ + check_exe(star_bin) + # If trimming has been enabled then switch the path for + # short_read_fastq_dir from the original location to the trimmed fastq dir + if trim_fastq: + run_trimming(output_dir, short_read_fastq_dir, delete_pre_trim_fastq, num_threads, trim_galore_bin) + short_read_fastq_dir = output_dir / "trim_galore_output" + + # if not os.path.exists(subsample_script_path): + #subsample_script_path = "subsample_fastq.py" + + star_dir = create_dir(output_dir, "star_output") + + for output_file in [ + output_dir / "stringtie_output/annotation.gtf", + output_dir / "scallop_output/annotation.gtf", + ]: + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "transcript") # check a gtf + if transcript_count > 0: + logging.info("Transcriptomic alignment exists") + return + + star_index_file = star_dir / "SAindex" + fastq_file_list = [] + file_types = ("*.fastq", "*.fq", "*.fastq.gz", "*.fq.gz") + fastq_file_list = [ + path for file_type in file_types for path in Path(short_read_fastq_dir).rglob(file_type) + ] + if len(fastq_file_list) == 0: + raise IndexError(f"The list of fastq files is empty. Fastq dir:\n{short_read_fastq_dir}") + + + # for file_type in file_types: + # fastq_file_list.extend(glob.glob(os.path.join(short_read_fastq_dir, file_type))) + + # Get list of paired paths + fastq_file_list = _create_paired_paths(fastq_file_list) + # Subsamples in parallel if there's a value set + if max_reads_per_sample: + subsample_transcriptomic_data(fastq_file_list) + # Get the list of the new subsampled files + fastq_file_list = [ + path for file_type in file_types for path in Path(short_read_fastq_dir).rglob(file_type) + ] + # I don't think is needed + # fastq_file_list = check_for_fastq_subsamples(fastq_file_list) + + if not star_index_file.exists(): + logging.info("Did not find an index file for Star. Will create now") + seq_region_to_length = get_seq_region_length(genome_file, 0) + genome_size = sum(seq_region_to_length.values()) + # This calculates the base-2 logarithm of the genome_size. The logarithm of the genome size is + # a measure of how many bits are needed to represent the genome size in binary. + # + # The choice of 14 as the maximum value is likely based on empirical observations and optimization + # considerations. Too large of a seed length can lead to increased memory usage and potentially + # slower indexing, while a seed length that is too small might affect alignment accuracy. + index_bases = min(14, math.floor((math.log(genome_size, 2) / 2) - 1)) + try: + subprocess.run(#pylint:disable=subprocess-run-check + [ + str(star_bin), + "--runThreadN", + str(num_threads), + "--runMode", + "genomeGenerate", + "--outFileNamePrefix", + f"{star_dir}/", + "--genomeDir", + str(star_dir), + "--genomeSAindexNbases", + str(index_bases), + "--genomeFastaFiles", + str(genome_file), + ] + ) + except Exception as e: + logging.error("An error occurred while creating star index: %s", e) + + logging.info("Running Star on the files in the fastq dir") + for fastq_file in fastq_file_list: + # logger.info(fastq_file_path) + # fastq_file_name = os.path.basename(fastq_file_path) + star_tmp_dir = star_dir / "tmp" + if star_tmp_dir.exists(): + shutil.rmtree(star_tmp_dir) + sam_file = Path(f"{star_dir}/{fastq_file.name}.sam") + junctions_file = Path(f"{star_dir}/{fastq_file.name}.sj.tab") + sam_file_name = sam_file.name + sam_temp_file = Path(f"{star_dir}/{sam_file_name}.tmp") + bam_file = re.sub(".sam", ".bam", sam_file_name) + bam_sort_file = Path(f"{star_dir}/{bam_file}") + log_out_file = Path(f"{star_dir}/{fastq_file.name}.Log.final.out") + if log_out_file.exists() and bam_sort_file.exists() and bam_sort_file.stat().st_size != 0: + logging.info( + "Found an existing bam file for the fastq file, \ + presuming the file has been processed, will skip" + ) + continue + + logging.info("Processing %s", fastq_file) + star_command = [ + str(star_bin), + "--outFilterIntronMotifs", + "RemoveNoncanonicalUnannotated", + "--outSAMstrandField", + "intronMotif", + "--runThreadN", + str(num_threads), + "--twopassMode", + "Basic", + "--runMode", + "alignReads", + "--genomeDir", + str(star_dir), + "--readFilesIn", + str(fastq_file), + "--outFileNamePrefix", + f"{star_dir}/", + "--outTmpDir", + str(star_tmp_dir), + "--outSAMtype", + "SAM", + "--alignIntronMax", + str(max_intron_length), + ] + #'--outSJfilterIntronMaxVsReadN','5000','10000','25000','40000', + #'50000','50000','50000','50000','50000','100000'] + check_compression = re.search(r".gz$", fastq_file) + if check_compression: + star_command.append("--readFilesCommand") + star_command.append("gunzip") + star_command.append("-c") + subprocess.run(star_command)#pylint:disable=subprocess-run-check + shutil.move(Path(f"{star_dir}/Aligned.out.sam"), sam_file) + shutil.move(Path(f"{star_dir}/SJ.out.tab"), junctions_file) + logging.info("Converting samfile into sorted bam file. Bam file: %s", bam_file) + subprocess.run(#pylint:disable=subprocess-run-check + [ + str(samtools_bin), + "sort", + "-@", + str(num_threads), + "-T", + str(sam_temp_file), + "-o", + str(bam_sort_file), + str(sam_file), + ] + ) + shutil.move(star_dir / "Log.final.out", log_out_file) + sam_file.unlink() + logging.info("Completed running STAR")
+ + + +def _create_paired_paths(fastq_file_paths: List) -> List: + """ + Create list of paired transcriptomic fastq files + + Args: + fastq_file_paths (List): List of transcriptomic file paths. + + Returns: + List: List of paired transcriptomic files + """ + path_dict = {} + # final_list = [] + for fastq_file in fastq_file_paths: + paired_name = re.search(r"(.+)_\d+\.(fastq|fq)", fastq_file) + if not paired_name: + logging.exception( + "Could not find _1 or _2 at the end of the prefix \ + for file. Assuming file is not paired: %s", + fastq_file, + ) + # final_list.append([fastq_file]) + path_dict[fastq_file] = [fastq_file] + continue + run_accession = paired_name.group(1) + if run_accession in path_dict: + path_dict[run_accession].append(fastq_file) + else: + path_dict[run_accession] = [fastq_file] + # for pair in path_dict: + # final_list.append(path_dict[pair]) + logging.info([value for values_list in path_dict.values() for value in values_list]) + return [value for values_list in path_dict.values() for value in values_list] + +#pylint:disable=pointless-string-statement +""" +For an advanced and optimised subsampling we could use +https://github.com/lh3/seqtk +""" + + +def _subsample_paired_fastq_files( + fastq_files: List[Path], + output_files: List[Path] = "", + subsample_read_limit: int = 100000000, + num_threads: int = 2, + compressed: bool = False, +) -> None: + """ + Perform subsampling on two paired FastQ files in parallel using multiple threads. + + Args: + fastq_files : Path for paired fastq files. + output_files : Path for the output file. + subsample_read_limit : Subsample size, defaults to 100000000. + num_threads : Number of threads, defaults to 2. + compressed : file compressed, defaults to False. + """ + fastq_file_1, fastq_file_2 = fastq_files + if len(output_files) == 0: + output_files = [f"{fastq_file_1}.sub", f"{fastq_file_2}.sub"] + output_file_1, output_file_2 = output_files + if re.search(r"\.gz$", fastq_file_1): + compressed = True + num_lines = sum(1 for line in gzip.open(fastq_file_1))#pylint:disable=consider-using-with + else: + num_lines = sum(1 for line in open(fastq_file_1))#pylint:disable=consider-using-with + + range_limit = int(num_lines / 4) + if range_limit <= subsample_read_limit: + logging.info("Number of reads (%s is less than the max allowed read count (%s), \ + no need to subsample", str(range_limit),str(subsample_read_limit) + ) + return + + rand_list = random.sample(range(0, range_limit - 1), subsample_read_limit) + random_indices = {idx * 4: 1 for idx in rand_list} + logging.info("Processing paired files in parallel") + pool = multiprocessing.Pool(int(num_threads))#pylint:disable=consider-using-with + pool.apply_async( + _subsample_fastq_subset, + args=( + fastq_file_1, + output_file_1, + random_indices, + compressed, + ), + ) + pool.apply_async( + _subsample_fastq_subset, + args=( + fastq_file_2, + output_file_2, + random_indices, + compressed, + ), + ) + pool.close() + pool.join() + + +def _subsample_fastq_subset( + fastq_file: Path, output_file: Path, random_indices: dict, compressed: bool +) -> None: + """ + Selecting specific sets of four lines from an input FastQ file and writing them to an output file. + + Args: + fastq_file : Path for the fastq file. + output_file : Path for the output file. + random_indices : set of random indices. + compressed : the files is compressed + """ + line_index = 0 + + with gzip.open(fastq_file, "rt") if compressed else open(fastq_file) as file_in, open( + output_file, "w+" + ) as file_out: + lines = [file_in.readline() for _ in range(4)] + while lines[3]: # This ensures that the loop continues until the end of the input file. + if line_index in random_indices: + file_out.writelines(lines) + line_index += 4 + lines = [file_in.readline() for _ in range(4)] + + +
+[docs] +def subsample_transcriptomic_data(fastq_file_list: List[Path], num_threads: int = 2) -> None: + """ + Subsample paired fastq files. + + Args: + fastq_file_list : List of fastq file path to process. + num_threads : number of threads + """ + for fastq_files in fastq_file_list: + fastq_file_1, fastq_file_2 = fastq_files + # fastq_file_pair = "" + # if len(fastq_files) == 2: + # fastq_file_pair = fastq_files[1] + + if len(fastq_files) == 1: + fastq_file_1 = fastq_files[0] + if Path(f"{fastq_file_1}.sub").exists(): + logging.info( + "Found an existing .sub file on the fastq path, will use that instead. File:%s.sub", + fastq_file_1, + ) + else: + _subsample_paired_fastq_files(fastq_files, compressed=True, num_threads=num_threads) + + elif len(fastq_files) == 2: + fastq_file_1, fastq_file_2 = fastq_files + if Path(f"{fastq_file_1}.sub").exists() and Path(f"{fastq_file_2}.sub").exists(): + logging.info( + "Found an existing .sub files on the fastq path for both members of the pair, will use \ + those instead of subsampling again. Files: %s.sub,%s.sub", + fastq_file_1, + fastq_file_2, + ) + elif Path(f"{fastq_file_2}.sub").exists(): + _subsample_paired_fastq_files(fastq_files, compressed=True, num_threads=num_threads)
+ + + +def run_trimming( + output_dir: Path, + short_read_fastq_dir: Path, + delete_pre_trim_fastq: bool = False, + num_threads: int = 1, + trim_galore_bin="trim_galore", +) -> None: + """ + Trim list of short read fastq files. + Args: + output_dir : Working directory path. + short_read_fastq_dir : Short read directory path. + delete_pre_trim_fastq : Removing original fastq file post trimming. Defaults to False. + num_threads : Number of threads. + trim_galore_bin : Software path. + """ + check_exe(trim_galore_bin) + trim_dir = create_dir(output_dir, "trim_galore_output") + + fastq_file_list = [] + file_types = ("*.fastq", "*.fq", "*.fastq.gz", "*.fq.gz") + fastq_file_list = [ + path for file_type in file_types for path in Path(short_read_fastq_dir).rglob(file_type) + ] + fastq_file_list = _create_paired_paths(fastq_file_list) + + trim_galore_cmd = [ + str(trim_galore_bin), + "--illumina", + "--quality", + "20", + "--length", + "50", + "--output_dir", + str(trim_dir), + ] + + pool = multiprocessing.Pool(int(num_threads)) # pylint:disable=consider-using-with + for fastq_paired_files in fastq_file_list: + pool.apply_async( + multiprocess_trim_galore, + args=( + trim_galore_cmd, + fastq_paired_files, + trim_dir, + ), + ) + if delete_pre_trim_fastq: + for file_path in fastq_paired_files: + file_path.unlink() + pool.close() + pool.join() + + trimmed_fastq_list = trim_dir.glob("*.fq.gz") + + for trimmed_fastq_path in trimmed_fastq_list: + logging.info("Trimmed file path: %s", str(trimmed_fastq_path)) + sub_patterns = re.compile(r"|".join(("_val_1.fq", "_val_2.fq", "_trimmed.fq"))) + updated_file_path = sub_patterns.sub(".fq", trimmed_fastq_path.name) + updated_file_path = short_read_fastq_dir / updated_file_path + logging.info("Updated file path: %s", str(updated_file_path)) + trimmed_fastq_path.rename(updated_file_path) + + files_to_delete_list = [] + for file_type in file_types: + files_to_delete_list.extend(short_read_fastq_dir.glob(file_type)) + + for file_to_delete in files_to_delete_list: + file_to_delete.unlink() + + +def multiprocess_trim_galore(trim_galore_cmd: List, fastq_paired_files: List[Path]) -> None: + """ + Trim short paired or single short read fastq file. + Args: + trim_galore_cmd : Generic command. + fastq_paired_files : List of single or paired fastq files. + """ + + fastq_file = fastq_paired_files[0] + fastq_file_pair = None + + if len(fastq_paired_files) == 2: + fastq_file, fastq_file_pair = fastq_paired_files + trim_galore_cmd.append("--paired") + trim_galore_cmd.append(fastq_file) + trim_galore_cmd.append(fastq_file_pair) + elif len(fastq_paired_files) == 1: + trim_galore_cmd.append(fastq_paired_files) + + logging.info("Running Trim Galore with the following command: %s", {" ".join(trim_galore_cmd)}) + subprocess.run(trim_galore_cmd, check=True) + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run STAR software.""" + + genome_file = argschema.fields.InputFile(required=True, description="Genome file path") + output_dir = argschema.fields.OutputDir(required=True, description="Output directory path") + short_read_fastq_dir = argschema.fields.String( + required=True, + description="Short read directory path", + ) + delete_pre_trim_fastq = argschema.fields.Bool( + required=False, + default=False, + description="Delete the original fastq files after trimming", + ) + trim_fastq = argschema.fields.Bool( + required=False, + default=False, + description="Trim the short read files using Trim Galore", + ) + max_reads_per_sample = argschema.fields.Integer( + required=False, + default="0", + description="The maximum number of reads to use per sample.", + ) + max_intron_length = argschema.fields.Integer( + required=False, + default="100000", + description="The maximum intron size for alignments.", + ) + num_threads = argschema.fields.Integer(required=False, default=1, description="Number of threads") + star_bin = argschema.fields.String( + required=False, + default="star", + description="Star software path", + ) + samtools_bin = argschema.fields.String( + required=False, + default="samtools", + description="Samtools software path", + ) + trim_galore_bin = argschema.fields.String( + required=False, + default="trim_galore", + description="Trim Galore software path", + ) + + +def main() -> None: + """STAR's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "star.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_star( + mod.args["genome_file"], + mod.args["output_dir"], + mod.args["short_read_fastq_dir"], + mod.args["delete_pre_trim_fastq"], + mod.args["trim_fastq"], + mod.args["max_reads_per_sample"], + mod.args["max_intron_length"], + mod.args["num_threads"], + mod.args["star_bin"], + mod.args["samtools_bin"], + mod.args["trim_galore_bin"], + ) + + +# pylint:disable=pointless-string-statement +""" +def model_builder(work_dir): + + star_output_dir = os.path.join(work_dir, "star_output") + + all_junctions_file = os.path.join(star_output_dir, "all_junctions.sj") + sjf_out = open(all_junctions_file, "w+") + + for sj_tab_file in glob.glob(input_dir + "/*.sj.tab"): + sjf_in = open(sj_tab_file) + sjf_lines = sjf_in.readlines() + for line in sjf_lines: + elements = line.split("\t") + strand = "+" + + # my $slice_name = $eles[0]; + # my $start = $eles[1]; + # my $end = $eles[2]; + # my $strand = $eles[3]; + + # If the strand is undefined then skip, Augustus expects a strand + if elements[3] == "0": + continue + elif elements[3] == "2": + strand = "-" + + junction_length = int(elements[2]) - int(elements[1]) + 1 + if junction_length < 100: + continue + + if not elements[4] and elements[7] < 10: + continue + + # For the moment treat multimapping and single + # mapping things as a combined score + score = float(elements[6]) + float(elements[7]) + score = str(score) + output_line = [ + elements[0], + "RNASEQ", + "intron", + elements[1], + elements[2], + score, + strand, + ".", + ("src=W;mul=" + score + ";"), + ] + sjf_out.write("\t".join(output_line) + "\n") + + sjf_out.close() +""" +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/ensembl/tools/anno/transcriptomic_annotation/stringtie.html b/_modules/ensembl/tools/anno/transcriptomic_annotation/stringtie.html new file mode 100644 index 0000000..55cf6e6 --- /dev/null +++ b/_modules/ensembl/tools/anno/transcriptomic_annotation/stringtie.html @@ -0,0 +1,256 @@ + + + + + + + ensembl.tools.anno.transcriptomic_annotation.stringtie — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +

Source code for ensembl.tools.anno.transcriptomic_annotation.stringtie

+# See the NOTICE file distributed with this work for additional information
+# regarding copyright ownership.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+StringTie is a fast and highly efficient assembler of RNA-Seq alignments into potential transcripts.
+It uses a novel network flow algorithm as well as an optional de novo assembly step to assemble and
+quantitate full-length transcripts representing multiple splice variants for each gene locus.
+Pertea M, Pertea GM, Antonescu CM, Chang TC, Mendell JT & Salzberg SL. StringTie enables improved 
+reconstruction of a transcriptome from RNA-seq reads Nature Biotechnology 2015, doi:10.1038/nbt.3122
+"""
+
+__all__ = ["run_stringtie"]
+import logging
+import logging.config
+from pathlib import Path
+import re
+import subprocess
+import argschema
+
+from ensembl.tools.anno.utils._utils import (
+    check_exe,
+    create_dir,
+    check_gtf_content,
+)
+
+
+
+[docs] +def run_stringtie( + output_dir: Path, + stringtie_bin: Path = Path("stringtie"), + num_threads: int = 1, +) -> None: + """ + StringTie assembler of short read data. + Args: + output_dir : Working directory path. + stringtie_bin : Software path. + num_threads : Number of available threads. + """ + check_exe(stringtie_bin) + stringtie_dir = create_dir(output_dir, "stringtie_output") + logging.info("Skip analysis if the gtf file already exists") + output_file = stringtie_dir / "annotation.gtf" + if output_file.exists(): + transcript_count = check_gtf_content(output_file, "transcript") + if transcript_count > 0: + logging.info("Stringtie gtf file exists, skipping analysis") + return + + stringtie_merge_input_file = stringtie_dir / "stringtie_assemblies.txt" + stringtie_merge_output_file = stringtie_dir / "annotation.gtf" + star_dir = output_dir / "star_output" + + if star_dir.exists() and len(list(star_dir.glob("*.bam"))) != 0: + for sorted_bam_file in star_dir.glob("*.bam"): + transcript_file_name = re.sub(".bam", ".stringtie.gtf", sorted_bam_file.name) + transcript_file = stringtie_dir / transcript_file_name + if transcript_file.exists(): + logging.info( + "Found an existing stringtie gtf file, will not overwrite. \ + File found: %s", + transcript_file, + ) + else: + logging.info("Running Stringtie on: %s", sorted_bam_file.name) + try: + subprocess.check_output( # pylint:disable=subprocess-run-check + [ + stringtie_bin, + sorted_bam_file, + "-o", + transcript_file, + "-p", + str(num_threads), + "-t", # disable trimming of predicted transcripts based on coverage + "-a", # minimum anchor length for junctions + "15", + ] + ) + except subprocess.CalledProcessError as e: + logging.error("Error running Stringtie command: %s", e) + logging.error("Return code: %s", str(e.returncode)) + logging.error("Output and error messages:%s\n", e.output) + else: + raise IndexError(f"The list of sorted bam files is empty, Star output dir: {star_dir}") + + logging.info("Creating Stringtie merge input file: %s", stringtie_merge_input_file) + with open(stringtie_merge_input_file, "w+", encoding="utf8") as gtf_list_out: + for gtf_file in stringtie_dir.glob("*.stringtie.gtf"): + transcript_count = check_gtf_content(gtf_file, "transcript") + if transcript_count > 0: + gtf_list_out.write(f"{gtf_file}\n") + else: + logging.warning("Warning, skipping file with no transcripts. Path:%s", gtf_file) + logging.info("Merging Stringtie results.") + try: + subprocess.run( # pylint:disable=subprocess-run-check + [ + stringtie_bin, + "--merge", + "-o", + stringtie_merge_output_file, + stringtie_merge_input_file, + ] + ) + except subprocess.CalledProcessError as e: + logging.error("Error running Stringtie merging command: %s", e)
+ + + +class InputSchema(argschema.ArgSchema): + """Input arguments expected to run StringTie software.""" + + output_dir = argschema.fields.OutputDir(required=True, description="Output directory path") + stringtie_bin = argschema.fields.String( + required=False, + default="stringtie", + description="StringTie software path", + ) + num_threads = argschema.fields.Integer(required=False, default=1, description="Number of threads") + + +def main() -> None: + """StringTie's entry-point.""" + mod = argschema.ArgSchemaParser(schema_type=InputSchema) + log_file_path = create_dir(mod.args["output_dir"], "log") / "stringtie.log" + loginipath = Path(__file__).parents[6] / "conf" / "logging.conf" + logging.config.fileConfig( + loginipath, + defaults={"logfilename": str(log_file_path)}, + disable_existing_loggers=False, + ) + run_stringtie( + mod.args["output_dir"], + mod.args["stringtie_bin"], + mod.args["num_threads"], + ) +
+ +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/_modules/index.html b/_modules/index.html new file mode 100644 index 0000000..2ed8aa9 --- /dev/null +++ b/_modules/index.html @@ -0,0 +1,117 @@ + + + + + + + Overview: module code — ensembl-anno 0.1 documentation + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/_sources/cmsearch.rst.txt b/_sources/cmsearch.rst.txt new file mode 100644 index 0000000..3faba6f --- /dev/null +++ b/_sources/cmsearch.rst.txt @@ -0,0 +1,8 @@ +Cmsearch Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.snc_rna_annotation.cmsearch + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/cpg.rst.txt b/_sources/cpg.rst.txt new file mode 100644 index 0000000..8603218 --- /dev/null +++ b/_sources/cpg.rst.txt @@ -0,0 +1,8 @@ +CpG Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.simple_feature_annotation.cpg + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/dust.rst.txt b/_sources/dust.rst.txt new file mode 100644 index 0000000..2bc64ca --- /dev/null +++ b/_sources/dust.rst.txt @@ -0,0 +1,8 @@ +DustMasker Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.repeat_annotation.dust + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/eponine.rst.txt b/_sources/eponine.rst.txt new file mode 100644 index 0000000..e460382 --- /dev/null +++ b/_sources/eponine.rst.txt @@ -0,0 +1,8 @@ +Eponine Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.simple_feature_annotation.eponine + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/genblast.rst.txt b/_sources/genblast.rst.txt new file mode 100644 index 0000000..401f411 --- /dev/null +++ b/_sources/genblast.rst.txt @@ -0,0 +1,8 @@ +Genblast Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.protein_annotation.genblast + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/index.rst.txt b/_sources/index.rst.txt new file mode 100644 index 0000000..98a7404 --- /dev/null +++ b/_sources/index.rst.txt @@ -0,0 +1,58 @@ +.. See the NOTICE file distributed with this work for additional information + regarding copyright ownership. + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. + +.. ensembl-anno documentation master file, created by + sphinx-quickstart on Fri Sep 1 12:25:36 2023. + You can adapt this file completely to your liking, but it should at least + contain the root `toctree` directive. + +======================================== +Ensembl-anno +=========================================== + +Anno tool kit + + +Contents +-------- +Check out :ref:`installation ` section for further information on how +to install the project. + +.. toctree:: + :maxdepth: 2 + :caption: Index + + install + license + + _modules/cpg + _modules/dust + _modules/eponine + _modules/genblast + _modules/minimap + _modules/red + _modules/repeatmasker + _modules/scallop + _modules/star + _modules/stringtie + _modules/trf + _modules/trnascan + +Indices and tables +================== + +* :ref:`genindex` +* :ref:`modindex` +* :ref:`search` \ No newline at end of file diff --git a/_sources/install.rst.txt b/_sources/install.rst.txt new file mode 100644 index 0000000..997e6c0 --- /dev/null +++ b/_sources/install.rst.txt @@ -0,0 +1,54 @@ +.. See the NOTICE file distributed with this work for additional information + regarding copyright ownership. + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. + +API Setup and installation +=========================== + +Requirements +-------------- + +.. _install: + +An Ensembl API checkout including: + +- ensembl-production `ensembl-production `_. +- ensembl-analysis `ensembl-analysis `_. (on dev/hive_master branch) +- ensembl-taxonomy `ensembl-taxonomy `_. +- ensembl-orm `ensembl-orm `_. + +Software +^^^^^^^^ + +#. Python 3.8+ +#. Bioperl 1.6.9+ + +Python Modules +^^^^^^^^^^^^^^ +#. argschema + + + +Installation +------------ +Directly from GitHub: + +.. code-block:: none + :linenos: + + git clone https://github.com/Ensembl/ensembl-analysis -b experimental/gbiab + git clone https://github.com/Ensembl/ensembl-production + git clone https://github.com/Ensembl/ensembl-hive + git clone https://github.com/Ensembl/ensembl-taxonomy + git clone https://github.com/Ensembl/ensembl-orm \ No newline at end of file diff --git a/_sources/license.rst.txt b/_sources/license.rst.txt new file mode 100644 index 0000000..9e9b2fe --- /dev/null +++ b/_sources/license.rst.txt @@ -0,0 +1,203 @@ +License +------- + + Apache License + Version 2.0, January 2004 + http://www.apache.org/licenses/ + + + 1. Definitions. + + "License" shall mean the terms and conditions for use, reproduction, + and distribution as defined by Sections 1 through 9 of this document. + + "Licensor" shall mean the copyright owner or entity authorized by + the copyright owner that is granting the License. + + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. + + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). + + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. Grant of Patent License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. + + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "{}" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. + + Copyright [yyyy] [name of copyright owner] + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. \ No newline at end of file diff --git a/_sources/minimap.rst.txt b/_sources/minimap.rst.txt new file mode 100644 index 0000000..bf3a45c --- /dev/null +++ b/_sources/minimap.rst.txt @@ -0,0 +1,8 @@ +Minimap2 Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.transcriptomic_annotation.minimap + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/red.rst.txt b/_sources/red.rst.txt new file mode 100644 index 0000000..26743cd --- /dev/null +++ b/_sources/red.rst.txt @@ -0,0 +1,8 @@ +Red Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.repeat_annotation.red + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/repeatmasker.rst.txt b/_sources/repeatmasker.rst.txt new file mode 100644 index 0000000..8598c0e --- /dev/null +++ b/_sources/repeatmasker.rst.txt @@ -0,0 +1,8 @@ +Repeatmasker Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.repeat_annotation.repeatmasker + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/scallop.rst.txt b/_sources/scallop.rst.txt new file mode 100644 index 0000000..744055b --- /dev/null +++ b/_sources/scallop.rst.txt @@ -0,0 +1,8 @@ +Scallop Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.transcriptomic_annotation.scallop + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/star.rst.txt b/_sources/star.rst.txt new file mode 100644 index 0000000..d83c66b --- /dev/null +++ b/_sources/star.rst.txt @@ -0,0 +1,8 @@ +STAR Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.transcriptomic_annotation.star + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/stringtie.rst.txt b/_sources/stringtie.rst.txt new file mode 100644 index 0000000..878de41 --- /dev/null +++ b/_sources/stringtie.rst.txt @@ -0,0 +1,8 @@ +Stringtie Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.transcriptomic_annotation.stringtie + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/trf.rst.txt b/_sources/trf.rst.txt new file mode 100644 index 0000000..9268f3c --- /dev/null +++ b/_sources/trf.rst.txt @@ -0,0 +1,8 @@ +TRF Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.repeat_annotation.trf + :members: + :undoc-members: + :show-inheritance: + diff --git a/_sources/trnascan.rst.txt b/_sources/trnascan.rst.txt new file mode 100644 index 0000000..d9da9d4 --- /dev/null +++ b/_sources/trnascan.rst.txt @@ -0,0 +1,8 @@ +tRNAscan-SE Module Documentation +============================== + +.. automodule:: ensembl.tools.anno.snc_rna_annotation.trnascan + :members: + :undoc-members: + :show-inheritance: + diff --git a/_static/agogo.css b/_static/agogo.css new file mode 100644 index 0000000..11b0b92 --- /dev/null +++ b/_static/agogo.css @@ -0,0 +1,555 @@ +/* + * agogo.css_t + * ~~~~~~~~~~~ + * + * Sphinx stylesheet -- agogo theme. + * + * :copyright: Copyright 2007-2023 by the Sphinx team, see AUTHORS. + * :license: BSD, see LICENSE for details. + * + */ + +* { + margin: 0px; + padding: 0px; +} + +body { + font-family: Garamond, Arial, serif; + line-height: 1.4em; + color: black; + background-color: #009999; + + /* fix for background colors breaking at horizontal + scrolling on smaller devices */ + min-width: fit-content; +} + + +/* Page layout */ + +div.header, div.content, div.footer { + width: 70em; + margin-left: auto; + margin-right: auto; +} + +div.header-wrapper { + background: #009999; + border-bottom: 3px solid #2e3436; +} + + +/* Default body styles */ +a { + color: green; +} + +a:visited { + color: #551a8b; +} + +div.bodywrapper a, div.footer a { + text-decoration: underline; +} + +.clearer { + clear: both; +} + +.left { + float: left; +} + +.right { + float: right; +} + +.line-block { + display: block; + margin-top: 1em; + margin-bottom: 1em; +} + +.line-block .line-block { + margin-top: 0; + margin-bottom: 0; + margin-left: 1.5em; +} + +h1, h2, h3, h4 { + font-family: Arial, Helvetica, serif; + font-weight: normal; + color: #3465a4; + margin-bottom: .8em; +} + +h1 { + color: #204a87; +} + +h2 { + padding-bottom: .5em; + border-bottom: 1px solid #3465a4; +} + +a.headerlink { + visibility: hidden; + color: #dddddd; + padding-left: .3em; +} + +h1:hover > a.headerlink, +h2:hover > a.headerlink, +h3:hover > a.headerlink, +h4:hover > a.headerlink, +h5:hover > a.headerlink, +h6:hover > a.headerlink, +dt:hover > a.headerlink, +caption:hover > a.headerlink, +p.caption:hover > a.headerlink, +div.code-block-caption:hover > a.headerlink { + visibility: visible; +} + +img { + border: 0; +} + +div.admonition { + margin-top: 10px; + margin-bottom: 10px; + padding: 2px 7px 1px 7px; + border-left: 0.2em solid black; +} + +p.admonition-title { + margin: 0px 10px 5px 0px; + font-weight: bold; +} + +dt:target, .highlighted { + background-color: #fbe54e; +} + +/* Header */ + +div.header { + padding: 1em; +} + +div.header .headertitle { + font-family: Arial, Helvetica, serif; + font-weight: normal; + font-size: 180%; + letter-spacing: .08em; + margin-bottom: .8em; +} + +div.header .headertitle a { + color: white; +} + +div.header div.rel { + margin-top: 1em; +} + +div.header div.rel a { + color: #33d6ff; + letter-spacing: .1em; + text-transform: uppercase; +} + +p.logo { + float: right; +} + +img.logo { + border: 0; +} + + +/* Content */ +div.content-wrapper { + background-color: white; + padding: 1em; +} + +div.document { + width: 50em; + float: left; +} + +div.body { + padding-right: 2em; + text-align: justify; +} + +div.document h1 { + line-height: 120%; +} + +div.document ul { + margin: 1.5em; + list-style-type: square; +} + +div.document dd { + margin-left: 1.2em; + margin-top: .4em; + margin-bottom: 1em; +} + +div.document .section { + margin-top: 1.7em; +} +div.document .section:first-child { + margin-top: 0px; +} + +div.document div.highlight { + padding: 3px; + border-top: 2px solid #dddddd; + border-bottom: 2px solid #dddddd; + margin-top: .8em; + margin-bottom: .8em; +} + +div.document div.literal-block-wrapper { + margin-top: .8em; + margin-bottom: .8em; +} + +div.document div.literal-block-wrapper div.highlight { + margin: 0; +} + +div.document div.code-block-caption span.caption-number { + padding: 0.1em 0.3em; + font-style: italic; +} + +div.document div.code-block-caption span.caption-text { +} + +div.document h2 { + margin-top: .7em; +} + +div.document p { + margin-bottom: .5em; +} + +div.document li.toctree-l1 { + margin-bottom: 1em; +} + +div.document .descname { + font-weight: bold; +} + +div.document .sig-paren { + font-size: larger; +} + +div.document .docutils.literal { + background-color: #eeeeec; + padding: 1px; +} + +div.document .docutils.xref.literal { + background-color: transparent; + padding: 0px; +} + +div.document blockquote { + margin: 1em; +} + +div.document ol { + margin: 1.5em; +} + + +/* Sidebar */ + +div.sidebar, +aside.sidebar { + width: 20em; + float: right; + font-size: .9em; +} + +div.sidebar a, aside.sidebar a, div.header a { + text-decoration: none; +} + +div.sidebar a:hover, aside.sidebar a:hover, div.header a:hover { + text-decoration: underline; +} + +div.sidebar h3, +aside.sidebar h3 { + color: #2e3436; + text-transform: uppercase; + font-size: 130%; + letter-spacing: .1em; +} + +div.sidebar ul, +aside.sidebar ul { + list-style-type: none; +} + +div.sidebar li.toctree-l1 a, +aside.sidebar li.toctree-l1 a { + display: block; + padding: 1px; + border: 1px solid #dddddd; + background-color: #eeeeec; + margin-bottom: .4em; + padding-left: 3px; + color: #2e3436; +} + +div.sidebar li.toctree-l2 a, +aside.sidebar li.toctree-l2 a { + background-color: transparent; + border: none; + margin-left: 1em; + border-bottom: 1px solid #dddddd; +} + +div.sidebar li.toctree-l3 a, +aside.sidebar li.toctree-l3 a { + background-color: transparent; + border: none; + margin-left: 2em; + border-bottom: 1px solid #dddddd; +} + +div.sidebar li.toctree-l2:last-child a, +aside.sidebar li.toctree-l2:last-child a { + border-bottom: none; +} + +div.sidebar li.toctree-l1.current a, +aside.sidebar li.toctree-l1.current a { + border-right: 5px solid #33d6ff; +} + +div.sidebar li.toctree-l1.current li.toctree-l2 a, +aside.sidebar li.toctree-l1.current li.toctree-l2 a { + border-right: none; +} + +div.sidebar input[type="text"], +aside.sidebar input[type="text"] { + width: 170px; +} + +div.sidebar input[type="submit"], +aside.sidebar input[type="submit"] { + width: 30px; +} + + +/* Footer */ + +div.footer-wrapper { + background: #e6fff9; + border-top: 4px solid #babdb6; + padding-top: 10px; + padding-bottom: 10px; + min-height: 80px; +} + +div.footer, div.footer a { + color: #888a85; +} + +div.footer .right { + text-align: right; +} + +div.footer .left { + text-transform: uppercase; +} + + +/* Styles copied from basic theme */ + +img.align-left, figure.align-left, .figure.align-left, object.align-left { + clear: left; + float: left; + margin-right: 1em; +} + +img.align-right, figure.align-right, .figure.align-right, object.align-right { + clear: right; + float: right; + margin-left: 1em; +} + +img.align-center, figure.align-center, .figure.align-center, object.align-center { + display: block; + margin-left: auto; + margin-right: auto; +} + +img.align-default, figure.align-default, .figure.align-default { + display: block; + margin-left: auto; + margin-right: auto; +} + +.align-left { + text-align: left; +} + +.align-center { + text-align: center; +} + +.align-right { + text-align: right; +} + +table caption span.caption-number { + font-style: italic; +} + +table caption span.caption-text { +} + +div.figure p.caption span.caption-number, +figcaption span.caption-number { + font-style: italic; +} + +div.figure p.caption span.caption-text, +figcaption span.caption-text { +} + +/* -- search page ----------------------------------------------------------- */ + +ul.search { + margin: 10px 0 0 20px; + padding: 0; +} + +ul.search li { + padding: 5px 0 5px 20px; + background-image: url(file.png); + background-repeat: no-repeat; + background-position: 0 7px; +} + +ul.search li a { + font-weight: bold; +} + +ul.search li div.context { + color: #888; + margin: 2px 0 0 30px; + text-align: left; +} + +ul.keywordmatches li.goodmatch a { + font-weight: bold; +} + +/* -- index page ------------------------------------------------------------ */ + +table.contentstable { + width: 90%; +} + +table.contentstable p.biglink { + line-height: 150%; +} + +a.biglink { + font-size: 1.3em; +} + +span.linkdescr { + font-style: italic; + padding-top: 5px; + font-size: 90%; +} + +/* -- general index --------------------------------------------------------- */ + +table.indextable td { + text-align: left; + vertical-align: top; +} + +table.indextable ul { + margin-top: 0; + margin-bottom: 0; + list-style-type: none; +} + +table.indextable > tbody > tr > td > ul { + padding-left: 0em; +} + +table.indextable tr.pcap { + height: 10px; +} + +table.indextable tr.cap { + margin-top: 10px; + background-color: #f2f2f2; +} + +img.toggler { + margin-right: 3px; + margin-top: 3px; + cursor: pointer; +} + +/* -- domain module index --------------------------------------------------- */ + +table.modindextable td { + padding: 2px; + border-collapse: collapse; +} + +/* -- viewcode extension ---------------------------------------------------- */ + +.viewcode-link { + float: right; +} + +.viewcode-back { + float: right; + font-family:: Garamond, Arial, serif; +} + +div.viewcode-block:target { + margin: -1px -3px; + padding: 0 3px; + background-color: #f4debf; + border-top: 1px solid #ac9; + border-bottom: 1px solid #ac9; +} + +div.code-block-caption { + background-color: #ddd; + color: #333; + padding: 2px 5px; + font-size: small; +} + +/* -- math display ---------------------------------------------------------- */ + +div.body div.math p { + text-align: center; +} + +span.eqno { + float: right; +} \ No newline at end of file diff --git a/_static/basic.css b/_static/basic.css new file mode 100644 index 0000000..a917981 --- /dev/null +++ b/_static/basic.css @@ -0,0 +1,925 @@ +/* + * basic.css + * ~~~~~~~~~ + * + * Sphinx stylesheet -- basic theme. + * + * :copyright: Copyright 2007-2023 by the Sphinx team, see AUTHORS. + * :license: BSD, see LICENSE for details. + * + */ + +/* -- main layout ----------------------------------------------------------- */ + +div.clearer { + clear: both; +} + +div.section::after { + display: block; + content: ''; + clear: left; +} + +/* -- relbar ---------------------------------------------------------------- */ + +div.related { + width: 100%; + font-size: 90%; +} + +div.related h3 { + display: none; +} + +div.related ul { + margin: 0; + padding: 0 0 0 10px; + list-style: none; +} + +div.related li { + display: inline; +} + +div.related li.right { + float: right; + margin-right: 5px; +} + +/* -- sidebar --------------------------------------------------------------- */ + +div.sphinxsidebarwrapper { + padding: 10px 5px 0 10px; +} + +div.sphinxsidebar { + float: left; + width: 20em; + margin-left: -100%; + font-size: 90%; + word-wrap: break-word; + overflow-wrap : break-word; +} + +div.sphinxsidebar ul { + list-style: none; +} + +div.sphinxsidebar ul ul, +div.sphinxsidebar ul.want-points { + margin-left: 20px; + list-style: square; +} + +div.sphinxsidebar ul ul { + margin-top: 0; + margin-bottom: 0; +} + +div.sphinxsidebar form { + margin-top: 10px; +} + +div.sphinxsidebar input { + border: 1px solid #98dbcc; + font-family: sans-serif; + font-size: 1em; +} + +div.sphinxsidebar #searchbox form.search { + overflow: hidden; +} + +div.sphinxsidebar #searchbox input[type="text"] { + float: left; + width: 80%; + padding: 0.25em; + box-sizing: border-box; +} + +div.sphinxsidebar #searchbox input[type="submit"] { + float: left; + width: 20%; + border-left: none; + padding: 0.25em; + box-sizing: border-box; +} + + +img { + border: 0; + max-width: 100%; +} + +/* -- search page ----------------------------------------------------------- */ + +ul.search { + margin: 10px 0 0 20px; + padding: 0; +} + +ul.search li { + padding: 5px 0 5px 20px; + background-image: url(file.png); + background-repeat: no-repeat; + background-position: 0 7px; +} + +ul.search li a { + font-weight: bold; +} + +ul.search li p.context { + color: #888; + margin: 2px 0 0 30px; + text-align: left; +} + +ul.keywordmatches li.goodmatch a { + font-weight: bold; +} + +/* -- index page ------------------------------------------------------------ */ + +table.contentstable { + width: 90%; + margin-left: auto; + margin-right: auto; +} + +table.contentstable p.biglink { + line-height: 150%; +} + +a.biglink { + font-size: 1.3em; +} + +span.linkdescr { + font-style: italic; + padding-top: 5px; + font-size: 90%; +} + +/* -- general index --------------------------------------------------------- */ + +table.indextable { + width: 100%; +} + +table.indextable td { + text-align: left; + vertical-align: top; +} + +table.indextable ul { + margin-top: 0; + margin-bottom: 0; + list-style-type: none; +} + +table.indextable > tbody > tr > td > ul { + padding-left: 0em; +} + +table.indextable tr.pcap { + height: 10px; +} + +table.indextable tr.cap { + margin-top: 10px; + background-color: #f2f2f2; +} + +img.toggler { + margin-right: 3px; + margin-top: 3px; + cursor: pointer; +} + +div.modindex-jumpbox { + border-top: 1px solid #ddd; + border-bottom: 1px solid #ddd; + margin: 1em 0 1em 0; + padding: 0.4em; +} + +div.genindex-jumpbox { + border-top: 1px solid #ddd; + border-bottom: 1px solid #ddd; + margin: 1em 0 1em 0; + padding: 0.4em; +} + +/* -- domain module index --------------------------------------------------- */ + +table.modindextable td { + padding: 2px; + border-collapse: collapse; +} + +/* -- general body styles --------------------------------------------------- */ + +div.body { + min-width: 360px; + max-width: 800px; +} + +div.body p, div.body dd, div.body li, div.body blockquote { + -moz-hyphens: auto; + -ms-hyphens: auto; + -webkit-hyphens: auto; + hyphens: auto; +} + +a.headerlink { + visibility: hidden; +} + +a:visited { + color: #551A8B; +} + +h1:hover > a.headerlink, +h2:hover > a.headerlink, +h3:hover > a.headerlink, +h4:hover > a.headerlink, +h5:hover > a.headerlink, +h6:hover > a.headerlink, +dt:hover > a.headerlink, +caption:hover > a.headerlink, +p.caption:hover > a.headerlink, +div.code-block-caption:hover > a.headerlink { + visibility: visible; +} + +div.body p.caption { + text-align: inherit; +} + +div.body td { + text-align: left; +} + +.first { + margin-top: 0 !important; +} + +p.rubric { + margin-top: 30px; + font-weight: bold; +} + +img.align-left, figure.align-left, .figure.align-left, object.align-left { + clear: left; + float: left; + margin-right: 1em; +} + +img.align-right, figure.align-right, .figure.align-right, object.align-right { + clear: right; + float: right; + margin-left: 1em; +} + +img.align-center, figure.align-center, .figure.align-center, object.align-center { + display: block; + margin-left: auto; + margin-right: auto; +} + +img.align-default, figure.align-default, .figure.align-default { + display: block; + margin-left: auto; + margin-right: auto; +} + +.align-left { + text-align: left; +} + +.align-center { + text-align: center; +} + +.align-default { + text-align: center; +} + +.align-right { + text-align: right; +} + +/* -- sidebars -------------------------------------------------------------- */ + +div.sidebar, +aside.sidebar { + margin: 0 0 0.5em 1em; + border: 1px solid #ddb; + padding: 7px; + background-color: #ffe; + width: 40%; + float: right; + clear: right; + overflow-x: auto; +} + +p.sidebar-title { + font-weight: bold; +} + +nav.contents, +aside.topic, +div.admonition, div.topic, blockquote { + clear: left; +} + +/* -- topics ---------------------------------------------------------------- */ + +nav.contents, +aside.topic, +div.topic { + border: 1px solid #ccc; + padding: 7px; + margin: 10px 0 10px 0; +} + +p.topic-title { + font-size: 1.1em; + font-weight: bold; + margin-top: 10px; +} + +/* -- admonitions ----------------------------------------------------------- */ + +div.admonition { + margin-top: 10px; + margin-bottom: 10px; + padding: 7px; +} + +div.admonition dt { + font-weight: bold; +} + +p.admonition-title { + margin: 0px 10px 5px 0px; + font-weight: bold; +} + +div.body p.centered { + text-align: center; + margin-top: 25px; +} + +/* -- content of sidebars/topics/admonitions -------------------------------- */ + +div.sidebar > :last-child, +aside.sidebar > :last-child, +nav.contents > :last-child, +aside.topic > :last-child, +div.topic > :last-child, +div.admonition > :last-child { + margin-bottom: 0; +} + +div.sidebar::after, +aside.sidebar::after, +nav.contents::after, +aside.topic::after, +div.topic::after, +div.admonition::after, +blockquote::after { + display: block; + content: ''; + clear: both; +} + +/* -- tables ---------------------------------------------------------------- */ + +table.docutils { + margin-top: 10px; + margin-bottom: 10px; + border: 0; + border-collapse: collapse; +} + +table.align-center { + margin-left: auto; + margin-right: auto; +} + +table.align-default { + margin-left: auto; + margin-right: auto; +} + +table caption span.caption-number { + font-style: italic; +} + +table caption span.caption-text { +} + +table.docutils td, table.docutils th { + padding: 1px 8px 1px 5px; + border-top: 0; + border-left: 0; + border-right: 0; + border-bottom: 1px solid #aaa; +} + +th { + text-align: left; + padding-right: 5px; +} + +table.citation { + border-left: solid 1px gray; + margin-left: 1px; +} + +table.citation td { + border-bottom: none; +} + +th > :first-child, +td > :first-child { + margin-top: 0px; +} + +th > :last-child, +td > :last-child { + margin-bottom: 0px; +} + +/* -- figures --------------------------------------------------------------- */ + +div.figure, figure { + margin: 0.5em; + padding: 0.5em; +} + +div.figure p.caption, figcaption { + padding: 0.3em; +} + +div.figure p.caption span.caption-number, +figcaption span.caption-number { + font-style: italic; +} + +div.figure p.caption span.caption-text, +figcaption span.caption-text { +} + +/* -- field list styles ----------------------------------------------------- */ + +table.field-list td, table.field-list th { + border: 0 !important; +} + +.field-list ul { + margin: 0; + padding-left: 1em; +} + +.field-list p { + margin: 0; +} + +.field-name { + -moz-hyphens: manual; + -ms-hyphens: manual; + -webkit-hyphens: manual; + hyphens: manual; +} + +/* -- hlist styles ---------------------------------------------------------- */ + +table.hlist { + margin: 1em 0; +} + +table.hlist td { + vertical-align: top; +} + +/* -- object description styles --------------------------------------------- */ + +.sig { + font-family: 'Consolas', 'Menlo', 'DejaVu Sans Mono', 'Bitstream Vera Sans Mono', monospace; +} + +.sig-name, code.descname { + background-color: transparent; + font-weight: bold; +} + +.sig-name { + font-size: 1.1em; +} + +code.descname { + font-size: 1.2em; +} + +.sig-prename, code.descclassname { + background-color: transparent; +} + +.optional { + font-size: 1.3em; +} + +.sig-paren { + font-size: larger; +} + +.sig-param.n { + font-style: italic; +} + +/* C++ specific styling */ + +.sig-inline.c-texpr, +.sig-inline.cpp-texpr { + font-family: unset; +} + +.sig.c .k, .sig.c .kt, +.sig.cpp .k, .sig.cpp .kt { + color: #0033B3; +} + +.sig.c .m, +.sig.cpp .m { + color: #1750EB; +} + +.sig.c .s, .sig.c .sc, +.sig.cpp .s, .sig.cpp .sc { + color: #067D17; +} + + +/* -- other body styles ----------------------------------------------------- */ + +ol.arabic { + list-style: decimal; +} + +ol.loweralpha { + list-style: lower-alpha; +} + +ol.upperalpha { + list-style: upper-alpha; +} + +ol.lowerroman { + list-style: lower-roman; +} + +ol.upperroman { + list-style: upper-roman; +} + +:not(li) > ol > li:first-child > :first-child, +:not(li) > ul > li:first-child > :first-child { + margin-top: 0px; +} + +:not(li) > ol > li:last-child > :last-child, +:not(li) > ul > li:last-child > :last-child { + margin-bottom: 0px; +} + +ol.simple ol p, +ol.simple ul p, +ul.simple ol p, +ul.simple ul p { + margin-top: 0; +} + +ol.simple > li:not(:first-child) > p, +ul.simple > li:not(:first-child) > p { + margin-top: 0; +} + +ol.simple p, +ul.simple p { + margin-bottom: 0; +} + +aside.footnote > span, +div.citation > span { + float: left; +} +aside.footnote > span:last-of-type, +div.citation > span:last-of-type { + padding-right: 0.5em; +} +aside.footnote > p { + margin-left: 2em; +} +div.citation > p { + margin-left: 4em; +} +aside.footnote > p:last-of-type, +div.citation > p:last-of-type { + margin-bottom: 0em; +} +aside.footnote > p:last-of-type:after, +div.citation > p:last-of-type:after { + content: ""; + clear: both; +} + +dl.field-list { + display: grid; + grid-template-columns: fit-content(30%) auto; +} + +dl.field-list > dt { + font-weight: bold; + word-break: break-word; + padding-left: 0.5em; + padding-right: 5px; +} + +dl.field-list > dd { + padding-left: 0.5em; + margin-top: 0em; + margin-left: 0em; + margin-bottom: 0em; +} + +dl { + margin-bottom: 15px; +} + +dd > :first-child { + margin-top: 0px; +} + +dd ul, dd table { + margin-bottom: 10px; +} + +dd { + margin-top: 3px; + margin-bottom: 10px; + margin-left: 30px; +} + +.sig dd { + margin-top: 0px; + margin-bottom: 0px; +} + +.sig dl { + margin-top: 0px; + margin-bottom: 0px; +} + +dl > dd:last-child, +dl > dd:last-child > :last-child { + margin-bottom: 0; +} + +dt:target, span.highlighted { + background-color: #fbe54e; +} + +rect.highlighted { + fill: #fbe54e; +} + +dl.glossary dt { + font-weight: bold; + font-size: 1.1em; +} + +.versionmodified { + font-style: italic; +} + +.system-message { + background-color: #fda; + padding: 5px; + border: 3px solid red; +} + +.footnote:target { + background-color: #ffa; +} + +.line-block { + display: block; + margin-top: 1em; + margin-bottom: 1em; +} + +.line-block .line-block { + margin-top: 0; + margin-bottom: 0; + margin-left: 1.5em; +} + +.guilabel, .menuselection { + font-family: sans-serif; +} + +.accelerator { + text-decoration: underline; +} + +.classifier { + font-style: oblique; +} + +.classifier:before { + font-style: normal; + margin: 0 0.5em; + content: ":"; + display: inline-block; +} + +abbr, acronym { + border-bottom: dotted 1px; + cursor: help; +} + +.translated { + background-color: rgba(207, 255, 207, 0.2) +} + +.untranslated { + background-color: rgba(255, 207, 207, 0.2) +} + +/* -- code displays --------------------------------------------------------- */ + +pre { + overflow: auto; + overflow-y: hidden; /* fixes display issues on Chrome browsers */ +} + +pre, div[class*="highlight-"] { + clear: both; +} + +span.pre { + -moz-hyphens: none; + -ms-hyphens: none; + -webkit-hyphens: none; + hyphens: none; + white-space: nowrap; +} + +div[class*="highlight-"] { + margin: 1em 0; +} + +td.linenos pre { + border: 0; + background-color: transparent; + color: #aaa; +} + +table.highlighttable { + display: block; +} + +table.highlighttable tbody { + display: block; +} + +table.highlighttable tr { + display: flex; +} + +table.highlighttable td { + margin: 0; + padding: 0; +} + +table.highlighttable td.linenos { + padding-right: 0.5em; +} + +table.highlighttable td.code { + flex: 1; + overflow: hidden; +} + +.highlight .hll { + display: block; +} + +div.highlight pre, +table.highlighttable pre { + margin: 0; +} + +div.code-block-caption + div { + margin-top: 0; +} + +div.code-block-caption { + margin-top: 1em; + padding: 2px 5px; + font-size: small; +} + +div.code-block-caption code { + background-color: transparent; +} + +table.highlighttable td.linenos, +span.linenos, +div.highlight span.gp { /* gp: Generic.Prompt */ + user-select: none; + -webkit-user-select: text; /* Safari fallback only */ + -webkit-user-select: none; /* Chrome/Safari */ + -moz-user-select: none; /* Firefox */ + -ms-user-select: none; /* IE10+ */ +} + +div.code-block-caption span.caption-number { + padding: 0.1em 0.3em; + font-style: italic; +} + +div.code-block-caption span.caption-text { +} + +div.literal-block-wrapper { + margin: 1em 0; +} + +code.xref, a code { + background-color: transparent; + font-weight: bold; +} + +h1 code, h2 code, h3 code, h4 code, h5 code, h6 code { + background-color: transparent; +} + +.viewcode-link { + float: right; +} + +.viewcode-back { + float: right; + font-family: sans-serif; +} + +div.viewcode-block:target { + margin: -1px -10px; + padding: 0 10px; +} + +/* -- math display ---------------------------------------------------------- */ + +img.math { + vertical-align: middle; +} + +div.body div.math p { + text-align: center; +} + +span.eqno { + float: right; +} + +span.eqno a.headerlink { + position: absolute; + z-index: 1; +} + +div.math:hover a.headerlink { + visibility: visible; +} + +/* -- printout stylesheet --------------------------------------------------- */ + +@media print { + div.document, + div.documentwrapper, + div.bodywrapper { + margin: 0 !important; + width: 100%; + } + + div.sphinxsidebar, + div.related, + div.footer, + #top-link { + display: none; + } +} \ No newline at end of file diff --git a/_static/bgfooter.png b/_static/bgfooter.png new file mode 100644 index 0000000000000000000000000000000000000000..b7c7cadd4e6978aa7081fe672fcf5afc97516bda GIT binary patch literal 276 zcmV+v0qg#WP)qvnR6EfsQ*t~7O=UY2%BZy- zs#7>Lw$#|1-#yb5jZ8}CcXenmE?Bb?+emvZy3eu4G&!aT9i`%Ot1U0%(#mRx?NNc)^t8TJHA0R4$Di^IIL4X9&MVm&N-9#bE;?}xqq}wTrc0WUU#YK z#2JfT+O{=ipwX3&j4H~AegD$wD(9Ee_Le?vx(rq^B%Dj?^+nzae0J!bK00|W&N)Yz aUi|<^NiO;Hz(H~V0000P0IhA`JcOe?|*M3M!YD+&^mI=Y=U~-8S>8l1XAJ*3?jZZ Q8UO$Q07*qoM6N<$f;!4|TmS$7 literal 0 HcmV?d00001 diff --git a/_static/doctools.js b/_static/doctools.js new file mode 100644 index 0000000..d06a71d --- /dev/null +++ b/_static/doctools.js @@ -0,0 +1,156 @@ +/* + * doctools.js + * ~~~~~~~~~~~ + * + * Base JavaScript utilities for all Sphinx HTML documentation. + * + * :copyright: Copyright 2007-2023 by the Sphinx team, see AUTHORS. + * :license: BSD, see LICENSE for details. + * + */ +"use strict"; + +const BLACKLISTED_KEY_CONTROL_ELEMENTS = new Set([ + "TEXTAREA", + "INPUT", + "SELECT", + "BUTTON", +]); + +const _ready = (callback) => { + if (document.readyState !== "loading") { + callback(); + } else { + document.addEventListener("DOMContentLoaded", callback); + } +}; + +/** + * Small JavaScript module for the documentation. + */ +const Documentation = { + init: () => { + Documentation.initDomainIndexTable(); + Documentation.initOnKeyListeners(); + }, + + /** + * i18n support + */ + TRANSLATIONS: {}, + PLURAL_EXPR: (n) => (n === 1 ? 0 : 1), + LOCALE: "unknown", + + // gettext and ngettext don't access this so that the functions + // can safely bound to a different name (_ = Documentation.gettext) + gettext: (string) => { + const translated = Documentation.TRANSLATIONS[string]; + switch (typeof translated) { + case "undefined": + return string; // no translation + case "string": + return translated; // translation exists + default: + return translated[0]; // (singular, plural) translation tuple exists + } + }, + + ngettext: (singular, plural, n) => { + const translated = Documentation.TRANSLATIONS[singular]; + if (typeof translated !== "undefined") + return translated[Documentation.PLURAL_EXPR(n)]; + return n === 1 ? singular : plural; + }, + + addTranslations: (catalog) => { + Object.assign(Documentation.TRANSLATIONS, catalog.messages); + Documentation.PLURAL_EXPR = new Function( + "n", + `return (${catalog.plural_expr})` + ); + Documentation.LOCALE = catalog.locale; + }, + + /** + * helper function to focus on search bar + */ + focusSearchBar: () => { + document.querySelectorAll("input[name=q]")[0]?.focus(); + }, + + /** + * Initialise the domain index toggle buttons + */ + initDomainIndexTable: () => { + const toggler = (el) => { + const idNumber = el.id.substr(7); + const toggledRows = document.querySelectorAll(`tr.cg-${idNumber}`); + if (el.src.substr(-9) === "minus.png") { + el.src = `${el.src.substr(0, el.src.length - 9)}plus.png`; + toggledRows.forEach((el) => (el.style.display = "none")); + } else { + el.src = `${el.src.substr(0, el.src.length - 8)}minus.png`; + toggledRows.forEach((el) => (el.style.display = "")); + } + }; + + const togglerElements = document.querySelectorAll("img.toggler"); + togglerElements.forEach((el) => + el.addEventListener("click", (event) => toggler(event.currentTarget)) + ); + togglerElements.forEach((el) => (el.style.display = "")); + if (DOCUMENTATION_OPTIONS.COLLAPSE_INDEX) togglerElements.forEach(toggler); + }, + + initOnKeyListeners: () => { + // only install a listener if it is really needed + if ( + !DOCUMENTATION_OPTIONS.NAVIGATION_WITH_KEYS && + !DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS + ) + return; + + document.addEventListener("keydown", (event) => { + // bail for input elements + if (BLACKLISTED_KEY_CONTROL_ELEMENTS.has(document.activeElement.tagName)) return; + // bail with special keys + if (event.altKey || event.ctrlKey || event.metaKey) return; + + if (!event.shiftKey) { + switch (event.key) { + case "ArrowLeft": + if (!DOCUMENTATION_OPTIONS.NAVIGATION_WITH_KEYS) break; + + const prevLink = document.querySelector('link[rel="prev"]'); + if (prevLink && prevLink.href) { + window.location.href = prevLink.href; + event.preventDefault(); + } + break; + case "ArrowRight": + if (!DOCUMENTATION_OPTIONS.NAVIGATION_WITH_KEYS) break; + + const nextLink = document.querySelector('link[rel="next"]'); + if (nextLink && nextLink.href) { + window.location.href = nextLink.href; + event.preventDefault(); + } + break; + } + } + + // some keyboard layouts may need Shift to get / + switch (event.key) { + case "/": + if (!DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS) break; + Documentation.focusSearchBar(); + event.preventDefault(); + } + }); + }, +}; + +// quick alias for translations +const _ = Documentation.gettext; + +_ready(Documentation.init); diff --git a/_static/documentation_options.js b/_static/documentation_options.js new file mode 100644 index 0000000..e21c068 --- /dev/null +++ b/_static/documentation_options.js @@ -0,0 +1,13 @@ +const DOCUMENTATION_OPTIONS = { + VERSION: '0.1', + LANGUAGE: 'en', + COLLAPSE_INDEX: false, + BUILDER: 'html', + FILE_SUFFIX: '.html', + LINK_SUFFIX: '.html', + HAS_SOURCE: true, + SOURCELINK_SUFFIX: '.txt', + NAVIGATION_WITH_KEYS: false, + SHOW_SEARCH_SUMMARY: true, + ENABLE_SEARCH_SHORTCUTS: true, +}; \ No newline at end of file diff --git a/_static/file.png b/_static/file.png new file mode 100644 index 0000000000000000000000000000000000000000..a858a410e4faa62ce324d814e4b816fff83a6fb3 GIT binary patch literal 286 zcmV+(0pb3MP)s`hMrGg#P~ix$^RISR_I47Y|r1 z_CyJOe}D1){SET-^Amu_i71Lt6eYfZjRyw@I6OQAIXXHDfiX^GbOlHe=Ae4>0m)d(f|Me07*qoM6N<$f}vM^LjV8( literal 0 HcmV?d00001 diff --git a/_static/language_data.js b/_static/language_data.js new file mode 100644 index 0000000..250f566 --- /dev/null +++ b/_static/language_data.js @@ -0,0 +1,199 @@ +/* + * language_data.js + * ~~~~~~~~~~~~~~~~ + * + * This script contains the language-specific data used by searchtools.js, + * namely the list of stopwords, stemmer, scorer and splitter. + * + * :copyright: Copyright 2007-2023 by the Sphinx team, see AUTHORS. + * :license: BSD, see LICENSE for details. + * + */ + +var stopwords = ["a", "and", "are", "as", "at", "be", "but", "by", "for", "if", "in", "into", "is", "it", "near", "no", "not", "of", "on", "or", "such", "that", "the", "their", "then", "there", "these", "they", "this", "to", "was", "will", "with"]; + + +/* Non-minified version is copied as a separate JS file, is available */ + +/** + * Porter Stemmer + */ +var Stemmer = function() { + + var step2list = { + ational: 'ate', + tional: 'tion', + enci: 'ence', + anci: 'ance', + izer: 'ize', + bli: 'ble', + alli: 'al', + entli: 'ent', + eli: 'e', + ousli: 'ous', + ization: 'ize', + ation: 'ate', + ator: 'ate', + alism: 'al', + iveness: 'ive', + fulness: 'ful', + ousness: 'ous', + aliti: 'al', + iviti: 'ive', + biliti: 'ble', + logi: 'log' + }; + + var step3list = { + icate: 'ic', + ative: '', + alize: 'al', + iciti: 'ic', + ical: 'ic', + ful: '', + ness: '' + }; + + var c = "[^aeiou]"; // consonant + var v = "[aeiouy]"; // vowel + var C = c + "[^aeiouy]*"; // consonant sequence + var V = v + "[aeiou]*"; // vowel sequence + + var mgr0 = "^(" + C + ")?" + V + C; // [C]VC... is m>0 + var meq1 = "^(" + C + ")?" + V + C + "(" + V + ")?$"; // [C]VC[V] is m=1 + var mgr1 = "^(" + C + ")?" + V + C + V + C; // [C]VCVC... is m>1 + var s_v = "^(" + C + ")?" + v; // vowel in stem + + this.stemWord = function (w) { + var stem; + var suffix; + var firstch; + var origword = w; + + if (w.length < 3) + return w; + + var re; + var re2; + var re3; + var re4; + + firstch = w.substr(0,1); + if (firstch == "y") + w = firstch.toUpperCase() + w.substr(1); + + // Step 1a + re = /^(.+?)(ss|i)es$/; + re2 = /^(.+?)([^s])s$/; + + if (re.test(w)) + w = w.replace(re,"$1$2"); + else if (re2.test(w)) + w = w.replace(re2,"$1$2"); + + // Step 1b + re = /^(.+?)eed$/; + re2 = /^(.+?)(ed|ing)$/; + if (re.test(w)) { + var fp = re.exec(w); + re = new RegExp(mgr0); + if (re.test(fp[1])) { + re = /.$/; + w = w.replace(re,""); + } + } + else if (re2.test(w)) { + var fp = re2.exec(w); + stem = fp[1]; + re2 = new RegExp(s_v); + if (re2.test(stem)) { + w = stem; + re2 = /(at|bl|iz)$/; + re3 = new RegExp("([^aeiouylsz])\\1$"); + re4 = new RegExp("^" + C + v + "[^aeiouwxy]$"); + if (re2.test(w)) + w = w + "e"; + else if (re3.test(w)) { + re = /.$/; + w = w.replace(re,""); + } + else if (re4.test(w)) + w = w + "e"; + } + } + + // Step 1c + re = /^(.+?)y$/; + if (re.test(w)) { + var fp = re.exec(w); + stem = fp[1]; + re = new RegExp(s_v); + if (re.test(stem)) + w = stem + "i"; + } + + // Step 2 + re = /^(.+?)(ational|tional|enci|anci|izer|bli|alli|entli|eli|ousli|ization|ation|ator|alism|iveness|fulness|ousness|aliti|iviti|biliti|logi)$/; + if (re.test(w)) { + var fp = re.exec(w); + stem = fp[1]; + suffix = fp[2]; + re = new RegExp(mgr0); + if (re.test(stem)) + w = stem + step2list[suffix]; + } + + // Step 3 + re = /^(.+?)(icate|ative|alize|iciti|ical|ful|ness)$/; + if (re.test(w)) { + var fp = re.exec(w); + stem = fp[1]; + suffix = fp[2]; + re = new RegExp(mgr0); + if (re.test(stem)) + w = stem + step3list[suffix]; + } + + // Step 4 + re = /^(.+?)(al|ance|ence|er|ic|able|ible|ant|ement|ment|ent|ou|ism|ate|iti|ous|ive|ize)$/; + re2 = /^(.+?)(s|t)(ion)$/; + if (re.test(w)) { + var fp = re.exec(w); + stem = fp[1]; + re = new RegExp(mgr1); + if (re.test(stem)) + w = stem; + } + else if (re2.test(w)) { + var fp = re2.exec(w); + stem = fp[1] + fp[2]; + re2 = new RegExp(mgr1); + if (re2.test(stem)) + w = stem; + } + + // Step 5 + re = /^(.+?)e$/; + if (re.test(w)) { + var fp = re.exec(w); + stem = fp[1]; + re = new RegExp(mgr1); + re2 = new RegExp(meq1); + re3 = new RegExp("^" + C + v + "[^aeiouwxy]$"); + if (re.test(stem) || (re2.test(stem) && !(re3.test(stem)))) + w = stem; + } + re = /ll$/; + re2 = new RegExp(mgr1); + if (re.test(w) && re2.test(w)) { + re = /.$/; + w = w.replace(re,""); + } + + // and turn initial Y back to y + if (firstch == "y") + w = firstch.toLowerCase() + w.substr(1); + return w; + } +} + diff --git a/_static/minus.png b/_static/minus.png new file mode 100644 index 0000000000000000000000000000000000000000..d96755fdaf8bb2214971e0db9c1fd3077d7c419d GIT binary patch literal 90 zcmeAS@N?(olHy`uVBq!ia0vp^+#t*WBp7;*Yy1LIik>cxAr*|t7R?Mi>2?kWtu=nj kDsEF_5m^0CR;1wuP-*O&G^0G}KYk!hp00i_>zopr08q^qX#fBK literal 0 HcmV?d00001 diff --git a/_static/plus.png b/_static/plus.png new file mode 100644 index 0000000000000000000000000000000000000000..7107cec93a979b9a5f64843235a16651d563ce2d GIT binary patch literal 90 zcmeAS@N?(olHy`uVBq!ia0vp^+#t*WBp7;*Yy1LIik>cxAr*|t7R?Mi>2?kWtu>-2 m3q%Vub%g%s<8sJhVPMczOq}xhg9DJoz~JfX=d#Wzp$Pyb1r*Kz literal 0 HcmV?d00001 diff --git a/_static/pygments.css b/_static/pygments.css new file mode 100644 index 0000000..6110e9f --- /dev/null +++ b/_static/pygments.css @@ -0,0 +1,84 @@ +pre { line-height: 125%; } +td.linenos .normal { color: inherit; background-color: transparent; padding-left: 5px; padding-right: 5px; } +span.linenos { color: inherit; background-color: transparent; padding-left: 5px; padding-right: 5px; } +td.linenos .special { color: #000000; background-color: #ffffc0; padding-left: 5px; padding-right: 5px; } +span.linenos.special { color: #000000; background-color: #ffffc0; padding-left: 5px; padding-right: 5px; } +.highlight .hll { background-color: #ffffcc } +.highlight { background: #f8f8f8; } +.highlight .c { color: #8f5902; font-style: italic } /* Comment */ +.highlight .err { color: #a40000; border: 1px solid #ef2929 } /* Error */ +.highlight .g { color: #000000 } /* Generic */ +.highlight .k { color: #204a87; font-weight: bold } /* Keyword */ +.highlight .l { color: #000000 } /* Literal */ +.highlight .n { color: #000000 } /* Name */ +.highlight .o { color: #ce5c00; font-weight: bold } /* Operator */ +.highlight .x { color: #000000 } /* Other */ +.highlight .p { color: #000000; font-weight: bold } /* Punctuation */ +.highlight .ch { color: #8f5902; font-style: italic } /* Comment.Hashbang */ +.highlight .cm { color: #8f5902; font-style: italic } /* Comment.Multiline */ +.highlight .cp { color: #8f5902; font-style: italic } /* Comment.Preproc */ +.highlight .cpf { color: #8f5902; font-style: italic } /* Comment.PreprocFile */ +.highlight .c1 { color: #8f5902; font-style: italic } /* Comment.Single */ +.highlight .cs { color: #8f5902; font-style: italic } /* Comment.Special */ +.highlight .gd { color: #a40000 } /* Generic.Deleted */ +.highlight .ge { color: #000000; font-style: italic } /* Generic.Emph */ +.highlight .ges { color: #000000; font-weight: bold; font-style: italic } /* Generic.EmphStrong */ +.highlight .gr { color: #ef2929 } /* Generic.Error */ +.highlight .gh { color: #000080; font-weight: bold } /* Generic.Heading */ +.highlight .gi { color: #00A000 } /* Generic.Inserted */ +.highlight .go { color: #000000; font-style: italic } /* Generic.Output */ +.highlight .gp { color: #8f5902 } /* Generic.Prompt */ +.highlight .gs { color: #000000; font-weight: bold } /* Generic.Strong */ +.highlight .gu { color: #800080; font-weight: bold } /* Generic.Subheading */ +.highlight .gt { color: #a40000; font-weight: bold } /* Generic.Traceback */ +.highlight .kc { color: #204a87; font-weight: bold } /* Keyword.Constant */ +.highlight .kd { color: #204a87; font-weight: bold } /* Keyword.Declaration */ +.highlight .kn { color: #204a87; font-weight: bold } /* Keyword.Namespace */ +.highlight .kp { color: #204a87; font-weight: bold } /* Keyword.Pseudo */ +.highlight .kr { color: #204a87; font-weight: bold } /* Keyword.Reserved */ +.highlight .kt { color: #204a87; font-weight: bold } /* Keyword.Type */ +.highlight .ld { color: #000000 } /* Literal.Date */ +.highlight .m { color: #0000cf; font-weight: bold } /* Literal.Number */ +.highlight .s { color: #4e9a06 } /* Literal.String */ +.highlight .na { color: #c4a000 } /* Name.Attribute */ +.highlight .nb { color: #204a87 } /* Name.Builtin */ +.highlight .nc { color: #000000 } /* Name.Class */ +.highlight .no { color: #000000 } /* Name.Constant */ +.highlight .nd { color: #5c35cc; font-weight: bold } /* Name.Decorator */ +.highlight .ni { color: #ce5c00 } /* Name.Entity */ +.highlight .ne { color: #cc0000; font-weight: bold } /* Name.Exception */ +.highlight .nf { color: #000000 } /* Name.Function */ +.highlight .nl { color: #f57900 } /* Name.Label */ +.highlight .nn { color: #000000 } /* Name.Namespace */ +.highlight .nx { color: #000000 } /* Name.Other */ +.highlight .py { color: #000000 } /* Name.Property */ +.highlight .nt { color: #204a87; font-weight: bold } /* Name.Tag */ +.highlight .nv { color: #000000 } /* Name.Variable */ +.highlight .ow { color: #204a87; font-weight: bold } /* Operator.Word */ +.highlight .pm { color: #000000; font-weight: bold } /* Punctuation.Marker */ +.highlight .w { color: #f8f8f8 } /* Text.Whitespace */ +.highlight .mb { color: #0000cf; font-weight: bold } /* Literal.Number.Bin */ +.highlight .mf { color: #0000cf; font-weight: bold } /* Literal.Number.Float */ +.highlight .mh { color: #0000cf; font-weight: bold } /* Literal.Number.Hex */ +.highlight .mi { color: #0000cf; font-weight: bold } /* Literal.Number.Integer */ +.highlight .mo { color: #0000cf; font-weight: bold } /* Literal.Number.Oct */ +.highlight .sa { color: #4e9a06 } /* Literal.String.Affix */ +.highlight .sb { color: #4e9a06 } /* Literal.String.Backtick */ +.highlight .sc { color: #4e9a06 } /* Literal.String.Char */ +.highlight .dl { color: #4e9a06 } /* Literal.String.Delimiter */ +.highlight .sd { color: #8f5902; font-style: italic } /* Literal.String.Doc */ +.highlight .s2 { color: #4e9a06 } /* Literal.String.Double */ +.highlight .se { color: #4e9a06 } /* Literal.String.Escape */ +.highlight .sh { color: #4e9a06 } /* Literal.String.Heredoc */ +.highlight .si { color: #4e9a06 } /* Literal.String.Interpol */ +.highlight .sx { color: #4e9a06 } /* Literal.String.Other */ +.highlight .sr { color: #4e9a06 } /* Literal.String.Regex */ +.highlight .s1 { color: #4e9a06 } /* Literal.String.Single */ +.highlight .ss { color: #4e9a06 } /* Literal.String.Symbol */ +.highlight .bp { color: #3465a4 } /* Name.Builtin.Pseudo */ +.highlight .fm { color: #000000 } /* Name.Function.Magic */ +.highlight .vc { color: #000000 } /* Name.Variable.Class */ +.highlight .vg { color: #000000 } /* Name.Variable.Global */ +.highlight .vi { color: #000000 } /* Name.Variable.Instance */ +.highlight .vm { color: #000000 } /* Name.Variable.Magic */ +.highlight .il { color: #0000cf; font-weight: bold } /* Literal.Number.Integer.Long */ \ No newline at end of file diff --git a/_static/searchtools.js b/_static/searchtools.js new file mode 100644 index 0000000..7918c3f --- /dev/null +++ b/_static/searchtools.js @@ -0,0 +1,574 @@ +/* + * searchtools.js + * ~~~~~~~~~~~~~~~~ + * + * Sphinx JavaScript utilities for the full-text search. + * + * :copyright: Copyright 2007-2023 by the Sphinx team, see AUTHORS. + * :license: BSD, see LICENSE for details. + * + */ +"use strict"; + +/** + * Simple result scoring code. + */ +if (typeof Scorer === "undefined") { + var Scorer = { + // Implement the following function to further tweak the score for each result + // The function takes a result array [docname, title, anchor, descr, score, filename] + // and returns the new score. + /* + score: result => { + const [docname, title, anchor, descr, score, filename] = result + return score + }, + */ + + // query matches the full name of an object + objNameMatch: 11, + // or matches in the last dotted part of the object name + objPartialMatch: 6, + // Additive scores depending on the priority of the object + objPrio: { + 0: 15, // used to be importantResults + 1: 5, // used to be objectResults + 2: -5, // used to be unimportantResults + }, + // Used when the priority is not in the mapping. + objPrioDefault: 0, + + // query found in title + title: 15, + partialTitle: 7, + // query found in terms + term: 5, + partialTerm: 2, + }; +} + +const _removeChildren = (element) => { + while (element && element.lastChild) element.removeChild(element.lastChild); +}; + +/** + * See https://developer.mozilla.org/en-US/docs/Web/JavaScript/Guide/Regular_Expressions#escaping + */ +const _escapeRegExp = (string) => + string.replace(/[.*+\-?^${}()|[\]\\]/g, "\\$&"); // $& means the whole matched string + +const _displayItem = (item, searchTerms, highlightTerms) => { + const docBuilder = DOCUMENTATION_OPTIONS.BUILDER; + const docFileSuffix = DOCUMENTATION_OPTIONS.FILE_SUFFIX; + const docLinkSuffix = DOCUMENTATION_OPTIONS.LINK_SUFFIX; + const showSearchSummary = DOCUMENTATION_OPTIONS.SHOW_SEARCH_SUMMARY; + const contentRoot = document.documentElement.dataset.content_root; + + const [docName, title, anchor, descr, score, _filename] = item; + + let listItem = document.createElement("li"); + let requestUrl; + let linkUrl; + if (docBuilder === "dirhtml") { + // dirhtml builder + let dirname = docName + "/"; + if (dirname.match(/\/index\/$/)) + dirname = dirname.substring(0, dirname.length - 6); + else if (dirname === "index/") dirname = ""; + requestUrl = contentRoot + dirname; + linkUrl = requestUrl; + } else { + // normal html builders + requestUrl = contentRoot + docName + docFileSuffix; + linkUrl = docName + docLinkSuffix; + } + let linkEl = listItem.appendChild(document.createElement("a")); + linkEl.href = linkUrl + anchor; + linkEl.dataset.score = score; + linkEl.innerHTML = title; + if (descr) { + listItem.appendChild(document.createElement("span")).innerHTML = + " (" + descr + ")"; + // highlight search terms in the description + if (SPHINX_HIGHLIGHT_ENABLED) // set in sphinx_highlight.js + highlightTerms.forEach((term) => _highlightText(listItem, term, "highlighted")); + } + else if (showSearchSummary) + fetch(requestUrl) + .then((responseData) => responseData.text()) + .then((data) => { + if (data) + listItem.appendChild( + Search.makeSearchSummary(data, searchTerms) + ); + // highlight search terms in the summary + if (SPHINX_HIGHLIGHT_ENABLED) // set in sphinx_highlight.js + highlightTerms.forEach((term) => _highlightText(listItem, term, "highlighted")); + }); + Search.output.appendChild(listItem); +}; +const _finishSearch = (resultCount) => { + Search.stopPulse(); + Search.title.innerText = _("Search Results"); + if (!resultCount) + Search.status.innerText = Documentation.gettext( + "Your search did not match any documents. Please make sure that all words are spelled correctly and that you've selected enough categories." + ); + else + Search.status.innerText = _( + `Search finished, found ${resultCount} page(s) matching the search query.` + ); +}; +const _displayNextItem = ( + results, + resultCount, + searchTerms, + highlightTerms, +) => { + // results left, load the summary and display it + // this is intended to be dynamic (don't sub resultsCount) + if (results.length) { + _displayItem(results.pop(), searchTerms, highlightTerms); + setTimeout( + () => _displayNextItem(results, resultCount, searchTerms, highlightTerms), + 5 + ); + } + // search finished, update title and status message + else _finishSearch(resultCount); +}; + +/** + * Default splitQuery function. Can be overridden in ``sphinx.search`` with a + * custom function per language. + * + * The regular expression works by splitting the string on consecutive characters + * that are not Unicode letters, numbers, underscores, or emoji characters. + * This is the same as ``\W+`` in Python, preserving the surrogate pair area. + */ +if (typeof splitQuery === "undefined") { + var splitQuery = (query) => query + .split(/[^\p{Letter}\p{Number}_\p{Emoji_Presentation}]+/gu) + .filter(term => term) // remove remaining empty strings +} + +/** + * Search Module + */ +const Search = { + _index: null, + _queued_query: null, + _pulse_status: -1, + + htmlToText: (htmlString) => { + const htmlElement = new DOMParser().parseFromString(htmlString, 'text/html'); + htmlElement.querySelectorAll(".headerlink").forEach((el) => { el.remove() }); + const docContent = htmlElement.querySelector('[role="main"]'); + if (docContent !== undefined) return docContent.textContent; + console.warn( + "Content block not found. Sphinx search tries to obtain it via '[role=main]'. Could you check your theme or template." + ); + return ""; + }, + + init: () => { + const query = new URLSearchParams(window.location.search).get("q"); + document + .querySelectorAll('input[name="q"]') + .forEach((el) => (el.value = query)); + if (query) Search.performSearch(query); + }, + + loadIndex: (url) => + (document.body.appendChild(document.createElement("script")).src = url), + + setIndex: (index) => { + Search._index = index; + if (Search._queued_query !== null) { + const query = Search._queued_query; + Search._queued_query = null; + Search.query(query); + } + }, + + hasIndex: () => Search._index !== null, + + deferQuery: (query) => (Search._queued_query = query), + + stopPulse: () => (Search._pulse_status = -1), + + startPulse: () => { + if (Search._pulse_status >= 0) return; + + const pulse = () => { + Search._pulse_status = (Search._pulse_status + 1) % 4; + Search.dots.innerText = ".".repeat(Search._pulse_status); + if (Search._pulse_status >= 0) window.setTimeout(pulse, 500); + }; + pulse(); + }, + + /** + * perform a search for something (or wait until index is loaded) + */ + performSearch: (query) => { + // create the required interface elements + const searchText = document.createElement("h2"); + searchText.textContent = _("Searching"); + const searchSummary = document.createElement("p"); + searchSummary.classList.add("search-summary"); + searchSummary.innerText = ""; + const searchList = document.createElement("ul"); + searchList.classList.add("search"); + + const out = document.getElementById("search-results"); + Search.title = out.appendChild(searchText); + Search.dots = Search.title.appendChild(document.createElement("span")); + Search.status = out.appendChild(searchSummary); + Search.output = out.appendChild(searchList); + + const searchProgress = document.getElementById("search-progress"); + // Some themes don't use the search progress node + if (searchProgress) { + searchProgress.innerText = _("Preparing search..."); + } + Search.startPulse(); + + // index already loaded, the browser was quick! + if (Search.hasIndex()) Search.query(query); + else Search.deferQuery(query); + }, + + /** + * execute search (requires search index to be loaded) + */ + query: (query) => { + const filenames = Search._index.filenames; + const docNames = Search._index.docnames; + const titles = Search._index.titles; + const allTitles = Search._index.alltitles; + const indexEntries = Search._index.indexentries; + + // stem the search terms and add them to the correct list + const stemmer = new Stemmer(); + const searchTerms = new Set(); + const excludedTerms = new Set(); + const highlightTerms = new Set(); + const objectTerms = new Set(splitQuery(query.toLowerCase().trim())); + splitQuery(query.trim()).forEach((queryTerm) => { + const queryTermLower = queryTerm.toLowerCase(); + + // maybe skip this "word" + // stopwords array is from language_data.js + if ( + stopwords.indexOf(queryTermLower) !== -1 || + queryTerm.match(/^\d+$/) + ) + return; + + // stem the word + let word = stemmer.stemWord(queryTermLower); + // select the correct list + if (word[0] === "-") excludedTerms.add(word.substr(1)); + else { + searchTerms.add(word); + highlightTerms.add(queryTermLower); + } + }); + + if (SPHINX_HIGHLIGHT_ENABLED) { // set in sphinx_highlight.js + localStorage.setItem("sphinx_highlight_terms", [...highlightTerms].join(" ")) + } + + // console.debug("SEARCH: searching for:"); + // console.info("required: ", [...searchTerms]); + // console.info("excluded: ", [...excludedTerms]); + + // array of [docname, title, anchor, descr, score, filename] + let results = []; + _removeChildren(document.getElementById("search-progress")); + + const queryLower = query.toLowerCase(); + for (const [title, foundTitles] of Object.entries(allTitles)) { + if (title.toLowerCase().includes(queryLower) && (queryLower.length >= title.length/2)) { + for (const [file, id] of foundTitles) { + let score = Math.round(100 * queryLower.length / title.length) + results.push([ + docNames[file], + titles[file] !== title ? `${titles[file]} > ${title}` : title, + id !== null ? "#" + id : "", + null, + score, + filenames[file], + ]); + } + } + } + + // search for explicit entries in index directives + for (const [entry, foundEntries] of Object.entries(indexEntries)) { + if (entry.includes(queryLower) && (queryLower.length >= entry.length/2)) { + for (const [file, id] of foundEntries) { + let score = Math.round(100 * queryLower.length / entry.length) + results.push([ + docNames[file], + titles[file], + id ? "#" + id : "", + null, + score, + filenames[file], + ]); + } + } + } + + // lookup as object + objectTerms.forEach((term) => + results.push(...Search.performObjectSearch(term, objectTerms)) + ); + + // lookup as search terms in fulltext + results.push(...Search.performTermsSearch(searchTerms, excludedTerms)); + + // let the scorer override scores with a custom scoring function + if (Scorer.score) results.forEach((item) => (item[4] = Scorer.score(item))); + + // now sort the results by score (in opposite order of appearance, since the + // display function below uses pop() to retrieve items) and then + // alphabetically + results.sort((a, b) => { + const leftScore = a[4]; + const rightScore = b[4]; + if (leftScore === rightScore) { + // same score: sort alphabetically + const leftTitle = a[1].toLowerCase(); + const rightTitle = b[1].toLowerCase(); + if (leftTitle === rightTitle) return 0; + return leftTitle > rightTitle ? -1 : 1; // inverted is intentional + } + return leftScore > rightScore ? 1 : -1; + }); + + // remove duplicate search results + // note the reversing of results, so that in the case of duplicates, the highest-scoring entry is kept + let seen = new Set(); + results = results.reverse().reduce((acc, result) => { + let resultStr = result.slice(0, 4).concat([result[5]]).map(v => String(v)).join(','); + if (!seen.has(resultStr)) { + acc.push(result); + seen.add(resultStr); + } + return acc; + }, []); + + results = results.reverse(); + + // for debugging + //Search.lastresults = results.slice(); // a copy + // console.info("search results:", Search.lastresults); + + // print the results + _displayNextItem(results, results.length, searchTerms, highlightTerms); + }, + + /** + * search for object names + */ + performObjectSearch: (object, objectTerms) => { + const filenames = Search._index.filenames; + const docNames = Search._index.docnames; + const objects = Search._index.objects; + const objNames = Search._index.objnames; + const titles = Search._index.titles; + + const results = []; + + const objectSearchCallback = (prefix, match) => { + const name = match[4] + const fullname = (prefix ? prefix + "." : "") + name; + const fullnameLower = fullname.toLowerCase(); + if (fullnameLower.indexOf(object) < 0) return; + + let score = 0; + const parts = fullnameLower.split("."); + + // check for different match types: exact matches of full name or + // "last name" (i.e. last dotted part) + if (fullnameLower === object || parts.slice(-1)[0] === object) + score += Scorer.objNameMatch; + else if (parts.slice(-1)[0].indexOf(object) > -1) + score += Scorer.objPartialMatch; // matches in last name + + const objName = objNames[match[1]][2]; + const title = titles[match[0]]; + + // If more than one term searched for, we require other words to be + // found in the name/title/description + const otherTerms = new Set(objectTerms); + otherTerms.delete(object); + if (otherTerms.size > 0) { + const haystack = `${prefix} ${name} ${objName} ${title}`.toLowerCase(); + if ( + [...otherTerms].some((otherTerm) => haystack.indexOf(otherTerm) < 0) + ) + return; + } + + let anchor = match[3]; + if (anchor === "") anchor = fullname; + else if (anchor === "-") anchor = objNames[match[1]][1] + "-" + fullname; + + const descr = objName + _(", in ") + title; + + // add custom score for some objects according to scorer + if (Scorer.objPrio.hasOwnProperty(match[2])) + score += Scorer.objPrio[match[2]]; + else score += Scorer.objPrioDefault; + + results.push([ + docNames[match[0]], + fullname, + "#" + anchor, + descr, + score, + filenames[match[0]], + ]); + }; + Object.keys(objects).forEach((prefix) => + objects[prefix].forEach((array) => + objectSearchCallback(prefix, array) + ) + ); + return results; + }, + + /** + * search for full-text terms in the index + */ + performTermsSearch: (searchTerms, excludedTerms) => { + // prepare search + const terms = Search._index.terms; + const titleTerms = Search._index.titleterms; + const filenames = Search._index.filenames; + const docNames = Search._index.docnames; + const titles = Search._index.titles; + + const scoreMap = new Map(); + const fileMap = new Map(); + + // perform the search on the required terms + searchTerms.forEach((word) => { + const files = []; + const arr = [ + { files: terms[word], score: Scorer.term }, + { files: titleTerms[word], score: Scorer.title }, + ]; + // add support for partial matches + if (word.length > 2) { + const escapedWord = _escapeRegExp(word); + Object.keys(terms).forEach((term) => { + if (term.match(escapedWord) && !terms[word]) + arr.push({ files: terms[term], score: Scorer.partialTerm }); + }); + Object.keys(titleTerms).forEach((term) => { + if (term.match(escapedWord) && !titleTerms[word]) + arr.push({ files: titleTerms[word], score: Scorer.partialTitle }); + }); + } + + // no match but word was a required one + if (arr.every((record) => record.files === undefined)) return; + + // found search word in contents + arr.forEach((record) => { + if (record.files === undefined) return; + + let recordFiles = record.files; + if (recordFiles.length === undefined) recordFiles = [recordFiles]; + files.push(...recordFiles); + + // set score for the word in each file + recordFiles.forEach((file) => { + if (!scoreMap.has(file)) scoreMap.set(file, {}); + scoreMap.get(file)[word] = record.score; + }); + }); + + // create the mapping + files.forEach((file) => { + if (fileMap.has(file) && fileMap.get(file).indexOf(word) === -1) + fileMap.get(file).push(word); + else fileMap.set(file, [word]); + }); + }); + + // now check if the files don't contain excluded terms + const results = []; + for (const [file, wordList] of fileMap) { + // check if all requirements are matched + + // as search terms with length < 3 are discarded + const filteredTermCount = [...searchTerms].filter( + (term) => term.length > 2 + ).length; + if ( + wordList.length !== searchTerms.size && + wordList.length !== filteredTermCount + ) + continue; + + // ensure that none of the excluded terms is in the search result + if ( + [...excludedTerms].some( + (term) => + terms[term] === file || + titleTerms[term] === file || + (terms[term] || []).includes(file) || + (titleTerms[term] || []).includes(file) + ) + ) + break; + + // select one (max) score for the file. + const score = Math.max(...wordList.map((w) => scoreMap.get(file)[w])); + // add result to the result list + results.push([ + docNames[file], + titles[file], + "", + null, + score, + filenames[file], + ]); + } + return results; + }, + + /** + * helper function to return a node containing the + * search summary for a given text. keywords is a list + * of stemmed words. + */ + makeSearchSummary: (htmlText, keywords) => { + const text = Search.htmlToText(htmlText); + if (text === "") return null; + + const textLower = text.toLowerCase(); + const actualStartPosition = [...keywords] + .map((k) => textLower.indexOf(k.toLowerCase())) + .filter((i) => i > -1) + .slice(-1)[0]; + const startWithContext = Math.max(actualStartPosition - 120, 0); + + const top = startWithContext === 0 ? "" : "..."; + const tail = startWithContext + 240 < text.length ? "..." : ""; + + let summary = document.createElement("p"); + summary.classList.add("context"); + summary.textContent = top + text.substr(startWithContext, 240).trim() + tail; + + return summary; + }, +}; + +_ready(Search.init); diff --git a/_static/sphinx_highlight.js b/_static/sphinx_highlight.js new file mode 100644 index 0000000..8a96c69 --- /dev/null +++ b/_static/sphinx_highlight.js @@ -0,0 +1,154 @@ +/* Highlighting utilities for Sphinx HTML documentation. */ +"use strict"; + +const SPHINX_HIGHLIGHT_ENABLED = true + +/** + * highlight a given string on a node by wrapping it in + * span elements with the given class name. + */ +const _highlight = (node, addItems, text, className) => { + if (node.nodeType === Node.TEXT_NODE) { + const val = node.nodeValue; + const parent = node.parentNode; + const pos = val.toLowerCase().indexOf(text); + if ( + pos >= 0 && + !parent.classList.contains(className) && + !parent.classList.contains("nohighlight") + ) { + let span; + + const closestNode = parent.closest("body, svg, foreignObject"); + const isInSVG = closestNode && closestNode.matches("svg"); + if (isInSVG) { + span = document.createElementNS("http://www.w3.org/2000/svg", "tspan"); + } else { + span = document.createElement("span"); + span.classList.add(className); + } + + span.appendChild(document.createTextNode(val.substr(pos, text.length))); + const rest = document.createTextNode(val.substr(pos + text.length)); + parent.insertBefore( + span, + parent.insertBefore( + rest, + node.nextSibling + ) + ); + node.nodeValue = val.substr(0, pos); + /* There may be more occurrences of search term in this node. So call this + * function recursively on the remaining fragment. + */ + _highlight(rest, addItems, text, className); + + if (isInSVG) { + const rect = document.createElementNS( + "http://www.w3.org/2000/svg", + "rect" + ); + const bbox = parent.getBBox(); + rect.x.baseVal.value = bbox.x; + rect.y.baseVal.value = bbox.y; + rect.width.baseVal.value = bbox.width; + rect.height.baseVal.value = bbox.height; + rect.setAttribute("class", className); + addItems.push({ parent: parent, target: rect }); + } + } + } else if (node.matches && !node.matches("button, select, textarea")) { + node.childNodes.forEach((el) => _highlight(el, addItems, text, className)); + } +}; +const _highlightText = (thisNode, text, className) => { + let addItems = []; + _highlight(thisNode, addItems, text, className); + addItems.forEach((obj) => + obj.parent.insertAdjacentElement("beforebegin", obj.target) + ); +}; + +/** + * Small JavaScript module for the documentation. + */ +const SphinxHighlight = { + + /** + * highlight the search words provided in localstorage in the text + */ + highlightSearchWords: () => { + if (!SPHINX_HIGHLIGHT_ENABLED) return; // bail if no highlight + + // get and clear terms from localstorage + const url = new URL(window.location); + const highlight = + localStorage.getItem("sphinx_highlight_terms") + || url.searchParams.get("highlight") + || ""; + localStorage.removeItem("sphinx_highlight_terms") + url.searchParams.delete("highlight"); + window.history.replaceState({}, "", url); + + // get individual terms from highlight string + const terms = highlight.toLowerCase().split(/\s+/).filter(x => x); + if (terms.length === 0) return; // nothing to do + + // There should never be more than one element matching "div.body" + const divBody = document.querySelectorAll("div.body"); + const body = divBody.length ? divBody[0] : document.querySelector("body"); + window.setTimeout(() => { + terms.forEach((term) => _highlightText(body, term, "highlighted")); + }, 10); + + const searchBox = document.getElementById("searchbox"); + if (searchBox === null) return; + searchBox.appendChild( + document + .createRange() + .createContextualFragment( + '" + ) + ); + }, + + /** + * helper function to hide the search marks again + */ + hideSearchWords: () => { + document + .querySelectorAll("#searchbox .highlight-link") + .forEach((el) => el.remove()); + document + .querySelectorAll("span.highlighted") + .forEach((el) => el.classList.remove("highlighted")); + localStorage.removeItem("sphinx_highlight_terms") + }, + + initEscapeListener: () => { + // only install a listener if it is really needed + if (!DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS) return; + + document.addEventListener("keydown", (event) => { + // bail for input elements + if (BLACKLISTED_KEY_CONTROL_ELEMENTS.has(document.activeElement.tagName)) return; + // bail with special keys + if (event.shiftKey || event.altKey || event.ctrlKey || event.metaKey) return; + if (DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS && (event.key === "Escape")) { + SphinxHighlight.hideSearchWords(); + event.preventDefault(); + } + }); + }, +}; + +_ready(() => { + /* Do not call highlightSearchWords() when we are on the search page. + * It will highlight words from the *previous* search query. + */ + if (typeof Search === "undefined") SphinxHighlight.highlightSearchWords(); + SphinxHighlight.initEscapeListener(); +}); diff --git a/cpg.html b/cpg.html new file mode 100644 index 0000000..894cd57 --- /dev/null +++ b/cpg.html @@ -0,0 +1,95 @@ + + + + + + + + CpG Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

CpG Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/dust.html b/dust.html new file mode 100644 index 0000000..2706af4 --- /dev/null +++ b/dust.html @@ -0,0 +1,95 @@ + + + + + + + + DustMasker Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

DustMasker Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/eponine.html b/eponine.html new file mode 100644 index 0000000..50e28a5 --- /dev/null +++ b/eponine.html @@ -0,0 +1,95 @@ + + + + + + + + Eponine Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

Eponine Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/genblast.html b/genblast.html new file mode 100644 index 0000000..0615f59 --- /dev/null +++ b/genblast.html @@ -0,0 +1,95 @@ + + + + + + + + Genblast Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

Genblast Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/genindex.html b/genindex.html new file mode 100644 index 0000000..9a05235 --- /dev/null +++ b/genindex.html @@ -0,0 +1,94 @@ + + + + + + + Index — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ + +

Index

+ +
+ +
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/index.html b/index.html new file mode 100644 index 0000000..aee7143 --- /dev/null +++ b/index.html @@ -0,0 +1,122 @@ + + + + + + + + Contents — ensembl-anno 0.1 documentation + + + + + + + + + + + + +
+
+
+ +
+
+
+ +

Anno tool kit

+
+

Contents

+

Check out installation section for further information on how +to install the project.

+ +
+

Indices and tables

+ +
+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/install.html b/install.html new file mode 100644 index 0000000..7bad679 --- /dev/null +++ b/install.html @@ -0,0 +1,143 @@ + + + + + + + + API Setup and installation — ensembl-anno 0.1 documentation + + + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

API Setup and installation

+
+

Requirements

+

An Ensembl API checkout including:

+ +
+

Software

+
    +
  1. Python 3.8+

  2. +
  3. Bioperl 1.6.9+

  4. +
+
+
+

Python Modules

+
    +
  1. argschema

  2. +
+
+
+
+

Installation

+

Directly from GitHub:

+
1git clone https://github.com/Ensembl/ensembl-analysis -b experimental/gbiab
+2git clone https://github.com/Ensembl/ensembl-production
+3git clone https://github.com/Ensembl/ensembl-hive
+4git clone https://github.com/Ensembl/ensembl-taxonomy
+5git clone https://github.com/Ensembl/ensembl-orm
+
+
+
+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/license.html b/license.html new file mode 100644 index 0000000..c4696e1 --- /dev/null +++ b/license.html @@ -0,0 +1,280 @@ + + + + + + + + License — ensembl-anno 0.1 documentation + + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

License

+
+

Apache License +Version 2.0, January 2004 +http://www.apache.org/licenses/

+
    +
  1. Definitions.

    +

    “License” shall mean the terms and conditions for use, reproduction, +and distribution as defined by Sections 1 through 9 of this document.

    +

    “Licensor” shall mean the copyright owner or entity authorized by +the copyright owner that is granting the License.

    +

    “Legal Entity” shall mean the union of the acting entity and all +other entities that control, are controlled by, or are under common +control with that entity. For the purposes of this definition, +“control” means (i) the power, direct or indirect, to cause the +direction or management of such entity, whether by contract or +otherwise, or (ii) ownership of fifty percent (50%) or more of the +outstanding shares, or (iii) beneficial ownership of such entity.

    +

    “You” (or “Your”) shall mean an individual or Legal Entity +exercising permissions granted by this License.

    +

    “Source” form shall mean the preferred form for making modifications, +including but not limited to software source code, documentation +source, and configuration files.

    +

    “Object” form shall mean any form resulting from mechanical +transformation or translation of a Source form, including but +not limited to compiled object code, generated documentation, +and conversions to other media types.

    +

    “Work” shall mean the work of authorship, whether in Source or +Object form, made available under the License, as indicated by a +copyright notice that is included in or attached to the work +(an example is provided in the Appendix below).

    +

    “Derivative Works” shall mean any work, whether in Source or Object +form, that is based on (or derived from) the Work and for which the +editorial revisions, annotations, elaborations, or other modifications +represent, as a whole, an original work of authorship. For the purposes +of this License, Derivative Works shall not include works that remain +separable from, or merely link (or bind by name) to the interfaces of, +the Work and Derivative Works thereof.

    +

    “Contribution” shall mean any work of authorship, including +the original version of the Work and any modifications or additions +to that Work or Derivative Works thereof, that is intentionally +submitted to Licensor for inclusion in the Work by the copyright owner +or by an individual or Legal Entity authorized to submit on behalf of +the copyright owner. For the purposes of this definition, “submitted” +means any form of electronic, verbal, or written communication sent +to the Licensor or its representatives, including but not limited to +communication on electronic mailing lists, source code control systems, +and issue tracking systems that are managed by, or on behalf of, the +Licensor for the purpose of discussing and improving the Work, but +excluding communication that is conspicuously marked or otherwise +designated in writing by the copyright owner as “Not a Contribution.”

    +

    “Contributor” shall mean Licensor and any individual or Legal Entity +on behalf of whom a Contribution has been received by Licensor and +subsequently incorporated within the Work.

    +
  2. +
  3. Grant of Copyright License. Subject to the terms and conditions of +this License, each Contributor hereby grants to You a perpetual, +worldwide, non-exclusive, no-charge, royalty-free, irrevocable +copyright license to reproduce, prepare Derivative Works of, +publicly display, publicly perform, sublicense, and distribute the +Work and such Derivative Works in Source or Object form.

  4. +
  5. Grant of Patent License. Subject to the terms and conditions of +this License, each Contributor hereby grants to You a perpetual, +worldwide, non-exclusive, no-charge, royalty-free, irrevocable +(except as stated in this section) patent license to make, have made, +use, offer to sell, sell, import, and otherwise transfer the Work, +where such license applies only to those patent claims licensable +by such Contributor that are necessarily infringed by their +Contribution(s) alone or by combination of their Contribution(s) +with the Work to which such Contribution(s) was submitted. If You +institute patent litigation against any entity (including a +cross-claim or counterclaim in a lawsuit) alleging that the Work +or a Contribution incorporated within the Work constitutes direct +or contributory patent infringement, then any patent licenses +granted to You under this License for that Work shall terminate +as of the date such litigation is filed.

  6. +
  7. Redistribution. You may reproduce and distribute copies of the +Work or Derivative Works thereof in any medium, with or without +modifications, and in Source or Object form, provided that You +meet the following conditions:

    +
      +
    1. You must give any other recipients of the Work or +Derivative Works a copy of this License; and

    2. +
    3. You must cause any modified files to carry prominent notices +stating that You changed the files; and

    4. +
    5. You must retain, in the Source form of any Derivative Works +that You distribute, all copyright, patent, trademark, and +attribution notices from the Source form of the Work, +excluding those notices that do not pertain to any part of +the Derivative Works; and

    6. +
    7. If the Work includes a “NOTICE” text file as part of its +distribution, then any Derivative Works that You distribute must +include a readable copy of the attribution notices contained +within such NOTICE file, excluding those notices that do not +pertain to any part of the Derivative Works, in at least one +of the following places: within a NOTICE text file distributed +as part of the Derivative Works; within the Source form or +documentation, if provided along with the Derivative Works; or, +within a display generated by the Derivative Works, if and +wherever such third-party notices normally appear. The contents +of the NOTICE file are for informational purposes only and +do not modify the License. You may add Your own attribution +notices within Derivative Works that You distribute, alongside +or as an addendum to the NOTICE text from the Work, provided +that such additional attribution notices cannot be construed +as modifying the License.

    8. +
    +

    You may add Your own copyright statement to Your modifications and +may provide additional or different license terms and conditions +for use, reproduction, or distribution of Your modifications, or +for any such Derivative Works as a whole, provided Your use, +reproduction, and distribution of the Work otherwise complies with +the conditions stated in this License.

    +
  8. +
  9. Submission of Contributions. Unless You explicitly state otherwise, +any Contribution intentionally submitted for inclusion in the Work +by You to the Licensor shall be under the terms and conditions of +this License, without any additional terms or conditions. +Notwithstanding the above, nothing herein shall supersede or modify +the terms of any separate license agreement you may have executed +with Licensor regarding such Contributions.

  10. +
  11. Trademarks. This License does not grant permission to use the trade +names, trademarks, service marks, or product names of the Licensor, +except as required for reasonable and customary use in describing the +origin of the Work and reproducing the content of the NOTICE file.

  12. +
  13. Disclaimer of Warranty. Unless required by applicable law or +agreed to in writing, Licensor provides the Work (and each +Contributor provides its Contributions) on an “AS IS” BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +implied, including, without limitation, any warranties or conditions +of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A +PARTICULAR PURPOSE. You are solely responsible for determining the +appropriateness of using or redistributing the Work and assume any +risks associated with Your exercise of permissions under this License.

  14. +
  15. Limitation of Liability. In no event and under no legal theory, +whether in tort (including negligence), contract, or otherwise, +unless required by applicable law (such as deliberate and grossly +negligent acts) or agreed to in writing, shall any Contributor be +liable to You for damages, including any direct, indirect, special, +incidental, or consequential damages of any character arising as a +result of this License or out of the use or inability to use the +Work (including but not limited to damages for loss of goodwill, +work stoppage, computer failure or malfunction, or any and all +other commercial damages or losses), even if such Contributor +has been advised of the possibility of such damages.

  16. +
  17. Accepting Warranty or Additional Liability. While redistributing +the Work or Derivative Works thereof, You may choose to offer, +and charge a fee for, acceptance of support, warranty, indemnity, +or other liability obligations and/or rights consistent with this +License. However, in accepting such obligations, You may act only +on Your own behalf and on Your sole responsibility, not on behalf +of any other Contributor, and only if You agree to indemnify, +defend, and hold each Contributor harmless for any liability +incurred by, or claims asserted against, such Contributor by reason +of your accepting any such warranty or additional liability.

  18. +
+

END OF TERMS AND CONDITIONS

+

APPENDIX: How to apply the Apache License to your work.

+
+

To apply the Apache License to your work, attach the following +boilerplate notice, with the fields enclosed by brackets “{}” +replaced with your own identifying information. (Don’t include +the brackets!) The text should be enclosed in the appropriate +comment syntax for the file format. We also recommend that a +file or class name and description of purpose be included on the +same “printed page” as the copyright notice for easier +identification within third-party archives.

+
+

Copyright [yyyy] [name of copyright owner]

+

Licensed under the Apache License, Version 2.0 (the “License”); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at

+
+
+

Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an “AS IS” BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License.

+
+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/minimap.html b/minimap.html new file mode 100644 index 0000000..9d55a8c --- /dev/null +++ b/minimap.html @@ -0,0 +1,95 @@ + + + + + + + + Minimap2 Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

Minimap2 Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/objects.inv b/objects.inv new file mode 100644 index 0000000000000000000000000000000000000000..f7bc3af3fcaea92e2ec24f8ad56321559a8c9dbe GIT binary patch literal 462 zcmV;<0Wtm~AX9K?X>NERX>N99Zgg*Qc_4OWa&u{KZXhxWBOp+6Z)#;@bUGkqZgXXA zVr(s8Zf%ZEX>4U6 zX>%ZBZ*6dLWpi_7WFU2OX>MmAdTeQ8E(&gUfE#umAfkD^b1`1L=3|l&D{Y^6kr+IxCibBX&-Y7R1V_ zu>&MY#$lz$fl^|s8CiwXP7XiNmr3vr4MGY>iTQQx7vUE0WMzK!tTDcs9glc}8h)?5 zl_#(<;i_`Nb~;vfTf8Q5EFDsa9D->eX>D%1N^D&0x8eXadLdEIEuJJrZ-b=p)3c~6 zYZTy+Eh|cV!6z40XV7%gr@kn$Z^y-3c`KdMg{}BYJvU+qv%H_A`wzCi(Ai;5_n^~R zL&@GI=*1Cx@F1z<|0*Nz`W%rsi&=vTJ9gQ!qQnV@*e}B%dv(sA%vyxGzn3jk;bUgQ zPIYu07tMow>J7GJAP1uu>6@n*LH&0Mhmx^l^YI8k88(19#Tuj3d@ZJ`KCH_Te}CJB EkyJC&SpWb4 literal 0 HcmV?d00001 diff --git a/py-modindex.html b/py-modindex.html new file mode 100644 index 0000000..c7e6859 --- /dev/null +++ b/py-modindex.html @@ -0,0 +1,185 @@ + + + + + + + Python Module Index — ensembl-anno 0.1 documentation + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/red.html b/red.html new file mode 100644 index 0000000..bf16623 --- /dev/null +++ b/red.html @@ -0,0 +1,95 @@ + + + + + + + + Red Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

Red Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/repeatmasker.html b/repeatmasker.html new file mode 100644 index 0000000..739b31b --- /dev/null +++ b/repeatmasker.html @@ -0,0 +1,95 @@ + + + + + + + + Repeatmasker Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

Repeatmasker Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/scallop.html b/scallop.html new file mode 100644 index 0000000..97726f6 --- /dev/null +++ b/scallop.html @@ -0,0 +1,95 @@ + + + + + + + + Scallop Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

Scallop Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/search.html b/search.html new file mode 100644 index 0000000..8ded71c --- /dev/null +++ b/search.html @@ -0,0 +1,123 @@ + + + + + + + Search — ensembl-anno 0.1 documentation + + + + + + + + + + + + + + + + + +
+
+
+ +
+
+
+ +

Search

+ + + + +

+ Searching for multiple words only shows matches that contain + all words. +

+ + +
+ + + +
+ + + +
+ +
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/searchindex.js b/searchindex.js new file mode 100644 index 0000000..c36b8e9 --- /dev/null +++ b/searchindex.js @@ -0,0 +1 @@ +Search.setIndex({"docnames": ["cpg", "dust", "eponine", "genblast", "index", "install", "license", "minimap", "red", "repeatmasker", "scallop", "star", "stringtie", "trf", "trnascan"], "filenames": ["cpg.rst", "dust.rst", "eponine.rst", "genblast.rst", "index.rst", "install.rst", "license.rst", "minimap.rst", "red.rst", "repeatmasker.rst", "scallop.rst", "star.rst", "stringtie.rst", "trf.rst", "trnascan.rst"], "titles": ["CpG Module Documentation", "DustMasker Module Documentation", "Eponine Module Documentation", "Genblast Module Documentation", "Contents", "API Setup and installation", "License", "Minimap2 Module Documentation", "Red Module Documentation", "Repeatmasker Module Documentation", "Scallop Module Documentation", "STAR Module Documentation", "Stringtie Module Documentation", "TRF Module Documentation", "tRNAscan-SE Module Documentation"], "terms": {"index": [], "modul": 4, "search": 4, "page": [4, 6], "anno": 4, "tool": 4, "kit": 4, "check": 4, "out": [4, 6], "instal": 4, "section": [4, 6], "further": 4, "inform": [4, 6], "how": [4, 6], "project": 4, "api": 4, "setup": 4, "licens": 4, "an": [5, 6], "ensembl": 5, "checkout": 5, "includ": [5, 6], "product": [5, 6], "analysi": 5, "dev": 5, "hive_mast": 5, "branch": 5, "taxonomi": 5, "orm": 5, "3": 5, "8": 5, "bioperl": 5, "1": [5, 6], "6": 5, "9": [5, 6], "argschema": 5, "directli": 5, "from": [5, 6], "github": 5, "git": 5, "clone": 5, "http": [5, 6], "com": 5, "b": 5, "experiment": 5, "gbiab": 5, "hive": 5, "apach": 6, "version": 6, "2": 6, "0": 6, "januari": 6, "2004": 6, "www": 6, "org": 6, "definit": 6, "shall": 6, "mean": 6, "term": 6, "condit": 6, "us": 6, "reproduct": 6, "distribut": 6, "defin": 6, "through": 6, "thi": 6, "document": 6, "licensor": 6, "copyright": 6, "owner": 6, "entiti": 6, "author": 6, "i": 6, "grant": 6, "legal": 6, "union": 6, "act": 6, "all": 6, "other": 6, "control": 6, "ar": 6, "under": 6, "common": 6, "For": 6, "purpos": 6, "power": 6, "direct": 6, "indirect": 6, "caus": 6, "manag": 6, "whether": 6, "contract": 6, "otherwis": 6, "ii": 6, "ownership": 6, "fifti": 6, "percent": 6, "50": 6, "more": 6, "outstand": 6, "share": 6, "iii": 6, "benefici": 6, "you": 6, "your": 6, "individu": 6, "exercis": 6, "permiss": 6, "sourc": 6, "form": 6, "prefer": 6, "make": 6, "modif": 6, "limit": 6, "softwar": 6, "code": 6, "configur": 6, "file": 6, "object": 6, "ani": 6, "result": 6, "mechan": 6, "transform": 6, "translat": 6, "compil": 6, "gener": 6, "convers": 6, "media": 6, "type": 6, "work": 6, "authorship": 6, "made": 6, "avail": 6, "indic": 6, "notic": 6, "attach": 6, "exampl": 6, "provid": 6, "appendix": 6, "below": 6, "deriv": 6, "base": 6, "which": 6, "editori": 6, "revis": 6, "annot": 6, "elabor": 6, "repres": 6, "whole": 6, "origin": 6, "remain": 6, "separ": 6, "mere": 6, "link": 6, "bind": 6, "name": 6, "interfac": 6, "thereof": 6, "contribut": 6, "addit": 6, "intention": 6, "submit": 6, "inclus": 6, "behalf": 6, "electron": 6, "verbal": 6, "written": 6, "commun": 6, "sent": 6, "its": 6, "mail": 6, "list": 6, "system": 6, "issu": 6, "track": 6, "discuss": 6, "improv": 6, "exclud": 6, "conspicu": 6, "mark": 6, "design": 6, "write": 6, "Not": 6, "contributor": 6, "whom": 6, "ha": 6, "been": 6, "receiv": 6, "subsequ": 6, "incorpor": 6, "within": 6, "subject": 6, "each": 6, "herebi": 6, "perpetu": 6, "worldwid": 6, "non": 6, "exclus": 6, "charg": 6, "royalti": 6, "free": 6, "irrevoc": 6, "reproduc": 6, "prepar": 6, "publicli": 6, "displai": 6, "perform": 6, "sublicens": 6, "patent": 6, "except": 6, "state": 6, "have": 6, "offer": 6, "sell": 6, "import": 6, "transfer": 6, "where": 6, "appli": 6, "onli": 6, "those": 6, "claim": 6, "necessarili": 6, "infring": 6, "": 6, "alon": 6, "combin": 6, "wa": 6, "If": 6, "institut": 6, "litig": 6, "against": 6, "cross": 6, "counterclaim": 6, "lawsuit": 6, "alleg": 6, "constitut": 6, "contributori": 6, "termin": 6, "date": 6, "redistribut": 6, "mai": 6, "copi": 6, "medium": 6, "without": 6, "meet": 6, "follow": 6, "must": 6, "give": 6, "recipi": 6, "modifi": 6, "carri": 6, "promin": 6, "chang": 6, "retain": 6, "trademark": 6, "attribut": 6, "do": 6, "pertain": 6, "part": 6, "text": 6, "readabl": 6, "contain": 6, "least": 6, "one": 6, "place": 6, "along": 6, "wherev": 6, "third": 6, "parti": 6, "normal": 6, "appear": 6, "The": 6, "content": 6, "add": 6, "own": 6, "alongsid": 6, "addendum": 6, "cannot": 6, "constru": 6, "statement": 6, "differ": 6, "compli": 6, "submiss": 6, "unless": 6, "explicitli": 6, "notwithstand": 6, "abov": 6, "noth": 6, "herein": 6, "supersed": 6, "agreement": 6, "execut": 6, "regard": 6, "doe": 6, "trade": 6, "servic": 6, "requir": [4, 6], "reason": 6, "customari": 6, "describ": 6, "disclaim": 6, "warranti": 6, "applic": 6, "law": 6, "agre": 6, "AS": 6, "basi": 6, "OR": 6, "OF": 6, "kind": 6, "either": 6, "express": 6, "impli": 6, "titl": 6, "merchant": 6, "fit": 6, "FOR": 6, "A": 6, "particular": 6, "sole": 6, "respons": 6, "determin": 6, "appropri": 6, "assum": 6, "risk": 6, "associ": 6, "liabil": 6, "In": 6, "event": 6, "theori": 6, "tort": 6, "neglig": 6, "deliber": 6, "grossli": 6, "liabl": 6, "damag": 6, "special": 6, "incident": 6, "consequenti": 6, "charact": 6, "aris": 6, "inabl": 6, "loss": 6, "goodwil": 6, "stoppag": 6, "comput": 6, "failur": 6, "malfunct": 6, "commerci": 6, "even": 6, "advis": 6, "possibl": 6, "accept": 6, "while": 6, "choos": 6, "fee": 6, "support": 6, "indemn": 6, "oblig": 6, "right": 6, "consist": 6, "howev": 6, "indemnifi": 6, "defend": 6, "hold": 6, "harmless": 6, "incur": 6, "assert": 6, "end": 6, "AND": 6, "To": 6, "boilerpl": 6, "field": 6, "enclos": 6, "bracket": 6, "replac": 6, "identifi": 6, "don": 6, "t": 6, "should": 6, "comment": 6, "syntax": 6, "format": 6, "we": 6, "also": 6, "recommend": 6, "class": 6, "descript": 6, "same": 6, "print": 6, "easier": 6, "identif": 6, "archiv": 6, "yyyi": 6, "complianc": 6, "obtain": 6, "see": 6, "specif": 6, "languag": 6, "govern": 6, "function": [], "run": [], "assembl": [], "short": [], "read": [], "data": [], "pertea": [], "m": [], "gm": [], "antonescu": [], "cm": [], "tc": [], "mendel": [], "jt": [], "salzberg": [], "sl": [], "enabl": [], "reconstruct": [], "transcriptom": [], "rna": [], "seq": [], "natur": [], "biotechnologi": [], "2015": [], "doi": [], "10": [], "1038": [], "nbt": [], "3122": [], "stringti": [], "python": [], "run_stringti": [], "fast": [], "highli": [], "effici": [], "align": [], "potenti": [], "transcript": [], "It": [], "novel": [], "network": [], "flow": [], "algorithm": [], "well": [], "option": [], "de": [], "novo": [], "assembli": [], "step": [], "quantit": [], "full": [], "length": [], "multipl": [], "splice": [], "variant": [], "gene": [], "locu": [], "transcriptomic_annot": [], "output_dir": [], "path": [], "stringtie_bin": [], "posixpath": [], "num_thread": [], "int": [], "none": [], "param": [], "directori": [], "number": [], "thread": [], "No": [], "inputschema": [], "strsequenceorset": [], "mani": [], "bool": [], "fals": [], "context": [], "dict": [], "load_onli": [], "dump_onli": [], "partial": [], "unknown": [], "str": [], "input": [], "argument": [], "expect": [], "set": [], "discrimin": [], "can": [], "recogn": [], "structur": [], "composit": [], "featur": [], "island": [], "promot": [], "region": [], "first": [], "donor": [], "site": [], "davuluri": [], "rv": [], "gross": [], "zhang": [], "mq": [], "exon": [], "human": [], "genom": [], "nat": [], "genet": [], "2001": [], "29": [], "4": [], "412": [], "417": [], "pmid": [], "11726928": [], "simple_feature_annot": [], "run_cpg": [], "genome_fil": [], "pathlik": [], "cpg_bin": [], "cpg_lh": [], "cpg_min_length": [], "400": [], "cpg_min_gc_cont": [], "cpg_min_o": [], "float": [], "slice": [], "min": [], "gc": [], "frequenc": [], "percentag": [], "ratio": [], "observ": [], "cpgo": [], "e": [], "program": [], "mask": [], "low": [], "complex": [], "new": [], "dust": [], "morguli": [], "gertz": [], "em": [], "schaffer": [], "aa": [], "agarwala": [], "r": [], "symmetr": [], "implement": [], "dna": [], "sequenc": [], "repeat_annot": [], "run_dust": [], "dust_bin": [], "mutiprocess": [], "probabilist": [], "method": [], "detect": [], "start": [], "tss": [], "mammalian": [], "good": [], "excel": [], "posit": [], "accuraci": [], "down": [], "ta": [], "hubbard": [], "tj": [], "locat": [], "re": [], "2002": [], "mar": [], "12": [], "458": [], "61": [], "1101": [], "gr": [], "216102": [], "11875034": [], "pmcid": [], "pmc155284": [], "run_eponin": [], "java_bin": [], "java": [], "eponine_bin": [], "hp": [], "user": [], "ensw": [], "c8": [], "mar21": [], "sandybridg": [], "linuxbrew": [], "opt": [], "libexec": [], "scan": [], "jar": [], "eponine_threshold": [], "999": [], "homolog": [], "databas": [], "One": [], "kei": [], "flexibl": [], "handl": [], "compar": [], "task": [], "accur": [], "when": [], "undergon": [], "signific": [], "evolutionari": [], "capabl": [], "valuabl": [], "resourc": [], "research": [], "studi": [], "evolut": [], "famili": [], "across": [], "divers": [], "speci": [], "wide": [], "variou": [], "analys": [], "standalon": [], "command": [], "line": [], "bioinformat": [], "pipelin": [], "often": [], "reli": [], "sensit": [], "homologi": [], "insight": [], "relationship": [], "conserv": [], "organ": [], "she": [], "chu": [], "j": [], "uyar": [], "wang": [], "k": [], "chen": [], "n": [], "2011": [], "genblasta": [], "blast": [], "21": [], "5": [], "936": [], "949": [], "protein_annot": [], "run_genblast": [], "masked_genom": [], "protein_dataset": [], "max_intron_length": [], "genblast_timeout_sec": [], "10800": [], "genblast_bin": [], "convert2blastmask_bin": [], "convert2blastmask": [], "makeblastdb_bin": [], "makeblastdb": [], "protein_set": [], "uniprot": [], "orthodb": [], "protein": [], "dataset": [], "time": [], "timeout": [], "sec": [], "maximum": [], "intron": [], "genblast_timeout": [], "second": [], "cmsearch": [], "eponin": [], "genblast": [], "minimap2": [], "run_minimap2": [], "red": [], "run_r": [], "repeatmask": [], "run_repeatmask": [], "scallop": [], "run_scallop": [], "star": [], "run_star": [], "subsample_transcriptomic_data": [], "trf": [], "run_trf": [], "trnascan": [], "se": [], "run_trnascan": [], "pairwis": [], "nucleotid": [], "versatil": [], "strategi": [], "quickli": [], "find": [], "approxim": [], "match": [], "between": [], "allow": [], "long": [], "refer": [], "li": [], "h": [], "2018": [], "34": [], "18": [], "3094": [], "3100": [], "minimap": [], "long_read_fastq_dir": [], "minimap2_bin": [], "paftools_bin": [], "paftool": [], "100000": [], "default": [], "pacbio": [], "size": [], "repeat": [], "label": [], "train": [], "itself": [], "automat": [], "entir": [], "girgi": [], "z": [], "intellig": [], "rapid": [], "scale": [], "bmc": [], "16": [], "227": [], "1186": [], "s12859": [], "015": [], "0654": [], "red_bin": [], "paramet": [], "return": [], "screen": [], "interspers": [], "smit": [], "afa": [], "hublei": [], "green": [], "p": [], "open": [], "repeatmasker_bin": [], "librari": [], "repeatmasker_engin": [], "rmblast": [], "store": [], "final": [], "gtf": [], "repeatmasker_output": [], "repeatmasker_path": [], "custom": [], "output": [], "high": [], "quantif": [], "larg": [], "precis": [], "estim": [], "abund": [], "approach": [], "quantifi": [], "level": [], "shao": [], "kingsford": [], "c": [], "phase": [], "preserv": [], "graph": [], "decomposit": [], "biotechnol": [], "2017": [], "dec": [], "35": [], "1167": [], "1169": [], "4020": [], "epub": [], "nov": [], "13": [], "29131147": [], "pmc5722698": [], "scallop_path": [], "stringtie_path": [], "main_output_dir": [], "dobin": [], "davi": [], "ca": [], "schlesing": [], "f": [], "et": [], "al": [], "ultrafast": [], "univers": [], "2013": [], "15": [], "1093": [], "bts635": [], "short_read_fastq_dir": [], "delete_pre_trim_fastq": [], "trim_fastq": [], "max_reads_per_sampl": [], "star_bin": [], "samtools_bin": [], "samtool": [], "trim_galore_bin": [], "trim_galor": [], "delet": [], "fastq": [], "after": [], "trim": [], "trimgalor": [], "max": [], "per": [], "sampl": [], "unlimit": [], "fastq_file_list": [], "subsampl": [], "pair": [], "process": [], "tandem": [], "finder": [], "benson": [], "g": [], "analyz": [], "nucleic": [], "acid": [], "1999": [], "27": [], "573": [], "580": [], "nar": [], "trf_bin": [], "match_scor": [], "mismatch_scor": [], "delta": [], "7": [], "pm": [], "80": [], "pi": [], "minscor": [], "40": [], "maxperiod": [], "500": [], "weight": [], "mismatch": [], "penalti": [], "indel": [], "probabl": [], "minimum": [], "score": [], "report": [], "period": [], "99": [], "100": [], "less": [], "than": [], "gigabas": [], "tm": [], "eddi": [], "sr": [], "1997": [], "25": [], "955": [], "64": [], "9023104": [], "snc_rna_annot": [], "trnascan_bin": [], "trnascan_filt": [], "eukhighconfidencefilt": [], "filter": [], "cpg": [], "dustmask": [], "scallop_bin": [], "prlimit_bin": [], "prlimit": [], "memory_limit": [], "42949672960": [], "memori": [], "1024": []}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"welcom": [], "ensembl": [], "anno": [], "": [], "document": [0, 1, 2, 3, 7, 8, 9, 10, 11, 12, 13, 14], "indic": 4, "tabl": 4, "content": 4, "index": 4, "api": 5, "setup": 5, "instal": 5, "requir": 5, "softwar": 5, "python": 5, "modul": [0, 1, 2, 3, 5, 7, 8, 9, 10, 11, 12, 13, 14], "licens": 6, "stringti": 12, "cmsearch": [], "cpg": 0, "dustmask": 1, "eponin": 2, "genblast": 3, "minimap2": 7, "red": 8, "repeatmask": 9, "scallop": 10, "star": 11, "trf": 13, "trnascan": 14, "se": 14}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1, "sphinx": 60}, "alltitles": {"CpG Module Documentation": [[0, "cpg-module-documentation"]], "DustMasker Module Documentation": [[1, "dustmasker-module-documentation"]], "Eponine Module Documentation": [[2, "eponine-module-documentation"]], "Genblast Module Documentation": [[3, "genblast-module-documentation"]], "Contents": [[4, "contents"]], "Index": [[4, null]], "Indices and tables": [[4, "indices-and-tables"]], "API Setup and installation": [[5, "api-setup-and-installation"]], "Requirements": [[5, "requirements"]], "Software": [[5, "software"]], "Python Modules": [[5, "python-modules"]], "Installation": [[5, "installation"]], "License": [[6, "license"]], "Minimap2 Module Documentation": [[7, "minimap2-module-documentation"]], "Red Module Documentation": [[8, "red-module-documentation"]], "Repeatmasker Module Documentation": [[9, "repeatmasker-module-documentation"]], "Scallop Module Documentation": [[10, "scallop-module-documentation"]], "STAR Module Documentation": [[11, "star-module-documentation"]], "Stringtie Module Documentation": [[12, "stringtie-module-documentation"]], "TRF Module Documentation": [[13, "trf-module-documentation"]], "tRNAscan-SE Module Documentation": [[14, "trnascan-se-module-documentation"]]}, "indexentries": {}}) \ No newline at end of file diff --git a/star.html b/star.html new file mode 100644 index 0000000..ec03331 --- /dev/null +++ b/star.html @@ -0,0 +1,95 @@ + + + + + + + + STAR Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

STAR Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/stringtie.html b/stringtie.html new file mode 100644 index 0000000..d8bf948 --- /dev/null +++ b/stringtie.html @@ -0,0 +1,95 @@ + + + + + + + + Stringtie Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

Stringtie Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/trf.html b/trf.html new file mode 100644 index 0000000..9636f16 --- /dev/null +++ b/trf.html @@ -0,0 +1,95 @@ + + + + + + + + TRF Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

TRF Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file diff --git a/trnascan.html b/trnascan.html new file mode 100644 index 0000000..5137cb5 --- /dev/null +++ b/trnascan.html @@ -0,0 +1,95 @@ + + + + + + + + tRNAscan-SE Module Documentation — ensembl-anno 0.1 documentation + + + + + + + + + + + +
+
+
+ +
+
+
+ +
+

tRNAscan-SE Module Documentation

+
+ + +
+
+
+
+
+ +
+
+
+ + + + + \ No newline at end of file