From 705996494fdccb73129a8e8fecf9036a90123b3d Mon Sep 17 00:00:00 2001 From: Zilong-Li Date: Tue, 7 May 2024 17:51:41 +0200 Subject: [PATCH] update readme --- README.Rmd | 9 +++--- README.md | 30 +++--------------- docs/index.html | 2 +- docs/pkgdown.yml | 2 +- .../reference/figures/README-summary_sm-1.png | Bin 14601 -> 14689 bytes docs/search.json | 2 +- 6 files changed, 12 insertions(+), 33 deletions(-) diff --git a/README.Rmd b/README.Rmd index bca4583..40f2f40 100644 --- a/README.Rmd +++ b/README.Rmd @@ -43,7 +43,7 @@ remotes::install_github("Zilong-Li/vcfppR") ## from latest github If you find it useful, please cite the [paper](https://doi.org/10.1093/bioinformatics/btae049) -``` {r cite} +```r library(vcfppR) citation("vcfppR") ``` @@ -64,6 +64,7 @@ popfile <- "https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_25 Want to investigate the concordance between two VCF files? `vcfcomp` is the utility function you need! For example, in benchmarkings, we intend to calculate the genotype correlation between the test and the truth. ```{r r2} +library(vcfppR) res <- vcfcomp(test = rawvcf, truth = phasedvcf, region = "chr21:1-5100000", stats = "r2", formats = c("GT","GT")) @@ -95,21 +96,21 @@ vcfplot(res, main = "Structure Variant Counts", col = 1:7) `vcftable` gives you fine control over what you want to extract from VCF/BCF files. -**Read SNP variants** +**Read SNP variants with GT format** ```{r snp} res <- vcftable(phasedvcf, "chr21:1-5100000", vartype = "snps") str(res) ``` -**Read SNP variants with PL format and drop the INFO column in the VCF/BCF** +**Read SNP variants with PL format and drop the INFO column** ```{r pl} res <- vcftable(rawvcf, "chr21:1-5100000", vartype = "snps", format = "PL", info = FALSE) str(res) ``` -**Read INDEL variants with DP format in the VCF/BCF** +**Read INDEL variants with DP format** ```{r indel} res <- vcftable(rawvcf, "chr21:1-5100000", vartype = "indels", format = "DP") diff --git a/README.md b/README.md index d74dd70..72368fd 100644 --- a/README.md +++ b/README.md @@ -41,28 +41,6 @@ If you find it useful, please cite the ``` r library(vcfppR) citation("vcfppR") -#> To cite package 'vcfppR' in publications use: -#> -#> Li Z (2024). "vcfpp: a C++ API for rapid processing of the variant -#> call format." _Bioinformatics_, *40*(2), btae049. ISSN 1367-4811, -#> doi:10.1093/bioinformatics/btae049 -#> . -#> -#> A BibTeX entry for LaTeX users is -#> -#> @Article{, -#> title = {vcfpp: a C++ API for rapid processing of the variant call format}, -#> author = {Zilong Li}, -#> journal = {Bioinformatics}, -#> volume = {40}, -#> number = {2}, -#> pages = {btae049}, -#> year = {2024}, -#> month = {01}, -#> issn = {1367-4811}, -#> abstract = {Given the widespread use of the variant call format (VCF/BCF) coupled with continuous surge in big data, there remains a perpetual demand for fast and flexible methods to manipulate these comprehensive formats across various programming languages.This work presents vcfpp, a C++ API of HTSlib in a single file, providing an intuitive interface to manipulate VCF/BCF files rapidly and safely, in addition to being portable. Moreover, this work introduces the vcfppR package to demonstrate the development of a high-performance R package with vcfpp, allowing for rapid and straightforward variants analyses.vcfpp is available from https://github.com/Zilong-Li/vcfpp under MIT license. vcfppR is available from https://cran.r-project.org/web/packages/vcfppR.}, -#> doi = {10.1093/bioinformatics/btae049}, -#> } ``` ## URL as filename @@ -83,6 +61,7 @@ the utility function you need\! For example, in benchmarkings, we intend to calculate the genotype correlation between the test and the truth. ``` r +library(vcfppR) res <- vcfcomp(test = rawvcf, truth = phasedvcf, region = "chr21:1-5100000", stats = "r2", formats = c("GT","GT")) @@ -126,7 +105,7 @@ vcfplot(res, main = "Structure Variant Counts", col = 1:7) `vcftable` gives you fine control over what you want to extract from VCF/BCF files. -**Read SNP variants** +**Read SNP variants with GT format** ``` r res <- vcftable(phasedvcf, "chr21:1-5100000", vartype = "snps") @@ -145,8 +124,7 @@ str(res) #> - attr(*, "class")= chr "vcftable" ``` -**Read SNP variants with PL format and drop the INFO column in the -VCF/BCF** +**Read SNP variants with PL format and drop the INFO column** ``` r res <- vcftable(rawvcf, "chr21:1-5100000", vartype = "snps", format = "PL", info = FALSE) @@ -165,7 +143,7 @@ str(res) #> - attr(*, "class")= chr "vcftable" ``` -**Read INDEL variants with DP format in the VCF/BCF** +**Read INDEL variants with DP format** ``` r res <- vcftable(rawvcf, "chr21:1-5100000", vartype = "indels", format = "DP") diff --git a/docs/index.html b/docs/index.html index 6d3edab..736cb44 100644 --- a/docs/index.html +++ b/docs/index.html @@ -150,7 +150,7 @@

Small variants

 res <- vcfsummary(rawvcf,"chr21:10000000-10010000")
-vcfplot(res, pop = popfile, col = 1:5, main = "Mean number of SNP & INDEL variants")
+vcfplot(res, pop = popfile, col = 1:5, main = "Number of SNP & INDEL variants per population")
 #> input is an object with vcfsummary class

Complex structure variants

diff --git a/docs/pkgdown.yml b/docs/pkgdown.yml index 2e2ba1f..a6e4471 100644 --- a/docs/pkgdown.yml +++ b/docs/pkgdown.yml @@ -3,5 +3,5 @@ pkgdown: 2.0.9 pkgdown_sha: ~ articles: concordance-of-two-vcf-files: concordance-of-two-vcf-files.html -last_built: 2024-05-07T13:49Z +last_built: 2024-05-07T15:08Z diff --git a/docs/reference/figures/README-summary_sm-1.png b/docs/reference/figures/README-summary_sm-1.png index 78a2ad1520375fb58c18d02b0c991090f73be4e1..38efda364660dc3ff33acb9a25526d73cf12b231 100644 GIT binary patch literal 14689 zcmd6Oc{r7O+xC*ZBQjJpDYk4;il``Il_41-$s9^F7&B!aDl!$jQZk3iOcF9{kTT1Z zAw>JFoLPuXFjGQITh2*v>#8 z5SSEB$(|(;);uK;Xu9av;2p~7sZ020-StyCwgdw6d+L8QWmXBs1j26w1=$nl93w`) zIk_s&ESHUwKgn)X_~iAwubbajhv)ZNyA8swK6;~Np`VcKoS5gVG?Sz&sHkW0JSl0> z)XcnYA}%9G(En@_e++%tAHKi&{oX%Q=F~pdtCAghN#shkgFy{({!~qbZQnus(NR4S zD!j*k7lGh;e(!)jhICzO4JQV+VT?dHrT!j)fSTeLkUWqu`B z2o;;xKE0Wf`O z=yG^Sh}P}3Ol#L~9h`FW zCQ|){azv*Z5$5NwTGUb=RqMdSL_D%&c{F`XVqkT2e9(|SD3X^MF z8k4o;?`?k+5fKp*;?Q3m8GG<|K0bL_S>;G^`<3M-EP%YGX4802nO55QmPGYCJ04ulw;9FHnz6Z z;hzo{9n|-Ya$lk}yUdKP-xB$KFg{vENokYxhtks0j~~O7UvOclnKe@R zxQ@fBpbkS)i4Re70cb*!!G19t@`%8U&@$x)L#)rALzrT3w9itEP&b>F5DWvA) z`vup(zk6{ye0s2+Pe8!zTb}*H-KT99?T?-5$1W|E(6aFR+YEkrjsfkIbe?L>GK-TB zTAu5VE-WZus5xr>^<_c=e|RZ}m}N>#!Nft!_BYE*3vK6^d%Bq#eb(f#ad7C(TFm!_ zTQv+4m!=+yKlfN!9tzgYGF`_lZZ~j2zbT9^+HE>i{JC1(NoikEi`L(F?-n&}NWkuo zwB=xRVq*CX-6$F%g8FOLtl7oGLtLJ{L{c1TOpX_v=m{cD4>bz#^Cw&?3p{wa@>5NX z(D{C>6CDd@dxBb=r>7@kS5W(9S4W{sll(Eef#19mG?F!M+?e*=z_V8?&6P6L7%Ll4(BU)?T^VS2$BORxQTW;OD#V(*JF;y!Q6BFa^?tYI$%zZSs-+g7tA-vf# z^WoHBy*&MQ5-GX*(u(3)b#$_2 z=la5b?Vx6uB`S{|;%x8%F z!>+L+bb*qjjDFe=F*$KxPg`WJb@3OPl#~mlcN8;O^40QDl$G@o-%aN063|FG7xT_T zKiFwFqfB|X`u9E9*GGB2+sC-Mx$)T^iT9o~vmAQ|HC(fSKBq|^rs$Bo#wE7j_z`$&$hRaMi13uz~>hUU0PEJjOEiEk-Awq^l zu5&<#9p92l*A~R`vq;T86<_Ku4Ja+LE?$}r4+;umjYU|S&d$xwMu^)d1<&a2Ioef` zlKItBi>((}awdKT%NTi9g{IhL#?pRykNS%Q^@+*J+qZ9fvs$!eYp|I#rRc=^p1il+ zg$cI()&8;jbY49hFvVGkxPM=5 zI6$LJ7w65aIZfa3KF(}!UtiMX5tB1tCuL2TcN}Yu>~lKB%k<|`R3x_1xCl!m<-vkCu%ovhICaee*HEP*`-cIaAH6LjgS{TGxPF~ zhpI)36H27w@=cpIvCHK;kPVEDpRw)|5wQW(eg6Epi6!M%#?1)=YCZ`q=9&U`@7*i3 z?zvMX5P9I@t-JaIF;C1!u%b5A%CQpxv&wNCI?&`>6L*{{NU8%vn{jeA7NNbjQyta^ma=7RSPV=L^ z8XKh#U9G)9YDxv zY5VfW`}G?3*bg;qkUp1g;D(&FFhkCXy7xrVRpQ z)tTTqS^u51W!01;+sCF0kWsQum$a!DNRsy`%9rHtA;~WSD-T(B%W}(JxX^|D89mq~ zbpFj#enm@5%QI*G5bp)n`^Oqzxq@t>LtppGM9F@GS&7HONX}5Oq5GViWV^?Y`+$j- z0;f!I8ENTT;xYyXQS&;TFHUpV``h~p>b_3+8gflCzoWp(*35XcJy%`dbZVe(DENzN zoq+$udlsUXk59nLW;QmqEn9Nj7H%-BTAkoNI*H3r!T2?-#+Fao3QP& zNGJ~f3;uFswZ_8{5>6t#ye16**^~EL-&n_qXHuTdEzNZ1IE{EaJb34HVMP&V+{WgW zcrV`7>JL45B~ZL{xBX~GVe+ySphzWJDwSVRMWtFGy+Fii;s-{uWkE63DHqAqzWnn; zzQz-E$y!3C3b)@y@x8L`3eM#$9rw)XAK{nm8rjzoHN*D2N6?wpak5HGMn=Z!Ti#)l z^56v>)t-;{8f7*Et0}rR7+XWY2PrA3p=%m)Y79af+1MI#tPCk+Bs@g40e#H0pAN@` z4)=u-LH#_t!7sdf_wE%CP@=aU{+e;?)*2F(WSk7#p<}Lar8+{59JN3)Trn+ltxeU- zK?d65?k{3L_@%cYQ5{g$h_ygod+zRPY;5d`#4YJEeg5Tz6LoUK?MaMV1kVwxcb^Wk z>nfq)mOXyFB;u&8f8^XdZ^oU+Zk&I8RqeUrBi(HCJzm-`FTC|<7nqosxU+uSmqHf@ zCMMmmPPgy?p_&J#SV81qEr}zN&EflP8-J)GpP<%4J@z$^*>&`26sa zkY@8rDo}c zn|JP%MB*WFU&~0+NN&n^u%eKW9gvdgxv^RMBM$KoJMHpWtFnhwSF)TF_d7E?xz>e& z0N|*L#0NiJ-uwP44fArwNF0TZw^r-oooykV&ZWetMdT)mpWY6MIGV{6O2 z62xlMRdRDEj>~=aB0y*@3#SC|ZNFZ&cF-P+VCu?lq!i?oM{#5~r|3-9%CIDQL?5v> zLVm{H-}Uu<8MSB6&GR39l5nEM#Y2dIYj+vTMl`8q^+As zvx1zg`s4t&m{<;WHC)W9y0Y?ok*iaNz#bF63=iHw({Fhc0Ci2|F)^!-0_=I>oHcMu z_|nJVR}EQa%?vB);wKvpUR2q}HZ5^qhBiK!qTRAWW3yuAqkd9y_(TbZj5h_^UfP!Yi+CS51<<9x;|By!3?eRa<_2KK$m%R!5at|U7-H4zaJFV^MdWl=ie zreBp>lUfsY(#Z#LYSbJTz4qk?h;Wva?!3m>*(17FEGgj z?>SxT?p>6?E`!l8MX$_pg%2`uh)Uqu2zzP?_Vza23WB03KO(~D>&uHEl2bD?9zFNO z8fMRtJx6dApb@B-gIY=W$dNaw60l^NEE-g*eN1bVL^^i4@(C!xj$=2>ahkA%`L1)X z^4xKZP!hFeKJfMR1-0fpYGVxg0&cof-0mul$d@l)G*fk-8ypVu^V>7{!$3h#BOFX> z78F_1wom!|`F7hH$@nNrmXvePN2V$>!OUvlUqb2}=vv1c>z?oLeY{!k-@mUaNeQls z7`nEWWB0?s&?`}UBuvO1h2AxRNl}=dk*c&E{sh{BM*I2s#n#R_d3bnGf@WuDL2*%p z6^?)87-CzfIe65BH@0?N2Q3|QLdeHPy*&=YU&p80tQHm)xFns=Ep542$1KPpb7y_1 z@TEJ^(Ve99;EAB%?QyNo%6_ys+Y>Y-(bP2b zZspY=qSW2JsA>yCVnJac&`@vK>|9MrbE0}#Uw1}5b$yI$N;0lUPP=*@nZNPX-1PaW z@CeD$w#leiyNFn^2V-MnS_V#~myNLHIEH$!uYMfommw{lV>E&1| zD=VKp`vqHOxuQ7KlF-fDMtStV-?X`u@6x~Fh`1x`S{XKehVb9p+arz|L4KfkH7a|NexX<_B%A`VuMUst`wHE(}D)I^r#E{?3*;z-*^n?iFPue#j zA)(p8W&gf?DJW|}JrmEwyaQTq-ltugYugVdp_QVY0feMoyZ&pARWzkK-^lyU9lVjH z8ZEUs;CaMa>Uyt~>~WI}bocx^iS-_e6|gQ(kPlV%pS1k6hTzwjroVu_#xZ<3_eeU& zZC42U`k4S#UnV`F1+LQ@K_kFLlH3Tz$qGh3CW)TjQJ2~;8^eNWP257)}q zEVGaf4FW;J7l#udvUBt1zWMm+r=Ba{eYlpFXNq&oTh5ZD352L_KfWm7*mfGjQK$se zTt-N=jNJ=m+gU378M4$Hgfdfxl9%TbaZqplhG>; z*(oVd?mTUOp`#Pn%-YW{3@NW`2N3p4!7!lKn-#V6tI6_lyYsiH z8sLt%w1lZEBB4`)Cq$tK9`~@ewssErjRSW*Ee4|_>EAMcv-VGQ&~urYQ^Ikq>qKGl z9}MvWG=%vDh$&vIK+T4HR;TN~{G}p(*yBv_TpqaXAWnS{alR`u5R&6Skd$M5&-Q=B z!F(J`$KVk;7D6qT+n7q(KgGxDv#Fm_C-$$8`57dCJ&a8fW1f0@Y^VI+x@JV|pI^lT zZFBWY{(4Lrrn{~V=*8kDO za~Nma+uJKEmBCj6N@E@N69`*kFs1fhwx!a5EmV@emTCL!{QMm+FKpey{Jf}TyCVoC zN?>O#Is(68Rk&C@dq-}2H~lhn5j8b6s73eix_fs$GqWZeFAq--q!qBaz@VT`NS1&o zir^*!;r;ahPb&4xvHZ4ipBv;QX&G+C=qDX$fyUTYpgvkJyweSHdOb zItv0N6gDbNpV=aDWB4ly_S~Yq$9Dq+^KOiUWt&V+PJ%aW+p#0X!aB2sN-r#9qz9>s zkV8L<^b2{6Wyg`1U*#V@co25zT6gyY!sp6pq6f6h*2jfTlb3aMb)nN{?Y9&SN7;{} z^7Ve^;~cmd#TCo;L;OdN9u*W!yH@{Vb3m!FNMdtWbGl*i#rJnGk7<` zjJjjx0{DO3fKh_En+2 z4n1`33xIzrZ3E#<;H;!0X3jGUVOKR&!~`Tz+Lt<03=laKG>Kgr;Zs&oVTL;Xy$?%s ze&xg~r^!Ajv1WRrMB>T^zfCi?c8A>;9joug*g?#~oLLwd>+@Md#I3tO&~dpwbs7iX zK5W&|UQwac){R6p^Ey0W@Mlj%8$r_nUL4PWkrTL>-FM34N85jqRDmIAory z?xx3kH`8>2x#K96ef+4IqAd*GeBi)X=gP7JMAHWOncMXDbiZ z&~xJeQZ=jM#a^Mj%>zXewx>YWKYsjZD)mBHK>;CFx;%YT5<d&sgKe254|b*3@;1E}epQlmuhr=@ucMX)N>+uM7;e%?9q-t+r^|D9SPR8>^e zXU}5)Py(-vy=O7gD*&r*-F!%JzU#1do?T-6x5tjrZ`zs%+j+Y*IyySA=X?z#S~1ez z0|QslkvIV?IV_|H9RPabx0)sOs5?@QOcJ&i-le{gX5DN(jiJ!~)A=v~`!N$gBD(&5=qPaefEOyRn=@O1Md{ci_c)SDq+DylB zBlia-+-=zw90xDo?aQB@u1lH&``FbTWhFg0c!f#_w$=>arn~zyf22vr^K{+2 z#~t$)bq@t=(plp+>nXW4ikS+nZ`N9wN43y-L^E?qEiRCYN&4RRYw6Ny+{Oa)qJ>6I zW*oUCCK@zy+ee@d@6v9{>!JS(>&0;14?kt;P@8&dcATpqZZ&sxd>y#m>?!3aPrcr4 ztafLa@YoS#8-FRs65pRmWv`w1nvSnqH*T+`V`;wNDDJhI;tDc;-VqqfVn93JwNq|2 zOIVpty?y^H^^rH%eWNCg)x;-X!olG-hWp9w?ShF$g-IDeAo9icw|Y5*XWU3e`Uyf_pq^; zEZbj0K&t-N#gMQovtBR3j8%+f;XJTwHKXS-tX_7KZ*0$JEpBqYF7!$D%ZfN`M-nX z-xtGY^hn^%G6Xf^k@h6DDLW;v6+>OKkAKwSk#E+%uji)no}Y1YeRk|SkZRM|G<90H zr{AXQW(_^kGN{XE*r^;XwUq9$l-!|lWZUZ1t07qOly(w=AB)51s4-XlLPqPvIWGM- z*T3JwWn5V1Sr3gQ$L8c7oK!)L=l(ezyupk)W)CZ>s!l5@DWM$6XT9|FpO;X^VRYlz z79j&yN~0FXp{rda5(n7Fjvd1!QX3Ep{R;FnN&1lse;)}fyo`gT^$uGkF_a}JhJc7C zPo7*$WwHwUe5SfcCf7|2t=i+t91=AuD6k4=|xdDyvW+&LbXx)u=9R2L^tNn0~< z$x+(Sa>E#eda!k&!MbP9o`EdAdBsT^gGsvo#DxpBQjVWK>{qE%MaHjvdIC%hbeXE- zY46+pP@!-w^1?jCj}+Z3Me_DC{oIa6i=dh(p&Nba-!FhZ9>~QIYSyB+eJH6BdC8>z}}cl`WgZ-NMhm>f{>C%PawqE#Cd9= z=ZAjmCDi>`v*#UITM5NKb4>Tl>X*kH%b_;H&YY=*T1o`zS+{9-Lz=!G*`|H_Um%NA z!+4BVI7?fOX^4{OL{{il!jz|rJ(M>q4|1|wAKTkSV<4?Tw8Ev20E-`$9iZPvk z=M<`s<6pr|#^K)~2S|9S%laqkdv4e;rt*}(99$5Mi{AP8>hkjP%1SgFZu! ztLKY$JsT3gb~wZM^8?6(gA)y*p`rEhsx0*M*O%0_63?1U{P=um@TRB3t;)(uP^o;w zV)rx;Q#rLTQ442y9GZ#t=t!fJw1GCN^Y+XR+`E!`U+$OLp|SQVGdDX*LM^X}*f0kK zKJ?P;98KSBTGMf~@-oWX#Vdu$*Avlb?|};BtQGTXG4kZ4nYRvBywbO)1m9&99ewKX z>vhIoBs@g`+0+!VRR*32NPGP^#q!Y%yo%P8vlh)(78;hIOSMw7XiMyz-T%C?-fBSK zS7~W{at249uZxE1?u;;9dprmwwJ%2A`#NDOD_c|FMe6sr>kW1gA|b(COvh5PiS_SF6z>I|Sm>fD;dZTj+p{%?g_AHWUn0ZB z2LN$jd;|I!_Sx9~-aQJXv8Swx;J9@S=lm1!+tAwrW@}0MK4v4wc$3mPJL2S73K?mB zBjV#TY`rZ+Klx*W_;kr68=Z^VdH8we!>2wwK z4$sNEPf#o&SJ)*o0f=k@)Tew{xTqR(o!u7cCslnJm&y=yL22nQdi4Otf_#0y7P+}7 z1nuVKJ$&uUhes3w;ewr|wZA)pAEqL-4+8@N%vxV3mKwnkFm!kpRM!eM1q49nW_p6> z{Wo$YD3T8d3sYMUn8ZGbZ^j~&fjS;x;S30k&W&pco*Ph)GjbcPzTlKmKYKRqeC{qU zdPYV@78Vv}=4=n%c$LU7qK7+LB^g0|px;GqZAW|85V|_R<-J+w=H|9-+lC|rozm$$ z)qQ}{e?23kfGrcsO_W#r2kV|Ig@jdEPC3&M_=%Pq98uZfR7XOXhd{KnxcCtU4!3zb zYM-SJ^|vIYLES$#I5!FvY9Oa%-ZS}?@gNVV+ecEb5(w>20L$R*km$$XF$$q?*$d|F z0k;WK2~`#@B&{KoBp_iE7lt!K44kQ$D(#E99ZgSnEDwrCkEuF&iXgT@#wI{&7H$d1 zraCJQ1GO>G48jjwl)iBzJ5U2z@jS93T1!fbihCtYu!uQUol(ej2E6#}Ds?N68z7z5 zR8+vN;Wqo-$IaDMT1F;hpU%WUTu?`zeKN`!=PlTbx7dsz4zW>4T$xvDmZ?1|bRh09 zaWHUmI{mnhty>wf@=#JxsLMZ&Ao_@;&&X}yGLqHM(1077AnJ+>i;7NzLZSJIj%q`O zD6T8pAK0Y5A}ekdINr+s$+y#ahmaiAd(#2$o& zE!1b|Ict4Co0yn;m^7p>d-OLj>=i3YUb10oZY-#yiD?QkI z$7;)P-SpzF>BU%wooN~^?=7d-Jmo1$+6)UODnGZ`xjCkh-MY>7`OMApM)@7=gt4u^ zNKAbn8TpnK>iGI$hy9zTkGE&CW~&&B-4B*$is~3lk97HP0_;ovpm!`ez%bf-`N}h_ zPcnOZXLB}zGvKE(%7f4LHV3$Nm9kK<&}W$~8Q+XQglv6Bw&a*kEI;~kC<;Q*UoEOR z-2QoknANf8o8Nz`C{8au{eq!`MkC@}fbbJH0gZ&~9(>!$eZFlo`RUv5*$^4~jr*^( zPo;4ASAH%kzCV~o@5nbcJ`U*u;L(`Rss+DZR-cJkL&A9V*@|PN2<^Z^^p-|?dM=5Q zUQR-p>*~5-Q2}n>A0N?5Ie(@9v2jpAK|w^s4z$afiCL`OF?`Vt1?Et^(mclQZ3@UR zynOlcg$qwV8`~_YFRay|jE~o4n?tXu49(F>U1-VWZIO|@jBH`Qq|V6Q;UaV{q<_EG zZn@la57M?%@V)?+aNeIgaM!lP1xd{hXVy%UnpMft>w&n|Fez||SwgqwS;xXcbR4?? zV4(JJ13H7OukE5ekU@5XWFvR-s^Ro&+^`42! z{Wlg+yQOTI<6`(Kx_Sa{poN(%r((C{&1J7-JB7BM7(Fe|s{OZU-#$t&B_<|z@L+vKMTJqufPO&04p<%G7Oc-U z$LhjW3UkxHbBezQX zLSzMbl0e20GAKaR_zsvCLG&;vOvbR|aWCp35bnnd{)0%wNMu?2_0F6b1I(HloTvYO zt+R&5OB=3Rtj{{fg{6rKAt;l)U218#m6zTz9{HAN^W)UHbLViyrAwDkjiBgZm;3zb z(-F7%DRilNdV0`4wI+5ZcK7AM`3iFi=o#Tu>3@;#H#+1aXA>bCL+*r$wO_7YpZ=m~ zIHqKFg#(03V3fvy$I z<-bR7nit!`2n0tFhjosRN{s+4C{7_W5D0hgr6>LRpBdJF7&z30i+8MDZh)=>VfoG!oFeUiml%QeJ`OM3waf}_f?^r|dguz_Q zqV*hEIzoBrj+DORnUbI#M<=@8-iD!~HlOth>Y~&pPnx z)hmPsVmQ@-`=kwezf`k&73b78muU1j;iu&7WYMN}NKh~5Nn|N3joWWMr>Lli$b&UB z1vgO%iWC^qjpbV#yjbBQK;xe3Wy7!);4MO#h{k>*MmpZ4XQi{k7~l0*AML-i?+aZ# zAez}yDR%8hxw)u|iwji~b#!sb3_t3hG01=NdHuMY*c}HH@W3o&ll$be#_y6B0pq>3kzc47qa!ZZbhPVZn2KH!_Dh3iCf3JHtg{ z{(=nA1O+Fc8ax8|rw$?z2!_5!k(6R98z}GLP~~XX3BRf-06yl9R0P{7eNcOqm)pX+ z1#LB6i-!+RTAn@oV64HdQfKzCj04-&t#6D!Zw&WC(}y|rLtC3msXzNrC&)E4A1WZ$ z$Jh96;=}Gos3(MHT*=pm+XzgLhK2?@4b{MFKM%953uTBMPBvhANl6Knn4%>Hxf`nd z46>FSMNsR@i*#YXzyi*(-tQWsHRj(@TOLbzNFSn=VwP27_gY;1kH!#={VwydQ zlY^rTe{z2S=CNblhFes>mig~Bxgy~9!?{bUPc|ZU=C>hvTW9CI4)1|$z2%Pp(oRE( z@q0CrUYj=VB~4+?AXeo{d#`Y9Kt_lXF;S%ETmE`>Y*7*&r{hz2#_(NPD)3x3p)Bj} z?p8ERZO;#tT-~DQWb?oWE?l;|)^yxnM7ognMbD3I;T6T*us_sZnz$9GJJj0o^Vl%B)~SBa!Q7o?fE*Pt6yd^ z`sbIWz0Hq%{rV8xZU?Qg2_DOn(IbWmXdF?Z@^K04!x@j!6 z)lUoa?dtlbmXQ;Io%&(KJ`~G_~>kh!^ZyZ=jXp} z`PMSFasiuKi4HZPOL?tIOynx=B|5ukVklU-e2xUMeD^1 z^UAa5fD$qH#aUEr*!SnIBwH;3&6Kg38C6Ba);TV6(ZXnNMFguMV~3@XhsFpXQCnt+NP<_HlG(BIRO3D-B6 zDk8-152C?~&p`mAimC}aoIEB2Vu8xW0GNd`f8{e@^xdt(yWmt76cm(@ zkl4T9Vs4@rEmlnTNjLI=O14z;)T=TQ0T z7q-)wpMG*6=Bq;zh((hVGU^MJ$X2j$oF*#%4>g)WU6!<%lC zH|Gc2EC7n|=2QKpN^an5(!SV86}4bI3BOE|la+P^{> zUt)lgZJ$emXAp(>1f2`u=zQ la_+xZ(f`lJxA%|tc||!|>K)Vs0)h7QDVYld z!m1Yp0!0_qDtu>p?9>(fZ@tASO)COnV+r{`igNR~s|3O>!fBb~D)ynH?GDZl`d3Il zjURjOdHitwCI&I@<{KmON}(sVB$V!tQM@>`uOXo~-CFjja9n!M`E*r9;~OTCEIXWr zn~f8rcKB%AmXYCn)VH#1Nvd|XdRyJL*XoN))$qI=o8=dm_Q~MfSqWlx(3c0Nm9|n4 z2z@<~cKBb>Pbzx?VUJAFYQiq|Rje4|rf~w{)IE1f!ZGPJ;snCx-CY!fhx8P51b2`B z)JK)l!zG-auW;|(yO(rg%U*>yl2bJ&=mu3I3x?|BuN)56$}owyV<&a0>$#|An(6TK zr#MazF^HTnG8z&i=G7(Z*FL;){ui z;oQ4-W~61ZE!)agqUlb(1F<9j<;$0zG)#h~-_kuq+iQOImiP9M|L|#Ny|Cl8*pSw- zwuq3doA0=?H2>|LF%A3Mv@|+4$=7zWb8O`2E-%h{(qAci;O** zs|_PuGE7@De4?~-tZ$UurIqt%&9@!>_VE#iKbzFp;9#&@b>s;zTb!bz@i%V{(tdvu zmU^XpX1FQk*!N?{sm}+pN;t+{Jk^k(>Pb&pXez89T$~x*BCV3Ft?6PFuk|j$=3}sc z;X2wKDuu2tZf>Nfycb=kYUO5$otcu)gMwzOggUK9np4j_Ie@Lcbm(bA1x8>=k9-s7Ur>2J*Jn56P-n~^!{qY{_RKI_E zxQR(R{d(Wi6X5-tl1 znA&TNR4fxd-BRG{9TpJC&&%_m_m^C_zB1V9Jn1Vslt0^{94jLy z*Y9T4oMjm;x*QwfdLeddxanNj<*Huu!sW)Cq6ZHie0su7!!9l^jz`d_NA3HxNGwd* zD1Ni=UevyKMh%;#OUud_MXYWyaC&4}_TJU8Q4AGU3VUnP@^*>4@0{C0favn%7b$fv z#Sp=yA~mI#+XV~)-z3m5i`l*wB~^!sC2d)pC8j8f+l_^eF3PU>zQmlQso2=qY{Dr! zv&;N;UW`@T`7Yt!y?fmyUWs)=W^Ho=(f(>lS`D3@g{K4drsU6PojK#f%g>VR?k-pR znj)oOyYF^^lVPk(Ok5rVt(hq;Ce>`?-rn9TD=TXyB~Qx9U7R%e@i{o^;llKAY;0_z zKpgQn5po_#Wgz|JaKM*VK}9M-KdC? zl2ZM(#v#%MT$L}Cm1&k?8lAS~54J~3Y6*AMef|1e$Xr*SeQ&^xZ|OJIuAI|k&?v?s zXc)wetf;6+Rs8b#vvvm7=vw8>SbL&k>blqkT{c$M@F!1VnpwtuqO1pMj)%Ga?D?>p z6ts+Yc64+|-(%#}itFwl9mVzz?l#Ogz}F?8l=jhGee3sfHaC^n*`WscunQ+C3XPli zY*w%|@ya)?tnS>t?Lp6bF+;_qgP+=D&)QWh@9mOTT~x}o9o;HB-*caznqQEIhliK9 z>S@!)c1v2;n1SZhX!_!XyK%binFaodH*el7d$2v=(W6b9Hl><(7QB49XS(V-?&MJZ zDG?D7PKH6kH#B)JOj6Ji}W5& z&gI2U5?`b=?FpYL4BUG3o6X?Ym=kw5D8;_Mn3;^@4qS5?ijS?|-x#f{ip`CU?Z??% zXi(RSzmx`s@MRYI_EzyV5NzRRIa{Vt!vRsz9PR9zYZIP}J51C@%X!jcUpj#xSYT;s z>8-NC`2H6u5|0NJ9bIPlv1HA(S4U}*Zr`~Bvf%b;E_8E~ktt0~DOecI>o0^y>MJ;FE5u{W>eD0cbu;Oa!+b`sxHrA@_MNOX6X&v z4i?QUM|t>`vWqo=o%+8-q*P}(Od8k-x%G$HdC&uQ+VO@0m&JOzs~`fMEQ`pDcNB(o zi(A%d2TpIv&q;K0bWD(2ebl&dtMtgXcif~+OW@7=;NITehHmWC(4y9TM&7Nmrxg`h z4_z+3w~3=MMK7gVUqX1U>keK0ext*|3Lw8dHa^ojPGA&S#v7INt^Qq}^h|u(=eKf- ziHRLNcs}gr%94Yu63~EKC2p6;^>69%qB0Vi5yzKugQ}hDf;gm5g?W&@p^61(=pU00MPb^J-xoB+v z^8-`EAh&vQTj~|LlP6C;iuMt^&Ht{t$FGY)R!M5g-qF#((2#rHuj~F*iL}eaO?grK zhA71XDsTjk$|@ODJ&)n*u8&vFATq5Le7qz#?)NQwf)XEU{Boq~`B5>e9}lATX=-Yw z6s|0Qu+@{bZ}b{_6=YRxjG@}N(X8ghduS6-NN1cPn*_Nn#Ei01TIHdlo6S5dbhKAi-$Bpg-M*4E%}ndWYQ z6abWYYlbOlWjR(cEXR%Hs-^WUvy)8Toz)>i#1Bk*JO}&2>^d|7T=*>4+2=>h+Om3{ znw(wB4GL{ZGh`B(#H?~`N6Ers;(KLNqB?QzXD^$}loI%V-A0zVdgXK9`}$bK?J>%) zWlY!9!#o+X<}TP?zI<77W$ucs5}th+;8$8I!!FZX<_l8vpcfot;xyTFE!}EHQtb-?|FAb-q7>UpG&K>d=j^FM&=>S)>;r@6^;(C_|06S5HF#m^%2>)YJg6 zRwg4zJjqNXfSrWfinG3c7xd(L$O-&gxQNw{?EY{u%N`j;ML#buIiRqqo9y#p6;3WL z8g`?m?`FE-y@1g$PN__XXtI5gExqbIhf_>=)F`csA$8 zzSeqY^!eE#qo9$B0IqZ4;v&Y4uXAjM%gW0$uh&M^ch~G}>QWLNzBad;zlestzOGA} zYFb5?0?SwK&&DQXrfq9$i$g4A`YkX#ya3y0Sm2SDCqCS{cB3(CDfH1KX%cHCeXpkG zd_aZDkZ7vkfo|X2lfFCVgS6+oP4-U&>A41DW}kxvlJxc~1A8~_6y?!MKb0RW&cP8~ zG@<%Ma?#}K)t6EG%nRlXENQ;D1+>S=2le#!-j}yy_jqn9;W%}@K28a11xklv!o6u| zEWm<2<=5+Ys{S&vdescEGbQ}Ctu!eFlFD$Nt=~M2E>A zfWCPg`5)C`tugXU(*p0IganQ1_j&QKUGsI98?1Nl%(Y8d&@8Yhx@i7b)UwCJrl;q_ z{r=Cv(X1RR<0W)PrHapw#6!loy1L5wu~;hp9NKvrSL&_nYK4{EZ0B*U@b>z`FJWS_ zf^I@LzREPeQ8d}a$oPuY2K)SJA^R%y{ZMVJZ+R{&E9({#w~$bisE$%#dioJ|kBA7p zTgsanZ?U<~MbbwV1r^+QWy``M;i!^7R`cTc9W2%7h3ggS@8$K)!&+Keu%&7wzHwgP zYceiRQFu)E$ZBY4q#0Cs+?k>AB5Dsk1sA3MUj1?tL4Tk$?hn{U-CSE3LgNk(n_|g+ z$H3&{ch)`ORxg0WbEMLklezvSTmovFG@Mdcfcoe7@#9C0>NWE0Qyn#C%9zcm*q4@; z>P47%H0W7aoI&pZl8a$IMZJT&aUzKL8xCU!`I6A?n5yJ2)JVA}R$3Ez!tnF6?*4vq zS&{fNUUxm8O;~erdAT7r7a&p#@PuSPf)S%wO01lnnsOeD2{O?NorM7UB0i~bOQfN0!`f#GulmEC_(*|3 zqduwLq#fe+7LT~t0e%T%$Jei4zq@nZ!E1yG6!N;YXk~d(%w{O?(WA(YGuf#6_A9@d zo1fo_U0asX$THu;_vx0<$nm|6xdRO;#bnL8@CDUSg22{+JEXB(BDI@%aiTRRqI{`IA| zjfiJ#oE?{DtcJPTfv&;Wh>VT<9m2M1x?RF!FPvN7XLvaHm13AtSZsanz?TRqy|$Ef zM{ayA{ni*t8nYg5h9J}Acv&ww_qaXFvc$3WeFE@nXml1Q93a4dQ-8f(ZIE{CG~YsT zf=c{br&+V%@yB1-o>dvx2oCE^$>vxOUa(A&a3i9Er>yt>Hbe8>jTmKDU;Ts>a25&+ zI+eyb^5Lh-N@JX>nB|na@?BdcOfD}^RQHTs8A73n6^yX&@dj3{U9(1fX}kpIznd&? zRzHVD0D!X_X|6>@aHH-Ov0!lwXQ08KiiVNrJdu~5YPthONxt&D=jU} z>~O4{@vKi!9Y*DgpGOg@jG8Y$KOZpIit2&CV6F!WXKg`ZtUEwYE{R-6VzaH6=6-@S z_v;lnLv41h%w&T3U+d<7`|^bdaR{K6KYO+z!-9Eu>gUgRo!l8nG;%dH$9<#HZ(8dZ zz~Oa-I?G!ptFd+hp9w7(>1KnGI064w=D#=;TXbJg<= zD4Pr~e41OcpFpsX^!v|SL;sF9Wspx}5nf1ICW_gO)#p+Z+?jt)PcH);PDo3KlIqR2 zj>CcJz0Y6JoPI+&pN4{vbsvbLmuu_m&Toa=`smRkM|BE<1rv&RM~S0N|Ng9Rrts%b z5CX&8K*zWuUj=7=QJ5F2)D}EU(UzB zqYc~!W_MCSeo*(aU{KE)T ztX)l*l4Hv&A&+dimXc@zEAW`x)O#_Ozh+;<<}$vq{MTa!?$`soFhME4amB zqBelE3)a@wGBPrd+fn;&+_+&_9jcjq^ZV_!G#M!H@*J%4E7uT;4r=f20vvWio6ODG z>*;l_qN@rMvul2H3D#$Gj!h!pI|@SRG1J?zXRB}Fv#{KjAPt!mA!1rg;8C>8NPPumN4Q4aJkdULsWxOi;wv(r`nF4-60X#B_)$6v-Ux$Fc zvyL`Yd-JYfc!xX1Y_Bsr0k}Zt^@-}|S}oFALQz$)u)H=ECYa*gTmTk}t|AzP&z?QI zOUsO<3aEIgdk2?i6zUH~Qly=)dumm<#Kp;G4-XIM`eePrj$6}&ea3v7##gV~aO%{l zX99-Rc-P0r=gir&XB8C-ZhrTn-@Rwg zo+C%vuhKWwcN-b9$dbi3f8jcX~@oO&iDZjn;URF=s^-xNn*dZIY z;0fJaTT_(0%z`HL(rebN$y*%Ddbf~W)fUNv}bVH>Xw`HZ`pl5W0Ijk~6 z?hoQN2T{#UO<4~!6hP~-mxAj|T&5n$vChx+`cKDy-fz_Sdi(b6@untPT3XJ|OR#nm z=UWC9PsV4MwJ)?7MkHyboy2Pn2n%aW`tA47z#-pqPJGk0ZE>ddD1nbk9er`r+nv~! zJqgJh9UTplVFJ+7(~n1xmSQ2NhoT|u%tn^R2>)>R@o{Q+f4f^=;u$H?ONqiRGMzn4eE|fRD^ve$j3!~4Vh38H9)kB!MDb#ir*69G$!(^h75w#4=P-e zZCa%hlqFrv1W|qwQ|+@$T7k6?(x@z1!sd`}YwpGn%N%GP)5w5Svmu zIsC<=OznMl98IS^!ne?M6osC5Zu`?Y_pH{YZf(vkRapDT0NCqI`@6eQ71HG=)*MGg zdelEjBlR-2l&x=NzugJ8yme#QSBhh@WZ1+BMOD8bJumgzwQCX|Q#`V{(ppRea~rd{ znSufWqUSUF+8fEDEezAg% zCpe0kIoAU}TO!gdF)9ttv!v~49=Oxw{_B$|6fWa4QNI{UNN}O6d(G5)<08NH?Url) zBB#H-*RGk=GpyM`lNih*c4DSvT^mX6G-(@vmNksgd=< z-*>`mOxW*MYa|_cRaT!Qr;Jl_>XGD+mGMPlh!z`d&*j!&(Asy%%ZqIyfAWuoBZ~_1 zh=lRM|6ezpeEcvw7D;E}!-pTcXYRybwx!d#e(+&{KbX^@IYJ&;~&eh z&AL3#qPv)5RG{29KE{q+kzw{H$dzwE$Fmn(>`qcnjZzQg)R7Lh$QH~V z85seWBTO68xp#o;!PNKHL~FKB2&kZxYM@VKKP zn~Xt!?UJ~4|K{>Ta3=;)yu_S&5)~Z{tL^sf+pve_<>7RGCfi%^?Ohga&Ae|%|2|U` z8~}edDOYF66SyxfE;PDxWbk-%sRYU08^{J7qt%3>d)hr)myyYZZiHD8IdDnlujP>>`3b( zBjIdh@b?va(!g@yAFD-Jh4@YMg_`=~Cr^%=cjUdOc!IEfTMD@sVEvZ813LE}k%2EX zG!#U&weagx@9-t(83X(sRJhV4CrgV|s`L>x9b6<3jSg^$J#w9{jt<4$D2{S92| z*%f5R2!db~VaC;~eM|F`(|qLz$zXWIxN!sqTO*ifur}Ju%PTSOeX&G#%}oFI??=Jj zNQ99oO3pN2frr+RyPH6G@X2$PZUaQYm2yATxbu-%GRLONgeBJBK->B2qK^MSJA zOJb)Ygv>jz#76aTk#-_{e*;Il_Utjs&#=m1CB3v`c!;56*sKS4tBa$SA<*4(7ZTiI zdbDe{tD6Ovqx2Dz=5d%*iG1g1n-S6#z>7=gI~Nun&dSU@ zOe7MQVv{vedyqoh__~^cNPv1q5Jzr}n2gX;3WT7C8fu(B7lzo5jm^B&y??f=UCzX0 zBxRbnxKqxn-%NYCH&M=$Z-1^C5r+^rC$2=f5XZt;40RdB71YIqSab?_LiR13{%O{ z_iwJ;V&`S8&83e0R1k2WS`S|pJtRM6p^GAGbwS0(U!|ml*b=Ka!R}a5$tVsUp^XB% z;IBrPl2I~b5JrkyS=#(87rQ8mY}bfSSwcSoL4dSrNV*0FuCuX8xVCL@4`J_$^hfd= zF7YN$>tTnDa8pNJ)YosOK$N;%dcp)pS0tURQaCAKp!FnCG<29hO-5HYyhD{>LDP1X z@*i*g-`k0Ecv$Dyak#-aCgI`XjQ3@UTEM*n>LRxb?SJ+#o98K^4r61B=<4cv@nRRg zc=P5B0%X)(gE~72gmt}}<;MRlvY0`lGOV+gK)BnznL-Mo7L;{qdHLeP0;B!)v9@er zHWHU&V1i9NEr9?&QJw-#uu3}HcUv<_KdbryCCnynUo)>tLD1I*@*w6xD8)Ti3+D|t zRyYlg!Gmf}#oBYB!j?E@DBEH00W;Dyc=iUI&RAOwxTne!Pl_0oszioB3E!1hOZwJ$qi(bE4WzN7A1q z7sR7^SunR|crD?@NR~_&>N*9O3kX`#<}o=vjhfxW#N;&!x`hFl*5M96w#zD=(NRQ` z#YsOF&9-Pa(qbn}#+_*oU2^1o^`S3+|W}4kAQ?)FORgci1G#*Y<7nY)=vfN zhq!d1Txw+#Gc&ixwuAb|fW`3H7ZKoPn(O7ugRUQHN71byt;1m6u2_A1$POcGCvqJF zgI9ik?gGk~GYSfyrLI+niom!JJ9z1~E+^h_ozK!|1vRWIid8fUKt`}R^ldUXCmv8u za7G*puR9+V?+H4Imv*;6lMm$AEFrr?8-WC3COEOcu_b4P}5k>zX z0MXOKV?bvWfiiKkcJdhu5j-Mccz=sy(D}XS9sG(kxS*MIpK4!<9eeeYpxIr~l#)s| zpN6MdRPVFrZE;d0ZvM1}g18NF)i2MrTLm$Be0)6I*T6jj0?Myfj-%wS9*MVGYq5S! z-W4SAek>vv@Vy}lo*}P4eC&6ucDxHX@f-46Z^m_ z7LmGZGnM^7FYNAIH^yAI#@vnl30($4P82np z^i*+AJ%n$2Njkf@cv)|%G9K3PvU15jOQa@b(XL`$7@wFJYCAP$8f~|;`rS&=YT81V z?jT=|HsdGXuXfN5HLDR15Kf?-vgBiKL|E|CC_9Ggr?dKct*f$le|xm>P)p*@i$#rc zPonUSe@tgGT{s;8hPW$JBz8AypWD(;uMSmVRRe<`tNFV9c`O%`PZ%9~5ZXq$!|bqw z{k*#MdEPSpnf=7>pZZ)oh}XPx>2i{G_)hG)lXlpu&MdcyPS)U>WOMjn0+l`G_{>a( z29I*AVnZ&yp>aoE_K#FLiK&`gc^+c2rM^f;j?-*1)Mm@;k}~td!O-;SzO>ZTpUz6= zPkP$=@m4UR7X;gb?55hyh+U?qB)g{Bg+Ovxj;GU$Y7DgA8cieNLyJ=hj$ z$6lk^S>OUJnwNB0fGoZQ5zeEXWdUcyk?HatNNaf7acW7=J3P0Q!PZJ5Jvj~g1Es~c z*O~(TQb&baDA3xfSj&9T%xuiA)1~}RlhLo4qIY} zPW%N<(~^q_zq4;%GrdCli8eF!?a3nMR`_ZNn`Mhyub~+WjtkBj#~|7sVHaYvT4018 zx>B~GssysJQ2+g^bLV`es#cl`S8U)*J&$O=7Y-xow@sf}N6s1K4{mdFa}(0Ofo852 zxVjyxS&!fW4(QxA$y!GiA=+b9l4zEZkZ7-~tGk>!pmRTfMbvr#nNyRXpo9eaJ+C0_ z{&qK{>IYOP8Vih=&Cct&&R;`fKa9>oJNCPlz;;M{smad*j!dh9O*;#8sA`ig3gy#0 z@=9E@^x-}eB3crF5nY73`H3G|Tgibsh!CnPaM5QFw(|vL<#)bSm6gLak#~M{OHtJhOD^Kl$KYJ-jh5s@8*e2X9}00|87 z2Eja>dH(#V#~G=j&*40y6)N2~AEQD*|I6TOwSecIl_flzomduz9>Bevvc3E}Nazh} zBpH!gDDZElSFU~km)5z7rXtt{M^d9L8pe6RoOt2I^;A^%yuB-`8s--1;j|}Ri1GQ6 zk|#K@lU*mrIvzb_8L7d+!A&W8P2z2JbppF~9c$ItCJ)h!6~oXRCSTD@PpYq8yKbEk z^S(pSA>LcKkmDQ#NAKPH3ic-B{SQ|U$2WDs3C~4Q%D}DG{5BNv(&kkw%d?&Q6MHB& zAe2W-ksk5DhF53-`@`Z+Mquq2GOILSJo0`W#BzJq?CVO3_- zdME||TN_?w(%g6zp{ttgM`AFSQ_<3+L6in-3Kk?V{&!8~4~^Sp^%^1K5V{@$RlG!J z(%jr!f@&h%iATs3RM3Zt7CPMXZBU(==ACdP8guD6vYqE|LeJn9lP^6EDLKY`bLm7r zjpe~<<^}8SlN3_UbK^+6+7KrYrCIjluHb~ghb3bM6TdE09{M=R4<`HA@$vB9Yw%zZ zrx_FIm(K=5j{Yvk&?HK(mz<^aC9pa;ro$8Ud#B5rE}cj7B~}NC>01oo^lyA}V0L>? zC4KL&kVBU!{QwEY6tZe~y{G_6o{2lWoi4PX`YVw8ADivxHm|!P5K`qFa5w+6L0V8y z5d2W@pdhA@;QVHx(GR+V7S6T4-Du`ZyAX56QT@^$1WFVX6rg7Ew6e3a?Z(>HZ`c50 z81gndmzm zP?2udE;=1yog%o1`Y3w)dMP~P{%PnD}V?DtgEExwl_6p z!jnM4b?V$XJGJ?ReP*iAyI-#!c0oL{_El$&O(p(ZJsc+Pa3Slv!CsSA#pW_^^0BXDTG8Rug0c%;Tfu8eE*<0QS6l{4*fm{fhmzNlIrY6zcpaNV6A)(mk>kiASz_2b_4?LndTAD3<3#u zIX!Bg*w{qWs-8>A=z)wt65!^OYif{T!ew&B^GRMRLv}x!=T(+V+A|KxUFf=8=F6;( zC}gw2Hc{*A$N_J8qfV!neyx+Mw%m_V4)*pc>xaXjpk_zv)Kg@nBNsn>_NZYsOIphk zl<0c)jck%8VI3GPuJHFCKeS?((D^BS58aGUPG|GI$Wo2mcZS^AC}fWAb_YP~QXOrI4p<Xx=(G!-5(hV@&j2aS>(0?HM9k~hC2t6?S z9a3+a|6?IqVbon&;#TI-c;|DnOX95crM~lR1*lIjL{KDR2E;OFkBh`Z?MYg>F+St(0r30bS z9;%m);)k$6F)v@Pp+wsryiGKltWTSF>p0S8D!^?cc8Qt$b-i!Wc(@oyU#P?W#BwW+ z2IcN99i>N^p=j+dPWEgobSu;=be)g&xO>-+Rbt`zeXC0`$(iW(2Y?r%mt6WDJO@w| zU_Q?L2;=>0=#j+T7qcBXrJ%4hi$(|ZSmGEPV%jKstDPCDm5LMI7y+hmUYnqbZuWh| z_%VbVScA1sd(A>L|7 z*lxmzfT#=|D<@8zXkd685TLBT0!UPYt%f^&O(R|Lj4p#u6sB|;YwQ!1H}zE>MkV@x zB_%s9r(QKQB(|in+nma`19p69ap)Q1%Dhv8W4_N)b#Z9Ra?yAvU#R@Q#){+NVu{1dgTgr{J zGQ`DI5%}f+^=A?65vJ0aWyv8axq`m$*@=k*4iz}9F=pgz+ftC)atfz4mCC;NMngga zigB6|RtN`PH0q)|On#dN6e4>mo>7@0ss0Wdf_@%UiRqPYzB|Pl(I*S<9(8ewO8i&! zrH2Lu8HP!Ti8-MmmNVtTodcItw?0clZLFH0q6xeKZl1|^)8+hWpf+S%EU5NulsRN{ zPe&QcedF=uecarYj>_Ju`uh41v>xnhNOfqGfIbHY2=8+bEI& z9;D0gSR2ioAD)a)EQatD)yWT9LA&lIX}HWKPru9O1v@x71-&8PHiM=z12J#hwz|a~ z6x2IV>^~yKqPOZ=7#9c^q>MOlc6K%e--04=oBGv=vVbI&#XZib|gNqj7I24aVH#mOg(=*=0Vn To cite package 'vcfppR' in publications use: #> #> Li Z (2024). \"vcfpp: a C++ API for rapid processing of the variant #> call format.\" _Bioinformatics_, *40*(2), btae049. ISSN 1367-4811, #> doi:10.1093/bioinformatics/btae049 #> . #> #> A BibTeX entry for LaTeX users is #> #> @Article{, #> title = {vcfpp: a C++ API for rapid processing of the variant call format}, #> author = {Zilong Li}, #> journal = {Bioinformatics}, #> volume = {40}, #> number = {2}, #> pages = {btae049}, #> year = {2024}, #> month = {01}, #> issn = {1367-4811}, #> abstract = {Given the widespread use of the variant call format (VCF/BCF) coupled with continuous surge in big data, there remains a perpetual demand for fast and flexible methods to manipulate these comprehensive formats across various programming languages.This work presents vcfpp, a C++ API of HTSlib in a single file, providing an intuitive interface to manipulate VCF/BCF files rapidly and safely, in addition to being portable. Moreover, this work introduces the vcfppR package to demonstrate the development of a high-performance R package with vcfpp, allowing for rapid and straightforward variants analyses.vcfpp is available from https://github.com/Zilong-Li/vcfpp under MIT license. vcfppR is available from https://cran.r-project.org/web/packages/vcfppR.}, #> doi = {10.1093/bioinformatics/btae049}, #> }"},{"path":"/index.html","id":"url-as-filename","dir":"","previous_headings":"","what":"URL as filename","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"functions vcfppR support URL filename VCF/BCF files.","code":"phasedvcf <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/working/20220422_3202_phased_SNV_INDEL_SV/1kGP_high_coverage_Illumina.chr21.filtered.SNV_INDEL_SV_phased_panel.vcf.gz\" rawvcf <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/working/20201028_3202_raw_GT_with_annot/20201028_CCDG_14151_B01_GRM_WGS_2020-08-05_chr21.recalibrated_variants.vcf.gz\" svfile <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/working/20210124.SV_Illumina_Integration/1KGP_3202.gatksv_svtools_novelins.freeze_V3.wAF.vcf.gz\" popfile <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/20130606_g1k_3202_samples_ped_population.txt\""},{"path":"/index.html","id":"vcfcomp-compare-two-vcf-files-and-report-concordance","dir":"","previous_headings":"","what":"vcfcomp: compare two VCF files and report concordance","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"Want investigate concordance two VCF files? vcfcomp utility function need! example, benchmarkings, intend calculate genotype correlation test truth. Check vignettes !","code":"res <- vcfcomp(test = rawvcf, truth = phasedvcf, region = \"chr21:1-5100000\", stats = \"r2\", formats = c(\"GT\",\"GT\")) par(mar=c(5,5,2,2), cex.lab = 2) vcfplot(res, what = \"r2\", col = 2, cex = 3, lwd = 4, type = \"b\") #> input is an object with vcfcomp class"},{"path":"/index.html","id":"vcfsummary-variants-characterization","dir":"","previous_headings":"","what":"vcfsummary: variants characterization","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"Want summarize variants discovered genotype caller e.g. GATK? vcfsummary utility function need! Small variants Complex structure variants","code":"res <- vcfsummary(rawvcf,\"chr21:10000000-10010000\") vcfplot(res, pop = popfile, col = 1:5, main = \"Mean number of SNP & INDEL variants\") #> input is an object with vcfsummary class res <- vcfsummary(svfile, svtype = TRUE, region = \"chr20\") vcfplot(res, main = \"Structure Variant Counts\", col = 1:7) #> input is an object with vcfsummary class"},{"path":"/index.html","id":"vcftable-read-vcf-as-tabular-data","dir":"","previous_headings":"","what":"vcftable: read VCF as tabular data","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"vcftable gives fine control want extract VCF/BCF files. Read SNP variants Read SNP variants PL format drop INFO column VCF/BCF Read INDEL variants DP format VCF/BCF","code":"res <- vcftable(phasedvcf, \"chr21:1-5100000\", vartype = \"snps\") str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:194] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:194] 5030578 5030588 5030596 5030673 5030957 5030960 5031004 5031031 5031194 5031224 ... #> $ id : chr [1:194] \"21:5030578:C:T\" \"21:5030588:T:C\" \"21:5030596:A:G\" \"21:5030673:G:A\" ... #> $ ref : chr [1:194] \"C\" \"T\" \"A\" \"G\" ... #> $ alt : chr [1:194] \"T\" \"C\" \"G\" \"A\" ... #> $ qual : num [1:194] 2.14e+09 2.14e+09 2.14e+09 2.14e+09 2.14e+09 ... #> $ filter : chr [1:194] \".\" \".\" \".\" \".\" ... #> $ info : chr [1:194] \"AC=74;AF=0.0115553;CM=0;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_unrel=1006;AN\"| __truncated__ \"AC=53;AF=0.00827608;CM=1.78789e-05;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_un\"| __truncated__ \"AC=2;AF=0.000312305;CM=3.21821e-05;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_un\"| __truncated__ \"AC=2;AF=0.000312305;CM=0.00016985;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_unr\"| __truncated__ ... #> $ gt : int [1:194, 1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcftable\" res <- vcftable(rawvcf, \"chr21:1-5100000\", vartype = \"snps\", format = \"PL\", info = FALSE) str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:1383] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:1383] 5030082 5030088 5030105 5030253 5030278 5030347 5030356 5030357 5030391 5030446 ... #> $ id : chr [1:1383] \".\" \".\" \".\" \".\" ... #> $ ref : chr [1:1383] \"G\" \"C\" \"C\" \"G\" ... #> $ alt : chr [1:1383] \"A\" \"T\" \"A\" \"T\" ... #> $ qual : num [1:1383] 70.1 2773.1 3897.8 102.6 868.9 ... #> $ filter : chr [1:1383] \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" ... #> $ info : chr(0) #> $ PL : int [1:1383, 1:9606] NA 64 64 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcftable\" res <- vcftable(rawvcf, \"chr21:1-5100000\", vartype = \"indels\", format = \"DP\") str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:195] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:195] 5030240 5030912 5030937 5031018 5031125 5031147 5031747 5031881 5031919 5031984 ... #> $ id : chr [1:195] \".\" \".\" \".\" \".\" ... #> $ ref : chr [1:195] \"AC\" \"CA\" \"T\" \"C\" ... #> $ alt : chr [1:195] \"A\" \"C\" \"TGGTGCACGCCTGCAGTCCCGGC\" \"CCTATGATCACACCGT\" ... #> $ qual : num [1:195] 6872 321 233 270 58361 ... #> $ filter : chr [1:195] \"VQSRTrancheINDEL99.00to100.00\" \"PASS\" \"PASS\" \"PASS\" ... #> $ info : chr [1:195] \"AC=82;AF=0.0136439;AN=6010;BaseQRankSum=-0.55;ClippingRankSum=0;DP=18067;FS=0;InbreedingCoeff=0.0664;MLEAC=76;M\"| __truncated__ \"AC=19;AF=0.0030586;AN=6212;BaseQRankSum=0.358;ClippingRankSum=-0.594;DP=30725;FS=44.58;InbreedingCoeff=-1.1608;\"| __truncated__ \"AC=1;AF=0.00015753;AN=6348;BaseQRankSum=-1.793;ClippingRankSum=-0.48;DP=32486;FS=27.337;InbreedingCoeff=-0.0212\"| __truncated__ \"AC=2;AF=0.000314268;AN=6364;BaseQRankSum=1.59;ClippingRankSum=0.358;DP=44916;FS=0;InbreedingCoeff=-0.0092;MLEAC\"| __truncated__ ... #> $ DP : int [1:195, 1:3202] 3 15 13 16 19 20 5 34 29 24 ... #> - attr(*, \"class\")= chr \"vcftable\""},{"path":"/index.html","id":"r-api-of-vcfpph","dir":"","previous_headings":"","what":"R API of vcfpp.h","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"two classes .e. vcfreader vcfwriter offering full R-bindings vcfpp.h. Check examples tests folder refer manual.","code":"?vcfppR::vcfreader"},{"path":"/reference/heterozygosity.html","id":null,"dir":"Reference","previous_headings":"","what":"calculate the number of heterozygous SNPs for each sample — heterozygosity","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"calculate number heterozygous SNPs sample","code":""},{"path":"/reference/heterozygosity.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"","code":"heterozygosity(vcffile, region = \"\", samples = \"-\", pass = FALSE, qual = 0)"},{"path":"/reference/heterozygosity.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"vcffile path VCF file index region region extract, default \"\" samples samples extract, default \"-\" pass restrict variants FILTER==PASS qual restrict variants QUAL > qual.","code":""},{"path":"/reference/heterozygosity.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"list heterozygosity couts sample along id vcf header","code":""},{"path":"/reference/vcfcomp.html","id":null,"dir":"Reference","previous_headings":"","what":"Compare two VCF/BCF files reporting various statistics — vcfcomp","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"Compare two VCF/BCF files reporting various statistics","code":""},{"path":"/reference/vcfcomp.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"","code":"vcfcomp( test, truth, formats = c(\"DS\", \"GT\"), stats = \"r2\", by.sample = FALSE, by.variant = FALSE, flip = FALSE, names = NULL, bins = NULL, af = NULL, out = NULL, choose_random_start = FALSE, return_pse_sites = FALSE, ... )"},{"path":"/reference/vcfcomp.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"test path first VCF/BCF file referred test, saved RDS file. truth path second VCF/BCF file referred truth, saved RDS file. formats character vector. FORMAT tags extract test truth respectively. default c(\"DS\", \"GT\") extracts 'DS' target 'GT' truth. stats statistics calculated. supports following. \"r2\": pearson correlation coefficient ** 2. \"f1\": F1-score, good balance sensitivity precision. \"nrc\": Non-Reference Concordance rate \"pse\": Phasing Switch Error rate .sample logical. calculate concordance samples, average bins. .variant logical. calculate concordance variant, average bins. bysample variant TRUE, average samples first. bysample variant FALSE, average samples variants. flip logical. flip ref alt variants names character vector. reset samples' names test VCF. bins numeric vector. break statistics allele frequency bins. af file path allele frequency text file saved RDS file. output prefix saving objects RDS file choose_random_start choose random start stats=\"pse\" return_pse_sites boolean. return phasing switch error sites ... options passed vcftable","code":""},{"path":"/reference/vcfcomp.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"list various statistics","code":""},{"path":"/reference/vcfcomp.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"vcfcomp implements various statisitcs compare two VCF/BCF files, e.g. report genotype concocrdance, correlation stratified allele frequency.","code":""},{"path":"/reference/vcfcomp.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcfcomp.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"","code":"library('vcfppR') test <- system.file(\"extdata\", \"imputed.gt.vcf.gz\", package=\"vcfppR\") truth <- system.file(\"extdata\", \"imputed.gt.vcf.gz\", package=\"vcfppR\") samples <- \"HG00133,HG00143,HG00262\" res <- vcfcomp(test, truth, stats=\"f1\", format=c('GT','GT'), samples=samples) #> Warning: F1 should be used only for a sample with genotypes of all types, hom ref(0), het(1) and hom alt(2) str(res) #> List of 2 #> $ samples: chr [1:3] \"HG00133\" \"HG00143\" \"HG00262\" #> $ f1 : int [1:17, 1:3] 15 NA NA NA NA NA NA NA NA NA ... #> ..- attr(*, \"dimnames\")=List of 2 #> .. ..$ : chr [1:17] \"[0,1e-05]\" \"(1e-05,2e-05]\" \"(2e-05,5e-05]\" \"(5e-05,0.0001]\" ... #> .. ..$ : chr [1:3] \"n\" \"nA\" \"concordance\" #> - attr(*, \"class\")= chr \"vcfcomp\""},{"path":"/reference/vcfplot.html","id":null,"dir":"Reference","previous_headings":"","what":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","title":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","text":"Make sensible beautiful plots based various objects vcfppR","code":""},{"path":"/reference/vcfplot.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","text":"","code":"vcfplot( obj, what = \"r2\", which.sample = 1, pop = NULL, variant = c(\"SNP\", \"INDEL\"), ... )"},{"path":"/reference/vcfplot.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","text":"obj object returned vcfcomp statisitcs plotted .sample sample among plotted pop file contains population information variant type variant desired ... parameters passed graphics","code":""},{"path":"/reference/vcfpopgen.html","id":null,"dir":"Reference","previous_headings":"","what":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"count heterozygous sites per sample VCF/BCF","code":""},{"path":"/reference/vcfpopgen.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"","code":"vcfpopgen( vcffile, region = \"\", samples = \"-\", pass = FALSE, qual = 0, fun = \"heterozygosity\" )"},{"path":"/reference/vcfpopgen.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"vcffile path VCF/BCF file region region subset like bcftools samples samples subset like bcftools pass restrict variants FILTER==PASS qual restrict variants QUAL > qual. fun popgen function run. available functions \"heterozygosity\".","code":""},{"path":"/reference/vcfpopgen.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"vcfpopgen list containing following components: samples : character vector; samples ids VCF file subsetting hets : integer vector; counts heterozygous sites sample order samples","code":""},{"path":"/reference/vcfpopgen.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcfpopgen.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"","code":"library('vcfppR') vcffile <- system.file(\"extdata\", \"raw.gt.vcf.gz\", package=\"vcfppR\") res <- vcfpopgen(vcffile) str(res) #> List of 2 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ hets : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ..."},{"path":"/reference/vcfppR-package.html","id":null,"dir":"Reference","previous_headings":"","what":"vcfppR: Rapid Manipulation of the Variant Call Format (VCF) — vcfppR-package","title":"vcfppR: Rapid Manipulation of the Variant Call Format (VCF) — vcfppR-package","text":"'vcfpp.h' (https://github.com/Zilong-Li/vcfpp) provides easy--use 'C++' 'API' 'htslib', offering full functionality manipulating Variant Call Format (VCF) files. 'vcfppR' package serves R bindings 'vcfpp.h' library, enabling rapid processing compressed uncompressed VCF files. Explore range powerful features efficient VCF data manipulation.","code":""},{"path":[]},{"path":"/reference/vcfppR-package.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"vcfppR: Rapid Manipulation of the Variant Call Format (VCF) — vcfppR-package","text":"Maintainer: Zilong Li zilong.dk@gmail.com (ORCID) contributors: Bonfield, James K Marshall, John Danecek, Petr Li, Heng Ohan, Valeriu Whitwham, Andrew Keane, Thomas Davies, Robert M (Authors included htslib library) [copyright holder]","code":""},{"path":"/reference/vcfreader.html","id":null,"dir":"Reference","previous_headings":"","what":"API for manipulating the VCF/BCF. — vcfreader","title":"API for manipulating the VCF/BCF. — vcfreader","text":"Type name class see details methods","code":""},{"path":"/reference/vcfreader.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"API for manipulating the VCF/BCF. — vcfreader","text":"C++ class following fields/methods manipulating VCF/BCF","code":""},{"path":"/reference/vcfreader.html","id":"fields","dir":"Reference","previous_headings":"","what":"Fields","title":"API for manipulating the VCF/BCF. — vcfreader","text":"new Constructor given vcf file Parameter: vcffile - path vcf file new Constructor given vcf file region Parameter: vcffile - path vcf file Parameter: region - region constrained new Constructor given vcf file, region samples Parameter: vcffile - path vcf file Parameter: region - region constrained Parameter: samples - samples constrained. Comma separated list samples include (exclude \"^\" prefix). variant Try get next variant record. return FALSE variants hit end file, otherwise TRUE. chr Return CHROM field current variant pos Return POS field current variant id Return CHROM field current variant ref Return REF field current variant alt Return ALT field current variant qual Return QUAL field current variant filter Return FILTER field current variant info Return INFO field current variant infoInt Return tag value integer type INFO field current variant Parameter: tag - tag name retrieve INFO infoFloat Return tag value float type INFO field current variant Parameter: tag - tag name retrieve INFO infoStr Return tag value string type INFO field current variant Parameter: tag - tag name retrieve INFO infoIntVec Return tag value vector integer type INFO field current variant Parameter: tag - tag name retrieve INFO infoFloatVec Return tag value vector float type INFO field current variant Parameter: tag - tag name retrieve INFO genotypes Return genotype values vector integers Parameter: collapse - Boolean value indicates wheather collapse size genotypes, eg, return diploid genotypes. formatInt Return tag value integer type sample FORAMT field current variant Parameter: tag - tag name retrieve FORAMT formatFloat Return tag value float type sample FORAMT field current variant Parameter: tag - tag name retrieve FORAMT formatStr Return tag value string type sample FORAMT field current variant Parameter: tag - tag name retrieve FORAMT isSNP Test current variant exculsively SNP isIndel Test current variant exculsively INDEL isSV Test current variant exculsively SV isMultiAllelics Test current variant exculsively Multi Allelics isMultiAllelicSNP Test current variant exculsively Multi Biallelics (SNPs) hasSNP Test current variant SNP hasINDEL Test current variant INDEL hasINS Test current variant INS hasDEL Test current variant DEL hasMNP Test current variant MNP hasBND Test current variant BND hasOTHER Test current variant hasOVERLAP Test current variant OVERLAP nsamples Return number samples samples Return vector samples id header Return raw string vcf header string Return raw string current variant including newline line Return raw string current variant without newline output Init output object streaming variants another vcf write Streaming current variant output vcf close Close connection output vcf setCHR Modify CHR current variant Parameter: s - string CHR setID Modify ID current variant Parameter: s - string ID setPOS Modify POS current variant Parameter: pos - integer POS setRefAlt Modify REF ALT current variant Parameter: s - string reperated comma setInfoInt Modify given tag INT type INFO current variant Parameter: tag - string tag name Parameter: v - integer tag value setInfoFloat Modify given tag FLOAT type INFO current variant Parameter: tag - string tag name Parameter: v - double tag value setInfoStr Modify given tag STRING type INFO current variant Parameter: tag - string tag name Parameter: s - string tag value setPhasing Modify phasing status sample Parameter: v - integer vector size number samples. 1s 0s valid. setGenotypes Modify genotypes current variant Parameter: v - integer vector genotypes. Use NA -9 missing value. setFormatInt Modify given tag INT type FORMAT current variant Parameter: tag - string tag name Parameter: v - integer tag value setFormatFloat Modify given tag FLOAT type FORMAT current variant Parameter: tag - string tag name Parameter: v - double tag value setFormatStr Modify given tag STRING type FORMAT current variant Parameter: tag - string tag name Parameter: s - string tag value rmInfoTag Remove given tag INFO current variant Parameter: s - string tag name rmFormatTag Remove given tag FORMAT current variant Parameter: s - string tag name setVariant Modify current variant adding vcf line Parameter: s - string one line VCF addINFO Add INFO header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means addFORMAT Add FORMAT header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means","code":""},{"path":"/reference/vcfreader.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"API for manipulating the VCF/BCF. — vcfreader","text":"","code":"vcffile <- system.file(\"extdata\", \"raw.gt.vcf.gz\", package=\"vcfppR\") br <- vcfreader$new(vcffile) res <- rep(0L, br$nsamples()) while(br$variant()) { if(br$isSNP()) { gt <- br$genotypes(TRUE) == 1 gt[is.na(gt)] <- FALSE res <- res + gt } }"},{"path":"/reference/vcfsummary.html","id":null,"dir":"Reference","previous_headings":"","what":"summarize the various variant types at both variant level and sample level. — vcfsummary","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"summarize various variant types variant level sample level.","code":""},{"path":"/reference/vcfsummary.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"","code":"vcfsummary( vcffile, region = \"\", samples = \"-\", pass = FALSE, qual = 0, svtype = FALSE )"},{"path":"/reference/vcfsummary.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"vcffile path VCF/BCF file region region subset like bcftools samples samples subset like bcftools pass restrict variants FILTER==PASS qual restrict variants QUAL > qual. svtype summarize variants SVTYPE","code":""},{"path":"/reference/vcfsummary.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"vcfsummary list containing following components: summary : named integer vector; summarize counts variant type samples : character vector; samples ids VCF file subsetting vartype : integer vector; counts variant type sample level order samples","code":""},{"path":"/reference/vcfsummary.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"bcftools view -s \"id01,id02\" input.bcf.gz chr1:100000-20000","code":""},{"path":"/reference/vcfsummary.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcfsummary.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"","code":"library('vcfppR') svfile <- system.file(\"extdata\", \"sv.vcf.gz\", package=\"vcfppR\") res <- vcfsummary(svfile, region = \"chr21:1-10000000\", svtype = TRUE) str(res) #> List of 10 #> $ summary: Named int [1:10] 9 9 0 0 0 0 2 4 3 0 #> ..- attr(*, \"names\")= chr [1:10] \"ALL\" \"SV\" \"BND\" \"CNV\" ... #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ BND : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ CNV : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ CPX : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ CTX : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ DEL : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ DUP : int [1:3202] 0 1 0 0 0 0 0 0 0 0 ... #> $ INS : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ INV : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcfsummary\""},{"path":"/reference/vcftable.html","id":null,"dir":"Reference","previous_headings":"","what":"read VCF/BCF contents into R data structure — vcftable","title":"read VCF/BCF contents into R data structure — vcftable","text":"swiss army knife reading VCF/BCF R data types rapidly easily.","code":""},{"path":"/reference/vcftable.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"read VCF/BCF contents into R data structure — vcftable","text":"","code":"vcftable( vcffile, region = \"\", samples = \"-\", vartype = \"all\", format = \"GT\", ids = NULL, qual = 0, pass = FALSE, info = TRUE, collapse = TRUE, setid = FALSE, mac = 0 )"},{"path":"/reference/vcftable.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"read VCF/BCF contents into R data structure — vcftable","text":"vcffile path VCF/BCF file region region subset bcftools-like style: \"chr1\", \"chr1:1-10000000\" samples samples subset bcftools-like style. comma separated list samples include (exclude \"^\" prefix). e.g. \"id01,id02\", \"^id01,id02\". vartype restrict specific type variants. supports \"snps\",\"indels\", \"sv\", \"multisnps\",\"multiallelics\" format FORMAT tag extract. default \"GT\" extracted. ids character vector. restrict sites ID given vector. default NULL filter sites. qual numeric. restrict variants QUAL > qual. pass logical. restrict variants FILTER = \"PASS\". info logical. drop INFO column returned list. collapse logical. acts FORMAT. FORMAT extract \"GT\", dim raw genotypes matrix diploid (M, 2 * N), M #markers N #samples. default TRUE collapse genotypes sample matrix (M, N). Set FALSE one wants maintain phasing order, e.g. \"1|0\" parsed c(1, 0) collapse=FALSE. FORMAT extract \"GT\", collapse=TRUE try turn list extracted vector matrix. However, raises issues one variant mutliallelic resulting vaules others. setid logical. reset ID column CHR_POS_REF_ALT. mac integer. restrict variants minor allele count higher value.","code":""},{"path":"/reference/vcftable.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"read VCF/BCF contents into R data structure — vcftable","text":"Return list containing following components: samples : character vector; samples ids VCF file subsetting chr : character vector; CHR column VCF file pos : character vector; POS column VCF file id : character vector; ID column VCF file ref : character vector; REF column VCF file alt : character vector; ALT column VCF file qual : character vector; QUAL column VCF file filter : character vector; FILTER column VCF file info : character vector; INFO column VCF file format : matrix either integer numberic values depending tag extract; specifiy tag FORMAT column extracted","code":""},{"path":"/reference/vcftable.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"read VCF/BCF contents into R data structure — vcftable","text":"vcftable uses C++ API vcfpp, wrapper htslib, read VCF/BCF files. Thus, full functionalities htslib, restrict specific variant types, samples regions. memory efficiency reason, vcftable designed parse one tag time FORMAT column VCF. default, matrix genotypes, .e. \"GT\" tag, returned vcftable, many tags supported format option.","code":""},{"path":"/reference/vcftable.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"read VCF/BCF contents into R data structure — vcftable","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcftable.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"read VCF/BCF contents into R data structure — vcftable","text":"","code":"library('vcfppR') vcffile <- system.file(\"extdata\", \"raw.gt.vcf.gz\", package=\"vcfppR\") res <- vcftable(vcffile, \"chr21:1-5050000\", vartype = \"snps\") str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:12] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:12] 5030082 5030088 5030105 5030253 5030278 5030347 5030356 5030357 5030391 5030446 ... #> $ id : chr [1:12] \"chr21:5030082:G:A\" \"chr21:5030088:C:T\" \"chr21:5030105:C:A\" \"chr21:5030253:G:T\" ... #> $ ref : chr [1:12] \"G\" \"C\" \"C\" \"G\" ... #> $ alt : chr [1:12] \"A\" \"T\" \"A\" \"T\" ... #> $ qual : num [1:12] 70.1 2773.1 3897.8 102.6 868.9 ... #> $ filter : chr [1:12] \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" ... #> $ info : chr [1:12] \"AC=2;AF=0.000616523;AN=3244;DP=2498;FS=0;MLEAC=1;MLEAF=0.0003083;MQ=17.07;MQ0=0;QD=17.52;SOR=3.258;VQSLOD=-32.6\"| __truncated__ \"AC=127;AF=0.0400126;AN=3174;BaseQRankSum=0.736;ClippingRankSum=0.736;DP=2750;FS=0;InbreedingCoeff=0.0015;MLEAC=\"| __truncated__ \"AC=128;AF=0.0352811;AN=3628;BaseQRankSum=0.736;ClippingRankSum=0.727;DP=3476;FS=0;InbreedingCoeff=-0.0015;MLEAC\"| __truncated__ \"AC=1;AF=0.000165837;AN=6030;BaseQRankSum=-0.583;ClippingRankSum=-0.259;DP=19530;FS=0;InbreedingCoeff=-0.0274;ML\"| __truncated__ ... #> $ gt : int [1:12, 1:3202] NA 2 2 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcftable\""},{"path":"/reference/vcfwriter.html","id":null,"dir":"Reference","previous_headings":"","what":"API for writing the VCF/BCF. — vcfwriter","title":"API for writing the VCF/BCF. — vcfwriter","text":"Type name class see details methods","code":""},{"path":"/reference/vcfwriter.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"API for writing the VCF/BCF. — vcfwriter","text":"C++ class following fields/methods writing VCF/BCF","code":""},{"path":"/reference/vcfwriter.html","id":"fields","dir":"Reference","previous_headings":"","what":"Fields","title":"API for writing the VCF/BCF. — vcfwriter","text":"new Constructor given vcf file Parameter: vcffile - path vcf file. start \"~\" Parameter: version - version VCF specification addContig Add Contig header vcf Parameter: str - string CONTIG name addFILTER Add FILTER header vcf Parameter: id - string FILTER name Parameter: desc - string description means addINFO Add INFO header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means addFORMAT Add FORMAT header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means addSample Add SAMPLE header vcf Parameter: str - string SAMPLE name addLine Add line header vcf Parameter: str - string line header VCF writeline Write variant record given line Parameter: line - string line variant VCF. ended \"newline\" close Close save vcf file","code":""},{"path":"/reference/vcfwriter.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"API for writing the VCF/BCF. — vcfwriter","text":"","code":"outvcf <- file.path(paste0(tempfile(), \".vcf.gz\")) bw <- vcfwriter$new(outvcf, \"VCF4.1\") bw$addContig(\"chr20\") bw$addFORMAT(\"GT\", \"1\", \"String\", \"Genotype\"); bw$addSample(\"NA12878\") s1 <- \"chr20\\t2006060\\t.\\tG\\tC\\t100\\tPASS\\t.\\tGT\\t1|0\" bw$writeline(s1) bw$close()"},{"path":"/news/index.html","id":"vcfppr-045","dir":"Changelog","previous_headings":"","what":"vcfppR 0.4.5","title":"vcfppR 0.4.5","text":"CRAN release: 2024-04-08 add vcfcomp function fix memory leaks pass ASAN check","code":""},{"path":"/news/index.html","id":"vcfppr-040","dir":"Changelog","previous_headings":"","what":"vcfppR 0.4.0","title":"vcfppR 0.4.0","text":"CRAN release: 2024-02-26 add setid option vcftable patches upcoming Rtools windows","code":""},{"path":"/news/index.html","id":"vcfppr-038","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.8","title":"vcfppR 0.3.8","text":"CRAN release: 2024-01-14 fix issues M1 Mac","code":""},{"path":"/news/index.html","id":"vcfppr-037","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.7","title":"vcfppR 0.3.7","text":"add vcfreader@rmFormatTag() add vcfreader@samples() vcftable supports vartype = ‘sv’","code":""},{"path":"/news/index.html","id":"vcfppr-036","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.6","title":"vcfppR 0.3.6","text":"add vcfreader::line remove vcfreader::setVariant bug fix setFormatStr units tests","code":""},{"path":"/news/index.html","id":"vcfppr-035","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.5","title":"vcfppR 0.3.5","text":"CRAN release: 2023-12-14 add vcfreader vcfwriter","code":""},{"path":"/news/index.html","id":"vcfppr-034","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.4","title":"vcfppR 0.3.4","text":"support filters variant ID","code":""},{"path":"/news/index.html","id":"vcfppr-033","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.3","title":"vcfppR 0.3.3","text":"use API vcfpp.h v0.3.1 set missing vaules FORMAT NA support filters QUAL, FILTER INFO","code":""},{"path":"/news/index.html","id":"vcfppr-030","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.0","title":"vcfppR 0.3.0","text":"First release using vcfpp.h v0.3.0 add vcftable function add vcfsummary function add vcfpopgen function","code":""}] +[{"path":"/CONTRIBUTING.html","id":"contributing-to-vcfppr","dir":"","previous_headings":"","what":"Contributing to vcfppR","title":"NA","text":"Please see file Contributing details report issue: Minimally Complete () Verifiable Example (MCVE) helps lot; submit pull request: post issue first, get consensus ; follow (informal) coding style: simply files invent new style; nice NEWS.Rd","code":""},{"path":"/PULL_REQUEST_TEMPLATE.html","id":"pull-request-template-for-rcpp","dir":"","previous_headings":"","what":"Pull Request Template for Rcpp","title":"NA","text":"Please explain changes want apply Rcpp, preferably issue ticket create pull request. See file Contributing templates details.","code":""},{"path":"/PULL_REQUEST_TEMPLATE.html","id":"checklist","dir":"","previous_headings":"Pull Request Template for Rcpp","what":"Checklist","title":"NA","text":"Code compiles correctly R CMD check still passes tests Preferably, new tests added fail without change Document changes file ChangeLog","code":""},{"path":"/articles/concordance-of-two-vcf-files.html","id":"background","dir":"Articles","previous_headings":"","what":"Background","title":"Assess the concordance between VCFs","text":"benchmarking, ’s often need calculate concordance rate test set truth set. truth VCF file, always true genotypes GT otherwise can’t validate test VCF. test VCF may variant caller genotype imputation program, format can variable, e.g GP, DS GT. Hence, article guides use vcfppR::vcfcomp function rapidly examine various statistics different scenarios formats, Pearson correlation genotyping (stats=“r2”), Non-Reference Concordance (stats=“nrc”), F1-score (stats=“f1”) Phasing Switch Error (stats=“pse”).","code":""},{"path":"/articles/concordance-of-two-vcf-files.html","id":"case-1-genotype-imputation-accuracy","dir":"Articles","previous_headings":"","what":"Case 1: Genotype imputation accuracy","title":"Assess the concordance between VCFs","text":"normally get genotype posterior GP genotype dosage DS diploid imputation software, eg QUILT GLIMPSE. examine imputation accuracy, calculate Pearson correlation imputed genotype dosage true genotypes. vcfcomp, need specify desired stats=\"r2\" formats=c(\"DS\",\"GT\"), extract respective FORMAT items testvcf truthvcf. Besides, QUILT2-nipt method outputs MDS FDS maternal fetal genotype dosages constract DS diploid mode. assess imputation accuracy maternal fetal, need specify corresponding formats. Note: absence DS format testvcf, one can either fill DS tag using vcf_addDS command line tool manipulate testvcf R using vcftable.","code":"vcfcomp(testvcf, truthvcf, formats = c(\"DS\", \"GT\"), stats = \"r2\") vcfcomp(testvcf, truthvcf, formats = c(\"MDS\", \"GT\"), stats = \"r2\") vcfcomp(testvcf, truthvcf, formats = c(\"FDS\", \"GT\"), stats = \"r2\")"},{"path":"/articles/concordance-of-two-vcf-files.html","id":"case-2-genotype-concordance","dir":"Articles","previous_headings":"","what":"Case 2: Genotype concordance","title":"Assess the concordance between VCFs","text":"case, interested called genotype concordance sensitivity / specificity genotype calling. contrast stats=\"r2\", choose stats=\"f1\" stats=\"nrc\" specify formats=c(\"GT\", \"GT\"). Normally, want results sample, can achieved using .sample=TRUE.","code":"vcfcomp(testvcf, truthvcf, formats = c(\"GT\",\"GT\"), stats=\"nrc\", by.sample=TRUE) vcfcomp(testvcf, truthvcf, formats = c(\"GT\",\"GT\"), stats=\"f1\", by.sample=TRUE)"},{"path":"/articles/concordance-of-two-vcf-files.html","id":"case-3-phasing-switch-error","dir":"Articles","previous_headings":"","what":"Case 3: Phasing switch error","title":"Assess the concordance between VCFs","text":"case, look functionality assess phasing switch error. First , need two VCF files contain phased GT, represented ‘|’. can choose return sites pse. Note: Currently, pse statatics simple form doesn’t take completeness quality account.","code":"vcfcomp(testvcf, truthvcf, stats=\"pse\", return_pse_sites=TRUE)"},{"path":"/articles/concordance-of-two-vcf-files.html","id":"case-4-multiple-testing-repetitively","dir":"Articles","previous_headings":"","what":"Case 4: Multiple testing repetitively","title":"Assess the concordance between VCFs","text":"comprehensive benchmarking, often run many tests true sets. scenario, can save truth RDS object reuse . Actually, test truth can take RDS file input. RDS file stores object returned vcftable.","code":"saveRDS(vcftable(truthvcf), \"truth.rds\") vcfcomp(test=testvcf1, truth=\"truth.rds\") vcfcomp(test=testvcf2, truth=\"truth.rds\") vcfcomp(test=testvcf3, truth=\"truth.rds\")"},{"path":"/articles/concordance-of-two-vcf-files.html","id":"qa-how-to-fix-the-error-inconsistent-samples-name","dir":"Articles","previous_headings":"","what":"Q&A: How to fix the error “inconsistent samples name”","title":"Assess the concordance between VCFs","text":"one certain samples name testvcf can replaced names can match samples truthvcf. One can use names option specify vector new names can found truthvcf.","code":""},{"path":"/authors.html","id":null,"dir":"","previous_headings":"","what":"Authors","title":"Authors and Citation","text":"Zilong Li. Author, maintainer. Bonfield, James K Marshall, John Danecek, Petr Li, Heng Ohan, Valeriu Whitwham, Andrew Keane, Thomas Davies, Robert M. Copyright holder. Authors included htslib library","code":""},{"path":"/authors.html","id":"citation","dir":"","previous_headings":"","what":"Citation","title":"Authors and Citation","text":"Li Z (2024). “vcfpp: C++ API rapid processing variant call format.” Bioinformatics, 40(2), btae049. ISSN 1367-4811, doi:10.1093/bioinformatics/btae049.","code":"@Article{, title = {vcfpp: a C++ API for rapid processing of the variant call format}, author = {Zilong Li}, journal = {Bioinformatics}, volume = {40}, number = {2}, pages = {btae049}, year = {2024}, month = {01}, issn = {1367-4811}, abstract = {Given the widespread use of the variant call format (VCF/BCF) coupled with continuous surge in big data, there remains a perpetual demand for fast and flexible methods to manipulate these comprehensive formats across various programming languages.This work presents vcfpp, a C++ API of HTSlib in a single file, providing an intuitive interface to manipulate VCF/BCF files rapidly and safely, in addition to being portable. Moreover, this work introduces the vcfppR package to demonstrate the development of a high-performance R package with vcfpp, allowing for rapid and straightforward variants analyses.vcfpp is available from https://github.com/Zilong-Li/vcfpp under MIT license. vcfppR is available from https://cran.r-project.org/web/packages/vcfppR.}, doi = {10.1093/bioinformatics/btae049}, }"},{"path":"/index.html","id":"vcfppr-rapid-manipulation-of-the-vcfbcf-file","dir":"","previous_headings":"","what":"Rapid Manipulation of the Variant Call Format (VCF)","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"vcfppR package implements various powerful functions fast genomics analyses VCF/BCF files using C++ API vcfpp.h. Load/save content VCF/BCF R objects highly customizable options Visualize chracterize variants Compare two VCF/BCF files report various statistics Streaming read/write VCF/BCF files fine control everything Paper shows vcfppR 20x faster vcfR. Also, much faster cyvcf2","code":""},{"path":"/index.html","id":"installation","dir":"","previous_headings":"","what":"Installation","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"","code":"## install.package(\"vcfppR\") ## from CRAN remotes::install_github(\"Zilong-Li/vcfppR\") ## from latest github"},{"path":"/index.html","id":"cite-the-work","dir":"","previous_headings":"","what":"Cite the work","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"find useful, please cite paper","code":"library(vcfppR) citation(\"vcfppR\") #> To cite package 'vcfppR' in publications use: #> #> Li Z (2024). \"vcfpp: a C++ API for rapid processing of the variant #> call format.\" _Bioinformatics_, *40*(2), btae049. ISSN 1367-4811, #> doi:10.1093/bioinformatics/btae049 #> . #> #> A BibTeX entry for LaTeX users is #> #> @Article{, #> title = {vcfpp: a C++ API for rapid processing of the variant call format}, #> author = {Zilong Li}, #> journal = {Bioinformatics}, #> volume = {40}, #> number = {2}, #> pages = {btae049}, #> year = {2024}, #> month = {01}, #> issn = {1367-4811}, #> abstract = {Given the widespread use of the variant call format (VCF/BCF) coupled with continuous surge in big data, there remains a perpetual demand for fast and flexible methods to manipulate these comprehensive formats across various programming languages.This work presents vcfpp, a C++ API of HTSlib in a single file, providing an intuitive interface to manipulate VCF/BCF files rapidly and safely, in addition to being portable. Moreover, this work introduces the vcfppR package to demonstrate the development of a high-performance R package with vcfpp, allowing for rapid and straightforward variants analyses.vcfpp is available from https://github.com/Zilong-Li/vcfpp under MIT license. vcfppR is available from https://cran.r-project.org/web/packages/vcfppR.}, #> doi = {10.1093/bioinformatics/btae049}, #> }"},{"path":"/index.html","id":"url-as-filename","dir":"","previous_headings":"","what":"URL as filename","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"functions vcfppR support URL filename VCF/BCF files.","code":"phasedvcf <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/working/20220422_3202_phased_SNV_INDEL_SV/1kGP_high_coverage_Illumina.chr21.filtered.SNV_INDEL_SV_phased_panel.vcf.gz\" rawvcf <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/working/20201028_3202_raw_GT_with_annot/20201028_CCDG_14151_B01_GRM_WGS_2020-08-05_chr21.recalibrated_variants.vcf.gz\" svfile <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/working/20210124.SV_Illumina_Integration/1KGP_3202.gatksv_svtools_novelins.freeze_V3.wAF.vcf.gz\" popfile <- \"https://ftp.1000genomes.ebi.ac.uk/vol1/ftp/data_collections/1000G_2504_high_coverage/20130606_g1k_3202_samples_ped_population.txt\""},{"path":"/index.html","id":"vcfcomp-compare-two-vcf-files-and-report-concordance","dir":"","previous_headings":"","what":"vcfcomp: compare two VCF files and report concordance","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"Want investigate concordance two VCF files? vcfcomp utility function need! example, benchmarkings, intend calculate genotype correlation test truth. Check vignettes !","code":"res <- vcfcomp(test = rawvcf, truth = phasedvcf, region = \"chr21:1-5100000\", stats = \"r2\", formats = c(\"GT\",\"GT\")) par(mar=c(5,5,2,2), cex.lab = 2) vcfplot(res, what = \"r2\", col = 2, cex = 3, lwd = 4, type = \"b\") #> input is an object with vcfcomp class"},{"path":"/index.html","id":"vcfsummary-variants-characterization","dir":"","previous_headings":"","what":"vcfsummary: variants characterization","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"Want summarize variants discovered genotype caller e.g. GATK? vcfsummary utility function need! Small variants Complex structure variants","code":"res <- vcfsummary(rawvcf,\"chr21:10000000-10010000\") vcfplot(res, pop = popfile, col = 1:5, main = \"Number of SNP & INDEL variants per population\") #> input is an object with vcfsummary class res <- vcfsummary(svfile, svtype = TRUE, region = \"chr20\") vcfplot(res, main = \"Structure Variant Counts\", col = 1:7) #> input is an object with vcfsummary class"},{"path":"/index.html","id":"vcftable-read-vcf-as-tabular-data","dir":"","previous_headings":"","what":"vcftable: read VCF as tabular data","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"vcftable gives fine control want extract VCF/BCF files. Read SNP variants Read SNP variants PL format drop INFO column VCF/BCF Read INDEL variants DP format VCF/BCF","code":"res <- vcftable(phasedvcf, \"chr21:1-5100000\", vartype = \"snps\") str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:194] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:194] 5030578 5030588 5030596 5030673 5030957 5030960 5031004 5031031 5031194 5031224 ... #> $ id : chr [1:194] \"21:5030578:C:T\" \"21:5030588:T:C\" \"21:5030596:A:G\" \"21:5030673:G:A\" ... #> $ ref : chr [1:194] \"C\" \"T\" \"A\" \"G\" ... #> $ alt : chr [1:194] \"T\" \"C\" \"G\" \"A\" ... #> $ qual : num [1:194] 2.14e+09 2.14e+09 2.14e+09 2.14e+09 2.14e+09 ... #> $ filter : chr [1:194] \".\" \".\" \".\" \".\" ... #> $ info : chr [1:194] \"AC=74;AF=0.0115553;CM=0;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_unrel=1006;AN\"| __truncated__ \"AC=53;AF=0.00827608;CM=1.78789e-05;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_un\"| __truncated__ \"AC=2;AF=0.000312305;CM=3.21821e-05;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_un\"| __truncated__ \"AC=2;AF=0.000312305;CM=0.00016985;AN=6404;AN_EAS=1170;AN_AMR=980;AN_EUR=1266;AN_AFR=1786;AN_SAS=1202;AN_EUR_unr\"| __truncated__ ... #> $ gt : int [1:194, 1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcftable\" res <- vcftable(rawvcf, \"chr21:1-5100000\", vartype = \"snps\", format = \"PL\", info = FALSE) str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:1383] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:1383] 5030082 5030088 5030105 5030253 5030278 5030347 5030356 5030357 5030391 5030446 ... #> $ id : chr [1:1383] \".\" \".\" \".\" \".\" ... #> $ ref : chr [1:1383] \"G\" \"C\" \"C\" \"G\" ... #> $ alt : chr [1:1383] \"A\" \"T\" \"A\" \"T\" ... #> $ qual : num [1:1383] 70.1 2773.1 3897.8 102.6 868.9 ... #> $ filter : chr [1:1383] \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" ... #> $ info : chr(0) #> $ PL : int [1:1383, 1:9606] NA 64 64 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcftable\" res <- vcftable(rawvcf, \"chr21:1-5100000\", vartype = \"indels\", format = \"DP\") str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:195] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:195] 5030240 5030912 5030937 5031018 5031125 5031147 5031747 5031881 5031919 5031984 ... #> $ id : chr [1:195] \".\" \".\" \".\" \".\" ... #> $ ref : chr [1:195] \"AC\" \"CA\" \"T\" \"C\" ... #> $ alt : chr [1:195] \"A\" \"C\" \"TGGTGCACGCCTGCAGTCCCGGC\" \"CCTATGATCACACCGT\" ... #> $ qual : num [1:195] 6872 321 233 270 58361 ... #> $ filter : chr [1:195] \"VQSRTrancheINDEL99.00to100.00\" \"PASS\" \"PASS\" \"PASS\" ... #> $ info : chr [1:195] \"AC=82;AF=0.0136439;AN=6010;BaseQRankSum=-0.55;ClippingRankSum=0;DP=18067;FS=0;InbreedingCoeff=0.0664;MLEAC=76;M\"| __truncated__ \"AC=19;AF=0.0030586;AN=6212;BaseQRankSum=0.358;ClippingRankSum=-0.594;DP=30725;FS=44.58;InbreedingCoeff=-1.1608;\"| __truncated__ \"AC=1;AF=0.00015753;AN=6348;BaseQRankSum=-1.793;ClippingRankSum=-0.48;DP=32486;FS=27.337;InbreedingCoeff=-0.0212\"| __truncated__ \"AC=2;AF=0.000314268;AN=6364;BaseQRankSum=1.59;ClippingRankSum=0.358;DP=44916;FS=0;InbreedingCoeff=-0.0092;MLEAC\"| __truncated__ ... #> $ DP : int [1:195, 1:3202] 3 15 13 16 19 20 5 34 29 24 ... #> - attr(*, \"class\")= chr \"vcftable\""},{"path":"/index.html","id":"r-api-of-vcfpph","dir":"","previous_headings":"","what":"R API of vcfpp.h","title":"Rapid Manipulation of the Variant Call Format (VCF)","text":"two classes .e. vcfreader vcfwriter offering full R-bindings vcfpp.h. Check examples tests folder refer manual.","code":"?vcfppR::vcfreader"},{"path":"/reference/heterozygosity.html","id":null,"dir":"Reference","previous_headings":"","what":"calculate the number of heterozygous SNPs for each sample — heterozygosity","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"calculate number heterozygous SNPs sample","code":""},{"path":"/reference/heterozygosity.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"","code":"heterozygosity(vcffile, region = \"\", samples = \"-\", pass = FALSE, qual = 0)"},{"path":"/reference/heterozygosity.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"vcffile path VCF file index region region extract, default \"\" samples samples extract, default \"-\" pass restrict variants FILTER==PASS qual restrict variants QUAL > qual.","code":""},{"path":"/reference/heterozygosity.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"calculate the number of heterozygous SNPs for each sample — heterozygosity","text":"list heterozygosity couts sample along id vcf header","code":""},{"path":"/reference/vcfcomp.html","id":null,"dir":"Reference","previous_headings":"","what":"Compare two VCF/BCF files reporting various statistics — vcfcomp","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"Compare two VCF/BCF files reporting various statistics","code":""},{"path":"/reference/vcfcomp.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"","code":"vcfcomp( test, truth, formats = c(\"DS\", \"GT\"), stats = \"r2\", by.sample = FALSE, by.variant = FALSE, flip = FALSE, names = NULL, bins = NULL, af = NULL, out = NULL, choose_random_start = FALSE, return_pse_sites = FALSE, ... )"},{"path":"/reference/vcfcomp.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"test path first VCF/BCF file referred test, saved RDS file. truth path second VCF/BCF file referred truth, saved RDS file. formats character vector. FORMAT tags extract test truth respectively. default c(\"DS\", \"GT\") extracts 'DS' target 'GT' truth. stats statistics calculated. supports following. \"r2\": pearson correlation coefficient ** 2. \"f1\": F1-score, good balance sensitivity precision. \"nrc\": Non-Reference Concordance rate \"pse\": Phasing Switch Error rate .sample logical. calculate concordance samples, average bins. .variant logical. calculate concordance variant, average bins. bysample variant TRUE, average samples first. bysample variant FALSE, average samples variants. flip logical. flip ref alt variants names character vector. reset samples' names test VCF. bins numeric vector. break statistics allele frequency bins. af file path allele frequency text file saved RDS file. output prefix saving objects RDS file choose_random_start choose random start stats=\"pse\" return_pse_sites boolean. return phasing switch error sites ... options passed vcftable","code":""},{"path":"/reference/vcfcomp.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"list various statistics","code":""},{"path":"/reference/vcfcomp.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"vcfcomp implements various statisitcs compare two VCF/BCF files, e.g. report genotype concocrdance, correlation stratified allele frequency.","code":""},{"path":"/reference/vcfcomp.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcfcomp.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Compare two VCF/BCF files reporting various statistics — vcfcomp","text":"","code":"library('vcfppR') test <- system.file(\"extdata\", \"imputed.gt.vcf.gz\", package=\"vcfppR\") truth <- system.file(\"extdata\", \"imputed.gt.vcf.gz\", package=\"vcfppR\") samples <- \"HG00133,HG00143,HG00262\" res <- vcfcomp(test, truth, stats=\"f1\", format=c('GT','GT'), samples=samples) #> Warning: F1 should be used only for a sample with genotypes of all types, hom ref(0), het(1) and hom alt(2) str(res) #> List of 2 #> $ samples: chr [1:3] \"HG00133\" \"HG00143\" \"HG00262\" #> $ f1 : int [1:17, 1:3] 15 NA NA NA NA NA NA NA NA NA ... #> ..- attr(*, \"dimnames\")=List of 2 #> .. ..$ : chr [1:17] \"[0,1e-05]\" \"(1e-05,2e-05]\" \"(2e-05,5e-05]\" \"(5e-05,0.0001]\" ... #> .. ..$ : chr [1:3] \"n\" \"nA\" \"concordance\" #> - attr(*, \"class\")= chr \"vcfcomp\""},{"path":"/reference/vcfplot.html","id":null,"dir":"Reference","previous_headings":"","what":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","title":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","text":"Make sensible beautiful plots based various objects vcfppR","code":""},{"path":"/reference/vcfplot.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","text":"","code":"vcfplot( obj, what = \"r2\", which.sample = 1, pop = NULL, variant = c(\"SNP\", \"INDEL\"), ... )"},{"path":"/reference/vcfplot.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Make sensible and beautiful plots based on various objects in vcfppR — vcfplot","text":"obj object returned vcfcomp statisitcs plotted .sample sample among plotted pop file contains population information variant type variant desired ... parameters passed graphics","code":""},{"path":"/reference/vcfpopgen.html","id":null,"dir":"Reference","previous_headings":"","what":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"count heterozygous sites per sample VCF/BCF","code":""},{"path":"/reference/vcfpopgen.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"","code":"vcfpopgen( vcffile, region = \"\", samples = \"-\", pass = FALSE, qual = 0, fun = \"heterozygosity\" )"},{"path":"/reference/vcfpopgen.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"vcffile path VCF/BCF file region region subset like bcftools samples samples subset like bcftools pass restrict variants FILTER==PASS qual restrict variants QUAL > qual. fun popgen function run. available functions \"heterozygosity\".","code":""},{"path":"/reference/vcfpopgen.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"vcfpopgen list containing following components: samples : character vector; samples ids VCF file subsetting hets : integer vector; counts heterozygous sites sample order samples","code":""},{"path":"/reference/vcfpopgen.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcfpopgen.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"count the heterozygous sites per sample in the VCF/BCF — vcfpopgen","text":"","code":"library('vcfppR') vcffile <- system.file(\"extdata\", \"raw.gt.vcf.gz\", package=\"vcfppR\") res <- vcfpopgen(vcffile) str(res) #> List of 2 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ hets : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ..."},{"path":"/reference/vcfppR-package.html","id":null,"dir":"Reference","previous_headings":"","what":"vcfppR: Rapid Manipulation of the Variant Call Format (VCF) — vcfppR-package","title":"vcfppR: Rapid Manipulation of the Variant Call Format (VCF) — vcfppR-package","text":"'vcfpp.h' (https://github.com/Zilong-Li/vcfpp) provides easy--use 'C++' 'API' 'htslib', offering full functionality manipulating Variant Call Format (VCF) files. 'vcfppR' package serves R bindings 'vcfpp.h' library, enabling rapid processing compressed uncompressed VCF files. Explore range powerful features efficient VCF data manipulation.","code":""},{"path":[]},{"path":"/reference/vcfppR-package.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"vcfppR: Rapid Manipulation of the Variant Call Format (VCF) — vcfppR-package","text":"Maintainer: Zilong Li zilong.dk@gmail.com (ORCID) contributors: Bonfield, James K Marshall, John Danecek, Petr Li, Heng Ohan, Valeriu Whitwham, Andrew Keane, Thomas Davies, Robert M (Authors included htslib library) [copyright holder]","code":""},{"path":"/reference/vcfreader.html","id":null,"dir":"Reference","previous_headings":"","what":"API for manipulating the VCF/BCF. — vcfreader","title":"API for manipulating the VCF/BCF. — vcfreader","text":"Type name class see details methods","code":""},{"path":"/reference/vcfreader.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"API for manipulating the VCF/BCF. — vcfreader","text":"C++ class following fields/methods manipulating VCF/BCF","code":""},{"path":"/reference/vcfreader.html","id":"fields","dir":"Reference","previous_headings":"","what":"Fields","title":"API for manipulating the VCF/BCF. — vcfreader","text":"new Constructor given vcf file Parameter: vcffile - path vcf file new Constructor given vcf file region Parameter: vcffile - path vcf file Parameter: region - region constrained new Constructor given vcf file, region samples Parameter: vcffile - path vcf file Parameter: region - region constrained Parameter: samples - samples constrained. Comma separated list samples include (exclude \"^\" prefix). variant Try get next variant record. return FALSE variants hit end file, otherwise TRUE. chr Return CHROM field current variant pos Return POS field current variant id Return CHROM field current variant ref Return REF field current variant alt Return ALT field current variant qual Return QUAL field current variant filter Return FILTER field current variant info Return INFO field current variant infoInt Return tag value integer type INFO field current variant Parameter: tag - tag name retrieve INFO infoFloat Return tag value float type INFO field current variant Parameter: tag - tag name retrieve INFO infoStr Return tag value string type INFO field current variant Parameter: tag - tag name retrieve INFO infoIntVec Return tag value vector integer type INFO field current variant Parameter: tag - tag name retrieve INFO infoFloatVec Return tag value vector float type INFO field current variant Parameter: tag - tag name retrieve INFO genotypes Return genotype values vector integers Parameter: collapse - Boolean value indicates wheather collapse size genotypes, eg, return diploid genotypes. formatInt Return tag value integer type sample FORAMT field current variant Parameter: tag - tag name retrieve FORAMT formatFloat Return tag value float type sample FORAMT field current variant Parameter: tag - tag name retrieve FORAMT formatStr Return tag value string type sample FORAMT field current variant Parameter: tag - tag name retrieve FORAMT isSNP Test current variant exculsively SNP isIndel Test current variant exculsively INDEL isSV Test current variant exculsively SV isMultiAllelics Test current variant exculsively Multi Allelics isMultiAllelicSNP Test current variant exculsively Multi Biallelics (SNPs) hasSNP Test current variant SNP hasINDEL Test current variant INDEL hasINS Test current variant INS hasDEL Test current variant DEL hasMNP Test current variant MNP hasBND Test current variant BND hasOTHER Test current variant hasOVERLAP Test current variant OVERLAP nsamples Return number samples samples Return vector samples id header Return raw string vcf header string Return raw string current variant including newline line Return raw string current variant without newline output Init output object streaming variants another vcf write Streaming current variant output vcf close Close connection output vcf setCHR Modify CHR current variant Parameter: s - string CHR setID Modify ID current variant Parameter: s - string ID setPOS Modify POS current variant Parameter: pos - integer POS setRefAlt Modify REF ALT current variant Parameter: s - string reperated comma setInfoInt Modify given tag INT type INFO current variant Parameter: tag - string tag name Parameter: v - integer tag value setInfoFloat Modify given tag FLOAT type INFO current variant Parameter: tag - string tag name Parameter: v - double tag value setInfoStr Modify given tag STRING type INFO current variant Parameter: tag - string tag name Parameter: s - string tag value setPhasing Modify phasing status sample Parameter: v - integer vector size number samples. 1s 0s valid. setGenotypes Modify genotypes current variant Parameter: v - integer vector genotypes. Use NA -9 missing value. setFormatInt Modify given tag INT type FORMAT current variant Parameter: tag - string tag name Parameter: v - integer tag value setFormatFloat Modify given tag FLOAT type FORMAT current variant Parameter: tag - string tag name Parameter: v - double tag value setFormatStr Modify given tag STRING type FORMAT current variant Parameter: tag - string tag name Parameter: s - string tag value rmInfoTag Remove given tag INFO current variant Parameter: s - string tag name rmFormatTag Remove given tag FORMAT current variant Parameter: s - string tag name setVariant Modify current variant adding vcf line Parameter: s - string one line VCF addINFO Add INFO header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means addFORMAT Add FORMAT header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means","code":""},{"path":"/reference/vcfreader.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"API for manipulating the VCF/BCF. — vcfreader","text":"","code":"vcffile <- system.file(\"extdata\", \"raw.gt.vcf.gz\", package=\"vcfppR\") br <- vcfreader$new(vcffile) res <- rep(0L, br$nsamples()) while(br$variant()) { if(br$isSNP()) { gt <- br$genotypes(TRUE) == 1 gt[is.na(gt)] <- FALSE res <- res + gt } }"},{"path":"/reference/vcfsummary.html","id":null,"dir":"Reference","previous_headings":"","what":"summarize the various variant types at both variant level and sample level. — vcfsummary","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"summarize various variant types variant level sample level.","code":""},{"path":"/reference/vcfsummary.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"","code":"vcfsummary( vcffile, region = \"\", samples = \"-\", pass = FALSE, qual = 0, svtype = FALSE )"},{"path":"/reference/vcfsummary.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"vcffile path VCF/BCF file region region subset like bcftools samples samples subset like bcftools pass restrict variants FILTER==PASS qual restrict variants QUAL > qual. svtype summarize variants SVTYPE","code":""},{"path":"/reference/vcfsummary.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"vcfsummary list containing following components: summary : named integer vector; summarize counts variant type samples : character vector; samples ids VCF file subsetting vartype : integer vector; counts variant type sample level order samples","code":""},{"path":"/reference/vcfsummary.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"bcftools view -s \"id01,id02\" input.bcf.gz chr1:100000-20000","code":""},{"path":"/reference/vcfsummary.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcfsummary.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"summarize the various variant types at both variant level and sample level. — vcfsummary","text":"","code":"library('vcfppR') svfile <- system.file(\"extdata\", \"sv.vcf.gz\", package=\"vcfppR\") res <- vcfsummary(svfile, region = \"chr21:1-10000000\", svtype = TRUE) str(res) #> List of 10 #> $ summary: Named int [1:10] 9 9 0 0 0 0 2 4 3 0 #> ..- attr(*, \"names\")= chr [1:10] \"ALL\" \"SV\" \"BND\" \"CNV\" ... #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ BND : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ CNV : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ CPX : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ CTX : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ DEL : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ DUP : int [1:3202] 0 1 0 0 0 0 0 0 0 0 ... #> $ INS : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> $ INV : int [1:3202] 0 0 0 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcfsummary\""},{"path":"/reference/vcftable.html","id":null,"dir":"Reference","previous_headings":"","what":"read VCF/BCF contents into R data structure — vcftable","title":"read VCF/BCF contents into R data structure — vcftable","text":"swiss army knife reading VCF/BCF R data types rapidly easily.","code":""},{"path":"/reference/vcftable.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"read VCF/BCF contents into R data structure — vcftable","text":"","code":"vcftable( vcffile, region = \"\", samples = \"-\", vartype = \"all\", format = \"GT\", ids = NULL, qual = 0, pass = FALSE, info = TRUE, collapse = TRUE, setid = FALSE, mac = 0 )"},{"path":"/reference/vcftable.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"read VCF/BCF contents into R data structure — vcftable","text":"vcffile path VCF/BCF file region region subset bcftools-like style: \"chr1\", \"chr1:1-10000000\" samples samples subset bcftools-like style. comma separated list samples include (exclude \"^\" prefix). e.g. \"id01,id02\", \"^id01,id02\". vartype restrict specific type variants. supports \"snps\",\"indels\", \"sv\", \"multisnps\",\"multiallelics\" format FORMAT tag extract. default \"GT\" extracted. ids character vector. restrict sites ID given vector. default NULL filter sites. qual numeric. restrict variants QUAL > qual. pass logical. restrict variants FILTER = \"PASS\". info logical. drop INFO column returned list. collapse logical. acts FORMAT. FORMAT extract \"GT\", dim raw genotypes matrix diploid (M, 2 * N), M #markers N #samples. default TRUE collapse genotypes sample matrix (M, N). Set FALSE one wants maintain phasing order, e.g. \"1|0\" parsed c(1, 0) collapse=FALSE. FORMAT extract \"GT\", collapse=TRUE try turn list extracted vector matrix. However, raises issues one variant mutliallelic resulting vaules others. setid logical. reset ID column CHR_POS_REF_ALT. mac integer. restrict variants minor allele count higher value.","code":""},{"path":"/reference/vcftable.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"read VCF/BCF contents into R data structure — vcftable","text":"Return list containing following components: samples : character vector; samples ids VCF file subsetting chr : character vector; CHR column VCF file pos : character vector; POS column VCF file id : character vector; ID column VCF file ref : character vector; REF column VCF file alt : character vector; ALT column VCF file qual : character vector; QUAL column VCF file filter : character vector; FILTER column VCF file info : character vector; INFO column VCF file format : matrix either integer numberic values depending tag extract; specifiy tag FORMAT column extracted","code":""},{"path":"/reference/vcftable.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"read VCF/BCF contents into R data structure — vcftable","text":"vcftable uses C++ API vcfpp, wrapper htslib, read VCF/BCF files. Thus, full functionalities htslib, restrict specific variant types, samples regions. memory efficiency reason, vcftable designed parse one tag time FORMAT column VCF. default, matrix genotypes, .e. \"GT\" tag, returned vcftable, many tags supported format option.","code":""},{"path":"/reference/vcftable.html","id":"author","dir":"Reference","previous_headings":"","what":"Author","title":"read VCF/BCF contents into R data structure — vcftable","text":"Zilong Li zilong.dk@gmail.com","code":""},{"path":"/reference/vcftable.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"read VCF/BCF contents into R data structure — vcftable","text":"","code":"library('vcfppR') vcffile <- system.file(\"extdata\", \"raw.gt.vcf.gz\", package=\"vcfppR\") res <- vcftable(vcffile, \"chr21:1-5050000\", vartype = \"snps\") str(res) #> List of 10 #> $ samples: chr [1:3202] \"HG00096\" \"HG00097\" \"HG00099\" \"HG00100\" ... #> $ chr : chr [1:12] \"chr21\" \"chr21\" \"chr21\" \"chr21\" ... #> $ pos : int [1:12] 5030082 5030088 5030105 5030253 5030278 5030347 5030356 5030357 5030391 5030446 ... #> $ id : chr [1:12] \"chr21:5030082:G:A\" \"chr21:5030088:C:T\" \"chr21:5030105:C:A\" \"chr21:5030253:G:T\" ... #> $ ref : chr [1:12] \"G\" \"C\" \"C\" \"G\" ... #> $ alt : chr [1:12] \"A\" \"T\" \"A\" \"T\" ... #> $ qual : num [1:12] 70.1 2773.1 3897.8 102.6 868.9 ... #> $ filter : chr [1:12] \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" \"VQSRTrancheSNP99.80to100.00\" ... #> $ info : chr [1:12] \"AC=2;AF=0.000616523;AN=3244;DP=2498;FS=0;MLEAC=1;MLEAF=0.0003083;MQ=17.07;MQ0=0;QD=17.52;SOR=3.258;VQSLOD=-32.6\"| __truncated__ \"AC=127;AF=0.0400126;AN=3174;BaseQRankSum=0.736;ClippingRankSum=0.736;DP=2750;FS=0;InbreedingCoeff=0.0015;MLEAC=\"| __truncated__ \"AC=128;AF=0.0352811;AN=3628;BaseQRankSum=0.736;ClippingRankSum=0.727;DP=3476;FS=0;InbreedingCoeff=-0.0015;MLEAC\"| __truncated__ \"AC=1;AF=0.000165837;AN=6030;BaseQRankSum=-0.583;ClippingRankSum=-0.259;DP=19530;FS=0;InbreedingCoeff=-0.0274;ML\"| __truncated__ ... #> $ gt : int [1:12, 1:3202] NA 2 2 0 0 0 0 0 0 0 ... #> - attr(*, \"class\")= chr \"vcftable\""},{"path":"/reference/vcfwriter.html","id":null,"dir":"Reference","previous_headings":"","what":"API for writing the VCF/BCF. — vcfwriter","title":"API for writing the VCF/BCF. — vcfwriter","text":"Type name class see details methods","code":""},{"path":"/reference/vcfwriter.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"API for writing the VCF/BCF. — vcfwriter","text":"C++ class following fields/methods writing VCF/BCF","code":""},{"path":"/reference/vcfwriter.html","id":"fields","dir":"Reference","previous_headings":"","what":"Fields","title":"API for writing the VCF/BCF. — vcfwriter","text":"new Constructor given vcf file Parameter: vcffile - path vcf file. start \"~\" Parameter: version - version VCF specification addContig Add Contig header vcf Parameter: str - string CONTIG name addFILTER Add FILTER header vcf Parameter: id - string FILTER name Parameter: desc - string description means addINFO Add INFO header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means addFORMAT Add FORMAT header vcf Parameter: id - string tag name Parameter: number - string number Parameter: type - string type Parameter: desc - string description means addSample Add SAMPLE header vcf Parameter: str - string SAMPLE name addLine Add line header vcf Parameter: str - string line header VCF writeline Write variant record given line Parameter: line - string line variant VCF. ended \"newline\" close Close save vcf file","code":""},{"path":"/reference/vcfwriter.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"API for writing the VCF/BCF. — vcfwriter","text":"","code":"outvcf <- file.path(paste0(tempfile(), \".vcf.gz\")) bw <- vcfwriter$new(outvcf, \"VCF4.1\") bw$addContig(\"chr20\") bw$addFORMAT(\"GT\", \"1\", \"String\", \"Genotype\"); bw$addSample(\"NA12878\") s1 <- \"chr20\\t2006060\\t.\\tG\\tC\\t100\\tPASS\\t.\\tGT\\t1|0\" bw$writeline(s1) bw$close()"},{"path":"/news/index.html","id":"vcfppr-045","dir":"Changelog","previous_headings":"","what":"vcfppR 0.4.5","title":"vcfppR 0.4.5","text":"CRAN release: 2024-04-08 add vcfcomp function fix memory leaks pass ASAN check","code":""},{"path":"/news/index.html","id":"vcfppr-040","dir":"Changelog","previous_headings":"","what":"vcfppR 0.4.0","title":"vcfppR 0.4.0","text":"CRAN release: 2024-02-26 add setid option vcftable patches upcoming Rtools windows","code":""},{"path":"/news/index.html","id":"vcfppr-038","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.8","title":"vcfppR 0.3.8","text":"CRAN release: 2024-01-14 fix issues M1 Mac","code":""},{"path":"/news/index.html","id":"vcfppr-037","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.7","title":"vcfppR 0.3.7","text":"add vcfreader@rmFormatTag() add vcfreader@samples() vcftable supports vartype = ‘sv’","code":""},{"path":"/news/index.html","id":"vcfppr-036","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.6","title":"vcfppR 0.3.6","text":"add vcfreader::line remove vcfreader::setVariant bug fix setFormatStr units tests","code":""},{"path":"/news/index.html","id":"vcfppr-035","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.5","title":"vcfppR 0.3.5","text":"CRAN release: 2023-12-14 add vcfreader vcfwriter","code":""},{"path":"/news/index.html","id":"vcfppr-034","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.4","title":"vcfppR 0.3.4","text":"support filters variant ID","code":""},{"path":"/news/index.html","id":"vcfppr-033","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.3","title":"vcfppR 0.3.3","text":"use API vcfpp.h v0.3.1 set missing vaules FORMAT NA support filters QUAL, FILTER INFO","code":""},{"path":"/news/index.html","id":"vcfppr-030","dir":"Changelog","previous_headings":"","what":"vcfppR 0.3.0","title":"vcfppR 0.3.0","text":"First release using vcfpp.h v0.3.0 add vcftable function add vcfsummary function add vcfpopgen function","code":""}]