Namespace(genes='/oak/stanford/groups/akundaje/soumyak/refs/gencode/hg38/hg38.gencode.protein_coding.tss.bed', list='/oak/stanford/groups/akundaje/projects/neuro-variants/variant_summary/asd/ameen_2022/K562_bias/ameen_2022.vEC.mean.variant_scores.tsv', out_prefix='/oak/stanford/groups/akundaje/projects/neuro-variants/variant_annotations/asd/ameen_2022/K562_bias/ameen_2022.vEC', peaks='/oak/stanford/groups/akundaje/projects/neuro-variants/data/processed/ameen_2022/peaks/overlap/ameen_2022.vEC.overlap.peaks.bed.gz', schema='chrombpnet') Namespace(genes='/oak/stanford/groups/akundaje/soumyak/refs/gencode/hg38/hg38.gencode.protein_coding.tss.bed', list='/oak/stanford/groups/akundaje/projects/neuro-variants/variant_summary/asd/ameen_2022/K562_bias/ameen_2022.vEC.mean.variant_scores.tsv', out_prefix='/oak/stanford/groups/akundaje/projects/neuro-variants/variant_annotations/asd/ameen_2022/K562_bias/ameen_2022.vEC', peaks='/oak/stanford/groups/akundaje/projects/neuro-variants/data/processed/ameen_2022/peaks/overlap/ameen_2022.vEC.overlap.peaks.bed.gz', schema='chrombpnet') chr pos end allele1 allele2 variant_id 44909 chr1 843979 843980 A G chr1:843980:A:G 1968 chr1 848166 848167 A G chr1:848167:A:G 1969 chr1 894776 894777 A G chr1:894777:A:G 44237 chr1 915678 915679 G A chr1:915679:G:A 1544 chr1 932169 932170 C G chr1:932170:C:G Variants table shape: (84980, 6) annotating with closest genes 0 1 2 3 4 5 6 7 8 9 \ 0 chr1 843979 843980 A G chr1:843980:A:G chr1 923923 923924 SAMD11 1 chr1 843979 843980 A G chr1:843980:A:G chr1 959308 959309 NOC2L 2 chr1 843979 843980 A G chr1:843980:A:G chr1 960584 960585 KLHL17 3 chr1 848166 848167 A G chr1:848167:A:G chr1 923923 923924 SAMD11 4 chr1 848166 848167 A G chr1:848167:A:G chr1 959308 959309 NOC2L 10 11 12 13 14 0 0 + ENSG00000187634.13 protein_coding 79944 1 0 - ENSG00000188976.11 protein_coding 115329 2 0 + ENSG00000187961.15 protein_coding 116605 3 0 + ENSG00000187634.13 protein_coding 75757 4 0 - ENSG00000188976.11 protein_coding 111142 Closest genes table shape: (254940, 15) annotating with peak overlap chr pos end allele1 allele2 variant_id 0 chr1 3540089 3540090 A C chr1:3540090:A:C 1 chr1 3540221 3540222 G C chr1:3540222:G:C 2 chr1 3619307 3619308 C A chr1:3619308:C:A 3 chr1 7726762 7726763 T C chr1:7726763:T:C 4 chr1 10210431 10210432 C G chr1:10210432:C:G Peak overlap table shape: (1600, 6) chr pos allele1 allele2 variant_id logfc.mean \ 0 chr1 3747728 T C chr1:3747728:T:C 0.004931 1 chr1 117942118 T G chr1:117942118:T:G 0.006983 2 chr1 163337297 C A chr1:163337297:C:A -0.003908 3 chr1 32951474 G C chr1:32951474:G:C 0.016711 4 chr1 214496189 G C chr1:214496189:G:C -0.007206 logfc.mean.pval abs_logfc.mean abs_logfc.mean.pval jsd.mean ... \ 0 0.770757 0.005382 0.770747 0.004925 ... 1 0.589954 0.011053 0.590236 0.010062 ... 2 0.750655 0.006360 0.750624 0.009604 ... 3 0.485476 0.016711 0.486807 0.012884 ... 4 0.591852 0.011830 0.591683 0.011428 ... logfc_x_jsd_x_active_allele_quantile.mean.pval \ 0 0.564576 1 0.525193 2 0.832107 3 0.737567 4 0.430214 abs_logfc_x_jsd_x_active_allele_quantile.mean \ 0 0.000015 1 0.000018 2 0.000003 3 0.000006 4 0.000042 abs_logfc_x_jsd_x_active_allele_quantile.mean.pval closest_gene_1 \ 0 0.566893 CCDC27 1 0.526186 WDR3 2 0.831863 RGS5 3 0.737378 RNF19B 4 0.428209 PTPN14 gene_distance_1 closest_gene_2 gene_distance_2 closest_gene_3 \ 0 1267 SMIM1 25022 LRRC47 1 12397 GDAP2 12497 SPAG17 2 15506 NUF2 70720 RGS4 3 13335 TMEM54 50036 HPCA 4 56260 CENPF 106997 SMYD2 gene_distance_3 peak_overlap 0 48770 False 1 243110 False 2 268521 False 3 65479 False 4 215086 False [5 rows x 34 columns] Annotation table shape: (84980, 34) DONE Done Annotating