In [2]:
# --- Notebook configuration -------------------------------------------------
# Dataset label and the sub-directory (joined onto modisco_root further down)
# that selects which run is inspected.
data_name, task_dir = "K562", "fold0"

# Root path of the results; combined with task_dir when the DenovoModisco
# object is built.
modisco_root = "/srv/scratch/msharmin/mouse_hem/k562_modisco"

# Base URL for Tomtom reports (not referenced by the cells visible here).
tomtom_report_root = "http://mitra.stanford.edu/kundaje/msharmin/report/tomtom_outs/cells"

# Disabled settings, kept for reference only:
# perf_file = "/srv/scratch/msharmin/mouse_hem/with_tfd/full_mouse50/fineFactorized/task_273-naivegw/NaiveauPRC.txt"
# homer_root = "/srv/scratch/msharmin/mouse_hem/with_tfd/full_mouse50/Naive_scans"
# reportfile = "/mnt/lab_data/kundaje/msharmin/annotations/filtering samples_MS2.xlsx"
# sheetname = "filter23"
In [8]:
from matlas.matches import DenovoModisco
from matlas.genome_data import *
# from matlas.matches import prepare_pattern_matches
# Build the path "<modisco_root>/<task_dir>" and hand it to DenovoModisco.
modisco_task_path = "{}/{}".format(modisco_root, task_dir)
ob = DenovoModisco(modisco_task_path)

# Disabled call, kept for reference (DEFAULT_DATABASE would come from the
# matlas.genome_data wildcard import):
# ob.fetch_tomtom_matches(
#     save_report=True,
#     tomtom_dir="{0}/{1}_tomtomout".format(modisco_task_path, DEFAULT_DATABASE),
# )

# Load the motif matches, then group them with a 0.05 match threshold.
# NOTE(review): the threshold looks like a significance cutoff (every value in
# the rendered table below is < 0.05) -- confirm against matlas.
ob.load_matched_motifs()
ob.get_motif_per_celltype(match_threshold=0.05)
In [9]:
# Render the two summary tables seen in this cell's output: de novo patterns
# with their matched TF names, and TFs with their matched patterns and
# significance values.
ob.display_individual_table()
The following two links show list of Denovo Patterns and corresponding Motifs discovered by TF-MoDISco
Click here for Denovo Patterns by TF-MoDISco: #23
Pattern NameTF Name(s)Modisco
metacluster_1/pattern_0 # seqlets: 3789 SequenceContrib ScoresHyp_Contrib Scores
Fosl2, Fosl1, Bach2, Fos, Jun, Mafk, Nfe2l2, Nfe2, Atf3, Bach1,

Maf, Jund, Fosb, Mafg, Junb, Mafb, Maff, Batf, Mafa, Jdp2
metacluster_1/pattern_1 # seqlets: 2778 SequenceContrib ScoresHyp_Contrib Scores
Sp2, Sp3, Sp1, Klf3, Klf6, Sp4, Klf15, Klf1, Maz, Wt1,

Sp5, Zbtb17, Egr1, Zfx, Klf7, Klf4, Klf5, E2f4, Egr2, Klf8, Klf12,

Zfp281, Rela, Usf2, Nr1h4, Sall4, Ptf1a, E2f1, Srebf2, Fli1, Tfap2c, Egr3,

Mxi1, E2f7
metacluster_1/pattern_2 # seqlets: 1843 SequenceContrib ScoresHyp_Contrib Scores
Gata6, Gata4, Tal1, Gata2, Gata1, Gata3, Gata5
metacluster_1/pattern_3 # seqlets: 1409 SequenceContrib ScoresHyp_Contrib Scores
Atf2, Atf7, Creb1, Atf1, Creb5, Crem, Nfil3, Rxrb, Tef
metacluster_1/pattern_4 # seqlets: 1006 SequenceContrib ScoresHyp_Contrib Scores
metacluster_1/pattern_5 # seqlets: 956 SequenceContrib ScoresHyp_Contrib Scores
Elk1, Gabpa, Elf1, Erg, Ehf, Ets1, Elf4, Etv6, Etv4, Elk4,

Spi1, Etv2, Elf2, Elf3, Spib, Elf5, Etv3, XP_911724.4, Elk3, Etv5, Spdef,

Etv1, Fev, Irf8, Irf4, Spic, Stat4, Irf2, Prdm1
metacluster_1/pattern_6 # seqlets: 889 SequenceContrib ScoresHyp_Contrib Scores
Nfyb, Foxi1, Nfyc, Nfya, Pbx3
metacluster_1/pattern_7 # seqlets: 818 SequenceContrib ScoresHyp_Contrib Scores
Usf1, Tfeb, Tfe3, Arntl, Tfec, Mitf, Srebf1, Npas2, Clock, Arnt,

Bhlhe40, Creb3l2, Mlx, Tcfl5, Mycn, Max, Xbp1, Myc, Bhlhe41, Hes1, Mlxip
metacluster_1/pattern_8 # seqlets: 729 SequenceContrib ScoresHyp_Contrib Scores
Nrf1
metacluster_1/pattern_9 # seqlets: 435 SequenceContrib ScoresHyp_Contrib Scores
metacluster_1/pattern_10 # seqlets: 358 SequenceContrib ScoresHyp_Contrib Scores
Ctcfl, Ctcf
metacluster_1/pattern_11 # seqlets: 305 SequenceContrib ScoresHyp_Contrib Scores
Rest
metacluster_1/pattern_12 # seqlets: 257 SequenceContrib ScoresHyp_Contrib Scores
metacluster_1/pattern_13 # seqlets: 257 SequenceContrib ScoresHyp_Contrib Scores
Zfp143, Thap11, Tbx2
metacluster_1/pattern_14 # seqlets: 237 SequenceContrib ScoresHyp_Contrib Scores
metacluster_1/pattern_15 # seqlets: 201 SequenceContrib ScoresHyp_Contrib Scores
Rfx2, Rfx3, Rfx1, Rfx4, Rfx7, Rfx6
metacluster_1/pattern_16 # seqlets: 173 SequenceContrib ScoresHyp_Contrib Scores
Yy1, Taf1
metacluster_1/pattern_17 # seqlets: 121 SequenceContrib ScoresHyp_Contrib Scores
metacluster_1/pattern_18 # seqlets: 82 SequenceContrib ScoresHyp_Contrib Scores
Runx1, Runx2, Runx3, Cbfb
metacluster_1/pattern_19 # seqlets: 77 SequenceContrib ScoresHyp_Contrib Scores
Mef2d, Mef2a, Mef2c
metacluster_1/pattern_20 # seqlets: 67 SequenceContrib ScoresHyp_Contrib Scores
metacluster_1/pattern_21 # seqlets: 59 SequenceContrib ScoresHyp_Contrib Scores
metacluster_1/pattern_22 # seqlets: 55 SequenceContrib ScoresHyp_Contrib Scores
Rorc, Nfatc1, Nr1d2
Click here for Motifs by TF-MoDISco: #150
TF NamePattern(s)
Fosl2
Pattern NameModiscoSignificance
metacluster_1/pattern_00.000531124
metacluster_1/pattern_220.0244429
Fosl1
Pattern NameModiscoSignificance
metacluster_1/pattern_00.000285876
metacluster_1/pattern_220.0123203
Bach2
Pattern NameModiscoSignificance
metacluster_1/pattern_00.000285876
metacluster_1/pattern_220.0484955
Fos
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00042876199999999996
metacluster_1/pattern_220.0350237
Jun
Pattern NameModiscoSignificance
metacluster_1/pattern_00.000531124
metacluster_1/pattern_30.0206707
metacluster_1/pattern_220.00784668
Mafk
Pattern NameModiscoSignificance
metacluster_1/pattern_00.000615157
Nfe2l2
Pattern NameModiscoSignificance
metacluster_1/pattern_00.000531124
Nfe2
Pattern NameModiscoSignificance
metacluster_1/pattern_00.000531124
Atf3
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00061973
metacluster_1/pattern_30.0498925
metacluster_1/pattern_220.000144666
Bach1
Pattern NameModiscoSignificance
metacluster_1/pattern_00.0010957
Maf
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00111253
Jund
Pattern NameModiscoSignificance
metacluster_1/pattern_00.0446203
metacluster_1/pattern_220.0195532
Fosb
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00112121
metacluster_1/pattern_220.000144666
Mafg
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00112698
Junb
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00129502
metacluster_1/pattern_220.0484955
Mafb
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00616733
metacluster_1/pattern_30.0076056
Maff
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00174817
Batf
Pattern NameModiscoSignificance
metacluster_1/pattern_00.04491780000000001
metacluster_1/pattern_220.00677315
Mafa
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00480529
Jdp2
Pattern NameModiscoSignificance
metacluster_1/pattern_00.00783977
metacluster_1/pattern_30.00173861
metacluster_1/pattern_220.00199718
Sp2
Pattern NameModiscoSignificance
metacluster_1/pattern_11.6957e-10
metacluster_1/pattern_160.0187443
Sp3
Pattern NameModiscoSignificance
metacluster_1/pattern_12.55797e-10
Sp1
Pattern NameModiscoSignificance
metacluster_1/pattern_10.000210585
metacluster_1/pattern_160.00342276
Klf3
Pattern NameModiscoSignificance
metacluster_1/pattern_13.22813e-08
Klf6
Pattern NameModiscoSignificance
metacluster_1/pattern_13.3932e-08
Sp4
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0010217
Klf15
Pattern NameModiscoSignificance
metacluster_1/pattern_15.2079099999999996e-06
Klf1
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0374967
metacluster_1/pattern_210.0323434
Maz
Pattern NameModiscoSignificance
metacluster_1/pattern_12.7735300000000002e-05
Wt1
Pattern NameModiscoSignificance
metacluster_1/pattern_17.87153e-05
Sp5
Pattern NameModiscoSignificance
metacluster_1/pattern_10.000144836
Zbtb17
Pattern NameModiscoSignificance
metacluster_1/pattern_10.000210585
Egr1
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00306536
Zfx
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00709033
metacluster_1/pattern_160.0187443
Klf7
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0007575460000000001
Klf4
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00130578
metacluster_1/pattern_210.044139
Klf5
Pattern NameModiscoSignificance
metacluster_1/pattern_10.000776117
E2f4
Pattern NameModiscoSignificance
metacluster_1/pattern_10.000968164
Egr2
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00130578
Klf8
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00141702
Klf12
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00159289
Zfp281
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00957792
Rela
Pattern NameModiscoSignificance
metacluster_1/pattern_10.00901111
Usf2
Pattern NameModiscoSignificance
metacluster_1/pattern_10.010885700000000002
metacluster_1/pattern_70.000549045
Nr1h4
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0190022
Sall4
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0190022
Ptf1a
Pattern NameModiscoSignificance
metacluster_1/pattern_10.025825099999999997
E2f1
Pattern NameModiscoSignificance
metacluster_1/pattern_10.025825099999999997
Srebf2
Pattern NameModiscoSignificance
metacluster_1/pattern_10.029158299999999998
metacluster_1/pattern_70.0173899
Fli1
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0299007
metacluster_1/pattern_50.000299707
Tfap2c
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0303509
Egr3
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0326033
Mxi1
Pattern NameModiscoSignificance
metacluster_1/pattern_10.0326033
E2f7
Pattern NameModiscoSignificance
metacluster_1/pattern_10.043560800000000004
Gata6
Pattern NameModiscoSignificance
metacluster_1/pattern_20.000809963
Gata4
Pattern NameModiscoSignificance
metacluster_1/pattern_20.00453647
Tal1
Pattern NameModiscoSignificance
metacluster_1/pattern_24.61583e-06
Gata2
Pattern NameModiscoSignificance
metacluster_1/pattern_27.958739999999998e-06
Gata1
Pattern NameModiscoSignificance
metacluster_1/pattern_21.03485e-05
metacluster_1/pattern_210.0323434
Gata3
Pattern NameModiscoSignificance
metacluster_1/pattern_20.0291138
Gata5
Pattern NameModiscoSignificance
metacluster_1/pattern_20.0055788
Atf2
Pattern NameModiscoSignificance
metacluster_1/pattern_30.00017758099999999998
Atf7
Pattern NameModiscoSignificance
metacluster_1/pattern_30.00010086700000000001
Creb1
Pattern NameModiscoSignificance
metacluster_1/pattern_30.00169528
Atf1
Pattern NameModiscoSignificance
metacluster_1/pattern_30.024642599999999997
Creb5
Pattern NameModiscoSignificance
metacluster_1/pattern_34.99929e-05
Crem
Pattern NameModiscoSignificance
metacluster_1/pattern_30.00173861
Nfil3
Pattern NameModiscoSignificance
metacluster_1/pattern_30.0129629
Rxrb
Pattern NameModiscoSignificance
metacluster_1/pattern_30.0138474
Tef
Pattern NameModiscoSignificance
metacluster_1/pattern_30.0337915
Elk1
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00020789400000000003
Gabpa
Pattern NameModiscoSignificance
metacluster_1/pattern_50.000508191
Elf1
Pattern NameModiscoSignificance
metacluster_1/pattern_52.72749e-05
Erg
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00029623700000000003
Ehf
Pattern NameModiscoSignificance
metacluster_1/pattern_50.000263741
Ets1
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00020789400000000003
Elf4
Pattern NameModiscoSignificance
metacluster_1/pattern_55.7799799999999995e-05
Etv6
Pattern NameModiscoSignificance
metacluster_1/pattern_50.0025886999999999998
Etv4
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00172722
Elk4
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00038214300000000004
Spi1
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00405171
Etv2
Pattern NameModiscoSignificance
metacluster_1/pattern_50.000149312
Elf2
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00033676699999999997
Elf3
Pattern NameModiscoSignificance
metacluster_1/pattern_50.000749314
Spib
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00020789400000000003
Elf5
Pattern NameModiscoSignificance
metacluster_1/pattern_50.000439651
Etv3
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00020789400000000003
XP_911724.4
Pattern NameModiscoSignificance
metacluster_1/pattern_50.000211975
Elk3
Pattern NameModiscoSignificance
metacluster_1/pattern_50.000749314
Etv5
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00038214300000000004
Spdef
Pattern NameModiscoSignificance
metacluster_1/pattern_50.0157678
Etv1
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00252243
Fev
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00152209
Irf8
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00240447
Irf4
Pattern NameModiscoSignificance
metacluster_1/pattern_50.00243487
metacluster_1/pattern_220.0123203
Spic
Pattern NameModiscoSignificance
metacluster_1/pattern_50.0038306999999999994
Stat4
Pattern NameModiscoSignificance
metacluster_1/pattern_50.017204499999999998
Irf2
Pattern NameModiscoSignificance
metacluster_1/pattern_50.03740809999999999
metacluster_1/pattern_120.0433443
Prdm1
Pattern NameModiscoSignificance
metacluster_1/pattern_50.043144
Nfyb
Pattern NameModiscoSignificance
metacluster_1/pattern_61.15376e-07
Foxi1
Pattern NameModiscoSignificance
metacluster_1/pattern_65.9560400000000005e-06
Nfyc
Pattern NameModiscoSignificance
metacluster_1/pattern_66.03507e-05
Nfya
Pattern NameModiscoSignificance
metacluster_1/pattern_66.03507e-05
Pbx3
Pattern NameModiscoSignificance
metacluster_1/pattern_60.0005506280000000001
Usf1
Pattern NameModiscoSignificance
metacluster_1/pattern_70.00426855
Tfeb
Pattern NameModiscoSignificance
metacluster_1/pattern_70.00128519
Tfe3
Pattern NameModiscoSignificance
metacluster_1/pattern_70.00128519
Arntl
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0128965
Tfec
Pattern NameModiscoSignificance
metacluster_1/pattern_70.000654635
Mitf
Pattern NameModiscoSignificance
metacluster_1/pattern_70.000549045
Srebf1
Pattern NameModiscoSignificance
metacluster_1/pattern_70.00859238
Npas2
Pattern NameModiscoSignificance
metacluster_1/pattern_70.029829599999999998
Clock
Pattern NameModiscoSignificance
metacluster_1/pattern_70.015138999999999998
Arnt
Pattern NameModiscoSignificance
metacluster_1/pattern_70.035667199999999996
Bhlhe40
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0408658
Creb3l2
Pattern NameModiscoSignificance
metacluster_1/pattern_70.014718799999999999
Mlx
Pattern NameModiscoSignificance
metacluster_1/pattern_70.00943528
Tcfl5
Pattern NameModiscoSignificance
metacluster_1/pattern_70.00777018
Mycn
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0092256
Max
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0128965
Xbp1
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0144828
Myc
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0292875
Bhlhe41
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0392036
Hes1
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0441652
Mlxip
Pattern NameModiscoSignificance
metacluster_1/pattern_70.0441652
Nrf1
Pattern NameModiscoSignificance
metacluster_1/pattern_83.41395e-08
Ctcfl
Pattern NameModiscoSignificance
metacluster_1/pattern_101.17681e-11
Ctcf
Pattern NameModiscoSignificance
metacluster_1/pattern_103.07262e-10
Rest
Pattern NameModiscoSignificance
metacluster_1/pattern_117.09218e-16
Zfp143
Pattern NameModiscoSignificance
metacluster_1/pattern_134.7156600000000005e-21
Thap11
Pattern NameModiscoSignificance
metacluster_1/pattern_132.4247199999999998e-17
Tbx2
Pattern NameModiscoSignificance
metacluster_1/pattern_137.061060000000001e-12
Rfx2
Pattern NameModiscoSignificance
metacluster_1/pattern_153.2542e-07
Rfx3
Pattern NameModiscoSignificance
metacluster_1/pattern_150.033992900000000006
Rfx1
Pattern NameModiscoSignificance
metacluster_1/pattern_152.49613e-09
Rfx4
Pattern NameModiscoSignificance
metacluster_1/pattern_150.00011358700000000001
Rfx7
Pattern NameModiscoSignificance
metacluster_1/pattern_150.0136131
Rfx6
Pattern NameModiscoSignificance
metacluster_1/pattern_150.00915489
Yy1
Pattern NameModiscoSignificance
metacluster_1/pattern_162.2396200000000003e-06
Taf1
Pattern NameModiscoSignificance
metacluster_1/pattern_160.00013015
Runx1
Pattern NameModiscoSignificance
metacluster_1/pattern_182.64511e-05
Runx2
Pattern NameModiscoSignificance
metacluster_1/pattern_181.96662e-06
Runx3
Pattern NameModiscoSignificance
metacluster_1/pattern_180.00010082899999999999
Cbfb
Pattern NameModiscoSignificance
metacluster_1/pattern_180.000113768
Mef2d
Pattern NameModiscoSignificance
metacluster_1/pattern_191.3062000000000001e-07
Mef2a
Pattern NameModiscoSignificance
metacluster_1/pattern_190.00010555200000000001
Mef2c
Pattern NameModiscoSignificance
metacluster_1/pattern_195.4594799999999994e-05
Rorc
Pattern NameModiscoSignificance
metacluster_1/pattern_220.00784668
Nfatc1
Pattern NameModiscoSignificance
metacluster_1/pattern_220.00872025
Nr1d2
Pattern NameModiscoSignificance
metacluster_1/pattern_220.0488916