# DREME 4.12.0 # command: dreme -v 1 -oc /srv/scratch/shared/surya/imk1/TFBindingPredictionProject/EncodeK562eGFPComparisons/TFDP1-Antibody.IDR0.05.filt.narrowPeak.summitPlusMinus250bp.MemeChipResultsDefaultMax/dreme_out -png -dna -p /srv/scratch/shared/surya/imk1/TFBindingPredictionProject/EncodeK562eGFPComparisons/TFDP1-Antibody.IDR0.05.filt.narrowPeak.summitPlusMinus250bp.MemeChipResultsDefaultMax/seqs-centered -n /srv/scratch/shared/surya/imk1/TFBindingPredictionProject/EncodeK562eGFPComparisons/TFDP1-Antibody.IDR0.05.filt.narrowPeak.summitPlusMinus250bp.MemeChipResultsDefaultMax/seqs-shuffled # positives: 5617 from /srv/scratch/shared/surya/imk1/TFBindingPredictionProject/EncodeK562eGFPComparisons/TFDP1-Antibody.IDR0.05.filt.narrowPeak.summitPlusMinus250bp.MemeChipResultsDefaultMax/seqs-centered (Wed Nov 22 12:43:44 PST 2017) # negatives: 5617 from /srv/scratch/shared/surya/imk1/TFBindingPredictionProject/EncodeK562eGFPComparisons/TFDP1-Antibody.IDR0.05.filt.narrowPeak.summitPlusMinus250bp.MemeChipResultsDefaultMax/seqs-shuffled (Wed Nov 22 12:43:45 PST 2017) # host: indra # when: Wed Nov 22 12:59:37 PST 2017 MEME version 4.12.0 ALPHABET "DNA" DNA-LIKE A "Adenine" CC0000 ~ T "Thymine" 008000 C "Cytosine" 0000CC ~ G "Guanine" FFB300 N "Any base" = ACGT X = ACGT . = ACGT V "Not T" = ACG H "Not G" = ACT D "Not C" = AGT B "Not A" = CGT M "Amino" = AC R "Purine" = AG W "Weak" = AT S "Strong" = CG Y "Pyrimidine" = CT K "Keto" = GT U = T END ALPHABET strands: + - Background letter frequencies (from dataset): A 0.188 C 0.312 G 0.312 T 0.188 MOTIF AGRKGGCG DREME-1 # Word RC Word Pos Neg P-value E-value # BEST AGRKGGCG CGCCMYCT 796 146 3.9e-118 1.7e-113 # AGAGGGCG CGCCCTCT 249 44 4.9e-037 2.2e-032 # AGGGGGCG CGCCCCCT 288 66 1.8e-035 7.9e-031 # AGGTGGCG CGCCACCT 164 27 8.4e-026 3.7e-021 # AGATGGCG CGCCATCT 116 11 8.8e-024 3.9e-019 letter-probability matrix: alength= 4 w= 8 nsites= 824 E= 1.7e-113 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.444175 0.000000 0.555825 0.000000 0.000000 0.000000 0.655340 0.344660 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 MOTIF RGRAA DREME-2 # Word RC Word Pos Neg P-value E-value # BEST RGRAA TTYCY 3689 2744 3.8e-073 1.7e-068 # GGGAA TTCCC 2044 1324 3.5e-050 1.6e-045 # GGAAA TTTCC 1527 951 1.1e-039 4.8e-035 # AGGAA TTCCT 1540 1062 5.6e-027 2.5e-022 # AGAAA TTTCT 934 732 4.6e-008 2.0e-003 letter-probability matrix: alength= 4 w= 5 nsites= 6011 E= 1.7e-068 0.433871 0.000000 0.566129 0.000000 0.000000 0.000000 1.000000 0.000000 0.376643 0.000000 0.623357 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF CCACHAGR DREME-3 # Word RC Word Pos Neg P-value E-value # BEST CCACHAGR YCTDGTGG 517 140 6.8e-055 2.9e-050 # CCACCAGG CCTGGTGG 188 51 2.7e-020 1.1e-015 # CCACCAGA TCTGGTGG 111 22 6.0e-016 2.5e-011 # CCACTAGA TCTAGTGG 71 12 1.0e-011 4.3e-007 # CCACTAGG CCTAGTGG 68 13 1.7e-010 7.0e-006 # CCACAAGA TCTTGTGG 37 14 8.6e-004 3.7e+001 # CCACAAGG CCTTGTGG 58 31 2.7e-003 1.1e+002 letter-probability matrix: alength= 4 w= 8 nsites= 535 E= 2.9e-050 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.177570 0.560748 0.000000 0.261682 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.411215 0.000000 0.588785 0.000000 MOTIF TTATYW DREME-4 # Word RC Word Pos Neg P-value E-value # BEST TTATYW WRATAA 402 155 8.2e-028 3.4e-023 # TTATCA TGATAA 136 43 6.5e-013 2.7e-008 # TTATCT AGATAA 175 69 2.5e-012 1.1e-007 # TTATTT AAATAA 65 25 1.4e-005 5.8e-001 # TTATTA TAATAA 48 21 7.5e-004 3.2e+001 letter-probability matrix: alength= 4 w= 6 nsites= 438 E= 3.4e-023 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.746575 0.000000 0.253425 0.417808 0.000000 0.000000 0.582192 MOTIF RGGCGGGR DREME-5 # Word RC Word Pos Neg P-value E-value # BEST RGGCGGGR YCCCGCCY 513 244 1.1e-024 4.7e-020 # GGGCGGGA TCCCGCCC 136 38 1.3e-014 5.2e-010 # GGGCGGGG CCCCGCCC 243 121 3.9e-011 1.6e-006 # AGGCGGGG CCCCGCCT 98 60 1.5e-003 6.1e+001 # AGGCGGGA TCCCGCCT 60 31 1.5e-003 6.3e+001 letter-probability matrix: alength= 4 w= 8 nsites= 551 E= 4.7e-020 0.288566 0.000000 0.711434 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.361162 0.000000 0.638838 0.000000 MOTIF AGRKGGCA DREME-6 # Word RC Word Pos Neg P-value E-value # BEST AGRKGGCA TGCCMYCT 380 165 8.8e-022 3.7e-017 # AGGGGGCA TGCCCCCT 144 51 6.2e-012 2.6e-007 # AGGTGGCA TGCCACCT 96 39 4.3e-007 1.8e-002 # AGAGGGCA TGCCCTCT 108 54 1.2e-005 4.9e-001 # AGATGGCA TGCCATCT 44 22 4.5e-003 1.9e+002 letter-probability matrix: alength= 4 w= 8 nsites= 394 E= 3.7e-017 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.388325 0.000000 0.611675 0.000000 0.000000 0.000000 0.642132 0.357868 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF RGGTTCGA DREME-7 # Word RC Word Pos Neg P-value E-value # BEST RGGTTCGA TCGAACCY 113 14 6.7e-021 2.8e-016 # GGGTTCGA TCGAACCC 92 12 7.3e-017 3.1e-012 # AGGTTCGA TCGAACCT 21 2 3.3e-005 1.4e+000 letter-probability matrix: alength= 4 w= 8 nsites= 113 E= 2.8e-016 0.185841 0.000000 0.814159 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF ACTTCCG DREME-8 # Word RC Word Pos Neg P-value E-value # BEST ACTTCCG CGGAAGT 145 34 4.6e-018 1.9e-013 # ACTTCCG CGGAAGT 145 34 4.6e-018 1.9e-013 letter-probability matrix: alength= 4 w= 7 nsites= 155 E= 1.9e-013 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 MOTIF CTCCCKC DREME-9 # Word RC Word Pos Neg P-value E-value # BEST CTCCCKC GMGGGAG 624 404 3.2e-013 1.3e-008 # CTCCCGC GCGGGAG 325 177 7.0e-012 2.9e-007 # CTCCCTC GAGGGAG 321 238 1.8e-004 7.6e+000 letter-probability matrix: alength= 4 w= 7 nsites= 665 E= 1.3e-008 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.496241 0.503759 0.000000 1.000000 0.000000 0.000000 MOTIF ATTGGCYG DREME-10 # Word RC Word Pos Neg P-value E-value # BEST ATTGGCYG CRGCCAAT 92 19 4.4e-013 1.8e-008 # ATTGGCTG CAGCCAAT 64 10 3.9e-011 1.6e-006 # ATTGGCCG CGGCCAAT 28 9 1.3e-003 5.3e+001 letter-probability matrix: alength= 4 w= 8 nsites= 96 E= 1.8e-008 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.291667 0.000000 0.708333 0.000000 0.000000 1.000000 0.000000 MOTIF BCACGTG DREME-11 # Word RC Word Pos Neg P-value E-value # BEST BCACGTG CACGTGV 204 85 5.0e-013 2.1e-008 # TCACGTG CACGTGA 91 29 5.1e-009 2.1e-004 # CCACGTG CACGTGG 120 50 3.2e-008 1.3e-003 # GCACGTG CACGTGC 77 44 1.6e-003 6.8e+001 letter-probability matrix: alength= 4 w= 7 nsites= 213 E= 2.1e-008 0.000000 0.446009 0.253521 0.300469 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 MOTIF RRTTTGAA DREME-12 # Word RC Word Pos Neg P-value E-value # BEST RRTTTGAA TTCAAAYY 106 28 2.7e-012 1.1e-007 # GATTTGAA TTCAAATC 38 8 4.4e-006 1.8e-001 # AGTTTGAA TTCAAACT 24 4 8.8e-005 3.7e+000 # GGTTTGAA TTCAAACC 29 12 5.7e-003 2.4e+002 # AATTTGAA TTCAAATT 15 4 9.6e-003 4.0e+002 letter-probability matrix: alength= 4 w= 8 nsites= 106 E= 1.1e-007 0.367925 0.000000 0.632075 0.000000 0.500000 0.000000 0.500000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF TGACGTCA DREME-13 # Word RC Word Pos Neg P-value E-value # BEST TGACGTCA TGACGTCA 49 3 4.8e-012 2.0e-007 # TGACGTCA TGACGTCA 49 3 4.8e-012 2.0e-007 letter-probability matrix: alength= 4 w= 8 nsites= 50 E= 2.0e-007 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF CGCAKGCG DREME-14 # Word RC Word Pos Neg P-value E-value # BEST CGCAKGCG CGCMTGCG 131 43 5.4e-012 2.3e-007 # CGCATGCG CGCATGCG 37 2 1.3e-009 5.6e-005 # CGCAGGCG CGCCTGCG 97 41 9.1e-007 3.8e-002 letter-probability matrix: alength= 4 w= 8 nsites= 137 E= 2.3e-007 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.722628 0.277372 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 MOTIF HGGCCACA DREME-15 # Word RC Word Pos Neg P-value E-value # BEST HGGCCACA TGTGGCCD 164 64 8.4e-012 3.5e-007 # TGGCCACA TGTGGCCA 68 28 2.5e-005 1.1e+000 # CGGCCACA TGTGGCCG 47 16 5.6e-005 2.3e+000 # AGGCCACA TGTGGCCT 51 20 1.5e-004 6.0e+000 letter-probability matrix: alength= 4 w= 8 nsites= 166 E= 3.5e-007 0.307229 0.283133 0.000000 0.409639 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF CWGCAGC DREME-16 # Word RC Word Pos Neg P-value E-value # BEST CWGCAGC GCTGCWG 620 420 4.1e-011 1.7e-006 # CAGCAGC GCTGCTG 354 231 1.0e-007 4.2e-003 # CTGCAGC GCTGCAG 288 213 3.5e-004 1.5e+001 letter-probability matrix: alength= 4 w= 7 nsites= 654 E= 1.7e-006 0.000000 1.000000 0.000000 0.000000 0.553517 0.000000 0.000000 0.446483 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 MOTIF STGAGTCA DREME-17 # Word RC Word Pos Neg P-value E-value # BEST STGAGTCA TGACTCAS 87 23 2.5e-010 1.0e-005 # CTGAGTCA TGACTCAG 56 14 2.0e-007 8.3e-003 # GTGAGTCA TGACTCAC 31 10 7.1e-004 3.0e+001 letter-probability matrix: alength= 4 w= 8 nsites= 87 E= 1.0e-005 0.000000 0.643678 0.356322 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF GCTCYACC DREME-18 # Word RC Word Pos Neg P-value E-value # BEST GCTCYACC GGTRGAGC 124 47 1.3e-009 5.4e-005 # GCTCTACC GGTAGAGC 59 15 1.2e-007 4.9e-003 # GCTCCACC GGTGGAGC 65 32 5.0e-004 2.1e+001 letter-probability matrix: alength= 4 w= 8 nsites= 124 E= 5.4e-005 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.524194 0.000000 0.475806 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 MOTIF GCDGGGA DREME-19 # Word RC Word Pos Neg P-value E-value # BEST GCDGGGA TCCCHGC 519 356 5.4e-009 2.2e-004 # GCAGGGA TCCCTGC 201 136 1.9e-004 8.0e+000 # GCTGGGA TCCCAGC 201 137 2.4e-004 1.0e+001 # GCGGGGA TCCCCGC 131 88 2.0e-003 8.4e+001 letter-probability matrix: alength= 4 w= 7 nsites= 546 E= 2.2e-004 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.379121 0.000000 0.245421 0.375458 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF TGGWTAA DREME-20 # Word RC Word Pos Neg P-value E-value # BEST TGGWTAA TTAWCCA 91 32 4.2e-008 1.7e-003 # TGGTTAA TTAACCA 48 17 7.3e-005 3.0e+000 # TGGATAA TTATCCA 43 15 1.5e-004 6.1e+000 letter-probability matrix: alength= 4 w= 7 nsites= 91 E= 1.7e-003 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.472527 0.000000 0.000000 0.527473 0.000000 0.000000 0.000000 1.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF CCGCCDCC DREME-21 # Word RC Word Pos Neg P-value E-value # BEST CCGCCDCC GGHGGCGG 308 191 4.8e-008 2.0e-003 # CCGCCGCC GGCGGCGG 177 110 3.7e-005 1.5e+000 # CCGCCTCC GGAGGCGG 92 55 1.3e-003 5.5e+001 # CCGCCACC GGTGGCGG 60 36 9.0e-003 3.7e+002 letter-probability matrix: alength= 4 w= 8 nsites= 336 E= 2.0e-003 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.175595 0.000000 0.538690 0.285714 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 MOTIF GGACAS DREME-22 # Word RC Word Pos Neg P-value E-value # BEST GGACAS STGTCC 797 612 7.7e-008 3.2e-003 # GGACAC GTGTCC 337 230 2.3e-006 9.6e-002 # GGACAG CTGTCC 484 395 9.9e-004 4.1e+001 letter-probability matrix: alength= 4 w= 6 nsites= 855 E= 3.2e-003 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.404678 0.595322 0.000000 MOTIF CCACGCCC DREME-23 # Word RC Word Pos Neg P-value E-value # BEST CCACGCCC GGGCGTGG 79 28 3.7e-007 1.5e-002 # CCACGCCC GGGCGTGG 79 28 3.7e-007 1.5e-002 letter-probability matrix: alength= 4 w= 8 nsites= 81 E= 1.5e-002 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 MOTIF AAAATGKC DREME-24 # Word RC Word Pos Neg P-value E-value # BEST AAAATGKC GMCATTTT 36 5 3.8e-007 1.5e-002 # AAAATGGC GCCATTTT 26 4 2.9e-005 1.2e+000 # AAAATGTC GACATTTT 10 1 5.8e-003 2.4e+002 letter-probability matrix: alength= 4 w= 8 nsites= 37 E= 1.5e-002 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.729730 0.270270 0.000000 1.000000 0.000000 0.000000 MOTIF AAYTACA DREME-25 # Word RC Word Pos Neg P-value E-value # BEST AAYTACA TGTARTT 67 21 4.2e-007 1.7e-002 # AACTACA TGTAGTT 44 14 4.8e-005 2.0e+000 # AATTACA TGTAATT 23 8 5.3e-003 2.2e+002 letter-probability matrix: alength= 4 w= 7 nsites= 67 E= 1.7e-002 1.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.656716 0.000000 0.343284 0.000000 0.000000 0.000000 1.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 MOTIF CTGAGCTA DREME-26 # Word RC Word Pos Neg P-value E-value # BEST CTGAGCTA TAGCTCAG 58 17 1.0e-006 4.2e-002 # CTGAGCTA TAGCTCAG 58 17 1.0e-006 4.2e-002 letter-probability matrix: alength= 4 w= 8 nsites= 58 E= 4.2e-002 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 1.000000 0.000000 0.000000 0.000000 # Stopping reason: E-value threshold exceeded # Running time: 756.87 seconds