; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 6 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_6nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Slow counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 6
; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_6nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model Markov
; Background estimation method Markov model estimated from input sequences
; Markov chain order 2
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 2.44140625e-06
; Sequence type DNA
; Nb of sequences 500
; Sum of sequence lengths 189796
; discarded residues 535 (other letters than ACGT)
; discarded occurrences 535 (contain discarded residues)
; nb possible positions 186761
; total oligo occurrences 186761
; total overlapping occurrences 1034
; total non overlapping occ 185727
; alphabet size 4
; nb possible oligomers 4096
; oligomers tested for significance 4096
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 obs_freq observed relative frequency
; 4 exp_freq expected relative frequency
; 5 occ observed occurrences
; 6 exp_occ expected occurrences
; 7 occ_P occurrence probability (binomial)
; 8 occ_E E-value for occurrences (binomial)
; 9 occ_sig occurrence significance (binomial)
; 10 rank rank
; 11 ovl_occ number of overlapping occurrences (discarded from the count)
; 12 forbocc forbidden positions (to avoid self-overlap)
; 13 zscore z-score (Gaussian approximation)
; 14 exp_var estimation of the variance on occurrences
; 15 ratio observed/expected ratio
; 16 ms number of matching sequences
; 17 exp_ms expected number of matching sequences
; 18 ms_P matching sequence probability (binomial)
; 19 ms_E E-value for matching sequences (binomial)
; 20 ms_sig matching sequenc significance (binomial)
; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence)
; 22 exp_msf expected proportion matching sequences
; 23 ms_rati observed/expected numbers of matching sequences
#seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati
tgatga tgatga 0.0005515070063 0.0002701109552 103 50.45 5.9e-11 2.4e-07 6.62 1 7 510 7.40 50.446 2.0418 83 47.99 7.1e-07 0.0029 2.5 0.16600 0.09598 1.72949
tctttt tctttt 0.0012957737429 0.0008617198419 242 160.94 1.6e-09 6.5e-06 5.19 2 3 1203 6.39 160.936 1.5037 174 137.65 0.00022 0.91 0.0 0.34800 0.27531 1.26403
atgatg atgatg 0.0004926081998 0.0002477585921 92 46.27 2e-09 8.4e-06 5.08 3 5 450 6.72 46.272 1.9883 78 44.20 7.6e-07 0.0031 2.5 0.15600 0.08840 1.76469
ggtggt ggtggt 0.0003694561498 0.0001668323904 69 31.16 3.5e-09 1.4e-05 4.85 4 4 337 6.78 31.158 2.2145 58 30.21 2e-06 0.0081 2.1 0.11600 0.06042 1.91994
ttcttc ttcttc 0.0008567099127 0.0005261929040 160 98.27 6.8e-09 2.8e-05 4.55 5 11 792 6.23 98.272 1.6281 133 89.24 7.9e-07 0.0032 2.5 0.26600 0.17848 1.49038
aacagc aacagc 0.0004926081998 0.0002633125370 92 49.18 3.2e-08 1.3e-04 3.88 6 0 455 6.11 49.177 1.8708 74 46.84 6.5e-05 0.26 0.6 0.14800 0.09368 1.57980
cgatga cgatga 0.0003212662173 0.0001475721071 60 27.56 6.1e-08 2.5e-04 3.60 7 0 293 6.18 27.561 2.1770 55 26.82 5.3e-07 0.0022 2.7 0.11000 0.05363 2.05095
gaggaa gaggaa 0.0005300892585 0.0003071534815 99 57.36 3.8e-07 1.6e-03 2.80 8 0 488 5.50 57.364 1.7258 86 54.20 1.3e-05 0.052 1.3 0.17200 0.10841 1.58660
tatata tatata 0.0008245832909 0.0005517069312 154 103.04 1.7e-06 6.9e-03 2.16 9 37 761 5.02 103.037 1.4946 127 93.14 0.00011 0.46 0.3 0.25400 0.18627 1.36358
aagaaa aagaaa 0.0017455464471 0.0013354485904 326 249.41 2e-06 8.1e-03 2.09 10 9 1606 4.85 249.410 1.3071 218 196.48 0.02761 1.1e+02 -2.1 0.43600 0.39296 1.10954
aagagg aagagg 0.0005675703171 0.0003556591240 106 66.42 4.7e-06 1.9e-02 1.72 11 0 520 4.86 66.423 1.5958 94 62.21 3.1e-05 0.13 0.9 0.18800 0.12442 1.51100
agtaat agtaat 0.0004872537628 0.0002935297331 91 54.82 4.9e-06 2.0e-02 1.70 12 0 453 4.89 54.820 1.6600 81 51.93 4.3e-05 0.17 0.8 0.16200 0.10386 1.55983
ccattg ccattg 0.0004283549563 0.0002489761191 80 46.50 5.1e-06 2.1e-02 1.68 13 0 400 4.91 46.499 1.7205 70 44.41 0.00011 0.46 0.3 0.14000 0.08882 1.57631
atagca atagca 0.0004551271411 0.0002705082381 85 50.52 6e-06 2.5e-02 1.61 14 0 425 4.85 50.520 1.6825 78 48.06 1.6e-05 0.065 1.2 0.15600 0.09612 1.62304
tcttct tcttct 0.0006853679301 0.0004521104632 128 84.44 6.1e-06 2.5e-02 1.60 15 12 632 4.74 84.437 1.5159 107 77.71 0.00032 1.3 -0.1 0.21400 0.15542 1.37695
cctcca cctcca 0.0003480384020 0.0001907917490 65 35.63 6.4e-06 2.6e-02 1.58 16 0 321 4.92 35.632 1.8242 60 34.40 2.3e-05 0.096 1.0 0.12000 0.06879 1.74441
gctgct gctgct 0.0003212662173 0.0001717554616 60 32.08 6.9e-06 2.8e-02 1.55 17 3 300 4.93 32.077 1.8705 52 31.07 0.00023 0.95 0.0 0.10400 0.06215 1.67350
caacaa caacaa 0.0007763933584 0.0005323933804 145 99.43 1.1e-05 4.4e-02 1.35 18 8 712 4.57 99.430 1.4583 109 90.19 0.01831 75 -1.9 0.21800 0.18038 1.20856
tttctt tttctt 0.0011726216930 0.0008668206853 219 161.89 1.1e-05 4.7e-02 1.33 19 5 1084 4.49 161.888 1.3528 163 138.34 0.00860 35 -1.5 0.32600 0.27669 1.17822
gtggtg gtggtg 0.0002944940325 0.0001564914219 55 29.23 1.4e-05 5.6e-02 1.25 20 4 269 4.77 29.226 1.8819 51 28.39 4.8e-05 0.2 0.7 0.10200 0.05678 1.79635
ctgctg ctgctg 0.0003052029064 0.0001642528362 57 30.68 1.4e-05 5.6e-02 1.25 21 3 281 4.75 30.676 1.8581 53 29.76 4.3e-05 0.17 0.8 0.10600 0.05951 1.78113
gatgat gatgat 0.0004176460824 0.0002489560401 78 46.50 1.5e-05 6.3e-02 1.20 22 4 379 4.62 46.495 1.6776 67 44.40 0.00052 2.1 -0.3 0.13400 0.08881 1.50887
taagga taagga 0.0005140259476 0.0003250316287 96 60.70 1.8e-05 7.2e-02 1.14 23 0 477 4.53 60.703 1.5815 85 57.17 0.00014 0.57 0.2 0.17000 0.11434 1.48675
tgctgc tgctgc 0.0003159117803 0.0001750017899 59 32.68 2.2e-05 9.0e-02 1.05 24 2 295 4.60 32.684 1.8052 50 31.64 0.00107 4.4 -0.6 0.10000 0.06328 1.58023
tactac tactac 0.0003748105868 0.0002208480872 70 41.25 2.8e-05 1.2e-01 0.94 25 1 341 4.48 41.246 1.6971 65 39.59 6.4e-05 0.26 0.6 0.13000 0.07919 1.64164
cgctag cgctag 0.0001927597304 0.0000897110556 36 16.75 3e-05 1.2e-01 0.91 26 0 175 4.70 16.755 2.1487 32 16.48 0.00035 1.4 -0.2 0.06400 0.03296 1.94202
cttctt cttctt 0.0007067856780 0.0004878265292 132 91.11 3.4e-05 1.4e-01 0.86 27 7 660 4.28 91.107 1.4488 107 83.31 0.00342 14 -1.1 0.21400 0.16661 1.28441
attgac attgac 0.0004337093933 0.0002682945492 81 50.11 3.7e-05 1.5e-01 0.82 28 0 400 4.36 50.107 1.6165 72 47.68 0.00031 1.3 -0.1 0.14400 0.09537 1.50994
cattga cattga 0.0005086715106 0.0003278487935 95 61.23 3.8e-05 1.6e-01 0.80 29 0 475 4.32 61.229 1.5515 85 57.64 0.00018 0.74 0.1 0.17000 0.11528 1.47473
cccttc cccttc 0.0002837851586 0.0001551713189 53 28.98 4e-05 1.6e-01 0.79 30 0 261 4.46 28.980 1.8289 46 28.16 0.00088 3.6 -0.6 0.09200 0.05632 1.63363
gatgaa gatgaa 0.0005675703171 0.0003768434894 106 70.38 4.5e-05 1.9e-01 0.73 31 0 524 4.25 70.380 1.5061 82 65.66 0.02029 83 -1.9 0.16400 0.13132 1.24881
gatgac gatgac 0.0002944940325 0.0001646556990 55 30.75 5.1e-05 2.1e-01 0.68 32 0 270 4.37 30.751 1.7885 52 29.83 8.6e-05 0.35 0.5 0.10400 0.05965 1.74338
agaaga agaaga 0.0010441152061 0.0007788837352 195 145.47 5.2e-05 2.1e-01 0.67 33 9 968 4.11 145.465 1.3405 148 126.26 0.01549 63 -1.8 0.29600 0.25252 1.17220
gcgatg gcgatg 0.0001874052934 0.0000896745934 35 16.75 6.5e-05 2.7e-01 0.57 34 1 172 4.46 16.748 2.0898 33 16.47 0.00016 0.67 0.2 0.06600 0.03294 2.00351
ttcttt ttcttt 0.0011404950712 0.0008668206853 213 161.89 7e-05 2.9e-01 0.54 35 5 1049 4.02 161.888 1.3157 164 138.34 0.00659 27 -1.4 0.32800 0.27669 1.18544
tgttga tgttga 0.0004711904520 0.0003040362374 88 56.78 7.4e-05 3.0e-01 0.52 36 0 440 4.14 56.782 1.5498 78 53.68 0.00054 2.2 -0.3 0.15600 0.10737 1.45294
caagaa caagaa 0.0010548240800 0.0007946874286 197 148.42 8.1e-05 3.3e-01 0.48 37 0 979 3.99 148.417 1.3273 154 128.46 0.00584 24 -1.4 0.30800 0.25692 1.19882
tatcga tatcga 0.0003641017129 0.0002212341474 68 41.32 8.8e-05 3.6e-01 0.45 38 0 340 4.15 41.318 1.6458 63 39.66 0.00021 0.85 0.1 0.12600 0.07932 1.58846
aaggaa aaggaa 0.0008727732235 0.0006430398440 163 120.09 0.00011 4.7e-01 0.33 39 2 805 3.92 120.095 1.3573 130 106.79 0.00755 31 -1.5 0.26000 0.21358 1.21733
acagca acagca 0.0004069372085 0.0002569076954 76 47.98 0.00011 4.7e-01 0.33 40 0 375 4.05 47.980 1.5840 64 45.76 0.00422 17 -1.2 0.12800 0.09151 1.39873
agcagc agcagc 0.0002837851586 0.0001624151046 53 30.33 0.00012 5.0e-01 0.30 41 5 265 4.12 30.333 1.7473 48 29.43 0.00070 2.9 -0.5 0.09600 0.05887 1.63080
tagtaa tagtaa 0.0004015827716 0.0002532261638 75 47.29 0.00012 5.0e-01 0.30 42 0 375 4.03 47.293 1.5859 72 45.13 6.1e-05 0.25 0.6 0.14400 0.09026 1.59537
aacaat aacaat 0.0007924566692 0.0005764028353 148 107.65 0.00013 5.4e-01 0.27 43 0 735 3.89 107.650 1.3748 126 96.87 0.00084 3.4 -0.5 0.25200 0.19375 1.30065
atcatc atcatc 0.0004176460824 0.0002669342911 78 49.85 0.00014 5.6e-01 0.25 44 6 388 3.99 49.853 1.5646 67 47.45 0.00275 11 -1.1 0.13400 0.09491 1.41189
atataa atataa 0.0008406466018 0.0006190122688 157 115.61 0.00015 6.0e-01 0.22 45 1 780 3.85 115.607 1.3580 133 103.24 0.00084 3.4 -0.5 0.26600 0.20649 1.28821
ctgcta ctgcta 0.0003266206542 0.0001964275566 61 36.69 0.00015 6.1e-01 0.22 46 0 305 4.01 36.685 1.6628 52 35.37 0.00380 16 -1.2 0.10400 0.07075 1.46997
ataatg ataatg 0.0004926081998 0.0003287409216 92 61.40 0.00016 6.5e-01 0.18 47 0 458 3.91 61.396 1.4985 79 57.79 0.00269 11 -1.0 0.15800 0.11557 1.36713
ggcgta ggcgta 0.0001766964195 0.0000882115951 33 16.47 0.00022 8.9e-01 0.05 48 0 165 4.07 16.474 2.0031 32 16.21 0.00026 1.1 -0.0 0.06400 0.03241 1.97449
ctacca ctacca 0.0003587472759 0.0002253923408 67 42.09 0.00024 9.9e-01 0.00 49 0 327 3.84 42.094 1.5917 58 40.38 0.00371 15 -1.2 0.11600 0.08075 1.43651
; Host name rsat
; Job started 2026-05-11.133715
; Job done 2026-05-11.133715
; Seconds 0.92
; user 0.92
; system 0.02
; cuser 0
; csystem 0
; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 7 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_7nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Slow counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 7
; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_7nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model Markov
; Background estimation method Markov model estimated from input sequences
; Markov chain order 2
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 6.103515625e-07
; Sequence type DNA
; Nb of sequences 500
; Sum of sequence lengths 189796
; discarded residues 535 (other letters than ACGT)
; discarded occurrences 535 (contain discarded residues)
; nb possible positions 186261
; total oligo occurrences 186261
; total overlapping occurrences 627
; total non overlapping occ 185634
; alphabet size 4
; nb possible oligomers 16384
; oligomers tested for significance 16203
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 obs_freq observed relative frequency
; 4 exp_freq expected relative frequency
; 5 occ observed occurrences
; 6 exp_occ expected occurrences
; 7 occ_P occurrence probability (binomial)
; 8 occ_E E-value for occurrences (binomial)
; 9 occ_sig occurrence significance (binomial)
; 10 rank rank
; 11 ovl_occ number of overlapping occurrences (discarded from the count)
; 12 forbocc forbidden positions (to avoid self-overlap)
; 13 zscore z-score (Gaussian approximation)
; 14 exp_var estimation of the variance on occurrences
; 15 ratio observed/expected ratio
; 16 ms number of matching sequences
; 17 exp_ms expected number of matching sequences
; 18 ms_P matching sequence probability (binomial)
; 19 ms_E E-value for matching sequences (binomial)
; 20 ms_sig matching sequenc significance (binomial)
; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence)
; 22 exp_msf expected proportion matching sequences
; 23 ms_rati observed/expected numbers of matching sequences
#seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati
gatgatg gatgatg 0.0001932771756 0.0000492060911 36 9.17 1.6e-11 2.6e-07 6.58 1 2 210 8.86 9.165 3.9279 34 9.08 1e-10 1.7e-06 5.8 0.06800 0.01816 3.74371
caacaac caacaac 0.0002630717112 0.0000929633159 49 17.32 3.6e-10 5.9e-06 5.23 2 5 294 7.61 17.315 2.8298 37 17.02 1.2e-05 0.2 0.7 0.07400 0.03404 2.17394
cttcttc cttcttc 0.0002791781425 0.0001076085579 52 20.04 2e-09 3.2e-05 4.50 3 6 312 7.14 20.043 2.5944 48 19.65 2e-08 0.00033 3.5 0.09600 0.03930 2.44301
tatataa tatataa 0.0003704479199 0.0001674831130 69 31.20 3.6e-09 5.9e-05 4.23 4 0 408 6.77 31.196 2.2119 65 30.24 7.7e-09 0.00013 3.9 0.13000 0.06049 2.14913
atgatga atgatga 0.0002040147964 0.0000746637879 38 13.91 7.5e-08 1.2e-03 2.92 5 1 223 6.46 13.907 2.7324 35 13.72 6.8e-07 0.011 2.0 0.07000 0.02743 2.55180
ggtggtg ggtggtg 0.0001234826400 0.0000354721005 23 6.61 5.2e-07 8.4e-03 2.07 6 3 134 6.38 6.607 3.4811 22 6.56 1.3e-06 0.021 1.7 0.04400 0.01313 3.35176
cggtggt cggtggt 0.0001020073982 0.0000263872537 19 4.91 1.1e-06 1.8e-02 1.75 7 0 111 6.35 4.915 3.8658 19 4.89 8.4e-07 0.014 1.9 0.03800 0.00978 3.88476
ttctttt ttctttt 0.0005261434224 0.0003150761754 98 58.69 1.7e-06 2.8e-02 1.56 8 2 578 5.13 58.686 1.6699 84 55.38 7.9e-05 1.3 -0.1 0.16800 0.11076 1.51675
cgatgac cgatgac 0.0000966385878 0.0000249729469 18 4.65 2e-06 3.3e-02 1.48 9 0 101 6.19 4.651 3.8697 16 4.63 2.5e-05 0.41 0.4 0.03200 0.00926 3.45574
aatagca aatagca 0.0002040147964 0.0000865060676 38 16.11 2.4e-06 3.9e-02 1.41 10 0 228 5.45 16.113 2.3584 34 15.86 3.6e-05 0.59 0.2 0.06800 0.03171 2.14423
tgatgaa tgatgaa 0.0002308588486 0.0001043183771 43 19.43 2.7e-06 4.4e-02 1.36 11 0 249 5.35 19.430 2.2130 35 19.06 0.00051 8.4 -0.9 0.07000 0.03812 1.83643
tgctgct tgctgct 0.0001503266921 0.0000550075187 28 10.25 3.5e-06 5.7e-02 1.24 12 2 168 5.55 10.246 2.7328 24 10.14 0.00012 2 -0.3 0.04800 0.02028 2.36645
ttcttct ttcttct 0.0003167598155 0.0001651734833 59 30.77 4e-06 6.4e-02 1.19 13 5 343 5.09 30.765 1.9177 56 29.84 5.9e-06 0.097 1.0 0.11200 0.05968 1.87665
ttatttt ttatttt 0.0004670865076 0.0002767138498 87 51.54 4.2e-06 6.8e-02 1.17 14 1 510 4.94 51.541 1.6880 78 48.98 3e-05 0.5 0.3 0.15600 0.09796 1.59249
gctgctg gctgctg 0.0001127450191 0.0000348254703 21 6.49 4.7e-06 7.7e-02 1.12 15 1 126 5.70 6.487 3.2374 20 6.44 1.2e-05 0.2 0.7 0.04000 0.01289 3.10326
tgatgat tgatgat 0.0001718019338 0.0000688940153 32 12.83 4.8e-06 7.8e-02 1.11 16 3 188 5.35 12.832 2.4937 32 12.67 2.6e-06 0.042 1.4 0.06400 0.02534 2.52576
ttttctt ttttctt 0.0005154058015 0.0003150761754 96 58.69 4.9e-06 7.9e-02 1.10 17 3 572 4.87 58.686 1.6358 83 55.38 0.00013 2.1 -0.3 0.16600 0.11076 1.49870
gacgaag gacgaag 0.0001395890712 0.0000501000811 26 9.33 5.5e-06 8.9e-02 1.05 18 0 152 5.46 9.332 2.7862 22 9.25 0.00021 3.5 -0.5 0.04400 0.01849 2.37957
ggtggta ggtggta 0.0001288514504 0.0000444714563 24 8.28 6.6e-06 1.1e-01 0.97 19 0 134 5.46 8.283 2.8974 22 8.22 4.1e-05 0.67 0.2 0.04400 0.01643 2.67795
ctctttt ctctttt 0.0003274974364 0.0001761807886 61 32.82 7e-06 1.1e-01 0.95 20 0 366 4.92 32.816 1.8589 52 31.76 0.00039 6.3 -0.8 0.10400 0.06353 1.63704
aagagga aagagga 0.0002415964695 0.0001172060601 45 21.83 9.4e-06 1.5e-01 0.82 21 0 267 4.96 21.831 2.0613 42 21.36 3.3e-05 0.54 0.3 0.08400 0.04272 1.96607
tcttttt tcttttt 0.0005046681807 0.0003132204611 94 58.34 1.1e-05 1.7e-01 0.76 22 0 561 4.67 58.341 1.6112 77 55.07 0.00170 28 -1.4 0.15400 0.11015 1.39812
aacagca aacagca 0.0001932771756 0.0000877165863 36 16.34 1.8e-05 2.9e-01 0.54 23 0 214 4.86 16.338 2.2034 27 16.07 0.00697 1.1e+02 -2.1 0.05400 0.03215 1.67965
caacagc caacagc 0.0001449578817 0.0000571368992 27 10.64 1.9e-05 3.0e-01 0.52 24 0 162 5.01 10.642 2.5370 20 10.53 0.00545 89 -2.0 0.04000 0.02106 1.89930
actacca actacca 0.0001556955025 0.0000638025961 29 11.88 1.9e-05 3.1e-01 0.51 25 0 170 4.97 11.884 2.4403 25 11.74 0.00043 7 -0.8 0.05000 0.02349 2.12871
caatggc caatggc 0.0001395890712 0.0000541116911 26 10.08 2e-05 3.3e-01 0.49 26 0 156 5.01 10.079 2.5796 24 9.98 9.6e-05 1.6 -0.2 0.04800 0.01996 2.40523
gcgatga gcgatga 0.0000912697774 0.0000269477783 17 5.02 2.1e-05 3.4e-01 0.47 27 0 97 5.35 5.019 3.3869 17 4.99 1.7e-05 0.28 0.6 0.03400 0.00999 3.40390
ccattga ccattga 0.0001718019338 0.0000750313205 32 13.98 2.5e-05 4.0e-01 0.40 28 0 192 4.82 13.975 2.2897 29 13.78 0.00018 3 -0.5 0.05800 0.02756 2.10413
gataatg gataatg 0.0001556955025 0.0000652511929 29 12.15 2.8e-05 4.6e-01 0.34 29 2 174 4.83 12.154 2.3861 27 12.01 0.00011 1.8 -0.2 0.05400 0.02402 2.24857
tcctcca tcctcca 0.0001503266921 0.0000619635882 28 11.54 2.9e-05 4.7e-01 0.33 30 0 168 4.84 11.541 2.4260 26 11.41 0.00012 1.9 -0.3 0.05200 0.02282 2.27879
gacgatg gacgatg 0.0000912697774 0.0000289230115 17 5.39 4.9e-05 8.0e-01 0.10 31 0 102 5.00 5.387 3.1556 17 5.36 4.1e-05 0.67 0.2 0.03400 0.01072 3.17260
atatata atatata 0.0003113910051 0.0001780106025 58 33.16 5.9e-05 9.5e-01 0.02 32 21 342 4.31 33.156 1.7493 53 32.08 0.00027 4.5 -0.7 0.10600 0.06417 1.65193
gaggaaa gaggaaa 0.0002201212277 0.0001116895045 41 20.80 5.9e-05 9.6e-01 0.02 33 0 240 4.43 20.803 1.9708 41 20.38 2.4e-05 0.4 0.4 0.08200 0.04076 2.01201
; Host name rsat
; Job started 2026-05-11.133716
; Job done 2026-05-11.133717
; Seconds 1.51
; user 1.51
; system 0.03
; cuser 0
; csystem 0
; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 8 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_8nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Slow counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 8
; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_8nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model Markov
; Background estimation method Markov model estimated from input sequences
; Markov chain order 2
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 1.52587890625e-07
; Sequence type DNA
; Nb of sequences 500
; Sum of sequence lengths 189796
; discarded residues 535 (other letters than ACGT)
; discarded occurrences 535 (contain discarded residues)
; nb possible positions 185761
; total oligo occurrences 185761
; total overlapping occurrences 372
; total non overlapping occ 185389
; alphabet size 4
; nb possible oligomers 65536
; oligomers tested for significance 54084
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 obs_freq observed relative frequency
; 4 exp_freq expected relative frequency
; 5 occ observed occurrences
; 6 exp_occ expected occurrences
; 7 occ_P occurrence probability (binomial)
; 8 occ_E E-value for occurrences (binomial)
; 9 occ_sig occurrence significance (binomial)
; 10 rank rank
; 11 ovl_occ number of overlapping occurrences (discarded from the count)
; 12 forbocc forbidden positions (to avoid self-overlap)
; 13 zscore z-score (Gaussian approximation)
; 14 exp_var estimation of the variance on occurrences
; 15 ratio observed/expected ratio
; 16 ms number of matching sequences
; 17 exp_ms expected number of matching sequences
; 18 ms_P matching sequence probability (binomial)
; 19 ms_E E-value for matching sequences (binomial)
; 20 ms_sig matching sequenc significance (binomial)
; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence)
; 22 exp_msf expected proportion matching sequences
; 23 ms_rati observed/expected numbers of matching sequences
#seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati
gatgatga gatgatga 0.0000915154419 0.0000148233009 17 2.75 6.3e-09 3.4e-04 3.46 1 0 116 8.59 2.754 6.1738 17 2.75 5e-09 0.00033 3.5 0.03400 0.00549 6.19073
caacaaca caacaaca 0.0001238150096 0.0000318511213 23 5.92 7.9e-08 4.3e-03 2.37 2 2 161 7.02 5.917 3.8873 16 5.88 0.00037 25 -1.4 0.03200 0.01176 2.72020
aagaggaa aagaggaa 0.0001507313160 0.0000453251708 28 8.42 8.2e-08 4.4e-03 2.35 3 0 191 6.75 8.420 3.3256 27 8.35 1.7e-07 0.011 2.0 0.05400 0.01670 3.23379
tcttcttc tcttcttc 0.0001238150096 0.0000345025517 23 6.41 3.1e-07 1.7e-02 1.77 4 5 161 6.55 6.409 3.5886 20 6.37 1e-05 0.66 0.2 0.04000 0.01274 3.14049
ctcttttt ctcttttt 0.0001776476225 0.0000640316740 33 11.89 3.7e-07 2.0e-02 1.70 5 0 231 6.12 11.895 2.7744 31 11.75 1.5e-06 0.1 1.0 0.06200 0.02351 2.63727
tctttttt tctttttt 0.0002583965418 0.0001138818246 48 21.15 3.8e-07 2.0e-02 1.69 6 1 336 5.84 21.155 2.2690 44 20.71 3.2e-06 0.21 0.7 0.08800 0.04143 2.12410
tgatgatg tgatgatg 0.0000753656580 0.0000136156508 14 2.53 4.8e-07 2.6e-02 1.58 7 1 98 7.21 2.529 5.5352 14 2.52 4.1e-07 0.027 1.6 0.02800 0.00505 5.54920
tggtggtg tggtggtg 0.0000699823967 0.0000123645680 13 2.30 9.5e-07 5.2e-02 1.29 8 1 91 7.06 2.297 5.6599 13 2.29 8.4e-07 0.055 1.3 0.02600 0.00458 5.67289
cagcaaca cagcaaca 0.0000861321806 0.0000190270977 16 3.53 1e-06 5.6e-02 1.25 9 0 112 6.63 3.534 4.5268 12 3.52 0.00029 19 -1.3 0.02400 0.00704 3.40709
tttttttc tttttttc 0.0002853128482 0.0001392337974 53 25.86 1.9e-06 1.0e-01 0.98 10 0 371 5.34 25.864 2.0492 46 25.21 8e-05 5.3 -0.7 0.09200 0.05042 1.82479
tatatata tatatata 0.0001399647935 0.0000481653494 26 8.95 2.7e-06 1.4e-01 0.84 11 15 175 5.70 8.947 2.9059 25 8.87 5.2e-06 0.34 0.5 0.05000 0.01774 2.81916
tatataaa tatataaa 0.0001614978386 0.0000609840629 30 11.33 3e-06 1.6e-01 0.79 12 0 210 5.55 11.328 2.6482 29 11.20 4.8e-06 0.31 0.5 0.05800 0.02240 2.58896
ttatataa ttatataa 0.0001399647935 0.0000494952916 26 9.19 4.3e-06 2.3e-01 0.64 13 0 182 5.54 9.194 2.8278 25 9.11 8.2e-06 0.54 0.3 0.05000 0.01822 2.74409
atataata atataata 0.0001238150096 0.0000411332783 23 7.64 5.5e-06 3.0e-01 0.52 14 0 161 5.56 7.641 3.0101 23 7.58 3.9e-06 0.26 0.6 0.04600 0.01517 3.03309
acaacaac acaacaac 0.0000968987032 0.0000273606836 18 5.08 6.7e-06 3.6e-01 0.44 15 2 125 5.73 5.083 3.5415 17 5.06 2e-05 1.3 -0.1 0.03400 0.01011 3.36176
ataataac ataataac 0.0000915154419 0.0000249726014 17 4.64 7.8e-06 4.2e-01 0.38 16 0 119 5.74 4.639 3.6646 16 4.62 2.4e-05 1.6 -0.2 0.03200 0.00924 3.46505
cggtggta cggtggta 0.0000484493516 0.0000070301147 9 1.31 9.5e-06 5.1e-01 0.29 17 0 63 6.73 1.306 6.8917 9 1.30 8.9e-06 0.58 0.2 0.01800 0.00261 6.90067
gaagagga gaagagga 0.0000915154419 0.0000258409092 17 4.80 1.2e-05 6.5e-01 0.19 18 0 119 5.57 4.800 3.5415 16 4.78 3.6e-05 2.4 -0.4 0.03200 0.00955 3.34915
ttcctcga ttcctcga 0.0000645991354 0.0000134051627 12 2.49 1.2e-05 6.6e-01 0.18 19 0 84 6.03 2.490 4.8190 12 2.48 1.1e-05 0.71 0.1 0.02400 0.00497 4.83095
atgatgaa atgatgaa 0.0000968987032 0.0000288430520 18 5.36 1.3e-05 7.3e-01 0.14 20 0 122 5.46 5.358 3.3595 18 5.33 1.1e-05 0.71 0.2 0.03600 0.01066 3.37750
ttgatgat ttgatgat 0.0000861321806 0.0000234494097 16 4.36 1.4e-05 7.4e-01 0.13 21 0 112 5.58 4.356 3.6731 16 4.34 1.1e-05 0.75 0.1 0.03200 0.00867 3.68909
aaaaaaat aaaaaaat 0.0003122291547 0.0001692452639 58 31.44 1.4e-05 7.6e-01 0.12 22 0 403 4.74 31.439 1.8448 53 30.47 7.8e-05 5.1 -0.7 0.10600 0.06095 1.73921
gaagacga gaagacga 0.0000753656580 0.0000185419554 14 3.44 1.6e-05 8.5e-01 0.07 23 1 98 5.69 3.444 4.0646 13 3.43 5.8e-05 3.8 -0.6 0.02600 0.00687 3.78725
gaaaaaaa gaaaaaaa 0.0002960793708 0.0001588864333 55 29.51 1.8e-05 9.5e-01 0.02 24 0 378 4.69 29.515 1.8635 51 28.66 6.1e-05 4 -0.6 0.10200 0.05733 1.77931
aaaaaatg aaaaaatg 0.0001991806676 0.0000915928355 37 17.01 1.8e-05 9.9e-01 0.00 25 0 256 4.85 17.014 2.1746 36 16.73 2e-05 1.3 -0.1 0.07200 0.03346 2.15196
; Host name rsat
; Job started 2026-05-11.133717
; Job done 2026-05-11.133721
; Seconds 4.25
; user 4.25
; system 0.1
; cuser 0
; csystem 0