; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 8 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_8nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Slow counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 8
; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_8nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model Markov
; Background estimation method Markov model estimated from input sequences
; Markov chain order 2
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 1.52587890625e-07
; Sequence type DNA
; Nb of sequences 500
; Sum of sequence lengths 189796
; discarded residues 535 (other letters than ACGT)
; discarded occurrences 535 (contain discarded residues)
; nb possible positions 185761
; total oligo occurrences 185761
; total overlapping occurrences 372
; total non overlapping occ 185389
; alphabet size 4
; nb possible oligomers 65536
; oligomers tested for significance 54084
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 obs_freq observed relative frequency
; 4 exp_freq expected relative frequency
; 5 occ observed occurrences
; 6 exp_occ expected occurrences
; 7 occ_P occurrence probability (binomial)
; 8 occ_E E-value for occurrences (binomial)
; 9 occ_sig occurrence significance (binomial)
; 10 rank rank
; 11 ovl_occ number of overlapping occurrences (discarded from the count)
; 12 forbocc forbidden positions (to avoid self-overlap)
; 13 zscore z-score (Gaussian approximation)
; 14 exp_var estimation of the variance on occurrences
; 15 ratio observed/expected ratio
; 16 ms number of matching sequences
; 17 exp_ms expected number of matching sequences
; 18 ms_P matching sequence probability (binomial)
; 19 ms_E E-value for matching sequences (binomial)
; 20 ms_sig matching sequenc significance (binomial)
; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence)
; 22 exp_msf expected proportion matching sequences
; 23 ms_rati observed/expected numbers of matching sequences
#seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati
gatgatga gatgatga 0.0000915154419 0.0000148233009 17 2.75 6.3e-09 3.4e-04 3.46 1 0 116 8.59 2.754 6.1738 17 2.75 5e-09 0.00033 3.5 0.03400 0.00549 6.19073
caacaaca caacaaca 0.0001238150096 0.0000318511213 23 5.92 7.9e-08 4.3e-03 2.37 2 2 161 7.02 5.917 3.8873 16 5.88 0.00037 25 -1.4 0.03200 0.01176 2.72020
aagaggaa aagaggaa 0.0001507313160 0.0000453251708 28 8.42 8.2e-08 4.4e-03 2.35 3 0 191 6.75 8.420 3.3256 27 8.35 1.7e-07 0.011 2.0 0.05400 0.01670 3.23379
tcttcttc tcttcttc 0.0001238150096 0.0000345025517 23 6.41 3.1e-07 1.7e-02 1.77 4 5 161 6.55 6.409 3.5886 20 6.37 1e-05 0.66 0.2 0.04000 0.01274 3.14049
ctcttttt ctcttttt 0.0001776476225 0.0000640316740 33 11.89 3.7e-07 2.0e-02 1.70 5 0 231 6.12 11.895 2.7744 31 11.75 1.5e-06 0.1 1.0 0.06200 0.02351 2.63727
tctttttt tctttttt 0.0002583965418 0.0001138818246 48 21.15 3.8e-07 2.0e-02 1.69 6 1 336 5.84 21.155 2.2690 44 20.71 3.2e-06 0.21 0.7 0.08800 0.04143 2.12410
tgatgatg tgatgatg 0.0000753656580 0.0000136156508 14 2.53 4.8e-07 2.6e-02 1.58 7 1 98 7.21 2.529 5.5352 14 2.52 4.1e-07 0.027 1.6 0.02800 0.00505 5.54920
tggtggtg tggtggtg 0.0000699823967 0.0000123645680 13 2.30 9.5e-07 5.2e-02 1.29 8 1 91 7.06 2.297 5.6599 13 2.29 8.4e-07 0.055 1.3 0.02600 0.00458 5.67289
cagcaaca cagcaaca 0.0000861321806 0.0000190270977 16 3.53 1e-06 5.6e-02 1.25 9 0 112 6.63 3.534 4.5268 12 3.52 0.00029 19 -1.3 0.02400 0.00704 3.40709
tttttttc tttttttc 0.0002853128482 0.0001392337974 53 25.86 1.9e-06 1.0e-01 0.98 10 0 371 5.34 25.864 2.0492 46 25.21 8e-05 5.3 -0.7 0.09200 0.05042 1.82479
tatatata tatatata 0.0001399647935 0.0000481653494 26 8.95 2.7e-06 1.4e-01 0.84 11 15 175 5.70 8.947 2.9059 25 8.87 5.2e-06 0.34 0.5 0.05000 0.01774 2.81916
tatataaa tatataaa 0.0001614978386 0.0000609840629 30 11.33 3e-06 1.6e-01 0.79 12 0 210 5.55 11.328 2.6482 29 11.20 4.8e-06 0.31 0.5 0.05800 0.02240 2.58896
ttatataa ttatataa 0.0001399647935 0.0000494952916 26 9.19 4.3e-06 2.3e-01 0.64 13 0 182 5.54 9.194 2.8278 25 9.11 8.2e-06 0.54 0.3 0.05000 0.01822 2.74409
atataata atataata 0.0001238150096 0.0000411332783 23 7.64 5.5e-06 3.0e-01 0.52 14 0 161 5.56 7.641 3.0101 23 7.58 3.9e-06 0.26 0.6 0.04600 0.01517 3.03309
acaacaac acaacaac 0.0000968987032 0.0000273606836 18 5.08 6.7e-06 3.6e-01 0.44 15 2 125 5.73 5.083 3.5415 17 5.06 2e-05 1.3 -0.1 0.03400 0.01011 3.36176
ataataac ataataac 0.0000915154419 0.0000249726014 17 4.64 7.8e-06 4.2e-01 0.38 16 0 119 5.74 4.639 3.6646 16 4.62 2.4e-05 1.6 -0.2 0.03200 0.00924 3.46505
cggtggta cggtggta 0.0000484493516 0.0000070301147 9 1.31 9.5e-06 5.1e-01 0.29 17 0 63 6.73 1.306 6.8917 9 1.30 8.9e-06 0.58 0.2 0.01800 0.00261 6.90067
gaagagga gaagagga 0.0000915154419 0.0000258409092 17 4.80 1.2e-05 6.5e-01 0.19 18 0 119 5.57 4.800 3.5415 16 4.78 3.6e-05 2.4 -0.4 0.03200 0.00955 3.34915
ttcctcga ttcctcga 0.0000645991354 0.0000134051627 12 2.49 1.2e-05 6.6e-01 0.18 19 0 84 6.03 2.490 4.8190 12 2.48 1.1e-05 0.71 0.1 0.02400 0.00497 4.83095
atgatgaa atgatgaa 0.0000968987032 0.0000288430520 18 5.36 1.3e-05 7.3e-01 0.14 20 0 122 5.46 5.358 3.3595 18 5.33 1.1e-05 0.71 0.2 0.03600 0.01066 3.37750
ttgatgat ttgatgat 0.0000861321806 0.0000234494097 16 4.36 1.4e-05 7.4e-01 0.13 21 0 112 5.58 4.356 3.6731 16 4.34 1.1e-05 0.75 0.1 0.03200 0.00867 3.68909
aaaaaaat aaaaaaat 0.0003122291547 0.0001692452639 58 31.44 1.4e-05 7.6e-01 0.12 22 0 403 4.74 31.439 1.8448 53 30.47 7.8e-05 5.1 -0.7 0.10600 0.06095 1.73921
gaagacga gaagacga 0.0000753656580 0.0000185419554 14 3.44 1.6e-05 8.5e-01 0.07 23 1 98 5.69 3.444 4.0646 13 3.43 5.8e-05 3.8 -0.6 0.02600 0.00687 3.78725
gaaaaaaa gaaaaaaa 0.0002960793708 0.0001588864333 55 29.51 1.8e-05 9.5e-01 0.02 24 0 378 4.69 29.515 1.8635 51 28.66 6.1e-05 4 -0.6 0.10200 0.05733 1.77931
aaaaaatg aaaaaatg 0.0001991806676 0.0000915928355 37 17.01 1.8e-05 9.9e-01 0.00 25 0 256 4.85 17.014 2.1746 36 16.73 2e-05 1.3 -0.1 0.07200 0.03346 2.15196
; Host name rsat
; Job started 2026-05-11.133717
; Job done 2026-05-11.133721
; Seconds 4.25
; user 4.25
; system 0.1
; cuser 0
; csystem 0