; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.134158_jt9VCY.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 6 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.134158_qgrcwl_6nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Slow counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 6
; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.134158_jt9VCY.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.134158_qgrcwl_6nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model Markov
; Background estimation method Markov model estimated from input sequences
; Markov chain order 2
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 2.44140625e-06
; Sequence type DNA
; Nb of sequences 500
; Sum of sequence lengths 100000
; discarded residues 320 (other letters than ACGT)
; discarded occurrences 320 (contain discarded residues)
; nb possible positions 97180
; total oligo occurrences 97180
; total overlapping occurrences 733
; total non overlapping occ 96447
; alphabet size 4
; nb possible oligomers 4096
; oligomers tested for significance 4093
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 obs_freq observed relative frequency
; 4 exp_freq expected relative frequency
; 5 occ observed occurrences
; 6 exp_occ expected occurrences
; 7 occ_P occurrence probability (binomial)
; 8 occ_E E-value for occurrences (binomial)
; 9 occ_sig occurrence significance (binomial)
; 10 rank rank
; 11 ovl_occ number of overlapping occurrences (discarded from the count)
; 12 forbocc forbidden positions (to avoid self-overlap)
; 13 zscore z-score (Gaussian approximation)
; 14 exp_var estimation of the variance on occurrences
; 15 ratio observed/expected ratio
; 16 ms number of matching sequences
; 17 exp_ms expected number of matching sequences
; 18 ms_P matching sequence probability (binomial)
; 19 ms_E E-value for matching sequences (binomial)
; 20 ms_sig matching sequence significance (binomial)
; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence)
; 22 exp_msf expected proportion matching sequences
; 23 ms_rati observed/expected numbers of matching sequences
#seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati
tttctt tttctt 0.0018522329697 0.0012367670946 180 120.19 2.1e-07 8.8e-04 3.06 1 8 885 5.46 120.189 1.4976 137 106.89 0.00083 3.4 -0.5 0.27400 0.21379 1.28165
atcaag atcaag 0.0006688619057 0.0003542159453 65 34.42 2.2e-06 9.0e-03 2.05 2 0 318 5.21 34.423 1.8883 63 33.27 1.1e-06 0.0044 2.4 0.12600 0.06654 1.89359
tatata tatata 0.0015126569253 0.0010201723903 147 99.14 4.2e-06 1.7e-02 1.77 3 35 729 4.81 99.140 1.4827 121 89.97 0.00030 1.2 -0.1 0.24200 0.17994 1.34487
tccttt tccttt 0.0009158263017 0.0005641017323 89 54.82 1.4e-05 5.6e-02 1.25 4 0 441 4.62 54.819 1.6235 79 51.93 0.00012 0.5 0.3 0.15800 0.10387 1.52113
tctttt tctttt 0.0017287507718 0.0012450307404 168 120.99 3e-05 1.2e-01 0.91 5 4 825 4.27 120.992 1.3885 134 107.52 0.00286 12 -1.1 0.26800 0.21505 1.24622
ttcttt ttcttt 0.0017184605886 0.0012367670946 167 120.19 3.1e-05 1.3e-01 0.90 6 5 809 4.27 120.189 1.3895 135 106.89 0.00166 6.8 -0.8 0.27000 0.21379 1.26294
aaggaa aaggaa 0.0008849557522 0.0005573756181 86 54.17 4e-05 1.6e-01 0.79 7 0 409 4.33 54.166 1.5877 78 51.35 0.00014 0.58 0.2 0.15600 0.10270 1.51903
aagaaa aagaaa 0.0016155587569 0.0011752686536 157 114.21 8.5e-05 3.5e-01 0.46 8 8 778 4.00 114.213 1.3746 132 102.16 0.00078 3.2 -0.5 0.26400 0.20432 1.29208
tattat tattat 0.0009569870344 0.0006356992621 93 61.78 0.00013 5.2e-01 0.29 9 2 449 3.97 61.777 1.5054 85 58.13 0.00024 0.98 0.0 0.17000 0.11626 1.46222
aaaggg aaaggg 0.0004939287919 0.0002824531653 48 27.45 0.00024 9.8e-01 0.01 10 0 240 3.92 27.449 1.7487 45 26.71 0.00054 2.2 -0.3 0.09000 0.05343 1.68460
; Host name rsat
; Job started 2026-05-11.134158
; Job done 2026-05-11.134159
; Seconds 0.59
; user 0.59
; system 0.02
; cuser 0
; csystem 0