; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.134158_jt9VCY.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 7 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.134158_qgrcwl_7nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Slow counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 7
; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.134158_jt9VCY.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.134158_qgrcwl_7nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model Markov
; Background estimation method Markov model estimated from input sequences
; Markov chain order 2
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 6.103515625e-07
; Sequence type DNA
; Nb of sequences 500
; Sum of sequence lengths 100000
; discarded residues 320 (other letters than ACGT)
; discarded occurrences 320 (contain discarded residues)
; nb possible positions 96680
; total oligo occurrences 96680
; total overlapping occurrences 434
; total non overlapping occ 96246
; alphabet size 4
; nb possible oligomers 16384
; oligomers tested for significance 15396
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 obs_freq observed relative frequency
; 4 exp_freq expected relative frequency
; 5 occ observed occurrences
; 6 exp_occ expected occurrences
; 7 occ_P occurrence probability (binomial)
; 8 occ_E E-value for occurrences (binomial)
; 9 occ_sig occurrence significance (binomial)
; 10 rank rank
; 11 ovl_occ number of overlapping occurrences (discarded from the count)
; 12 forbocc forbidden positions (to avoid self-overlap)
; 13 zscore z-score (Gaussian approximation)
; 14 exp_var estimation of the variance on occurrences
; 15 ratio observed/expected ratio
; 16 ms number of matching sequences
; 17 exp_ms expected number of matching sequences
; 18 ms_P matching sequence probability (binomial)
; 19 ms_E E-value for matching sequences (binomial)
; 20 ms_sig matching sequence significance (binomial)
; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence)
; 22 exp_msf expected proportion matching sequences
; 23 ms_rati observed/expected numbers of matching sequences
#seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati
ttttctt ttttctt 0.0009309060819 0.0004906926829 90 47.44 2.4e-08 3.8e-04 3.42 1 2 529 6.18 47.440 1.8971 74 45.27 2.2e-05 0.35 0.5 0.14800 0.09054 1.63465
tttcttt tttcttt 0.0009102192801 0.0004906926829 88 47.44 8.9e-08 1.4e-03 2.86 2 1 510 5.89 47.440 1.8550 77 45.27 3.5e-06 0.058 1.2 0.15400 0.09054 1.70092
atatata atatata 0.0006930078610 0.0003615487579 67 34.95 9.5e-07 1.5e-02 1.84 3 20 402 5.42 34.955 1.9168 59 33.77 2.6e-05 0.43 0.4 0.11800 0.06753 1.74729
gaaaatg gaaaatg 0.0003206454282 0.0001274808789 31 12.32 5.7e-06 8.7e-02 1.06 4 0 177 5.32 12.325 2.5152 30 12.17 8.4e-06 0.14 0.9 0.06000 0.02435 2.46407
tcctttt tcctttt 0.0004654530410 0.0002236145429 45 21.62 7.4e-06 1.1e-01 0.94 5 0 270 5.03 21.619 2.0815 40 21.16 0.00012 1.9 -0.3 0.08000 0.04232 1.89030
ttctttt ttctttt 0.0008274720728 0.0004906926829 80 47.44 1e-05 1.6e-01 0.81 6 2 475 4.73 47.440 1.6863 71 45.27 0.00012 1.9 -0.3 0.14200 0.09054 1.56838
tcttgtt tcttgtt 0.0003309888291 0.0001391690580 32 13.45 1.2e-05 1.9e-01 0.73 7 0 192 5.06 13.455 2.3783 31 13.28 1.7e-05 0.27 0.6 0.06200 0.02655 2.33498
tatataa tatataa 0.0005688870501 0.0003012466997 55 29.12 1.2e-05 1.9e-01 0.72 8 0 330 4.79 29.125 1.8884 53 28.30 1.1e-05 0.18 0.7 0.10600 0.05659 1.87301
tatatat tatatat 0.0006206040546 0.0003426965616 60 33.13 1.7e-05 2.6e-01 0.58 9 19 357 4.67 33.132 1.8109 55 32.06 8.1e-05 1.3 -0.1 0.11000 0.06413 1.71535
ttattat ttattat 0.0003930492346 0.0001865862821 38 18.04 2.8e-05 4.3e-01 0.37 10 2 224 4.70 18.039 2.1065 34 17.72 0.00029 4.7 -0.7 0.06800 0.03544 1.91882
ttttttc ttttttc 0.0009102192801 0.0005785421589 88 55.93 4.5e-05 6.9e-01 0.16 11 0 516 4.29 55.933 1.5733 73 52.93 0.00318 52 -1.7 0.14600 0.10587 1.37911
ctctttt ctctttt 0.0004447662391 0.0002289489701 43 22.13 5.5e-05 8.4e-01 0.07 12 0 258 4.43 22.135 1.9426 40 21.65 0.00018 3 -0.5 0.08000 0.04331 1.84720
; Host name rsat
; Job started 2026-05-11.134159
; Job done 2026-05-11.134200
; Seconds 1.15
; user 1.15
; system 0.04
; cuser 0
; csystem 0