; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.134158_jt9VCY.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 8 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.134158_qgrcwl_8nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Slow counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 8
; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.134158_jt9VCY.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.134158_qgrcwl_8nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model Markov
; Background estimation method Markov model estimated from input sequences
; Markov chain order 2
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 1.52587890625e-07
; Sequence type DNA
; Nb of sequences 500
; Sum of sequence lengths 100000
; discarded residues 320 (letters other than ACGT)
; discarded occurrences 320 (contain discarded residues)
; nb possible positions 96180
; total oligo occurrences 96180
; total overlapping occurrences 247
; total non overlapping occ 95933
; alphabet size 4
; nb possible oligomers 65536
; oligomers tested for significance 41529
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 obs_freq observed relative frequency
; 4 exp_freq expected relative frequency
; 5 occ observed occurrences
; 6 exp_occ expected occurrences
; 7 occ_P occurrence probability (binomial)
; 8 occ_E E-value for occurrences (binomial)
; 9 occ_sig occurrence significance (binomial)
; 10 rank rank
; 11 ovl_occ number of overlapping occurrences (discarded from the count)
; 12 forbocc forbidden positions (to avoid self-overlap)
; 13 zscore z-score (Gaussian approximation)
; 14 exp_var estimation of the variance on occurrences
; 15 ratio observed/expected ratio
; 16 ms number of matching sequences
; 17 exp_ms expected number of matching sequences
; 18 ms_P matching sequence probability (binomial)
; 19 ms_E E-value for matching sequences (binomial)
; 20 ms_sig matching sequence significance (binomial)
; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence)
; 22 exp_msf expected proportion matching sequences
; 23 ms_rati observed/expected numbers of matching sequences
#seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati
catatata catatata 0.0002911208151 0.0000703856513 28 6.77 8.8e-10 3.7e-05 4.44 1 0 196 8.16 6.770 4.1361 26 6.72 9e-09 0.00059 3.2 0.05200 0.01345 3.86657
ttcttgtt ttcttgtt 0.0002079434394 0.0000548007102 20 5.27 7.7e-07 3.2e-02 1.50 2 0 140 6.42 5.271 3.7945 20 5.24 5.7e-07 0.038 1.4 0.04000 0.01049 3.81447
gaaaatga gaaaatga 0.0001663547515 0.0000370307679 16 3.56 1.1e-06 4.8e-02 1.32 3 0 97 6.59 3.562 4.4923 15 3.55 4.4e-06 0.29 0.5 0.03000 0.00710 4.22651
cttttctt cttttctt 0.0002911208151 0.0001006401852 28 9.68 1.2e-06 5.1e-02 1.29 4 0 194 5.89 9.680 2.8927 28 9.59 7.3e-07 0.048 1.3 0.05600 0.01917 2.92063
tttctttt tttctttt 0.0004366812227 0.0001947371240 42 18.73 2.5e-06 1.1e-01 0.98 5 1 294 5.38 18.730 2.2424 39 18.39 1.2e-05 0.8 0.1 0.07800 0.03677 2.12128
ttttcttt ttttcttt 0.0004366812227 0.0001947371240 42 18.73 2.5e-06 1.1e-01 0.98 6 0 280 5.38 18.730 2.2424 37 18.39 6.1e-05 4 -0.6 0.07400 0.03677 2.01250
tttttttc tttttttc 0.0004782699106 0.0002296172828 46 22.08 5.8e-06 2.4e-01 0.62 7 0 318 5.09 22.085 2.0829 39 21.61 0.00035 23 -1.4 0.07800 0.04321 1.80502
ttgttttc ttgttttc 0.0002079434394 0.0000645966334 20 6.21 8.5e-06 3.5e-01 0.45 8 0 140 5.53 6.213 3.2191 18 6.17 7.1e-05 4.6 -0.7 0.03600 0.01235 2.91514
gctgccgg gctgccgg 0.0000519858598 0.0000027494683 5 0.26 8.7e-06 3.6e-01 0.44 9 0 35 9.21 0.264 18.9076 5 0.26 8.5e-06 0.56 0.3 0.01000 0.00053 18.91258
tatatata tatatata 0.0002911208151 0.0001136856815 28 10.93 1.1e-05 4.7e-01 0.33 10 11 196 5.16 10.934 2.5608 25 10.82 0.00013 8.3 -0.9 0.05000 0.02163 2.31135
atatatat atatatat 0.0003015179871 0.0001214735002 29 11.68 1.4e-05 5.8e-01 0.23 11 11 203 5.07 11.683 2.4822 27 11.55 5.7e-05 3.7 -0.6 0.05400 0.02310 2.33795
tccttttc tccttttc 0.0001663547515 0.0000466399633 16 4.49 2e-05 8.1e-01 0.09 12 0 112 5.44 4.486 3.5668 15 4.47 6.1e-05 4 -0.6 0.03000 0.00893 3.35881
; Host name rsat
; Job started 2026-05-11.134200
; Job done 2026-05-11.134203
; Seconds 2.98
; user 2.99
; system 0.08
; cuser 0
; csystem 0