; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/04/21/tmp_sequence_2026-04-21.095539_8fvtbN.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return occ,proba,rank -2str -noov -quick_if_possible -seqtype dna -bg upstream-noorf -org Saccharomyces_cerevisiae -pseudo 0.01 -l 7 -o $RSAT/public_html/tmp/www-data/2026/04/21/oligo-analysis_2026-04-21.095539_9pJODJ_7nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42.
; Program version 1.169
; Quick counting mode
; Detection of over-represented words (right-tail test)
; Oligomer length 7
; Input file $RSAT/public_html/tmp/www-data/2026/04/21/tmp_sequence_2026-04-21.095539_8fvtbN.fasta.purged
; Input format fasta
; Output file $RSAT/public_html/tmp/www-data/2026/04/21/oligo-analysis_2026-04-21.095539_9pJODJ_7nt.tab
; Discard overlapping matches
; Counted on both strands
; grouped by pairs of reverse complements
; Background model upstream-noorf
; Organism Saccharomyces_cerevisiae
; Background estimation method Frequency file
; Expected frequency file $RSAT/public_html/data/genomes/Saccharomyces_cerevisiae/oligo-frequencies/7nt_upstream-noorf_Saccharomyces_cerevisiae-noov-2str.freq
; Pseudo-frequency 0.01
; Pseudo-frequency per oligo 1.220703125e-06
; Sequence type DNA
; Nb of sequences 19
; Sum of sequence lengths 9485
; discarded residues NA (quick mode) (other letters than ACGT)
; discarded occurrences NA (quick mode) (contain discarded residues)
; nb possible positions NA (quick mode)
; total oligo occurrences 9315
; total overlapping occurrences 149
; total non overlapping occ 9166
; alphabet size 4
; nb possible oligomers 8192
; oligomers tested for significance 8192
; Sequences:
; MET8 463
; MET32 547
; MET18 568
; MET30 177
; MET28 489
; MET6 687
; MET10 338
; MET13 380
; MET3 800
; MET14 800
; MET1 702
; MET17 800
; MET2 481
; MET4 800
; MET22 215
; MET7 250
; MET31 161
; MET12 384
; MET16 443
;
; column headers
; 1 seq oligomer sequence
; 2 id oligomer identifier
; 3 exp_freq expected relative frequency
; 4 occ observed occurrences
; 5 exp_occ expected occurrences
; 6 occ_P occurrence probability (binomial)
; 7 occ_E E-value for occurrences (binomial)
; 8 occ_sig occurrence significance (binomial)
; 9 rank rank
; 10 ovl_occ number of overlapping occurrences (discarded from the count)
; 11 forbocc forbidden positions (to avoid self-overlap)
#seq id exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc
cacgtga cacgtga|tcacgtg 0.0001115745941 17 1.04 2e-15 1.6e-11 10.78 1 4 102
aactgtg aactgtg|cacagtt 0.0001251617098 11 1.17 4.7e-08 3.8e-04 3.42 2 0 66
actgtgg actgtgg|ccacagt 0.0000810864320 9 0.76 1.1e-07 9.1e-04 3.04 3 0 54
acgtgac acgtgac|gtcacgt 0.0000747899638 8 0.70 7.4e-07 6.1e-03 2.22 4 1 48
cacgtgc cacgtgc|gcacgtg 0.0000668365302 7 0.62 4.2e-06 3.4e-02 1.47 5 0 42
ctgtggc ctgtggc|gccacag 0.0000684934956 7 0.64 4.9e-06 4.0e-02 1.40 6 0 42
agccaca agccaca|tgtggct 0.0000946735477 7 0.88 3.8e-05 3.1e-01 0.50 7 0 42
atgacta atgacta|tagtcat 0.0001692369875 9 1.58 4e-05 3.3e-01 0.48 8 0 54
tcatgaa tcatgaa|ttcatga 0.0001367604671 8 1.27 5.6e-05 4.6e-01 0.34 9 4 48
atgcgcg atgcgcg|cgcgcat 0.0000462901601 5 0.43 8.7e-05 7.1e-01 0.15 10 0 30
acgtgca acgtgca|tgcacgt 0.0000790980736 6 0.74 0.00012 9.7e-01 0.01 11 0 36
; Host name rsat
; Job started 2026-04-21.095541
; Job done 2026-04-21.095541
; Seconds 0.68
; user 0.68
; system 0.03
; cuser 0.1
; csystem 0.03