; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/04/21/tmp_sequence_2026-04-21.095625_Jui4eP.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return occ,proba,rank -1str -nogrouprc -noov -quick_if_possible -seqtype dna -bg upstream-noorf -org Saccharomyces_cerevisiae -pseudo 0.01 -l 7 -o $RSAT/public_html/tmp/www-data/2026/04/21/oligo-analysis_2026-04-21.095625_d1Zgoz_7nt.tab ; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42. ; Program version 1.169 ; Quick counting mode ; Detection of over-represented words (right-tail test) ; Oligomer length 7 ; Input file $RSAT/public_html/tmp/www-data/2026/04/21/tmp_sequence_2026-04-21.095625_Jui4eP.fasta.purged ; Input format fasta ; Output file $RSAT/public_html/tmp/www-data/2026/04/21/oligo-analysis_2026-04-21.095625_d1Zgoz_7nt.tab ; Discard overlapping matches ; Counted on a single strand ; Background model upstream-noorf ; Organism Saccharomyces_cerevisiae ; Background estimation method Frequency file ; Expected frequency file $RSAT/public_html/data/genomes/Saccharomyces_cerevisiae/oligo-frequencies/7nt_upstream-noorf_Saccharomyces_cerevisiae-noov-1str.freq ; Pseudo-frequency 0.01 ; Pseudo-frequency per oligo 6.103515625e-07 ; Sequence type DNA ; Nb of sequences 19 ; Sum of sequence lengths 9485 ; discarded residues NA (quick mode) (other letters than ACGT) ; discarded occurrences NA (quick mode) (contain discarded residues) ; nb possible positions NA (quick mode) ; total oligo occurrences 9315 ; total overlapping occurrences 74 ; total non overlapping occ 9241 ; alphabet size 4 ; nb possible oligomers 16384 ; oligomers tested for significance 16384 ; Sequences: ; MET8 463 ; MET32 547 ; MET18 568 ; MET30 177 ; MET28 489 ; MET6 687 ; MET10 338 ; MET13 380 ; MET3 800 ; MET14 800 ; MET1 702 ; MET17 800 ; MET2 481 ; MET4 800 ; MET22 215 ; MET7 250 ; MET31 161 ; MET12 384 ; MET16 443 ; ; column headers ; 1 seq oligomer sequence ; 2 id oligomer identifier ; 3 exp_freq expected relative frequency ; 4 occ observed occurrences ; 5 exp_occ expected occurrences ; 6 occ_P occurrence probability (binomial) ; 7 occ_E E-value for occurrences (binomial) ; 8 occ_sig occurrence significance (binomial) ; 9 rank rank ; 10 ovl_occ number of overlapping occurrences (discarded from the count) ; 11 forbocc forbidden positions (to avoid self-overlap) #seq id exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc cacgtga cacgtga 0.0000738482191 11 0.69 2.2e-10 3.6e-06 5.45 1 0 66 tcacgtg tcacgtg 0.0000718598608 10 0.67 2.7e-09 4.4e-05 4.35 2 0 60 gccacag gccacag 0.0000357380166 6 0.33 1.4e-06 2.3e-02 1.63 3 0 36 acgtgac acgtgac 0.0000364008027 6 0.34 1.6e-06 2.6e-02 1.59 4 0 36 ccacagt ccacagt 0.0000460112016 6 0.43 6e-06 9.8e-02 1.01 5 0 36 gcacgtg gcacgtg 0.0000354066235 5 0.33 2.5e-05 4.0e-01 0.39 6 0 30 cacagtt cacagtt 0.0000652319994 6 0.61 4.2e-05 6.8e-01 0.17 7 0 36 ; Host name rsat ; Job started 2026-04-21.095626 ; Job done 2026-04-21.095627 ; Seconds 0.77 ; user 0.77 ; system 0.02 ; cuser 0.1 ; csystem 0.02