; oligo-analysis  -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/04/21/tmp_sequence_2026-04-21.135628_5pBXJv.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return occ,proba,rank -2str -noov -quick_if_possible -seqtype dna -bg upstream-noorf -org Saccharomyces_cerevisiae -pseudo 0.01 -l 8 -o $RSAT/public_html/tmp/www-data/2026/04/21/oligo-analysis_2026-04-21.135628_YlceDT_8nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42. 
; Program version              	1.169
; Quick counting mode          
; Detection of over-represented words (right-tail test)
; Oligomer length              	8
; Input file                   	$RSAT/public_html/tmp/www-data/2026/04/21/tmp_sequence_2026-04-21.135628_5pBXJv.fasta.purged
; Input format                 	fasta
; Output file                  	$RSAT/public_html/tmp/www-data/2026/04/21/oligo-analysis_2026-04-21.135628_YlceDT_8nt.tab
; Discard overlapping matches
; Counted on both strands
; 	grouped by pairs of reverse complements
; Background model             	upstream-noorf
; Organism                     	Saccharomyces_cerevisiae
; Background estimation method 	Frequency file
; Expected frequency file      	$RSAT/public_html/data/genomes/Saccharomyces_cerevisiae/oligo-frequencies/8nt_upstream-noorf_Saccharomyces_cerevisiae-noov-2str.freq
; Pseudo-frequency             	0.01
; Pseudo-frequency per oligo   	3.03988326848249e-07
; Sequence type                	DNA
; Nb of sequences              	19
; Sum of sequence lengths      	9485
; discarded residues           	NA (quick mode)	 (other letters than ACGT)
; discarded occurrences        	NA (quick mode)	 (contain discarded residues)
; nb possible positions        	NA (quick mode)
; total oligo occurrences      	9329
; total overlapping occurrences	107
; total non overlapping occ    	9222
; alphabet size                	4
; nb possible oligomers        	32896
; oligomers tested for significance	32896
; Sequences:
;	MET8	463
;	MET32	547
;	MET18	568
;	MET30	177
;	MET28	489
;	MET6	687
;	MET10	338
;	MET13	380
;	MET3	800
;	MET14	800
;	MET1	702
;	MET17	800
;	MET2	481
;	MET4	800
;	MET22	215
;	MET7	250
;	MET31	161
;	MET12	384
;	MET16	443
;
; column headers
;	1	seq            	oligomer sequence
;	2	id             	oligomer identifier
;	3	exp_freq       	expected relative frequency
;	4	occ            	observed occurrences
;	5	exp_occ        	expected occurrences
;	6	occ_P          	occurrence probability (binomial)
;	7	occ_E          	E-value for occurrences (binomial)
;	8	occ_sig        	occurrence significance (binomial)
;	9	rank           	rank
;	10	ovl_occ        	number of overlapping occurrences (discarded from the count)
;	11	forbocc        	forbidden positions (to avoid self-overlap)
#seq	id	exp_freq	occ	exp_occ	occ_P	occ_E	occ_sig	rank	ovl_occ	forbocc
aactgtgg	aactgtgg|ccacagtt	0.0000334807653	8	0.31	1.7e-09	5.6e-05	4.25	1	0	56
gcacgtga	gcacgtga|tcacgtgc	0.0000397843529	7	0.37	1.4e-07	4.6e-03	2.34	2	0	49
cacgtgac	cacgtgac|gtcacgtg	0.0000434337984	7	0.41	2.5e-07	8.2e-03	2.09	3	1	49
cacgtgaa	cacgtgaa|ttcacgtg	0.0000308266231	6	0.29	6.1e-07	2.0e-02	1.70	4	0	42
aaactgtg	aaactgtg|cacagttt	0.0000557092058	7	0.52	1.3e-06	4.2e-02	1.37	5	0	49
actgtggc	actgtggc|gccacagt	0.0000251865710	5	0.23	4.9e-06	1.6e-01	0.79	6	0	35
atcacgtg	atcacgtg|cacgtgat	0.0000464197083	6	0.43	6.3e-06	2.1e-01	0.68	7	0	42
aagccaca	aagccaca|tgtggctt	0.0000321536941	5	0.30	1.6e-05	5.2e-01	0.29	8	0	35
; Host name	rsat
; Job started	2026-04-21.135630
; Job done	2026-04-21.135633
; Seconds	2.74
;	user	2.74
;	system	0.07
;	cuser	0.15
;	csystem	0.03
