; oligo-analysis  -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/02/tmp_sequence_2026-05-02.224300_aU9YyQ.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return occ,proba,rank -1str -noov -quick_if_possible -seqtype dna -bg upstream-noorf -org Homo_sapiens_GRCh38 -pseudo 0.01 -l 5 -o $RSAT/public_html/tmp/www-data/2026/05/02/oligo-analysis_2026-05-02.224300_t2l33k_5nt.tab
; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42. 
; Program version              	1.169
; Quick counting mode          
; Detection of over-represented words (right-tail test)
; Oligomer length              	5
; Input file                   	$RSAT/public_html/tmp/www-data/2026/05/02/tmp_sequence_2026-05-02.224300_aU9YyQ.fasta.purged
; Input format                 	fasta
; Output file                  	$RSAT/public_html/tmp/www-data/2026/05/02/oligo-analysis_2026-05-02.224300_t2l33k_5nt.tab
; Discard overlapping matches
; Counted on a single strand
; Background model             	upstream-noorf
; Organism                     	Homo_sapiens_GRCh38
; Background estimation method 	Frequency file
; Expected frequency file      	$RSAT/public_html/data/genomes/Homo_sapiens_GRCh38/oligo-frequencies/5nt_upstream-noorf_Homo_sapiens_GRCh38-noov-1str.freq
; Pseudo-frequency             	0.01
; Pseudo-frequency per oligo   	9.765625e-06
; Sequence type                	DNA
; Nb of sequences              	3205
; Sum of sequence lengths      	99355
; discarded residues           	NA (quick mode)	 (other letters than ACGT)
; discarded occurrences        	NA (quick mode)	 (contain discarded residues)
; nb possible positions        	NA (quick mode)
; total oligo occurrences      	86535
; total overlapping occurrences	1267
; total non overlapping occ    	85268
; alphabet size                	4
; nb possible oligomers        	1024
; oligomers tested for significance	1024
;
; column headers
;	1	seq            	oligomer sequence
;	2	id             	oligomer identifier
;	3	exp_freq       	expected relative frequency
;	4	occ            	observed occurrences
;	5	exp_occ        	expected occurrences
;	6	occ_P          	occurrence probability (binomial)
;	7	occ_E          	E-value for occurrences (binomial)
;	8	occ_sig        	occurrence significance (binomial)
;	9	rank           	rank
;	10	ovl_occ        	number of overlapping occurrences (discarded from the count)
;	11	forbocc        	forbidden positions (to avoid self-overlap)
#seq	id	exp_freq	occ	exp_occ	occ_P	occ_E	occ_sig	rank	ovl_occ	forbocc
ataaa	ataaa	0.0023470463624	1581	203.10	0	0e+00	350.00	1	63	6324
taaat	taaat	0.0018926656999	906	163.78	0	0e+00	350.00	2	70	3624
aataa	aataa	0.0021857950064	1488	189.15	0	0e+00	350.00	3	96	5952
taaaa	taaaa	0.0029603745843	1060	256.18	8e-309	8e-306	305.09	4	0	4240
aaata	aaata	0.0028562069859	1021	247.16	6e-297	6e-294	293.19	5	60	4084
aaaat	aaaat	0.0036170789746	1048	313.00	1e-234	1e-231	230.91	6	0	4192
aaatt	aaatt	0.0024144828054	738	208.94	8e-178	9e-175	174.07	7	0	2952
ttaaa	ttaaa	0.0023505812501	718	203.41	7e-173	7e-170	169.14	8	0	2872
taata	taata	0.0013318280412	519	115.25	1e-166	1e-163	162.88	9	8	2076
attaa	attaa	0.0015142095306	469	131.03	1e-115	2e-112	111.82	10	4	1876
taaag	taaag	0.0012743555180	387	110.28	2.7e-93	2.8e-90	89.55	11	0	1548
aaatg	aaatg	0.0021082362575	507	182.44	1.2e-86	1.2e-83	82.91	12	0	2028
tttaa	tttaa	0.0023042677412	535	199.40	3.9e-86	4.0e-83	82.40	13	0	2140
ttaat	ttaat	0.0014854984669	406	128.55	9.6e-85	9.8e-82	81.01	14	4	1624
taaac	taaac	0.0009661795406	317	83.61	1.7e-84	1.7e-81	80.77	15	0	1268
caata	caata	0.0009918596722	307	85.83	3.2e-76	3.3e-73	72.48	16	0	1228
tgttt	tgttt	0.0020296120028	433	175.63	2.7e-60	2.7e-57	56.56	17	5	1732
aaact	aaact	0.0015919482636	347	137.76	1.2e-50	1.3e-47	46.90	18	0	1388
ttatt	ttatt	0.0020888123734	414	180.76	5e-50	5.1e-47	46.29	19	22	1656
aaaaa	aaaaa	0.0034794199347	586	301.09	3.9e-48	4.0e-45	44.40	20	353	2344
aattt	aattt	0.0023726041047	445	205.31	1e-47	1.0e-44	43.99	21	0	1780
aatgt	aatgt	0.0014486665203	318	125.36	3.8e-47	3.9e-44	43.41	22	0	1272
ttgtt	ttgtt	0.0016087155825	338	139.21	3.9e-46	4.0e-43	42.40	23	11	1352
tttgt	tttgt	0.0020470488625	395	177.14	3.1e-45	3.1e-42	41.50	24	1	1580
tttta	tttta	0.0028347528810	480	245.31	2.6e-40	2.7e-37	36.57	25	0	1920
aatta	aatta	0.0017625875902	343	152.53	3.1e-40	3.2e-37	36.49	26	1	1372
tgtgt	tgtgt	0.0014337062418	293	124.07	3.5e-38	3.6e-35	34.44	27	39	1172
tgaat	tgaat	0.0013355789099	279	115.57	5.4e-38	5.5e-35	34.26	28	8	1116
aattg	aattg	0.0010813333686	242	93.57	1.4e-37	1.5e-34	33.83	29	0	968
aattc	aattc	0.0012225848911	261	105.80	4e-37	4.1e-34	33.39	30	0	1044
aatat	aatat	0.0018735441890	348	162.13	6.3e-37	6.4e-34	33.19	31	0	1392
tttat	tttat	0.0022276737071	393	192.77	7.5e-37	7.7e-34	33.11	32	3	1572
tcatt	tcatt	0.0015051383319	298	130.25	1.9e-36	1.9e-33	32.71	33	3	1192
attgt	attgt	0.0011040977577	239	95.54	5.2e-35	5.3e-32	31.28	34	0	956
gaata	gaata	0.0010536374151	230	91.18	2.8e-34	2.9e-31	30.53	35	0	920
ttgaa	ttgaa	0.0015634531807	295	135.29	1.1e-32	1.2e-29	28.93	36	0	1180
tatta	tatta	0.0013135848527	259	113.67	1.2e-31	1.2e-28	27.92	37	14	1036
attta	attta	0.0018621691937	330	161.14	1.5e-31	1.5e-28	27.83	38	5	1320
tattt	tattt	0.0027467838517	433	237.69	3.7e-30	3.8e-27	26.42	39	6	1732
ataat	ataat	0.0015299977360	282	132.40	9.2e-30	9.4e-27	26.03	40	5	1128
tcttt	tcttt	0.0021928503832	365	189.76	9.4e-30	9.6e-27	26.02	41	4	1460
aactt	aactt	0.0012102091844	239	104.73	1.9e-29	2.0e-26	25.71	42	0	956
tgaaa	tgaaa	0.0020457601764	344	177.03	6.9e-29	7.1e-26	25.15	43	0	1376
aaatc	aaatc	0.0013079189532	250	113.18	9.8e-29	1.0e-25	25.00	44	0	1000
ttctt	ttctt	0.0021429515910	354	185.44	2.4e-28	2.4e-25	24.61	45	12	1416
attct	attct	0.0016283770457	288	140.91	1.2e-27	1.2e-24	23.91	46	0	1152
atttg	atttg	0.0015030649151	269	130.07	1.2e-26	1.2e-23	22.92	47	0	1076
ttgta	ttgta	0.0012143200213	230	105.08	4.4e-26	4.6e-23	22.34	48	0	920
tttct	tttct	0.0026951572122	411	233.23	4.5e-26	4.6e-23	22.34	49	6	1644
atttt	atttt	0.0034755394774	498	300.76	1.4e-25	1.4e-22	21.84	50	0	1992
; Host name	rsat
; Job started	2026-05-02.224302
; Job done	2026-05-02.224302
; Seconds	0.24
;	user	0.24
;	system	0.03
;	cuser	0.11
;	csystem	0.01
