; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 6 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_6nt.tab ; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42. ; Program version 1.169 ; Slow counting mode ; Detection of over-represented words (right-tail test) ; Oligomer length 6 ; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged ; Input format fasta ; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_6nt.tab ; Discard overlapping matches ; Counted on a single strand ; Background model Markov ; Background estimation method Markov model estimated from input sequences ; Markov chain order 2 ; Pseudo-frequency 0.01 ; Pseudo-frequency per oligo 2.44140625e-06 ; Sequence type DNA ; Nb of sequences 500 ; Sum of sequence lengths 189796 ; discarded residues 535 (other letters than ACGT) ; discarded occurrences 535 (contain discarded residues) ; nb possible positions 186761 ; total oligo occurrences 186761 ; total overlapping occurrences 1034 ; total non overlapping occ 185727 ; alphabet size 4 ; nb possible oligomers 4096 ; oligomers tested for significance 4096 ; ; column headers ; 1 seq oligomer sequence ; 2 id oligomer identifier ; 3 obs_freq observed relative frequency ; 4 exp_freq expected relative frequency ; 5 occ observed occurrences ; 6 exp_occ expected occurrences ; 7 occ_P occurrence probability (binomial) ; 8 occ_E E-value for occurrences (binomial) ; 9 occ_sig occurrence significance (binomial) ; 10 rank rank ; 11 ovl_occ number of overlapping occurrences (discarded from the count) ; 12 forbocc forbidden positions (to avoid self-overlap) ; 13 zscore z-score (Gaussian approximation) ; 14 exp_var estimation of the variance on occurrences ; 15 ratio observed/expected ratio ; 16 ms number of matching sequences ; 17 exp_ms expected number of matching sequences ; 18 ms_P matching sequence probability (binomial) ; 19 ms_E E-value for matching sequences (binomial) ; 20 ms_sig matching sequenc significance (binomial) ; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence) ; 22 exp_msf expected proportion matching sequences ; 23 ms_rati observed/expected numbers of matching sequences #seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati tgatga tgatga 0.0005515070063 0.0002701109552 103 50.45 5.9e-11 2.4e-07 6.62 1 7 510 7.40 50.446 2.0418 83 47.99 7.1e-07 0.0029 2.5 0.16600 0.09598 1.72949 tctttt tctttt 0.0012957737429 0.0008617198419 242 160.94 1.6e-09 6.5e-06 5.19 2 3 1203 6.39 160.936 1.5037 174 137.65 0.00022 0.91 0.0 0.34800 0.27531 1.26403 atgatg atgatg 0.0004926081998 0.0002477585921 92 46.27 2e-09 8.4e-06 5.08 3 5 450 6.72 46.272 1.9883 78 44.20 7.6e-07 0.0031 2.5 0.15600 0.08840 1.76469 ggtggt ggtggt 0.0003694561498 0.0001668323904 69 31.16 3.5e-09 1.4e-05 4.85 4 4 337 6.78 31.158 2.2145 58 30.21 2e-06 0.0081 2.1 0.11600 0.06042 1.91994 ttcttc ttcttc 0.0008567099127 0.0005261929040 160 98.27 6.8e-09 2.8e-05 4.55 5 11 792 6.23 98.272 1.6281 133 89.24 7.9e-07 0.0032 2.5 0.26600 0.17848 1.49038 aacagc aacagc 0.0004926081998 0.0002633125370 92 49.18 3.2e-08 1.3e-04 3.88 6 0 455 6.11 49.177 1.8708 74 46.84 6.5e-05 0.26 0.6 0.14800 0.09368 1.57980 cgatga cgatga 0.0003212662173 0.0001475721071 60 27.56 6.1e-08 2.5e-04 3.60 7 0 293 6.18 27.561 2.1770 55 26.82 5.3e-07 0.0022 2.7 0.11000 0.05363 2.05095 gaggaa gaggaa 0.0005300892585 0.0003071534815 99 57.36 3.8e-07 1.6e-03 2.80 8 0 488 5.50 57.364 1.7258 86 54.20 1.3e-05 0.052 1.3 0.17200 0.10841 1.58660 tatata tatata 0.0008245832909 0.0005517069312 154 103.04 1.7e-06 6.9e-03 2.16 9 37 761 5.02 103.037 1.4946 127 93.14 0.00011 0.46 0.3 0.25400 0.18627 1.36358 aagaaa aagaaa 0.0017455464471 0.0013354485904 326 249.41 2e-06 8.1e-03 2.09 10 9 1606 4.85 249.410 1.3071 218 196.48 0.02761 1.1e+02 -2.1 0.43600 0.39296 1.10954 aagagg aagagg 0.0005675703171 0.0003556591240 106 66.42 4.7e-06 1.9e-02 1.72 11 0 520 4.86 66.423 1.5958 94 62.21 3.1e-05 0.13 0.9 0.18800 0.12442 1.51100 agtaat agtaat 0.0004872537628 0.0002935297331 91 54.82 4.9e-06 2.0e-02 1.70 12 0 453 4.89 54.820 1.6600 81 51.93 4.3e-05 0.17 0.8 0.16200 0.10386 1.55983 ccattg ccattg 0.0004283549563 0.0002489761191 80 46.50 5.1e-06 2.1e-02 1.68 13 0 400 4.91 46.499 1.7205 70 44.41 0.00011 0.46 0.3 0.14000 0.08882 1.57631 atagca atagca 0.0004551271411 0.0002705082381 85 50.52 6e-06 2.5e-02 1.61 14 0 425 4.85 50.520 1.6825 78 48.06 1.6e-05 0.065 1.2 0.15600 0.09612 1.62304 tcttct tcttct 0.0006853679301 0.0004521104632 128 84.44 6.1e-06 2.5e-02 1.60 15 12 632 4.74 84.437 1.5159 107 77.71 0.00032 1.3 -0.1 0.21400 0.15542 1.37695 cctcca cctcca 0.0003480384020 0.0001907917490 65 35.63 6.4e-06 2.6e-02 1.58 16 0 321 4.92 35.632 1.8242 60 34.40 2.3e-05 0.096 1.0 0.12000 0.06879 1.74441 gctgct gctgct 0.0003212662173 0.0001717554616 60 32.08 6.9e-06 2.8e-02 1.55 17 3 300 4.93 32.077 1.8705 52 31.07 0.00023 0.95 0.0 0.10400 0.06215 1.67350 caacaa caacaa 0.0007763933584 0.0005323933804 145 99.43 1.1e-05 4.4e-02 1.35 18 8 712 4.57 99.430 1.4583 109 90.19 0.01831 75 -1.9 0.21800 0.18038 1.20856 tttctt tttctt 0.0011726216930 0.0008668206853 219 161.89 1.1e-05 4.7e-02 1.33 19 5 1084 4.49 161.888 1.3528 163 138.34 0.00860 35 -1.5 0.32600 0.27669 1.17822 gtggtg gtggtg 0.0002944940325 0.0001564914219 55 29.23 1.4e-05 5.6e-02 1.25 20 4 269 4.77 29.226 1.8819 51 28.39 4.8e-05 0.2 0.7 0.10200 0.05678 1.79635 ctgctg ctgctg 0.0003052029064 0.0001642528362 57 30.68 1.4e-05 5.6e-02 1.25 21 3 281 4.75 30.676 1.8581 53 29.76 4.3e-05 0.17 0.8 0.10600 0.05951 1.78113 gatgat gatgat 0.0004176460824 0.0002489560401 78 46.50 1.5e-05 6.3e-02 1.20 22 4 379 4.62 46.495 1.6776 67 44.40 0.00052 2.1 -0.3 0.13400 0.08881 1.50887 taagga taagga 0.0005140259476 0.0003250316287 96 60.70 1.8e-05 7.2e-02 1.14 23 0 477 4.53 60.703 1.5815 85 57.17 0.00014 0.57 0.2 0.17000 0.11434 1.48675 tgctgc tgctgc 0.0003159117803 0.0001750017899 59 32.68 2.2e-05 9.0e-02 1.05 24 2 295 4.60 32.684 1.8052 50 31.64 0.00107 4.4 -0.6 0.10000 0.06328 1.58023 tactac tactac 0.0003748105868 0.0002208480872 70 41.25 2.8e-05 1.2e-01 0.94 25 1 341 4.48 41.246 1.6971 65 39.59 6.4e-05 0.26 0.6 0.13000 0.07919 1.64164 cgctag cgctag 0.0001927597304 0.0000897110556 36 16.75 3e-05 1.2e-01 0.91 26 0 175 4.70 16.755 2.1487 32 16.48 0.00035 1.4 -0.2 0.06400 0.03296 1.94202 cttctt cttctt 0.0007067856780 0.0004878265292 132 91.11 3.4e-05 1.4e-01 0.86 27 7 660 4.28 91.107 1.4488 107 83.31 0.00342 14 -1.1 0.21400 0.16661 1.28441 attgac attgac 0.0004337093933 0.0002682945492 81 50.11 3.7e-05 1.5e-01 0.82 28 0 400 4.36 50.107 1.6165 72 47.68 0.00031 1.3 -0.1 0.14400 0.09537 1.50994 cattga cattga 0.0005086715106 0.0003278487935 95 61.23 3.8e-05 1.6e-01 0.80 29 0 475 4.32 61.229 1.5515 85 57.64 0.00018 0.74 0.1 0.17000 0.11528 1.47473 cccttc cccttc 0.0002837851586 0.0001551713189 53 28.98 4e-05 1.6e-01 0.79 30 0 261 4.46 28.980 1.8289 46 28.16 0.00088 3.6 -0.6 0.09200 0.05632 1.63363 gatgaa gatgaa 0.0005675703171 0.0003768434894 106 70.38 4.5e-05 1.9e-01 0.73 31 0 524 4.25 70.380 1.5061 82 65.66 0.02029 83 -1.9 0.16400 0.13132 1.24881 gatgac gatgac 0.0002944940325 0.0001646556990 55 30.75 5.1e-05 2.1e-01 0.68 32 0 270 4.37 30.751 1.7885 52 29.83 8.6e-05 0.35 0.5 0.10400 0.05965 1.74338 agaaga agaaga 0.0010441152061 0.0007788837352 195 145.47 5.2e-05 2.1e-01 0.67 33 9 968 4.11 145.465 1.3405 148 126.26 0.01549 63 -1.8 0.29600 0.25252 1.17220 gcgatg gcgatg 0.0001874052934 0.0000896745934 35 16.75 6.5e-05 2.7e-01 0.57 34 1 172 4.46 16.748 2.0898 33 16.47 0.00016 0.67 0.2 0.06600 0.03294 2.00351 ttcttt ttcttt 0.0011404950712 0.0008668206853 213 161.89 7e-05 2.9e-01 0.54 35 5 1049 4.02 161.888 1.3157 164 138.34 0.00659 27 -1.4 0.32800 0.27669 1.18544 tgttga tgttga 0.0004711904520 0.0003040362374 88 56.78 7.4e-05 3.0e-01 0.52 36 0 440 4.14 56.782 1.5498 78 53.68 0.00054 2.2 -0.3 0.15600 0.10737 1.45294 caagaa caagaa 0.0010548240800 0.0007946874286 197 148.42 8.1e-05 3.3e-01 0.48 37 0 979 3.99 148.417 1.3273 154 128.46 0.00584 24 -1.4 0.30800 0.25692 1.19882 tatcga tatcga 0.0003641017129 0.0002212341474 68 41.32 8.8e-05 3.6e-01 0.45 38 0 340 4.15 41.318 1.6458 63 39.66 0.00021 0.85 0.1 0.12600 0.07932 1.58846 aaggaa aaggaa 0.0008727732235 0.0006430398440 163 120.09 0.00011 4.7e-01 0.33 39 2 805 3.92 120.095 1.3573 130 106.79 0.00755 31 -1.5 0.26000 0.21358 1.21733 acagca acagca 0.0004069372085 0.0002569076954 76 47.98 0.00011 4.7e-01 0.33 40 0 375 4.05 47.980 1.5840 64 45.76 0.00422 17 -1.2 0.12800 0.09151 1.39873 agcagc agcagc 0.0002837851586 0.0001624151046 53 30.33 0.00012 5.0e-01 0.30 41 5 265 4.12 30.333 1.7473 48 29.43 0.00070 2.9 -0.5 0.09600 0.05887 1.63080 tagtaa tagtaa 0.0004015827716 0.0002532261638 75 47.29 0.00012 5.0e-01 0.30 42 0 375 4.03 47.293 1.5859 72 45.13 6.1e-05 0.25 0.6 0.14400 0.09026 1.59537 aacaat aacaat 0.0007924566692 0.0005764028353 148 107.65 0.00013 5.4e-01 0.27 43 0 735 3.89 107.650 1.3748 126 96.87 0.00084 3.4 -0.5 0.25200 0.19375 1.30065 atcatc atcatc 0.0004176460824 0.0002669342911 78 49.85 0.00014 5.6e-01 0.25 44 6 388 3.99 49.853 1.5646 67 47.45 0.00275 11 -1.1 0.13400 0.09491 1.41189 atataa atataa 0.0008406466018 0.0006190122688 157 115.61 0.00015 6.0e-01 0.22 45 1 780 3.85 115.607 1.3580 133 103.24 0.00084 3.4 -0.5 0.26600 0.20649 1.28821 ctgcta ctgcta 0.0003266206542 0.0001964275566 61 36.69 0.00015 6.1e-01 0.22 46 0 305 4.01 36.685 1.6628 52 35.37 0.00380 16 -1.2 0.10400 0.07075 1.46997 ataatg ataatg 0.0004926081998 0.0003287409216 92 61.40 0.00016 6.5e-01 0.18 47 0 458 3.91 61.396 1.4985 79 57.79 0.00269 11 -1.0 0.15800 0.11557 1.36713 ggcgta ggcgta 0.0001766964195 0.0000882115951 33 16.47 0.00022 8.9e-01 0.05 48 0 165 4.07 16.474 2.0031 32 16.21 0.00026 1.1 -0.0 0.06400 0.03241 1.97449 ctacca ctacca 0.0003587472759 0.0002253923408 67 42.09 0.00024 9.9e-01 0.00 49 0 327 3.84 42.094 1.5917 58 40.38 0.00371 15 -1.2 0.11600 0.08075 1.43651 ; Host name rsat ; Job started 2026-05-11.133715 ; Job done 2026-05-11.133715 ; Seconds 0.92 ; user 0.92 ; system 0.02 ; cuser 0 ; csystem 0 ; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 7 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_7nt.tab ; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42. ; Program version 1.169 ; Slow counting mode ; Detection of over-represented words (right-tail test) ; Oligomer length 7 ; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged ; Input format fasta ; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_7nt.tab ; Discard overlapping matches ; Counted on a single strand ; Background model Markov ; Background estimation method Markov model estimated from input sequences ; Markov chain order 2 ; Pseudo-frequency 0.01 ; Pseudo-frequency per oligo 6.103515625e-07 ; Sequence type DNA ; Nb of sequences 500 ; Sum of sequence lengths 189796 ; discarded residues 535 (other letters than ACGT) ; discarded occurrences 535 (contain discarded residues) ; nb possible positions 186261 ; total oligo occurrences 186261 ; total overlapping occurrences 627 ; total non overlapping occ 185634 ; alphabet size 4 ; nb possible oligomers 16384 ; oligomers tested for significance 16203 ; ; column headers ; 1 seq oligomer sequence ; 2 id oligomer identifier ; 3 obs_freq observed relative frequency ; 4 exp_freq expected relative frequency ; 5 occ observed occurrences ; 6 exp_occ expected occurrences ; 7 occ_P occurrence probability (binomial) ; 8 occ_E E-value for occurrences (binomial) ; 9 occ_sig occurrence significance (binomial) ; 10 rank rank ; 11 ovl_occ number of overlapping occurrences (discarded from the count) ; 12 forbocc forbidden positions (to avoid self-overlap) ; 13 zscore z-score (Gaussian approximation) ; 14 exp_var estimation of the variance on occurrences ; 15 ratio observed/expected ratio ; 16 ms number of matching sequences ; 17 exp_ms expected number of matching sequences ; 18 ms_P matching sequence probability (binomial) ; 19 ms_E E-value for matching sequences (binomial) ; 20 ms_sig matching sequenc significance (binomial) ; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence) ; 22 exp_msf expected proportion matching sequences ; 23 ms_rati observed/expected numbers of matching sequences #seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati gatgatg gatgatg 0.0001932771756 0.0000492060911 36 9.17 1.6e-11 2.6e-07 6.58 1 2 210 8.86 9.165 3.9279 34 9.08 1e-10 1.7e-06 5.8 0.06800 0.01816 3.74371 caacaac caacaac 0.0002630717112 0.0000929633159 49 17.32 3.6e-10 5.9e-06 5.23 2 5 294 7.61 17.315 2.8298 37 17.02 1.2e-05 0.2 0.7 0.07400 0.03404 2.17394 cttcttc cttcttc 0.0002791781425 0.0001076085579 52 20.04 2e-09 3.2e-05 4.50 3 6 312 7.14 20.043 2.5944 48 19.65 2e-08 0.00033 3.5 0.09600 0.03930 2.44301 tatataa tatataa 0.0003704479199 0.0001674831130 69 31.20 3.6e-09 5.9e-05 4.23 4 0 408 6.77 31.196 2.2119 65 30.24 7.7e-09 0.00013 3.9 0.13000 0.06049 2.14913 atgatga atgatga 0.0002040147964 0.0000746637879 38 13.91 7.5e-08 1.2e-03 2.92 5 1 223 6.46 13.907 2.7324 35 13.72 6.8e-07 0.011 2.0 0.07000 0.02743 2.55180 ggtggtg ggtggtg 0.0001234826400 0.0000354721005 23 6.61 5.2e-07 8.4e-03 2.07 6 3 134 6.38 6.607 3.4811 22 6.56 1.3e-06 0.021 1.7 0.04400 0.01313 3.35176 cggtggt cggtggt 0.0001020073982 0.0000263872537 19 4.91 1.1e-06 1.8e-02 1.75 7 0 111 6.35 4.915 3.8658 19 4.89 8.4e-07 0.014 1.9 0.03800 0.00978 3.88476 ttctttt ttctttt 0.0005261434224 0.0003150761754 98 58.69 1.7e-06 2.8e-02 1.56 8 2 578 5.13 58.686 1.6699 84 55.38 7.9e-05 1.3 -0.1 0.16800 0.11076 1.51675 cgatgac cgatgac 0.0000966385878 0.0000249729469 18 4.65 2e-06 3.3e-02 1.48 9 0 101 6.19 4.651 3.8697 16 4.63 2.5e-05 0.41 0.4 0.03200 0.00926 3.45574 aatagca aatagca 0.0002040147964 0.0000865060676 38 16.11 2.4e-06 3.9e-02 1.41 10 0 228 5.45 16.113 2.3584 34 15.86 3.6e-05 0.59 0.2 0.06800 0.03171 2.14423 tgatgaa tgatgaa 0.0002308588486 0.0001043183771 43 19.43 2.7e-06 4.4e-02 1.36 11 0 249 5.35 19.430 2.2130 35 19.06 0.00051 8.4 -0.9 0.07000 0.03812 1.83643 tgctgct tgctgct 0.0001503266921 0.0000550075187 28 10.25 3.5e-06 5.7e-02 1.24 12 2 168 5.55 10.246 2.7328 24 10.14 0.00012 2 -0.3 0.04800 0.02028 2.36645 ttcttct ttcttct 0.0003167598155 0.0001651734833 59 30.77 4e-06 6.4e-02 1.19 13 5 343 5.09 30.765 1.9177 56 29.84 5.9e-06 0.097 1.0 0.11200 0.05968 1.87665 ttatttt ttatttt 0.0004670865076 0.0002767138498 87 51.54 4.2e-06 6.8e-02 1.17 14 1 510 4.94 51.541 1.6880 78 48.98 3e-05 0.5 0.3 0.15600 0.09796 1.59249 gctgctg gctgctg 0.0001127450191 0.0000348254703 21 6.49 4.7e-06 7.7e-02 1.12 15 1 126 5.70 6.487 3.2374 20 6.44 1.2e-05 0.2 0.7 0.04000 0.01289 3.10326 tgatgat tgatgat 0.0001718019338 0.0000688940153 32 12.83 4.8e-06 7.8e-02 1.11 16 3 188 5.35 12.832 2.4937 32 12.67 2.6e-06 0.042 1.4 0.06400 0.02534 2.52576 ttttctt ttttctt 0.0005154058015 0.0003150761754 96 58.69 4.9e-06 7.9e-02 1.10 17 3 572 4.87 58.686 1.6358 83 55.38 0.00013 2.1 -0.3 0.16600 0.11076 1.49870 gacgaag gacgaag 0.0001395890712 0.0000501000811 26 9.33 5.5e-06 8.9e-02 1.05 18 0 152 5.46 9.332 2.7862 22 9.25 0.00021 3.5 -0.5 0.04400 0.01849 2.37957 ggtggta ggtggta 0.0001288514504 0.0000444714563 24 8.28 6.6e-06 1.1e-01 0.97 19 0 134 5.46 8.283 2.8974 22 8.22 4.1e-05 0.67 0.2 0.04400 0.01643 2.67795 ctctttt ctctttt 0.0003274974364 0.0001761807886 61 32.82 7e-06 1.1e-01 0.95 20 0 366 4.92 32.816 1.8589 52 31.76 0.00039 6.3 -0.8 0.10400 0.06353 1.63704 aagagga aagagga 0.0002415964695 0.0001172060601 45 21.83 9.4e-06 1.5e-01 0.82 21 0 267 4.96 21.831 2.0613 42 21.36 3.3e-05 0.54 0.3 0.08400 0.04272 1.96607 tcttttt tcttttt 0.0005046681807 0.0003132204611 94 58.34 1.1e-05 1.7e-01 0.76 22 0 561 4.67 58.341 1.6112 77 55.07 0.00170 28 -1.4 0.15400 0.11015 1.39812 aacagca aacagca 0.0001932771756 0.0000877165863 36 16.34 1.8e-05 2.9e-01 0.54 23 0 214 4.86 16.338 2.2034 27 16.07 0.00697 1.1e+02 -2.1 0.05400 0.03215 1.67965 caacagc caacagc 0.0001449578817 0.0000571368992 27 10.64 1.9e-05 3.0e-01 0.52 24 0 162 5.01 10.642 2.5370 20 10.53 0.00545 89 -2.0 0.04000 0.02106 1.89930 actacca actacca 0.0001556955025 0.0000638025961 29 11.88 1.9e-05 3.1e-01 0.51 25 0 170 4.97 11.884 2.4403 25 11.74 0.00043 7 -0.8 0.05000 0.02349 2.12871 caatggc caatggc 0.0001395890712 0.0000541116911 26 10.08 2e-05 3.3e-01 0.49 26 0 156 5.01 10.079 2.5796 24 9.98 9.6e-05 1.6 -0.2 0.04800 0.01996 2.40523 gcgatga gcgatga 0.0000912697774 0.0000269477783 17 5.02 2.1e-05 3.4e-01 0.47 27 0 97 5.35 5.019 3.3869 17 4.99 1.7e-05 0.28 0.6 0.03400 0.00999 3.40390 ccattga ccattga 0.0001718019338 0.0000750313205 32 13.98 2.5e-05 4.0e-01 0.40 28 0 192 4.82 13.975 2.2897 29 13.78 0.00018 3 -0.5 0.05800 0.02756 2.10413 gataatg gataatg 0.0001556955025 0.0000652511929 29 12.15 2.8e-05 4.6e-01 0.34 29 2 174 4.83 12.154 2.3861 27 12.01 0.00011 1.8 -0.2 0.05400 0.02402 2.24857 tcctcca tcctcca 0.0001503266921 0.0000619635882 28 11.54 2.9e-05 4.7e-01 0.33 30 0 168 4.84 11.541 2.4260 26 11.41 0.00012 1.9 -0.3 0.05200 0.02282 2.27879 gacgatg gacgatg 0.0000912697774 0.0000289230115 17 5.39 4.9e-05 8.0e-01 0.10 31 0 102 5.00 5.387 3.1556 17 5.36 4.1e-05 0.67 0.2 0.03400 0.01072 3.17260 atatata atatata 0.0003113910051 0.0001780106025 58 33.16 5.9e-05 9.5e-01 0.02 32 21 342 4.31 33.156 1.7493 53 32.08 0.00027 4.5 -0.7 0.10600 0.06417 1.65193 gaggaaa gaggaaa 0.0002201212277 0.0001116895045 41 20.80 5.9e-05 9.6e-01 0.02 33 0 240 4.43 20.803 1.9708 41 20.38 2.4e-05 0.4 0.4 0.08200 0.04076 2.01201 ; Host name rsat ; Job started 2026-05-11.133716 ; Job done 2026-05-11.133717 ; Seconds 1.51 ; user 1.51 ; system 0.03 ; cuser 0 ; csystem 0 ; oligo-analysis -v 1 -sort -i $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged -format fasta -lth occ_sig 0 -uth rank 50 -return freq,mseq,occ,proba,rank,ratio,zscore -1str -noov -quick_if_possible -seqtype dna -markov 2 -pseudo 0.01 -l 8 -o $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_8nt.tab ; Citation: van Helden et al. (1998). J Mol Biol 281(5), 827-42. ; Program version 1.169 ; Slow counting mode ; Detection of over-represented words (right-tail test) ; Oligomer length 8 ; Input file $RSAT/public_html/tmp/www-data/2026/05/11/tmp_sequence_2026-05-11.133714_wlQojt.fasta.purged ; Input format fasta ; Output file $RSAT/public_html/tmp/www-data/2026/05/11/oligo-analysis_2026-05-11.133714_p71v1p_8nt.tab ; Discard overlapping matches ; Counted on a single strand ; Background model Markov ; Background estimation method Markov model estimated from input sequences ; Markov chain order 2 ; Pseudo-frequency 0.01 ; Pseudo-frequency per oligo 1.52587890625e-07 ; Sequence type DNA ; Nb of sequences 500 ; Sum of sequence lengths 189796 ; discarded residues 535 (other letters than ACGT) ; discarded occurrences 535 (contain discarded residues) ; nb possible positions 185761 ; total oligo occurrences 185761 ; total overlapping occurrences 372 ; total non overlapping occ 185389 ; alphabet size 4 ; nb possible oligomers 65536 ; oligomers tested for significance 54084 ; ; column headers ; 1 seq oligomer sequence ; 2 id oligomer identifier ; 3 obs_freq observed relative frequency ; 4 exp_freq expected relative frequency ; 5 occ observed occurrences ; 6 exp_occ expected occurrences ; 7 occ_P occurrence probability (binomial) ; 8 occ_E E-value for occurrences (binomial) ; 9 occ_sig occurrence significance (binomial) ; 10 rank rank ; 11 ovl_occ number of overlapping occurrences (discarded from the count) ; 12 forbocc forbidden positions (to avoid self-overlap) ; 13 zscore z-score (Gaussian approximation) ; 14 exp_var estimation of the variance on occurrences ; 15 ratio observed/expected ratio ; 16 ms number of matching sequences ; 17 exp_ms expected number of matching sequences ; 18 ms_P matching sequence probability (binomial) ; 19 ms_E E-value for matching sequences (binomial) ; 20 ms_sig matching sequenc significance (binomial) ; 21 ms_freq proportion of matching sequences (sequences with at least one occurrence) ; 22 exp_msf expected proportion matching sequences ; 23 ms_rati observed/expected numbers of matching sequences #seq id obs_freq exp_freq occ exp_occ occ_P occ_E occ_sig rank ovl_occ forbocc zscore exp_var ratio ms exp_ms ms_P ms_E ms_sig ms_freq exp_msf ms_rati gatgatga gatgatga 0.0000915154419 0.0000148233009 17 2.75 6.3e-09 3.4e-04 3.46 1 0 116 8.59 2.754 6.1738 17 2.75 5e-09 0.00033 3.5 0.03400 0.00549 6.19073 caacaaca caacaaca 0.0001238150096 0.0000318511213 23 5.92 7.9e-08 4.3e-03 2.37 2 2 161 7.02 5.917 3.8873 16 5.88 0.00037 25 -1.4 0.03200 0.01176 2.72020 aagaggaa aagaggaa 0.0001507313160 0.0000453251708 28 8.42 8.2e-08 4.4e-03 2.35 3 0 191 6.75 8.420 3.3256 27 8.35 1.7e-07 0.011 2.0 0.05400 0.01670 3.23379 tcttcttc tcttcttc 0.0001238150096 0.0000345025517 23 6.41 3.1e-07 1.7e-02 1.77 4 5 161 6.55 6.409 3.5886 20 6.37 1e-05 0.66 0.2 0.04000 0.01274 3.14049 ctcttttt ctcttttt 0.0001776476225 0.0000640316740 33 11.89 3.7e-07 2.0e-02 1.70 5 0 231 6.12 11.895 2.7744 31 11.75 1.5e-06 0.1 1.0 0.06200 0.02351 2.63727 tctttttt tctttttt 0.0002583965418 0.0001138818246 48 21.15 3.8e-07 2.0e-02 1.69 6 1 336 5.84 21.155 2.2690 44 20.71 3.2e-06 0.21 0.7 0.08800 0.04143 2.12410 tgatgatg tgatgatg 0.0000753656580 0.0000136156508 14 2.53 4.8e-07 2.6e-02 1.58 7 1 98 7.21 2.529 5.5352 14 2.52 4.1e-07 0.027 1.6 0.02800 0.00505 5.54920 tggtggtg tggtggtg 0.0000699823967 0.0000123645680 13 2.30 9.5e-07 5.2e-02 1.29 8 1 91 7.06 2.297 5.6599 13 2.29 8.4e-07 0.055 1.3 0.02600 0.00458 5.67289 cagcaaca cagcaaca 0.0000861321806 0.0000190270977 16 3.53 1e-06 5.6e-02 1.25 9 0 112 6.63 3.534 4.5268 12 3.52 0.00029 19 -1.3 0.02400 0.00704 3.40709 tttttttc tttttttc 0.0002853128482 0.0001392337974 53 25.86 1.9e-06 1.0e-01 0.98 10 0 371 5.34 25.864 2.0492 46 25.21 8e-05 5.3 -0.7 0.09200 0.05042 1.82479 tatatata tatatata 0.0001399647935 0.0000481653494 26 8.95 2.7e-06 1.4e-01 0.84 11 15 175 5.70 8.947 2.9059 25 8.87 5.2e-06 0.34 0.5 0.05000 0.01774 2.81916 tatataaa tatataaa 0.0001614978386 0.0000609840629 30 11.33 3e-06 1.6e-01 0.79 12 0 210 5.55 11.328 2.6482 29 11.20 4.8e-06 0.31 0.5 0.05800 0.02240 2.58896 ttatataa ttatataa 0.0001399647935 0.0000494952916 26 9.19 4.3e-06 2.3e-01 0.64 13 0 182 5.54 9.194 2.8278 25 9.11 8.2e-06 0.54 0.3 0.05000 0.01822 2.74409 atataata atataata 0.0001238150096 0.0000411332783 23 7.64 5.5e-06 3.0e-01 0.52 14 0 161 5.56 7.641 3.0101 23 7.58 3.9e-06 0.26 0.6 0.04600 0.01517 3.03309 acaacaac acaacaac 0.0000968987032 0.0000273606836 18 5.08 6.7e-06 3.6e-01 0.44 15 2 125 5.73 5.083 3.5415 17 5.06 2e-05 1.3 -0.1 0.03400 0.01011 3.36176 ataataac ataataac 0.0000915154419 0.0000249726014 17 4.64 7.8e-06 4.2e-01 0.38 16 0 119 5.74 4.639 3.6646 16 4.62 2.4e-05 1.6 -0.2 0.03200 0.00924 3.46505 cggtggta cggtggta 0.0000484493516 0.0000070301147 9 1.31 9.5e-06 5.1e-01 0.29 17 0 63 6.73 1.306 6.8917 9 1.30 8.9e-06 0.58 0.2 0.01800 0.00261 6.90067 gaagagga gaagagga 0.0000915154419 0.0000258409092 17 4.80 1.2e-05 6.5e-01 0.19 18 0 119 5.57 4.800 3.5415 16 4.78 3.6e-05 2.4 -0.4 0.03200 0.00955 3.34915 ttcctcga ttcctcga 0.0000645991354 0.0000134051627 12 2.49 1.2e-05 6.6e-01 0.18 19 0 84 6.03 2.490 4.8190 12 2.48 1.1e-05 0.71 0.1 0.02400 0.00497 4.83095 atgatgaa atgatgaa 0.0000968987032 0.0000288430520 18 5.36 1.3e-05 7.3e-01 0.14 20 0 122 5.46 5.358 3.3595 18 5.33 1.1e-05 0.71 0.2 0.03600 0.01066 3.37750 ttgatgat ttgatgat 0.0000861321806 0.0000234494097 16 4.36 1.4e-05 7.4e-01 0.13 21 0 112 5.58 4.356 3.6731 16 4.34 1.1e-05 0.75 0.1 0.03200 0.00867 3.68909 aaaaaaat aaaaaaat 0.0003122291547 0.0001692452639 58 31.44 1.4e-05 7.6e-01 0.12 22 0 403 4.74 31.439 1.8448 53 30.47 7.8e-05 5.1 -0.7 0.10600 0.06095 1.73921 gaagacga gaagacga 0.0000753656580 0.0000185419554 14 3.44 1.6e-05 8.5e-01 0.07 23 1 98 5.69 3.444 4.0646 13 3.43 5.8e-05 3.8 -0.6 0.02600 0.00687 3.78725 gaaaaaaa gaaaaaaa 0.0002960793708 0.0001588864333 55 29.51 1.8e-05 9.5e-01 0.02 24 0 378 4.69 29.515 1.8635 51 28.66 6.1e-05 4 -0.6 0.10200 0.05733 1.77931 aaaaaatg aaaaaatg 0.0001991806676 0.0000915928355 37 17.01 1.8e-05 9.9e-01 0.00 25 0 256 4.85 17.014 2.1746 36 16.73 2e-05 1.3 -0.1 0.07200 0.03346 2.15196 ; Host name rsat ; Job started 2026-05-11.133717 ; Job done 2026-05-11.133721 ; Seconds 4.25 ; user 4.25 ; system 0.1 ; cuser 0 ; csystem 0