Upload folder using huggingface_hub
Browse files- tokenizer/merges.txt +1006 -0
- tokenizer/special_tokens_map.json +5 -0
- tokenizer/tokenizer.json +2078 -0
- tokenizer/tokenizer_config.json +18 -0
- tokenizer/vocab.json +1 -0
tokenizer/merges.txt
ADDED
|
@@ -0,0 +1,1006 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#version: 0.2
|
| 2 |
+
G G
|
| 3 |
+
A A
|
| 4 |
+
U U
|
| 5 |
+
C C
|
| 6 |
+
A G
|
| 7 |
+
U G
|
| 8 |
+
A C
|
| 9 |
+
U C
|
| 10 |
+
U GG
|
| 11 |
+
G C
|
| 12 |
+
A GG
|
| 13 |
+
U AA
|
| 14 |
+
AG C
|
| 15 |
+
A UU
|
| 16 |
+
A CC
|
| 17 |
+
A UG
|
| 18 |
+
U CC
|
| 19 |
+
G AA
|
| 20 |
+
U AC
|
| 21 |
+
UG C
|
| 22 |
+
A UC
|
| 23 |
+
U AG
|
| 24 |
+
UU C
|
| 25 |
+
AA C
|
| 26 |
+
GG C
|
| 27 |
+
UU G
|
| 28 |
+
AA G
|
| 29 |
+
GG G
|
| 30 |
+
CC C
|
| 31 |
+
A U
|
| 32 |
+
UG AA
|
| 33 |
+
AC G
|
| 34 |
+
A UGG
|
| 35 |
+
UAA C
|
| 36 |
+
GC G
|
| 37 |
+
UC G
|
| 38 |
+
AGG C
|
| 39 |
+
UG AG
|
| 40 |
+
UGG C
|
| 41 |
+
AUG C
|
| 42 |
+
AG CC
|
| 43 |
+
UG CC
|
| 44 |
+
A UCC
|
| 45 |
+
GG AA
|
| 46 |
+
A UAA
|
| 47 |
+
U ACC
|
| 48 |
+
UU UU
|
| 49 |
+
AC GG
|
| 50 |
+
AGG G
|
| 51 |
+
U AUU
|
| 52 |
+
AG AA
|
| 53 |
+
UU GG
|
| 54 |
+
G CC
|
| 55 |
+
U AGC
|
| 56 |
+
UC AA
|
| 57 |
+
UU AA
|
| 58 |
+
GAA C
|
| 59 |
+
AC AA
|
| 60 |
+
U AGG
|
| 61 |
+
UGG G
|
| 62 |
+
ACC C
|
| 63 |
+
UGG GG
|
| 64 |
+
UG AC
|
| 65 |
+
A UAC
|
| 66 |
+
GC GG
|
| 67 |
+
AGG AA
|
| 68 |
+
UU CC
|
| 69 |
+
AGC G
|
| 70 |
+
UCC C
|
| 71 |
+
GC AA
|
| 72 |
+
AG AC
|
| 73 |
+
GG CC
|
| 74 |
+
AUU C
|
| 75 |
+
UU UC
|
| 76 |
+
UU GC
|
| 77 |
+
AA AA
|
| 78 |
+
AG AG
|
| 79 |
+
CC G
|
| 80 |
+
UAC G
|
| 81 |
+
AC AC
|
| 82 |
+
A UAG
|
| 83 |
+
GG GG
|
| 84 |
+
UG UC
|
| 85 |
+
UAA G
|
| 86 |
+
U AUC
|
| 87 |
+
UU UG
|
| 88 |
+
AG UC
|
| 89 |
+
AUU G
|
| 90 |
+
GGC G
|
| 91 |
+
AA AC
|
| 92 |
+
AAG UC
|
| 93 |
+
AUG AA
|
| 94 |
+
UG UG
|
| 95 |
+
UC UC
|
| 96 |
+
UGG AA
|
| 97 |
+
ACC G
|
| 98 |
+
AG UG
|
| 99 |
+
UGG GC
|
| 100 |
+
UU AC
|
| 101 |
+
UC GC
|
| 102 |
+
UUC GG
|
| 103 |
+
UGC G
|
| 104 |
+
U AUG
|
| 105 |
+
UUC G
|
| 106 |
+
UU UAA
|
| 107 |
+
UC GG
|
| 108 |
+
UU AG
|
| 109 |
+
UC UG
|
| 110 |
+
UCC G
|
| 111 |
+
AAC G
|
| 112 |
+
GAA G
|
| 113 |
+
AG UGG
|
| 114 |
+
UC AC
|
| 115 |
+
A UAAC
|
| 116 |
+
UG AGG
|
| 117 |
+
AUGG C
|
| 118 |
+
AG AGG
|
| 119 |
+
AG AU
|
| 120 |
+
AUG CC
|
| 121 |
+
ACC AA
|
| 122 |
+
U AGGC
|
| 123 |
+
GG GC
|
| 124 |
+
AUU AA
|
| 125 |
+
GG UGAA
|
| 126 |
+
UAC GGG
|
| 127 |
+
AUC G
|
| 128 |
+
AAG CC
|
| 129 |
+
UU GAA
|
| 130 |
+
U AU
|
| 131 |
+
UAC AC
|
| 132 |
+
GC GAA
|
| 133 |
+
CC UU
|
| 134 |
+
CCC G
|
| 135 |
+
AUGC G
|
| 136 |
+
AC UC
|
| 137 |
+
UG UU
|
| 138 |
+
GGC UAAC
|
| 139 |
+
AA GG
|
| 140 |
+
UC AG
|
| 141 |
+
AC GC
|
| 142 |
+
UG UAGC
|
| 143 |
+
UGAC GC
|
| 144 |
+
UGAG AC
|
| 145 |
+
UU CCC
|
| 146 |
+
GCG UAA
|
| 147 |
+
AGC AGCC
|
| 148 |
+
AUGG G
|
| 149 |
+
AGGC AGC
|
| 150 |
+
AG UGGC
|
| 151 |
+
AGG GC
|
| 152 |
+
UAC AA
|
| 153 |
+
UC AGC
|
| 154 |
+
AUU GG
|
| 155 |
+
GAA GGC
|
| 156 |
+
GCGG UAA
|
| 157 |
+
AC GAA
|
| 158 |
+
UU AAG
|
| 159 |
+
UGCC AGCAGCC
|
| 160 |
+
CC CC
|
| 161 |
+
UG UCG
|
| 162 |
+
UU GGG
|
| 163 |
+
UGC AA
|
| 164 |
+
AGC AA
|
| 165 |
+
AUCC C
|
| 166 |
+
UACGGG AGGCAGC
|
| 167 |
+
AC GGG
|
| 168 |
+
UU AAC
|
| 169 |
+
UUC GGG
|
| 170 |
+
AC UG
|
| 171 |
+
UUG CC
|
| 172 |
+
ACC GG
|
| 173 |
+
UAG AG
|
| 174 |
+
UUG UAA
|
| 175 |
+
UAG UCC
|
| 176 |
+
AGG AUU
|
| 177 |
+
UAA GG
|
| 178 |
+
UGCCAGCAGCC GCGGUAA
|
| 179 |
+
UCC UACGGGAGGCAGC
|
| 180 |
+
AGG GG
|
| 181 |
+
GC ACAA
|
| 182 |
+
AU AUU
|
| 183 |
+
AU AUC
|
| 184 |
+
AG UU
|
| 185 |
+
UAA UACC
|
| 186 |
+
UAA AA
|
| 187 |
+
UAC GG
|
| 188 |
+
AGG AAC
|
| 189 |
+
UG CCC
|
| 190 |
+
UUG AC
|
| 191 |
+
GAA GC
|
| 192 |
+
UGG CC
|
| 193 |
+
UC UU
|
| 194 |
+
U AGGG
|
| 195 |
+
AG CCC
|
| 196 |
+
UGAGAC ACGG
|
| 197 |
+
AUU AGC
|
| 198 |
+
AUAA G
|
| 199 |
+
GC UGGC
|
| 200 |
+
AGG CC
|
| 201 |
+
AC UU
|
| 202 |
+
AGCG UGGGG
|
| 203 |
+
AGC AAAC
|
| 204 |
+
ACC CC
|
| 205 |
+
AGGAA GG
|
| 206 |
+
UAA CC
|
| 207 |
+
UUG ACGG
|
| 208 |
+
AGGAUU AGAU
|
| 209 |
+
AC AG
|
| 210 |
+
AGAC UCCUACGGGAGGCAGC
|
| 211 |
+
UGG UC
|
| 212 |
+
GGC GG
|
| 213 |
+
GC GC
|
| 214 |
+
UACC C
|
| 215 |
+
UGG AGC
|
| 216 |
+
AUG UGG
|
| 217 |
+
AGUGG GGAA
|
| 218 |
+
UGUAGC GGUGAA
|
| 219 |
+
GGG CC
|
| 220 |
+
UAG UAA
|
| 221 |
+
UCC GG
|
| 222 |
+
N N
|
| 223 |
+
Ġ G
|
| 224 |
+
UG AAG
|
| 225 |
+
UAG CC
|
| 226 |
+
AC AUGC
|
| 227 |
+
UC AAC
|
| 228 |
+
AG UAC
|
| 229 |
+
AGG AUG
|
| 230 |
+
AGGAUUAGAU ACCC
|
| 231 |
+
AG UGC
|
| 232 |
+
U AUGG
|
| 233 |
+
ACG CC
|
| 234 |
+
UAG UUGG
|
| 235 |
+
UG UAA
|
| 236 |
+
AA CC
|
| 237 |
+
AC UGC
|
| 238 |
+
UAUU GG
|
| 239 |
+
UGG GCGUAA
|
| 240 |
+
UU UUC
|
| 241 |
+
UGAG UAAC
|
| 242 |
+
UGC UGC
|
| 243 |
+
UAG AA
|
| 244 |
+
AUU CC
|
| 245 |
+
UAA GC
|
| 246 |
+
U AUAA
|
| 247 |
+
ACG UC
|
| 248 |
+
AA GC
|
| 249 |
+
AG AAG
|
| 250 |
+
AGC GCAA
|
| 251 |
+
UG ACGG
|
| 252 |
+
AGC GC
|
| 253 |
+
UU UUG
|
| 254 |
+
UGC AAC
|
| 255 |
+
GG UG
|
| 256 |
+
UCAGC UCG
|
| 257 |
+
UGG UAGUCC
|
| 258 |
+
UU UCC
|
| 259 |
+
AGC GG
|
| 260 |
+
AG AAC
|
| 261 |
+
UG AAC
|
| 262 |
+
UGG AAC
|
| 263 |
+
UUC AA
|
| 264 |
+
AG AUU
|
| 265 |
+
AC UCC
|
| 266 |
+
AG AUG
|
| 267 |
+
UU AUU
|
| 268 |
+
UGG GAA
|
| 269 |
+
AG AGC
|
| 270 |
+
AUC AA
|
| 271 |
+
GGCUAAC UACG
|
| 272 |
+
AGC AAC
|
| 273 |
+
AGCGUGGGG AGCAAAC
|
| 274 |
+
AGGAUUAGAUACCC UGGUAGUCC
|
| 275 |
+
AC AUU
|
| 276 |
+
UAA ACG
|
| 277 |
+
UG AGGC
|
| 278 |
+
UG UGAA
|
| 279 |
+
GAA GG
|
| 280 |
+
AUGCG UAG
|
| 281 |
+
UU GGC
|
| 282 |
+
UAGG GG
|
| 283 |
+
AG UGAA
|
| 284 |
+
AGG GAA
|
| 285 |
+
UG AUC
|
| 286 |
+
UGGG AC
|
| 287 |
+
UUAAG UCCC
|
| 288 |
+
ACCG CCCG
|
| 289 |
+
GAAC GCUGGC
|
| 290 |
+
AAGUC GAAC
|
| 291 |
+
AGC GAA
|
| 292 |
+
AGC UC
|
| 293 |
+
UCAA AGGAA
|
| 294 |
+
UCAA CC
|
| 295 |
+
GCC UGGGG
|
| 296 |
+
CCC UU
|
| 297 |
+
UCC CC
|
| 298 |
+
UGCC G
|
| 299 |
+
UG AUCC
|
| 300 |
+
UGAG AUG
|
| 301 |
+
UU ACC
|
| 302 |
+
AGACUCCUACGGGAGGCAGC AGUGGGGAA
|
| 303 |
+
UCG CC
|
| 304 |
+
GGG AC
|
| 305 |
+
AGGC G
|
| 306 |
+
AGGAAGG UGGGG
|
| 307 |
+
GGG CCC
|
| 308 |
+
UAUU C
|
| 309 |
+
UACG UUCCC
|
| 310 |
+
UCAAAGGAA UUGACGG
|
| 311 |
+
AU ACC
|
| 312 |
+
UGAGACACGG CCC
|
| 313 |
+
AU AGC
|
| 314 |
+
UC AUU
|
| 315 |
+
UACAC ACCGCCCG
|
| 316 |
+
UC GAA
|
| 317 |
+
AU AGG
|
| 318 |
+
AUC GG
|
| 319 |
+
UU UGG
|
| 320 |
+
UG AUGC
|
| 321 |
+
UGC GAA
|
| 322 |
+
UAG AGG
|
| 323 |
+
GCACAA GCGG
|
| 324 |
+
AAG UCG
|
| 325 |
+
UGGC G
|
| 326 |
+
UC GGAA
|
| 327 |
+
GGCG ACG
|
| 328 |
+
UG AUG
|
| 329 |
+
UAGC G
|
| 330 |
+
AUAC G
|
| 331 |
+
AACG AGCGCAA
|
| 332 |
+
UCAGCUCG UGUCG
|
| 333 |
+
CCUU ACC
|
| 334 |
+
UUGGG UUAAGUCCC
|
| 335 |
+
ACG UGC
|
| 336 |
+
AC UGG
|
| 337 |
+
AG UAA
|
| 338 |
+
GCAA GG
|
| 339 |
+
UG UGG
|
| 340 |
+
UCAGCUCGUGUCG UGAGAUG
|
| 341 |
+
U AUCC
|
| 342 |
+
AG UUC
|
| 343 |
+
AG ACC
|
| 344 |
+
ACC AGUGGC
|
| 345 |
+
AU AUG
|
| 346 |
+
UC AGG
|
| 347 |
+
UC UUC
|
| 348 |
+
GC AACGAGCGCAA
|
| 349 |
+
UUAC UGGGCGUAA
|
| 350 |
+
UG AUU
|
| 351 |
+
UU AUCC
|
| 352 |
+
UG ACC
|
| 353 |
+
UC AUC
|
| 354 |
+
U AUGC
|
| 355 |
+
UAG UC
|
| 356 |
+
GCC G
|
| 357 |
+
AUC AGC
|
| 358 |
+
AUUC G
|
| 359 |
+
UAAUACC GC
|
| 360 |
+
UGG GGG
|
| 361 |
+
AAC GCGAA
|
| 362 |
+
AC AGG
|
| 363 |
+
UGC GG
|
| 364 |
+
GGCUAAC UCCG
|
| 365 |
+
AUGUGG UUUAA
|
| 366 |
+
AGGAAGGUGGGG AUG
|
| 367 |
+
GCC GCG
|
| 368 |
+
UCGC UAGUAA
|
| 369 |
+
UGAA AC
|
| 370 |
+
AC GGC
|
| 371 |
+
UUG UACACACCGCCCG
|
| 372 |
+
UGGAA UUCC
|
| 373 |
+
UCAGCUCGUGUCGUGAGAUG UUGGGUUAAGUCCC
|
| 374 |
+
GAA AGCC
|
| 375 |
+
AUU GC
|
| 376 |
+
UGGUC UGAG
|
| 377 |
+
UC GGC
|
| 378 |
+
UCC AA
|
| 379 |
+
AUUAGC UAGUUGG
|
| 380 |
+
UAGGC GG
|
| 381 |
+
AG UUG
|
| 382 |
+
GAAC GGG
|
| 383 |
+
UC ACC
|
| 384 |
+
UAA AAC
|
| 385 |
+
UC UGG
|
| 386 |
+
UAUU G
|
| 387 |
+
UUCGGG UUGUAA
|
| 388 |
+
AC UUC
|
| 389 |
+
ACGUGC UACAA
|
| 390 |
+
GAA AA
|
| 391 |
+
Ġ C
|
| 392 |
+
UC UGC
|
| 393 |
+
UU UGC
|
| 394 |
+
UACC G
|
| 395 |
+
UGCAAC UCG
|
| 396 |
+
AUGGC UGUCG
|
| 397 |
+
UUG UUGG
|
| 398 |
+
UG UGC
|
| 399 |
+
AACGCGAA GAA
|
| 400 |
+
UG UUC
|
| 401 |
+
AG AGGG
|
| 402 |
+
AUCC G
|
| 403 |
+
GCG UUG
|
| 404 |
+
AAC AA
|
| 405 |
+
UU GGAA
|
| 406 |
+
AU AU
|
| 407 |
+
UC UCC
|
| 408 |
+
AG AUC
|
| 409 |
+
ACG CCG
|
| 410 |
+
UUAA CC
|
| 411 |
+
AGGC GG
|
| 412 |
+
ACAUGC AAGUCGAAC
|
| 413 |
+
UGG UGC
|
| 414 |
+
UAA UAC
|
| 415 |
+
UACC AA
|
| 416 |
+
GG CCC
|
| 417 |
+
AGC AC
|
| 418 |
+
UGAA CC
|
| 419 |
+
ACAC UGGGAC
|
| 420 |
+
AUC AGG
|
| 421 |
+
UGAGUAAC ACG
|
| 422 |
+
GCG UG
|
| 423 |
+
U AUAC
|
| 424 |
+
UUG UC
|
| 425 |
+
GAA UC
|
| 426 |
+
UU AGC
|
| 427 |
+
UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCC GCAACGAGCGCAA
|
| 428 |
+
AGCAAC GCCGCG
|
| 429 |
+
AG UAGG
|
| 430 |
+
UAAC G
|
| 431 |
+
GCACAAGCGG UGGAGC
|
| 432 |
+
UU UAG
|
| 433 |
+
AGG GGG
|
| 434 |
+
UACAC ACGUGCUACAA
|
| 435 |
+
GGC GC
|
| 436 |
+
UGAG AGGG
|
| 437 |
+
UGC GC
|
| 438 |
+
AGCC G
|
| 439 |
+
UGAA UACGUUCCC
|
| 440 |
+
UU UAC
|
| 441 |
+
NN NN
|
| 442 |
+
GGCUAACUCCG UGCCAGCAGCCGCGGUAA
|
| 443 |
+
AUGG AA
|
| 444 |
+
UGGGC GC
|
| 445 |
+
UGGGC GAAAGCC
|
| 446 |
+
U AUAG
|
| 447 |
+
GAA GGCC
|
| 448 |
+
GGC AGC
|
| 449 |
+
AUC GC
|
| 450 |
+
UG UUG
|
| 451 |
+
ACCC G
|
| 452 |
+
GGCUAACUACG UGCCAGCAGCCGCGGUAA
|
| 453 |
+
AG UCC
|
| 454 |
+
AUC AGCC
|
| 455 |
+
UG UCC
|
| 456 |
+
UCAAAGGAAUUGACGG GGGCCC
|
| 457 |
+
UGACGC UGAGGC
|
| 458 |
+
UG AGC
|
| 459 |
+
UUCC G
|
| 460 |
+
AAG AC
|
| 461 |
+
GAAC G
|
| 462 |
+
AACGCGAAGAA CCUUACC
|
| 463 |
+
UGGC GAAGGC
|
| 464 |
+
AAC GC
|
| 465 |
+
GG AUU
|
| 466 |
+
ACACUGGGAC UGAGACACGGCCC
|
| 467 |
+
AGCC AUGCC
|
| 468 |
+
AUG AC
|
| 469 |
+
GCACAAGCGGUGGAGC AUGUGGUUUAA
|
| 470 |
+
GCG CC
|
| 471 |
+
UG AUGG
|
| 472 |
+
UGCUGC AUGGCUGUCG
|
| 473 |
+
AGG UC
|
| 474 |
+
AUG UC
|
| 475 |
+
GCC CC
|
| 476 |
+
UG ACG
|
| 477 |
+
GGGCC UUGUACACACCGCCCG
|
| 478 |
+
ACC UC
|
| 479 |
+
GG GGC
|
| 480 |
+
UCAC ACC
|
| 481 |
+
AUUGG GCGUAA
|
| 482 |
+
UAAC AAGG
|
| 483 |
+
UUAA AA
|
| 484 |
+
ACC GC
|
| 485 |
+
UGUAGCGGUGAA AUGCGUAG
|
| 486 |
+
UUGG GC
|
| 487 |
+
UAAC GGC
|
| 488 |
+
ACGCCG UAAACG
|
| 489 |
+
GAA AC
|
| 490 |
+
AGC UAAC
|
| 491 |
+
AUAA AA
|
| 492 |
+
AGCGUGGGGAGCAAAC AGGAUUAGAUACCCUGGUAGUCC
|
| 493 |
+
AGC GAAC
|
| 494 |
+
UCC UC
|
| 495 |
+
AGAA AA
|
| 496 |
+
UGAA GG
|
| 497 |
+
UAUU GCACAA
|
| 498 |
+
UGGGCGC AAGCC
|
| 499 |
+
UUUU GG
|
| 500 |
+
UGGUCUGAG AGGAUG
|
| 501 |
+
AUC AG
|
| 502 |
+
ACCAA GGCGACG
|
| 503 |
+
GAACGCUGGC GGC
|
| 504 |
+
GGCUAACUACGUGCCAGCAGCCGCGGUAA UACG
|
| 505 |
+
UGAGACACGG UCC
|
| 506 |
+
AGAA GC
|
| 507 |
+
UCCC G
|
| 508 |
+
UUC GGAA
|
| 509 |
+
ACGG CC
|
| 510 |
+
U AUGAA
|
| 511 |
+
UGACGC UGAGG
|
| 512 |
+
AUC AUU
|
| 513 |
+
ACCAGUGGC GAAGGC
|
| 514 |
+
ACCAA GGC
|
| 515 |
+
U A
|
| 516 |
+
UU UGAC
|
| 517 |
+
AC AAC
|
| 518 |
+
AUG UGAA
|
| 519 |
+
UGUAGCGGUGAA AUGC
|
| 520 |
+
UG UAG
|
| 521 |
+
UGG GAAC
|
| 522 |
+
AUC AUC
|
| 523 |
+
GGCC G
|
| 524 |
+
UAA UC
|
| 525 |
+
GGCUAACUCCGUGCCAGCAGCCGCGGUAA UACGG
|
| 526 |
+
UAA AGC
|
| 527 |
+
UGGC UC
|
| 528 |
+
AGAC UGCC
|
| 529 |
+
UG UAC
|
| 530 |
+
UUG AG
|
| 531 |
+
GG UC
|
| 532 |
+
ACAC UGGAAC
|
| 533 |
+
UAAUACC GG
|
| 534 |
+
UCC GGAA
|
| 535 |
+
UUAA UCGGAA
|
| 536 |
+
GCCUGGGG AGUAC
|
| 537 |
+
AUAA CC
|
| 538 |
+
AG UCG
|
| 539 |
+
AUGG GC
|
| 540 |
+
GGG UC
|
| 541 |
+
AG UUCGG
|
| 542 |
+
AGGAAGGUGGGGAUG ACGUC
|
| 543 |
+
UGAG AA
|
| 544 |
+
AUCC CC
|
| 545 |
+
GCGG UGAAUACGUUCCC
|
| 546 |
+
UGG AGG
|
| 547 |
+
AGAG UUUG
|
| 548 |
+
UGCAA GCG
|
| 549 |
+
UU UAUU
|
| 550 |
+
UGG AC
|
| 551 |
+
UGAG UAA
|
| 552 |
+
GAAGC ACC
|
| 553 |
+
AGCCAUGCC GCG
|
| 554 |
+
GGC AA
|
| 555 |
+
UUG UCG
|
| 556 |
+
UAUUGG ACAA
|
| 557 |
+
UUGG GG
|
| 558 |
+
AUC UC
|
| 559 |
+
GAA AGC
|
| 560 |
+
UGAA AA
|
| 561 |
+
AC AGC
|
| 562 |
+
UG AUGAA
|
| 563 |
+
GCCUGGGGAGUAC GGCC
|
| 564 |
+
GAA CC
|
| 565 |
+
UGG GCC
|
| 566 |
+
AG AGAA
|
| 567 |
+
AUGG GG
|
| 568 |
+
AGG CCC
|
| 569 |
+
AUAAC G
|
| 570 |
+
AUGCG UAGAG
|
| 571 |
+
GAA GGCG
|
| 572 |
+
UC GGG
|
| 573 |
+
UGGC AA
|
| 574 |
+
AGCC CC
|
| 575 |
+
UC GCGG
|
| 576 |
+
GG ACGGG
|
| 577 |
+
UCG UAACAAGG
|
| 578 |
+
AGC UUGC
|
| 579 |
+
UUUU AA
|
| 580 |
+
AGCG ACGCC
|
| 581 |
+
UUAAUCGGAA UUACUGGGCGUAA
|
| 582 |
+
GGAA GG
|
| 583 |
+
AC AUC
|
| 584 |
+
UGAGUAAC GCG
|
| 585 |
+
UU AUG
|
| 586 |
+
GCCUGGGG AG
|
| 587 |
+
UAG CCG
|
| 588 |
+
UGGGG UAA
|
| 589 |
+
UUCG AUGC
|
| 590 |
+
CCC UUG
|
| 591 |
+
CCC GG
|
| 592 |
+
UU UGAA
|
| 593 |
+
GCAA GGC
|
| 594 |
+
AUGG CCCUU
|
| 595 |
+
AUU UC
|
| 596 |
+
AGG AC
|
| 597 |
+
GAACGCUGGC GGCG
|
| 598 |
+
GGCGG ACGGG
|
| 599 |
+
UUAA GC
|
| 600 |
+
U AUGGG
|
| 601 |
+
UU AUC
|
| 602 |
+
AU AUUC
|
| 603 |
+
UGG AG
|
| 604 |
+
AAGUC AUC
|
| 605 |
+
UGG GGC
|
| 606 |
+
AGUC UGCAACUCG
|
| 607 |
+
ACCC GC
|
| 608 |
+
AG AUGG
|
| 609 |
+
GGAA UCGCUAGUAA
|
| 610 |
+
UUC UC
|
| 611 |
+
AUU AAG
|
| 612 |
+
ACG UCAA
|
| 613 |
+
CC AA
|
| 614 |
+
UUUU GC
|
| 615 |
+
UCAA AA
|
| 616 |
+
AUG AAG
|
| 617 |
+
AUG AAC
|
| 618 |
+
AG UAG
|
| 619 |
+
AC ACC
|
| 620 |
+
UGC UUAAC
|
| 621 |
+
ACACUGGAAC UGAGACACGGUCC
|
| 622 |
+
ACACUGGGACUGAGACACGGCCC AGACUCCUACGGGAGGCAGCAGUGGGGAA
|
| 623 |
+
AC UGGG
|
| 624 |
+
UAUC AGC
|
| 625 |
+
UGGUGC AUGG
|
| 626 |
+
ACAUGC AAGUCG
|
| 627 |
+
UAC GAA
|
| 628 |
+
UU AUUGGGCGUAA
|
| 629 |
+
CCC AA
|
| 630 |
+
AUG AUU
|
| 631 |
+
AAC GG
|
| 632 |
+
UU UCG
|
| 633 |
+
AC UUG
|
| 634 |
+
AGG AGG
|
| 635 |
+
AAAA AA
|
| 636 |
+
UUGAA AC
|
| 637 |
+
GGGCCUUGUACACACCGCCCG UCACACC
|
| 638 |
+
AGGG UGCG
|
| 639 |
+
UAAGC ACC
|
| 640 |
+
UGC GGC
|
| 641 |
+
UGGC GC
|
| 642 |
+
UGC AUU
|
| 643 |
+
UUUU CC
|
| 644 |
+
UCCC AA
|
| 645 |
+
UU AGG
|
| 646 |
+
AGCG UUG
|
| 647 |
+
UGAA GAAGGCC
|
| 648 |
+
UCC GC
|
| 649 |
+
UU UGGG
|
| 650 |
+
UUC GGGG
|
| 651 |
+
Ġ AGAGUUUG
|
| 652 |
+
UUAUCC GGAUU
|
| 653 |
+
UG UUGG
|
| 654 |
+
UAGG AA
|
| 655 |
+
UGAA GC
|
| 656 |
+
Ġ CC
|
| 657 |
+
UGC AC
|
| 658 |
+
AGUGGC GAACGGG
|
| 659 |
+
UAA AC
|
| 660 |
+
AC GAACGCUGGCGGCG
|
| 661 |
+
UU AAGUC
|
| 662 |
+
UGGGG GAA
|
| 663 |
+
AUU GAA
|
| 664 |
+
AGG UGCUGCAUGGCUGUCG
|
| 665 |
+
UAUC G
|
| 666 |
+
UUG ACC
|
| 667 |
+
UAUU CC
|
| 668 |
+
AGUG AGGAA
|
| 669 |
+
ACC ACC
|
| 670 |
+
UU GCG
|
| 671 |
+
ACAA AA
|
| 672 |
+
AGG AAG
|
| 673 |
+
UAU AUU
|
| 674 |
+
UAAUAC AUGC
|
| 675 |
+
ACAUU GGGAC
|
| 676 |
+
AUGCC CCUU
|
| 677 |
+
UGCC CC
|
| 678 |
+
AC UAC
|
| 679 |
+
AC AAG
|
| 680 |
+
GG GAA
|
| 681 |
+
AGAA GAAGCACC
|
| 682 |
+
UGC GGG
|
| 683 |
+
UUC AG
|
| 684 |
+
UAGCC GGCC
|
| 685 |
+
UUC GAAGC
|
| 686 |
+
AGCC AC
|
| 687 |
+
AGCAACGCCGCG UGAG
|
| 688 |
+
AUU GAACGCUGGCGGC
|
| 689 |
+
UAGC UGGUCUGAGAGGAUG
|
| 690 |
+
UU GCAA
|
| 691 |
+
AUG AAGUC
|
| 692 |
+
UAGAGG UGAA
|
| 693 |
+
UUGCC AGC
|
| 694 |
+
UUAA AAC
|
| 695 |
+
AC UAA
|
| 696 |
+
UGAG AGG
|
| 697 |
+
UC UUG
|
| 698 |
+
ACCGG UGGCGAAGGC
|
| 699 |
+
AGCC AA
|
| 700 |
+
Ġ UACG
|
| 701 |
+
AUG CCC
|
| 702 |
+
UAGG GC
|
| 703 |
+
ACGCCGUAAACG AUG
|
| 704 |
+
AG UUGG
|
| 705 |
+
UG AGGG
|
| 706 |
+
AUU UAA
|
| 707 |
+
UGACGG UACC
|
| 708 |
+
UC UAA
|
| 709 |
+
UGG GGAA
|
| 710 |
+
GG AC
|
| 711 |
+
UGG UGUAGCGGUGAAAUGC
|
| 712 |
+
UC AAG
|
| 713 |
+
AG UGGG
|
| 714 |
+
AUAC AA
|
| 715 |
+
GCUGGC GGCG
|
| 716 |
+
GG AG
|
| 717 |
+
UAAC ACAUGCAAGUCGAAC
|
| 718 |
+
GCG AGG
|
| 719 |
+
ACC UGAGAGGG
|
| 720 |
+
ACCAGUGGCGAAGGC GGC
|
| 721 |
+
UUUU UUUU
|
| 722 |
+
UCGC AAG
|
| 723 |
+
ACGG UACC
|
| 724 |
+
AUG UG
|
| 725 |
+
UAC GC
|
| 726 |
+
UGCC GC
|
| 727 |
+
AU AUAA
|
| 728 |
+
GCG UGAG
|
| 729 |
+
UAGC GAA
|
| 730 |
+
GGUG ACAA
|
| 731 |
+
AUU AUU
|
| 732 |
+
AG ACG
|
| 733 |
+
AA UAA
|
| 734 |
+
UCAAAGGAAUUGACGGGGGCCC GCACAAGCGGUGGAGCAUGUGGUUUAA
|
| 735 |
+
UUCGG AUUG
|
| 736 |
+
AGC UCC
|
| 737 |
+
UG UGGC
|
| 738 |
+
GGAA UUCC
|
| 739 |
+
AUUCG UAG
|
| 740 |
+
GG AAC
|
| 741 |
+
UGAC AC
|
| 742 |
+
UU AGGG
|
| 743 |
+
UAGGC GGC
|
| 744 |
+
AG UUUU
|
| 745 |
+
UGGGC UACACACGUGCUACAA
|
| 746 |
+
UGG UUC
|
| 747 |
+
ACGUCAA AUCAUC
|
| 748 |
+
UGAAG UCGUAACAAGG
|
| 749 |
+
AUCC AA
|
| 750 |
+
NNNN NNNN
|
| 751 |
+
AUC AC
|
| 752 |
+
GGGC UCAACC
|
| 753 |
+
UAAC GCG
|
| 754 |
+
AUG UCC
|
| 755 |
+
UUCGG AUCG
|
| 756 |
+
UGGGGGAA ACCC
|
| 757 |
+
GCC GG
|
| 758 |
+
AGGC AA
|
| 759 |
+
GGC UAA
|
| 760 |
+
UGAUC GGCC
|
| 761 |
+
UAGAGGUGAA AUUCGUAG
|
| 762 |
+
UG AUAC
|
| 763 |
+
AUG ACC
|
| 764 |
+
UGAG CC
|
| 765 |
+
UGAGG UAA
|
| 766 |
+
UC UAC
|
| 767 |
+
UGACGCUGAGGC GCGAA
|
| 768 |
+
AUU UU
|
| 769 |
+
UC GCG
|
| 770 |
+
AGC AGG
|
| 771 |
+
AUU AG
|
| 772 |
+
UCC CCC
|
| 773 |
+
UC UGCC
|
| 774 |
+
UACCAA GGCGACG
|
| 775 |
+
GAA GAA
|
| 776 |
+
ĠAGAGUUUG AUCC
|
| 777 |
+
GGUGACAA ACCGG
|
| 778 |
+
GCAA UGGGCGAAAGCC
|
| 779 |
+
UGUAGCGGUGAA AUGCGUAGAG
|
| 780 |
+
AGG ACG
|
| 781 |
+
AC UGCC
|
| 782 |
+
AUGGC GAAGGC
|
| 783 |
+
UGG UG
|
| 784 |
+
AUGG CC
|
| 785 |
+
UC AUG
|
| 786 |
+
AGC AUC
|
| 787 |
+
GG GGG
|
| 788 |
+
AG ACGG
|
| 789 |
+
U AUAAC
|
| 790 |
+
AGCUAAC GC
|
| 791 |
+
U AUAAG
|
| 792 |
+
UUG UU
|
| 793 |
+
AUGC AA
|
| 794 |
+
UUGAC AUCC
|
| 795 |
+
AUUC AA
|
| 796 |
+
ĠG ACGAACGCUGGCGGCG
|
| 797 |
+
GGCUAACUACG UG
|
| 798 |
+
AGUGGC GGACGGG
|
| 799 |
+
UGGG UAGC
|
| 800 |
+
UGAUCC AGCCAUGCCGCG
|
| 801 |
+
UUC AC
|
| 802 |
+
AGG GGC
|
| 803 |
+
UAG AGC
|
| 804 |
+
ACC AGCC
|
| 805 |
+
GCCUGGGGAG UACGG
|
| 806 |
+
ACG CCC
|
| 807 |
+
UGCUUAAC ACAUGCAAGUCGAAC
|
| 808 |
+
UGGUGCAUGG UUGUCG
|
| 809 |
+
UAAC GG
|
| 810 |
+
UAAUACCGC AUACG
|
| 811 |
+
UGUAGCGGUGAAAUGCGUAG AUAUC
|
| 812 |
+
AGCC GCC
|
| 813 |
+
GCCUGGGGAGUACGGCC GCAAGG
|
| 814 |
+
GGGG GC
|
| 815 |
+
UG UGAC
|
| 816 |
+
AUU UAC
|
| 817 |
+
AGAA GAA
|
| 818 |
+
UAUU GC
|
| 819 |
+
UUCGAUGC AACGCGAAGAACCUUACC
|
| 820 |
+
GGUGAA UACGUUCCC
|
| 821 |
+
UAGC AA
|
| 822 |
+
ACG UU
|
| 823 |
+
UAUUGG UCAA
|
| 824 |
+
AU AUGC
|
| 825 |
+
AUAG CC
|
| 826 |
+
UG UUUU
|
| 827 |
+
GGG UUUAA
|
| 828 |
+
AGCAA UGCC
|
| 829 |
+
UACC CC
|
| 830 |
+
UAGG UGG
|
| 831 |
+
AGC AUU
|
| 832 |
+
AUGAA GC
|
| 833 |
+
AGGC GC
|
| 834 |
+
UGCC GG
|
| 835 |
+
AAGUCAUC AUGGCCCUU
|
| 836 |
+
UGCC UAAUACAUGC
|
| 837 |
+
CCC GCG
|
| 838 |
+
AGCGUGGGGAGCAAAC AGG
|
| 839 |
+
ACCAGUGGC GAAGGCG
|
| 840 |
+
UGCAAGCG UUAAUCGGAAUUACUGGGCGUAA
|
| 841 |
+
UGG UAA
|
| 842 |
+
UU UGGC
|
| 843 |
+
UAGUCC GG
|
| 844 |
+
UACC GG
|
| 845 |
+
UG AAGUC
|
| 846 |
+
UCAA GC
|
| 847 |
+
AGCGUGGGG AGCGAAC
|
| 848 |
+
UCG AUG
|
| 849 |
+
UAA GAA
|
| 850 |
+
U AUGGC
|
| 851 |
+
AGCC GG
|
| 852 |
+
UGG UGG
|
| 853 |
+
ACCC AA
|
| 854 |
+
ACC AC
|
| 855 |
+
CCC GC
|
| 856 |
+
AGAA GG
|
| 857 |
+
UUC UUC
|
| 858 |
+
GG ACCC
|
| 859 |
+
AGG UAG
|
| 860 |
+
AG AGGAA
|
| 861 |
+
UUC GGC
|
| 862 |
+
UCUC AGUUCGG
|
| 863 |
+
AUUAA GC
|
| 864 |
+
UAC GGGG
|
| 865 |
+
UGC UCC
|
| 866 |
+
GC AGAU
|
| 867 |
+
AGACUCCUACGGGAGGCAGC AGUAGG
|
| 868 |
+
AGC UAA
|
| 869 |
+
AUCAGG AGGAAC
|
| 870 |
+
AUU AC
|
| 871 |
+
UC UAG
|
| 872 |
+
UAUU AA
|
| 873 |
+
AGG UGGUGCAUGGUUGUCG
|
| 874 |
+
AGG AGGAAC
|
| 875 |
+
ACGUCAAAUCAUC AUGCCCCUU
|
| 876 |
+
GCGG CC
|
| 877 |
+
UGG AUG
|
| 878 |
+
AUU AGAU
|
| 879 |
+
UGC AGC
|
| 880 |
+
UU UGAG
|
| 881 |
+
UGAA GAAGG
|
| 882 |
+
UAA UAA
|
| 883 |
+
UU UGUC
|
| 884 |
+
UGAGG UAACGGC
|
| 885 |
+
AUAG AA
|
| 886 |
+
AAC UC
|
| 887 |
+
UGG GCG
|
| 888 |
+
AG UUUC
|
| 889 |
+
AUG UUC
|
| 890 |
+
UGG ACC
|
| 891 |
+
UUCC CC
|
| 892 |
+
AG UUGC
|
| 893 |
+
UGAA AGCCC
|
| 894 |
+
UGC AGG
|
| 895 |
+
AAG UCCUC
|
| 896 |
+
UG ACCG
|
| 897 |
+
UGG AUC
|
| 898 |
+
AAG AGG
|
| 899 |
+
AUU GCGAA
|
| 900 |
+
ACG AUG
|
| 901 |
+
UGG AAAC
|
| 902 |
+
AUAA GC
|
| 903 |
+
GG UGGAA
|
| 904 |
+
UGACGCUGAGG AGCGAA
|
| 905 |
+
GAAC GC
|
| 906 |
+
GAAUC UUCC
|
| 907 |
+
UUC GC
|
| 908 |
+
ACCUGAGAGGG UGAUCGGCC
|
| 909 |
+
ACACUGGAACUGAGACACGGUCC AGACUCCUACGGGAGGCAGCAGUGGGGAA
|
| 910 |
+
GGCUAAC UUCG
|
| 911 |
+
AG AGAC
|
| 912 |
+
AG AGGC
|
| 913 |
+
UAC UC
|
| 914 |
+
UAAC GGCCC
|
| 915 |
+
UUG AGUGC
|
| 916 |
+
AAC AC
|
| 917 |
+
AG UGCC
|
| 918 |
+
AGCGC GCG
|
| 919 |
+
UG UGCC
|
| 920 |
+
AGC AGC
|
| 921 |
+
ACCC GAA
|
| 922 |
+
ACAA CC
|
| 923 |
+
GGG AGGAAC
|
| 924 |
+
ACC UGGGG
|
| 925 |
+
ACGAA AGUC
|
| 926 |
+
UC AUGC
|
| 927 |
+
ACGG GG
|
| 928 |
+
AU AUGG
|
| 929 |
+
UC UUUU
|
| 930 |
+
GGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG AGGG
|
| 931 |
+
UU AGAG
|
| 932 |
+
UGAUGC AGCGACGCC
|
| 933 |
+
UG UAGG
|
| 934 |
+
GC AUGG
|
| 935 |
+
AGAA AGCCAC
|
| 936 |
+
UGG AUU
|
| 937 |
+
UUGC AGAA
|
| 938 |
+
UU UCCC
|
| 939 |
+
UG UUAA
|
| 940 |
+
UU GAAG
|
| 941 |
+
UCAA CCG
|
| 942 |
+
UGG UAG
|
| 943 |
+
GGCUAACUACGUGCCAGCAGCCGCGGUAAUACG UAGG
|
| 944 |
+
GAA AGG
|
| 945 |
+
UG AGGAA
|
| 946 |
+
UU ACCAAGGC
|
| 947 |
+
UGUAGC AGUGAA
|
| 948 |
+
UAGCCGGCC UGAGAGGG
|
| 949 |
+
UGG UAC
|
| 950 |
+
UCGCGG AUCAGC
|
| 951 |
+
GGAA ACG
|
| 952 |
+
UGUG UGAAGAAGGCC
|
| 953 |
+
GGCC ACAUUGGGAC
|
| 954 |
+
AUC UCC
|
| 955 |
+
AGGGC GCG
|
| 956 |
+
UG UGGG
|
| 957 |
+
UAAC GC
|
| 958 |
+
ACC UCC
|
| 959 |
+
GGGCCUUGUACACACCGCCCGUCACACC AUGGG
|
| 960 |
+
UU UCAA
|
| 961 |
+
UGG UCGG
|
| 962 |
+
AGGG AC
|
| 963 |
+
UAGGC G
|
| 964 |
+
UG UAAG
|
| 965 |
+
UGG AGGAA
|
| 966 |
+
UUGACGG UACC
|
| 967 |
+
AGUGAGGAA UAUUGGUCAA
|
| 968 |
+
UG ACAA
|
| 969 |
+
AUU UUC
|
| 970 |
+
AGGUGGUGCAUGGUUGUCG UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCCGCAACGAGCGCAA
|
| 971 |
+
AGC ACC
|
| 972 |
+
AGAA CC
|
| 973 |
+
AUGAAGUC GGAAUCGCUAGUAA
|
| 974 |
+
GG UCC
|
| 975 |
+
AG UGAC
|
| 976 |
+
AG AGCC
|
| 977 |
+
UGC UC
|
| 978 |
+
AC AUG
|
| 979 |
+
UAUG CC
|
| 980 |
+
AUUAGC UAG
|
| 981 |
+
UCAA CCC
|
| 982 |
+
AU AUAC
|
| 983 |
+
UAA ACC
|
| 984 |
+
AU AUCC
|
| 985 |
+
UU AUUC
|
| 986 |
+
UAC AGAGGG
|
| 987 |
+
UUC GAA
|
| 988 |
+
UU GAAC
|
| 989 |
+
AG UAAC
|
| 990 |
+
AGC GGC
|
| 991 |
+
UCC UCC
|
| 992 |
+
AGC UCG
|
| 993 |
+
UUCGAAGC AACGCGAAGAACCUUACC
|
| 994 |
+
U AUCCC
|
| 995 |
+
GCGUUG UCCGGAA
|
| 996 |
+
UGG CCC
|
| 997 |
+
AG UACG
|
| 998 |
+
ACGGCC UUCGGGUUGUAA
|
| 999 |
+
AAG ACC
|
| 1000 |
+
UAUUGG GCGUAA
|
| 1001 |
+
AA GAA
|
| 1002 |
+
UU UAAG
|
| 1003 |
+
UUCGGAA UUACUGGGCGUAA
|
| 1004 |
+
UGAG AUAC
|
| 1005 |
+
UC UUGC
|
| 1006 |
+
AG UUAA
|
tokenizer/special_tokens_map.json
ADDED
|
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": "<|endoftext|>",
|
| 3 |
+
"eos_token": "<|endoftext|>",
|
| 4 |
+
"unk_token": "<|endoftext|>"
|
| 5 |
+
}
|
tokenizer/tokenizer.json
ADDED
|
@@ -0,0 +1,2078 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"version": "1.0",
|
| 3 |
+
"truncation": null,
|
| 4 |
+
"padding": null,
|
| 5 |
+
"added_tokens": [
|
| 6 |
+
{
|
| 7 |
+
"id": 0,
|
| 8 |
+
"content": "<|endoftext|>",
|
| 9 |
+
"single_word": false,
|
| 10 |
+
"lstrip": false,
|
| 11 |
+
"rstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"special": true
|
| 14 |
+
}
|
| 15 |
+
],
|
| 16 |
+
"normalizer": null,
|
| 17 |
+
"pre_tokenizer": {
|
| 18 |
+
"type": "ByteLevel",
|
| 19 |
+
"add_prefix_space": true,
|
| 20 |
+
"trim_offsets": true,
|
| 21 |
+
"use_regex": true
|
| 22 |
+
},
|
| 23 |
+
"post_processor": {
|
| 24 |
+
"type": "ByteLevel",
|
| 25 |
+
"add_prefix_space": true,
|
| 26 |
+
"trim_offsets": true,
|
| 27 |
+
"use_regex": true
|
| 28 |
+
},
|
| 29 |
+
"decoder": {
|
| 30 |
+
"type": "ByteLevel",
|
| 31 |
+
"add_prefix_space": true,
|
| 32 |
+
"trim_offsets": true,
|
| 33 |
+
"use_regex": true
|
| 34 |
+
},
|
| 35 |
+
"model": {
|
| 36 |
+
"type": "BPE",
|
| 37 |
+
"dropout": null,
|
| 38 |
+
"unk_token": null,
|
| 39 |
+
"continuing_subword_prefix": null,
|
| 40 |
+
"end_of_word_suffix": null,
|
| 41 |
+
"fuse_unk": false,
|
| 42 |
+
"byte_fallback": false,
|
| 43 |
+
"ignore_merges": false,
|
| 44 |
+
"vocab": {
|
| 45 |
+
"<|endoftext|>": 0,
|
| 46 |
+
"A": 1,
|
| 47 |
+
"B": 2,
|
| 48 |
+
"C": 3,
|
| 49 |
+
"D": 4,
|
| 50 |
+
"G": 5,
|
| 51 |
+
"H": 6,
|
| 52 |
+
"K": 7,
|
| 53 |
+
"M": 8,
|
| 54 |
+
"N": 9,
|
| 55 |
+
"R": 10,
|
| 56 |
+
"S": 11,
|
| 57 |
+
"U": 12,
|
| 58 |
+
"V": 13,
|
| 59 |
+
"W": 14,
|
| 60 |
+
"X": 15,
|
| 61 |
+
"Y": 16,
|
| 62 |
+
"Ċ": 17,
|
| 63 |
+
"Ġ": 18,
|
| 64 |
+
"GG": 19,
|
| 65 |
+
"AA": 20,
|
| 66 |
+
"UU": 21,
|
| 67 |
+
"CC": 22,
|
| 68 |
+
"AG": 23,
|
| 69 |
+
"UG": 24,
|
| 70 |
+
"AC": 25,
|
| 71 |
+
"UC": 26,
|
| 72 |
+
"UGG": 27,
|
| 73 |
+
"GC": 28,
|
| 74 |
+
"AGG": 29,
|
| 75 |
+
"UAA": 30,
|
| 76 |
+
"AGC": 31,
|
| 77 |
+
"AUU": 32,
|
| 78 |
+
"ACC": 33,
|
| 79 |
+
"AUG": 34,
|
| 80 |
+
"UCC": 35,
|
| 81 |
+
"GAA": 36,
|
| 82 |
+
"UAC": 37,
|
| 83 |
+
"UGC": 38,
|
| 84 |
+
"AUC": 39,
|
| 85 |
+
"UAG": 40,
|
| 86 |
+
"UUC": 41,
|
| 87 |
+
"AAC": 42,
|
| 88 |
+
"GGC": 43,
|
| 89 |
+
"UUG": 44,
|
| 90 |
+
"AAG": 45,
|
| 91 |
+
"GGG": 46,
|
| 92 |
+
"CCC": 47,
|
| 93 |
+
"AU": 48,
|
| 94 |
+
"UGAA": 49,
|
| 95 |
+
"ACG": 50,
|
| 96 |
+
"AUGG": 51,
|
| 97 |
+
"UAAC": 52,
|
| 98 |
+
"GCG": 53,
|
| 99 |
+
"UCG": 54,
|
| 100 |
+
"AGGC": 55,
|
| 101 |
+
"UGAG": 56,
|
| 102 |
+
"UGGC": 57,
|
| 103 |
+
"AUGC": 58,
|
| 104 |
+
"AGCC": 59,
|
| 105 |
+
"UGCC": 60,
|
| 106 |
+
"AUCC": 61,
|
| 107 |
+
"GGAA": 62,
|
| 108 |
+
"AUAA": 63,
|
| 109 |
+
"UACC": 64,
|
| 110 |
+
"UUUU": 65,
|
| 111 |
+
"ACGG": 66,
|
| 112 |
+
"AGGG": 67,
|
| 113 |
+
"UAUU": 68,
|
| 114 |
+
"AGAA": 69,
|
| 115 |
+
"UUGG": 70,
|
| 116 |
+
"GCC": 71,
|
| 117 |
+
"UAGC": 72,
|
| 118 |
+
"UCAA": 73,
|
| 119 |
+
"UUAA": 74,
|
| 120 |
+
"GAAC": 75,
|
| 121 |
+
"ACAA": 76,
|
| 122 |
+
"UAGG": 77,
|
| 123 |
+
"UGGG": 78,
|
| 124 |
+
"ACCC": 79,
|
| 125 |
+
"UGGGG": 80,
|
| 126 |
+
"UGAC": 81,
|
| 127 |
+
"AUAC": 82,
|
| 128 |
+
"GCGG": 83,
|
| 129 |
+
"AGGAA": 84,
|
| 130 |
+
"UUCC": 85,
|
| 131 |
+
"AGCG": 86,
|
| 132 |
+
"UCCC": 87,
|
| 133 |
+
"GCAA": 88,
|
| 134 |
+
"AGAC": 89,
|
| 135 |
+
"GGCC": 90,
|
| 136 |
+
"AUUC": 91,
|
| 137 |
+
"UUUC": 92,
|
| 138 |
+
"UUGC": 93,
|
| 139 |
+
"AAAA": 94,
|
| 140 |
+
"AGAG": 95,
|
| 141 |
+
"CCG": 96,
|
| 142 |
+
"UACG": 97,
|
| 143 |
+
"ACAC": 98,
|
| 144 |
+
"AUAG": 99,
|
| 145 |
+
"GGGG": 100,
|
| 146 |
+
"UGUC": 101,
|
| 147 |
+
"UAAG": 102,
|
| 148 |
+
"UAUC": 103,
|
| 149 |
+
"UUUG": 104,
|
| 150 |
+
"AGUC": 105,
|
| 151 |
+
"AUUG": 106,
|
| 152 |
+
"GGCG": 107,
|
| 153 |
+
"AAAC": 108,
|
| 154 |
+
"AAGUC": 109,
|
| 155 |
+
"AUGAA": 110,
|
| 156 |
+
"UGUG": 111,
|
| 157 |
+
"UCUC": 112,
|
| 158 |
+
"UGGAA": 113,
|
| 159 |
+
"ACCG": 114,
|
| 160 |
+
"AGUG": 115,
|
| 161 |
+
"UGGGC": 116,
|
| 162 |
+
"UUAC": 117,
|
| 163 |
+
"UCGC": 118,
|
| 164 |
+
"UUCGG": 119,
|
| 165 |
+
"UGCG": 120,
|
| 166 |
+
"UAUG": 121,
|
| 167 |
+
"UUCG": 122,
|
| 168 |
+
"UUUAA": 123,
|
| 169 |
+
"UCGG": 124,
|
| 170 |
+
"UUAG": 125,
|
| 171 |
+
"UCUG": 126,
|
| 172 |
+
"UCCG": 127,
|
| 173 |
+
"AACG": 128,
|
| 174 |
+
"GAAG": 129,
|
| 175 |
+
"AGUGG": 130,
|
| 176 |
+
"UCAC": 131,
|
| 177 |
+
"AUAAC": 132,
|
| 178 |
+
"UGAGG": 133,
|
| 179 |
+
"AUGGC": 134,
|
| 180 |
+
"AGAGG": 135,
|
| 181 |
+
"AGAU": 136,
|
| 182 |
+
"AUGCC": 137,
|
| 183 |
+
"ACCAA": 138,
|
| 184 |
+
"UAGGC": 139,
|
| 185 |
+
"GGGC": 140,
|
| 186 |
+
"AUUAA": 141,
|
| 187 |
+
"GGUGAA": 142,
|
| 188 |
+
"UACGGG": 143,
|
| 189 |
+
"AUCG": 144,
|
| 190 |
+
"AAGCC": 145,
|
| 191 |
+
"UUGAA": 146,
|
| 192 |
+
"UAU": 147,
|
| 193 |
+
"UACAC": 148,
|
| 194 |
+
"GCGAA": 149,
|
| 195 |
+
"CCUU": 150,
|
| 196 |
+
"CCCG": 151,
|
| 197 |
+
"AUGCG": 152,
|
| 198 |
+
"ACUC": 153,
|
| 199 |
+
"UGUU": 154,
|
| 200 |
+
"GGCUAAC": 155,
|
| 201 |
+
"AAGG": 156,
|
| 202 |
+
"UCAG": 157,
|
| 203 |
+
"ACGC": 158,
|
| 204 |
+
"UGUAGC": 159,
|
| 205 |
+
"UGACGC": 160,
|
| 206 |
+
"UGAGAC": 161,
|
| 207 |
+
"UUCCC": 162,
|
| 208 |
+
"GCGUAA": 163,
|
| 209 |
+
"AGCAGCC": 164,
|
| 210 |
+
"AUGGG": 165,
|
| 211 |
+
"AGGCAGC": 166,
|
| 212 |
+
"AGUGGC": 167,
|
| 213 |
+
"AGGGC": 168,
|
| 214 |
+
"UACAA": 169,
|
| 215 |
+
"UCAGC": 170,
|
| 216 |
+
"AUUGG": 171,
|
| 217 |
+
"GAAGGC": 172,
|
| 218 |
+
"GCGGUAA": 173,
|
| 219 |
+
"ACGAA": 174,
|
| 220 |
+
"UUAAG": 175,
|
| 221 |
+
"UGCCAGCAGCC": 176,
|
| 222 |
+
"CCCC": 177,
|
| 223 |
+
"UGUCG": 178,
|
| 224 |
+
"UUGGG": 179,
|
| 225 |
+
"UGCAA": 180,
|
| 226 |
+
"AGCAA": 181,
|
| 227 |
+
"AUCCC": 182,
|
| 228 |
+
"UACGGGAGGCAGC": 183,
|
| 229 |
+
"ACGGG": 184,
|
| 230 |
+
"UUAAC": 185,
|
| 231 |
+
"UUCGGG": 186,
|
| 232 |
+
"ACUG": 187,
|
| 233 |
+
"UUGCC": 188,
|
| 234 |
+
"ACCGG": 189,
|
| 235 |
+
"UAGAG": 190,
|
| 236 |
+
"UUGUAA": 191,
|
| 237 |
+
"UAGUCC": 192,
|
| 238 |
+
"AGGAUU": 193,
|
| 239 |
+
"UAAGG": 194,
|
| 240 |
+
"UGCCAGCAGCCGCGGUAA": 195,
|
| 241 |
+
"UCCUACGGGAGGCAGC": 196,
|
| 242 |
+
"AGGGG": 197,
|
| 243 |
+
"GCACAA": 198,
|
| 244 |
+
"AUAUU": 199,
|
| 245 |
+
"AUAUC": 200,
|
| 246 |
+
"AGUU": 201,
|
| 247 |
+
"UAAUACC": 202,
|
| 248 |
+
"UAAAA": 203,
|
| 249 |
+
"UACGG": 204,
|
| 250 |
+
"AGGAAC": 205,
|
| 251 |
+
"UGCCC": 206,
|
| 252 |
+
"UUGAC": 207,
|
| 253 |
+
"GAAGC": 208,
|
| 254 |
+
"UGGCC": 209,
|
| 255 |
+
"UCUU": 210,
|
| 256 |
+
"UAGGG": 211,
|
| 257 |
+
"AGCCC": 212,
|
| 258 |
+
"UGAGACACGG": 213,
|
| 259 |
+
"AUUAGC": 214,
|
| 260 |
+
"AUAAG": 215,
|
| 261 |
+
"GCUGGC": 216,
|
| 262 |
+
"AGGCC": 217,
|
| 263 |
+
"ACUU": 218,
|
| 264 |
+
"AGCGUGGGG": 219,
|
| 265 |
+
"AGCAAAC": 220,
|
| 266 |
+
"ACCCC": 221,
|
| 267 |
+
"AGGAAGG": 222,
|
| 268 |
+
"UAACC": 223,
|
| 269 |
+
"UUGACGG": 224,
|
| 270 |
+
"AGGAUUAGAU": 225,
|
| 271 |
+
"ACAG": 226,
|
| 272 |
+
"AGACUCCUACGGGAGGCAGC": 227,
|
| 273 |
+
"UGGUC": 228,
|
| 274 |
+
"GGCGG": 229,
|
| 275 |
+
"GCGC": 230,
|
| 276 |
+
"UACCC": 231,
|
| 277 |
+
"UGGAGC": 232,
|
| 278 |
+
"AUGUGG": 233,
|
| 279 |
+
"AGUGGGGAA": 234,
|
| 280 |
+
"UGUAGCGGUGAA": 235,
|
| 281 |
+
"GGGCC": 236,
|
| 282 |
+
"UAGUAA": 237,
|
| 283 |
+
"UCCGG": 238,
|
| 284 |
+
"NN": 239,
|
| 285 |
+
"ĠG": 240,
|
| 286 |
+
"UGAAG": 241,
|
| 287 |
+
"UAGCC": 242,
|
| 288 |
+
"ACAUGC": 243,
|
| 289 |
+
"UCAAC": 244,
|
| 290 |
+
"AGUAC": 245,
|
| 291 |
+
"AGGAUG": 246,
|
| 292 |
+
"AGGAUUAGAUACCC": 247,
|
| 293 |
+
"AGUGC": 248,
|
| 294 |
+
"UAUGG": 249,
|
| 295 |
+
"ACGCC": 250,
|
| 296 |
+
"UAGUUGG": 251,
|
| 297 |
+
"UGUAA": 252,
|
| 298 |
+
"AACC": 253,
|
| 299 |
+
"ACUGC": 254,
|
| 300 |
+
"UAUUGG": 255,
|
| 301 |
+
"UGGGCGUAA": 256,
|
| 302 |
+
"UUUUC": 257,
|
| 303 |
+
"UGAGUAAC": 258,
|
| 304 |
+
"UGCUGC": 259,
|
| 305 |
+
"UAGAA": 260,
|
| 306 |
+
"AUUCC": 261,
|
| 307 |
+
"UAAGC": 262,
|
| 308 |
+
"UAUAA": 263,
|
| 309 |
+
"ACGUC": 264,
|
| 310 |
+
"AAGC": 265,
|
| 311 |
+
"AGAAG": 266,
|
| 312 |
+
"AGCGCAA": 267,
|
| 313 |
+
"UGACGG": 268,
|
| 314 |
+
"AGCGC": 269,
|
| 315 |
+
"UUUUG": 270,
|
| 316 |
+
"UGCAAC": 271,
|
| 317 |
+
"GGUG": 272,
|
| 318 |
+
"UCAGCUCG": 273,
|
| 319 |
+
"UGGUAGUCC": 274,
|
| 320 |
+
"UUUCC": 275,
|
| 321 |
+
"AGCGG": 276,
|
| 322 |
+
"AGAAC": 277,
|
| 323 |
+
"UGAAC": 278,
|
| 324 |
+
"UGGAAC": 279,
|
| 325 |
+
"UUCAA": 280,
|
| 326 |
+
"AGAUU": 281,
|
| 327 |
+
"ACUCC": 282,
|
| 328 |
+
"AGAUG": 283,
|
| 329 |
+
"UUAUU": 284,
|
| 330 |
+
"UGGGAA": 285,
|
| 331 |
+
"AGAGC": 286,
|
| 332 |
+
"AUCAA": 287,
|
| 333 |
+
"GGCUAACUACG": 288,
|
| 334 |
+
"AGCAAC": 289,
|
| 335 |
+
"AGCGUGGGGAGCAAAC": 290,
|
| 336 |
+
"AGGAUUAGAUACCCUGGUAGUCC": 291,
|
| 337 |
+
"ACAUU": 292,
|
| 338 |
+
"UAAACG": 293,
|
| 339 |
+
"UGAGGC": 294,
|
| 340 |
+
"UGUGAA": 295,
|
| 341 |
+
"GAAGG": 296,
|
| 342 |
+
"AUGCGUAG": 297,
|
| 343 |
+
"UUGGC": 298,
|
| 344 |
+
"UAGGGG": 299,
|
| 345 |
+
"AGUGAA": 300,
|
| 346 |
+
"AGGGAA": 301,
|
| 347 |
+
"UGAUC": 302,
|
| 348 |
+
"UGGGAC": 303,
|
| 349 |
+
"UUAAGUCCC": 304,
|
| 350 |
+
"ACCGCCCG": 305,
|
| 351 |
+
"GAACGCUGGC": 306,
|
| 352 |
+
"AAGUCGAAC": 307,
|
| 353 |
+
"AGCGAA": 308,
|
| 354 |
+
"AGCUC": 309,
|
| 355 |
+
"UCAAAGGAA": 310,
|
| 356 |
+
"UCAACC": 311,
|
| 357 |
+
"GCCUGGGG": 312,
|
| 358 |
+
"CCCUU": 313,
|
| 359 |
+
"UCCCC": 314,
|
| 360 |
+
"UGCCG": 315,
|
| 361 |
+
"UGAUCC": 316,
|
| 362 |
+
"UGAGAUG": 317,
|
| 363 |
+
"UUACC": 318,
|
| 364 |
+
"AGACUCCUACGGGAGGCAGCAGUGGGGAA": 319,
|
| 365 |
+
"UCGCC": 320,
|
| 366 |
+
"GGGAC": 321,
|
| 367 |
+
"AGGCG": 322,
|
| 368 |
+
"AGGAAGGUGGGG": 323,
|
| 369 |
+
"GGGCCC": 324,
|
| 370 |
+
"UAUUC": 325,
|
| 371 |
+
"UACGUUCCC": 326,
|
| 372 |
+
"UCAAAGGAAUUGACGG": 327,
|
| 373 |
+
"AUACC": 328,
|
| 374 |
+
"UGAGACACGGCCC": 329,
|
| 375 |
+
"AUAGC": 330,
|
| 376 |
+
"UCAUU": 331,
|
| 377 |
+
"UACACACCGCCCG": 332,
|
| 378 |
+
"UCGAA": 333,
|
| 379 |
+
"AUAGG": 334,
|
| 380 |
+
"AUCGG": 335,
|
| 381 |
+
"UUUGG": 336,
|
| 382 |
+
"UGAUGC": 337,
|
| 383 |
+
"UGCGAA": 338,
|
| 384 |
+
"UAGAGG": 339,
|
| 385 |
+
"GCACAAGCGG": 340,
|
| 386 |
+
"AAGUCG": 341,
|
| 387 |
+
"UGGCG": 342,
|
| 388 |
+
"UCGGAA": 343,
|
| 389 |
+
"GGCGACG": 344,
|
| 390 |
+
"UGAUG": 345,
|
| 391 |
+
"UAGCG": 346,
|
| 392 |
+
"AUACG": 347,
|
| 393 |
+
"AACGAGCGCAA": 348,
|
| 394 |
+
"UCAGCUCGUGUCG": 349,
|
| 395 |
+
"CCUUACC": 350,
|
| 396 |
+
"UUGGGUUAAGUCCC": 351,
|
| 397 |
+
"ACGUGC": 352,
|
| 398 |
+
"ACUGG": 353,
|
| 399 |
+
"AGUAA": 354,
|
| 400 |
+
"GCAAGG": 355,
|
| 401 |
+
"UGUGG": 356,
|
| 402 |
+
"UCAGCUCGUGUCGUGAGAUG": 357,
|
| 403 |
+
"UAUCC": 358,
|
| 404 |
+
"AGUUC": 359,
|
| 405 |
+
"AGACC": 360,
|
| 406 |
+
"ACCAGUGGC": 361,
|
| 407 |
+
"AUAUG": 362,
|
| 408 |
+
"UCAGG": 363,
|
| 409 |
+
"UCUUC": 364,
|
| 410 |
+
"GCAACGAGCGCAA": 365,
|
| 411 |
+
"UUACUGGGCGUAA": 366,
|
| 412 |
+
"UGAUU": 367,
|
| 413 |
+
"UUAUCC": 368,
|
| 414 |
+
"UGACC": 369,
|
| 415 |
+
"UCAUC": 370,
|
| 416 |
+
"UAUGC": 371,
|
| 417 |
+
"UAGUC": 372,
|
| 418 |
+
"GCCG": 373,
|
| 419 |
+
"AUCAGC": 374,
|
| 420 |
+
"AUUCG": 375,
|
| 421 |
+
"UAAUACCGC": 376,
|
| 422 |
+
"UGGGGG": 377,
|
| 423 |
+
"AACGCGAA": 378,
|
| 424 |
+
"ACAGG": 379,
|
| 425 |
+
"UGCGG": 380,
|
| 426 |
+
"GGCUAACUCCG": 381,
|
| 427 |
+
"AUGUGGUUUAA": 382,
|
| 428 |
+
"AGGAAGGUGGGGAUG": 383,
|
| 429 |
+
"GCCGCG": 384,
|
| 430 |
+
"UCGCUAGUAA": 385,
|
| 431 |
+
"UGAAAC": 386,
|
| 432 |
+
"ACGGC": 387,
|
| 433 |
+
"UUGUACACACCGCCCG": 388,
|
| 434 |
+
"UGGAAUUCC": 389,
|
| 435 |
+
"UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCC": 390,
|
| 436 |
+
"GAAAGCC": 391,
|
| 437 |
+
"AUUGC": 392,
|
| 438 |
+
"UGGUCUGAG": 393,
|
| 439 |
+
"UCGGC": 394,
|
| 440 |
+
"UCCAA": 395,
|
| 441 |
+
"AUUAGCUAGUUGG": 396,
|
| 442 |
+
"UAGGCGG": 397,
|
| 443 |
+
"AGUUG": 398,
|
| 444 |
+
"GAACGGG": 399,
|
| 445 |
+
"UCACC": 400,
|
| 446 |
+
"UAAAAC": 401,
|
| 447 |
+
"UCUGG": 402,
|
| 448 |
+
"UAUUG": 403,
|
| 449 |
+
"UUCGGGUUGUAA": 404,
|
| 450 |
+
"ACUUC": 405,
|
| 451 |
+
"ACGUGCUACAA": 406,
|
| 452 |
+
"GAAAA": 407,
|
| 453 |
+
"ĠC": 408,
|
| 454 |
+
"UCUGC": 409,
|
| 455 |
+
"UUUGC": 410,
|
| 456 |
+
"UACCG": 411,
|
| 457 |
+
"UGCAACUCG": 412,
|
| 458 |
+
"AUGGCUGUCG": 413,
|
| 459 |
+
"UUGUUGG": 414,
|
| 460 |
+
"UGUGC": 415,
|
| 461 |
+
"AACGCGAAGAA": 416,
|
| 462 |
+
"UGUUC": 417,
|
| 463 |
+
"AGAGGG": 418,
|
| 464 |
+
"AUCCG": 419,
|
| 465 |
+
"GCGUUG": 420,
|
| 466 |
+
"AACAA": 421,
|
| 467 |
+
"UUGGAA": 422,
|
| 468 |
+
"AUAU": 423,
|
| 469 |
+
"UCUCC": 424,
|
| 470 |
+
"AGAUC": 425,
|
| 471 |
+
"ACGCCG": 426,
|
| 472 |
+
"UUAACC": 427,
|
| 473 |
+
"AGGCGG": 428,
|
| 474 |
+
"ACAUGCAAGUCGAAC": 429,
|
| 475 |
+
"UGGUGC": 430,
|
| 476 |
+
"UAAUAC": 431,
|
| 477 |
+
"UACCAA": 432,
|
| 478 |
+
"GGCCC": 433,
|
| 479 |
+
"AGCAC": 434,
|
| 480 |
+
"UGAACC": 435,
|
| 481 |
+
"ACACUGGGAC": 436,
|
| 482 |
+
"AUCAGG": 437,
|
| 483 |
+
"UGAGUAACACG": 438,
|
| 484 |
+
"GCGUG": 439,
|
| 485 |
+
"UAUAC": 440,
|
| 486 |
+
"UUGUC": 441,
|
| 487 |
+
"GAAUC": 442,
|
| 488 |
+
"UUAGC": 443,
|
| 489 |
+
"UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCCGCAACGAGCGCAA": 444,
|
| 490 |
+
"AGCAACGCCGCG": 445,
|
| 491 |
+
"AGUAGG": 446,
|
| 492 |
+
"UAACG": 447,
|
| 493 |
+
"GCACAAGCGGUGGAGC": 448,
|
| 494 |
+
"UUUAG": 449,
|
| 495 |
+
"AGGGGG": 450,
|
| 496 |
+
"UACACACGUGCUACAA": 451,
|
| 497 |
+
"GGCGC": 452,
|
| 498 |
+
"UGAGAGGG": 453,
|
| 499 |
+
"UGCGC": 454,
|
| 500 |
+
"AGCCG": 455,
|
| 501 |
+
"UGAAUACGUUCCC": 456,
|
| 502 |
+
"UUUAC": 457,
|
| 503 |
+
"NNNN": 458,
|
| 504 |
+
"GGCUAACUCCGUGCCAGCAGCCGCGGUAA": 459,
|
| 505 |
+
"AUGGAA": 460,
|
| 506 |
+
"UGGGCGC": 461,
|
| 507 |
+
"UGGGCGAAAGCC": 462,
|
| 508 |
+
"UAUAG": 463,
|
| 509 |
+
"GAAGGCC": 464,
|
| 510 |
+
"GGCAGC": 465,
|
| 511 |
+
"AUCGC": 466,
|
| 512 |
+
"UGUUG": 467,
|
| 513 |
+
"ACCCG": 468,
|
| 514 |
+
"GGCUAACUACGUGCCAGCAGCCGCGGUAA": 469,
|
| 515 |
+
"AGUCC": 470,
|
| 516 |
+
"AUCAGCC": 471,
|
| 517 |
+
"UGUCC": 472,
|
| 518 |
+
"UCAAAGGAAUUGACGGGGGCCC": 473,
|
| 519 |
+
"UGACGCUGAGGC": 474,
|
| 520 |
+
"UGAGC": 475,
|
| 521 |
+
"UUCCG": 476,
|
| 522 |
+
"AAGAC": 477,
|
| 523 |
+
"GAACG": 478,
|
| 524 |
+
"AACGCGAAGAACCUUACC": 479,
|
| 525 |
+
"UGGCGAAGGC": 480,
|
| 526 |
+
"AACGC": 481,
|
| 527 |
+
"GGAUU": 482,
|
| 528 |
+
"ACACUGGGACUGAGACACGGCCC": 483,
|
| 529 |
+
"AGCCAUGCC": 484,
|
| 530 |
+
"AUGAC": 485,
|
| 531 |
+
"GCACAAGCGGUGGAGCAUGUGGUUUAA": 486,
|
| 532 |
+
"GCGCC": 487,
|
| 533 |
+
"UGAUGG": 488,
|
| 534 |
+
"UGCUGCAUGGCUGUCG": 489,
|
| 535 |
+
"AGGUC": 490,
|
| 536 |
+
"AUGUC": 491,
|
| 537 |
+
"GCCCC": 492,
|
| 538 |
+
"UGACG": 493,
|
| 539 |
+
"GGGCCUUGUACACACCGCCCG": 494,
|
| 540 |
+
"ACCUC": 495,
|
| 541 |
+
"GGGGC": 496,
|
| 542 |
+
"UCACACC": 497,
|
| 543 |
+
"AUUGGGCGUAA": 498,
|
| 544 |
+
"UAACAAGG": 499,
|
| 545 |
+
"UUAAAA": 500,
|
| 546 |
+
"ACCGC": 501,
|
| 547 |
+
"UGUAGCGGUGAAAUGCGUAG": 502,
|
| 548 |
+
"UUGGGC": 503,
|
| 549 |
+
"UAACGGC": 504,
|
| 550 |
+
"ACGCCGUAAACG": 505,
|
| 551 |
+
"GAAAC": 506,
|
| 552 |
+
"AGCUAAC": 507,
|
| 553 |
+
"AUAAAA": 508,
|
| 554 |
+
"AGCGUGGGGAGCAAACAGGAUUAGAUACCCUGGUAGUCC": 509,
|
| 555 |
+
"AGCGAAC": 510,
|
| 556 |
+
"UCCUC": 511,
|
| 557 |
+
"AGAAAA": 512,
|
| 558 |
+
"UGAAGG": 513,
|
| 559 |
+
"UAUUGCACAA": 514,
|
| 560 |
+
"UGGGCGCAAGCC": 515,
|
| 561 |
+
"UUUUGG": 516,
|
| 562 |
+
"UGGUCUGAGAGGAUG": 517,
|
| 563 |
+
"AUCAG": 518,
|
| 564 |
+
"ACCAAGGCGACG": 519,
|
| 565 |
+
"GAACGCUGGCGGC": 520,
|
| 566 |
+
"GGCUAACUACGUGCCAGCAGCCGCGGUAAUACG": 521,
|
| 567 |
+
"UGAGACACGGUCC": 522,
|
| 568 |
+
"AGAAGC": 523,
|
| 569 |
+
"UCCCG": 524,
|
| 570 |
+
"UUCGGAA": 525,
|
| 571 |
+
"ACGGCC": 526,
|
| 572 |
+
"UAUGAA": 527,
|
| 573 |
+
"UGACGCUGAGG": 528,
|
| 574 |
+
"AUCAUU": 529,
|
| 575 |
+
"ACCAGUGGCGAAGGC": 530,
|
| 576 |
+
"ACCAAGGC": 531,
|
| 577 |
+
"UA": 532,
|
| 578 |
+
"UUUGAC": 533,
|
| 579 |
+
"ACAAC": 534,
|
| 580 |
+
"AUGUGAA": 535,
|
| 581 |
+
"UGUAGCGGUGAAAUGC": 536,
|
| 582 |
+
"UGUAG": 537,
|
| 583 |
+
"UGGGAAC": 538,
|
| 584 |
+
"AUCAUC": 539,
|
| 585 |
+
"GGCCG": 540,
|
| 586 |
+
"UAAUC": 541,
|
| 587 |
+
"GGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG": 542,
|
| 588 |
+
"UAAAGC": 543,
|
| 589 |
+
"UGGCUC": 544,
|
| 590 |
+
"AGACUGCC": 545,
|
| 591 |
+
"UGUAC": 546,
|
| 592 |
+
"UUGAG": 547,
|
| 593 |
+
"GGUC": 548,
|
| 594 |
+
"ACACUGGAAC": 549,
|
| 595 |
+
"UAAUACCGG": 550,
|
| 596 |
+
"UCCGGAA": 551,
|
| 597 |
+
"UUAAUCGGAA": 552,
|
| 598 |
+
"GCCUGGGGAGUAC": 553,
|
| 599 |
+
"AUAACC": 554,
|
| 600 |
+
"AGUCG": 555,
|
| 601 |
+
"AUGGGC": 556,
|
| 602 |
+
"GGGUC": 557,
|
| 603 |
+
"AGUUCGG": 558,
|
| 604 |
+
"AGGAAGGUGGGGAUGACGUC": 559,
|
| 605 |
+
"UGAGAA": 560,
|
| 606 |
+
"AUCCCC": 561,
|
| 607 |
+
"GCGGUGAAUACGUUCCC": 562,
|
| 608 |
+
"UGGAGG": 563,
|
| 609 |
+
"AGAGUUUG": 564,
|
| 610 |
+
"UGCAAGCG": 565,
|
| 611 |
+
"UUUAUU": 566,
|
| 612 |
+
"UGGAC": 567,
|
| 613 |
+
"UGAGUAA": 568,
|
| 614 |
+
"GAAGCACC": 569,
|
| 615 |
+
"AGCCAUGCCGCG": 570,
|
| 616 |
+
"GGCAA": 571,
|
| 617 |
+
"UUGUCG": 572,
|
| 618 |
+
"UAUUGGACAA": 573,
|
| 619 |
+
"UUGGGG": 574,
|
| 620 |
+
"AUCUC": 575,
|
| 621 |
+
"GAAAGC": 576,
|
| 622 |
+
"UGAAAA": 577,
|
| 623 |
+
"ACAGC": 578,
|
| 624 |
+
"UGAUGAA": 579,
|
| 625 |
+
"GCCUGGGGAGUACGGCC": 580,
|
| 626 |
+
"GAACC": 581,
|
| 627 |
+
"UGGGCC": 582,
|
| 628 |
+
"AGAGAA": 583,
|
| 629 |
+
"AUGGGG": 584,
|
| 630 |
+
"AGGCCC": 585,
|
| 631 |
+
"AUAACG": 586,
|
| 632 |
+
"AUGCGUAGAG": 587,
|
| 633 |
+
"GAAGGCG": 588,
|
| 634 |
+
"UCGGG": 589,
|
| 635 |
+
"UGGCAA": 590,
|
| 636 |
+
"AGCCCC": 591,
|
| 637 |
+
"UCGCGG": 592,
|
| 638 |
+
"GGACGGG": 593,
|
| 639 |
+
"UCGUAACAAGG": 594,
|
| 640 |
+
"AGCUUGC": 595,
|
| 641 |
+
"UUUUAA": 596,
|
| 642 |
+
"AGCGACGCC": 597,
|
| 643 |
+
"UUAAUCGGAAUUACUGGGCGUAA": 598,
|
| 644 |
+
"GGAAGG": 599,
|
| 645 |
+
"ACAUC": 600,
|
| 646 |
+
"UGAGUAACGCG": 601,
|
| 647 |
+
"UUAUG": 602,
|
| 648 |
+
"GCCUGGGGAG": 603,
|
| 649 |
+
"UAGCCG": 604,
|
| 650 |
+
"UGGGGUAA": 605,
|
| 651 |
+
"UUCGAUGC": 606,
|
| 652 |
+
"CCCUUG": 607,
|
| 653 |
+
"CCCGG": 608,
|
| 654 |
+
"UUUGAA": 609,
|
| 655 |
+
"GCAAGGC": 610,
|
| 656 |
+
"AUGGCCCUU": 611,
|
| 657 |
+
"AUUUC": 612,
|
| 658 |
+
"AGGAC": 613,
|
| 659 |
+
"GAACGCUGGCGGCG": 614,
|
| 660 |
+
"GGCGGACGGG": 615,
|
| 661 |
+
"UUAAGC": 616,
|
| 662 |
+
"UAUGGG": 617,
|
| 663 |
+
"UUAUC": 618,
|
| 664 |
+
"AUAUUC": 619,
|
| 665 |
+
"UGGAG": 620,
|
| 666 |
+
"AAGUCAUC": 621,
|
| 667 |
+
"UGGGGC": 622,
|
| 668 |
+
"AGUCUGCAACUCG": 623,
|
| 669 |
+
"ACCCGC": 624,
|
| 670 |
+
"AGAUGG": 625,
|
| 671 |
+
"GGAAUCGCUAGUAA": 626,
|
| 672 |
+
"UUCUC": 627,
|
| 673 |
+
"AUUAAG": 628,
|
| 674 |
+
"ACGUCAA": 629,
|
| 675 |
+
"CCAA": 630,
|
| 676 |
+
"UUUUGC": 631,
|
| 677 |
+
"UCAAAA": 632,
|
| 678 |
+
"AUGAAG": 633,
|
| 679 |
+
"AUGAAC": 634,
|
| 680 |
+
"AGUAG": 635,
|
| 681 |
+
"ACACC": 636,
|
| 682 |
+
"UGCUUAAC": 637,
|
| 683 |
+
"ACACUGGAACUGAGACACGGUCC": 638,
|
| 684 |
+
"ACACUGGGACUGAGACACGGCCCAGACUCCUACGGGAGGCAGCAGUGGGGAA": 639,
|
| 685 |
+
"ACUGGG": 640,
|
| 686 |
+
"UAUCAGC": 641,
|
| 687 |
+
"UGGUGCAUGG": 642,
|
| 688 |
+
"ACAUGCAAGUCG": 643,
|
| 689 |
+
"UACGAA": 644,
|
| 690 |
+
"UUAUUGGGCGUAA": 645,
|
| 691 |
+
"CCCAA": 646,
|
| 692 |
+
"AUGAUU": 647,
|
| 693 |
+
"AACGG": 648,
|
| 694 |
+
"UUUCG": 649,
|
| 695 |
+
"ACUUG": 650,
|
| 696 |
+
"AGGAGG": 651,
|
| 697 |
+
"AAAAAA": 652,
|
| 698 |
+
"UUGAAAC": 653,
|
| 699 |
+
"GGGCCUUGUACACACCGCCCGUCACACC": 654,
|
| 700 |
+
"AGGGUGCG": 655,
|
| 701 |
+
"UAAGCACC": 656,
|
| 702 |
+
"UGCGGC": 657,
|
| 703 |
+
"UGGCGC": 658,
|
| 704 |
+
"UGCAUU": 659,
|
| 705 |
+
"UUUUCC": 660,
|
| 706 |
+
"UCCCAA": 661,
|
| 707 |
+
"UUAGG": 662,
|
| 708 |
+
"AGCGUUG": 663,
|
| 709 |
+
"UGAAGAAGGCC": 664,
|
| 710 |
+
"UCCGC": 665,
|
| 711 |
+
"UUUGGG": 666,
|
| 712 |
+
"UUCGGGG": 667,
|
| 713 |
+
"ĠAGAGUUUG": 668,
|
| 714 |
+
"UUAUCCGGAUU": 669,
|
| 715 |
+
"UGUUGG": 670,
|
| 716 |
+
"UAGGAA": 671,
|
| 717 |
+
"UGAAGC": 672,
|
| 718 |
+
"ĠCC": 673,
|
| 719 |
+
"UGCAC": 674,
|
| 720 |
+
"AGUGGCGAACGGG": 675,
|
| 721 |
+
"UAAAC": 676,
|
| 722 |
+
"ACGAACGCUGGCGGCG": 677,
|
| 723 |
+
"UUAAGUC": 678,
|
| 724 |
+
"UGGGGGAA": 679,
|
| 725 |
+
"AUUGAA": 680,
|
| 726 |
+
"AGGUGCUGCAUGGCUGUCG": 681,
|
| 727 |
+
"UAUCG": 682,
|
| 728 |
+
"UUGACC": 683,
|
| 729 |
+
"UAUUCC": 684,
|
| 730 |
+
"AGUGAGGAA": 685,
|
| 731 |
+
"ACCACC": 686,
|
| 732 |
+
"UUGCG": 687,
|
| 733 |
+
"ACAAAA": 688,
|
| 734 |
+
"AGGAAG": 689,
|
| 735 |
+
"UAUAUU": 690,
|
| 736 |
+
"UAAUACAUGC": 691,
|
| 737 |
+
"ACAUUGGGAC": 692,
|
| 738 |
+
"AUGCCCCUU": 693,
|
| 739 |
+
"UGCCCC": 694,
|
| 740 |
+
"ACUAC": 695,
|
| 741 |
+
"ACAAG": 696,
|
| 742 |
+
"GGGAA": 697,
|
| 743 |
+
"AGAAGAAGCACC": 698,
|
| 744 |
+
"UGCGGG": 699,
|
| 745 |
+
"UUCAG": 700,
|
| 746 |
+
"UAGCCGGCC": 701,
|
| 747 |
+
"UUCGAAGC": 702,
|
| 748 |
+
"AGCCAC": 703,
|
| 749 |
+
"AGCAACGCCGCGUGAG": 704,
|
| 750 |
+
"AUUGAACGCUGGCGGC": 705,
|
| 751 |
+
"UAGCUGGUCUGAGAGGAUG": 706,
|
| 752 |
+
"UUGCAA": 707,
|
| 753 |
+
"AUGAAGUC": 708,
|
| 754 |
+
"UAGAGGUGAA": 709,
|
| 755 |
+
"UUGCCAGC": 710,
|
| 756 |
+
"UUAAAAC": 711,
|
| 757 |
+
"ACUAA": 712,
|
| 758 |
+
"UGAGAGG": 713,
|
| 759 |
+
"UCUUG": 714,
|
| 760 |
+
"ACCGGUGGCGAAGGC": 715,
|
| 761 |
+
"AGCCAA": 716,
|
| 762 |
+
"ĠUACG": 717,
|
| 763 |
+
"AUGCCC": 718,
|
| 764 |
+
"UAGGGC": 719,
|
| 765 |
+
"ACGCCGUAAACGAUG": 720,
|
| 766 |
+
"AGUUGG": 721,
|
| 767 |
+
"UGAGGG": 722,
|
| 768 |
+
"AUUUAA": 723,
|
| 769 |
+
"UGACGGUACC": 724,
|
| 770 |
+
"UCUAA": 725,
|
| 771 |
+
"UGGGGAA": 726,
|
| 772 |
+
"GGAC": 727,
|
| 773 |
+
"UGGUGUAGCGGUGAAAUGC": 728,
|
| 774 |
+
"UCAAG": 729,
|
| 775 |
+
"AGUGGG": 730,
|
| 776 |
+
"AUACAA": 731,
|
| 777 |
+
"GCUGGCGGCG": 732,
|
| 778 |
+
"GGAG": 733,
|
| 779 |
+
"UAACACAUGCAAGUCGAAC": 734,
|
| 780 |
+
"GCGAGG": 735,
|
| 781 |
+
"ACCUGAGAGGG": 736,
|
| 782 |
+
"ACCAGUGGCGAAGGCGGC": 737,
|
| 783 |
+
"UUUUUUUU": 738,
|
| 784 |
+
"UCGCAAG": 739,
|
| 785 |
+
"ACGGUACC": 740,
|
| 786 |
+
"AUGUG": 741,
|
| 787 |
+
"UACGC": 742,
|
| 788 |
+
"UGCCGC": 743,
|
| 789 |
+
"AUAUAA": 744,
|
| 790 |
+
"GCGUGAG": 745,
|
| 791 |
+
"UAGCGAA": 746,
|
| 792 |
+
"GGUGACAA": 747,
|
| 793 |
+
"AUUAUU": 748,
|
| 794 |
+
"AGACG": 749,
|
| 795 |
+
"AAUAA": 750,
|
| 796 |
+
"UCAAAGGAAUUGACGGGGGCCCGCACAAGCGGUGGAGCAUGUGGUUUAA": 751,
|
| 797 |
+
"UUCGGAUUG": 752,
|
| 798 |
+
"AGCUCC": 753,
|
| 799 |
+
"UGUGGC": 754,
|
| 800 |
+
"GGAAUUCC": 755,
|
| 801 |
+
"AUUCGUAG": 756,
|
| 802 |
+
"GGAAC": 757,
|
| 803 |
+
"UGACAC": 758,
|
| 804 |
+
"UUAGGG": 759,
|
| 805 |
+
"UAGGCGGC": 760,
|
| 806 |
+
"AGUUUU": 761,
|
| 807 |
+
"UGGGCUACACACGUGCUACAA": 762,
|
| 808 |
+
"UGGUUC": 763,
|
| 809 |
+
"ACGUCAAAUCAUC": 764,
|
| 810 |
+
"UGAAGUCGUAACAAGG": 765,
|
| 811 |
+
"AUCCAA": 766,
|
| 812 |
+
"NNNNNNNN": 767,
|
| 813 |
+
"AUCAC": 768,
|
| 814 |
+
"GGGCUCAACC": 769,
|
| 815 |
+
"UAACGCG": 770,
|
| 816 |
+
"AUGUCC": 771,
|
| 817 |
+
"UUCGGAUCG": 772,
|
| 818 |
+
"UGGGGGAAACCC": 773,
|
| 819 |
+
"GCCGG": 774,
|
| 820 |
+
"AGGCAA": 775,
|
| 821 |
+
"GGCUAA": 776,
|
| 822 |
+
"UGAUCGGCC": 777,
|
| 823 |
+
"UAGAGGUGAAAUUCGUAG": 778,
|
| 824 |
+
"UGAUAC": 779,
|
| 825 |
+
"AUGACC": 780,
|
| 826 |
+
"UGAGCC": 781,
|
| 827 |
+
"UGAGGUAA": 782,
|
| 828 |
+
"UCUAC": 783,
|
| 829 |
+
"UGACGCUGAGGCGCGAA": 784,
|
| 830 |
+
"AUUUU": 785,
|
| 831 |
+
"UCGCG": 786,
|
| 832 |
+
"AGCAGG": 787,
|
| 833 |
+
"AUUAG": 788,
|
| 834 |
+
"UCCCCC": 789,
|
| 835 |
+
"UCUGCC": 790,
|
| 836 |
+
"UACCAAGGCGACG": 791,
|
| 837 |
+
"GAAGAA": 792,
|
| 838 |
+
"ĠAGAGUUUGAUCC": 793,
|
| 839 |
+
"GGUGACAAACCGG": 794,
|
| 840 |
+
"GCAAUGGGCGAAAGCC": 795,
|
| 841 |
+
"UGUAGCGGUGAAAUGCGUAGAG": 796,
|
| 842 |
+
"AGGACG": 797,
|
| 843 |
+
"ACUGCC": 798,
|
| 844 |
+
"AUGGCGAAGGC": 799,
|
| 845 |
+
"UGGUG": 800,
|
| 846 |
+
"AUGGCC": 801,
|
| 847 |
+
"UCAUG": 802,
|
| 848 |
+
"AGCAUC": 803,
|
| 849 |
+
"GGGGG": 804,
|
| 850 |
+
"AGACGG": 805,
|
| 851 |
+
"UAUAAC": 806,
|
| 852 |
+
"AGCUAACGC": 807,
|
| 853 |
+
"UAUAAG": 808,
|
| 854 |
+
"UUGUU": 809,
|
| 855 |
+
"AUGCAA": 810,
|
| 856 |
+
"UUGACAUCC": 811,
|
| 857 |
+
"AUUCAA": 812,
|
| 858 |
+
"ĠGACGAACGCUGGCGGCG": 813,
|
| 859 |
+
"GGCUAACUACGUG": 814,
|
| 860 |
+
"AGUGGCGGACGGG": 815,
|
| 861 |
+
"UGGGUAGC": 816,
|
| 862 |
+
"UGAUCCAGCCAUGCCGCG": 817,
|
| 863 |
+
"UUCAC": 818,
|
| 864 |
+
"AGGGGC": 819,
|
| 865 |
+
"UAGAGC": 820,
|
| 866 |
+
"ACCAGCC": 821,
|
| 867 |
+
"GCCUGGGGAGUACGG": 822,
|
| 868 |
+
"ACGCCC": 823,
|
| 869 |
+
"UGCUUAACACAUGCAAGUCGAAC": 824,
|
| 870 |
+
"UGGUGCAUGGUUGUCG": 825,
|
| 871 |
+
"UAACGG": 826,
|
| 872 |
+
"UAAUACCGCAUACG": 827,
|
| 873 |
+
"UGUAGCGGUGAAAUGCGUAGAUAUC": 828,
|
| 874 |
+
"AGCCGCC": 829,
|
| 875 |
+
"GCCUGGGGAGUACGGCCGCAAGG": 830,
|
| 876 |
+
"GGGGGC": 831,
|
| 877 |
+
"UGUGAC": 832,
|
| 878 |
+
"AUUUAC": 833,
|
| 879 |
+
"AGAAGAA": 834,
|
| 880 |
+
"UAUUGC": 835,
|
| 881 |
+
"UUCGAUGCAACGCGAAGAACCUUACC": 836,
|
| 882 |
+
"GGUGAAUACGUUCCC": 837,
|
| 883 |
+
"UAGCAA": 838,
|
| 884 |
+
"ACGUU": 839,
|
| 885 |
+
"UAUUGGUCAA": 840,
|
| 886 |
+
"AUAUGC": 841,
|
| 887 |
+
"AUAGCC": 842,
|
| 888 |
+
"UGUUUU": 843,
|
| 889 |
+
"GGGUUUAA": 844,
|
| 890 |
+
"AGCAAUGCC": 845,
|
| 891 |
+
"UACCCC": 846,
|
| 892 |
+
"UAGGUGG": 847,
|
| 893 |
+
"AGCAUU": 848,
|
| 894 |
+
"AUGAAGC": 849,
|
| 895 |
+
"AGGCGC": 850,
|
| 896 |
+
"UGCCGG": 851,
|
| 897 |
+
"AAGUCAUCAUGGCCCUU": 852,
|
| 898 |
+
"UGCCUAAUACAUGC": 853,
|
| 899 |
+
"CCCGCG": 854,
|
| 900 |
+
"AGCGUGGGGAGCAAACAGG": 855,
|
| 901 |
+
"ACCAGUGGCGAAGGCG": 856,
|
| 902 |
+
"UGCAAGCGUUAAUCGGAAUUACUGGGCGUAA": 857,
|
| 903 |
+
"UGGUAA": 858,
|
| 904 |
+
"UUUGGC": 859,
|
| 905 |
+
"UAGUCCGG": 860,
|
| 906 |
+
"UACCGG": 861,
|
| 907 |
+
"UGAAGUC": 862,
|
| 908 |
+
"UCAAGC": 863,
|
| 909 |
+
"AGCGUGGGGAGCGAAC": 864,
|
| 910 |
+
"UCGAUG": 865,
|
| 911 |
+
"UAAGAA": 866,
|
| 912 |
+
"UAUGGC": 867,
|
| 913 |
+
"AGCCGG": 868,
|
| 914 |
+
"UGGUGG": 869,
|
| 915 |
+
"ACCCAA": 870,
|
| 916 |
+
"ACCAC": 871,
|
| 917 |
+
"CCCGC": 872,
|
| 918 |
+
"AGAAGG": 873,
|
| 919 |
+
"UUCUUC": 874,
|
| 920 |
+
"GGACCC": 875,
|
| 921 |
+
"AGGUAG": 876,
|
| 922 |
+
"AGAGGAA": 877,
|
| 923 |
+
"UUCGGC": 878,
|
| 924 |
+
"UCUCAGUUCGG": 879,
|
| 925 |
+
"AUUAAGC": 880,
|
| 926 |
+
"UACGGGG": 881,
|
| 927 |
+
"UGCUCC": 882,
|
| 928 |
+
"GCAGAU": 883,
|
| 929 |
+
"AGACUCCUACGGGAGGCAGCAGUAGG": 884,
|
| 930 |
+
"AGCUAA": 885,
|
| 931 |
+
"AUCAGGAGGAAC": 886,
|
| 932 |
+
"AUUAC": 887,
|
| 933 |
+
"UCUAG": 888,
|
| 934 |
+
"UAUUAA": 889,
|
| 935 |
+
"AGGUGGUGCAUGGUUGUCG": 890,
|
| 936 |
+
"AGGAGGAAC": 891,
|
| 937 |
+
"ACGUCAAAUCAUCAUGCCCCUU": 892,
|
| 938 |
+
"GCGGCC": 893,
|
| 939 |
+
"UGGAUG": 894,
|
| 940 |
+
"AUUAGAU": 895,
|
| 941 |
+
"UGCAGC": 896,
|
| 942 |
+
"UUUGAG": 897,
|
| 943 |
+
"UGAAGAAGG": 898,
|
| 944 |
+
"UAAUAA": 899,
|
| 945 |
+
"UUUGUC": 900,
|
| 946 |
+
"UGAGGUAACGGC": 901,
|
| 947 |
+
"AUAGAA": 902,
|
| 948 |
+
"AACUC": 903,
|
| 949 |
+
"UGGGCG": 904,
|
| 950 |
+
"AGUUUC": 905,
|
| 951 |
+
"AUGUUC": 906,
|
| 952 |
+
"UGGACC": 907,
|
| 953 |
+
"UUCCCC": 908,
|
| 954 |
+
"AGUUGC": 909,
|
| 955 |
+
"UGAAAGCCC": 910,
|
| 956 |
+
"UGCAGG": 911,
|
| 957 |
+
"AAGUCCUC": 912,
|
| 958 |
+
"UGACCG": 913,
|
| 959 |
+
"UGGAUC": 914,
|
| 960 |
+
"AAGAGG": 915,
|
| 961 |
+
"AUUGCGAA": 916,
|
| 962 |
+
"ACGAUG": 917,
|
| 963 |
+
"UGGAAAC": 918,
|
| 964 |
+
"AUAAGC": 919,
|
| 965 |
+
"GGUGGAA": 920,
|
| 966 |
+
"UGACGCUGAGGAGCGAA": 921,
|
| 967 |
+
"GAACGC": 922,
|
| 968 |
+
"GAAUCUUCC": 923,
|
| 969 |
+
"UUCGC": 924,
|
| 970 |
+
"ACCUGAGAGGGUGAUCGGCC": 925,
|
| 971 |
+
"ACACUGGAACUGAGACACGGUCCAGACUCCUACGGGAGGCAGCAGUGGGGAA": 926,
|
| 972 |
+
"GGCUAACUUCG": 927,
|
| 973 |
+
"AGAGAC": 928,
|
| 974 |
+
"AGAGGC": 929,
|
| 975 |
+
"UACUC": 930,
|
| 976 |
+
"UAACGGCCC": 931,
|
| 977 |
+
"UUGAGUGC": 932,
|
| 978 |
+
"AACAC": 933,
|
| 979 |
+
"AGUGCC": 934,
|
| 980 |
+
"AGCGCGCG": 935,
|
| 981 |
+
"UGUGCC": 936,
|
| 982 |
+
"AGCAGC": 937,
|
| 983 |
+
"ACCCGAA": 938,
|
| 984 |
+
"ACAACC": 939,
|
| 985 |
+
"GGGAGGAAC": 940,
|
| 986 |
+
"ACCUGGGG": 941,
|
| 987 |
+
"ACGAAAGUC": 942,
|
| 988 |
+
"UCAUGC": 943,
|
| 989 |
+
"ACGGGG": 944,
|
| 990 |
+
"AUAUGG": 945,
|
| 991 |
+
"UCUUUU": 946,
|
| 992 |
+
"GGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGGAGGG": 947,
|
| 993 |
+
"UUAGAG": 948,
|
| 994 |
+
"UGAUGCAGCGACGCC": 949,
|
| 995 |
+
"UGUAGG": 950,
|
| 996 |
+
"GCAUGG": 951,
|
| 997 |
+
"AGAAAGCCAC": 952,
|
| 998 |
+
"UGGAUU": 953,
|
| 999 |
+
"UUGCAGAA": 954,
|
| 1000 |
+
"UUUCCC": 955,
|
| 1001 |
+
"UGUUAA": 956,
|
| 1002 |
+
"UUGAAG": 957,
|
| 1003 |
+
"UCAACCG": 958,
|
| 1004 |
+
"UGGUAG": 959,
|
| 1005 |
+
"GGCUAACUACGUGCCAGCAGCCGCGGUAAUACGUAGG": 960,
|
| 1006 |
+
"GAAAGG": 961,
|
| 1007 |
+
"UGAGGAA": 962,
|
| 1008 |
+
"UUACCAAGGC": 963,
|
| 1009 |
+
"UGUAGCAGUGAA": 964,
|
| 1010 |
+
"UAGCCGGCCUGAGAGGG": 965,
|
| 1011 |
+
"UGGUAC": 966,
|
| 1012 |
+
"UCGCGGAUCAGC": 967,
|
| 1013 |
+
"GGAAACG": 968,
|
| 1014 |
+
"UGUGUGAAGAAGGCC": 969,
|
| 1015 |
+
"GGCCACAUUGGGAC": 970,
|
| 1016 |
+
"AUCUCC": 971,
|
| 1017 |
+
"AGGGCGCG": 972,
|
| 1018 |
+
"UGUGGG": 973,
|
| 1019 |
+
"UAACGC": 974,
|
| 1020 |
+
"ACCUCC": 975,
|
| 1021 |
+
"GGGCCUUGUACACACCGCCCGUCACACCAUGGG": 976,
|
| 1022 |
+
"UUUCAA": 977,
|
| 1023 |
+
"UGGUCGG": 978,
|
| 1024 |
+
"AGGGAC": 979,
|
| 1025 |
+
"UAGGCG": 980,
|
| 1026 |
+
"UGUAAG": 981,
|
| 1027 |
+
"UGGAGGAA": 982,
|
| 1028 |
+
"UUGACGGUACC": 983,
|
| 1029 |
+
"AGUGAGGAAUAUUGGUCAA": 984,
|
| 1030 |
+
"UGACAA": 985,
|
| 1031 |
+
"AUUUUC": 986,
|
| 1032 |
+
"AGGUGGUGCAUGGUUGUCGUCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCCGCAACGAGCGCAA": 987,
|
| 1033 |
+
"AGCACC": 988,
|
| 1034 |
+
"AGAACC": 989,
|
| 1035 |
+
"AUGAAGUCGGAAUCGCUAGUAA": 990,
|
| 1036 |
+
"GGUCC": 991,
|
| 1037 |
+
"AGUGAC": 992,
|
| 1038 |
+
"AGAGCC": 993,
|
| 1039 |
+
"UGCUC": 994,
|
| 1040 |
+
"ACAUG": 995,
|
| 1041 |
+
"UAUGCC": 996,
|
| 1042 |
+
"AUUAGCUAG": 997,
|
| 1043 |
+
"UCAACCC": 998,
|
| 1044 |
+
"AUAUAC": 999,
|
| 1045 |
+
"UAAACC": 1000,
|
| 1046 |
+
"AUAUCC": 1001,
|
| 1047 |
+
"UUAUUC": 1002,
|
| 1048 |
+
"UACAGAGGG": 1003,
|
| 1049 |
+
"UUCGAA": 1004,
|
| 1050 |
+
"UUGAAC": 1005,
|
| 1051 |
+
"AGUAAC": 1006,
|
| 1052 |
+
"AGCGGC": 1007,
|
| 1053 |
+
"UCCUCC": 1008,
|
| 1054 |
+
"AGCUCG": 1009,
|
| 1055 |
+
"UUCGAAGCAACGCGAAGAACCUUACC": 1010,
|
| 1056 |
+
"UAUCCC": 1011,
|
| 1057 |
+
"GCGUUGUCCGGAA": 1012,
|
| 1058 |
+
"UGGCCC": 1013,
|
| 1059 |
+
"AGUACG": 1014,
|
| 1060 |
+
"ACGGCCUUCGGGUUGUAA": 1015,
|
| 1061 |
+
"AAGACC": 1016,
|
| 1062 |
+
"UAUUGGGCGUAA": 1017,
|
| 1063 |
+
"AAGAA": 1018,
|
| 1064 |
+
"UUUAAG": 1019,
|
| 1065 |
+
"UUCGGAAUUACUGGGCGUAA": 1020,
|
| 1066 |
+
"UGAGAUAC": 1021,
|
| 1067 |
+
"UCUUGC": 1022,
|
| 1068 |
+
"AGUUAA": 1023
|
| 1069 |
+
},
|
| 1070 |
+
"merges": [
|
| 1071 |
+
"G G",
|
| 1072 |
+
"A A",
|
| 1073 |
+
"U U",
|
| 1074 |
+
"C C",
|
| 1075 |
+
"A G",
|
| 1076 |
+
"U G",
|
| 1077 |
+
"A C",
|
| 1078 |
+
"U C",
|
| 1079 |
+
"U GG",
|
| 1080 |
+
"G C",
|
| 1081 |
+
"A GG",
|
| 1082 |
+
"U AA",
|
| 1083 |
+
"AG C",
|
| 1084 |
+
"A UU",
|
| 1085 |
+
"A CC",
|
| 1086 |
+
"A UG",
|
| 1087 |
+
"U CC",
|
| 1088 |
+
"G AA",
|
| 1089 |
+
"U AC",
|
| 1090 |
+
"UG C",
|
| 1091 |
+
"A UC",
|
| 1092 |
+
"U AG",
|
| 1093 |
+
"UU C",
|
| 1094 |
+
"AA C",
|
| 1095 |
+
"GG C",
|
| 1096 |
+
"UU G",
|
| 1097 |
+
"AA G",
|
| 1098 |
+
"GG G",
|
| 1099 |
+
"CC C",
|
| 1100 |
+
"A U",
|
| 1101 |
+
"UG AA",
|
| 1102 |
+
"AC G",
|
| 1103 |
+
"A UGG",
|
| 1104 |
+
"UAA C",
|
| 1105 |
+
"GC G",
|
| 1106 |
+
"UC G",
|
| 1107 |
+
"AGG C",
|
| 1108 |
+
"UG AG",
|
| 1109 |
+
"UGG C",
|
| 1110 |
+
"AUG C",
|
| 1111 |
+
"AG CC",
|
| 1112 |
+
"UG CC",
|
| 1113 |
+
"A UCC",
|
| 1114 |
+
"GG AA",
|
| 1115 |
+
"A UAA",
|
| 1116 |
+
"U ACC",
|
| 1117 |
+
"UU UU",
|
| 1118 |
+
"AC GG",
|
| 1119 |
+
"AGG G",
|
| 1120 |
+
"U AUU",
|
| 1121 |
+
"AG AA",
|
| 1122 |
+
"UU GG",
|
| 1123 |
+
"G CC",
|
| 1124 |
+
"U AGC",
|
| 1125 |
+
"UC AA",
|
| 1126 |
+
"UU AA",
|
| 1127 |
+
"GAA C",
|
| 1128 |
+
"AC AA",
|
| 1129 |
+
"U AGG",
|
| 1130 |
+
"UGG G",
|
| 1131 |
+
"ACC C",
|
| 1132 |
+
"UGG GG",
|
| 1133 |
+
"UG AC",
|
| 1134 |
+
"A UAC",
|
| 1135 |
+
"GC GG",
|
| 1136 |
+
"AGG AA",
|
| 1137 |
+
"UU CC",
|
| 1138 |
+
"AGC G",
|
| 1139 |
+
"UCC C",
|
| 1140 |
+
"GC AA",
|
| 1141 |
+
"AG AC",
|
| 1142 |
+
"GG CC",
|
| 1143 |
+
"AUU C",
|
| 1144 |
+
"UU UC",
|
| 1145 |
+
"UU GC",
|
| 1146 |
+
"AA AA",
|
| 1147 |
+
"AG AG",
|
| 1148 |
+
"CC G",
|
| 1149 |
+
"UAC G",
|
| 1150 |
+
"AC AC",
|
| 1151 |
+
"A UAG",
|
| 1152 |
+
"GG GG",
|
| 1153 |
+
"UG UC",
|
| 1154 |
+
"UAA G",
|
| 1155 |
+
"U AUC",
|
| 1156 |
+
"UU UG",
|
| 1157 |
+
"AG UC",
|
| 1158 |
+
"AUU G",
|
| 1159 |
+
"GGC G",
|
| 1160 |
+
"AA AC",
|
| 1161 |
+
"AAG UC",
|
| 1162 |
+
"AUG AA",
|
| 1163 |
+
"UG UG",
|
| 1164 |
+
"UC UC",
|
| 1165 |
+
"UGG AA",
|
| 1166 |
+
"ACC G",
|
| 1167 |
+
"AG UG",
|
| 1168 |
+
"UGG GC",
|
| 1169 |
+
"UU AC",
|
| 1170 |
+
"UC GC",
|
| 1171 |
+
"UUC GG",
|
| 1172 |
+
"UGC G",
|
| 1173 |
+
"U AUG",
|
| 1174 |
+
"UUC G",
|
| 1175 |
+
"UU UAA",
|
| 1176 |
+
"UC GG",
|
| 1177 |
+
"UU AG",
|
| 1178 |
+
"UC UG",
|
| 1179 |
+
"UCC G",
|
| 1180 |
+
"AAC G",
|
| 1181 |
+
"GAA G",
|
| 1182 |
+
"AG UGG",
|
| 1183 |
+
"UC AC",
|
| 1184 |
+
"A UAAC",
|
| 1185 |
+
"UG AGG",
|
| 1186 |
+
"AUGG C",
|
| 1187 |
+
"AG AGG",
|
| 1188 |
+
"AG AU",
|
| 1189 |
+
"AUG CC",
|
| 1190 |
+
"ACC AA",
|
| 1191 |
+
"U AGGC",
|
| 1192 |
+
"GG GC",
|
| 1193 |
+
"AUU AA",
|
| 1194 |
+
"GG UGAA",
|
| 1195 |
+
"UAC GGG",
|
| 1196 |
+
"AUC G",
|
| 1197 |
+
"AAG CC",
|
| 1198 |
+
"UU GAA",
|
| 1199 |
+
"U AU",
|
| 1200 |
+
"UAC AC",
|
| 1201 |
+
"GC GAA",
|
| 1202 |
+
"CC UU",
|
| 1203 |
+
"CCC G",
|
| 1204 |
+
"AUGC G",
|
| 1205 |
+
"AC UC",
|
| 1206 |
+
"UG UU",
|
| 1207 |
+
"GGC UAAC",
|
| 1208 |
+
"AA GG",
|
| 1209 |
+
"UC AG",
|
| 1210 |
+
"AC GC",
|
| 1211 |
+
"UG UAGC",
|
| 1212 |
+
"UGAC GC",
|
| 1213 |
+
"UGAG AC",
|
| 1214 |
+
"UU CCC",
|
| 1215 |
+
"GCG UAA",
|
| 1216 |
+
"AGC AGCC",
|
| 1217 |
+
"AUGG G",
|
| 1218 |
+
"AGGC AGC",
|
| 1219 |
+
"AG UGGC",
|
| 1220 |
+
"AGG GC",
|
| 1221 |
+
"UAC AA",
|
| 1222 |
+
"UC AGC",
|
| 1223 |
+
"AUU GG",
|
| 1224 |
+
"GAA GGC",
|
| 1225 |
+
"GCGG UAA",
|
| 1226 |
+
"AC GAA",
|
| 1227 |
+
"UU AAG",
|
| 1228 |
+
"UGCC AGCAGCC",
|
| 1229 |
+
"CC CC",
|
| 1230 |
+
"UG UCG",
|
| 1231 |
+
"UU GGG",
|
| 1232 |
+
"UGC AA",
|
| 1233 |
+
"AGC AA",
|
| 1234 |
+
"AUCC C",
|
| 1235 |
+
"UACGGG AGGCAGC",
|
| 1236 |
+
"AC GGG",
|
| 1237 |
+
"UU AAC",
|
| 1238 |
+
"UUC GGG",
|
| 1239 |
+
"AC UG",
|
| 1240 |
+
"UUG CC",
|
| 1241 |
+
"ACC GG",
|
| 1242 |
+
"UAG AG",
|
| 1243 |
+
"UUG UAA",
|
| 1244 |
+
"UAG UCC",
|
| 1245 |
+
"AGG AUU",
|
| 1246 |
+
"UAA GG",
|
| 1247 |
+
"UGCCAGCAGCC GCGGUAA",
|
| 1248 |
+
"UCC UACGGGAGGCAGC",
|
| 1249 |
+
"AGG GG",
|
| 1250 |
+
"GC ACAA",
|
| 1251 |
+
"AU AUU",
|
| 1252 |
+
"AU AUC",
|
| 1253 |
+
"AG UU",
|
| 1254 |
+
"UAA UACC",
|
| 1255 |
+
"UAA AA",
|
| 1256 |
+
"UAC GG",
|
| 1257 |
+
"AGG AAC",
|
| 1258 |
+
"UG CCC",
|
| 1259 |
+
"UUG AC",
|
| 1260 |
+
"GAA GC",
|
| 1261 |
+
"UGG CC",
|
| 1262 |
+
"UC UU",
|
| 1263 |
+
"U AGGG",
|
| 1264 |
+
"AG CCC",
|
| 1265 |
+
"UGAGAC ACGG",
|
| 1266 |
+
"AUU AGC",
|
| 1267 |
+
"AUAA G",
|
| 1268 |
+
"GC UGGC",
|
| 1269 |
+
"AGG CC",
|
| 1270 |
+
"AC UU",
|
| 1271 |
+
"AGCG UGGGG",
|
| 1272 |
+
"AGC AAAC",
|
| 1273 |
+
"ACC CC",
|
| 1274 |
+
"AGGAA GG",
|
| 1275 |
+
"UAA CC",
|
| 1276 |
+
"UUG ACGG",
|
| 1277 |
+
"AGGAUU AGAU",
|
| 1278 |
+
"AC AG",
|
| 1279 |
+
"AGAC UCCUACGGGAGGCAGC",
|
| 1280 |
+
"UGG UC",
|
| 1281 |
+
"GGC GG",
|
| 1282 |
+
"GC GC",
|
| 1283 |
+
"UACC C",
|
| 1284 |
+
"UGG AGC",
|
| 1285 |
+
"AUG UGG",
|
| 1286 |
+
"AGUGG GGAA",
|
| 1287 |
+
"UGUAGC GGUGAA",
|
| 1288 |
+
"GGG CC",
|
| 1289 |
+
"UAG UAA",
|
| 1290 |
+
"UCC GG",
|
| 1291 |
+
"N N",
|
| 1292 |
+
"Ġ G",
|
| 1293 |
+
"UG AAG",
|
| 1294 |
+
"UAG CC",
|
| 1295 |
+
"AC AUGC",
|
| 1296 |
+
"UC AAC",
|
| 1297 |
+
"AG UAC",
|
| 1298 |
+
"AGG AUG",
|
| 1299 |
+
"AGGAUUAGAU ACCC",
|
| 1300 |
+
"AG UGC",
|
| 1301 |
+
"U AUGG",
|
| 1302 |
+
"ACG CC",
|
| 1303 |
+
"UAG UUGG",
|
| 1304 |
+
"UG UAA",
|
| 1305 |
+
"AA CC",
|
| 1306 |
+
"AC UGC",
|
| 1307 |
+
"UAUU GG",
|
| 1308 |
+
"UGG GCGUAA",
|
| 1309 |
+
"UU UUC",
|
| 1310 |
+
"UGAG UAAC",
|
| 1311 |
+
"UGC UGC",
|
| 1312 |
+
"UAG AA",
|
| 1313 |
+
"AUU CC",
|
| 1314 |
+
"UAA GC",
|
| 1315 |
+
"U AUAA",
|
| 1316 |
+
"ACG UC",
|
| 1317 |
+
"AA GC",
|
| 1318 |
+
"AG AAG",
|
| 1319 |
+
"AGC GCAA",
|
| 1320 |
+
"UG ACGG",
|
| 1321 |
+
"AGC GC",
|
| 1322 |
+
"UU UUG",
|
| 1323 |
+
"UGC AAC",
|
| 1324 |
+
"GG UG",
|
| 1325 |
+
"UCAGC UCG",
|
| 1326 |
+
"UGG UAGUCC",
|
| 1327 |
+
"UU UCC",
|
| 1328 |
+
"AGC GG",
|
| 1329 |
+
"AG AAC",
|
| 1330 |
+
"UG AAC",
|
| 1331 |
+
"UGG AAC",
|
| 1332 |
+
"UUC AA",
|
| 1333 |
+
"AG AUU",
|
| 1334 |
+
"AC UCC",
|
| 1335 |
+
"AG AUG",
|
| 1336 |
+
"UU AUU",
|
| 1337 |
+
"UGG GAA",
|
| 1338 |
+
"AG AGC",
|
| 1339 |
+
"AUC AA",
|
| 1340 |
+
"GGCUAAC UACG",
|
| 1341 |
+
"AGC AAC",
|
| 1342 |
+
"AGCGUGGGG AGCAAAC",
|
| 1343 |
+
"AGGAUUAGAUACCC UGGUAGUCC",
|
| 1344 |
+
"AC AUU",
|
| 1345 |
+
"UAA ACG",
|
| 1346 |
+
"UG AGGC",
|
| 1347 |
+
"UG UGAA",
|
| 1348 |
+
"GAA GG",
|
| 1349 |
+
"AUGCG UAG",
|
| 1350 |
+
"UU GGC",
|
| 1351 |
+
"UAGG GG",
|
| 1352 |
+
"AG UGAA",
|
| 1353 |
+
"AGG GAA",
|
| 1354 |
+
"UG AUC",
|
| 1355 |
+
"UGGG AC",
|
| 1356 |
+
"UUAAG UCCC",
|
| 1357 |
+
"ACCG CCCG",
|
| 1358 |
+
"GAAC GCUGGC",
|
| 1359 |
+
"AAGUC GAAC",
|
| 1360 |
+
"AGC GAA",
|
| 1361 |
+
"AGC UC",
|
| 1362 |
+
"UCAA AGGAA",
|
| 1363 |
+
"UCAA CC",
|
| 1364 |
+
"GCC UGGGG",
|
| 1365 |
+
"CCC UU",
|
| 1366 |
+
"UCC CC",
|
| 1367 |
+
"UGCC G",
|
| 1368 |
+
"UG AUCC",
|
| 1369 |
+
"UGAG AUG",
|
| 1370 |
+
"UU ACC",
|
| 1371 |
+
"AGACUCCUACGGGAGGCAGC AGUGGGGAA",
|
| 1372 |
+
"UCG CC",
|
| 1373 |
+
"GGG AC",
|
| 1374 |
+
"AGGC G",
|
| 1375 |
+
"AGGAAGG UGGGG",
|
| 1376 |
+
"GGG CCC",
|
| 1377 |
+
"UAUU C",
|
| 1378 |
+
"UACG UUCCC",
|
| 1379 |
+
"UCAAAGGAA UUGACGG",
|
| 1380 |
+
"AU ACC",
|
| 1381 |
+
"UGAGACACGG CCC",
|
| 1382 |
+
"AU AGC",
|
| 1383 |
+
"UC AUU",
|
| 1384 |
+
"UACAC ACCGCCCG",
|
| 1385 |
+
"UC GAA",
|
| 1386 |
+
"AU AGG",
|
| 1387 |
+
"AUC GG",
|
| 1388 |
+
"UU UGG",
|
| 1389 |
+
"UG AUGC",
|
| 1390 |
+
"UGC GAA",
|
| 1391 |
+
"UAG AGG",
|
| 1392 |
+
"GCACAA GCGG",
|
| 1393 |
+
"AAG UCG",
|
| 1394 |
+
"UGGC G",
|
| 1395 |
+
"UC GGAA",
|
| 1396 |
+
"GGCG ACG",
|
| 1397 |
+
"UG AUG",
|
| 1398 |
+
"UAGC G",
|
| 1399 |
+
"AUAC G",
|
| 1400 |
+
"AACG AGCGCAA",
|
| 1401 |
+
"UCAGCUCG UGUCG",
|
| 1402 |
+
"CCUU ACC",
|
| 1403 |
+
"UUGGG UUAAGUCCC",
|
| 1404 |
+
"ACG UGC",
|
| 1405 |
+
"AC UGG",
|
| 1406 |
+
"AG UAA",
|
| 1407 |
+
"GCAA GG",
|
| 1408 |
+
"UG UGG",
|
| 1409 |
+
"UCAGCUCGUGUCG UGAGAUG",
|
| 1410 |
+
"U AUCC",
|
| 1411 |
+
"AG UUC",
|
| 1412 |
+
"AG ACC",
|
| 1413 |
+
"ACC AGUGGC",
|
| 1414 |
+
"AU AUG",
|
| 1415 |
+
"UC AGG",
|
| 1416 |
+
"UC UUC",
|
| 1417 |
+
"GC AACGAGCGCAA",
|
| 1418 |
+
"UUAC UGGGCGUAA",
|
| 1419 |
+
"UG AUU",
|
| 1420 |
+
"UU AUCC",
|
| 1421 |
+
"UG ACC",
|
| 1422 |
+
"UC AUC",
|
| 1423 |
+
"U AUGC",
|
| 1424 |
+
"UAG UC",
|
| 1425 |
+
"GCC G",
|
| 1426 |
+
"AUC AGC",
|
| 1427 |
+
"AUUC G",
|
| 1428 |
+
"UAAUACC GC",
|
| 1429 |
+
"UGG GGG",
|
| 1430 |
+
"AAC GCGAA",
|
| 1431 |
+
"AC AGG",
|
| 1432 |
+
"UGC GG",
|
| 1433 |
+
"GGCUAAC UCCG",
|
| 1434 |
+
"AUGUGG UUUAA",
|
| 1435 |
+
"AGGAAGGUGGGG AUG",
|
| 1436 |
+
"GCC GCG",
|
| 1437 |
+
"UCGC UAGUAA",
|
| 1438 |
+
"UGAA AC",
|
| 1439 |
+
"AC GGC",
|
| 1440 |
+
"UUG UACACACCGCCCG",
|
| 1441 |
+
"UGGAA UUCC",
|
| 1442 |
+
"UCAGCUCGUGUCGUGAGAUG UUGGGUUAAGUCCC",
|
| 1443 |
+
"GAA AGCC",
|
| 1444 |
+
"AUU GC",
|
| 1445 |
+
"UGGUC UGAG",
|
| 1446 |
+
"UC GGC",
|
| 1447 |
+
"UCC AA",
|
| 1448 |
+
"AUUAGC UAGUUGG",
|
| 1449 |
+
"UAGGC GG",
|
| 1450 |
+
"AG UUG",
|
| 1451 |
+
"GAAC GGG",
|
| 1452 |
+
"UC ACC",
|
| 1453 |
+
"UAA AAC",
|
| 1454 |
+
"UC UGG",
|
| 1455 |
+
"UAUU G",
|
| 1456 |
+
"UUCGGG UUGUAA",
|
| 1457 |
+
"AC UUC",
|
| 1458 |
+
"ACGUGC UACAA",
|
| 1459 |
+
"GAA AA",
|
| 1460 |
+
"Ġ C",
|
| 1461 |
+
"UC UGC",
|
| 1462 |
+
"UU UGC",
|
| 1463 |
+
"UACC G",
|
| 1464 |
+
"UGCAAC UCG",
|
| 1465 |
+
"AUGGC UGUCG",
|
| 1466 |
+
"UUG UUGG",
|
| 1467 |
+
"UG UGC",
|
| 1468 |
+
"AACGCGAA GAA",
|
| 1469 |
+
"UG UUC",
|
| 1470 |
+
"AG AGGG",
|
| 1471 |
+
"AUCC G",
|
| 1472 |
+
"GCG UUG",
|
| 1473 |
+
"AAC AA",
|
| 1474 |
+
"UU GGAA",
|
| 1475 |
+
"AU AU",
|
| 1476 |
+
"UC UCC",
|
| 1477 |
+
"AG AUC",
|
| 1478 |
+
"ACG CCG",
|
| 1479 |
+
"UUAA CC",
|
| 1480 |
+
"AGGC GG",
|
| 1481 |
+
"ACAUGC AAGUCGAAC",
|
| 1482 |
+
"UGG UGC",
|
| 1483 |
+
"UAA UAC",
|
| 1484 |
+
"UACC AA",
|
| 1485 |
+
"GG CCC",
|
| 1486 |
+
"AGC AC",
|
| 1487 |
+
"UGAA CC",
|
| 1488 |
+
"ACAC UGGGAC",
|
| 1489 |
+
"AUC AGG",
|
| 1490 |
+
"UGAGUAAC ACG",
|
| 1491 |
+
"GCG UG",
|
| 1492 |
+
"U AUAC",
|
| 1493 |
+
"UUG UC",
|
| 1494 |
+
"GAA UC",
|
| 1495 |
+
"UU AGC",
|
| 1496 |
+
"UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCC GCAACGAGCGCAA",
|
| 1497 |
+
"AGCAAC GCCGCG",
|
| 1498 |
+
"AG UAGG",
|
| 1499 |
+
"UAAC G",
|
| 1500 |
+
"GCACAAGCGG UGGAGC",
|
| 1501 |
+
"UU UAG",
|
| 1502 |
+
"AGG GGG",
|
| 1503 |
+
"UACAC ACGUGCUACAA",
|
| 1504 |
+
"GGC GC",
|
| 1505 |
+
"UGAG AGGG",
|
| 1506 |
+
"UGC GC",
|
| 1507 |
+
"AGCC G",
|
| 1508 |
+
"UGAA UACGUUCCC",
|
| 1509 |
+
"UU UAC",
|
| 1510 |
+
"NN NN",
|
| 1511 |
+
"GGCUAACUCCG UGCCAGCAGCCGCGGUAA",
|
| 1512 |
+
"AUGG AA",
|
| 1513 |
+
"UGGGC GC",
|
| 1514 |
+
"UGGGC GAAAGCC",
|
| 1515 |
+
"U AUAG",
|
| 1516 |
+
"GAA GGCC",
|
| 1517 |
+
"GGC AGC",
|
| 1518 |
+
"AUC GC",
|
| 1519 |
+
"UG UUG",
|
| 1520 |
+
"ACCC G",
|
| 1521 |
+
"GGCUAACUACG UGCCAGCAGCCGCGGUAA",
|
| 1522 |
+
"AG UCC",
|
| 1523 |
+
"AUC AGCC",
|
| 1524 |
+
"UG UCC",
|
| 1525 |
+
"UCAAAGGAAUUGACGG GGGCCC",
|
| 1526 |
+
"UGACGC UGAGGC",
|
| 1527 |
+
"UG AGC",
|
| 1528 |
+
"UUCC G",
|
| 1529 |
+
"AAG AC",
|
| 1530 |
+
"GAAC G",
|
| 1531 |
+
"AACGCGAAGAA CCUUACC",
|
| 1532 |
+
"UGGC GAAGGC",
|
| 1533 |
+
"AAC GC",
|
| 1534 |
+
"GG AUU",
|
| 1535 |
+
"ACACUGGGAC UGAGACACGGCCC",
|
| 1536 |
+
"AGCC AUGCC",
|
| 1537 |
+
"AUG AC",
|
| 1538 |
+
"GCACAAGCGGUGGAGC AUGUGGUUUAA",
|
| 1539 |
+
"GCG CC",
|
| 1540 |
+
"UG AUGG",
|
| 1541 |
+
"UGCUGC AUGGCUGUCG",
|
| 1542 |
+
"AGG UC",
|
| 1543 |
+
"AUG UC",
|
| 1544 |
+
"GCC CC",
|
| 1545 |
+
"UG ACG",
|
| 1546 |
+
"GGGCC UUGUACACACCGCCCG",
|
| 1547 |
+
"ACC UC",
|
| 1548 |
+
"GG GGC",
|
| 1549 |
+
"UCAC ACC",
|
| 1550 |
+
"AUUGG GCGUAA",
|
| 1551 |
+
"UAAC AAGG",
|
| 1552 |
+
"UUAA AA",
|
| 1553 |
+
"ACC GC",
|
| 1554 |
+
"UGUAGCGGUGAA AUGCGUAG",
|
| 1555 |
+
"UUGG GC",
|
| 1556 |
+
"UAAC GGC",
|
| 1557 |
+
"ACGCCG UAAACG",
|
| 1558 |
+
"GAA AC",
|
| 1559 |
+
"AGC UAAC",
|
| 1560 |
+
"AUAA AA",
|
| 1561 |
+
"AGCGUGGGGAGCAAAC AGGAUUAGAUACCCUGGUAGUCC",
|
| 1562 |
+
"AGC GAAC",
|
| 1563 |
+
"UCC UC",
|
| 1564 |
+
"AGAA AA",
|
| 1565 |
+
"UGAA GG",
|
| 1566 |
+
"UAUU GCACAA",
|
| 1567 |
+
"UGGGCGC AAGCC",
|
| 1568 |
+
"UUUU GG",
|
| 1569 |
+
"UGGUCUGAG AGGAUG",
|
| 1570 |
+
"AUC AG",
|
| 1571 |
+
"ACCAA GGCGACG",
|
| 1572 |
+
"GAACGCUGGC GGC",
|
| 1573 |
+
"GGCUAACUACGUGCCAGCAGCCGCGGUAA UACG",
|
| 1574 |
+
"UGAGACACGG UCC",
|
| 1575 |
+
"AGAA GC",
|
| 1576 |
+
"UCCC G",
|
| 1577 |
+
"UUC GGAA",
|
| 1578 |
+
"ACGG CC",
|
| 1579 |
+
"U AUGAA",
|
| 1580 |
+
"UGACGC UGAGG",
|
| 1581 |
+
"AUC AUU",
|
| 1582 |
+
"ACCAGUGGC GAAGGC",
|
| 1583 |
+
"ACCAA GGC",
|
| 1584 |
+
"U A",
|
| 1585 |
+
"UU UGAC",
|
| 1586 |
+
"AC AAC",
|
| 1587 |
+
"AUG UGAA",
|
| 1588 |
+
"UGUAGCGGUGAA AUGC",
|
| 1589 |
+
"UG UAG",
|
| 1590 |
+
"UGG GAAC",
|
| 1591 |
+
"AUC AUC",
|
| 1592 |
+
"GGCC G",
|
| 1593 |
+
"UAA UC",
|
| 1594 |
+
"GGCUAACUCCGUGCCAGCAGCCGCGGUAA UACGG",
|
| 1595 |
+
"UAA AGC",
|
| 1596 |
+
"UGGC UC",
|
| 1597 |
+
"AGAC UGCC",
|
| 1598 |
+
"UG UAC",
|
| 1599 |
+
"UUG AG",
|
| 1600 |
+
"GG UC",
|
| 1601 |
+
"ACAC UGGAAC",
|
| 1602 |
+
"UAAUACC GG",
|
| 1603 |
+
"UCC GGAA",
|
| 1604 |
+
"UUAA UCGGAA",
|
| 1605 |
+
"GCCUGGGG AGUAC",
|
| 1606 |
+
"AUAA CC",
|
| 1607 |
+
"AG UCG",
|
| 1608 |
+
"AUGG GC",
|
| 1609 |
+
"GGG UC",
|
| 1610 |
+
"AG UUCGG",
|
| 1611 |
+
"AGGAAGGUGGGGAUG ACGUC",
|
| 1612 |
+
"UGAG AA",
|
| 1613 |
+
"AUCC CC",
|
| 1614 |
+
"GCGG UGAAUACGUUCCC",
|
| 1615 |
+
"UGG AGG",
|
| 1616 |
+
"AGAG UUUG",
|
| 1617 |
+
"UGCAA GCG",
|
| 1618 |
+
"UU UAUU",
|
| 1619 |
+
"UGG AC",
|
| 1620 |
+
"UGAG UAA",
|
| 1621 |
+
"GAAGC ACC",
|
| 1622 |
+
"AGCCAUGCC GCG",
|
| 1623 |
+
"GGC AA",
|
| 1624 |
+
"UUG UCG",
|
| 1625 |
+
"UAUUGG ACAA",
|
| 1626 |
+
"UUGG GG",
|
| 1627 |
+
"AUC UC",
|
| 1628 |
+
"GAA AGC",
|
| 1629 |
+
"UGAA AA",
|
| 1630 |
+
"AC AGC",
|
| 1631 |
+
"UG AUGAA",
|
| 1632 |
+
"GCCUGGGGAGUAC GGCC",
|
| 1633 |
+
"GAA CC",
|
| 1634 |
+
"UGG GCC",
|
| 1635 |
+
"AG AGAA",
|
| 1636 |
+
"AUGG GG",
|
| 1637 |
+
"AGG CCC",
|
| 1638 |
+
"AUAAC G",
|
| 1639 |
+
"AUGCG UAGAG",
|
| 1640 |
+
"GAA GGCG",
|
| 1641 |
+
"UC GGG",
|
| 1642 |
+
"UGGC AA",
|
| 1643 |
+
"AGCC CC",
|
| 1644 |
+
"UC GCGG",
|
| 1645 |
+
"GG ACGGG",
|
| 1646 |
+
"UCG UAACAAGG",
|
| 1647 |
+
"AGC UUGC",
|
| 1648 |
+
"UUUU AA",
|
| 1649 |
+
"AGCG ACGCC",
|
| 1650 |
+
"UUAAUCGGAA UUACUGGGCGUAA",
|
| 1651 |
+
"GGAA GG",
|
| 1652 |
+
"AC AUC",
|
| 1653 |
+
"UGAGUAAC GCG",
|
| 1654 |
+
"UU AUG",
|
| 1655 |
+
"GCCUGGGG AG",
|
| 1656 |
+
"UAG CCG",
|
| 1657 |
+
"UGGGG UAA",
|
| 1658 |
+
"UUCG AUGC",
|
| 1659 |
+
"CCC UUG",
|
| 1660 |
+
"CCC GG",
|
| 1661 |
+
"UU UGAA",
|
| 1662 |
+
"GCAA GGC",
|
| 1663 |
+
"AUGG CCCUU",
|
| 1664 |
+
"AUU UC",
|
| 1665 |
+
"AGG AC",
|
| 1666 |
+
"GAACGCUGGC GGCG",
|
| 1667 |
+
"GGCGG ACGGG",
|
| 1668 |
+
"UUAA GC",
|
| 1669 |
+
"U AUGGG",
|
| 1670 |
+
"UU AUC",
|
| 1671 |
+
"AU AUUC",
|
| 1672 |
+
"UGG AG",
|
| 1673 |
+
"AAGUC AUC",
|
| 1674 |
+
"UGG GGC",
|
| 1675 |
+
"AGUC UGCAACUCG",
|
| 1676 |
+
"ACCC GC",
|
| 1677 |
+
"AG AUGG",
|
| 1678 |
+
"GGAA UCGCUAGUAA",
|
| 1679 |
+
"UUC UC",
|
| 1680 |
+
"AUU AAG",
|
| 1681 |
+
"ACG UCAA",
|
| 1682 |
+
"CC AA",
|
| 1683 |
+
"UUUU GC",
|
| 1684 |
+
"UCAA AA",
|
| 1685 |
+
"AUG AAG",
|
| 1686 |
+
"AUG AAC",
|
| 1687 |
+
"AG UAG",
|
| 1688 |
+
"AC ACC",
|
| 1689 |
+
"UGC UUAAC",
|
| 1690 |
+
"ACACUGGAAC UGAGACACGGUCC",
|
| 1691 |
+
"ACACUGGGACUGAGACACGGCCC AGACUCCUACGGGAGGCAGCAGUGGGGAA",
|
| 1692 |
+
"AC UGGG",
|
| 1693 |
+
"UAUC AGC",
|
| 1694 |
+
"UGGUGC AUGG",
|
| 1695 |
+
"ACAUGC AAGUCG",
|
| 1696 |
+
"UAC GAA",
|
| 1697 |
+
"UU AUUGGGCGUAA",
|
| 1698 |
+
"CCC AA",
|
| 1699 |
+
"AUG AUU",
|
| 1700 |
+
"AAC GG",
|
| 1701 |
+
"UU UCG",
|
| 1702 |
+
"AC UUG",
|
| 1703 |
+
"AGG AGG",
|
| 1704 |
+
"AAAA AA",
|
| 1705 |
+
"UUGAA AC",
|
| 1706 |
+
"GGGCCUUGUACACACCGCCCG UCACACC",
|
| 1707 |
+
"AGGG UGCG",
|
| 1708 |
+
"UAAGC ACC",
|
| 1709 |
+
"UGC GGC",
|
| 1710 |
+
"UGGC GC",
|
| 1711 |
+
"UGC AUU",
|
| 1712 |
+
"UUUU CC",
|
| 1713 |
+
"UCCC AA",
|
| 1714 |
+
"UU AGG",
|
| 1715 |
+
"AGCG UUG",
|
| 1716 |
+
"UGAA GAAGGCC",
|
| 1717 |
+
"UCC GC",
|
| 1718 |
+
"UU UGGG",
|
| 1719 |
+
"UUC GGGG",
|
| 1720 |
+
"Ġ AGAGUUUG",
|
| 1721 |
+
"UUAUCC GGAUU",
|
| 1722 |
+
"UG UUGG",
|
| 1723 |
+
"UAGG AA",
|
| 1724 |
+
"UGAA GC",
|
| 1725 |
+
"Ġ CC",
|
| 1726 |
+
"UGC AC",
|
| 1727 |
+
"AGUGGC GAACGGG",
|
| 1728 |
+
"UAA AC",
|
| 1729 |
+
"AC GAACGCUGGCGGCG",
|
| 1730 |
+
"UU AAGUC",
|
| 1731 |
+
"UGGGG GAA",
|
| 1732 |
+
"AUU GAA",
|
| 1733 |
+
"AGG UGCUGCAUGGCUGUCG",
|
| 1734 |
+
"UAUC G",
|
| 1735 |
+
"UUG ACC",
|
| 1736 |
+
"UAUU CC",
|
| 1737 |
+
"AGUG AGGAA",
|
| 1738 |
+
"ACC ACC",
|
| 1739 |
+
"UU GCG",
|
| 1740 |
+
"ACAA AA",
|
| 1741 |
+
"AGG AAG",
|
| 1742 |
+
"UAU AUU",
|
| 1743 |
+
"UAAUAC AUGC",
|
| 1744 |
+
"ACAUU GGGAC",
|
| 1745 |
+
"AUGCC CCUU",
|
| 1746 |
+
"UGCC CC",
|
| 1747 |
+
"AC UAC",
|
| 1748 |
+
"AC AAG",
|
| 1749 |
+
"GG GAA",
|
| 1750 |
+
"AGAA GAAGCACC",
|
| 1751 |
+
"UGC GGG",
|
| 1752 |
+
"UUC AG",
|
| 1753 |
+
"UAGCC GGCC",
|
| 1754 |
+
"UUC GAAGC",
|
| 1755 |
+
"AGCC AC",
|
| 1756 |
+
"AGCAACGCCGCG UGAG",
|
| 1757 |
+
"AUU GAACGCUGGCGGC",
|
| 1758 |
+
"UAGC UGGUCUGAGAGGAUG",
|
| 1759 |
+
"UU GCAA",
|
| 1760 |
+
"AUG AAGUC",
|
| 1761 |
+
"UAGAGG UGAA",
|
| 1762 |
+
"UUGCC AGC",
|
| 1763 |
+
"UUAA AAC",
|
| 1764 |
+
"AC UAA",
|
| 1765 |
+
"UGAG AGG",
|
| 1766 |
+
"UC UUG",
|
| 1767 |
+
"ACCGG UGGCGAAGGC",
|
| 1768 |
+
"AGCC AA",
|
| 1769 |
+
"Ġ UACG",
|
| 1770 |
+
"AUG CCC",
|
| 1771 |
+
"UAGG GC",
|
| 1772 |
+
"ACGCCGUAAACG AUG",
|
| 1773 |
+
"AG UUGG",
|
| 1774 |
+
"UG AGGG",
|
| 1775 |
+
"AUU UAA",
|
| 1776 |
+
"UGACGG UACC",
|
| 1777 |
+
"UC UAA",
|
| 1778 |
+
"UGG GGAA",
|
| 1779 |
+
"GG AC",
|
| 1780 |
+
"UGG UGUAGCGGUGAAAUGC",
|
| 1781 |
+
"UC AAG",
|
| 1782 |
+
"AG UGGG",
|
| 1783 |
+
"AUAC AA",
|
| 1784 |
+
"GCUGGC GGCG",
|
| 1785 |
+
"GG AG",
|
| 1786 |
+
"UAAC ACAUGCAAGUCGAAC",
|
| 1787 |
+
"GCG AGG",
|
| 1788 |
+
"ACC UGAGAGGG",
|
| 1789 |
+
"ACCAGUGGCGAAGGC GGC",
|
| 1790 |
+
"UUUU UUUU",
|
| 1791 |
+
"UCGC AAG",
|
| 1792 |
+
"ACGG UACC",
|
| 1793 |
+
"AUG UG",
|
| 1794 |
+
"UAC GC",
|
| 1795 |
+
"UGCC GC",
|
| 1796 |
+
"AU AUAA",
|
| 1797 |
+
"GCG UGAG",
|
| 1798 |
+
"UAGC GAA",
|
| 1799 |
+
"GGUG ACAA",
|
| 1800 |
+
"AUU AUU",
|
| 1801 |
+
"AG ACG",
|
| 1802 |
+
"AA UAA",
|
| 1803 |
+
"UCAAAGGAAUUGACGGGGGCCC GCACAAGCGGUGGAGCAUGUGGUUUAA",
|
| 1804 |
+
"UUCGG AUUG",
|
| 1805 |
+
"AGC UCC",
|
| 1806 |
+
"UG UGGC",
|
| 1807 |
+
"GGAA UUCC",
|
| 1808 |
+
"AUUCG UAG",
|
| 1809 |
+
"GG AAC",
|
| 1810 |
+
"UGAC AC",
|
| 1811 |
+
"UU AGGG",
|
| 1812 |
+
"UAGGC GGC",
|
| 1813 |
+
"AG UUUU",
|
| 1814 |
+
"UGGGC UACACACGUGCUACAA",
|
| 1815 |
+
"UGG UUC",
|
| 1816 |
+
"ACGUCAA AUCAUC",
|
| 1817 |
+
"UGAAG UCGUAACAAGG",
|
| 1818 |
+
"AUCC AA",
|
| 1819 |
+
"NNNN NNNN",
|
| 1820 |
+
"AUC AC",
|
| 1821 |
+
"GGGC UCAACC",
|
| 1822 |
+
"UAAC GCG",
|
| 1823 |
+
"AUG UCC",
|
| 1824 |
+
"UUCGG AUCG",
|
| 1825 |
+
"UGGGGGAA ACCC",
|
| 1826 |
+
"GCC GG",
|
| 1827 |
+
"AGGC AA",
|
| 1828 |
+
"GGC UAA",
|
| 1829 |
+
"UGAUC GGCC",
|
| 1830 |
+
"UAGAGGUGAA AUUCGUAG",
|
| 1831 |
+
"UG AUAC",
|
| 1832 |
+
"AUG ACC",
|
| 1833 |
+
"UGAG CC",
|
| 1834 |
+
"UGAGG UAA",
|
| 1835 |
+
"UC UAC",
|
| 1836 |
+
"UGACGCUGAGGC GCGAA",
|
| 1837 |
+
"AUU UU",
|
| 1838 |
+
"UC GCG",
|
| 1839 |
+
"AGC AGG",
|
| 1840 |
+
"AUU AG",
|
| 1841 |
+
"UCC CCC",
|
| 1842 |
+
"UC UGCC",
|
| 1843 |
+
"UACCAA GGCGACG",
|
| 1844 |
+
"GAA GAA",
|
| 1845 |
+
"ĠAGAGUUUG AUCC",
|
| 1846 |
+
"GGUGACAA ACCGG",
|
| 1847 |
+
"GCAA UGGGCGAAAGCC",
|
| 1848 |
+
"UGUAGCGGUGAA AUGCGUAGAG",
|
| 1849 |
+
"AGG ACG",
|
| 1850 |
+
"AC UGCC",
|
| 1851 |
+
"AUGGC GAAGGC",
|
| 1852 |
+
"UGG UG",
|
| 1853 |
+
"AUGG CC",
|
| 1854 |
+
"UC AUG",
|
| 1855 |
+
"AGC AUC",
|
| 1856 |
+
"GG GGG",
|
| 1857 |
+
"AG ACGG",
|
| 1858 |
+
"U AUAAC",
|
| 1859 |
+
"AGCUAAC GC",
|
| 1860 |
+
"U AUAAG",
|
| 1861 |
+
"UUG UU",
|
| 1862 |
+
"AUGC AA",
|
| 1863 |
+
"UUGAC AUCC",
|
| 1864 |
+
"AUUC AA",
|
| 1865 |
+
"ĠG ACGAACGCUGGCGGCG",
|
| 1866 |
+
"GGCUAACUACG UG",
|
| 1867 |
+
"AGUGGC GGACGGG",
|
| 1868 |
+
"UGGG UAGC",
|
| 1869 |
+
"UGAUCC AGCCAUGCCGCG",
|
| 1870 |
+
"UUC AC",
|
| 1871 |
+
"AGG GGC",
|
| 1872 |
+
"UAG AGC",
|
| 1873 |
+
"ACC AGCC",
|
| 1874 |
+
"GCCUGGGGAG UACGG",
|
| 1875 |
+
"ACG CCC",
|
| 1876 |
+
"UGCUUAAC ACAUGCAAGUCGAAC",
|
| 1877 |
+
"UGGUGCAUGG UUGUCG",
|
| 1878 |
+
"UAAC GG",
|
| 1879 |
+
"UAAUACCGC AUACG",
|
| 1880 |
+
"UGUAGCGGUGAAAUGCGUAG AUAUC",
|
| 1881 |
+
"AGCC GCC",
|
| 1882 |
+
"GCCUGGGGAGUACGGCC GCAAGG",
|
| 1883 |
+
"GGGG GC",
|
| 1884 |
+
"UG UGAC",
|
| 1885 |
+
"AUU UAC",
|
| 1886 |
+
"AGAA GAA",
|
| 1887 |
+
"UAUU GC",
|
| 1888 |
+
"UUCGAUGC AACGCGAAGAACCUUACC",
|
| 1889 |
+
"GGUGAA UACGUUCCC",
|
| 1890 |
+
"UAGC AA",
|
| 1891 |
+
"ACG UU",
|
| 1892 |
+
"UAUUGG UCAA",
|
| 1893 |
+
"AU AUGC",
|
| 1894 |
+
"AUAG CC",
|
| 1895 |
+
"UG UUUU",
|
| 1896 |
+
"GGG UUUAA",
|
| 1897 |
+
"AGCAA UGCC",
|
| 1898 |
+
"UACC CC",
|
| 1899 |
+
"UAGG UGG",
|
| 1900 |
+
"AGC AUU",
|
| 1901 |
+
"AUGAA GC",
|
| 1902 |
+
"AGGC GC",
|
| 1903 |
+
"UGCC GG",
|
| 1904 |
+
"AAGUCAUC AUGGCCCUU",
|
| 1905 |
+
"UGCC UAAUACAUGC",
|
| 1906 |
+
"CCC GCG",
|
| 1907 |
+
"AGCGUGGGGAGCAAAC AGG",
|
| 1908 |
+
"ACCAGUGGC GAAGGCG",
|
| 1909 |
+
"UGCAAGCG UUAAUCGGAAUUACUGGGCGUAA",
|
| 1910 |
+
"UGG UAA",
|
| 1911 |
+
"UU UGGC",
|
| 1912 |
+
"UAGUCC GG",
|
| 1913 |
+
"UACC GG",
|
| 1914 |
+
"UG AAGUC",
|
| 1915 |
+
"UCAA GC",
|
| 1916 |
+
"AGCGUGGGG AGCGAAC",
|
| 1917 |
+
"UCG AUG",
|
| 1918 |
+
"UAA GAA",
|
| 1919 |
+
"U AUGGC",
|
| 1920 |
+
"AGCC GG",
|
| 1921 |
+
"UGG UGG",
|
| 1922 |
+
"ACCC AA",
|
| 1923 |
+
"ACC AC",
|
| 1924 |
+
"CCC GC",
|
| 1925 |
+
"AGAA GG",
|
| 1926 |
+
"UUC UUC",
|
| 1927 |
+
"GG ACCC",
|
| 1928 |
+
"AGG UAG",
|
| 1929 |
+
"AG AGGAA",
|
| 1930 |
+
"UUC GGC",
|
| 1931 |
+
"UCUC AGUUCGG",
|
| 1932 |
+
"AUUAA GC",
|
| 1933 |
+
"UAC GGGG",
|
| 1934 |
+
"UGC UCC",
|
| 1935 |
+
"GC AGAU",
|
| 1936 |
+
"AGACUCCUACGGGAGGCAGC AGUAGG",
|
| 1937 |
+
"AGC UAA",
|
| 1938 |
+
"AUCAGG AGGAAC",
|
| 1939 |
+
"AUU AC",
|
| 1940 |
+
"UC UAG",
|
| 1941 |
+
"UAUU AA",
|
| 1942 |
+
"AGG UGGUGCAUGGUUGUCG",
|
| 1943 |
+
"AGG AGGAAC",
|
| 1944 |
+
"ACGUCAAAUCAUC AUGCCCCUU",
|
| 1945 |
+
"GCGG CC",
|
| 1946 |
+
"UGG AUG",
|
| 1947 |
+
"AUU AGAU",
|
| 1948 |
+
"UGC AGC",
|
| 1949 |
+
"UU UGAG",
|
| 1950 |
+
"UGAA GAAGG",
|
| 1951 |
+
"UAA UAA",
|
| 1952 |
+
"UU UGUC",
|
| 1953 |
+
"UGAGG UAACGGC",
|
| 1954 |
+
"AUAG AA",
|
| 1955 |
+
"AAC UC",
|
| 1956 |
+
"UGG GCG",
|
| 1957 |
+
"AG UUUC",
|
| 1958 |
+
"AUG UUC",
|
| 1959 |
+
"UGG ACC",
|
| 1960 |
+
"UUCC CC",
|
| 1961 |
+
"AG UUGC",
|
| 1962 |
+
"UGAA AGCCC",
|
| 1963 |
+
"UGC AGG",
|
| 1964 |
+
"AAG UCCUC",
|
| 1965 |
+
"UG ACCG",
|
| 1966 |
+
"UGG AUC",
|
| 1967 |
+
"AAG AGG",
|
| 1968 |
+
"AUU GCGAA",
|
| 1969 |
+
"ACG AUG",
|
| 1970 |
+
"UGG AAAC",
|
| 1971 |
+
"AUAA GC",
|
| 1972 |
+
"GG UGGAA",
|
| 1973 |
+
"UGACGCUGAGG AGCGAA",
|
| 1974 |
+
"GAAC GC",
|
| 1975 |
+
"GAAUC UUCC",
|
| 1976 |
+
"UUC GC",
|
| 1977 |
+
"ACCUGAGAGGG UGAUCGGCC",
|
| 1978 |
+
"ACACUGGAACUGAGACACGGUCC AGACUCCUACGGGAGGCAGCAGUGGGGAA",
|
| 1979 |
+
"GGCUAAC UUCG",
|
| 1980 |
+
"AG AGAC",
|
| 1981 |
+
"AG AGGC",
|
| 1982 |
+
"UAC UC",
|
| 1983 |
+
"UAAC GGCCC",
|
| 1984 |
+
"UUG AGUGC",
|
| 1985 |
+
"AAC AC",
|
| 1986 |
+
"AG UGCC",
|
| 1987 |
+
"AGCGC GCG",
|
| 1988 |
+
"UG UGCC",
|
| 1989 |
+
"AGC AGC",
|
| 1990 |
+
"ACCC GAA",
|
| 1991 |
+
"ACAA CC",
|
| 1992 |
+
"GGG AGGAAC",
|
| 1993 |
+
"ACC UGGGG",
|
| 1994 |
+
"ACGAA AGUC",
|
| 1995 |
+
"UC AUGC",
|
| 1996 |
+
"ACGG GG",
|
| 1997 |
+
"AU AUGG",
|
| 1998 |
+
"UC UUUU",
|
| 1999 |
+
"GGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG AGGG",
|
| 2000 |
+
"UU AGAG",
|
| 2001 |
+
"UGAUGC AGCGACGCC",
|
| 2002 |
+
"UG UAGG",
|
| 2003 |
+
"GC AUGG",
|
| 2004 |
+
"AGAA AGCCAC",
|
| 2005 |
+
"UGG AUU",
|
| 2006 |
+
"UUGC AGAA",
|
| 2007 |
+
"UU UCCC",
|
| 2008 |
+
"UG UUAA",
|
| 2009 |
+
"UU GAAG",
|
| 2010 |
+
"UCAA CCG",
|
| 2011 |
+
"UGG UAG",
|
| 2012 |
+
"GGCUAACUACGUGCCAGCAGCCGCGGUAAUACG UAGG",
|
| 2013 |
+
"GAA AGG",
|
| 2014 |
+
"UG AGGAA",
|
| 2015 |
+
"UU ACCAAGGC",
|
| 2016 |
+
"UGUAGC AGUGAA",
|
| 2017 |
+
"UAGCCGGCC UGAGAGGG",
|
| 2018 |
+
"UGG UAC",
|
| 2019 |
+
"UCGCGG AUCAGC",
|
| 2020 |
+
"GGAA ACG",
|
| 2021 |
+
"UGUG UGAAGAAGGCC",
|
| 2022 |
+
"GGCC ACAUUGGGAC",
|
| 2023 |
+
"AUC UCC",
|
| 2024 |
+
"AGGGC GCG",
|
| 2025 |
+
"UG UGGG",
|
| 2026 |
+
"UAAC GC",
|
| 2027 |
+
"ACC UCC",
|
| 2028 |
+
"GGGCCUUGUACACACCGCCCGUCACACC AUGGG",
|
| 2029 |
+
"UU UCAA",
|
| 2030 |
+
"UGG UCGG",
|
| 2031 |
+
"AGGG AC",
|
| 2032 |
+
"UAGGC G",
|
| 2033 |
+
"UG UAAG",
|
| 2034 |
+
"UGG AGGAA",
|
| 2035 |
+
"UUGACGG UACC",
|
| 2036 |
+
"AGUGAGGAA UAUUGGUCAA",
|
| 2037 |
+
"UG ACAA",
|
| 2038 |
+
"AUU UUC",
|
| 2039 |
+
"AGGUGGUGCAUGGUUGUCG UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCCGCAACGAGCGCAA",
|
| 2040 |
+
"AGC ACC",
|
| 2041 |
+
"AGAA CC",
|
| 2042 |
+
"AUGAAGUC GGAAUCGCUAGUAA",
|
| 2043 |
+
"GG UCC",
|
| 2044 |
+
"AG UGAC",
|
| 2045 |
+
"AG AGCC",
|
| 2046 |
+
"UGC UC",
|
| 2047 |
+
"AC AUG",
|
| 2048 |
+
"UAUG CC",
|
| 2049 |
+
"AUUAGC UAG",
|
| 2050 |
+
"UCAA CCC",
|
| 2051 |
+
"AU AUAC",
|
| 2052 |
+
"UAA ACC",
|
| 2053 |
+
"AU AUCC",
|
| 2054 |
+
"UU AUUC",
|
| 2055 |
+
"UAC AGAGGG",
|
| 2056 |
+
"UUC GAA",
|
| 2057 |
+
"UU GAAC",
|
| 2058 |
+
"AG UAAC",
|
| 2059 |
+
"AGC GGC",
|
| 2060 |
+
"UCC UCC",
|
| 2061 |
+
"AGC UCG",
|
| 2062 |
+
"UUCGAAGC AACGCGAAGAACCUUACC",
|
| 2063 |
+
"U AUCCC",
|
| 2064 |
+
"GCGUUG UCCGGAA",
|
| 2065 |
+
"UGG CCC",
|
| 2066 |
+
"AG UACG",
|
| 2067 |
+
"ACGGCC UUCGGGUUGUAA",
|
| 2068 |
+
"AAG ACC",
|
| 2069 |
+
"UAUUGG GCGUAA",
|
| 2070 |
+
"AA GAA",
|
| 2071 |
+
"UU UAAG",
|
| 2072 |
+
"UUCGGAA UUACUGGGCGUAA",
|
| 2073 |
+
"UGAG AUAC",
|
| 2074 |
+
"UC UUGC",
|
| 2075 |
+
"AG UUAA"
|
| 2076 |
+
]
|
| 2077 |
+
}
|
| 2078 |
+
}
|
tokenizer/tokenizer_config.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"added_tokens_decoder": {
|
| 4 |
+
"0": {
|
| 5 |
+
"content": "",
|
| 6 |
+
"lstrip": false,
|
| 7 |
+
"normalized": true,
|
| 8 |
+
"rstrip": false,
|
| 9 |
+
"single_word": false,
|
| 10 |
+
"special": true
|
| 11 |
+
}
|
| 12 |
+
},
|
| 13 |
+
"bos_token": "<|endoftext|>",
|
| 14 |
+
"clean_up_tokenization_spaces": true,
|
| 15 |
+
"eos_token": "<|endoftext|>",
|
| 16 |
+
"model_max_length": 1024,
|
| 17 |
+
"tokenizer_class": "GPT2Tokenizer"
|
| 18 |
+
}
|
tokenizer/vocab.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"<|endoftext|>":0,"A":1,"B":2,"C":3,"D":4,"G":5,"H":6,"K":7,"M":8,"N":9,"R":10,"S":11,"U":12,"V":13,"W":14,"X":15,"Y":16,"Ċ":17,"Ġ":18,"GG":19,"AA":20,"UU":21,"CC":22,"AG":23,"UG":24,"AC":25,"UC":26,"UGG":27,"GC":28,"AGG":29,"UAA":30,"AGC":31,"AUU":32,"ACC":33,"AUG":34,"UCC":35,"GAA":36,"UAC":37,"UGC":38,"AUC":39,"UAG":40,"UUC":41,"AAC":42,"GGC":43,"UUG":44,"AAG":45,"GGG":46,"CCC":47,"AU":48,"UGAA":49,"ACG":50,"AUGG":51,"UAAC":52,"GCG":53,"UCG":54,"AGGC":55,"UGAG":56,"UGGC":57,"AUGC":58,"AGCC":59,"UGCC":60,"AUCC":61,"GGAA":62,"AUAA":63,"UACC":64,"UUUU":65,"ACGG":66,"AGGG":67,"UAUU":68,"AGAA":69,"UUGG":70,"GCC":71,"UAGC":72,"UCAA":73,"UUAA":74,"GAAC":75,"ACAA":76,"UAGG":77,"UGGG":78,"ACCC":79,"UGGGG":80,"UGAC":81,"AUAC":82,"GCGG":83,"AGGAA":84,"UUCC":85,"AGCG":86,"UCCC":87,"GCAA":88,"AGAC":89,"GGCC":90,"AUUC":91,"UUUC":92,"UUGC":93,"AAAA":94,"AGAG":95,"CCG":96,"UACG":97,"ACAC":98,"AUAG":99,"GGGG":100,"UGUC":101,"UAAG":102,"UAUC":103,"UUUG":104,"AGUC":105,"AUUG":106,"GGCG":107,"AAAC":108,"AAGUC":109,"AUGAA":110,"UGUG":111,"UCUC":112,"UGGAA":113,"ACCG":114,"AGUG":115,"UGGGC":116,"UUAC":117,"UCGC":118,"UUCGG":119,"UGCG":120,"UAUG":121,"UUCG":122,"UUUAA":123,"UCGG":124,"UUAG":125,"UCUG":126,"UCCG":127,"AACG":128,"GAAG":129,"AGUGG":130,"UCAC":131,"AUAAC":132,"UGAGG":133,"AUGGC":134,"AGAGG":135,"AGAU":136,"AUGCC":137,"ACCAA":138,"UAGGC":139,"GGGC":140,"AUUAA":141,"GGUGAA":142,"UACGGG":143,"AUCG":144,"AAGCC":145,"UUGAA":146,"UAU":147,"UACAC":148,"GCGAA":149,"CCUU":150,"CCCG":151,"AUGCG":152,"ACUC":153,"UGUU":154,"GGCUAAC":155,"AAGG":156,"UCAG":157,"ACGC":158,"UGUAGC":159,"UGACGC":160,"UGAGAC":161,"UUCCC":162,"GCGUAA":163,"AGCAGCC":164,"AUGGG":165,"AGGCAGC":166,"AGUGGC":167,"AGGGC":168,"UACAA":169,"UCAGC":170,"AUUGG":171,"GAAGGC":172,"GCGGUAA":173,"ACGAA":174,"UUAAG":175,"UGCCAGCAGCC":176,"CCCC":177,"UGUCG":178,"UUGGG":179,"UGCAA":180,"AGCAA":181,"AUCCC":182,"UACGGGAGGCAGC":183,"ACGGG":184,"UUAAC":185,"UUCGGG":186,"ACUG":187,"UUGCC":188,"ACCGG":189,"UAGAG":190,"UUGUAA":191,"UAGUCC":192,"AGGAUU":193,"UAAGG":194,"UGCCAGCAGCCGCGGUAA":195,"UCCUACGGGAGGCAGC":196,"AGGGG":197,"GCACAA":198,"AUAUU":199,"AUAUC":200,"AGUU":201,"UAAUACC":202,"UAAAA":203,"UACGG":204,"AGGAAC":205,"UGCCC":206,"UUGAC":207,"GAAGC":208,"UGGCC":209,"UCUU":210,"UAGGG":211,"AGCCC":212,"UGAGACACGG":213,"AUUAGC":214,"AUAAG":215,"GCUGGC":216,"AGGCC":217,"ACUU":218,"AGCGUGGGG":219,"AGCAAAC":220,"ACCCC":221,"AGGAAGG":222,"UAACC":223,"UUGACGG":224,"AGGAUUAGAU":225,"ACAG":226,"AGACUCCUACGGGAGGCAGC":227,"UGGUC":228,"GGCGG":229,"GCGC":230,"UACCC":231,"UGGAGC":232,"AUGUGG":233,"AGUGGGGAA":234,"UGUAGCGGUGAA":235,"GGGCC":236,"UAGUAA":237,"UCCGG":238,"NN":239,"ĠG":240,"UGAAG":241,"UAGCC":242,"ACAUGC":243,"UCAAC":244,"AGUAC":245,"AGGAUG":246,"AGGAUUAGAUACCC":247,"AGUGC":248,"UAUGG":249,"ACGCC":250,"UAGUUGG":251,"UGUAA":252,"AACC":253,"ACUGC":254,"UAUUGG":255,"UGGGCGUAA":256,"UUUUC":257,"UGAGUAAC":258,"UGCUGC":259,"UAGAA":260,"AUUCC":261,"UAAGC":262,"UAUAA":263,"ACGUC":264,"AAGC":265,"AGAAG":266,"AGCGCAA":267,"UGACGG":268,"AGCGC":269,"UUUUG":270,"UGCAAC":271,"GGUG":272,"UCAGCUCG":273,"UGGUAGUCC":274,"UUUCC":275,"AGCGG":276,"AGAAC":277,"UGAAC":278,"UGGAAC":279,"UUCAA":280,"AGAUU":281,"ACUCC":282,"AGAUG":283,"UUAUU":284,"UGGGAA":285,"AGAGC":286,"AUCAA":287,"GGCUAACUACG":288,"AGCAAC":289,"AGCGUGGGGAGCAAAC":290,"AGGAUUAGAUACCCUGGUAGUCC":291,"ACAUU":292,"UAAACG":293,"UGAGGC":294,"UGUGAA":295,"GAAGG":296,"AUGCGUAG":297,"UUGGC":298,"UAGGGG":299,"AGUGAA":300,"AGGGAA":301,"UGAUC":302,"UGGGAC":303,"UUAAGUCCC":304,"ACCGCCCG":305,"GAACGCUGGC":306,"AAGUCGAAC":307,"AGCGAA":308,"AGCUC":309,"UCAAAGGAA":310,"UCAACC":311,"GCCUGGGG":312,"CCCUU":313,"UCCCC":314,"UGCCG":315,"UGAUCC":316,"UGAGAUG":317,"UUACC":318,"AGACUCCUACGGGAGGCAGCAGUGGGGAA":319,"UCGCC":320,"GGGAC":321,"AGGCG":322,"AGGAAGGUGGGG":323,"GGGCCC":324,"UAUUC":325,"UACGUUCCC":326,"UCAAAGGAAUUGACGG":327,"AUACC":328,"UGAGACACGGCCC":329,"AUAGC":330,"UCAUU":331,"UACACACCGCCCG":332,"UCGAA":333,"AUAGG":334,"AUCGG":335,"UUUGG":336,"UGAUGC":337,"UGCGAA":338,"UAGAGG":339,"GCACAAGCGG":340,"AAGUCG":341,"UGGCG":342,"UCGGAA":343,"GGCGACG":344,"UGAUG":345,"UAGCG":346,"AUACG":347,"AACGAGCGCAA":348,"UCAGCUCGUGUCG":349,"CCUUACC":350,"UUGGGUUAAGUCCC":351,"ACGUGC":352,"ACUGG":353,"AGUAA":354,"GCAAGG":355,"UGUGG":356,"UCAGCUCGUGUCGUGAGAUG":357,"UAUCC":358,"AGUUC":359,"AGACC":360,"ACCAGUGGC":361,"AUAUG":362,"UCAGG":363,"UCUUC":364,"GCAACGAGCGCAA":365,"UUACUGGGCGUAA":366,"UGAUU":367,"UUAUCC":368,"UGACC":369,"UCAUC":370,"UAUGC":371,"UAGUC":372,"GCCG":373,"AUCAGC":374,"AUUCG":375,"UAAUACCGC":376,"UGGGGG":377,"AACGCGAA":378,"ACAGG":379,"UGCGG":380,"GGCUAACUCCG":381,"AUGUGGUUUAA":382,"AGGAAGGUGGGGAUG":383,"GCCGCG":384,"UCGCUAGUAA":385,"UGAAAC":386,"ACGGC":387,"UUGUACACACCGCCCG":388,"UGGAAUUCC":389,"UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCC":390,"GAAAGCC":391,"AUUGC":392,"UGGUCUGAG":393,"UCGGC":394,"UCCAA":395,"AUUAGCUAGUUGG":396,"UAGGCGG":397,"AGUUG":398,"GAACGGG":399,"UCACC":400,"UAAAAC":401,"UCUGG":402,"UAUUG":403,"UUCGGGUUGUAA":404,"ACUUC":405,"ACGUGCUACAA":406,"GAAAA":407,"ĠC":408,"UCUGC":409,"UUUGC":410,"UACCG":411,"UGCAACUCG":412,"AUGGCUGUCG":413,"UUGUUGG":414,"UGUGC":415,"AACGCGAAGAA":416,"UGUUC":417,"AGAGGG":418,"AUCCG":419,"GCGUUG":420,"AACAA":421,"UUGGAA":422,"AUAU":423,"UCUCC":424,"AGAUC":425,"ACGCCG":426,"UUAACC":427,"AGGCGG":428,"ACAUGCAAGUCGAAC":429,"UGGUGC":430,"UAAUAC":431,"UACCAA":432,"GGCCC":433,"AGCAC":434,"UGAACC":435,"ACACUGGGAC":436,"AUCAGG":437,"UGAGUAACACG":438,"GCGUG":439,"UAUAC":440,"UUGUC":441,"GAAUC":442,"UUAGC":443,"UCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCCGCAACGAGCGCAA":444,"AGCAACGCCGCG":445,"AGUAGG":446,"UAACG":447,"GCACAAGCGGUGGAGC":448,"UUUAG":449,"AGGGGG":450,"UACACACGUGCUACAA":451,"GGCGC":452,"UGAGAGGG":453,"UGCGC":454,"AGCCG":455,"UGAAUACGUUCCC":456,"UUUAC":457,"NNNN":458,"GGCUAACUCCGUGCCAGCAGCCGCGGUAA":459,"AUGGAA":460,"UGGGCGC":461,"UGGGCGAAAGCC":462,"UAUAG":463,"GAAGGCC":464,"GGCAGC":465,"AUCGC":466,"UGUUG":467,"ACCCG":468,"GGCUAACUACGUGCCAGCAGCCGCGGUAA":469,"AGUCC":470,"AUCAGCC":471,"UGUCC":472,"UCAAAGGAAUUGACGGGGGCCC":473,"UGACGCUGAGGC":474,"UGAGC":475,"UUCCG":476,"AAGAC":477,"GAACG":478,"AACGCGAAGAACCUUACC":479,"UGGCGAAGGC":480,"AACGC":481,"GGAUU":482,"ACACUGGGACUGAGACACGGCCC":483,"AGCCAUGCC":484,"AUGAC":485,"GCACAAGCGGUGGAGCAUGUGGUUUAA":486,"GCGCC":487,"UGAUGG":488,"UGCUGCAUGGCUGUCG":489,"AGGUC":490,"AUGUC":491,"GCCCC":492,"UGACG":493,"GGGCCUUGUACACACCGCCCG":494,"ACCUC":495,"GGGGC":496,"UCACACC":497,"AUUGGGCGUAA":498,"UAACAAGG":499,"UUAAAA":500,"ACCGC":501,"UGUAGCGGUGAAAUGCGUAG":502,"UUGGGC":503,"UAACGGC":504,"ACGCCGUAAACG":505,"GAAAC":506,"AGCUAAC":507,"AUAAAA":508,"AGCGUGGGGAGCAAACAGGAUUAGAUACCCUGGUAGUCC":509,"AGCGAAC":510,"UCCUC":511,"AGAAAA":512,"UGAAGG":513,"UAUUGCACAA":514,"UGGGCGCAAGCC":515,"UUUUGG":516,"UGGUCUGAGAGGAUG":517,"AUCAG":518,"ACCAAGGCGACG":519,"GAACGCUGGCGGC":520,"GGCUAACUACGUGCCAGCAGCCGCGGUAAUACG":521,"UGAGACACGGUCC":522,"AGAAGC":523,"UCCCG":524,"UUCGGAA":525,"ACGGCC":526,"UAUGAA":527,"UGACGCUGAGG":528,"AUCAUU":529,"ACCAGUGGCGAAGGC":530,"ACCAAGGC":531,"UA":532,"UUUGAC":533,"ACAAC":534,"AUGUGAA":535,"UGUAGCGGUGAAAUGC":536,"UGUAG":537,"UGGGAAC":538,"AUCAUC":539,"GGCCG":540,"UAAUC":541,"GGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG":542,"UAAAGC":543,"UGGCUC":544,"AGACUGCC":545,"UGUAC":546,"UUGAG":547,"GGUC":548,"ACACUGGAAC":549,"UAAUACCGG":550,"UCCGGAA":551,"UUAAUCGGAA":552,"GCCUGGGGAGUAC":553,"AUAACC":554,"AGUCG":555,"AUGGGC":556,"GGGUC":557,"AGUUCGG":558,"AGGAAGGUGGGGAUGACGUC":559,"UGAGAA":560,"AUCCCC":561,"GCGGUGAAUACGUUCCC":562,"UGGAGG":563,"AGAGUUUG":564,"UGCAAGCG":565,"UUUAUU":566,"UGGAC":567,"UGAGUAA":568,"GAAGCACC":569,"AGCCAUGCCGCG":570,"GGCAA":571,"UUGUCG":572,"UAUUGGACAA":573,"UUGGGG":574,"AUCUC":575,"GAAAGC":576,"UGAAAA":577,"ACAGC":578,"UGAUGAA":579,"GCCUGGGGAGUACGGCC":580,"GAACC":581,"UGGGCC":582,"AGAGAA":583,"AUGGGG":584,"AGGCCC":585,"AUAACG":586,"AUGCGUAGAG":587,"GAAGGCG":588,"UCGGG":589,"UGGCAA":590,"AGCCCC":591,"UCGCGG":592,"GGACGGG":593,"UCGUAACAAGG":594,"AGCUUGC":595,"UUUUAA":596,"AGCGACGCC":597,"UUAAUCGGAAUUACUGGGCGUAA":598,"GGAAGG":599,"ACAUC":600,"UGAGUAACGCG":601,"UUAUG":602,"GCCUGGGGAG":603,"UAGCCG":604,"UGGGGUAA":605,"UUCGAUGC":606,"CCCUUG":607,"CCCGG":608,"UUUGAA":609,"GCAAGGC":610,"AUGGCCCUU":611,"AUUUC":612,"AGGAC":613,"GAACGCUGGCGGCG":614,"GGCGGACGGG":615,"UUAAGC":616,"UAUGGG":617,"UUAUC":618,"AUAUUC":619,"UGGAG":620,"AAGUCAUC":621,"UGGGGC":622,"AGUCUGCAACUCG":623,"ACCCGC":624,"AGAUGG":625,"GGAAUCGCUAGUAA":626,"UUCUC":627,"AUUAAG":628,"ACGUCAA":629,"CCAA":630,"UUUUGC":631,"UCAAAA":632,"AUGAAG":633,"AUGAAC":634,"AGUAG":635,"ACACC":636,"UGCUUAAC":637,"ACACUGGAACUGAGACACGGUCC":638,"ACACUGGGACUGAGACACGGCCCAGACUCCUACGGGAGGCAGCAGUGGGGAA":639,"ACUGGG":640,"UAUCAGC":641,"UGGUGCAUGG":642,"ACAUGCAAGUCG":643,"UACGAA":644,"UUAUUGGGCGUAA":645,"CCCAA":646,"AUGAUU":647,"AACGG":648,"UUUCG":649,"ACUUG":650,"AGGAGG":651,"AAAAAA":652,"UUGAAAC":653,"GGGCCUUGUACACACCGCCCGUCACACC":654,"AGGGUGCG":655,"UAAGCACC":656,"UGCGGC":657,"UGGCGC":658,"UGCAUU":659,"UUUUCC":660,"UCCCAA":661,"UUAGG":662,"AGCGUUG":663,"UGAAGAAGGCC":664,"UCCGC":665,"UUUGGG":666,"UUCGGGG":667,"ĠAGAGUUUG":668,"UUAUCCGGAUU":669,"UGUUGG":670,"UAGGAA":671,"UGAAGC":672,"ĠCC":673,"UGCAC":674,"AGUGGCGAACGGG":675,"UAAAC":676,"ACGAACGCUGGCGGCG":677,"UUAAGUC":678,"UGGGGGAA":679,"AUUGAA":680,"AGGUGCUGCAUGGCUGUCG":681,"UAUCG":682,"UUGACC":683,"UAUUCC":684,"AGUGAGGAA":685,"ACCACC":686,"UUGCG":687,"ACAAAA":688,"AGGAAG":689,"UAUAUU":690,"UAAUACAUGC":691,"ACAUUGGGAC":692,"AUGCCCCUU":693,"UGCCCC":694,"ACUAC":695,"ACAAG":696,"GGGAA":697,"AGAAGAAGCACC":698,"UGCGGG":699,"UUCAG":700,"UAGCCGGCC":701,"UUCGAAGC":702,"AGCCAC":703,"AGCAACGCCGCGUGAG":704,"AUUGAACGCUGGCGGC":705,"UAGCUGGUCUGAGAGGAUG":706,"UUGCAA":707,"AUGAAGUC":708,"UAGAGGUGAA":709,"UUGCCAGC":710,"UUAAAAC":711,"ACUAA":712,"UGAGAGG":713,"UCUUG":714,"ACCGGUGGCGAAGGC":715,"AGCCAA":716,"ĠUACG":717,"AUGCCC":718,"UAGGGC":719,"ACGCCGUAAACGAUG":720,"AGUUGG":721,"UGAGGG":722,"AUUUAA":723,"UGACGGUACC":724,"UCUAA":725,"UGGGGAA":726,"GGAC":727,"UGGUGUAGCGGUGAAAUGC":728,"UCAAG":729,"AGUGGG":730,"AUACAA":731,"GCUGGCGGCG":732,"GGAG":733,"UAACACAUGCAAGUCGAAC":734,"GCGAGG":735,"ACCUGAGAGGG":736,"ACCAGUGGCGAAGGCGGC":737,"UUUUUUUU":738,"UCGCAAG":739,"ACGGUACC":740,"AUGUG":741,"UACGC":742,"UGCCGC":743,"AUAUAA":744,"GCGUGAG":745,"UAGCGAA":746,"GGUGACAA":747,"AUUAUU":748,"AGACG":749,"AAUAA":750,"UCAAAGGAAUUGACGGGGGCCCGCACAAGCGGUGGAGCAUGUGGUUUAA":751,"UUCGGAUUG":752,"AGCUCC":753,"UGUGGC":754,"GGAAUUCC":755,"AUUCGUAG":756,"GGAAC":757,"UGACAC":758,"UUAGGG":759,"UAGGCGGC":760,"AGUUUU":761,"UGGGCUACACACGUGCUACAA":762,"UGGUUC":763,"ACGUCAAAUCAUC":764,"UGAAGUCGUAACAAGG":765,"AUCCAA":766,"NNNNNNNN":767,"AUCAC":768,"GGGCUCAACC":769,"UAACGCG":770,"AUGUCC":771,"UUCGGAUCG":772,"UGGGGGAAACCC":773,"GCCGG":774,"AGGCAA":775,"GGCUAA":776,"UGAUCGGCC":777,"UAGAGGUGAAAUUCGUAG":778,"UGAUAC":779,"AUGACC":780,"UGAGCC":781,"UGAGGUAA":782,"UCUAC":783,"UGACGCUGAGGCGCGAA":784,"AUUUU":785,"UCGCG":786,"AGCAGG":787,"AUUAG":788,"UCCCCC":789,"UCUGCC":790,"UACCAAGGCGACG":791,"GAAGAA":792,"ĠAGAGUUUGAUCC":793,"GGUGACAAACCGG":794,"GCAAUGGGCGAAAGCC":795,"UGUAGCGGUGAAAUGCGUAGAG":796,"AGGACG":797,"ACUGCC":798,"AUGGCGAAGGC":799,"UGGUG":800,"AUGGCC":801,"UCAUG":802,"AGCAUC":803,"GGGGG":804,"AGACGG":805,"UAUAAC":806,"AGCUAACGC":807,"UAUAAG":808,"UUGUU":809,"AUGCAA":810,"UUGACAUCC":811,"AUUCAA":812,"ĠGACGAACGCUGGCGGCG":813,"GGCUAACUACGUG":814,"AGUGGCGGACGGG":815,"UGGGUAGC":816,"UGAUCCAGCCAUGCCGCG":817,"UUCAC":818,"AGGGGC":819,"UAGAGC":820,"ACCAGCC":821,"GCCUGGGGAGUACGG":822,"ACGCCC":823,"UGCUUAACACAUGCAAGUCGAAC":824,"UGGUGCAUGGUUGUCG":825,"UAACGG":826,"UAAUACCGCAUACG":827,"UGUAGCGGUGAAAUGCGUAGAUAUC":828,"AGCCGCC":829,"GCCUGGGGAGUACGGCCGCAAGG":830,"GGGGGC":831,"UGUGAC":832,"AUUUAC":833,"AGAAGAA":834,"UAUUGC":835,"UUCGAUGCAACGCGAAGAACCUUACC":836,"GGUGAAUACGUUCCC":837,"UAGCAA":838,"ACGUU":839,"UAUUGGUCAA":840,"AUAUGC":841,"AUAGCC":842,"UGUUUU":843,"GGGUUUAA":844,"AGCAAUGCC":845,"UACCCC":846,"UAGGUGG":847,"AGCAUU":848,"AUGAAGC":849,"AGGCGC":850,"UGCCGG":851,"AAGUCAUCAUGGCCCUU":852,"UGCCUAAUACAUGC":853,"CCCGCG":854,"AGCGUGGGGAGCAAACAGG":855,"ACCAGUGGCGAAGGCG":856,"UGCAAGCGUUAAUCGGAAUUACUGGGCGUAA":857,"UGGUAA":858,"UUUGGC":859,"UAGUCCGG":860,"UACCGG":861,"UGAAGUC":862,"UCAAGC":863,"AGCGUGGGGAGCGAAC":864,"UCGAUG":865,"UAAGAA":866,"UAUGGC":867,"AGCCGG":868,"UGGUGG":869,"ACCCAA":870,"ACCAC":871,"CCCGC":872,"AGAAGG":873,"UUCUUC":874,"GGACCC":875,"AGGUAG":876,"AGAGGAA":877,"UUCGGC":878,"UCUCAGUUCGG":879,"AUUAAGC":880,"UACGGGG":881,"UGCUCC":882,"GCAGAU":883,"AGACUCCUACGGGAGGCAGCAGUAGG":884,"AGCUAA":885,"AUCAGGAGGAAC":886,"AUUAC":887,"UCUAG":888,"UAUUAA":889,"AGGUGGUGCAUGGUUGUCG":890,"AGGAGGAAC":891,"ACGUCAAAUCAUCAUGCCCCUU":892,"GCGGCC":893,"UGGAUG":894,"AUUAGAU":895,"UGCAGC":896,"UUUGAG":897,"UGAAGAAGG":898,"UAAUAA":899,"UUUGUC":900,"UGAGGUAACGGC":901,"AUAGAA":902,"AACUC":903,"UGGGCG":904,"AGUUUC":905,"AUGUUC":906,"UGGACC":907,"UUCCCC":908,"AGUUGC":909,"UGAAAGCCC":910,"UGCAGG":911,"AAGUCCUC":912,"UGACCG":913,"UGGAUC":914,"AAGAGG":915,"AUUGCGAA":916,"ACGAUG":917,"UGGAAAC":918,"AUAAGC":919,"GGUGGAA":920,"UGACGCUGAGGAGCGAA":921,"GAACGC":922,"GAAUCUUCC":923,"UUCGC":924,"ACCUGAGAGGGUGAUCGGCC":925,"ACACUGGAACUGAGACACGGUCCAGACUCCUACGGGAGGCAGCAGUGGGGAA":926,"GGCUAACUUCG":927,"AGAGAC":928,"AGAGGC":929,"UACUC":930,"UAACGGCCC":931,"UUGAGUGC":932,"AACAC":933,"AGUGCC":934,"AGCGCGCG":935,"UGUGCC":936,"AGCAGC":937,"ACCCGAA":938,"ACAACC":939,"GGGAGGAAC":940,"ACCUGGGG":941,"ACGAAAGUC":942,"UCAUGC":943,"ACGGGG":944,"AUAUGG":945,"UCUUUU":946,"GGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGGAGGG":947,"UUAGAG":948,"UGAUGCAGCGACGCC":949,"UGUAGG":950,"GCAUGG":951,"AGAAAGCCAC":952,"UGGAUU":953,"UUGCAGAA":954,"UUUCCC":955,"UGUUAA":956,"UUGAAG":957,"UCAACCG":958,"UGGUAG":959,"GGCUAACUACGUGCCAGCAGCCGCGGUAAUACGUAGG":960,"GAAAGG":961,"UGAGGAA":962,"UUACCAAGGC":963,"UGUAGCAGUGAA":964,"UAGCCGGCCUGAGAGGG":965,"UGGUAC":966,"UCGCGGAUCAGC":967,"GGAAACG":968,"UGUGUGAAGAAGGCC":969,"GGCCACAUUGGGAC":970,"AUCUCC":971,"AGGGCGCG":972,"UGUGGG":973,"UAACGC":974,"ACCUCC":975,"GGGCCUUGUACACACCGCCCGUCACACCAUGGG":976,"UUUCAA":977,"UGGUCGG":978,"AGGGAC":979,"UAGGCG":980,"UGUAAG":981,"UGGAGGAA":982,"UUGACGGUACC":983,"AGUGAGGAAUAUUGGUCAA":984,"UGACAA":985,"AUUUUC":986,"AGGUGGUGCAUGGUUGUCGUCAGCUCGUGUCGUGAGAUGUUGGGUUAAGUCCCGCAACGAGCGCAA":987,"AGCACC":988,"AGAACC":989,"AUGAAGUCGGAAUCGCUAGUAA":990,"GGUCC":991,"AGUGAC":992,"AGAGCC":993,"UGCUC":994,"ACAUG":995,"UAUGCC":996,"AUUAGCUAG":997,"UCAACCC":998,"AUAUAC":999,"UAAACC":1000,"AUAUCC":1001,"UUAUUC":1002,"UACAGAGGG":1003,"UUCGAA":1004,"UUGAAC":1005,"AGUAAC":1006,"AGCGGC":1007,"UCCUCC":1008,"AGCUCG":1009,"UUCGAAGCAACGCGAAGAACCUUACC":1010,"UAUCCC":1011,"GCGUUGUCCGGAA":1012,"UGGCCC":1013,"AGUACG":1014,"ACGGCCUUCGGGUUGUAA":1015,"AAGACC":1016,"UAUUGGGCGUAA":1017,"AAGAA":1018,"UUUAAG":1019,"UUCGGAAUUACUGGGCGUAA":1020,"UGAGAUAC":1021,"UCUUGC":1022,"AGUUAA":1023}
|