acorrochano committed on
Commit
e668d04
·
verified ·
1 Parent(s): 456fe4b

Training in progress, step 1000

Browse files
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "gpt2",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "initializer_range": 0.02,
12
+ "layer_norm_epsilon": 1e-05,
13
+ "model_type": "gpt2",
14
+ "n_ctx": 1024,
15
+ "n_embd": 768,
16
+ "n_head": 12,
17
+ "n_inner": null,
18
+ "n_layer": 12,
19
+ "n_positions": 1024,
20
+ "reorder_and_upcast_attn": false,
21
+ "resid_pdrop": 0.1,
22
+ "scale_attn_by_inverse_layer_idx": false,
23
+ "scale_attn_weights": true,
24
+ "summary_activation": null,
25
+ "summary_first_dropout": 0.1,
26
+ "summary_proj_to_labels": true,
27
+ "summary_type": "cls_index",
28
+ "summary_use_proj": true,
29
+ "task_specific_params": {
30
+ "text-generation": {
31
+ "do_sample": true,
32
+ "max_length": 50
33
+ }
34
+ },
35
+ "torch_dtype": "float32",
36
+ "transformers_version": "4.47.1",
37
+ "use_cache": true,
38
+ "vocab_size": 1024
39
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6725615a418199becfc4e1f4897f302deb56c0f4ad5c765544b05d89d7775bbc
3
+ size 346530432
runs/Jan29_15-12-30_7162016/events.out.tfevents.1738163556.7162016 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:416a365288392ca4bbff0f082cc6b472ea84ebbb06daa71d0861aa4f48eb83bd
3
+ size 5462
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<|endoftext|>",
3
+ "eos_token": "<|endoftext|>",
4
+ "pad_token": "<pad>",
5
+ "unk_token": "<unk>"
6
+ }
tokenizer.json ADDED
@@ -0,0 +1,5162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 13,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 13
12
+ },
13
+ "direction": "Right",
14
+ "pad_to_multiple_of": null,
15
+ "pad_id": 2,
16
+ "pad_type_id": 0,
17
+ "pad_token": "<pad>"
18
+ },
19
+ "added_tokens": [
20
+ {
21
+ "id": 0,
22
+ "content": "<|endoftext|>",
23
+ "single_word": false,
24
+ "lstrip": false,
25
+ "rstrip": false,
26
+ "normalized": false,
27
+ "special": true
28
+ },
29
+ {
30
+ "id": 1,
31
+ "content": "<unk>",
32
+ "single_word": false,
33
+ "lstrip": false,
34
+ "rstrip": false,
35
+ "normalized": false,
36
+ "special": true
37
+ },
38
+ {
39
+ "id": 2,
40
+ "content": "<pad>",
41
+ "single_word": false,
42
+ "lstrip": false,
43
+ "rstrip": false,
44
+ "normalized": false,
45
+ "special": true
46
+ }
47
+ ],
48
+ "normalizer": {
49
+ "type": "NFKC"
50
+ },
51
+ "pre_tokenizer": {
52
+ "type": "Metaspace",
53
+ "replacement": "▁",
54
+ "prepend_scheme": "always",
55
+ "split": true
56
+ },
57
+ "post_processor": null,
58
+ "decoder": {
59
+ "type": "Metaspace",
60
+ "replacement": "▁",
61
+ "prepend_scheme": "always",
62
+ "split": true
63
+ },
64
+ "model": {
65
+ "type": "BPE",
66
+ "dropout": null,
67
+ "unk_token": "<unk>",
68
+ "continuing_subword_prefix": null,
69
+ "end_of_word_suffix": null,
70
+ "fuse_unk": false,
71
+ "byte_fallback": false,
72
+ "ignore_merges": false,
73
+ "vocab": {
74
+ "<|endoftext|>": 0,
75
+ "<unk>": 1,
76
+ "<pad>": 2,
77
+ "\n": 3,
78
+ "A": 4,
79
+ "C": 5,
80
+ "G": 6,
81
+ "T": 7,
82
+ "▁": 8,
83
+ "AA": 9,
84
+ "CC": 10,
85
+ "TT": 11,
86
+ "GG": 12,
87
+ "AC": 13,
88
+ "GC": 14,
89
+ "TC": 15,
90
+ "AG": 16,
91
+ "TG": 17,
92
+ "AT": 18,
93
+ "AAAA": 19,
94
+ "ACC": 20,
95
+ "AGG": 21,
96
+ "GT": 22,
97
+ "AAC": 23,
98
+ "ATT": 24,
99
+ "AGC": 25,
100
+ "ATC": 26,
101
+ "CCC": 27,
102
+ "ACG": 28,
103
+ "GGC": 29,
104
+ "ATG": 30,
105
+ "TGC": 31,
106
+ "TCC": 32,
107
+ "AAG": 33,
108
+ "TTC": 34,
109
+ "TGG": 35,
110
+ "GCC": 36,
111
+ "▁C": 37,
112
+ "TAC": 38,
113
+ "TAA": 39,
114
+ "TTTT": 40,
115
+ "TCG": 41,
116
+ "TAG": 42,
117
+ "AAAAAAAA": 43,
118
+ "GCG": 44,
119
+ "TTG": 45,
120
+ "CCG": 46,
121
+ "ACCC": 47,
122
+ "GGG": 48,
123
+ "TAT": 49,
124
+ "▁G": 50,
125
+ "AAAC": 51,
126
+ "AACC": 52,
127
+ "AGAC": 53,
128
+ "AGGC": 54,
129
+ "AGCC": 55,
130
+ "TGCC": 56,
131
+ "AAGC": 57,
132
+ "ACAC": 58,
133
+ "ATCC": 59,
134
+ "ATTC": 60,
135
+ "TACC": 61,
136
+ "ATGC": 62,
137
+ "AAAG": 63,
138
+ "TCCC": 64,
139
+ "ACGG": 65,
140
+ "ACGC": 66,
141
+ "AAGG": 67,
142
+ "TCGC": 68,
143
+ "TCGG": 69,
144
+ "TAAC": 70,
145
+ "ATGG": 71,
146
+ "ACCG": 72,
147
+ "AATT": 73,
148
+ "AATC": 74,
149
+ "TTCC": 75,
150
+ "AGCG": 76,
151
+ "▁CC": 77,
152
+ "ATCG": 78,
153
+ "TGGC": 79,
154
+ "ATAC": 80,
155
+ "TTGC": 81,
156
+ "AATG": 82,
157
+ "AGTC": 83,
158
+ "GTCC": 84,
159
+ "AACG": 85,
160
+ "TTTTTTTT": 86,
161
+ "TTGG": 87,
162
+ "ACTG": 88,
163
+ "TAGG": 89,
164
+ "ATTG": 90,
165
+ "AGTG": 91,
166
+ "TAGC": 92,
167
+ "CCCG": 93,
168
+ "AGTT": 94,
169
+ "GTGC": 95,
170
+ "▁GC": 96,
171
+ "TACG": 97,
172
+ "TCAC": 98,
173
+ "GTGG": 99,
174
+ "▁AC": 100,
175
+ "AAAAC": 101,
176
+ "AAAT": 102,
177
+ "TATT": 103,
178
+ "TATC": 104,
179
+ "TGAC": 105,
180
+ "TCCG": 106,
181
+ "TGCG": 107,
182
+ "TTCG": 108,
183
+ "GGCC": 109,
184
+ "AGAG": 110,
185
+ "TATG": 111,
186
+ "TGTC": 112,
187
+ "TAAG": 113,
188
+ "AGGG": 114,
189
+ "GGCG": 115,
190
+ "TTTC": 116,
191
+ "ACTC": 117,
192
+ "AGAA": 118,
193
+ "ATAA": 119,
194
+ "▁TC": 120,
195
+ "ACTT": 121,
196
+ "▁AA": 122,
197
+ "▁GG": 123,
198
+ "GCGG": 124,
199
+ "TGTG": 125,
200
+ "ATAG": 126,
201
+ "▁AAAAAAAA": 127,
202
+ "▁CG": 128,
203
+ "▁TT": 129,
204
+ "GCCG": 130,
205
+ "TAAAA": 131,
206
+ "TGTT": 132,
207
+ "ACAA": 133,
208
+ "TCTC": 134,
209
+ "GCGC": 135,
210
+ "▁AG": 136,
211
+ "ACAG": 137,
212
+ "TGGG": 138,
213
+ "AAGT": 139,
214
+ "ACCCC": 140,
215
+ "ACGCC": 141,
216
+ "TCTT": 142,
217
+ "TCTG": 143,
218
+ "TTTG": 144,
219
+ "ACGT": 145,
220
+ "AAAAG": 146,
221
+ "AAGCC": 147,
222
+ "ATGCC": 148,
223
+ "GGGG": 149,
224
+ "▁TG": 150,
225
+ "AAACC": 151,
226
+ "AGGCC": 152,
227
+ "TTAC": 153,
228
+ "GGGC": 154,
229
+ "ACTGC": 155,
230
+ "ATAT": 156,
231
+ "ACCGC": 157,
232
+ "TGAG": 158,
233
+ "GTAC": 159,
234
+ "TA": 160,
235
+ "TCAG": 161,
236
+ "ACCCG": 162,
237
+ "▁AT": 163,
238
+ "AACCC": 164,
239
+ "ACCGG": 165,
240
+ "AAAGC": 166,
241
+ "TTAG": 167,
242
+ "ATTCC": 168,
243
+ "▁AAAA": 169,
244
+ "AACGC": 170,
245
+ "TAACC": 171,
246
+ "GTAG": 172,
247
+ "AAAAAAAAAAAAAAAA": 173,
248
+ "ACAT": 174,
249
+ "TCCCC": 175,
250
+ "TGAA": 176,
251
+ "ATCGC": 177,
252
+ "TCAA": 178,
253
+ "TGGCC": 179,
254
+ "TCGT": 180,
255
+ "AACGG": 181,
256
+ "TAGCC": 182,
257
+ "TACCC": 183,
258
+ "ATTGC": 184,
259
+ "AGCGG": 185,
260
+ "AGCGC": 186,
261
+ "ATCGG": 187,
262
+ "CCCGC": 188,
263
+ "▁GT": 189,
264
+ "TTAA": 190,
265
+ "▁AAC": 191,
266
+ "ACGTC": 192,
267
+ "▁GCC": 193,
268
+ "TGCGG": 194,
269
+ "AGAT": 195,
270
+ "▁ACC": 196,
271
+ "TCGCC": 197,
272
+ "CCCGG": 198,
273
+ "ACATC": 199,
274
+ "TCCGC": 200,
275
+ "AGGCG": 201,
276
+ "TTGCC": 202,
277
+ "ATACC": 203,
278
+ "AATAA": 204,
279
+ "ATAAC": 205,
280
+ "AGGGC": 206,
281
+ "AGACC": 207,
282
+ "▁ATT": 208,
283
+ "ACACC": 209,
284
+ "ACAAC": 210,
285
+ "TTTTTTTTTTTTTTTT": 211,
286
+ "TTGT": 212,
287
+ "TCCGG": 213,
288
+ "AAATC": 214,
289
+ "TTCGC": 215,
290
+ "TTCGG": 216,
291
+ "TACGC": 217,
292
+ "TGCCC": 218,
293
+ "ATCCC": 219,
294
+ "▁CCC": 220,
295
+ "TGCGC": 221,
296
+ "AGAAC": 222,
297
+ "AGCCC": 223,
298
+ "TACGG": 224,
299
+ "AAATG": 225,
300
+ "AAAGG": 226,
301
+ "▁AAAAAAAAAAAAAAAA": 227,
302
+ "TATCC": 228,
303
+ "AAATT": 229,
304
+ "GGCGG": 230,
305
+ "▁AAG": 231,
306
+ "▁TAA": 232,
307
+ "ATTCG": 233,
308
+ "TGACC": 234,
309
+ "GGCGC": 235,
310
+ "ATTGG": 236,
311
+ "AATAC": 237,
312
+ "AATGC": 238,
313
+ "AAT": 239,
314
+ "▁ATC": 240,
315
+ "AGGGG": 241,
316
+ "▁AGC": 242,
317
+ "ATAGC": 243,
318
+ "ACAGC": 244,
319
+ "TCCCG": 245,
320
+ "ACGTT": 246,
321
+ "GCCCC": 247,
322
+ "▁AAAAAAAAAAAA": 248,
323
+ "AATCC": 249,
324
+ "AACCG": 250,
325
+ "TAAGC": 251,
326
+ "ACGTG": 252,
327
+ "▁CGC": 253,
328
+ "ACT": 254,
329
+ "TCTGC": 255,
330
+ "ACATT": 256,
331
+ "AAGGC": 257,
332
+ "ATATC": 258,
333
+ "AGAGC": 259,
334
+ "TGGGC": 260,
335
+ "AAAAAAAAAAAA": 261,
336
+ "ATGGC": 262,
337
+ "TATGC": 263,
338
+ "AGTCC": 264,
339
+ "TGAAC": 265,
340
+ "ATCCG": 266,
341
+ "TACCG": 267,
342
+ "TTTTC": 268,
343
+ "ACGGC": 269,
344
+ "TCGTC": 270,
345
+ "TAGGC": 271,
346
+ "TTACC": 272,
347
+ "GCGTC": 273,
348
+ "ACTCC": 274,
349
+ "ACATG": 275,
350
+ "AGTGC": 276,
351
+ "TGTCC": 277,
352
+ "▁ATG": 278,
353
+ "AAGTC": 279,
354
+ "TGGGG": 280,
355
+ "AGCCG": 281,
356
+ "AATAG": 282,
357
+ "ATAGG": 283,
358
+ "ACTAA": 284,
359
+ "TTAAC": 285,
360
+ "TGCCG": 286,
361
+ "TTCCC": 287,
362
+ "TCACC": 288,
363
+ "ACAGG": 289,
364
+ "AATTC": 290,
365
+ "AAACG": 291,
366
+ "ATAAG": 292,
367
+ "ACTAC": 293,
368
+ "AGT": 294,
369
+ "TGAGC": 295,
370
+ "TAACG": 296,
371
+ "ATATG": 297,
372
+ "AGATG": 298,
373
+ "ATATT": 299,
374
+ "AGATC": 300,
375
+ "TGTGC": 301,
376
+ "TTTCC": 302,
377
+ "AGAGG": 303,
378
+ "ATGCG": 304,
379
+ "▁TAC": 305,
380
+ "▁TCC": 306,
381
+ "▁TGC": 307,
382
+ "AGTAC": 308,
383
+ "TTTTG": 309,
384
+ "TGGCG": 310,
385
+ "AGTAA": 311,
386
+ "AGATT": 312,
387
+ "AGACG": 313,
388
+ "ACTGG": 314,
389
+ "ACAAG": 315,
390
+ "ACTTC": 316,
391
+ "CCCC": 317,
392
+ "▁GGC": 318,
393
+ "TCAAC": 319,
394
+ "TCGGC": 320,
395
+ "▁CCG": 321,
396
+ "TTTGC": 322,
397
+ "ATAAAA": 323,
398
+ "AGAAG": 324,
399
+ "TGTGG": 325,
400
+ "TGAGG": 326,
401
+ "TATGG": 327,
402
+ "ACA": 328,
403
+ "TCTAC": 329,
404
+ "AATGG": 330,
405
+ "GCCGC": 331,
406
+ "TCATC": 332,
407
+ "AGTGG": 333,
408
+ "ACTTG": 334,
409
+ "TCTCC": 335,
410
+ "TTGGC": 336,
411
+ "▁AGG": 337,
412
+ "GCCGG": 338,
413
+ "AAGCG": 339,
414
+ "▁CGG": 340,
415
+ "ATACG": 341,
416
+ "TTAGC": 342,
417
+ "AGTTC": 343,
418
+ "AGA": 344,
419
+ "TGT": 345,
420
+ "TGACG": 346,
421
+ "ACGCG": 347,
422
+ "GTCCC": 348,
423
+ "TCAGC": 349,
424
+ "AGAAAA": 350,
425
+ "TAAGG": 351,
426
+ "AGTAG": 352,
427
+ "AATCG": 353,
428
+ "ACTAG": 354,
429
+ "TGATC": 355,
430
+ "TTCCG": 356,
431
+ "TTTGG": 357,
432
+ "TTTAC": 358,
433
+ "ACACG": 359,
434
+ "AATTG": 360,
435
+ "TGATG": 361,
436
+ "GTACC": 362,
437
+ "TGA": 363,
438
+ "TGTAC": 364,
439
+ "TCTGG": 365,
440
+ "TGATT": 366,
441
+ "TATTC": 367,
442
+ "▁ACG": 368,
443
+ "ATGGG": 369,
444
+ "AGTCG": 370,
445
+ "▁TAG": 371,
446
+ "TTATC": 372,
447
+ "ACGGG": 373,
448
+ "TCAGG": 374,
449
+ "TGTTC": 375,
450
+ "TCGCG": 376,
451
+ "CCGC": 377,
452
+ "TCTTC": 378,
453
+ "ACTCG": 379,
454
+ "▁GCG": 380,
455
+ "TTTAA": 381,
456
+ "TTAGG": 382,
457
+ "ACAAAA": 383,
458
+ "TGTAG": 384,
459
+ "TAGCG": 385,
460
+ "ACTGCAGAC": 386,
461
+ "AGTTG": 387,
462
+ "GTGGC": 388,
463
+ "GTAAC": 389,
464
+ "CCGG": 390,
465
+ "GTCCG": 391,
466
+ "TTATT": 392,
467
+ "TTGCG": 393,
468
+ "TGAAG": 394,
469
+ "AAGGG": 395,
470
+ "TCATT": 396,
471
+ "▁TTC": 397,
472
+ "TGTCG": 398,
473
+ "TTTAG": 399,
474
+ "▁AAAC": 400,
475
+ "TCATG": 401,
476
+ "▁TTG": 402,
477
+ "TATCG": 403,
478
+ "TTTCG": 404,
479
+ "TAGGG": 405,
480
+ "TTATG": 406,
481
+ "▁TCG": 407,
482
+ "TGTAA": 408,
483
+ "TCTAA": 409,
484
+ "TCGGG": 410,
485
+ "AAAACC": 411,
486
+ "GTAGC": 412,
487
+ "TCTAG": 413,
488
+ "ACCCGC": 414,
489
+ "TGCAGAC": 415,
490
+ "TTAAG": 416,
491
+ "TCAT": 417,
492
+ "TCTCG": 418,
493
+ "TTACG": 419,
494
+ "AAAACG": 420,
495
+ "TGTTG": 421,
496
+ "AACCCC": 422,
497
+ "GTGCG": 423,
498
+ "TCAAG": 424,
499
+ "TGAT": 425,
500
+ "TCACG": 426,
501
+ "TTGGG": 427,
502
+ "GTATC": 428,
503
+ "TCTTG": 429,
504
+ "AGCCCC": 430,
505
+ "AATAT": 431,
506
+ "AAAAGC": 432,
507
+ "▁AAAG": 433,
508
+ "GTAGG": 434,
509
+ "AACCGC": 435,
510
+ "TGCCCC": 436,
511
+ "AGCCGC": 437,
512
+ "TATTG": 438,
513
+ "ACCAC": 439,
514
+ "GTAA": 440,
515
+ "ACCCGG": 441,
516
+ "AAACGC": 442,
517
+ "AACAC": 443,
518
+ "TCA": 444,
519
+ "TCT": 445,
520
+ "TGCCGC": 446,
521
+ "TTAT": 447,
522
+ "GTATT": 448,
523
+ "AGACGC": 449,
524
+ "GTATG": 450,
525
+ "ACCTG": 451,
526
+ "▁TAT": 452,
527
+ "AACCGG": 453,
528
+ "TCACTGCAGAC": 454,
529
+ "AGCCGG": 455,
530
+ "TGCCGG": 456,
531
+ "AGACGG": 457,
532
+ "GTGGG": 458,
533
+ "ACCTC": 459,
534
+ "ATCCCC": 460,
535
+ "AACAAC": 461,
536
+ "▁TGG": 462,
537
+ "GTACG": 463,
538
+ "AAGAC": 464,
539
+ "ACCTT": 465,
540
+ "ATGCGG": 466,
541
+ "ACCGCC": 467,
542
+ "▁AATT": 468,
543
+ "ATAAAC": 469,
544
+ "AAGGCC": 470,
545
+ "▁ACAC": 471,
546
+ "AAGAAC": 472,
547
+ "ACGGCC": 473,
548
+ "ATA": 474,
549
+ "TCGGCC": 475,
550
+ "▁CTT": 476,
551
+ "AAGCGC": 477,
552
+ "TAAAAC": 478,
553
+ "TCGCGG": 479,
554
+ "TTTTTTTTTTTTTTTTTTTT": 480,
555
+ "AAAGAC": 481,
556
+ "ATCCGG": 482,
557
+ "AAAAGG": 483,
558
+ "AGTAT": 484,
559
+ "ATCCGC": 485,
560
+ "AAA": 486,
561
+ "ACGAC": 487,
562
+ "AGCAC": 488,
563
+ "AGGCGC": 489,
564
+ "AAGTT": 490,
565
+ "ATCTAC": 491,
566
+ "AAACCC": 492,
567
+ "TACGCC": 493,
568
+ "▁AACC": 494,
569
+ "ACGA": 495,
570
+ "ATGTC": 496,
571
+ "AACTC": 497,
572
+ "ATGCGC": 498,
573
+ "AAACGG": 499,
574
+ "AACTG": 500,
575
+ "AGGCGG": 501,
576
+ "TCGCGC": 502,
577
+ "AAAAAAAAAAAAAAAAAAAA": 503,
578
+ "AAGTG": 504,
579
+ "AACTT": 505,
580
+ "ATGGCC": 506,
581
+ "AACATC": 507,
582
+ "TTTTTTTTTTTT": 508,
583
+ "ACGCCC": 509,
584
+ "AAGCGG": 510,
585
+ "ACTAT": 511,
586
+ "▁GGG": 512,
587
+ "TCCCGC": 513,
588
+ "▁ACCC": 514,
589
+ "AATAAC": 515,
590
+ "AGGTC": 516,
591
+ "AAAGCC": 517,
592
+ "ACCCCC": 518,
593
+ "ACGCGG": 519,
594
+ "ACGCGC": 520,
595
+ "▁AAAT": 521,
596
+ "TACCCC": 522,
597
+ "TACCGC": 523,
598
+ "GTAT": 524,
599
+ "AGAAAC": 525,
600
+ "GTA": 526,
601
+ "TTCCGC": 527,
602
+ "TTT": 528,
603
+ "AAGCCC": 529,
604
+ "TAAAAG": 530,
605
+ "TCGTG": 531,
606
+ "TTCACTGCAGAC": 532,
607
+ "AGCTG": 533,
608
+ "ATGAC": 534,
609
+ "TAAGCC": 535,
610
+ "AGCTC": 536,
611
+ "ACCAG": 537,
612
+ "ACACGC": 538,
613
+ "TCCCGG": 539,
614
+ "AGCTT": 540,
615
+ "TCGAC": 541,
616
+ "AATTGC": 542,
617
+ "AACACC": 543,
618
+ "ATCTG": 544,
619
+ "TCGCCC": 545,
620
+ "AACAG": 546,
621
+ "TTCCCC": 547,
622
+ "ATGCCC": 548,
623
+ "AAATGC": 549,
624
+ "▁CCCC": 550,
625
+ "TTCCGG": 551,
626
+ "TTGGCC": 552,
627
+ "ACAAAC": 553,
628
+ "ACGGGC": 554,
629
+ "ATCGCC": 555,
630
+ "ATTTG": 556,
631
+ "TCGGGC": 557,
632
+ "TTGCGG": 558,
633
+ "AACGCC": 559,
634
+ "▁AAGC": 560,
635
+ "AGCAG": 561,
636
+ "▁GTC": 562,
637
+ "ACCACC": 563,
638
+ "ATCAC": 564,
639
+ "ACGAG": 565,
640
+ "▁AATC": 566,
641
+ "AAGAAAA": 567,
642
+ "AGCGCC": 568,
643
+ "ATGTG": 569,
644
+ "AAGTCC": 570,
645
+ "ATAACC": 571,
646
+ "▁AATG": 572,
647
+ "ATCTT": 573,
648
+ "ATGGGC": 574,
649
+ "TTGCCC": 575,
650
+ "AAGGGC": 576,
651
+ "▁GCCC": 577,
652
+ "AAGAG": 578,
653
+ "▁CTC": 579,
654
+ "▁AGAC": 580,
655
+ "AGGAC": 581,
656
+ "TCGGGG": 582,
657
+ "TTGCGC": 583,
658
+ "▁GTT": 584,
659
+ "ACACGG": 585,
660
+ "ATCTC": 586,
661
+ "▁AGCC": 587,
662
+ "ATTCGC": 588,
663
+ "AATACC": 589,
664
+ "▁CAC": 590,
665
+ "ATTTC": 591,
666
+ "ACGACC": 592,
667
+ "TTCGCC": 593,
668
+ "ACGAAC": 594,
669
+ "▁CCGC": 595,
670
+ "ATGTT": 596,
671
+ "ATTCGG": 597,
672
+ "AGGTG": 598,
673
+ "TTTTCC": 599,
674
+ "TTGAC": 600,
675
+ "ACGGGG": 601,
676
+ "AAATAC": 602,
677
+ "ATTGCC": 603,
678
+ "GTAAG": 604,
679
+ "TTGTC": 605,
680
+ "TATGCC": 606,
681
+ "AATGCC": 607,
682
+ "AGGCCC": 608,
683
+ "AGAACC": 609,
684
+ "ACCGGC": 610,
685
+ "TTA": 611,
686
+ "AGCTGC": 612,
687
+ "ACGTCC": 613,
688
+ "AACTGC": 614,
689
+ "ACCTCC": 615,
690
+ "ATTTT": 616,
691
+ "TACCGG": 617,
692
+ "AAACCG": 618,
693
+ "AAATCC": 619,
694
+ "TTTTGC": 620,
695
+ "ATCTGC": 621,
696
+ "AAGTGC": 622,
697
+ "TAAAC": 623,
698
+ "AATTCC": 624,
699
+ "▁TAAC": 625,
700
+ "▁GAC": 626,
701
+ "▁CTG": 627,
702
+ "TCGTT": 628,
703
+ "GCGTG": 629,
704
+ "TGGCGG": 630,
705
+ "▁CTGC": 631,
706
+ "ACCGT": 632,
707
+ "ATGGGG": 633,
708
+ "AGACCC": 634,
709
+ "ACGAGC": 635,
710
+ "ATTAC": 636,
711
+ "▁GTCC": 637,
712
+ "TGGCGC": 638,
713
+ "ATACCC": 639,
714
+ "ATAGCC": 640,
715
+ "ATAAAG": 641,
716
+ "AATAAAA": 642,
717
+ "AGGTT": 643,
718
+ "▁CGCC": 644,
719
+ "TCGAG": 645,
720
+ "ACCTGC": 646,
721
+ "ACCAAC": 647,
722
+ "TAGGCC": 648,
723
+ "AAAGGC": 649,
724
+ "TTGTG": 650,
725
+ "▁CATC": 651,
726
+ "▁ATCC": 652,
727
+ "TCCGCC": 653,
728
+ "GTGGCC": 654,
729
+ "AGAAAG": 655,
730
+ "TCGA": 656,
731
+ "▁GGCC": 657,
732
+ "▁CTAA": 658,
733
+ "ATACAC": 659,
734
+ "AGAAGC": 660,
735
+ "ACCTAC": 661,
736
+ "▁ACGC": 662,
737
+ "▁CATT": 663,
738
+ "AGCATC": 664,
739
+ "AACGT": 665,
740
+ "AATTGG": 666,
741
+ "▁AAAAG": 667,
742
+ "AGGGCC": 668,
743
+ "▁ATAC": 669,
744
+ "ATGTCC": 670,
745
+ "▁TTTT": 671,
746
+ "ACCCCG": 672,
747
+ "AATAGC": 673,
748
+ "ATAAGC": 674,
749
+ "TTCTC": 675,
750
+ "ACAACC": 676,
751
+ "ACGAGG": 677,
752
+ "ACCTGG": 678,
753
+ "TAACGC": 679,
754
+ "AAGCCG": 680,
755
+ "▁CAAC": 681,
756
+ "TTGGGC": 682,
757
+ "ACGCCG": 683,
758
+ "AATCCC": 684,
759
+ "AATCGC": 685,
760
+ "▁AGTC": 686,
761
+ "TTCTG": 687,
762
+ "CCCTC": 688,
763
+ "ACCATC": 689,
764
+ "AGCAAC": 690,
765
+ "TTTAT": 691,
766
+ "▁ATGC": 692,
767
+ "GTCCGG": 693,
768
+ "ACCA": 694,
769
+ "CCCTG": 695,
770
+ "▁AAGG": 696,
771
+ "ATGAAC": 697,
772
+ "CCCAC": 698,
773
+ "TTAAAA": 699,
774
+ "GTGCGG": 700,
775
+ "ATAGAC": 701,
776
+ "AGGCCG": 702,
777
+ "▁CTAC": 703,
778
+ "TCCTG": 704,
779
+ "AGAGCC": 705,
780
+ "TAATC": 706,
781
+ "GTCCCC": 707,
782
+ "TGCTG": 708,
783
+ "AGCTAC": 709,
784
+ "AGCGGC": 710,
785
+ "▁GCGC": 711,
786
+ "AAGGGG": 712,
787
+ "▁AAAAC": 713,
788
+ "AACCCG": 714,
789
+ "ATACGC": 715,
790
+ "AGTGCC": 716,
791
+ "GCGTT": 717,
792
+ "TATCGC": 718,
793
+ "▁TACC": 719,
794
+ "TTGTT": 720,
795
+ "AAAAAAC": 721,
796
+ "GTCCGC": 722,
797
+ "TGCTC": 723,
798
+ "AAGACC": 724,
799
+ "AGCGT": 725,
800
+ "TCCTC": 726,
801
+ "ATGACC": 727,
802
+ "▁TTGC": 728,
803
+ "ACATCC": 729,
804
+ "AGGA": 730,
805
+ "TTCGGC": 731,
806
+ "ATCAG": 732,
807
+ "TTGGGG": 733,
808
+ "TGCGCC": 734,
809
+ "▁ACCG": 735,
810
+ "ATATCC": 736,
811
+ "▁TATT": 737,
812
+ "AAATGG": 738,
813
+ "TAGCGG": 739,
814
+ "▁AGTT": 740,
815
+ "TGAAAA": 741,
816
+ "TTCTT": 742,
817
+ "GGGTC": 743,
818
+ "AAGAGC": 744,
819
+ "GCGAC": 745,
820
+ "AACTAC": 746,
821
+ "TAGCGC": 747,
822
+ "ATGCCG": 748,
823
+ "AATAAG": 749,
824
+ "▁TGCC": 750,
825
+ "GGGA": 751,
826
+ "AACATT": 752,
827
+ "CCCGCC": 753,
828
+ "▁ACTG": 754,
829
+ "▁GTGC": 755,
830
+ "ACGATT": 756,
831
+ "TGGTC": 757,
832
+ "TCCAC": 758,
833
+ "ATGTGC": 759,
834
+ "AAAGCG": 760,
835
+ "AACGGC": 761,
836
+ "TTTTGG": 762,
837
+ "ACCATT": 763,
838
+ "AGGAG": 764,
839
+ "ATGAG": 765,
840
+ "ATAATC": 766,
841
+ "▁TCCC": 767,
842
+ "▁CCGG": 768,
843
+ "▁CAG": 769,
844
+ "ACGATC": 770,
845
+ "▁TAAAA": 771,
846
+ "GCGCCC": 772,
847
+ "AATATT": 773,
848
+ "AGCTCC": 774,
849
+ "TACAC": 775,
850
+ "AAGAAG": 776,
851
+ "▁AGGC": 777,
852
+ "GCGA": 778,
853
+ "▁TCGC": 779,
854
+ "ATCCCG": 780,
855
+ "▁CTCC": 781,
856
+ "ATACGG": 782,
857
+ "ACCTAA": 783,
858
+ "GGCTC": 784,
859
+ "▁ATTC": 785,
860
+ "TAACGG": 786,
861
+ "ATAATG": 787,
862
+ "AATATC": 788,
863
+ "AACTAA": 789,
864
+ "▁CGT": 790,
865
+ "ATCGT": 791,
866
+ "AAGTGG": 792,
867
+ "▁ATAA": 793,
868
+ "TCGACC": 794,
869
+ "TAGTC": 795,
870
+ "AACAGC": 796,
871
+ "▁GTG": 797,
872
+ "TTCAC": 798,
873
+ "ATGTGG": 799,
874
+ "ATGTAC": 800,
875
+ "TTCTGC": 801,
876
+ "AAATCG": 802,
877
+ "AATAGG": 803,
878
+ "TTGACC": 804,
879
+ "AATCGG": 805,
880
+ "ACTGCC": 806,
881
+ "ATAAGG": 807,
882
+ "▁CCCG": 808,
883
+ "▁CAAAA": 809,
884
+ "ATATGC": 810,
885
+ "CCGTC": 811,
886
+ "GGCTG": 812,
887
+ "ACAGCC": 813,
888
+ "AGACCG": 814,
889
+ "TTTGCC": 815,
890
+ "▁ACGG": 816,
891
+ "ATTTCC": 817,
892
+ "ATCTCC": 818,
893
+ "ATACCG": 819,
894
+ "TCGAGG": 820,
895
+ "TCGAAC": 821,
896
+ "▁GCGG": 822,
897
+ "AGCACC": 823,
898
+ "GTGCGC": 824,
899
+ "ATAACG": 825,
900
+ "▁AGTG": 826,
901
+ "TAACCC": 827,
902
+ "TTAACC": 828,
903
+ "ACACCC": 829,
904
+ "AAATTC": 830,
905
+ "▁GAAAA": 831,
906
+ "ATCGGC": 832,
907
+ "TGTAT": 833,
908
+ "AAATTG": 834,
909
+ "AGTCCC": 835,
910
+ "AACTCC": 836,
911
+ "AGCATT": 837,
912
+ "TGACGG": 838,
913
+ "AATGGC": 839,
914
+ "AGTACC": 840,
915
+ "▁ATTG": 841,
916
+ "GTAAAA": 842,
917
+ "AAGATT": 843,
918
+ "AATATG": 844,
919
+ "AGAAGG": 845,
920
+ "AAGATG": 846,
921
+ "▁TAGC": 847,
922
+ "ATAATT": 848,
923
+ "▁CTTC": 849,
924
+ "AAGAGG": 850,
925
+ "▁CTAG": 851,
926
+ "AGCCCG": 852,
927
+ "TACTC": 853,
928
+ "AGCTGG": 854,
929
+ "▁GACC": 855,
930
+ "▁GCCG": 856,
931
+ "TGACGC": 857,
932
+ "ATCTGG": 858,
933
+ "▁GATT": 859,
934
+ "ACAGAC": 860,
935
+ "▁AACG": 861,
936
+ "ACGTTC": 862,
937
+ "AGCTAA": 863,
938
+ "AGTCGC": 864,
939
+ "AGGTGC": 865,
940
+ "TATTGC": 866,
941
+ "AAGATC": 867,
942
+ "GGGAC": 868,
943
+ "TGACCC": 869,
944
+ "AATCCG": 870,
945
+ "TATCGG": 871,
946
+ "CCCTT": 872,
947
+ "▁TAAG": 873,
948
+ "▁GAAC": 874,
949
+ "AGTCGG": 875,
950
+ "GGCGCC": 876,
951
+ "TCGAGC": 877,
952
+ "▁TGAC": 878,
953
+ "▁AGAA": 879,
954
+ "AGAACG": 880,
955
+ "GGCAC": 881,
956
+ "AGAGAC": 882,
957
+ "TTCTCC": 883,
958
+ "TGAACC": 884,
959
+ "AGTTGC": 885,
960
+ "TGCAC": 886,
961
+ "▁CACC": 887,
962
+ "▁TCAC": 888,
963
+ "GGCCCC": 889,
964
+ "GCCTC": 890,
965
+ "AACAAAA": 891,
966
+ "AGCAGG": 892,
967
+ "GTGGGC": 893,
968
+ "▁TTTC": 894,
969
+ "ACGATG": 895,
970
+ "TCGATC": 896,
971
+ "TATTCC": 897,
972
+ "ATTCCC": 898,
973
+ "AGTAAC": 899,
974
+ "TAGGGC": 900,
975
+ "ATAGTC": 901,
976
+ "AGAGGC": 902,
977
+ "TTCGT": 903,
978
+ "TGCTT": 904,
979
+ "▁CGGC": 905,
980
+ "ATATAC": 906,
981
+ "GGCCGC": 907,
982
+ "ATAGGC": 908,
983
+ "TCTAT": 909,
984
+ "AGCAGC": 910,
985
+ "TGAGCC": 911,
986
+ "AACAGG": 912,
987
+ "GTGGGG": 913,
988
+ "TAGCCC": 914,
989
+ "GGCCGG": 915,
990
+ "TGTGCC": 916,
991
+ "AATTTT": 917,
992
+ "TCAAAA": 918,
993
+ "TACCCG": 919,
994
+ "AGATGC": 920,
995
+ "ACAAAG": 921,
996
+ "ATGAGG": 922,
997
+ "AATACG": 923,
998
+ "▁AGAG": 924,
999
+ "TTGACG": 925,
1000
+ "TTGAGG": 926,
1001
+ "ACCTAG": 927,
1002
+ "TGCCCG": 928,
1003
+ "TTAAAC": 929,
1004
+ "ACAAGC": 930,
1005
+ "ACGTGC": 931,
1006
+ "TTCTGG": 932,
1007
+ "ATGT": 933,
1008
+ "ACCAGG": 934,
1009
+ "TTGAAC": 935,
1010
+ "ATCTAA": 936,
1011
+ "▁TATG": 937,
1012
+ "ACCAGC": 938,
1013
+ "ATTTGC": 939,
1014
+ "ATTTAC": 940,
1015
+ "AAAGAAAA": 941,
1016
+ "TCTACG": 942,
1017
+ "▁TATC": 943,
1018
+ "AGTAGC": 944,
1019
+ "AGTTCC": 945,
1020
+ "GGCTT": 946,
1021
+ "▁ATCG": 947,
1022
+ "GGGCCC": 948,
1023
+ "ACAATC": 949,
1024
+ "ACCT": 950,
1025
+ "ATCAAC": 951,
1026
+ "▁TGTC": 952,
1027
+ "AGAATC": 953,
1028
+ "ATCA": 954,
1029
+ "TGTCCC": 955,
1030
+ "ACCTTC": 956,
1031
+ "ACGTCG": 957,
1032
+ "ATCT": 958,
1033
+ "AAGGCG": 959,
1034
+ "TGAAGC": 960,
1035
+ "AGGTCC": 961,
1036
+ "AGGTAC": 962,
1037
+ "TCACTG": 963,
1038
+ "▁AGCG": 964,
1039
+ "AATGCG": 965,
1040
+ "TGGCCC": 966,
1041
+ "AACATG": 967,
1042
+ "AAGACG": 968,
1043
+ "TTTACC": 969,
1044
+ "TTGTCC": 970,
1045
+ "TAAAAAAAA": 971,
1046
+ "ACTACC": 972,
1047
+ "AACTAG": 973,
1048
+ "CCGTG": 974,
1049
+ "TTAGCC": 975,
1050
+ "TTACCC": 976,
1051
+ "AAGA": 977,
1052
+ "ATGTAA": 978,
1053
+ "TGGGCC": 979,
1054
+ "AGGT": 980,
1055
+ "GGGTG": 981,
1056
+ "ATAAAT": 982,
1057
+ "ATAGTG": 983,
1058
+ "ACATCG": 984,
1059
+ "ATGA": 985,
1060
+ "AGTTGG": 986,
1061
+ "ATGGCG": 987,
1062
+ "AGTCCG": 988,
1063
+ "AGCTAG": 989,
1064
+ "AGATGG": 990,
1065
+ "ATATGG": 991,
1066
+ "ATCATC": 992,
1067
+ "TGAAAC": 993,
1068
+ "▁TCGG": 994,
1069
+ "TCCCCC": 995,
1070
+ "TTTCACTGCAGAC": 996,
1071
+ "AGAATG": 997,
1072
+ "TTCACTG": 998,
1073
+ "AGGGGC": 999,
1074
+ "TATCCC": 1000,
1075
+ "TTTCCC": 1001,
1076
+ "ATTGGC": 1002,
1077
+ "ATTTGG": 1003,
1078
+ "CCGCCC": 1004,
1079
+ "ATTTAA": 1005,
1080
+ "TTCTAC": 1006,
1081
+ "TCGTCC": 1007,
1082
+ "ATTGT": 1008,
1083
+ "AACTGG": 1009,
1084
+ "ACGTGG": 1010,
1085
+ "ATATCG": 1011,
1086
+ "ACCATG": 1012,
1087
+ "AACA": 1013,
1088
+ "ATCGCG": 1014,
1089
+ "ACCGCG": 1015,
1090
+ "▁TTGG": 1016,
1091
+ "▁CAGC": 1017,
1092
+ "TAGGGG": 1018,
1093
+ "▁TTCC": 1019,
1094
+ "ACAAGG": 1020,
1095
+ "TGTCGC": 1021,
1096
+ "ACATGC": 1022,
1097
+ "AAGTTC": 1023
1098
+ },
1099
+ "merges": [
1100
+ [
1101
+ "A",
1102
+ "A"
1103
+ ],
1104
+ [
1105
+ "C",
1106
+ "C"
1107
+ ],
1108
+ [
1109
+ "T",
1110
+ "T"
1111
+ ],
1112
+ [
1113
+ "G",
1114
+ "G"
1115
+ ],
1116
+ [
1117
+ "A",
1118
+ "C"
1119
+ ],
1120
+ [
1121
+ "G",
1122
+ "C"
1123
+ ],
1124
+ [
1125
+ "T",
1126
+ "C"
1127
+ ],
1128
+ [
1129
+ "A",
1130
+ "G"
1131
+ ],
1132
+ [
1133
+ "T",
1134
+ "G"
1135
+ ],
1136
+ [
1137
+ "A",
1138
+ "T"
1139
+ ],
1140
+ [
1141
+ "AA",
1142
+ "AA"
1143
+ ],
1144
+ [
1145
+ "A",
1146
+ "CC"
1147
+ ],
1148
+ [
1149
+ "A",
1150
+ "GG"
1151
+ ],
1152
+ [
1153
+ "G",
1154
+ "T"
1155
+ ],
1156
+ [
1157
+ "AA",
1158
+ "C"
1159
+ ],
1160
+ [
1161
+ "A",
1162
+ "TT"
1163
+ ],
1164
+ [
1165
+ "A",
1166
+ "GC"
1167
+ ],
1168
+ [
1169
+ "A",
1170
+ "TC"
1171
+ ],
1172
+ [
1173
+ "CC",
1174
+ "C"
1175
+ ],
1176
+ [
1177
+ "AC",
1178
+ "G"
1179
+ ],
1180
+ [
1181
+ "GG",
1182
+ "C"
1183
+ ],
1184
+ [
1185
+ "A",
1186
+ "TG"
1187
+ ],
1188
+ [
1189
+ "T",
1190
+ "GC"
1191
+ ],
1192
+ [
1193
+ "T",
1194
+ "CC"
1195
+ ],
1196
+ [
1197
+ "AA",
1198
+ "G"
1199
+ ],
1200
+ [
1201
+ "TT",
1202
+ "C"
1203
+ ],
1204
+ [
1205
+ "T",
1206
+ "GG"
1207
+ ],
1208
+ [
1209
+ "G",
1210
+ "CC"
1211
+ ],
1212
+ [
1213
+ "▁",
1214
+ "C"
1215
+ ],
1216
+ [
1217
+ "T",
1218
+ "AC"
1219
+ ],
1220
+ [
1221
+ "T",
1222
+ "AA"
1223
+ ],
1224
+ [
1225
+ "TT",
1226
+ "TT"
1227
+ ],
1228
+ [
1229
+ "TC",
1230
+ "G"
1231
+ ],
1232
+ [
1233
+ "T",
1234
+ "AG"
1235
+ ],
1236
+ [
1237
+ "AAAA",
1238
+ "AAAA"
1239
+ ],
1240
+ [
1241
+ "GC",
1242
+ "G"
1243
+ ],
1244
+ [
1245
+ "TT",
1246
+ "G"
1247
+ ],
1248
+ [
1249
+ "CC",
1250
+ "G"
1251
+ ],
1252
+ [
1253
+ "ACC",
1254
+ "C"
1255
+ ],
1256
+ [
1257
+ "GG",
1258
+ "G"
1259
+ ],
1260
+ [
1261
+ "T",
1262
+ "AT"
1263
+ ],
1264
+ [
1265
+ "▁",
1266
+ "G"
1267
+ ],
1268
+ [
1269
+ "AA",
1270
+ "AC"
1271
+ ],
1272
+ [
1273
+ "AA",
1274
+ "CC"
1275
+ ],
1276
+ [
1277
+ "AG",
1278
+ "AC"
1279
+ ],
1280
+ [
1281
+ "AGG",
1282
+ "C"
1283
+ ],
1284
+ [
1285
+ "AG",
1286
+ "CC"
1287
+ ],
1288
+ [
1289
+ "TG",
1290
+ "CC"
1291
+ ],
1292
+ [
1293
+ "AA",
1294
+ "GC"
1295
+ ],
1296
+ [
1297
+ "AC",
1298
+ "AC"
1299
+ ],
1300
+ [
1301
+ "AT",
1302
+ "CC"
1303
+ ],
1304
+ [
1305
+ "ATT",
1306
+ "C"
1307
+ ],
1308
+ [
1309
+ "T",
1310
+ "ACC"
1311
+ ],
1312
+ [
1313
+ "AT",
1314
+ "GC"
1315
+ ],
1316
+ [
1317
+ "AA",
1318
+ "AG"
1319
+ ],
1320
+ [
1321
+ "T",
1322
+ "CCC"
1323
+ ],
1324
+ [
1325
+ "AC",
1326
+ "GG"
1327
+ ],
1328
+ [
1329
+ "AC",
1330
+ "GC"
1331
+ ],
1332
+ [
1333
+ "AA",
1334
+ "GG"
1335
+ ],
1336
+ [
1337
+ "TC",
1338
+ "GC"
1339
+ ],
1340
+ [
1341
+ "TC",
1342
+ "GG"
1343
+ ],
1344
+ [
1345
+ "T",
1346
+ "AAC"
1347
+ ],
1348
+ [
1349
+ "AT",
1350
+ "GG"
1351
+ ],
1352
+ [
1353
+ "ACC",
1354
+ "G"
1355
+ ],
1356
+ [
1357
+ "AA",
1358
+ "TT"
1359
+ ],
1360
+ [
1361
+ "AA",
1362
+ "TC"
1363
+ ],
1364
+ [
1365
+ "TT",
1366
+ "CC"
1367
+ ],
1368
+ [
1369
+ "AGC",
1370
+ "G"
1371
+ ],
1372
+ [
1373
+ "▁",
1374
+ "CC"
1375
+ ],
1376
+ [
1377
+ "ATC",
1378
+ "G"
1379
+ ],
1380
+ [
1381
+ "T",
1382
+ "GGC"
1383
+ ],
1384
+ [
1385
+ "AT",
1386
+ "AC"
1387
+ ],
1388
+ [
1389
+ "TT",
1390
+ "GC"
1391
+ ],
1392
+ [
1393
+ "AA",
1394
+ "TG"
1395
+ ],
1396
+ [
1397
+ "AG",
1398
+ "TC"
1399
+ ],
1400
+ [
1401
+ "GT",
1402
+ "CC"
1403
+ ],
1404
+ [
1405
+ "AAC",
1406
+ "G"
1407
+ ],
1408
+ [
1409
+ "TTTT",
1410
+ "TTTT"
1411
+ ],
1412
+ [
1413
+ "TT",
1414
+ "GG"
1415
+ ],
1416
+ [
1417
+ "AC",
1418
+ "TG"
1419
+ ],
1420
+ [
1421
+ "T",
1422
+ "AGG"
1423
+ ],
1424
+ [
1425
+ "ATT",
1426
+ "G"
1427
+ ],
1428
+ [
1429
+ "AG",
1430
+ "TG"
1431
+ ],
1432
+ [
1433
+ "T",
1434
+ "AGC"
1435
+ ],
1436
+ [
1437
+ "CCC",
1438
+ "G"
1439
+ ],
1440
+ [
1441
+ "AG",
1442
+ "TT"
1443
+ ],
1444
+ [
1445
+ "GT",
1446
+ "GC"
1447
+ ],
1448
+ [
1449
+ "▁",
1450
+ "GC"
1451
+ ],
1452
+ [
1453
+ "T",
1454
+ "ACG"
1455
+ ],
1456
+ [
1457
+ "TC",
1458
+ "AC"
1459
+ ],
1460
+ [
1461
+ "GT",
1462
+ "GG"
1463
+ ],
1464
+ [
1465
+ "▁",
1466
+ "AC"
1467
+ ],
1468
+ [
1469
+ "AAAA",
1470
+ "C"
1471
+ ],
1472
+ [
1473
+ "AA",
1474
+ "AT"
1475
+ ],
1476
+ [
1477
+ "T",
1478
+ "ATT"
1479
+ ],
1480
+ [
1481
+ "T",
1482
+ "ATC"
1483
+ ],
1484
+ [
1485
+ "TG",
1486
+ "AC"
1487
+ ],
1488
+ [
1489
+ "TCC",
1490
+ "G"
1491
+ ],
1492
+ [
1493
+ "TGC",
1494
+ "G"
1495
+ ],
1496
+ [
1497
+ "TTC",
1498
+ "G"
1499
+ ],
1500
+ [
1501
+ "GG",
1502
+ "CC"
1503
+ ],
1504
+ [
1505
+ "AG",
1506
+ "AG"
1507
+ ],
1508
+ [
1509
+ "T",
1510
+ "ATG"
1511
+ ],
1512
+ [
1513
+ "TG",
1514
+ "TC"
1515
+ ],
1516
+ [
1517
+ "T",
1518
+ "AAG"
1519
+ ],
1520
+ [
1521
+ "AGG",
1522
+ "G"
1523
+ ],
1524
+ [
1525
+ "GGC",
1526
+ "G"
1527
+ ],
1528
+ [
1529
+ "TT",
1530
+ "TC"
1531
+ ],
1532
+ [
1533
+ "AC",
1534
+ "TC"
1535
+ ],
1536
+ [
1537
+ "AG",
1538
+ "AA"
1539
+ ],
1540
+ [
1541
+ "AT",
1542
+ "AA"
1543
+ ],
1544
+ [
1545
+ "▁",
1546
+ "TC"
1547
+ ],
1548
+ [
1549
+ "AC",
1550
+ "TT"
1551
+ ],
1552
+ [
1553
+ "▁",
1554
+ "AA"
1555
+ ],
1556
+ [
1557
+ "▁",
1558
+ "GG"
1559
+ ],
1560
+ [
1561
+ "GC",
1562
+ "GG"
1563
+ ],
1564
+ [
1565
+ "TG",
1566
+ "TG"
1567
+ ],
1568
+ [
1569
+ "AT",
1570
+ "AG"
1571
+ ],
1572
+ [
1573
+ "▁",
1574
+ "AAAAAAAA"
1575
+ ],
1576
+ [
1577
+ "▁C",
1578
+ "G"
1579
+ ],
1580
+ [
1581
+ "▁",
1582
+ "TT"
1583
+ ],
1584
+ [
1585
+ "GCC",
1586
+ "G"
1587
+ ],
1588
+ [
1589
+ "T",
1590
+ "AAAA"
1591
+ ],
1592
+ [
1593
+ "TG",
1594
+ "TT"
1595
+ ],
1596
+ [
1597
+ "AC",
1598
+ "AA"
1599
+ ],
1600
+ [
1601
+ "TC",
1602
+ "TC"
1603
+ ],
1604
+ [
1605
+ "GC",
1606
+ "GC"
1607
+ ],
1608
+ [
1609
+ "▁",
1610
+ "AG"
1611
+ ],
1612
+ [
1613
+ "AC",
1614
+ "AG"
1615
+ ],
1616
+ [
1617
+ "TGG",
1618
+ "G"
1619
+ ],
1620
+ [
1621
+ "AA",
1622
+ "GT"
1623
+ ],
1624
+ [
1625
+ "ACC",
1626
+ "CC"
1627
+ ],
1628
+ [
1629
+ "ACG",
1630
+ "CC"
1631
+ ],
1632
+ [
1633
+ "TC",
1634
+ "TT"
1635
+ ],
1636
+ [
1637
+ "TC",
1638
+ "TG"
1639
+ ],
1640
+ [
1641
+ "TT",
1642
+ "TG"
1643
+ ],
1644
+ [
1645
+ "AC",
1646
+ "GT"
1647
+ ],
1648
+ [
1649
+ "AAAA",
1650
+ "G"
1651
+ ],
1652
+ [
1653
+ "AAG",
1654
+ "CC"
1655
+ ],
1656
+ [
1657
+ "ATG",
1658
+ "CC"
1659
+ ],
1660
+ [
1661
+ "GG",
1662
+ "GG"
1663
+ ],
1664
+ [
1665
+ "▁",
1666
+ "TG"
1667
+ ],
1668
+ [
1669
+ "AA",
1670
+ "ACC"
1671
+ ],
1672
+ [
1673
+ "AGG",
1674
+ "CC"
1675
+ ],
1676
+ [
1677
+ "TT",
1678
+ "AC"
1679
+ ],
1680
+ [
1681
+ "GG",
1682
+ "GC"
1683
+ ],
1684
+ [
1685
+ "AC",
1686
+ "TGC"
1687
+ ],
1688
+ [
1689
+ "AT",
1690
+ "AT"
1691
+ ],
1692
+ [
1693
+ "ACC",
1694
+ "GC"
1695
+ ],
1696
+ [
1697
+ "TG",
1698
+ "AG"
1699
+ ],
1700
+ [
1701
+ "GT",
1702
+ "AC"
1703
+ ],
1704
+ [
1705
+ "T",
1706
+ "A"
1707
+ ],
1708
+ [
1709
+ "TC",
1710
+ "AG"
1711
+ ],
1712
+ [
1713
+ "ACCC",
1714
+ "G"
1715
+ ],
1716
+ [
1717
+ "▁",
1718
+ "AT"
1719
+ ],
1720
+ [
1721
+ "AA",
1722
+ "CCC"
1723
+ ],
1724
+ [
1725
+ "ACC",
1726
+ "GG"
1727
+ ],
1728
+ [
1729
+ "AA",
1730
+ "AGC"
1731
+ ],
1732
+ [
1733
+ "TT",
1734
+ "AG"
1735
+ ],
1736
+ [
1737
+ "ATT",
1738
+ "CC"
1739
+ ],
1740
+ [
1741
+ "▁",
1742
+ "AAAA"
1743
+ ],
1744
+ [
1745
+ "AAC",
1746
+ "GC"
1747
+ ],
1748
+ [
1749
+ "TAA",
1750
+ "CC"
1751
+ ],
1752
+ [
1753
+ "GT",
1754
+ "AG"
1755
+ ],
1756
+ [
1757
+ "AAAAAAAA",
1758
+ "AAAAAAAA"
1759
+ ],
1760
+ [
1761
+ "AC",
1762
+ "AT"
1763
+ ],
1764
+ [
1765
+ "TCC",
1766
+ "CC"
1767
+ ],
1768
+ [
1769
+ "TG",
1770
+ "AA"
1771
+ ],
1772
+ [
1773
+ "ATC",
1774
+ "GC"
1775
+ ],
1776
+ [
1777
+ "TC",
1778
+ "AA"
1779
+ ],
1780
+ [
1781
+ "TGG",
1782
+ "CC"
1783
+ ],
1784
+ [
1785
+ "TC",
1786
+ "GT"
1787
+ ],
1788
+ [
1789
+ "AAC",
1790
+ "GG"
1791
+ ],
1792
+ [
1793
+ "TAG",
1794
+ "CC"
1795
+ ],
1796
+ [
1797
+ "T",
1798
+ "ACCC"
1799
+ ],
1800
+ [
1801
+ "ATT",
1802
+ "GC"
1803
+ ],
1804
+ [
1805
+ "AGC",
1806
+ "GG"
1807
+ ],
1808
+ [
1809
+ "AGC",
1810
+ "GC"
1811
+ ],
1812
+ [
1813
+ "ATC",
1814
+ "GG"
1815
+ ],
1816
+ [
1817
+ "CCC",
1818
+ "GC"
1819
+ ],
1820
+ [
1821
+ "▁",
1822
+ "GT"
1823
+ ],
1824
+ [
1825
+ "TT",
1826
+ "AA"
1827
+ ],
1828
+ [
1829
+ "▁",
1830
+ "AAC"
1831
+ ],
1832
+ [
1833
+ "ACG",
1834
+ "TC"
1835
+ ],
1836
+ [
1837
+ "▁",
1838
+ "GCC"
1839
+ ],
1840
+ [
1841
+ "TGC",
1842
+ "GG"
1843
+ ],
1844
+ [
1845
+ "AG",
1846
+ "AT"
1847
+ ],
1848
+ [
1849
+ "▁",
1850
+ "ACC"
1851
+ ],
1852
+ [
1853
+ "TC",
1854
+ "GCC"
1855
+ ],
1856
+ [
1857
+ "CCC",
1858
+ "GG"
1859
+ ],
1860
+ [
1861
+ "AC",
1862
+ "ATC"
1863
+ ],
1864
+ [
1865
+ "TCC",
1866
+ "GC"
1867
+ ],
1868
+ [
1869
+ "AGGC",
1870
+ "G"
1871
+ ],
1872
+ [
1873
+ "TT",
1874
+ "GCC"
1875
+ ],
1876
+ [
1877
+ "AT",
1878
+ "ACC"
1879
+ ],
1880
+ [
1881
+ "AA",
1882
+ "TAA"
1883
+ ],
1884
+ [
1885
+ "AT",
1886
+ "AAC"
1887
+ ],
1888
+ [
1889
+ "AGG",
1890
+ "GC"
1891
+ ],
1892
+ [
1893
+ "AG",
1894
+ "ACC"
1895
+ ],
1896
+ [
1897
+ "▁",
1898
+ "ATT"
1899
+ ],
1900
+ [
1901
+ "AC",
1902
+ "ACC"
1903
+ ],
1904
+ [
1905
+ "AC",
1906
+ "AAC"
1907
+ ],
1908
+ [
1909
+ "TTTTTTTT",
1910
+ "TTTTTTTT"
1911
+ ],
1912
+ [
1913
+ "TT",
1914
+ "GT"
1915
+ ],
1916
+ [
1917
+ "TCC",
1918
+ "GG"
1919
+ ],
1920
+ [
1921
+ "AA",
1922
+ "ATC"
1923
+ ],
1924
+ [
1925
+ "TTC",
1926
+ "GC"
1927
+ ],
1928
+ [
1929
+ "TTC",
1930
+ "GG"
1931
+ ],
1932
+ [
1933
+ "TAC",
1934
+ "GC"
1935
+ ],
1936
+ [
1937
+ "TG",
1938
+ "CCC"
1939
+ ],
1940
+ [
1941
+ "AT",
1942
+ "CCC"
1943
+ ],
1944
+ [
1945
+ "▁",
1946
+ "CCC"
1947
+ ],
1948
+ [
1949
+ "TGC",
1950
+ "GC"
1951
+ ],
1952
+ [
1953
+ "AG",
1954
+ "AAC"
1955
+ ],
1956
+ [
1957
+ "AG",
1958
+ "CCC"
1959
+ ],
1960
+ [
1961
+ "TAC",
1962
+ "GG"
1963
+ ],
1964
+ [
1965
+ "AA",
1966
+ "ATG"
1967
+ ],
1968
+ [
1969
+ "AA",
1970
+ "AGG"
1971
+ ],
1972
+ [
1973
+ "▁AAAAAAAA",
1974
+ "AAAAAAAA"
1975
+ ],
1976
+ [
1977
+ "TAT",
1978
+ "CC"
1979
+ ],
1980
+ [
1981
+ "AA",
1982
+ "ATT"
1983
+ ],
1984
+ [
1985
+ "GGC",
1986
+ "GG"
1987
+ ],
1988
+ [
1989
+ "▁",
1990
+ "AAG"
1991
+ ],
1992
+ [
1993
+ "▁",
1994
+ "TAA"
1995
+ ],
1996
+ [
1997
+ "ATTC",
1998
+ "G"
1999
+ ],
2000
+ [
2001
+ "TG",
2002
+ "ACC"
2003
+ ],
2004
+ [
2005
+ "GGC",
2006
+ "GC"
2007
+ ],
2008
+ [
2009
+ "ATT",
2010
+ "GG"
2011
+ ],
2012
+ [
2013
+ "AA",
2014
+ "TAC"
2015
+ ],
2016
+ [
2017
+ "AA",
2018
+ "TGC"
2019
+ ],
2020
+ [
2021
+ "AA",
2022
+ "T"
2023
+ ],
2024
+ [
2025
+ "▁",
2026
+ "ATC"
2027
+ ],
2028
+ [
2029
+ "AGG",
2030
+ "GG"
2031
+ ],
2032
+ [
2033
+ "▁",
2034
+ "AGC"
2035
+ ],
2036
+ [
2037
+ "AT",
2038
+ "AGC"
2039
+ ],
2040
+ [
2041
+ "AC",
2042
+ "AGC"
2043
+ ],
2044
+ [
2045
+ "TCCC",
2046
+ "G"
2047
+ ],
2048
+ [
2049
+ "ACG",
2050
+ "TT"
2051
+ ],
2052
+ [
2053
+ "GCC",
2054
+ "CC"
2055
+ ],
2056
+ [
2057
+ "▁AAAAAAAA",
2058
+ "AAAA"
2059
+ ],
2060
+ [
2061
+ "AA",
2062
+ "TCC"
2063
+ ],
2064
+ [
2065
+ "AA",
2066
+ "CCG"
2067
+ ],
2068
+ [
2069
+ "TAA",
2070
+ "GC"
2071
+ ],
2072
+ [
2073
+ "ACG",
2074
+ "TG"
2075
+ ],
2076
+ [
2077
+ "▁C",
2078
+ "GC"
2079
+ ],
2080
+ [
2081
+ "AC",
2082
+ "T"
2083
+ ],
2084
+ [
2085
+ "TC",
2086
+ "TGC"
2087
+ ],
2088
+ [
2089
+ "AC",
2090
+ "ATT"
2091
+ ],
2092
+ [
2093
+ "AA",
2094
+ "GGC"
2095
+ ],
2096
+ [
2097
+ "AT",
2098
+ "ATC"
2099
+ ],
2100
+ [
2101
+ "AG",
2102
+ "AGC"
2103
+ ],
2104
+ [
2105
+ "TGG",
2106
+ "GC"
2107
+ ],
2108
+ [
2109
+ "AAAAAAAA",
2110
+ "AAAA"
2111
+ ],
2112
+ [
2113
+ "AT",
2114
+ "GGC"
2115
+ ],
2116
+ [
2117
+ "TAT",
2118
+ "GC"
2119
+ ],
2120
+ [
2121
+ "AG",
2122
+ "TCC"
2123
+ ],
2124
+ [
2125
+ "TG",
2126
+ "AAC"
2127
+ ],
2128
+ [
2129
+ "AT",
2130
+ "CCG"
2131
+ ],
2132
+ [
2133
+ "TACC",
2134
+ "G"
2135
+ ],
2136
+ [
2137
+ "TT",
2138
+ "TTC"
2139
+ ],
2140
+ [
2141
+ "AC",
2142
+ "GGC"
2143
+ ],
2144
+ [
2145
+ "TCG",
2146
+ "TC"
2147
+ ],
2148
+ [
2149
+ "T",
2150
+ "AGGC"
2151
+ ],
2152
+ [
2153
+ "TT",
2154
+ "ACC"
2155
+ ],
2156
+ [
2157
+ "GCG",
2158
+ "TC"
2159
+ ],
2160
+ [
2161
+ "AC",
2162
+ "TCC"
2163
+ ],
2164
+ [
2165
+ "AC",
2166
+ "ATG"
2167
+ ],
2168
+ [
2169
+ "AG",
2170
+ "TGC"
2171
+ ],
2172
+ [
2173
+ "TG",
2174
+ "TCC"
2175
+ ],
2176
+ [
2177
+ "▁",
2178
+ "ATG"
2179
+ ],
2180
+ [
2181
+ "AAG",
2182
+ "TC"
2183
+ ],
2184
+ [
2185
+ "TGG",
2186
+ "GG"
2187
+ ],
2188
+ [
2189
+ "AG",
2190
+ "CCG"
2191
+ ],
2192
+ [
2193
+ "AA",
2194
+ "TAG"
2195
+ ],
2196
+ [
2197
+ "AT",
2198
+ "AGG"
2199
+ ],
2200
+ [
2201
+ "AC",
2202
+ "TAA"
2203
+ ],
2204
+ [
2205
+ "TT",
2206
+ "AAC"
2207
+ ],
2208
+ [
2209
+ "TG",
2210
+ "CCG"
2211
+ ],
2212
+ [
2213
+ "TT",
2214
+ "CCC"
2215
+ ],
2216
+ [
2217
+ "TC",
2218
+ "ACC"
2219
+ ],
2220
+ [
2221
+ "AC",
2222
+ "AGG"
2223
+ ],
2224
+ [
2225
+ "AA",
2226
+ "TTC"
2227
+ ],
2228
+ [
2229
+ "AA",
2230
+ "ACG"
2231
+ ],
2232
+ [
2233
+ "AT",
2234
+ "AAG"
2235
+ ],
2236
+ [
2237
+ "AC",
2238
+ "TAC"
2239
+ ],
2240
+ [
2241
+ "AG",
2242
+ "T"
2243
+ ],
2244
+ [
2245
+ "TG",
2246
+ "AGC"
2247
+ ],
2248
+ [
2249
+ "TAAC",
2250
+ "G"
2251
+ ],
2252
+ [
2253
+ "AT",
2254
+ "ATG"
2255
+ ],
2256
+ [
2257
+ "AG",
2258
+ "ATG"
2259
+ ],
2260
+ [
2261
+ "AT",
2262
+ "ATT"
2263
+ ],
2264
+ [
2265
+ "AG",
2266
+ "ATC"
2267
+ ],
2268
+ [
2269
+ "TG",
2270
+ "TGC"
2271
+ ],
2272
+ [
2273
+ "TT",
2274
+ "TCC"
2275
+ ],
2276
+ [
2277
+ "AG",
2278
+ "AGG"
2279
+ ],
2280
+ [
2281
+ "AT",
2282
+ "GCG"
2283
+ ],
2284
+ [
2285
+ "▁",
2286
+ "TAC"
2287
+ ],
2288
+ [
2289
+ "▁",
2290
+ "TCC"
2291
+ ],
2292
+ [
2293
+ "▁",
2294
+ "TGC"
2295
+ ],
2296
+ [
2297
+ "AG",
2298
+ "TAC"
2299
+ ],
2300
+ [
2301
+ "TTTT",
2302
+ "G"
2303
+ ],
2304
+ [
2305
+ "TGGC",
2306
+ "G"
2307
+ ],
2308
+ [
2309
+ "AG",
2310
+ "TAA"
2311
+ ],
2312
+ [
2313
+ "AG",
2314
+ "ATT"
2315
+ ],
2316
+ [
2317
+ "AG",
2318
+ "ACG"
2319
+ ],
2320
+ [
2321
+ "AC",
2322
+ "TGG"
2323
+ ],
2324
+ [
2325
+ "AC",
2326
+ "AAG"
2327
+ ],
2328
+ [
2329
+ "AC",
2330
+ "TTC"
2331
+ ],
2332
+ [
2333
+ "CC",
2334
+ "CC"
2335
+ ],
2336
+ [
2337
+ "▁",
2338
+ "GGC"
2339
+ ],
2340
+ [
2341
+ "TC",
2342
+ "AAC"
2343
+ ],
2344
+ [
2345
+ "TC",
2346
+ "GGC"
2347
+ ],
2348
+ [
2349
+ "▁",
2350
+ "CCG"
2351
+ ],
2352
+ [
2353
+ "TT",
2354
+ "TGC"
2355
+ ],
2356
+ [
2357
+ "AT",
2358
+ "AAAA"
2359
+ ],
2360
+ [
2361
+ "AG",
2362
+ "AAG"
2363
+ ],
2364
+ [
2365
+ "TG",
2366
+ "TGG"
2367
+ ],
2368
+ [
2369
+ "TG",
2370
+ "AGG"
2371
+ ],
2372
+ [
2373
+ "TAT",
2374
+ "GG"
2375
+ ],
2376
+ [
2377
+ "AC",
2378
+ "A"
2379
+ ],
2380
+ [
2381
+ "TC",
2382
+ "TAC"
2383
+ ],
2384
+ [
2385
+ "AA",
2386
+ "TGG"
2387
+ ],
2388
+ [
2389
+ "GCC",
2390
+ "GC"
2391
+ ],
2392
+ [
2393
+ "TC",
2394
+ "ATC"
2395
+ ],
2396
+ [
2397
+ "AG",
2398
+ "TGG"
2399
+ ],
2400
+ [
2401
+ "AC",
2402
+ "TTG"
2403
+ ],
2404
+ [
2405
+ "TC",
2406
+ "TCC"
2407
+ ],
2408
+ [
2409
+ "TT",
2410
+ "GGC"
2411
+ ],
2412
+ [
2413
+ "▁",
2414
+ "AGG"
2415
+ ],
2416
+ [
2417
+ "GCC",
2418
+ "GG"
2419
+ ],
2420
+ [
2421
+ "AA",
2422
+ "GCG"
2423
+ ],
2424
+ [
2425
+ "▁C",
2426
+ "GG"
2427
+ ],
2428
+ [
2429
+ "AT",
2430
+ "ACG"
2431
+ ],
2432
+ [
2433
+ "TT",
2434
+ "AGC"
2435
+ ],
2436
+ [
2437
+ "AG",
2438
+ "TTC"
2439
+ ],
2440
+ [
2441
+ "AG",
2442
+ "A"
2443
+ ],
2444
+ [
2445
+ "TG",
2446
+ "T"
2447
+ ],
2448
+ [
2449
+ "TG",
2450
+ "ACG"
2451
+ ],
2452
+ [
2453
+ "AC",
2454
+ "GCG"
2455
+ ],
2456
+ [
2457
+ "GT",
2458
+ "CCC"
2459
+ ],
2460
+ [
2461
+ "TC",
2462
+ "AGC"
2463
+ ],
2464
+ [
2465
+ "AG",
2466
+ "AAAA"
2467
+ ],
2468
+ [
2469
+ "TAA",
2470
+ "GG"
2471
+ ],
2472
+ [
2473
+ "AG",
2474
+ "TAG"
2475
+ ],
2476
+ [
2477
+ "AA",
2478
+ "TCG"
2479
+ ],
2480
+ [
2481
+ "AC",
2482
+ "TAG"
2483
+ ],
2484
+ [
2485
+ "TG",
2486
+ "ATC"
2487
+ ],
2488
+ [
2489
+ "TT",
2490
+ "CCG"
2491
+ ],
2492
+ [
2493
+ "TT",
2494
+ "TGG"
2495
+ ],
2496
+ [
2497
+ "TT",
2498
+ "TAC"
2499
+ ],
2500
+ [
2501
+ "AC",
2502
+ "ACG"
2503
+ ],
2504
+ [
2505
+ "AA",
2506
+ "TTG"
2507
+ ],
2508
+ [
2509
+ "TG",
2510
+ "ATG"
2511
+ ],
2512
+ [
2513
+ "GT",
2514
+ "ACC"
2515
+ ],
2516
+ [
2517
+ "TG",
2518
+ "A"
2519
+ ],
2520
+ [
2521
+ "TG",
2522
+ "TAC"
2523
+ ],
2524
+ [
2525
+ "TC",
2526
+ "TGG"
2527
+ ],
2528
+ [
2529
+ "TG",
2530
+ "ATT"
2531
+ ],
2532
+ [
2533
+ "T",
2534
+ "ATTC"
2535
+ ],
2536
+ [
2537
+ "▁",
2538
+ "ACG"
2539
+ ],
2540
+ [
2541
+ "AT",
2542
+ "GGG"
2543
+ ],
2544
+ [
2545
+ "AG",
2546
+ "TCG"
2547
+ ],
2548
+ [
2549
+ "▁",
2550
+ "TAG"
2551
+ ],
2552
+ [
2553
+ "TT",
2554
+ "ATC"
2555
+ ],
2556
+ [
2557
+ "AC",
2558
+ "GGG"
2559
+ ],
2560
+ [
2561
+ "TC",
2562
+ "AGG"
2563
+ ],
2564
+ [
2565
+ "TG",
2566
+ "TTC"
2567
+ ],
2568
+ [
2569
+ "TC",
2570
+ "GCG"
2571
+ ],
2572
+ [
2573
+ "CC",
2574
+ "GC"
2575
+ ],
2576
+ [
2577
+ "TC",
2578
+ "TTC"
2579
+ ],
2580
+ [
2581
+ "AC",
2582
+ "TCG"
2583
+ ],
2584
+ [
2585
+ "▁",
2586
+ "GCG"
2587
+ ],
2588
+ [
2589
+ "TT",
2590
+ "TAA"
2591
+ ],
2592
+ [
2593
+ "TT",
2594
+ "AGG"
2595
+ ],
2596
+ [
2597
+ "AC",
2598
+ "AAAA"
2599
+ ],
2600
+ [
2601
+ "TG",
2602
+ "TAG"
2603
+ ],
2604
+ [
2605
+ "T",
2606
+ "AGCG"
2607
+ ],
2608
+ [
2609
+ "ACTGC",
2610
+ "AGAC"
2611
+ ],
2612
+ [
2613
+ "AG",
2614
+ "TTG"
2615
+ ],
2616
+ [
2617
+ "GT",
2618
+ "GGC"
2619
+ ],
2620
+ [
2621
+ "GT",
2622
+ "AAC"
2623
+ ],
2624
+ [
2625
+ "CC",
2626
+ "GG"
2627
+ ],
2628
+ [
2629
+ "GT",
2630
+ "CCG"
2631
+ ],
2632
+ [
2633
+ "TT",
2634
+ "ATT"
2635
+ ],
2636
+ [
2637
+ "TT",
2638
+ "GCG"
2639
+ ],
2640
+ [
2641
+ "TG",
2642
+ "AAG"
2643
+ ],
2644
+ [
2645
+ "AA",
2646
+ "GGG"
2647
+ ],
2648
+ [
2649
+ "TC",
2650
+ "ATT"
2651
+ ],
2652
+ [
2653
+ "▁",
2654
+ "TTC"
2655
+ ],
2656
+ [
2657
+ "TG",
2658
+ "TCG"
2659
+ ],
2660
+ [
2661
+ "TT",
2662
+ "TAG"
2663
+ ],
2664
+ [
2665
+ "▁",
2666
+ "AAAC"
2667
+ ],
2668
+ [
2669
+ "TC",
2670
+ "ATG"
2671
+ ],
2672
+ [
2673
+ "▁",
2674
+ "TTG"
2675
+ ],
2676
+ [
2677
+ "T",
2678
+ "ATCG"
2679
+ ],
2680
+ [
2681
+ "TT",
2682
+ "TCG"
2683
+ ],
2684
+ [
2685
+ "TAGG",
2686
+ "G"
2687
+ ],
2688
+ [
2689
+ "TT",
2690
+ "ATG"
2691
+ ],
2692
+ [
2693
+ "▁",
2694
+ "TCG"
2695
+ ],
2696
+ [
2697
+ "TG",
2698
+ "TAA"
2699
+ ],
2700
+ [
2701
+ "TC",
2702
+ "TAA"
2703
+ ],
2704
+ [
2705
+ "TC",
2706
+ "GGG"
2707
+ ],
2708
+ [
2709
+ "AAAA",
2710
+ "CC"
2711
+ ],
2712
+ [
2713
+ "GT",
2714
+ "AGC"
2715
+ ],
2716
+ [
2717
+ "TC",
2718
+ "TAG"
2719
+ ],
2720
+ [
2721
+ "ACCC",
2722
+ "GC"
2723
+ ],
2724
+ [
2725
+ "TGC",
2726
+ "AGAC"
2727
+ ],
2728
+ [
2729
+ "TT",
2730
+ "AAG"
2731
+ ],
2732
+ [
2733
+ "TC",
2734
+ "AT"
2735
+ ],
2736
+ [
2737
+ "TC",
2738
+ "TCG"
2739
+ ],
2740
+ [
2741
+ "TT",
2742
+ "ACG"
2743
+ ],
2744
+ [
2745
+ "AAAAC",
2746
+ "G"
2747
+ ],
2748
+ [
2749
+ "TG",
2750
+ "TTG"
2751
+ ],
2752
+ [
2753
+ "AACC",
2754
+ "CC"
2755
+ ],
2756
+ [
2757
+ "GT",
2758
+ "GCG"
2759
+ ],
2760
+ [
2761
+ "TC",
2762
+ "AAG"
2763
+ ],
2764
+ [
2765
+ "TG",
2766
+ "AT"
2767
+ ],
2768
+ [
2769
+ "TC",
2770
+ "ACG"
2771
+ ],
2772
+ [
2773
+ "TT",
2774
+ "GGG"
2775
+ ],
2776
+ [
2777
+ "GT",
2778
+ "ATC"
2779
+ ],
2780
+ [
2781
+ "TC",
2782
+ "TTG"
2783
+ ],
2784
+ [
2785
+ "AGCC",
2786
+ "CC"
2787
+ ],
2788
+ [
2789
+ "AA",
2790
+ "TAT"
2791
+ ],
2792
+ [
2793
+ "AAAA",
2794
+ "GC"
2795
+ ],
2796
+ [
2797
+ "▁",
2798
+ "AAAG"
2799
+ ],
2800
+ [
2801
+ "GT",
2802
+ "AGG"
2803
+ ],
2804
+ [
2805
+ "AACC",
2806
+ "GC"
2807
+ ],
2808
+ [
2809
+ "TGCC",
2810
+ "CC"
2811
+ ],
2812
+ [
2813
+ "AGCC",
2814
+ "GC"
2815
+ ],
2816
+ [
2817
+ "T",
2818
+ "ATTG"
2819
+ ],
2820
+ [
2821
+ "ACC",
2822
+ "AC"
2823
+ ],
2824
+ [
2825
+ "GT",
2826
+ "AA"
2827
+ ],
2828
+ [
2829
+ "ACCC",
2830
+ "GG"
2831
+ ],
2832
+ [
2833
+ "AAAC",
2834
+ "GC"
2835
+ ],
2836
+ [
2837
+ "AAC",
2838
+ "AC"
2839
+ ],
2840
+ [
2841
+ "TC",
2842
+ "A"
2843
+ ],
2844
+ [
2845
+ "TC",
2846
+ "T"
2847
+ ],
2848
+ [
2849
+ "TGCC",
2850
+ "GC"
2851
+ ],
2852
+ [
2853
+ "TT",
2854
+ "AT"
2855
+ ],
2856
+ [
2857
+ "GT",
2858
+ "ATT"
2859
+ ],
2860
+ [
2861
+ "AGAC",
2862
+ "GC"
2863
+ ],
2864
+ [
2865
+ "GT",
2866
+ "ATG"
2867
+ ],
2868
+ [
2869
+ "ACC",
2870
+ "TG"
2871
+ ],
2872
+ [
2873
+ "▁",
2874
+ "TAT"
2875
+ ],
2876
+ [
2877
+ "AACC",
2878
+ "GG"
2879
+ ],
2880
+ [
2881
+ "TCAC",
2882
+ "TGCAGAC"
2883
+ ],
2884
+ [
2885
+ "AGCC",
2886
+ "GG"
2887
+ ],
2888
+ [
2889
+ "TGCC",
2890
+ "GG"
2891
+ ],
2892
+ [
2893
+ "AGAC",
2894
+ "GG"
2895
+ ],
2896
+ [
2897
+ "GT",
2898
+ "GGG"
2899
+ ],
2900
+ [
2901
+ "ACC",
2902
+ "TC"
2903
+ ],
2904
+ [
2905
+ "ATCC",
2906
+ "CC"
2907
+ ],
2908
+ [
2909
+ "AAC",
2910
+ "AAC"
2911
+ ],
2912
+ [
2913
+ "▁",
2914
+ "TGG"
2915
+ ],
2916
+ [
2917
+ "GT",
2918
+ "ACG"
2919
+ ],
2920
+ [
2921
+ "AAG",
2922
+ "AC"
2923
+ ],
2924
+ [
2925
+ "ACC",
2926
+ "TT"
2927
+ ],
2928
+ [
2929
+ "ATGC",
2930
+ "GG"
2931
+ ],
2932
+ [
2933
+ "ACC",
2934
+ "GCC"
2935
+ ],
2936
+ [
2937
+ "▁",
2938
+ "AATT"
2939
+ ],
2940
+ [
2941
+ "AT",
2942
+ "AAAC"
2943
+ ],
2944
+ [
2945
+ "AAGG",
2946
+ "CC"
2947
+ ],
2948
+ [
2949
+ "▁",
2950
+ "ACAC"
2951
+ ],
2952
+ [
2953
+ "AAG",
2954
+ "AAC"
2955
+ ],
2956
+ [
2957
+ "ACGG",
2958
+ "CC"
2959
+ ],
2960
+ [
2961
+ "AT",
2962
+ "A"
2963
+ ],
2964
+ [
2965
+ "TCGG",
2966
+ "CC"
2967
+ ],
2968
+ [
2969
+ "▁C",
2970
+ "TT"
2971
+ ],
2972
+ [
2973
+ "AAGC",
2974
+ "GC"
2975
+ ],
2976
+ [
2977
+ "T",
2978
+ "AAAAC"
2979
+ ],
2980
+ [
2981
+ "TCGC",
2982
+ "GG"
2983
+ ],
2984
+ [
2985
+ "TTTTTTTTTTTTTTTT",
2986
+ "TTTT"
2987
+ ],
2988
+ [
2989
+ "AA",
2990
+ "AGAC"
2991
+ ],
2992
+ [
2993
+ "ATCC",
2994
+ "GG"
2995
+ ],
2996
+ [
2997
+ "AAAA",
2998
+ "GG"
2999
+ ],
3000
+ [
3001
+ "AG",
3002
+ "TAT"
3003
+ ],
3004
+ [
3005
+ "ATCC",
3006
+ "GC"
3007
+ ],
3008
+ [
3009
+ "AA",
3010
+ "A"
3011
+ ],
3012
+ [
3013
+ "ACG",
3014
+ "AC"
3015
+ ],
3016
+ [
3017
+ "AGC",
3018
+ "AC"
3019
+ ],
3020
+ [
3021
+ "AGGC",
3022
+ "GC"
3023
+ ],
3024
+ [
3025
+ "AAG",
3026
+ "TT"
3027
+ ],
3028
+ [
3029
+ "ATC",
3030
+ "TAC"
3031
+ ],
3032
+ [
3033
+ "AA",
3034
+ "ACCC"
3035
+ ],
3036
+ [
3037
+ "TACG",
3038
+ "CC"
3039
+ ],
3040
+ [
3041
+ "▁",
3042
+ "AACC"
3043
+ ],
3044
+ [
3045
+ "ACG",
3046
+ "A"
3047
+ ],
3048
+ [
3049
+ "ATG",
3050
+ "TC"
3051
+ ],
3052
+ [
3053
+ "AAC",
3054
+ "TC"
3055
+ ],
3056
+ [
3057
+ "ATGC",
3058
+ "GC"
3059
+ ],
3060
+ [
3061
+ "AAAC",
3062
+ "GG"
3063
+ ],
3064
+ [
3065
+ "AAC",
3066
+ "TG"
3067
+ ],
3068
+ [
3069
+ "AGGC",
3070
+ "GG"
3071
+ ],
3072
+ [
3073
+ "TCGC",
3074
+ "GC"
3075
+ ],
3076
+ [
3077
+ "AAAAAAAAAAAAAAAA",
3078
+ "AAAA"
3079
+ ],
3080
+ [
3081
+ "AAG",
3082
+ "TG"
3083
+ ],
3084
+ [
3085
+ "AAC",
3086
+ "TT"
3087
+ ],
3088
+ [
3089
+ "ATGG",
3090
+ "CC"
3091
+ ],
3092
+ [
3093
+ "AAC",
3094
+ "ATC"
3095
+ ],
3096
+ [
3097
+ "TTTTTTTT",
3098
+ "TTTT"
3099
+ ],
3100
+ [
3101
+ "ACG",
3102
+ "CCC"
3103
+ ],
3104
+ [
3105
+ "AAGC",
3106
+ "GG"
3107
+ ],
3108
+ [
3109
+ "AC",
3110
+ "TAT"
3111
+ ],
3112
+ [
3113
+ "▁",
3114
+ "GGG"
3115
+ ],
3116
+ [
3117
+ "TCCC",
3118
+ "GC"
3119
+ ],
3120
+ [
3121
+ "▁",
3122
+ "ACCC"
3123
+ ],
3124
+ [
3125
+ "AA",
3126
+ "TAAC"
3127
+ ],
3128
+ [
3129
+ "AGG",
3130
+ "TC"
3131
+ ],
3132
+ [
3133
+ "AA",
3134
+ "AGCC"
3135
+ ],
3136
+ [
3137
+ "ACC",
3138
+ "CCC"
3139
+ ],
3140
+ [
3141
+ "ACGC",
3142
+ "GG"
3143
+ ],
3144
+ [
3145
+ "ACGC",
3146
+ "GC"
3147
+ ],
3148
+ [
3149
+ "▁",
3150
+ "AAAT"
3151
+ ],
3152
+ [
3153
+ "TACC",
3154
+ "CC"
3155
+ ],
3156
+ [
3157
+ "TACC",
3158
+ "GC"
3159
+ ],
3160
+ [
3161
+ "GT",
3162
+ "AT"
3163
+ ],
3164
+ [
3165
+ "AG",
3166
+ "AAAC"
3167
+ ],
3168
+ [
3169
+ "GT",
3170
+ "A"
3171
+ ],
3172
+ [
3173
+ "TTCC",
3174
+ "GC"
3175
+ ],
3176
+ [
3177
+ "TT",
3178
+ "T"
3179
+ ],
3180
+ [
3181
+ "AAG",
3182
+ "CCC"
3183
+ ],
3184
+ [
3185
+ "TAAAA",
3186
+ "G"
3187
+ ],
3188
+ [
3189
+ "TCG",
3190
+ "TG"
3191
+ ],
3192
+ [
3193
+ "TTC",
3194
+ "ACTGCAGAC"
3195
+ ],
3196
+ [
3197
+ "AGC",
3198
+ "TG"
3199
+ ],
3200
+ [
3201
+ "ATG",
3202
+ "AC"
3203
+ ],
3204
+ [
3205
+ "TAAG",
3206
+ "CC"
3207
+ ],
3208
+ [
3209
+ "AGC",
3210
+ "TC"
3211
+ ],
3212
+ [
3213
+ "ACC",
3214
+ "AG"
3215
+ ],
3216
+ [
3217
+ "ACAC",
3218
+ "GC"
3219
+ ],
3220
+ [
3221
+ "TCCC",
3222
+ "GG"
3223
+ ],
3224
+ [
3225
+ "AGC",
3226
+ "TT"
3227
+ ],
3228
+ [
3229
+ "TCG",
3230
+ "AC"
3231
+ ],
3232
+ [
3233
+ "AATT",
3234
+ "GC"
3235
+ ],
3236
+ [
3237
+ "AAC",
3238
+ "ACC"
3239
+ ],
3240
+ [
3241
+ "ATC",
3242
+ "TG"
3243
+ ],
3244
+ [
3245
+ "TCG",
3246
+ "CCC"
3247
+ ],
3248
+ [
3249
+ "AAC",
3250
+ "AG"
3251
+ ],
3252
+ [
3253
+ "TTCC",
3254
+ "CC"
3255
+ ],
3256
+ [
3257
+ "ATG",
3258
+ "CCC"
3259
+ ],
3260
+ [
3261
+ "AA",
3262
+ "ATGC"
3263
+ ],
3264
+ [
3265
+ "▁CC",
3266
+ "CC"
3267
+ ],
3268
+ [
3269
+ "TTCC",
3270
+ "GG"
3271
+ ],
3272
+ [
3273
+ "TTGG",
3274
+ "CC"
3275
+ ],
3276
+ [
3277
+ "AC",
3278
+ "AAAC"
3279
+ ],
3280
+ [
3281
+ "ACGG",
3282
+ "GC"
3283
+ ],
3284
+ [
3285
+ "ATC",
3286
+ "GCC"
3287
+ ],
3288
+ [
3289
+ "ATT",
3290
+ "TG"
3291
+ ],
3292
+ [
3293
+ "TCGG",
3294
+ "GC"
3295
+ ],
3296
+ [
3297
+ "TTGC",
3298
+ "GG"
3299
+ ],
3300
+ [
3301
+ "AAC",
3302
+ "GCC"
3303
+ ],
3304
+ [
3305
+ "▁",
3306
+ "AAGC"
3307
+ ],
3308
+ [
3309
+ "AGC",
3310
+ "AG"
3311
+ ],
3312
+ [
3313
+ "▁G",
3314
+ "TC"
3315
+ ],
3316
+ [
3317
+ "ACC",
3318
+ "ACC"
3319
+ ],
3320
+ [
3321
+ "ATC",
3322
+ "AC"
3323
+ ],
3324
+ [
3325
+ "ACG",
3326
+ "AG"
3327
+ ],
3328
+ [
3329
+ "▁",
3330
+ "AATC"
3331
+ ],
3332
+ [
3333
+ "AAG",
3334
+ "AAAA"
3335
+ ],
3336
+ [
3337
+ "AGC",
3338
+ "GCC"
3339
+ ],
3340
+ [
3341
+ "ATG",
3342
+ "TG"
3343
+ ],
3344
+ [
3345
+ "AA",
3346
+ "GTCC"
3347
+ ],
3348
+ [
3349
+ "AT",
3350
+ "AACC"
3351
+ ],
3352
+ [
3353
+ "▁",
3354
+ "AATG"
3355
+ ],
3356
+ [
3357
+ "ATC",
3358
+ "TT"
3359
+ ],
3360
+ [
3361
+ "ATGG",
3362
+ "GC"
3363
+ ],
3364
+ [
3365
+ "TTG",
3366
+ "CCC"
3367
+ ],
3368
+ [
3369
+ "AAGG",
3370
+ "GC"
3371
+ ],
3372
+ [
3373
+ "▁G",
3374
+ "CCC"
3375
+ ],
3376
+ [
3377
+ "AAG",
3378
+ "AG"
3379
+ ],
3380
+ [
3381
+ "▁C",
3382
+ "TC"
3383
+ ],
3384
+ [
3385
+ "▁",
3386
+ "AGAC"
3387
+ ],
3388
+ [
3389
+ "AGG",
3390
+ "AC"
3391
+ ],
3392
+ [
3393
+ "TCGG",
3394
+ "GG"
3395
+ ],
3396
+ [
3397
+ "TTGC",
3398
+ "GC"
3399
+ ],
3400
+ [
3401
+ "▁G",
3402
+ "TT"
3403
+ ],
3404
+ [
3405
+ "ACAC",
3406
+ "GG"
3407
+ ],
3408
+ [
3409
+ "ATC",
3410
+ "TC"
3411
+ ],
3412
+ [
3413
+ "▁",
3414
+ "AGCC"
3415
+ ],
3416
+ [
3417
+ "ATTC",
3418
+ "GC"
3419
+ ],
3420
+ [
3421
+ "AA",
3422
+ "TACC"
3423
+ ],
3424
+ [
3425
+ "▁C",
3426
+ "AC"
3427
+ ],
3428
+ [
3429
+ "ATT",
3430
+ "TC"
3431
+ ],
3432
+ [
3433
+ "ACG",
3434
+ "ACC"
3435
+ ],
3436
+ [
3437
+ "TTC",
3438
+ "GCC"
3439
+ ],
3440
+ [
3441
+ "ACG",
3442
+ "AAC"
3443
+ ],
3444
+ [
3445
+ "▁CC",
3446
+ "GC"
3447
+ ],
3448
+ [
3449
+ "ATG",
3450
+ "TT"
3451
+ ],
3452
+ [
3453
+ "ATTC",
3454
+ "GG"
3455
+ ],
3456
+ [
3457
+ "AGG",
3458
+ "TG"
3459
+ ],
3460
+ [
3461
+ "TTTT",
3462
+ "CC"
3463
+ ],
3464
+ [
3465
+ "TTG",
3466
+ "AC"
3467
+ ],
3468
+ [
3469
+ "ACGG",
3470
+ "GG"
3471
+ ],
3472
+ [
3473
+ "AA",
3474
+ "ATAC"
3475
+ ],
3476
+ [
3477
+ "ATT",
3478
+ "GCC"
3479
+ ],
3480
+ [
3481
+ "GT",
3482
+ "AAG"
3483
+ ],
3484
+ [
3485
+ "TTG",
3486
+ "TC"
3487
+ ],
3488
+ [
3489
+ "TATG",
3490
+ "CC"
3491
+ ],
3492
+ [
3493
+ "AA",
3494
+ "TGCC"
3495
+ ],
3496
+ [
3497
+ "AGG",
3498
+ "CCC"
3499
+ ],
3500
+ [
3501
+ "AG",
3502
+ "AACC"
3503
+ ],
3504
+ [
3505
+ "ACC",
3506
+ "GGC"
3507
+ ],
3508
+ [
3509
+ "TT",
3510
+ "A"
3511
+ ],
3512
+ [
3513
+ "AGC",
3514
+ "TGC"
3515
+ ],
3516
+ [
3517
+ "AC",
3518
+ "GTCC"
3519
+ ],
3520
+ [
3521
+ "AAC",
3522
+ "TGC"
3523
+ ],
3524
+ [
3525
+ "ACC",
3526
+ "TCC"
3527
+ ],
3528
+ [
3529
+ "ATT",
3530
+ "TT"
3531
+ ],
3532
+ [
3533
+ "TACC",
3534
+ "GG"
3535
+ ],
3536
+ [
3537
+ "AA",
3538
+ "ACCG"
3539
+ ],
3540
+ [
3541
+ "AA",
3542
+ "ATCC"
3543
+ ],
3544
+ [
3545
+ "TTTT",
3546
+ "GC"
3547
+ ],
3548
+ [
3549
+ "ATC",
3550
+ "TGC"
3551
+ ],
3552
+ [
3553
+ "AA",
3554
+ "GTGC"
3555
+ ],
3556
+ [
3557
+ "TAA",
3558
+ "AC"
3559
+ ],
3560
+ [
3561
+ "AATT",
3562
+ "CC"
3563
+ ],
3564
+ [
3565
+ "▁",
3566
+ "TAAC"
3567
+ ],
3568
+ [
3569
+ "▁G",
3570
+ "AC"
3571
+ ],
3572
+ [
3573
+ "▁C",
3574
+ "TG"
3575
+ ],
3576
+ [
3577
+ "TCG",
3578
+ "TT"
3579
+ ],
3580
+ [
3581
+ "GCG",
3582
+ "TG"
3583
+ ],
3584
+ [
3585
+ "TGGC",
3586
+ "GG"
3587
+ ],
3588
+ [
3589
+ "▁C",
3590
+ "TGC"
3591
+ ],
3592
+ [
3593
+ "ACC",
3594
+ "GT"
3595
+ ],
3596
+ [
3597
+ "ATGG",
3598
+ "GG"
3599
+ ],
3600
+ [
3601
+ "AG",
3602
+ "ACCC"
3603
+ ],
3604
+ [
3605
+ "ACG",
3606
+ "AGC"
3607
+ ],
3608
+ [
3609
+ "ATT",
3610
+ "AC"
3611
+ ],
3612
+ [
3613
+ "▁",
3614
+ "GTCC"
3615
+ ],
3616
+ [
3617
+ "TGGC",
3618
+ "GC"
3619
+ ],
3620
+ [
3621
+ "AT",
3622
+ "ACCC"
3623
+ ],
3624
+ [
3625
+ "AT",
3626
+ "AGCC"
3627
+ ],
3628
+ [
3629
+ "AT",
3630
+ "AAAG"
3631
+ ],
3632
+ [
3633
+ "AA",
3634
+ "TAAAA"
3635
+ ],
3636
+ [
3637
+ "AGG",
3638
+ "TT"
3639
+ ],
3640
+ [
3641
+ "▁C",
3642
+ "GCC"
3643
+ ],
3644
+ [
3645
+ "TCG",
3646
+ "AG"
3647
+ ],
3648
+ [
3649
+ "ACC",
3650
+ "TGC"
3651
+ ],
3652
+ [
3653
+ "ACC",
3654
+ "AAC"
3655
+ ],
3656
+ [
3657
+ "TAGG",
3658
+ "CC"
3659
+ ],
3660
+ [
3661
+ "AA",
3662
+ "AGGC"
3663
+ ],
3664
+ [
3665
+ "TTG",
3666
+ "TG"
3667
+ ],
3668
+ [
3669
+ "▁C",
3670
+ "ATC"
3671
+ ],
3672
+ [
3673
+ "▁",
3674
+ "ATCC"
3675
+ ],
3676
+ [
3677
+ "TCC",
3678
+ "GCC"
3679
+ ],
3680
+ [
3681
+ "GTGG",
3682
+ "CC"
3683
+ ],
3684
+ [
3685
+ "AG",
3686
+ "AAAG"
3687
+ ],
3688
+ [
3689
+ "TCG",
3690
+ "A"
3691
+ ],
3692
+ [
3693
+ "▁",
3694
+ "GGCC"
3695
+ ],
3696
+ [
3697
+ "▁C",
3698
+ "TAA"
3699
+ ],
3700
+ [
3701
+ "AT",
3702
+ "ACAC"
3703
+ ],
3704
+ [
3705
+ "AG",
3706
+ "AAGC"
3707
+ ],
3708
+ [
3709
+ "ACC",
3710
+ "TAC"
3711
+ ],
3712
+ [
3713
+ "▁",
3714
+ "ACGC"
3715
+ ],
3716
+ [
3717
+ "▁C",
3718
+ "ATT"
3719
+ ],
3720
+ [
3721
+ "AGC",
3722
+ "ATC"
3723
+ ],
3724
+ [
3725
+ "AAC",
3726
+ "GT"
3727
+ ],
3728
+ [
3729
+ "AATT",
3730
+ "GG"
3731
+ ],
3732
+ [
3733
+ "▁",
3734
+ "AAAAG"
3735
+ ],
3736
+ [
3737
+ "AGG",
3738
+ "GCC"
3739
+ ],
3740
+ [
3741
+ "▁",
3742
+ "ATAC"
3743
+ ],
3744
+ [
3745
+ "ATG",
3746
+ "TCC"
3747
+ ],
3748
+ [
3749
+ "▁",
3750
+ "TTTT"
3751
+ ],
3752
+ [
3753
+ "ACC",
3754
+ "CCG"
3755
+ ],
3756
+ [
3757
+ "AA",
3758
+ "TAGC"
3759
+ ],
3760
+ [
3761
+ "AT",
3762
+ "AAGC"
3763
+ ],
3764
+ [
3765
+ "TTC",
3766
+ "TC"
3767
+ ],
3768
+ [
3769
+ "AC",
3770
+ "AACC"
3771
+ ],
3772
+ [
3773
+ "ACG",
3774
+ "AGG"
3775
+ ],
3776
+ [
3777
+ "ACC",
3778
+ "TGG"
3779
+ ],
3780
+ [
3781
+ "TAAC",
3782
+ "GC"
3783
+ ],
3784
+ [
3785
+ "AAG",
3786
+ "CCG"
3787
+ ],
3788
+ [
3789
+ "▁C",
3790
+ "AAC"
3791
+ ],
3792
+ [
3793
+ "TTGG",
3794
+ "GC"
3795
+ ],
3796
+ [
3797
+ "ACG",
3798
+ "CCG"
3799
+ ],
3800
+ [
3801
+ "AA",
3802
+ "TCCC"
3803
+ ],
3804
+ [
3805
+ "AA",
3806
+ "TCGC"
3807
+ ],
3808
+ [
3809
+ "▁",
3810
+ "AGTC"
3811
+ ],
3812
+ [
3813
+ "TTC",
3814
+ "TG"
3815
+ ],
3816
+ [
3817
+ "CCC",
3818
+ "TC"
3819
+ ],
3820
+ [
3821
+ "ACC",
3822
+ "ATC"
3823
+ ],
3824
+ [
3825
+ "AGC",
3826
+ "AAC"
3827
+ ],
3828
+ [
3829
+ "TT",
3830
+ "TAT"
3831
+ ],
3832
+ [
3833
+ "▁",
3834
+ "ATGC"
3835
+ ],
3836
+ [
3837
+ "GTCC",
3838
+ "GG"
3839
+ ],
3840
+ [
3841
+ "ACC",
3842
+ "A"
3843
+ ],
3844
+ [
3845
+ "CCC",
3846
+ "TG"
3847
+ ],
3848
+ [
3849
+ "▁",
3850
+ "AAGG"
3851
+ ],
3852
+ [
3853
+ "ATG",
3854
+ "AAC"
3855
+ ],
3856
+ [
3857
+ "CCC",
3858
+ "AC"
3859
+ ],
3860
+ [
3861
+ "TT",
3862
+ "AAAA"
3863
+ ],
3864
+ [
3865
+ "GTGC",
3866
+ "GG"
3867
+ ],
3868
+ [
3869
+ "AT",
3870
+ "AGAC"
3871
+ ],
3872
+ [
3873
+ "AGG",
3874
+ "CCG"
3875
+ ],
3876
+ [
3877
+ "▁C",
3878
+ "TAC"
3879
+ ],
3880
+ [
3881
+ "TCC",
3882
+ "TG"
3883
+ ],
3884
+ [
3885
+ "AG",
3886
+ "AGCC"
3887
+ ],
3888
+ [
3889
+ "TAA",
3890
+ "TC"
3891
+ ],
3892
+ [
3893
+ "GTCC",
3894
+ "CC"
3895
+ ],
3896
+ [
3897
+ "TGC",
3898
+ "TG"
3899
+ ],
3900
+ [
3901
+ "AGC",
3902
+ "TAC"
3903
+ ],
3904
+ [
3905
+ "AGC",
3906
+ "GGC"
3907
+ ],
3908
+ [
3909
+ "▁GC",
3910
+ "GC"
3911
+ ],
3912
+ [
3913
+ "AAGG",
3914
+ "GG"
3915
+ ],
3916
+ [
3917
+ "▁",
3918
+ "AAAAC"
3919
+ ],
3920
+ [
3921
+ "AA",
3922
+ "CCCG"
3923
+ ],
3924
+ [
3925
+ "AT",
3926
+ "ACGC"
3927
+ ],
3928
+ [
3929
+ "AG",
3930
+ "TGCC"
3931
+ ],
3932
+ [
3933
+ "GCG",
3934
+ "TT"
3935
+ ],
3936
+ [
3937
+ "TATC",
3938
+ "GC"
3939
+ ],
3940
+ [
3941
+ "▁",
3942
+ "TACC"
3943
+ ],
3944
+ [
3945
+ "TTG",
3946
+ "TT"
3947
+ ],
3948
+ [
3949
+ "AAAA",
3950
+ "AAC"
3951
+ ],
3952
+ [
3953
+ "GTCC",
3954
+ "GC"
3955
+ ],
3956
+ [
3957
+ "TGC",
3958
+ "TC"
3959
+ ],
3960
+ [
3961
+ "AAG",
3962
+ "ACC"
3963
+ ],
3964
+ [
3965
+ "AGC",
3966
+ "GT"
3967
+ ],
3968
+ [
3969
+ "TCC",
3970
+ "TC"
3971
+ ],
3972
+ [
3973
+ "ATG",
3974
+ "ACC"
3975
+ ],
3976
+ [
3977
+ "▁",
3978
+ "TTGC"
3979
+ ],
3980
+ [
3981
+ "AC",
3982
+ "ATCC"
3983
+ ],
3984
+ [
3985
+ "AGG",
3986
+ "A"
3987
+ ],
3988
+ [
3989
+ "TTC",
3990
+ "GGC"
3991
+ ],
3992
+ [
3993
+ "ATC",
3994
+ "AG"
3995
+ ],
3996
+ [
3997
+ "TTGG",
3998
+ "GG"
3999
+ ],
4000
+ [
4001
+ "TGC",
4002
+ "GCC"
4003
+ ],
4004
+ [
4005
+ "▁",
4006
+ "ACCG"
4007
+ ],
4008
+ [
4009
+ "AT",
4010
+ "ATCC"
4011
+ ],
4012
+ [
4013
+ "▁",
4014
+ "TATT"
4015
+ ],
4016
+ [
4017
+ "AA",
4018
+ "ATGG"
4019
+ ],
4020
+ [
4021
+ "TAGC",
4022
+ "GG"
4023
+ ],
4024
+ [
4025
+ "▁",
4026
+ "AGTT"
4027
+ ],
4028
+ [
4029
+ "TG",
4030
+ "AAAA"
4031
+ ],
4032
+ [
4033
+ "TTC",
4034
+ "TT"
4035
+ ],
4036
+ [
4037
+ "GGG",
4038
+ "TC"
4039
+ ],
4040
+ [
4041
+ "AAG",
4042
+ "AGC"
4043
+ ],
4044
+ [
4045
+ "GCG",
4046
+ "AC"
4047
+ ],
4048
+ [
4049
+ "AAC",
4050
+ "TAC"
4051
+ ],
4052
+ [
4053
+ "TAGC",
4054
+ "GC"
4055
+ ],
4056
+ [
4057
+ "ATG",
4058
+ "CCG"
4059
+ ],
4060
+ [
4061
+ "AA",
4062
+ "TAAG"
4063
+ ],
4064
+ [
4065
+ "▁",
4066
+ "TGCC"
4067
+ ],
4068
+ [
4069
+ "GGG",
4070
+ "A"
4071
+ ],
4072
+ [
4073
+ "AAC",
4074
+ "ATT"
4075
+ ],
4076
+ [
4077
+ "CCC",
4078
+ "GCC"
4079
+ ],
4080
+ [
4081
+ "▁",
4082
+ "ACTG"
4083
+ ],
4084
+ [
4085
+ "▁",
4086
+ "GTGC"
4087
+ ],
4088
+ [
4089
+ "ACG",
4090
+ "ATT"
4091
+ ],
4092
+ [
4093
+ "TGG",
4094
+ "TC"
4095
+ ],
4096
+ [
4097
+ "TCC",
4098
+ "AC"
4099
+ ],
4100
+ [
4101
+ "ATG",
4102
+ "TGC"
4103
+ ],
4104
+ [
4105
+ "AA",
4106
+ "AGCG"
4107
+ ],
4108
+ [
4109
+ "AAC",
4110
+ "GGC"
4111
+ ],
4112
+ [
4113
+ "TTTT",
4114
+ "GG"
4115
+ ],
4116
+ [
4117
+ "ACC",
4118
+ "ATT"
4119
+ ],
4120
+ [
4121
+ "AGG",
4122
+ "AG"
4123
+ ],
4124
+ [
4125
+ "ATG",
4126
+ "AG"
4127
+ ],
4128
+ [
4129
+ "AT",
4130
+ "AATC"
4131
+ ],
4132
+ [
4133
+ "▁",
4134
+ "TCCC"
4135
+ ],
4136
+ [
4137
+ "▁CC",
4138
+ "GG"
4139
+ ],
4140
+ [
4141
+ "▁C",
4142
+ "AG"
4143
+ ],
4144
+ [
4145
+ "ACG",
4146
+ "ATC"
4147
+ ],
4148
+ [
4149
+ "▁",
4150
+ "TAAAA"
4151
+ ],
4152
+ [
4153
+ "GCG",
4154
+ "CCC"
4155
+ ],
4156
+ [
4157
+ "AA",
4158
+ "TATT"
4159
+ ],
4160
+ [
4161
+ "AGC",
4162
+ "TCC"
4163
+ ],
4164
+ [
4165
+ "TAC",
4166
+ "AC"
4167
+ ],
4168
+ [
4169
+ "AAG",
4170
+ "AAG"
4171
+ ],
4172
+ [
4173
+ "▁",
4174
+ "AGGC"
4175
+ ],
4176
+ [
4177
+ "GCG",
4178
+ "A"
4179
+ ],
4180
+ [
4181
+ "▁",
4182
+ "TCGC"
4183
+ ],
4184
+ [
4185
+ "AT",
4186
+ "CCCG"
4187
+ ],
4188
+ [
4189
+ "▁C",
4190
+ "TCC"
4191
+ ],
4192
+ [
4193
+ "AT",
4194
+ "ACGG"
4195
+ ],
4196
+ [
4197
+ "ACC",
4198
+ "TAA"
4199
+ ],
4200
+ [
4201
+ "GGC",
4202
+ "TC"
4203
+ ],
4204
+ [
4205
+ "▁",
4206
+ "ATTC"
4207
+ ],
4208
+ [
4209
+ "TAAC",
4210
+ "GG"
4211
+ ],
4212
+ [
4213
+ "AT",
4214
+ "AATG"
4215
+ ],
4216
+ [
4217
+ "AA",
4218
+ "TATC"
4219
+ ],
4220
+ [
4221
+ "AAC",
4222
+ "TAA"
4223
+ ],
4224
+ [
4225
+ "▁C",
4226
+ "GT"
4227
+ ],
4228
+ [
4229
+ "ATC",
4230
+ "GT"
4231
+ ],
4232
+ [
4233
+ "AA",
4234
+ "GTGG"
4235
+ ],
4236
+ [
4237
+ "▁",
4238
+ "ATAA"
4239
+ ],
4240
+ [
4241
+ "TCG",
4242
+ "ACC"
4243
+ ],
4244
+ [
4245
+ "TAG",
4246
+ "TC"
4247
+ ],
4248
+ [
4249
+ "AAC",
4250
+ "AGC"
4251
+ ],
4252
+ [
4253
+ "▁G",
4254
+ "TG"
4255
+ ],
4256
+ [
4257
+ "TTC",
4258
+ "AC"
4259
+ ],
4260
+ [
4261
+ "ATG",
4262
+ "TGG"
4263
+ ],
4264
+ [
4265
+ "ATG",
4266
+ "TAC"
4267
+ ],
4268
+ [
4269
+ "TTC",
4270
+ "TGC"
4271
+ ],
4272
+ [
4273
+ "AA",
4274
+ "ATCG"
4275
+ ],
4276
+ [
4277
+ "AA",
4278
+ "TAGG"
4279
+ ],
4280
+ [
4281
+ "TTG",
4282
+ "ACC"
4283
+ ],
4284
+ [
4285
+ "AA",
4286
+ "TCGG"
4287
+ ],
4288
+ [
4289
+ "AC",
4290
+ "TGCC"
4291
+ ],
4292
+ [
4293
+ "AT",
4294
+ "AAGG"
4295
+ ],
4296
+ [
4297
+ "▁",
4298
+ "CCCG"
4299
+ ],
4300
+ [
4301
+ "▁C",
4302
+ "AAAA"
4303
+ ],
4304
+ [
4305
+ "AT",
4306
+ "ATGC"
4307
+ ],
4308
+ [
4309
+ "CCG",
4310
+ "TC"
4311
+ ],
4312
+ [
4313
+ "GGC",
4314
+ "TG"
4315
+ ],
4316
+ [
4317
+ "AC",
4318
+ "AGCC"
4319
+ ],
4320
+ [
4321
+ "AG",
4322
+ "ACCG"
4323
+ ],
4324
+ [
4325
+ "TT",
4326
+ "TGCC"
4327
+ ],
4328
+ [
4329
+ "▁",
4330
+ "ACGG"
4331
+ ],
4332
+ [
4333
+ "ATT",
4334
+ "TCC"
4335
+ ],
4336
+ [
4337
+ "ATC",
4338
+ "TCC"
4339
+ ],
4340
+ [
4341
+ "AT",
4342
+ "ACCG"
4343
+ ],
4344
+ [
4345
+ "TCG",
4346
+ "AGG"
4347
+ ],
4348
+ [
4349
+ "TCG",
4350
+ "AAC"
4351
+ ],
4352
+ [
4353
+ "▁GC",
4354
+ "GG"
4355
+ ],
4356
+ [
4357
+ "AGC",
4358
+ "ACC"
4359
+ ],
4360
+ [
4361
+ "GTGC",
4362
+ "GC"
4363
+ ],
4364
+ [
4365
+ "AT",
4366
+ "AACG"
4367
+ ],
4368
+ [
4369
+ "▁",
4370
+ "AGTG"
4371
+ ],
4372
+ [
4373
+ "TAA",
4374
+ "CCC"
4375
+ ],
4376
+ [
4377
+ "TT",
4378
+ "AACC"
4379
+ ],
4380
+ [
4381
+ "AC",
4382
+ "ACCC"
4383
+ ],
4384
+ [
4385
+ "AA",
4386
+ "ATTC"
4387
+ ],
4388
+ [
4389
+ "▁G",
4390
+ "AAAA"
4391
+ ],
4392
+ [
4393
+ "ATC",
4394
+ "GGC"
4395
+ ],
4396
+ [
4397
+ "TG",
4398
+ "TAT"
4399
+ ],
4400
+ [
4401
+ "AA",
4402
+ "ATTG"
4403
+ ],
4404
+ [
4405
+ "AG",
4406
+ "TCCC"
4407
+ ],
4408
+ [
4409
+ "AAC",
4410
+ "TCC"
4411
+ ],
4412
+ [
4413
+ "AGC",
4414
+ "ATT"
4415
+ ],
4416
+ [
4417
+ "TG",
4418
+ "ACGG"
4419
+ ],
4420
+ [
4421
+ "AA",
4422
+ "TGGC"
4423
+ ],
4424
+ [
4425
+ "AG",
4426
+ "TACC"
4427
+ ],
4428
+ [
4429
+ "▁",
4430
+ "ATTG"
4431
+ ],
4432
+ [
4433
+ "GT",
4434
+ "AAAA"
4435
+ ],
4436
+ [
4437
+ "AAG",
4438
+ "ATT"
4439
+ ],
4440
+ [
4441
+ "AA",
4442
+ "TATG"
4443
+ ],
4444
+ [
4445
+ "AG",
4446
+ "AAGG"
4447
+ ],
4448
+ [
4449
+ "AAG",
4450
+ "ATG"
4451
+ ],
4452
+ [
4453
+ "▁",
4454
+ "TAGC"
4455
+ ],
4456
+ [
4457
+ "AT",
4458
+ "AATT"
4459
+ ],
4460
+ [
4461
+ "▁C",
4462
+ "TTC"
4463
+ ],
4464
+ [
4465
+ "AAG",
4466
+ "AGG"
4467
+ ],
4468
+ [
4469
+ "▁C",
4470
+ "TAG"
4471
+ ],
4472
+ [
4473
+ "AG",
4474
+ "CCCG"
4475
+ ],
4476
+ [
4477
+ "TAC",
4478
+ "TC"
4479
+ ],
4480
+ [
4481
+ "AGC",
4482
+ "TGG"
4483
+ ],
4484
+ [
4485
+ "▁G",
4486
+ "ACC"
4487
+ ],
4488
+ [
4489
+ "▁",
4490
+ "GCCG"
4491
+ ],
4492
+ [
4493
+ "TG",
4494
+ "ACGC"
4495
+ ],
4496
+ [
4497
+ "ATC",
4498
+ "TGG"
4499
+ ],
4500
+ [
4501
+ "▁G",
4502
+ "ATT"
4503
+ ],
4504
+ [
4505
+ "AC",
4506
+ "AGAC"
4507
+ ],
4508
+ [
4509
+ "▁",
4510
+ "AACG"
4511
+ ],
4512
+ [
4513
+ "ACG",
4514
+ "TTC"
4515
+ ],
4516
+ [
4517
+ "AGC",
4518
+ "TAA"
4519
+ ],
4520
+ [
4521
+ "AG",
4522
+ "TCGC"
4523
+ ],
4524
+ [
4525
+ "AGG",
4526
+ "TGC"
4527
+ ],
4528
+ [
4529
+ "TATT",
4530
+ "GC"
4531
+ ],
4532
+ [
4533
+ "AAG",
4534
+ "ATC"
4535
+ ],
4536
+ [
4537
+ "GGG",
4538
+ "AC"
4539
+ ],
4540
+ [
4541
+ "TG",
4542
+ "ACCC"
4543
+ ],
4544
+ [
4545
+ "AA",
4546
+ "TCCG"
4547
+ ],
4548
+ [
4549
+ "TATC",
4550
+ "GG"
4551
+ ],
4552
+ [
4553
+ "CCC",
4554
+ "TT"
4555
+ ],
4556
+ [
4557
+ "▁",
4558
+ "TAAG"
4559
+ ],
4560
+ [
4561
+ "▁G",
4562
+ "AAC"
4563
+ ],
4564
+ [
4565
+ "AG",
4566
+ "TCGG"
4567
+ ],
4568
+ [
4569
+ "GGC",
4570
+ "GCC"
4571
+ ],
4572
+ [
4573
+ "TCG",
4574
+ "AGC"
4575
+ ],
4576
+ [
4577
+ "▁",
4578
+ "TGAC"
4579
+ ],
4580
+ [
4581
+ "▁",
4582
+ "AGAA"
4583
+ ],
4584
+ [
4585
+ "AG",
4586
+ "AACG"
4587
+ ],
4588
+ [
4589
+ "GGC",
4590
+ "AC"
4591
+ ],
4592
+ [
4593
+ "AG",
4594
+ "AGAC"
4595
+ ],
4596
+ [
4597
+ "TTC",
4598
+ "TCC"
4599
+ ],
4600
+ [
4601
+ "TG",
4602
+ "AACC"
4603
+ ],
4604
+ [
4605
+ "AG",
4606
+ "TTGC"
4607
+ ],
4608
+ [
4609
+ "TGC",
4610
+ "AC"
4611
+ ],
4612
+ [
4613
+ "▁C",
4614
+ "ACC"
4615
+ ],
4616
+ [
4617
+ "▁",
4618
+ "TCAC"
4619
+ ],
4620
+ [
4621
+ "GGCC",
4622
+ "CC"
4623
+ ],
4624
+ [
4625
+ "GCC",
4626
+ "TC"
4627
+ ],
4628
+ [
4629
+ "AAC",
4630
+ "AAAA"
4631
+ ],
4632
+ [
4633
+ "AGC",
4634
+ "AGG"
4635
+ ],
4636
+ [
4637
+ "GTGG",
4638
+ "GC"
4639
+ ],
4640
+ [
4641
+ "▁",
4642
+ "TTTC"
4643
+ ],
4644
+ [
4645
+ "ACG",
4646
+ "ATG"
4647
+ ],
4648
+ [
4649
+ "TCG",
4650
+ "ATC"
4651
+ ],
4652
+ [
4653
+ "TATT",
4654
+ "CC"
4655
+ ],
4656
+ [
4657
+ "ATT",
4658
+ "CCC"
4659
+ ],
4660
+ [
4661
+ "AG",
4662
+ "TAAC"
4663
+ ],
4664
+ [
4665
+ "TAGG",
4666
+ "GC"
4667
+ ],
4668
+ [
4669
+ "AT",
4670
+ "AGTC"
4671
+ ],
4672
+ [
4673
+ "AG",
4674
+ "AGGC"
4675
+ ],
4676
+ [
4677
+ "TTC",
4678
+ "GT"
4679
+ ],
4680
+ [
4681
+ "TGC",
4682
+ "TT"
4683
+ ],
4684
+ [
4685
+ "▁C",
4686
+ "GGC"
4687
+ ],
4688
+ [
4689
+ "AT",
4690
+ "ATAC"
4691
+ ],
4692
+ [
4693
+ "GGCC",
4694
+ "GC"
4695
+ ],
4696
+ [
4697
+ "AT",
4698
+ "AGGC"
4699
+ ],
4700
+ [
4701
+ "TC",
4702
+ "TAT"
4703
+ ],
4704
+ [
4705
+ "AGC",
4706
+ "AGC"
4707
+ ],
4708
+ [
4709
+ "TG",
4710
+ "AGCC"
4711
+ ],
4712
+ [
4713
+ "AAC",
4714
+ "AGG"
4715
+ ],
4716
+ [
4717
+ "GTGG",
4718
+ "GG"
4719
+ ],
4720
+ [
4721
+ "TAG",
4722
+ "CCC"
4723
+ ],
4724
+ [
4725
+ "GGCC",
4726
+ "GG"
4727
+ ],
4728
+ [
4729
+ "TG",
4730
+ "TGCC"
4731
+ ],
4732
+ [
4733
+ "AA",
4734
+ "TTTT"
4735
+ ],
4736
+ [
4737
+ "TC",
4738
+ "AAAA"
4739
+ ],
4740
+ [
4741
+ "T",
4742
+ "ACCCG"
4743
+ ],
4744
+ [
4745
+ "AG",
4746
+ "ATGC"
4747
+ ],
4748
+ [
4749
+ "AC",
4750
+ "AAAG"
4751
+ ],
4752
+ [
4753
+ "ATG",
4754
+ "AGG"
4755
+ ],
4756
+ [
4757
+ "AA",
4758
+ "TACG"
4759
+ ],
4760
+ [
4761
+ "▁",
4762
+ "AGAG"
4763
+ ],
4764
+ [
4765
+ "TTG",
4766
+ "ACG"
4767
+ ],
4768
+ [
4769
+ "TTG",
4770
+ "AGG"
4771
+ ],
4772
+ [
4773
+ "ACC",
4774
+ "TAG"
4775
+ ],
4776
+ [
4777
+ "TG",
4778
+ "CCCG"
4779
+ ],
4780
+ [
4781
+ "TT",
4782
+ "AAAC"
4783
+ ],
4784
+ [
4785
+ "AC",
4786
+ "AAGC"
4787
+ ],
4788
+ [
4789
+ "AC",
4790
+ "GTGC"
4791
+ ],
4792
+ [
4793
+ "TTC",
4794
+ "TGG"
4795
+ ],
4796
+ [
4797
+ "ATG",
4798
+ "T"
4799
+ ],
4800
+ [
4801
+ "ACC",
4802
+ "AGG"
4803
+ ],
4804
+ [
4805
+ "TTG",
4806
+ "AAC"
4807
+ ],
4808
+ [
4809
+ "ATC",
4810
+ "TAA"
4811
+ ],
4812
+ [
4813
+ "▁",
4814
+ "TATG"
4815
+ ],
4816
+ [
4817
+ "ACC",
4818
+ "AGC"
4819
+ ],
4820
+ [
4821
+ "ATT",
4822
+ "TGC"
4823
+ ],
4824
+ [
4825
+ "ATT",
4826
+ "TAC"
4827
+ ],
4828
+ [
4829
+ "AAAG",
4830
+ "AAAA"
4831
+ ],
4832
+ [
4833
+ "TC",
4834
+ "TACG"
4835
+ ],
4836
+ [
4837
+ "▁",
4838
+ "TATC"
4839
+ ],
4840
+ [
4841
+ "AG",
4842
+ "TAGC"
4843
+ ],
4844
+ [
4845
+ "AG",
4846
+ "TTCC"
4847
+ ],
4848
+ [
4849
+ "GGC",
4850
+ "TT"
4851
+ ],
4852
+ [
4853
+ "▁",
4854
+ "ATCG"
4855
+ ],
4856
+ [
4857
+ "GGG",
4858
+ "CCC"
4859
+ ],
4860
+ [
4861
+ "AC",
4862
+ "AATC"
4863
+ ],
4864
+ [
4865
+ "ACC",
4866
+ "T"
4867
+ ],
4868
+ [
4869
+ "ATC",
4870
+ "AAC"
4871
+ ],
4872
+ [
4873
+ "▁",
4874
+ "TGTC"
4875
+ ],
4876
+ [
4877
+ "AG",
4878
+ "AATC"
4879
+ ],
4880
+ [
4881
+ "ATC",
4882
+ "A"
4883
+ ],
4884
+ [
4885
+ "TG",
4886
+ "TCCC"
4887
+ ],
4888
+ [
4889
+ "ACC",
4890
+ "TTC"
4891
+ ],
4892
+ [
4893
+ "ACG",
4894
+ "TCG"
4895
+ ],
4896
+ [
4897
+ "ATC",
4898
+ "T"
4899
+ ],
4900
+ [
4901
+ "AA",
4902
+ "GGCG"
4903
+ ],
4904
+ [
4905
+ "TG",
4906
+ "AAGC"
4907
+ ],
4908
+ [
4909
+ "AGG",
4910
+ "TCC"
4911
+ ],
4912
+ [
4913
+ "AGG",
4914
+ "TAC"
4915
+ ],
4916
+ [
4917
+ "TC",
4918
+ "ACTG"
4919
+ ],
4920
+ [
4921
+ "▁",
4922
+ "AGCG"
4923
+ ],
4924
+ [
4925
+ "AA",
4926
+ "TGCG"
4927
+ ],
4928
+ [
4929
+ "TGG",
4930
+ "CCC"
4931
+ ],
4932
+ [
4933
+ "AAC",
4934
+ "ATG"
4935
+ ],
4936
+ [
4937
+ "AAG",
4938
+ "ACG"
4939
+ ],
4940
+ [
4941
+ "TT",
4942
+ "TACC"
4943
+ ],
4944
+ [
4945
+ "TT",
4946
+ "GTCC"
4947
+ ],
4948
+ [
4949
+ "T",
4950
+ "AAAAAAAA"
4951
+ ],
4952
+ [
4953
+ "AC",
4954
+ "TACC"
4955
+ ],
4956
+ [
4957
+ "AAC",
4958
+ "TAG"
4959
+ ],
4960
+ [
4961
+ "CCG",
4962
+ "TG"
4963
+ ],
4964
+ [
4965
+ "TT",
4966
+ "AGCC"
4967
+ ],
4968
+ [
4969
+ "TT",
4970
+ "ACCC"
4971
+ ],
4972
+ [
4973
+ "AAG",
4974
+ "A"
4975
+ ],
4976
+ [
4977
+ "ATG",
4978
+ "TAA"
4979
+ ],
4980
+ [
4981
+ "TGG",
4982
+ "GCC"
4983
+ ],
4984
+ [
4985
+ "AGG",
4986
+ "T"
4987
+ ],
4988
+ [
4989
+ "GGG",
4990
+ "TG"
4991
+ ],
4992
+ [
4993
+ "AT",
4994
+ "AAAT"
4995
+ ],
4996
+ [
4997
+ "AT",
4998
+ "AGTG"
4999
+ ],
5000
+ [
5001
+ "AC",
5002
+ "ATCG"
5003
+ ],
5004
+ [
5005
+ "ATG",
5006
+ "A"
5007
+ ],
5008
+ [
5009
+ "AG",
5010
+ "TTGG"
5011
+ ],
5012
+ [
5013
+ "AT",
5014
+ "GGCG"
5015
+ ],
5016
+ [
5017
+ "AG",
5018
+ "TCCG"
5019
+ ],
5020
+ [
5021
+ "AGC",
5022
+ "TAG"
5023
+ ],
5024
+ [
5025
+ "AG",
5026
+ "ATGG"
5027
+ ],
5028
+ [
5029
+ "AT",
5030
+ "ATGG"
5031
+ ],
5032
+ [
5033
+ "ATC",
5034
+ "ATC"
5035
+ ],
5036
+ [
5037
+ "TG",
5038
+ "AAAC"
5039
+ ],
5040
+ [
5041
+ "▁",
5042
+ "TCGG"
5043
+ ],
5044
+ [
5045
+ "TCC",
5046
+ "CCC"
5047
+ ],
5048
+ [
5049
+ "TT",
5050
+ "TCACTGCAGAC"
5051
+ ],
5052
+ [
5053
+ "AG",
5054
+ "AATG"
5055
+ ],
5056
+ [
5057
+ "TTC",
5058
+ "ACTG"
5059
+ ],
5060
+ [
5061
+ "AGG",
5062
+ "GGC"
5063
+ ],
5064
+ [
5065
+ "TAT",
5066
+ "CCC"
5067
+ ],
5068
+ [
5069
+ "TT",
5070
+ "TCCC"
5071
+ ],
5072
+ [
5073
+ "ATT",
5074
+ "GGC"
5075
+ ],
5076
+ [
5077
+ "ATT",
5078
+ "TGG"
5079
+ ],
5080
+ [
5081
+ "CCG",
5082
+ "CCC"
5083
+ ],
5084
+ [
5085
+ "ATT",
5086
+ "TAA"
5087
+ ],
5088
+ [
5089
+ "TTC",
5090
+ "TAC"
5091
+ ],
5092
+ [
5093
+ "TC",
5094
+ "GTCC"
5095
+ ],
5096
+ [
5097
+ "ATT",
5098
+ "GT"
5099
+ ],
5100
+ [
5101
+ "AAC",
5102
+ "TGG"
5103
+ ],
5104
+ [
5105
+ "AC",
5106
+ "GTGG"
5107
+ ],
5108
+ [
5109
+ "AT",
5110
+ "ATCG"
5111
+ ],
5112
+ [
5113
+ "ACC",
5114
+ "ATG"
5115
+ ],
5116
+ [
5117
+ "AAC",
5118
+ "A"
5119
+ ],
5120
+ [
5121
+ "ATC",
5122
+ "GCG"
5123
+ ],
5124
+ [
5125
+ "ACC",
5126
+ "GCG"
5127
+ ],
5128
+ [
5129
+ "▁",
5130
+ "TTGG"
5131
+ ],
5132
+ [
5133
+ "▁C",
5134
+ "AGC"
5135
+ ],
5136
+ [
5137
+ "TAGG",
5138
+ "GG"
5139
+ ],
5140
+ [
5141
+ "▁",
5142
+ "TTCC"
5143
+ ],
5144
+ [
5145
+ "AC",
5146
+ "AAGG"
5147
+ ],
5148
+ [
5149
+ "TG",
5150
+ "TCGC"
5151
+ ],
5152
+ [
5153
+ "AC",
5154
+ "ATGC"
5155
+ ],
5156
+ [
5157
+ "AAG",
5158
+ "TTC"
5159
+ ]
5160
+ ]
5161
+ }
5162
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<|endoftext|>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<unk>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "<pad>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ }
27
+ },
28
+ "bos_token": "<|endoftext|>",
29
+ "clean_tokenization_spaces": true,
30
+ "clean_up_tokenization_spaces": false,
31
+ "eos_token": "<|endoftext|>",
32
+ "extra_special_tokens": {},
33
+ "model_max_length": 13,
34
+ "pad_token": "<pad>",
35
+ "padding_side": "right",
36
+ "return_tensors": "pt",
37
+ "tokenizer_class": "PreTrainedTokenizerFast",
38
+ "truncation_side": "right",
39
+ "unk_token": "<unk>"
40
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc63f9abc0fdf882e2c78d5582a1e0cf74eb8a3a3c0a544ebb379c6bf405220
3
+ size 5304