From 0452d344074485d0e7eb5d5c12447b7c9dbc9619 Mon Sep 17 00:00:00 2001 From: Yih-Dar SHIEH Date: Wed, 23 Nov 2022 18:52:13 +0000 Subject: [PATCH] Upload tiny models for CLIPModel --- config.json | 171 ++++ merges.txt | 727 +++++++++++++++ preprocessor_config.json | 27 + pytorch_model.bin | 3 + special_tokens_map.json | 24 + tf_model.h5 | 3 + tokenizer.json | 1843 ++++++++++++++++++++++++++++++++++++++ tokenizer_config.json | 34 + vocab.json | 1026 +++++++++++++++++++++ 9 files changed, 3858 insertions(+) create mode 100644 config.json create mode 100644 merges.txt create mode 100644 preprocessor_config.json create mode 100644 pytorch_model.bin create mode 100644 special_tokens_map.json create mode 100644 tf_model.h5 create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 vocab.json diff --git a/config.json b/config.json new file mode 100644 index 0000000..2bb7a35 --- /dev/null +++ b/config.json @@ -0,0 +1,171 @@ +{ + "_commit_hash": null, + "_name_or_path": "temp/dummy/clip/CLIPModel", + "architectures": [ + "CLIPModel" + ], + "bos_token_id": 0, + "eos_token_id": 1, + "initializer_factor": 1.0, + "logit_scale_init_value": 2.6592, + "model_type": "clip", + "pad_token_id": 1, + "projection_dim": 64, + "text_config": { + "_name_or_path": "", + "add_cross_attention": false, + "architectures": null, + "attention_dropout": 0.1, + "bad_words_ids": null, + "begin_suppress_tokens": null, + "bos_token_id": 0, + "chunk_size_feed_forward": 0, + "cross_attention_hidden_size": null, + "decoder_start_token_id": null, + "diversity_penalty": 0.0, + "do_sample": false, + "dropout": 0.1, + "early_stopping": false, + "encoder_no_repeat_ngram_size": 0, + "eos_token_id": 2, + "exponential_decay_length_penalty": null, + "finetuning_task": null, + "forced_bos_token_id": null, + "forced_eos_token_id": null, + "hidden_act": "quick_gelu", + "hidden_size": 32, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1" + }, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 37, + "is_decoder": false, + "is_encoder_decoder": false, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1 + }, + "layer_norm_eps": 1e-05, + "length_penalty": 1.0, + "max_length": 20, + "max_position_embeddings": 512, + "min_length": 0, + "model_type": "clip_text_model", + "no_repeat_ngram_size": 0, + "num_attention_heads": 4, + "num_beam_groups": 1, + "num_beams": 1, + "num_hidden_layers": 5, + "num_return_sequences": 1, + "output_attentions": false, + "output_hidden_states": false, + "output_scores": false, + "pad_token_id": 1, + "prefix": null, + "problem_type": null, + "projection_dim": 32, + "pruned_heads": {}, + "remove_invalid_values": false, + "repetition_penalty": 1.0, + "return_dict": true, + "return_dict_in_generate": false, + "sep_token_id": null, + "suppress_tokens": null, + "task_specific_params": null, + "temperature": 1.0, + "tf_legacy_loss": false, + "tie_encoder_decoder": false, + "tie_word_embeddings": true, + "tokenizer_class": null, + "top_k": 50, + "top_p": 1.0, + "torch_dtype": null, + "torchscript": false, + "transformers_version": "4.25.0.dev0", + "typical_p": 1.0, + "use_bfloat16": false, + "vocab_size": 1024 + }, + "torch_dtype": "float32", + "transformers_version": null, + "vision_config": { + "_name_or_path": "", + "add_cross_attention": false, + "architectures": null, + "attention_dropout": 0.1, + "bad_words_ids": null, + "begin_suppress_tokens": null, + "bos_token_id": null, + "chunk_size_feed_forward": 0, + "cross_attention_hidden_size": null, + "decoder_start_token_id": null, + "diversity_penalty": 0.0, + "do_sample": false, + "dropout": 0.1, + "early_stopping": false, + "encoder_no_repeat_ngram_size": 0, + "eos_token_id": null, + "exponential_decay_length_penalty": null, + "finetuning_task": null, + "forced_bos_token_id": null, + "forced_eos_token_id": null, + "hidden_act": "quick_gelu", + "hidden_size": 32, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1" + }, + "image_size": 30, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 37, + "is_decoder": false, + "is_encoder_decoder": false, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1 + }, + "layer_norm_eps": 1e-05, + "length_penalty": 1.0, + "max_length": 20, + "min_length": 0, + "model_type": "clip_vision_model", + "no_repeat_ngram_size": 0, + "num_attention_heads": 4, + "num_beam_groups": 1, + "num_beams": 1, + "num_channels": 3, + "num_hidden_layers": 5, + "num_return_sequences": 1, + "output_attentions": false, + "output_hidden_states": false, + "output_scores": false, + "pad_token_id": null, + "patch_size": 2, + "prefix": null, + "problem_type": null, + "projection_dim": 32, + "pruned_heads": {}, + "remove_invalid_values": false, + "repetition_penalty": 1.0, + "return_dict": true, + "return_dict_in_generate": false, + "sep_token_id": null, + "suppress_tokens": null, + "task_specific_params": null, + "temperature": 1.0, + "tf_legacy_loss": false, + "tie_encoder_decoder": false, + "tie_word_embeddings": true, + "tokenizer_class": null, + "top_k": 50, + "top_p": 1.0, + "torch_dtype": null, + "torchscript": false, + "transformers_version": "4.25.0.dev0", + "typical_p": 1.0, + "use_bfloat16": false + } +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..6a7d865 --- /dev/null +++ b/merges.txt @@ -0,0 +1,727 @@ +#version: 0.2 +t h +th e +i n +a n +e d +e r +r e +a r +t i +o n +e n +o f +o r +an d +e r +o n +i n +in g +s t +r o +a l +i t +t o +a s +a t +e s +o u +h i +a c +s i +a t +r i +a l +e l +a n +a m +o r +s t +l i +u r +e c +o m +d i +w as +l y +e n +e a +c h +u n +ti on +l a +i s +f i +o l +d e +- @ +@ -@ +r a +v i +l e +l o +s h +e m +b e +th at +' s +c on +m a +f or +h a +s u +b y +it h +v e +w ith +s e +c h +th e +en t +p o +c e +i l +s e +en t +l e +c om +s p +er e +p ro +n o +b u +w h +i t +t h +v er +n e +c a +i s +f or +a g +er s +m o +g h +f ro +t ed +fro m +ti on +o p +hi s +a d +a b +i c +h e +ou n +a s +t s +s c +d e +o w +e x +w hi +r u +t er +a p +d s +w ere +p re +d u +g u +p ar +i r +b o +th er +q u +l u +t er +t w +e s +re c +p er +t a +at e +v er +at ed +d ing +it y +m an +e ar +s ed +d ed +a u +al l +am e +c i +on e +in g +ar e +a f +i r +a tion +â Ģ +ha d +t r +u l +l d +whi ch +w a +i m +l ea +b e +t o +ti m +fi r +w or +on g +p or +m ar +m e +al ly +s o +ou t +tion s +it s +g h +g e +b er +f e +p u +s er +d er +p l +s s +in e +in c +m i +gh t +g o +th is +t ur +d a +ro u +bu t +u m +s on +w e +v ed +si on +k e +p la +the ir +i es +fir st +s a +o c +at t +o f +p e +no t +g i +n a +ar y +m u +l ed +âĢ ĵ +h er +r an +c o +the y +d er +al i +al so +or e +e p +ou ld +af ter +s hi +u s +e t +ti c +st or +w i +e v +o ther +s h +t ing +ar d +t e +tw o +n i +ha ve +ou r +com m +t e +ac k +o o +f in +s ec +ent s +h as +com p +b ec +k s +con t +l and +be en +en ce +k ing +e l +ag e +lo w +m in +. @ +@ .@ +om e +m ent +ch ar +g e +at er +n or +h o +ou s +wh o +ea r +sp ec +c ol +el y +t y +j o +ur ing +du c +b ri +st r +c an +or i +t ra +p a +sh e +d o +ti ve +m on +ne w +r it +tim e +on s +s o +m an +d ec +c ent +l an +p i +ou r +in ter +f er +g ra +g re +re s +inc lu +m il +d uring +ow n +pre s +j u +n ed +el l +, @ +@ ,@ +it e +g en +wh en +si g +b i +re n +f a +g a +pla y +en g +tion al +oun d +th ou +m ore +re e +em ber +e i +s ou +s ur +s ti +c ar +for m +l ar +s es +t en +in to +t u +c es +mo st +k ed +wa y +c re +c oun +u p +l es +ac e +al s +k e +w ould +an t +b er +f u +it ed +p ri +whi le +o ver +ing s +r e +fi l +s y +e st +ab le +w n +s ea +ac h +s ing +in s +ti c +i d +on ly +at es +t ri +v ing +b a +v el +an ce +st a +er n +f ol +e en +in ed +st ru +un i +g ame +la r +s el +b li +u sed +n ing +p s +ti es +k no +c or +f t +rec or +b le +vi e +y s +w il +ic al +ap p +t ro +th ree +c la +ol d +sh ed +h ea +ab out +w rit +th an +st e +l ater +ar i +d y +pu bli +lo c +ag a +th rou +s si +en d +ma y +an g +ac h +v es +o g +hi m +be tw +thou gh +betw een +u m +st ar +sc ri +re a +on d +shi p +o k +h el +s ong +c hi +ca p +e ver +da y +c ri +s ome +b ro +n o +th ere +an s +al l +n um +r ed +ear s +st s +an y +w ar +p h +p p +g in +stru c +am er +pro duc +s ch +c es +ur e +at ing +em p +t or +sea son +for e +i c +c ity +g ro +fol low +su b +b el +y ear +c an +s in +wh ere +an d +ma de +re lea +s m +b l +t en +wi th +s on +man y +a re +e d +h ow +amer ic +ur y +st u +mu si +c u +n am +em ent +su ch +al bu +bu il +be fore +e f +ar m +t on +the m +c al +b ar +d es +m at +gen er +o d +ser ies +c er +sh o +en ti +h er +o ver +an n +w ell +wor ld +g an +e st +sec ond +t ers +si de +tr an +l ine +tur e +por t +be ing +y ears +bo th +in di +the se +na tional +hi stor +f e +v o +st ed +an i +b as +po in +s ing +fil m +p en +su p +m is +c ro +st ri +l in +t re +wa r +how ever +y ing +l ing +y p +ec ted +di rec +vi sion +albu m +th en +l l +se ver +throu gh +kno wn +b or +c ul +c lu +st er +sou th +r y +ec t +lo w +p r +s k +is o +nor th +par t +f ac +t ly +per i +e u +b att +st ate +c ed +con si +in f +po li +ol og +ear ly +po si +am es +w in +de vel +o b +v e +v en +op er +g er +of fi +char ac +m s +hi gh +a d +th o +sever al +d re +de scri +al e +num ber +a ir +inclu ding +in st +aga inst +l s +su l +ep iso +c am +di f +so ci +bec ame +li ke +t el +f our +âĢ Ķ +h ou +jo h +un ited +in v +un der +no v +ti v +su c +a tions +ac k +t or +r on +un d +w s +f o +g r +devel op +al though +cont in +we st +ori gin +musi c +or s +d on +cent ury +w ard +wor k +m e +am i +ch a +ver y +h ar +di s +z ed +d o +g s +t ow +s ol +follow ing +li on +re ma +n s +ti sh +ch ur +s om +m p +t le +go ver +d el +comp le +c ur +u se +b ack +h u +st ern +be gan +fi el +au se +d ra +p as +b il +ca tion +d ent +b ed +bec ause +an t +ea m +p hi +y o +contin u +ta in +tr y +f re +pe op +cal led +f ound +episo de +de sig +m or +se t +le y +ea st +tr ac +c ra diff --git a/preprocessor_config.json b/preprocessor_config.json new file mode 100644 index 0000000..ea6c8ed --- /dev/null +++ b/preprocessor_config.json @@ -0,0 +1,27 @@ +{ + "crop_size": { + "height": 30, + "width": 30 + }, + "do_center_crop": true, + "do_convert_rgb": true, + "do_normalize": true, + "do_rescale": true, + "do_resize": true, + "image_mean": [ + 0.48145466, + 0.4578275, + 0.40821073 + ], + "image_processor_type": "CLIPImageProcessor", + "image_std": [ + 0.26862954, + 0.26130258, + 0.27577711 + ], + "resample": 3, + "rescale_factor": 0.00392156862745098, + "size": { + "shortest_edge": 30 + } +} diff --git a/pytorch_model.bin b/pytorch_model.bin new file mode 100644 index 0000000..bc46990 --- /dev/null +++ b/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0ce4dd8f7b4bd5fd35cec79eb5bfdd153357d0dea5a7b109a63294468e64d8 +size 578637 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..2c2130b --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,24 @@ +{ + "bos_token": { + "content": "<|startoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "pad_token": "<|endoftext|>", + "unk_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + } +} diff --git a/tf_model.h5 b/tf_model.h5 new file mode 100644 index 0000000..7eb2fcd --- /dev/null +++ b/tf_model.h5 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7714fee94709ec380e321fd721c26b740f7f1e6740b4e87e54ead6d42d3daee0 +size 722684 diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..5283a2c --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,1843 @@ +{ + "version": "1.0", + "truncation": null, + "padding": null, + "added_tokens": [ + { + "id": 0, + "content": "<|startoftext|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": true + }, + { + "id": 1, + "content": "<|endoftext|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + } + ], + "normalizer": { + "type": "Sequence", + "normalizers": [ + { + "type": "NFC" + }, + { + "type": "Replace", + "pattern": { + "Regex": "\\s+" + }, + "content": " " + }, + { + "type": "Lowercase" + } + ] + }, + "pre_tokenizer": { + "type": "Sequence", + "pretokenizers": [ + { + "type": "Split", + "pattern": { + "Regex": "<\\|startoftext\\|>|<\\|endoftext\\|>|'s|'t|'re|'ve|'m|'ll|'d|[\\p{L}]+|[\\p{N}]|[^\\s\\p{L}\\p{N}]+" + }, + "behavior": "Removed", + "invert": true + }, + { + "type": "ByteLevel", + "add_prefix_space": false, + "trim_offsets": true, + "use_regex": true + } + ] + }, + "post_processor": { + "type": "RobertaProcessing", + "sep": [ + "<|endoftext|>", + 1 + ], + "cls": [ + "<|startoftext|>", + 0 + ], + "trim_offsets": false, + "add_prefix_space": false + }, + "decoder": { + "type": "ByteLevel", + "add_prefix_space": true, + "trim_offsets": true, + "use_regex": true + }, + "model": { + "type": "BPE", + "dropout": null, + "unk_token": "<|endoftext|>", + "continuing_subword_prefix": "", + "end_of_word_suffix": "", + "fuse_unk": false, + "vocab": { + "<|startoftext|>": 0, + "<|endoftext|>": 1, + "!": 2, + "\"": 3, + "#": 4, + "$": 5, + "%": 6, + "&": 7, + "'": 8, + "(": 9, + ")": 10, + "*": 11, + "+": 12, + ",": 13, + "-": 14, + ".": 15, + "/": 16, + "0": 17, + "1": 18, + "2": 19, + "3": 20, + "4": 21, + "5": 22, + "6": 23, + "7": 24, + "8": 25, + "9": 26, + ":": 27, + ";": 28, + "<": 29, + "=": 30, + ">": 31, + "?": 32, + "@": 33, + "[": 34, + "\\": 35, + "]": 36, + "^": 37, + "_": 38, + "`": 39, + "a": 40, + "b": 41, + "c": 42, + "d": 43, + "e": 44, + "f": 45, + "g": 46, + "h": 47, + "i": 48, + "j": 49, + "k": 50, + "l": 51, + "m": 52, + "n": 53, + "o": 54, + "p": 55, + "q": 56, + "r": 57, + "s": 58, + "t": 59, + "u": 60, + "v": 61, + "w": 62, + "x": 63, + "y": 64, + "z": 65, + "|": 66, + "}": 67, + "~": 68, + "¡": 69, + "¢": 70, + "£": 71, + "¤": 72, + "¥": 73, + "¦": 74, + "§": 75, + "¨": 76, + "©": 77, + "ª": 78, + "«": 79, + "¬": 80, + "®": 81, + "¯": 82, + "°": 83, + "±": 84, + "²": 85, + "³": 86, + "´": 87, + "µ": 88, + "¶": 89, + "·": 90, + "¸": 91, + "¹": 92, + "º": 93, + "»": 94, + "¼": 95, + "½": 96, + "¾": 97, + "¿": 98, + "Â": 99, + "Ã": 100, + "Ä": 101, + "Å": 102, + "Æ": 103, + "Ç": 104, + "È": 105, + "É": 106, + "Ê": 107, + "Ë": 108, + "Ì": 109, + "Í": 110, + "Î": 111, + "Ï": 112, + "Ð": 113, + "Ñ": 114, + "Ö": 115, + "×": 116, + "Ø": 117, + "Ù": 118, + "Ü": 119, + "à": 120, + "á": 121, + "â": 122, + "ã": 123, + "ä": 124, + "å": 125, + "æ": 126, + "ç": 127, + "è": 128, + "é": 129, + "ë": 130, + "ì": 131, + "ï": 132, + "Ģ": 133, + "ģ": 134, + "Ĥ": 135, + "ĥ": 136, + "Ħ": 137, + "ħ": 138, + "Ĩ": 139, + "ĩ": 140, + "Ī": 141, + "ī": 142, + "Ĭ": 143, + "ĭ": 144, + "Į": 145, + "į": 146, + "İ": 147, + "ı": 148, + "IJ": 149, + "ij": 150, + "Ĵ": 151, + "ĵ": 152, + "Ķ": 153, + "ķ": 154, + "ĸ": 155, + "Ĺ": 156, + "ĺ": 157, + "Ļ": 158, + "ļ": 159, + "Ľ": 160, + "ľ": 161, + "Ŀ": 162, + "ŀ": 163, + "Ł": 164, + "ł": 165, + "Ń": 166, + "d": 167, + "h": 168, + "y": 169, + "s": 170, + "e": 171, + "l": 172, + "m": 173, + "n": 174, + "g": 175, + "r": 176, + "¨": 177, + "c": 178, + "±": 179, + "t": 180, + "į": 181, + "o": 182, + "k": 183, + "a": 184, + "i": 185, + "u": 186, + "f": 187, + "©": 188, + "p": 189, + "¯": 190, + "¾": 191, + "¤": 192, + "z": 193, + "w": 194, + "Ĥ": 195, + "v": 196, + "ĩ": 197, + "»": 198, + "b": 199, + "x": 200, + "°": 201, + "ª": 202, + "j": 203, + "º": 204, + "«": 205, + "¡": 206, + "¹": 207, + "ĥ": 208, + "Ĭ": 209, + "q": 210, + "·": 211, + "¥": 212, + "Ń": 213, + "¶": 214, + "¦": 215, + "IJ": 216, + "¸": 217, + "9": 218, + "Į": 219, + "Ł": 220, + "¢": 221, + "ı": 222, + "'": 223, + "¼": 224, + "µ": 225, + "§": 226, + "}": 227, + ";": 228, + "Ķ": 229, + "Ĺ": 230, + "@": 231, + "¬": 232, + "Ļ": 233, + "Ĵ": 234, + "³": 235, + ".": 236, + "ĺ": 237, + "Ĩ": 238, + "Ħ": 239, + "8": 240, + "ł": 241, + "ķ": 242, + "£": 243, + "ŀ": 244, + "Ŀ": 245, + "²": 246, + "-": 247, + "®": 248, + "¿": 249, + "ļ": 250, + "ľ": 251, + "Ģ": 252, + "ī": 253, + "Ľ": 254, + "%": 255, + "Ī": 256, + "´": 257, + "&": 258, + "ĭ": 259, + "ģ": 260, + "İ": 261, + "ij": 262, + "ĵ": 263, + "=": 264, + "<": 265, + "ĸ": 266, + "`": 267, + "|": 268, + "_": 269, + "ħ": 270, + "½": 271, + "/": 272, + ">": 273, + "$": 274, + "5": 275, + ",": 276, + "!": 277, + "]": 278, + ")": 279, + "7": 280, + "\"": 281, + "^": 282, + "[": 283, + "4": 284, + "0": 285, + "2": 286, + "~": 287, + "#": 288, + "(": 289, + "6": 290, + "3": 291, + ":": 292, + "1": 293, + "+": 294, + "*": 295, + "?": 296, + "\\": 297, + "th": 298, + "the": 299, + "in": 300, + "an": 301, + "ed": 302, + "er": 303, + "re": 304, + "ar": 305, + "ti": 306, + "on": 307, + "en": 308, + "of": 309, + "or": 310, + "and": 311, + "er": 312, + "on": 313, + "in": 314, + "ing": 315, + "st": 316, + "ro": 317, + "al": 318, + "it": 319, + "to": 320, + "as": 321, + "at": 322, + "es": 323, + "ou": 324, + "hi": 325, + "ac": 326, + "si": 327, + "at": 328, + "ri": 329, + "al": 330, + "el": 331, + "an": 332, + "am": 333, + "or": 334, + "st": 335, + "li": 336, + "ur": 337, + "ec": 338, + "om": 339, + "di": 340, + "was": 341, + "ly": 342, + "en": 343, + "ea": 344, + "ch": 345, + "un": 346, + "tion": 347, + "la": 348, + "is": 349, + "fi": 350, + "ol": 351, + "de": 352, + "-@": 353, + "@-@": 354, + "ra": 355, + "vi": 356, + "le": 357, + "lo": 358, + "sh": 359, + "em": 360, + "be": 361, + "that": 362, + "'s": 363, + "con": 364, + "ma": 365, + "for": 366, + "ha": 367, + "su": 368, + "by": 369, + "ith": 370, + "ve": 371, + "with": 372, + "se": 373, + "ch": 374, + "the": 375, + "ent": 376, + "po": 377, + "ce": 378, + "il": 379, + "se": 380, + "ent": 381, + "le": 382, + "com": 383, + "sp": 384, + "ere": 385, + "pro": 386, + "no": 387, + "bu": 388, + "wh": 389, + "it": 390, + "th": 391, + "ver": 392, + "ne": 393, + "ca": 394, + "is": 395, + "for": 396, + "ag": 397, + "ers": 398, + "mo": 399, + "gh": 400, + "fro": 401, + "ted": 402, + "from": 403, + "tion": 404, + "op": 405, + "his": 406, + "ad": 407, + "ab": 408, + "ic": 409, + "he": 410, + "oun": 411, + "as": 412, + "ts": 413, + "sc": 414, + "de": 415, + "ow": 416, + "ex": 417, + "whi": 418, + "ru": 419, + "ter": 420, + "ap": 421, + "ds": 422, + "were": 423, + "pre": 424, + "du": 425, + "gu": 426, + "par": 427, + "ir": 428, + "bo": 429, + "ther": 430, + "qu": 431, + "lu": 432, + "ter": 433, + "tw": 434, + "es": 435, + "rec": 436, + "per": 437, + "ta": 438, + "ate": 439, + "ver": 440, + "ated": 441, + "ding": 442, + "ity": 443, + "man": 444, + "ear": 445, + "sed": 446, + "ded": 447, + "au": 448, + "all": 449, + "ame": 450, + "ci": 451, + "one": 452, + "ing": 453, + "are": 454, + "af": 455, + "ir": 456, + "ation": 457, + "âĢ": 458, + "had": 459, + "tr": 460, + "ul": 461, + "ld": 462, + "which": 463, + "wa": 464, + "im": 465, + "lea": 466, + "be": 467, + "to": 468, + "tim": 469, + "fir": 470, + "wor": 471, + "ong": 472, + "por": 473, + "mar": 474, + "me": 475, + "ally": 476, + "so": 477, + "out": 478, + "tions": 479, + "its": 480, + "gh": 481, + "ge": 482, + "ber": 483, + "fe": 484, + "pu": 485, + "ser": 486, + "der": 487, + "pl": 488, + "ss": 489, + "ine": 490, + "inc": 491, + "mi": 492, + "ght": 493, + "go": 494, + "this": 495, + "tur": 496, + "da": 497, + "rou": 498, + "but": 499, + "um": 500, + "son": 501, + "we": 502, + "ved": 503, + "sion": 504, + "ke": 505, + "pla": 506, + "their": 507, + "ies": 508, + "first": 509, + "sa": 510, + "oc": 511, + "att": 512, + "of": 513, + "pe": 514, + "not": 515, + "gi": 516, + "na": 517, + "ary": 518, + "mu": 519, + "led": 520, + "âĢĵ": 521, + "her": 522, + "ran": 523, + "co": 524, + "they": 525, + "der": 526, + "ali": 527, + "also": 528, + "ore": 529, + "ep": 530, + "ould": 531, + "after": 532, + "shi": 533, + "us": 534, + "et": 535, + "tic": 536, + "stor": 537, + "wi": 538, + "ev": 539, + "other": 540, + "sh": 541, + "ting": 542, + "ard": 543, + "te": 544, + "two": 545, + "ni": 546, + "have": 547, + "our": 548, + "comm": 549, + "te": 550, + "ack": 551, + "oo": 552, + "fin": 553, + "sec": 554, + "ents": 555, + "has": 556, + "comp": 557, + "bec": 558, + "ks": 559, + "cont": 560, + "land": 561, + "been": 562, + "ence": 563, + "king": 564, + "el": 565, + "age": 566, + "low": 567, + "min": 568, + ".@": 569, + "@.@": 570, + "ome": 571, + "ment": 572, + "char": 573, + "ge": 574, + "ater": 575, + "nor": 576, + "ho": 577, + "ous": 578, + "who": 579, + "ear": 580, + "spec": 581, + "col": 582, + "ely": 583, + "ty": 584, + "jo": 585, + "uring": 586, + "duc": 587, + "bri": 588, + "str": 589, + "can": 590, + "ori": 591, + "tra": 592, + "pa": 593, + "she": 594, + "do": 595, + "tive": 596, + "mon": 597, + "new": 598, + "rit": 599, + "time": 600, + "ons": 601, + "so": 602, + "man": 603, + "dec": 604, + "cent": 605, + "lan": 606, + "pi": 607, + "our": 608, + "inter": 609, + "fer": 610, + "gra": 611, + "gre": 612, + "res": 613, + "inclu": 614, + "mil": 615, + "during": 616, + "own": 617, + "pres": 618, + "ju": 619, + "ned": 620, + "ell": 621, + ",@": 622, + "@,@": 623, + "ite": 624, + "gen": 625, + "when": 626, + "sig": 627, + "bi": 628, + "ren": 629, + "fa": 630, + "ga": 631, + "play": 632, + "eng": 633, + "tional": 634, + "ound": 635, + "thou": 636, + "more": 637, + "ree": 638, + "ember": 639, + "ei": 640, + "sou": 641, + "sur": 642, + "sti": 643, + "car": 644, + "form": 645, + "lar": 646, + "ses": 647, + "ten": 648, + "into": 649, + "tu": 650, + "ces": 651, + "most": 652, + "ked": 653, + "way": 654, + "cre": 655, + "coun": 656, + "up": 657, + "les": 658, + "ace": 659, + "als": 660, + "ke": 661, + "would": 662, + "ant": 663, + "ber": 664, + "fu": 665, + "ited": 666, + "pri": 667, + "while": 668, + "over": 669, + "ings": 670, + "re": 671, + "fil": 672, + "sy": 673, + "est": 674, + "able": 675, + "wn": 676, + "sea": 677, + "ach": 678, + "sing": 679, + "ins": 680, + "tic": 681, + "id": 682, + "only": 683, + "ates": 684, + "tri": 685, + "ving": 686, + "ba": 687, + "vel": 688, + "ance": 689, + "sta": 690, + "ern": 691, + "fol": 692, + "een": 693, + "ined": 694, + "stru": 695, + "uni": 696, + "game": 697, + "lar": 698, + "sel": 699, + "bli": 700, + "used": 701, + "ning": 702, + "ps": 703, + "ties": 704, + "kno": 705, + "cor": 706, + "ft": 707, + "recor": 708, + "ble": 709, + "vie": 710, + "ys": 711, + "wil": 712, + "ical": 713, + "app": 714, + "tro": 715, + "three": 716, + "cla": 717, + "old": 718, + "shed": 719, + "hea": 720, + "about": 721, + "writ": 722, + "than": 723, + "ste": 724, + "later": 725, + "ari": 726, + "dy": 727, + "publi": 728, + "loc": 729, + "aga": 730, + "throu": 731, + "ssi": 732, + "end": 733, + "may": 734, + "ang": 735, + "ach": 736, + "ves": 737, + "og": 738, + "him": 739, + "betw": 740, + "though": 741, + "between": 742, + "um": 743, + "star": 744, + "scri": 745, + "rea": 746, + "ond": 747, + "ship": 748, + "ok": 749, + "hel": 750, + "song": 751, + "chi": 752, + "cap": 753, + "ever": 754, + "day": 755, + "cri": 756, + "some": 757, + "bro": 758, + "no": 759, + "there": 760, + "ans": 761, + "all": 762, + "num": 763, + "red": 764, + "ears": 765, + "sts": 766, + "any": 767, + "war": 768, + "ph": 769, + "pp": 770, + "gin": 771, + "struc": 772, + "amer": 773, + "produc": 774, + "sch": 775, + "ces": 776, + "ure": 777, + "ating": 778, + "emp": 779, + "tor": 780, + "season": 781, + "fore": 782, + "ic": 783, + "city": 784, + "gro": 785, + "follow": 786, + "sub": 787, + "bel": 788, + "year": 789, + "can": 790, + "sin": 791, + "where": 792, + "and": 793, + "made": 794, + "relea": 795, + "sm": 796, + "bl": 797, + "ten": 798, + "with": 799, + "son": 800, + "many": 801, + "are": 802, + "ed": 803, + "how": 804, + "americ": 805, + "ury": 806, + "stu": 807, + "musi": 808, + "cu": 809, + "nam": 810, + "ement": 811, + "such": 812, + "albu": 813, + "buil": 814, + "before": 815, + "ef": 816, + "arm": 817, + "ton": 818, + "them": 819, + "cal": 820, + "bar": 821, + "des": 822, + "mat": 823, + "gener": 824, + "od": 825, + "series": 826, + "cer": 827, + "sho": 828, + "enti": 829, + "her": 830, + "over": 831, + "ann": 832, + "well": 833, + "world": 834, + "gan": 835, + "est": 836, + "second": 837, + "ters": 838, + "side": 839, + "tran": 840, + "line": 841, + "ture": 842, + "port": 843, + "being": 844, + "years": 845, + "both": 846, + "indi": 847, + "these": 848, + "national": 849, + "histor": 850, + "fe": 851, + "vo": 852, + "sted": 853, + "ani": 854, + "bas": 855, + "poin": 856, + "sing": 857, + "film": 858, + "pen": 859, + "sup": 860, + "mis": 861, + "cro": 862, + "stri": 863, + "lin": 864, + "tre": 865, + "war": 866, + "however": 867, + "ying": 868, + "ling": 869, + "yp": 870, + "ected": 871, + "direc": 872, + "vision": 873, + "album": 874, + "then": 875, + "ll": 876, + "sever": 877, + "through": 878, + "known": 879, + "bor": 880, + "cul": 881, + "clu": 882, + "ster": 883, + "south": 884, + "ry": 885, + "ect": 886, + "low": 887, + "pr": 888, + "sk": 889, + "iso": 890, + "north": 891, + "part": 892, + "fac": 893, + "tly": 894, + "peri": 895, + "eu": 896, + "batt": 897, + "state": 898, + "ced": 899, + "consi": 900, + "inf": 901, + "poli": 902, + "olog": 903, + "early": 904, + "posi": 905, + "ames": 906, + "win": 907, + "devel": 908, + "ob": 909, + "ve": 910, + "ven": 911, + "oper": 912, + "ger": 913, + "offi": 914, + "charac": 915, + "ms": 916, + "high": 917, + "ad": 918, + "tho": 919, + "several": 920, + "dre": 921, + "descri": 922, + "ale": 923, + "number": 924, + "air": 925, + "including": 926, + "inst": 927, + "against": 928, + "ls": 929, + "sul": 930, + "episo": 931, + "cam": 932, + "dif": 933, + "soci": 934, + "became": 935, + "like": 936, + "tel": 937, + "four": 938, + "âĢĶ": 939, + "hou": 940, + "joh": 941, + "united": 942, + "inv": 943, + "under": 944, + "nov": 945, + "tiv": 946, + "suc": 947, + "ations": 948, + "ack": 949, + "tor": 950, + "ron": 951, + "und": 952, + "ws": 953, + "fo": 954, + "gr": 955, + "develop": 956, + "although": 957, + "contin": 958, + "west": 959, + "origin": 960, + "music": 961, + "ors": 962, + "don": 963, + "century": 964, + "ward": 965, + "work": 966, + "me": 967, + "ami": 968, + "cha": 969, + "very": 970, + "har": 971, + "dis": 972, + "zed": 973, + "do": 974, + "gs": 975, + "tow": 976, + "sol": 977, + "following": 978, + "lion": 979, + "rema": 980, + "ns": 981, + "tish": 982, + "chur": 983, + "som": 984, + "mp": 985, + "tle": 986, + "gover": 987, + "del": 988, + "comple": 989, + "cur": 990, + "use": 991, + "back": 992, + "hu": 993, + "stern": 994, + "began": 995, + "fiel": 996, + "ause": 997, + "dra": 998, + "pas": 999, + "bil": 1000, + "cation": 1001, + "dent": 1002, + "bed": 1003, + "because": 1004, + "ant": 1005, + "eam": 1006, + "phi": 1007, + "yo": 1008, + "continu": 1009, + "tain": 1010, + "try": 1011, + "fre": 1012, + "peop": 1013, + "called": 1014, + "found": 1015, + "episode": 1016, + "desig": 1017, + "mor": 1018, + "set": 1019, + "ley": 1020, + "east": 1021, + "trac": 1022, + "cra": 1023 + }, + "merges": [ + "t h", + "th e", + "i n", + "a n", + "e d", + "e r", + "r e", + "a r", + "t i", + "o n", + "e n", + "o f", + "o r", + "an d", + "e r", + "o n", + "i n", + "in g", + "s t", + "r o", + "a l", + "i t", + "t o", + "a s", + "a t", + "e s", + "o u", + "h i", + "a c", + "s i", + "a t", + "r i", + "a l", + "e l", + "a n", + "a m", + "o r", + "s t", + "l i", + "u r", + "e c", + "o m", + "d i", + "w as", + "l y", + "e n", + "e a", + "c h", + "u n", + "ti on", + "l a", + "i s", + "f i", + "o l", + "d e", + "- @", + "@ -@", + "r a", + "v i", + "l e", + "l o", + "s h", + "e m", + "b e", + "th at", + "' s", + "c on", + "m a", + "f or", + "h a", + "s u", + "b y", + "it h", + "v e", + "w ith", + "s e", + "c h", + "th e", + "en t", + "p o", + "c e", + "i l", + "s e", + "en t", + "l e", + "c om", + "s p", + "er e", + "p ro", + "n o", + "b u", + "w h", + "i t", + "t h", + "v er", + "n e", + "c a", + "i s", + "f or", + "a g", + "er s", + "m o", + "g h", + "f ro", + "t ed", + "fro m", + "ti on", + "o p", + "hi s", + "a d", + "a b", + "i c", + "h e", + "ou n", + "a s", + "t s", + "s c", + "d e", + "o w", + "e x", + "w hi", + "r u", + "t er", + "a p", + "d s", + "w ere", + "p re", + "d u", + "g u", + "p ar", + "i r", + "b o", + "th er", + "q u", + "l u", + "t er", + "t w", + "e s", + "re c", + "p er", + "t a", + "at e", + "v er", + "at ed", + "d ing", + "it y", + "m an", + "e ar", + "s ed", + "d ed", + "a u", + "al l", + "am e", + "c i", + "on e", + "in g", + "ar e", + "a f", + "i r", + "a tion", + "â Ģ", + "ha d", + "t r", + "u l", + "l d", + "whi ch", + "w a", + "i m", + "l ea", + "b e", + "t o", + "ti m", + "fi r", + "w or", + "on g", + "p or", + "m ar", + "m e", + "al ly", + "s o", + "ou t", + "tion s", + "it s", + "g h", + "g e", + "b er", + "f e", + "p u", + "s er", + "d er", + "p l", + "s s", + "in e", + "in c", + "m i", + "gh t", + "g o", + "th is", + "t ur", + "d a", + "ro u", + "bu t", + "u m", + "s on", + "w e", + "v ed", + "si on", + "k e", + "p la", + "the ir", + "i es", + "fir st", + "s a", + "o c", + "at t", + "o f", + "p e", + "no t", + "g i", + "n a", + "ar y", + "m u", + "l ed", + "âĢ ĵ", + "h er", + "r an", + "c o", + "the y", + "d er", + "al i", + "al so", + "or e", + "e p", + "ou ld", + "af ter", + "s hi", + "u s", + "e t", + "ti c", + "st or", + "w i", + "e v", + "o ther", + "s h", + "t ing", + "ar d", + "t e", + "tw o", + "n i", + "ha ve", + "ou r", + "com m", + "t e", + "ac k", + "o o", + "f in", + "s ec", + "ent s", + "h as", + "com p", + "b ec", + "k s", + "con t", + "l and", + "be en", + "en ce", + "k ing", + "e l", + "ag e", + "lo w", + "m in", + ". @", + "@ .@", + "om e", + "m ent", + "ch ar", + "g e", + "at er", + "n or", + "h o", + "ou s", + "wh o", + "ea r", + "sp ec", + "c ol", + "el y", + "t y", + "j o", + "ur ing", + "du c", + "b ri", + "st r", + "c an", + "or i", + "t ra", + "p a", + "sh e", + "d o", + "ti ve", + "m on", + "ne w", + "r it", + "tim e", + "on s", + "s o", + "m an", + "d ec", + "c ent", + "l an", + "p i", + "ou r", + "in ter", + "f er", + "g ra", + "g re", + "re s", + "inc lu", + "m il", + "d uring", + "ow n", + "pre s", + "j u", + "n ed", + "el l", + ", @", + "@ ,@", + "it e", + "g en", + "wh en", + "si g", + "b i", + "re n", + "f a", + "g a", + "pla y", + "en g", + "tion al", + "oun d", + "th ou", + "m ore", + "re e", + "em ber", + "e i", + "s ou", + "s ur", + "s ti", + "c ar", + "for m", + "l ar", + "s es", + "t en", + "in to", + "t u", + "c es", + "mo st", + "k ed", + "wa y", + "c re", + "c oun", + "u p", + "l es", + "ac e", + "al s", + "k e", + "w ould", + "an t", + "b er", + "f u", + "it ed", + "p ri", + "whi le", + "o ver", + "ing s", + "r e", + "fi l", + "s y", + "e st", + "ab le", + "w n", + "s ea", + "ac h", + "s ing", + "in s", + "ti c", + "i d", + "on ly", + "at es", + "t ri", + "v ing", + "b a", + "v el", + "an ce", + "st a", + "er n", + "f ol", + "e en", + "in ed", + "st ru", + "un i", + "g ame", + "la r", + "s el", + "b li", + "u sed", + "n ing", + "p s", + "ti es", + "k no", + "c or", + "f t", + "rec or", + "b le", + "vi e", + "y s", + "w il", + "ic al", + "ap p", + "t ro", + "th ree", + "c la", + "ol d", + "sh ed", + "h ea", + "ab out", + "w rit", + "th an", + "st e", + "l ater", + "ar i", + "d y", + "pu bli", + "lo c", + "ag a", + "th rou", + "s si", + "en d", + "ma y", + "an g", + "ac h", + "v es", + "o g", + "hi m", + "be tw", + "thou gh", + "betw een", + "u m", + "st ar", + "sc ri", + "re a", + "on d", + "shi p", + "o k", + "h el", + "s ong", + "c hi", + "ca p", + "e ver", + "da y", + "c ri", + "s ome", + "b ro", + "n o", + "th ere", + "an s", + "al l", + "n um", + "r ed", + "ear s", + "st s", + "an y", + "w ar", + "p h", + "p p", + "g in", + "stru c", + "am er", + "pro duc", + "s ch", + "c es", + "ur e", + "at ing", + "em p", + "t or", + "sea son", + "for e", + "i c", + "c ity", + "g ro", + "fol low", + "su b", + "b el", + "y ear", + "c an", + "s in", + "wh ere", + "an d", + "ma de", + "re lea", + "s m", + "b l", + "t en", + "wi th", + "s on", + "man y", + "a re", + "e d", + "h ow", + "amer ic", + "ur y", + "st u", + "mu si", + "c u", + "n am", + "em ent", + "su ch", + "al bu", + "bu il", + "be fore", + "e f", + "ar m", + "t on", + "the m", + "c al", + "b ar", + "d es", + "m at", + "gen er", + "o d", + "ser ies", + "c er", + "sh o", + "en ti", + "h er", + "o ver", + "an n", + "w ell", + "wor ld", + "g an", + "e st", + "sec ond", + "t ers", + "si de", + "tr an", + "l ine", + "tur e", + "por t", + "be ing", + "y ears", + "bo th", + "in di", + "the se", + "na tional", + "hi stor", + "f e", + "v o", + "st ed", + "an i", + "b as", + "po in", + "s ing", + "fil m", + "p en", + "su p", + "m is", + "c ro", + "st ri", + "l in", + "t re", + "wa r", + "how ever", + "y ing", + "l ing", + "y p", + "ec ted", + "di rec", + "vi sion", + "albu m", + "th en", + "l l", + "se ver", + "throu gh", + "kno wn", + "b or", + "c ul", + "c lu", + "st er", + "sou th", + "r y", + "ec t", + "lo w", + "p r", + "s k", + "is o", + "nor th", + "par t", + "f ac", + "t ly", + "per i", + "e u", + "b att", + "st ate", + "c ed", + "con si", + "in f", + "po li", + "ol og", + "ear ly", + "po si", + "am es", + "w in", + "de vel", + "o b", + "v e", + "v en", + "op er", + "g er", + "of fi", + "char ac", + "m s", + "hi gh", + "a d", + "th o", + "sever al", + "d re", + "de scri", + "al e", + "num ber", + "a ir", + "inclu ding", + "in st", + "aga inst", + "l s", + "su l", + "ep iso", + "c am", + "di f", + "so ci", + "bec ame", + "li ke", + "t el", + "f our", + "âĢ Ķ", + "h ou", + "jo h", + "un ited", + "in v", + "un der", + "no v", + "ti v", + "su c", + "a tions", + "ac k", + "t or", + "r on", + "un d", + "w s", + "f o", + "g r", + "devel op", + "al though", + "cont in", + "we st", + "ori gin", + "musi c", + "or s", + "d on", + "cent ury", + "w ard", + "wor k", + "m e", + "am i", + "ch a", + "ver y", + "h ar", + "di s", + "z ed", + "d o", + "g s", + "t ow", + "s ol", + "follow ing", + "li on", + "re ma", + "n s", + "ti sh", + "ch ur", + "s om", + "m p", + "t le", + "go ver", + "d el", + "comp le", + "c ur", + "u se", + "b ack", + "h u", + "st ern", + "be gan", + "fi el", + "au se", + "d ra", + "p as", + "b il", + "ca tion", + "d ent", + "b ed", + "bec ause", + "an t", + "ea m", + "p hi", + "y o", + "contin u", + "ta in", + "tr y", + "f re", + "pe op", + "cal led", + "f ound", + "episo de", + "de sig", + "m or", + "se t", + "le y", + "ea st", + "tr ac", + "c ra" + ] + } +} \ No newline at end of file diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..6892753 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,34 @@ +{ + "add_prefix_space": false, + "bos_token": { + "__type": "AddedToken", + "content": "<|startoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "do_lower_case": true, + "eos_token": { + "__type": "AddedToken", + "content": "<|endoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "errors": "replace", + "model_max_length": 77, + "name_or_path": "temp/dummy/clip/processors", + "pad_token": "<|endoftext|>", + "special_tokens_map_file": "/home/huggingface/.cache/huggingface/hub/models--openai--clip-vit-base-patch32/snapshots/e6a30b603a447e251fdaca1c3056b2a16cdfebeb/special_tokens_map.json", + "tokenizer_class": "CLIPTokenizer", + "unk_token": { + "__type": "AddedToken", + "content": "<|endoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + } +} diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..b73cde7 --- /dev/null +++ b/vocab.json @@ -0,0 +1,1026 @@ +{ + "!": 2, + "!": 277, + "\"": 3, + "\"": 281, + "#": 4, + "#": 288, + "$": 5, + "$": 274, + "%": 6, + "%": 255, + "&": 7, + "&": 258, + "'": 8, + "'": 223, + "'s": 363, + "(": 9, + "(": 289, + ")": 10, + ")": 279, + "*": 11, + "*": 295, + "+": 12, + "+": 294, + ",": 13, + ",": 276, + ",@": 622, + "-": 14, + "-": 247, + "-@": 353, + ".": 15, + ".": 236, + ".@": 569, + "/": 16, + "/": 272, + "0": 17, + "0": 285, + "1": 18, + "1": 293, + "2": 19, + "2": 286, + "3": 20, + "3": 291, + "4": 21, + "4": 284, + "5": 22, + "5": 275, + "6": 23, + "6": 290, + "7": 24, + "7": 280, + "8": 25, + "8": 240, + "9": 26, + "9": 218, + ":": 27, + ":": 292, + ";": 28, + ";": 228, + "<": 29, + "<": 265, + "<|endoftext|>": 1, + "<|startoftext|>": 0, + "=": 30, + "=": 264, + ">": 31, + ">": 273, + "?": 32, + "?": 296, + "@": 33, + "@,@": 623, + "@-@": 354, + "@.@": 570, + "@": 231, + "[": 34, + "[": 283, + "\\": 35, + "\\": 297, + "]": 36, + "]": 278, + "^": 37, + "^": 282, + "_": 38, + "_": 269, + "`": 39, + "`": 267, + "a": 40, + "a": 184, + "ab": 408, + "able": 675, + "about": 721, + "ac": 326, + "ace": 659, + "ach": 678, + "ach": 736, + "ack": 949, + "ack": 551, + "ad": 407, + "ad": 918, + "af": 455, + "after": 532, + "ag": 397, + "aga": 730, + "against": 928, + "age": 566, + "air": 925, + "al": 318, + "al": 330, + "albu": 813, + "album": 874, + "ale": 923, + "ali": 527, + "all": 762, + "all": 449, + "ally": 476, + "als": 660, + "also": 528, + "although": 957, + "am": 333, + "ame": 450, + "amer": 773, + "americ": 805, + "ames": 906, + "ami": 968, + "an": 301, + "an": 332, + "ance": 689, + "and": 793, + "and": 311, + "ang": 735, + "ani": 854, + "ann": 832, + "ans": 761, + "ant": 1005, + "ant": 663, + "any": 767, + "ap": 421, + "app": 714, + "ar": 305, + "ard": 543, + "are": 802, + "are": 454, + "ari": 726, + "arm": 817, + "ary": 518, + "as": 412, + "as": 321, + "at": 322, + "at": 328, + "ate": 439, + "ated": 441, + "ater": 575, + "ates": 684, + "ating": 778, + "ation": 457, + "ations": 948, + "att": 512, + "au": 448, + "ause": 997, + "b": 41, + "b": 199, + "ba": 687, + "back": 992, + "bar": 821, + "bas": 855, + "batt": 897, + "be": 361, + "be": 467, + "bec": 558, + "became": 935, + "because": 1004, + "bed": 1003, + "been": 562, + "before": 815, + "began": 995, + "being": 844, + "bel": 788, + "ber": 664, + "ber": 483, + "betw": 740, + "between": 742, + "bi": 628, + "bil": 1000, + "bl": 797, + "ble": 709, + "bli": 700, + "bo": 429, + "bor": 880, + "both": 846, + "bri": 588, + "bro": 758, + "bu": 388, + "buil": 814, + "but": 499, + "by": 369, + "c": 42, + "c": 178, + "ca": 394, + "cal": 820, + "called": 1014, + "cam": 932, + "can": 590, + "can": 790, + "cap": 753, + "car": 644, + "cation": 1001, + "ce": 378, + "ced": 899, + "cent": 605, + "century": 964, + "cer": 827, + "ces": 776, + "ces": 651, + "ch": 345, + "ch": 374, + "cha": 969, + "char": 573, + "charac": 915, + "chi": 752, + "chur": 983, + "ci": 451, + "city": 784, + "cla": 717, + "clu": 882, + "co": 524, + "col": 582, + "com": 383, + "comm": 549, + "comp": 557, + "comple": 989, + "con": 364, + "consi": 900, + "cont": 560, + "contin": 958, + "continu": 1009, + "cor": 706, + "coun": 656, + "cra": 1023, + "cre": 655, + "cri": 756, + "cro": 862, + "cu": 809, + "cul": 881, + "cur": 990, + "d": 43, + "d": 167, + "da": 497, + "day": 755, + "de": 352, + "de": 415, + "dec": 604, + "ded": 447, + "del": 988, + "dent": 1002, + "der": 487, + "der": 526, + "des": 822, + "descri": 922, + "desig": 1017, + "devel": 908, + "develop": 956, + "di": 340, + "dif": 933, + "ding": 442, + "direc": 872, + "dis": 972, + "do": 595, + "do": 974, + "don": 963, + "dra": 998, + "dre": 921, + "ds": 422, + "du": 425, + "duc": 587, + "during": 616, + "dy": 727, + "e": 44, + "e": 171, + "ea": 344, + "eam": 1006, + "ear": 445, + "ear": 580, + "early": 904, + "ears": 765, + "east": 1021, + "ec": 338, + "ect": 886, + "ected": 871, + "ed": 803, + "ed": 302, + "een": 693, + "ef": 816, + "ei": 640, + "el": 331, + "el": 565, + "ell": 621, + "ely": 583, + "em": 360, + "ember": 639, + "ement": 811, + "emp": 779, + "en": 308, + "en": 343, + "ence": 563, + "end": 733, + "eng": 633, + "ent": 376, + "ent": 381, + "enti": 829, + "ents": 555, + "ep": 530, + "episo": 931, + "episode": 1016, + "er": 303, + "er": 312, + "ere": 385, + "ern": 691, + "ers": 398, + "es": 435, + "es": 323, + "est": 674, + "est": 836, + "et": 535, + "eu": 896, + "ev": 539, + "ever": 754, + "ex": 417, + "f": 45, + "f": 187, + "fa": 630, + "fac": 893, + "fe": 484, + "fe": 851, + "fer": 610, + "fi": 350, + "fiel": 996, + "fil": 672, + "film": 858, + "fin": 553, + "fir": 470, + "first": 509, + "fo": 954, + "fol": 692, + "follow": 786, + "following": 978, + "for": 396, + "for": 366, + "fore": 782, + "form": 645, + "found": 1015, + "four": 938, + "fre": 1012, + "fro": 401, + "from": 403, + "ft": 707, + "fu": 665, + "g": 46, + "g": 175, + "ga": 631, + "game": 697, + "gan": 835, + "ge": 574, + "ge": 482, + "gen": 625, + "gener": 824, + "ger": 913, + "gh": 400, + "gh": 481, + "ght": 493, + "gi": 516, + "gin": 771, + "go": 494, + "gover": 987, + "gr": 955, + "gra": 611, + "gre": 612, + "gro": 785, + "gs": 975, + "gu": 426, + "h": 47, + "h": 168, + "ha": 367, + "had": 459, + "har": 971, + "has": 556, + "have": 547, + "he": 410, + "hea": 720, + "hel": 750, + "her": 830, + "her": 522, + "hi": 325, + "high": 917, + "him": 739, + "his": 406, + "histor": 850, + "ho": 577, + "hou": 940, + "how": 804, + "however": 867, + "hu": 993, + "i": 48, + "i": 185, + "ic": 409, + "ic": 783, + "ical": 713, + "id": 682, + "ies": 508, + "il": 379, + "im": 465, + "in": 300, + "in": 314, + "inc": 491, + "inclu": 614, + "including": 926, + "indi": 847, + "ine": 490, + "ined": 694, + "inf": 901, + "ing": 453, + "ing": 315, + "ings": 670, + "ins": 680, + "inst": 927, + "inter": 609, + "into": 649, + "inv": 943, + "ir": 428, + "ir": 456, + "is": 395, + "is": 349, + "iso": 890, + "it": 319, + "it": 390, + "ite": 624, + "ited": 666, + "ith": 370, + "its": 480, + "ity": 443, + "j": 49, + "j": 203, + "jo": 585, + "joh": 941, + "ju": 619, + "k": 50, + "k": 183, + "ke": 661, + "ke": 505, + "ked": 653, + "king": 564, + "kno": 705, + "known": 879, + "ks": 559, + "l": 51, + "l": 172, + "la": 348, + "lan": 606, + "land": 561, + "lar": 646, + "lar": 698, + "later": 725, + "ld": 462, + "le": 382, + "le": 357, + "lea": 466, + "led": 520, + "les": 658, + "ley": 1020, + "li": 336, + "like": 936, + "lin": 864, + "line": 841, + "ling": 869, + "lion": 979, + "ll": 876, + "lo": 358, + "loc": 729, + "low": 567, + "low": 887, + "ls": 929, + "lu": 432, + "ly": 342, + "m": 52, + "m": 173, + "ma": 365, + "made": 794, + "man": 444, + "man": 603, + "many": 801, + "mar": 474, + "mat": 823, + "may": 734, + "me": 475, + "me": 967, + "ment": 572, + "mi": 492, + "mil": 615, + "min": 568, + "mis": 861, + "mo": 399, + "mon": 597, + "mor": 1018, + "more": 637, + "most": 652, + "mp": 985, + "ms": 916, + "mu": 519, + "musi": 808, + "music": 961, + "n": 53, + "n": 174, + "na": 517, + "nam": 810, + "national": 849, + "ne": 393, + "ned": 620, + "new": 598, + "ni": 546, + "ning": 702, + "no": 387, + "no": 759, + "nor": 576, + "north": 891, + "not": 515, + "nov": 945, + "ns": 981, + "num": 763, + "number": 924, + "o": 54, + "o": 182, + "ob": 909, + "oc": 511, + "od": 825, + "of": 513, + "of": 309, + "offi": 914, + "og": 738, + "ok": 749, + "ol": 351, + "old": 718, + "olog": 903, + "om": 339, + "ome": 571, + "on": 307, + "on": 313, + "ond": 747, + "one": 452, + "ong": 472, + "only": 683, + "ons": 601, + "oo": 552, + "op": 405, + "oper": 912, + "or": 310, + "or": 334, + "ore": 529, + "ori": 591, + "origin": 960, + "ors": 962, + "other": 540, + "ou": 324, + "ould": 531, + "oun": 411, + "ound": 635, + "our": 548, + "our": 608, + "ous": 578, + "out": 478, + "over": 831, + "over": 669, + "ow": 416, + "own": 617, + "p": 55, + "p": 189, + "pa": 593, + "par": 427, + "part": 892, + "pas": 999, + "pe": 514, + "pen": 859, + "peop": 1013, + "per": 437, + "peri": 895, + "ph": 769, + "phi": 1007, + "pi": 607, + "pl": 488, + "pla": 506, + "play": 632, + "po": 377, + "poin": 856, + "poli": 902, + "por": 473, + "port": 843, + "posi": 905, + "pp": 770, + "pr": 888, + "pre": 424, + "pres": 618, + "pri": 667, + "pro": 386, + "produc": 774, + "ps": 703, + "pu": 485, + "publi": 728, + "q": 56, + "q": 210, + "qu": 431, + "r": 57, + "r": 176, + "ra": 355, + "ran": 523, + "re": 304, + "re": 671, + "rea": 746, + "rec": 436, + "recor": 708, + "red": 764, + "ree": 638, + "relea": 795, + "rema": 980, + "ren": 629, + "res": 613, + "ri": 329, + "rit": 599, + "ro": 317, + "ron": 951, + "rou": 498, + "ru": 419, + "ry": 885, + "s": 58, + "s": 170, + "sa": 510, + "sc": 414, + "sch": 775, + "scri": 745, + "se": 380, + "se": 373, + "sea": 677, + "season": 781, + "sec": 554, + "second": 837, + "sed": 446, + "sel": 699, + "ser": 486, + "series": 826, + "ses": 647, + "set": 1019, + "sever": 877, + "several": 920, + "sh": 359, + "sh": 541, + "she": 594, + "shed": 719, + "shi": 533, + "ship": 748, + "sho": 828, + "si": 327, + "side": 839, + "sig": 627, + "sin": 791, + "sing": 857, + "sing": 679, + "sion": 504, + "sk": 889, + "sm": 796, + "so": 602, + "so": 477, + "soci": 934, + "sol": 977, + "som": 984, + "some": 757, + "son": 800, + "son": 501, + "song": 751, + "sou": 641, + "south": 884, + "sp": 384, + "spec": 581, + "ss": 489, + "ssi": 732, + "st": 316, + "st": 335, + "sta": 690, + "star": 744, + "state": 898, + "ste": 724, + "sted": 853, + "ster": 883, + "stern": 994, + "sti": 643, + "stor": 537, + "str": 589, + "stri": 863, + "stru": 695, + "struc": 772, + "sts": 766, + "stu": 807, + "su": 368, + "sub": 787, + "suc": 947, + "such": 812, + "sul": 930, + "sup": 860, + "sur": 642, + "sy": 673, + "t": 59, + "t": 180, + "ta": 438, + "tain": 1010, + "te": 544, + "te": 550, + "ted": 402, + "tel": 937, + "ten": 648, + "ten": 798, + "ter": 433, + "ter": 420, + "ters": 838, + "th": 298, + "th": 391, + "than": 723, + "that": 362, + "the": 375, + "the": 299, + "their": 507, + "them": 819, + "then": 875, + "ther": 430, + "there": 760, + "these": 848, + "they": 525, + "this": 495, + "tho": 919, + "thou": 636, + "though": 741, + "three": 716, + "throu": 731, + "through": 878, + "ti": 306, + "tic": 536, + "tic": 681, + "ties": 704, + "tim": 469, + "time": 600, + "ting": 542, + "tion": 404, + "tion": 347, + "tional": 634, + "tions": 479, + "tish": 982, + "tiv": 946, + "tive": 596, + "tle": 986, + "tly": 894, + "to": 468, + "to": 320, + "ton": 818, + "tor": 780, + "tor": 950, + "tow": 976, + "tr": 460, + "tra": 592, + "trac": 1022, + "tran": 840, + "tre": 865, + "tri": 685, + "tro": 715, + "try": 1011, + "ts": 413, + "tu": 650, + "tur": 496, + "ture": 842, + "tw": 434, + "two": 545, + "ty": 584, + "u": 60, + "u": 186, + "ul": 461, + "um": 500, + "um": 743, + "un": 346, + "und": 952, + "under": 944, + "uni": 696, + "united": 942, + "up": 657, + "ur": 337, + "ure": 777, + "uring": 586, + "ury": 806, + "us": 534, + "use": 991, + "used": 701, + "v": 61, + "v": 196, + "ve": 910, + "ve": 371, + "ved": 503, + "vel": 688, + "ven": 911, + "ver": 392, + "ver": 440, + "very": 970, + "ves": 737, + "vi": 356, + "vie": 710, + "ving": 686, + "vision": 873, + "vo": 852, + "w": 62, + "w": 194, + "wa": 464, + "war": 768, + "war": 866, + "ward": 965, + "was": 341, + "way": 654, + "we": 502, + "well": 833, + "were": 423, + "west": 959, + "wh": 389, + "when": 626, + "where": 792, + "whi": 418, + "which": 463, + "while": 668, + "who": 579, + "wi": 538, + "wil": 712, + "win": 907, + "with": 799, + "with": 372, + "wn": 676, + "wor": 471, + "work": 966, + "world": 834, + "would": 662, + "writ": 722, + "ws": 953, + "x": 63, + "x": 200, + "y": 64, + "y": 169, + "year": 789, + "years": 845, + "ying": 868, + "yo": 1008, + "yp": 870, + "ys": 711, + "z": 65, + "z": 193, + "zed": 973, + "|": 66, + "|": 268, + "}": 67, + "}": 227, + "~": 68, + "~": 287, + "¡": 69, + "¡": 206, + "¢": 70, + "¢": 221, + "£": 71, + "£": 243, + "¤": 72, + "¤": 192, + "¥": 73, + "¥": 212, + "¦": 74, + "¦": 215, + "§": 75, + "§": 226, + "¨": 76, + "¨": 177, + "©": 77, + "©": 188, + "ª": 78, + "ª": 202, + "«": 79, + "«": 205, + "¬": 80, + "¬": 232, + "®": 81, + "®": 248, + "¯": 82, + "¯": 190, + "°": 83, + "°": 201, + "±": 84, + "±": 179, + "²": 85, + "²": 246, + "³": 86, + "³": 235, + "´": 87, + "´": 257, + "µ": 88, + "µ": 225, + "¶": 89, + "¶": 214, + "·": 90, + "·": 211, + "¸": 91, + "¸": 217, + "¹": 92, + "¹": 207, + "º": 93, + "º": 204, + "»": 94, + "»": 198, + "¼": 95, + "¼": 224, + "½": 96, + "½": 271, + "¾": 97, + "¾": 191, + "¿": 98, + "¿": 249, + "Â": 99, + "Ã": 100, + "Ä": 101, + "Å": 102, + "Æ": 103, + "Ç": 104, + "È": 105, + "É": 106, + "Ê": 107, + "Ë": 108, + "Ì": 109, + "Í": 110, + "Î": 111, + "Ï": 112, + "Ð": 113, + "Ñ": 114, + "Ö": 115, + "×": 116, + "Ø": 117, + "Ù": 118, + "Ü": 119, + "à": 120, + "á": 121, + "â": 122, + "âĢ": 458, + "âĢĵ": 521, + "âĢĶ": 939, + "ã": 123, + "ä": 124, + "å": 125, + "æ": 126, + "ç": 127, + "è": 128, + "é": 129, + "ë": 130, + "ì": 131, + "ï": 132, + "Ģ": 133, + "Ģ": 252, + "ģ": 134, + "ģ": 260, + "Ĥ": 135, + "Ĥ": 195, + "ĥ": 136, + "ĥ": 208, + "Ħ": 137, + "Ħ": 239, + "ħ": 138, + "ħ": 270, + "Ĩ": 139, + "Ĩ": 238, + "ĩ": 140, + "ĩ": 197, + "Ī": 141, + "Ī": 256, + "ī": 142, + "ī": 253, + "Ĭ": 143, + "Ĭ": 209, + "ĭ": 144, + "ĭ": 259, + "Į": 145, + "Į": 219, + "į": 146, + "į": 181, + "İ": 147, + "İ": 261, + "ı": 148, + "ı": 222, + "IJ": 149, + "IJ": 216, + "ij": 150, + "ij": 262, + "Ĵ": 151, + "Ĵ": 234, + "ĵ": 152, + "ĵ": 263, + "Ķ": 153, + "Ķ": 229, + "ķ": 154, + "ķ": 242, + "ĸ": 155, + "ĸ": 266, + "Ĺ": 156, + "Ĺ": 230, + "ĺ": 157, + "ĺ": 237, + "Ļ": 158, + "Ļ": 233, + "ļ": 159, + "ļ": 250, + "Ľ": 160, + "Ľ": 254, + "ľ": 161, + "ľ": 251, + "Ŀ": 162, + "Ŀ": 245, + "ŀ": 163, + "ŀ": 244, + "Ł": 164, + "Ł": 220, + "ł": 165, + "ł": 241, + "Ń": 166, + "Ń": 213 +}