add downloader

2026-03-21 08:08:13 +00:00 · 2024-06-24 16:45:35 +08:00
parent 00f294454b
commit e9ec2f2706
26 changed files with 430 additions and 42 deletions
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/special_tokens_map.json
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/special_tokens_map.json
@@ -0,0 +1,7 @@
+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/tokenizer_config.json
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/tokenizer_config.json
@@ -0,0 +1,16 @@
+{
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "name_or_path": "hfl/chinese-roberta-wwm-ext",
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "special_tokens_map_file": "./special_tokens_map.json",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]",
+  "model_max_length": 77
+}
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/vocab.txt
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/vocab.txt
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/vocab_org.txt
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer/vocab_org.txt
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/config.json
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/config.json
@@ -0,0 +1,28 @@
+{
+  "_name_or_path": "/home/patrick/t5/mt5-xl",
+  "architectures": [
+    "MT5ForConditionalGeneration"
+  ],
+  "d_ff": 5120,
+  "d_kv": 64,
+  "d_model": 2048,
+  "decoder_start_token_id": 0,
+  "dropout_rate": 0.1,
+  "eos_token_id": 1,
+  "feed_forward_proj": "gated-gelu",
+  "initializer_factor": 1.0,
+  "is_encoder_decoder": true,
+  "layer_norm_epsilon": 1e-06,
+  "model_type": "mt5",
+  "num_decoder_layers": 24,
+  "num_heads": 32,
+  "num_layers": 24,
+  "output_past": true,
+  "pad_token_id": 0,
+  "relative_attention_num_buckets": 32,
+  "tie_word_embeddings": false,
+  "tokenizer_class": "T5Tokenizer",
+  "transformers_version": "4.10.0.dev0",
+  "use_cache": true,
+  "vocab_size": 250112
+}
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/special_tokens_map.json
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/special_tokens_map.json
@@ -0,0 +1 @@
+{"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/spiece.model
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/spiece.model
--- a/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/tokenizer_config.json
+++ b/diffsynth/tokenizer_configs/hunyuan_dit/tokenizer_t5/tokenizer_config.json
@@ -0,0 +1 @@
+{"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "extra_ids": 0, "additional_special_tokens": null, "special_tokens_map_file": "", "tokenizer_file": null, "name_or_path": "google/mt5-small", "model_max_length": 256, "legacy": true}
--- a/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/merges.txt
+++ b/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/merges.txt
--- a/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/special_tokens_map.json
+++ b/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/special_tokens_map.json
@@ -0,0 +1,24 @@
+{
+  "bos_token": {
+    "content": "<|startoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<|endoftext|>",
+  "unk_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}
--- a/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/tokenizer_config.json
+++ b/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/tokenizer_config.json
@@ -0,0 +1,34 @@
+{
+  "add_prefix_space": false,
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "<|startoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "do_lower_case": true,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "errors": "replace",
+  "model_max_length": 77,
+  "name_or_path": "openai/clip-vit-large-patch14",
+  "pad_token": "<|endoftext|>",
+  "special_tokens_map_file": "./special_tokens_map.json",
+  "tokenizer_class": "CLIPTokenizer",
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}
--- a/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/vocab.json
+++ b/diffsynth/tokenizer_configs/stable_diffusion/tokenizer/vocab.json
--- a/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/merges.txt
+++ b/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/merges.txt
--- a/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/special_tokens_map.json
+++ b/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/special_tokens_map.json
@@ -0,0 +1,24 @@
+{
+    "bos_token": {
+      "content": "<|startoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    "eos_token": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    },
+    "pad_token": "!",
+    "unk_token": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false
+    }
+}
--- a/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/tokenizer_config.json
+++ b/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/tokenizer_config.json
@@ -0,0 +1,38 @@
+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "!",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "49406": {
+      "content": "<|startoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "49407": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|startoftext|>",
+  "clean_up_tokenization_spaces": true,
+  "do_lower_case": true,
+  "eos_token": "<|endoftext|>",
+  "errors": "replace",
+  "model_max_length": 77,
+  "pad_token": "!",
+  "tokenizer_class": "CLIPTokenizer",
+  "unk_token": "<|endoftext|>"
+}
--- a/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/vocab.json
+++ b/diffsynth/tokenizer_configs/stable_diffusion_xl/tokenizer_2/vocab.json
				`@@ -0,0 +1 @@`
				`{"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}`