johnrachwanpruna committed on
Commit
5da70fe
·
verified ·
1 Parent(s): 9945884

Add files using upload-large-folder tool

Browse files
safety_checker/config.json CHANGED
@@ -8,30 +8,52 @@
8
  "model_type": "clip",
9
  "projection_dim": 64,
10
  "text_config": {
 
11
  "attention_dropout": 0.1,
12
  "bos_token_id": 0,
 
 
13
  "dropout": 0.1,
14
  "dtype": "float32",
15
  "eos_token_id": 2,
 
16
  "gradient_checkpointing": false,
17
  "hidden_act": "quick_gelu",
18
  "hidden_size": 32,
19
  "initializer_factor": 1.0,
20
  "initializer_range": 0.02,
21
  "intermediate_size": 37,
 
22
  "layer_norm_eps": 1e-05,
23
  "max_position_embeddings": 512,
24
  "model_type": "clip_text_model",
25
  "num_attention_heads": 4,
26
  "num_hidden_layers": 5,
 
 
27
  "projection_dim": 512,
 
 
 
 
 
 
 
 
 
28
  "vocab_size": 99
29
  },
30
- "transformers_version": "4.57.6",
31
  "vision_config": {
 
32
  "attention_dropout": 0.1,
 
 
 
33
  "dropout": 0.1,
34
  "dtype": "float32",
 
 
35
  "gradient_checkpointing": false,
36
  "hidden_act": "quick_gelu",
37
  "hidden_size": 32,
@@ -39,13 +61,25 @@
39
  "initializer_factor": 1.0,
40
  "initializer_range": 0.02,
41
  "intermediate_size": 37,
 
42
  "layer_norm_eps": 1e-05,
43
  "model_type": "clip_vision_model",
44
  "num_attention_heads": 4,
45
  "num_channels": 3,
46
  "num_hidden_layers": 5,
 
47
  "patch_size": 2,
48
- "projection_dim": 512
 
 
 
 
 
 
 
 
 
 
49
  },
50
  "vocab_size": 1000
51
  }
 
8
  "model_type": "clip",
9
  "projection_dim": 64,
10
  "text_config": {
11
+ "add_cross_attention": false,
12
  "attention_dropout": 0.1,
13
  "bos_token_id": 0,
14
+ "cross_attention_hidden_size": null,
15
+ "decoder_start_token_id": null,
16
  "dropout": 0.1,
17
  "dtype": "float32",
18
  "eos_token_id": 2,
19
+ "finetuning_task": null,
20
  "gradient_checkpointing": false,
21
  "hidden_act": "quick_gelu",
22
  "hidden_size": 32,
23
  "initializer_factor": 1.0,
24
  "initializer_range": 0.02,
25
  "intermediate_size": 37,
26
+ "is_decoder": false,
27
  "layer_norm_eps": 1e-05,
28
  "max_position_embeddings": 512,
29
  "model_type": "clip_text_model",
30
  "num_attention_heads": 4,
31
  "num_hidden_layers": 5,
32
+ "pad_token_id": 1,
33
+ "prefix": null,
34
  "projection_dim": 512,
35
+ "pruned_heads": {},
36
+ "sep_token_id": null,
37
+ "task_specific_params": null,
38
+ "tf_legacy_loss": false,
39
+ "tie_encoder_decoder": false,
40
+ "tie_word_embeddings": true,
41
+ "tokenizer_class": null,
42
+ "torchscript": false,
43
+ "use_bfloat16": false,
44
  "vocab_size": 99
45
  },
46
+ "transformers_version": "5.1.0",
47
  "vision_config": {
48
+ "add_cross_attention": false,
49
  "attention_dropout": 0.1,
50
+ "bos_token_id": null,
51
+ "cross_attention_hidden_size": null,
52
+ "decoder_start_token_id": null,
53
  "dropout": 0.1,
54
  "dtype": "float32",
55
+ "eos_token_id": null,
56
+ "finetuning_task": null,
57
  "gradient_checkpointing": false,
58
  "hidden_act": "quick_gelu",
59
  "hidden_size": 32,
 
61
  "initializer_factor": 1.0,
62
  "initializer_range": 0.02,
63
  "intermediate_size": 37,
64
+ "is_decoder": false,
65
  "layer_norm_eps": 1e-05,
66
  "model_type": "clip_vision_model",
67
  "num_attention_heads": 4,
68
  "num_channels": 3,
69
  "num_hidden_layers": 5,
70
+ "pad_token_id": null,
71
  "patch_size": 2,
72
+ "prefix": null,
73
+ "projection_dim": 512,
74
+ "pruned_heads": {},
75
+ "sep_token_id": null,
76
+ "task_specific_params": null,
77
+ "tf_legacy_loss": false,
78
+ "tie_encoder_decoder": false,
79
+ "tie_word_embeddings": true,
80
+ "tokenizer_class": null,
81
+ "torchscript": false,
82
+ "use_bfloat16": false
83
  },
84
  "vocab_size": 1000
85
  }
text_encoder/config.json CHANGED
@@ -19,6 +19,6 @@
19
  "num_hidden_layers": 5,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
- "transformers_version": "4.57.6",
23
  "vocab_size": 1000
24
  }
 
19
  "num_hidden_layers": 5,
20
  "pad_token_id": 1,
21
  "projection_dim": 512,
22
+ "transformers_version": "5.1.0",
23
  "vocab_size": 1000
24
  }
tokenizer/tokenizer_config.json CHANGED
@@ -1,29 +1,11 @@
1
  {
2
  "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "0": {
5
- "content": "<|startoftext|>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- },
12
- "1": {
13
- "content": "<|endoftext|>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false,
18
- "special": true
19
- }
20
- },
21
  "bos_token": "<|startoftext|>",
22
- "clean_up_tokenization_spaces": false,
23
  "do_lower_case": true,
24
  "eos_token": "<|endoftext|>",
25
  "errors": "replace",
26
- "extra_special_tokens": {},
27
  "model_max_length": 77,
28
  "pad_token": "<|endoftext|>",
29
  "tokenizer_class": "CLIPTokenizer",
 
1
  {
2
  "add_prefix_space": false,
3
+ "backend": "tokenizers",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  "bos_token": "<|startoftext|>",
 
5
  "do_lower_case": true,
6
  "eos_token": "<|endoftext|>",
7
  "errors": "replace",
8
+ "is_local": true,
9
  "model_max_length": 77,
10
  "pad_token": "<|endoftext|>",
11
  "tokenizer_class": "CLIPTokenizer",