mattdangerw committed on
Commit
91ff790
·
verified ·
1 Parent(s): 7a6202c

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. config.json +2 -2
  2. metadata.json +7 -3
  3. preprocessor.json +26 -8
  4. task.json +31 -13
  5. tokenizer.json +14 -4
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "module": "keras_nlp.src.models.bert.bert_backbone",
3
  "class_name": "BertBackbone",
4
  "config": {
5
  "name": "bert_backbone",
@@ -13,5 +13,5 @@
13
  "max_sequence_length": 512,
14
  "num_segments": 2
15
  },
16
- "registered_name": "keras_nlp>BertBackbone"
17
  }
 
1
  {
2
+ "module": "keras_hub.src.models.bert.bert_backbone",
3
  "class_name": "BertBackbone",
4
  "config": {
5
  "name": "bert_backbone",
 
13
  "max_sequence_length": 512,
14
  "num_segments": 2
15
  },
16
+ "registered_name": "keras_hub>BertBackbone"
17
  }
metadata.json CHANGED
@@ -1,6 +1,10 @@
1
  {
2
- "keras_version": "3.3.2",
3
- "keras_nlp_version": "0.10.0.dev0",
4
  "parameter_count": 4385920,
5
- "date_saved": "2024-04-26@21:06:10"
 
 
 
 
6
  }
 
1
  {
2
+ "keras_version": "3.7.0",
3
+ "keras_hub_version": "0.19.0",
4
  "parameter_count": 4385920,
5
+ "date_saved": "2024-12-20@19:42:55",
6
+ "tasks": [
7
+ "MaskedLM",
8
+ "TextClassifier"
9
+ ]
10
  }
preprocessor.json CHANGED
@@ -1,29 +1,47 @@
1
  {
2
- "module": "keras_nlp.src.models.bert.bert_preprocessor",
3
- "class_name": "BertPreprocessor",
4
  "config": {
5
  "name": "bert_preprocessor_2",
6
  "trainable": true,
7
- "dtype": "float32",
 
 
 
 
 
 
 
8
  "tokenizer": {
9
- "module": "keras_nlp.src.models.bert.bert_tokenizer",
10
  "class_name": "BertTokenizer",
11
  "config": {
12
  "name": "bert_tokenizer",
13
  "trainable": true,
14
- "dtype": "int32",
 
 
 
 
 
 
 
 
15
  "vocabulary": null,
16
  "sequence_length": null,
17
  "lowercase": true,
18
  "strip_accents": false,
19
  "split": true,
20
  "suffix_indicator": "##",
21
- "oov_token": "[UNK]"
 
 
22
  },
23
- "registered_name": "keras_nlp>BertTokenizer"
24
  },
 
25
  "sequence_length": 512,
26
  "truncate": "round_robin"
27
  },
28
- "registered_name": "keras_nlp>BertPreprocessor"
29
  }
 
1
  {
2
+ "module": "keras_hub.src.models.bert.bert_text_classifier_preprocessor",
3
+ "class_name": "BertTextClassifierPreprocessor",
4
  "config": {
5
  "name": "bert_preprocessor_2",
6
  "trainable": true,
7
+ "dtype": {
8
+ "module": "keras",
9
+ "class_name": "DTypePolicy",
10
+ "config": {
11
+ "name": "float32"
12
+ },
13
+ "registered_name": null
14
+ },
15
  "tokenizer": {
16
+ "module": "keras_hub.src.models.bert.bert_tokenizer",
17
  "class_name": "BertTokenizer",
18
  "config": {
19
  "name": "bert_tokenizer",
20
  "trainable": true,
21
+ "dtype": {
22
+ "module": "keras",
23
+ "class_name": "DTypePolicy",
24
+ "config": {
25
+ "name": "int32"
26
+ },
27
+ "registered_name": null
28
+ },
29
+ "config_file": "tokenizer.json",
30
  "vocabulary": null,
31
  "sequence_length": null,
32
  "lowercase": true,
33
  "strip_accents": false,
34
  "split": true,
35
  "suffix_indicator": "##",
36
+ "oov_token": "[UNK]",
37
+ "special_tokens": null,
38
+ "special_tokens_in_strings": false
39
  },
40
+ "registered_name": "keras_hub>BertTokenizer"
41
  },
42
+ "config_file": "preprocessor.json",
43
  "sequence_length": 512,
44
  "truncate": "round_robin"
45
  },
46
+ "registered_name": "keras_hub>BertTextClassifierPreprocessor"
47
  }
task.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "module": "keras_nlp.src.models.bert.bert_classifier",
3
- "class_name": "BertClassifier",
4
  "config": {
5
  "backbone": {
6
- "module": "keras_nlp.src.models.bert.bert_backbone",
7
  "class_name": "BertBackbone",
8
  "config": {
9
  "name": "bert_backbone",
@@ -17,41 +17,59 @@
17
  "max_sequence_length": 512,
18
  "num_segments": 2
19
  },
20
- "registered_name": "keras_nlp>BertBackbone"
21
  },
22
  "preprocessor": {
23
- "module": "keras_nlp.src.models.bert.bert_preprocessor",
24
- "class_name": "BertPreprocessor",
25
  "config": {
26
  "name": "bert_preprocessor_2",
27
  "trainable": true,
28
- "dtype": "float32",
 
 
 
 
 
 
 
29
  "tokenizer": {
30
- "module": "keras_nlp.src.models.bert.bert_tokenizer",
31
  "class_name": "BertTokenizer",
32
  "config": {
33
  "name": "bert_tokenizer",
34
  "trainable": true,
35
- "dtype": "int32",
 
 
 
 
 
 
 
 
36
  "vocabulary": null,
37
  "sequence_length": null,
38
  "lowercase": true,
39
  "strip_accents": false,
40
  "split": true,
41
  "suffix_indicator": "##",
42
- "oov_token": "[UNK]"
 
 
43
  },
44
- "registered_name": "keras_nlp>BertTokenizer"
45
  },
 
46
  "sequence_length": 512,
47
  "truncate": "round_robin"
48
  },
49
- "registered_name": "keras_nlp>BertPreprocessor"
50
  },
51
  "name": "bert_classifier_2",
52
  "num_classes": 2,
53
  "activation": "linear",
54
  "dropout": 0.1
55
  },
56
- "registered_name": "keras_nlp>BertClassifier"
57
  }
 
1
  {
2
+ "module": "keras_hub.src.models.bert.bert_text_classifier",
3
+ "class_name": "BertTextClassifier",
4
  "config": {
5
  "backbone": {
6
+ "module": "keras_hub.src.models.bert.bert_backbone",
7
  "class_name": "BertBackbone",
8
  "config": {
9
  "name": "bert_backbone",
 
17
  "max_sequence_length": 512,
18
  "num_segments": 2
19
  },
20
+ "registered_name": "keras_hub>BertBackbone"
21
  },
22
  "preprocessor": {
23
+ "module": "keras_hub.src.models.bert.bert_text_classifier_preprocessor",
24
+ "class_name": "BertTextClassifierPreprocessor",
25
  "config": {
26
  "name": "bert_preprocessor_2",
27
  "trainable": true,
28
+ "dtype": {
29
+ "module": "keras",
30
+ "class_name": "DTypePolicy",
31
+ "config": {
32
+ "name": "float32"
33
+ },
34
+ "registered_name": null
35
+ },
36
  "tokenizer": {
37
+ "module": "keras_hub.src.models.bert.bert_tokenizer",
38
  "class_name": "BertTokenizer",
39
  "config": {
40
  "name": "bert_tokenizer",
41
  "trainable": true,
42
+ "dtype": {
43
+ "module": "keras",
44
+ "class_name": "DTypePolicy",
45
+ "config": {
46
+ "name": "int32"
47
+ },
48
+ "registered_name": null
49
+ },
50
+ "config_file": "tokenizer.json",
51
  "vocabulary": null,
52
  "sequence_length": null,
53
  "lowercase": true,
54
  "strip_accents": false,
55
  "split": true,
56
  "suffix_indicator": "##",
57
+ "oov_token": "[UNK]",
58
+ "special_tokens": null,
59
+ "special_tokens_in_strings": false
60
  },
61
+ "registered_name": "keras_hub>BertTokenizer"
62
  },
63
+ "config_file": "preprocessor.json",
64
  "sequence_length": 512,
65
  "truncate": "round_robin"
66
  },
67
+ "registered_name": "keras_hub>BertTextClassifierPreprocessor"
68
  },
69
  "name": "bert_classifier_2",
70
  "num_classes": 2,
71
  "activation": "linear",
72
  "dropout": 0.1
73
  },
74
+ "registered_name": "keras_hub>BertTextClassifier"
75
  }
tokenizer.json CHANGED
@@ -1,17 +1,27 @@
1
  {
2
- "module": "keras_nlp.src.models.bert.bert_tokenizer",
3
  "class_name": "BertTokenizer",
4
  "config": {
5
  "name": "bert_tokenizer",
6
  "trainable": true,
7
- "dtype": "int32",
 
 
 
 
 
 
 
 
8
  "vocabulary": null,
9
  "sequence_length": null,
10
  "lowercase": true,
11
  "strip_accents": false,
12
  "split": true,
13
  "suffix_indicator": "##",
14
- "oov_token": "[UNK]"
 
 
15
  },
16
- "registered_name": "keras_nlp>BertTokenizer"
17
  }
 
1
  {
2
+ "module": "keras_hub.src.models.bert.bert_tokenizer",
3
  "class_name": "BertTokenizer",
4
  "config": {
5
  "name": "bert_tokenizer",
6
  "trainable": true,
7
+ "dtype": {
8
+ "module": "keras",
9
+ "class_name": "DTypePolicy",
10
+ "config": {
11
+ "name": "int32"
12
+ },
13
+ "registered_name": null
14
+ },
15
+ "config_file": "tokenizer.json",
16
  "vocabulary": null,
17
  "sequence_length": null,
18
  "lowercase": true,
19
  "strip_accents": false,
20
  "split": true,
21
  "suffix_indicator": "##",
22
+ "oov_token": "[UNK]",
23
+ "special_tokens": null,
24
+ "special_tokens_in_strings": false
25
  },
26
+ "registered_name": "keras_hub>BertTokenizer"
27
  }