dosai committed on
Commit
d67f0cc
1 Parent(s): 7a4f1a1

Training in progress epoch 0

Browse files
Files changed (4) hide show
  1. README.md +5 -13
  2. config.json +3 -2
  3. tf_model.h5 +1 -1
  4. tokenizer.json +16 -2
README.md CHANGED
@@ -1,5 +1,4 @@
1
  ---
2
- license: apache-2.0
3
  tags:
4
  - generated_from_keras_callback
5
  model-index:
@@ -12,10 +11,10 @@ probably proofread and complete it, then remove this comment. -->
12
 
13
  # dosai/bert-sudb
14
 
15
- This model is a fine-tuned version of [bert-base-multilingual-uncased](https://huggingface.co/bert-base-multilingual-uncased) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
- - Train Loss: 5.9514
18
- - Epoch: 7
19
 
20
  ## Model description
21
 
@@ -41,19 +40,12 @@ The following hyperparameters were used during training:
41
 
42
  | Train Loss | Epoch |
43
  |:----------:|:-----:|
44
- | 5.9578 | 0 |
45
- | 5.9547 | 1 |
46
- | 5.9542 | 2 |
47
- | 5.9526 | 3 |
48
- | 5.9522 | 4 |
49
- | 5.9520 | 5 |
50
- | 5.9515 | 6 |
51
- | 5.9514 | 7 |
52
 
53
 
54
  ### Framework versions
55
 
56
- - Transformers 4.29.2
57
  - TensorFlow 2.12.0
58
  - Datasets 2.12.0
59
  - Tokenizers 0.13.3
 
1
  ---
 
2
  tags:
3
  - generated_from_keras_callback
4
  model-index:
 
11
 
12
  # dosai/bert-sudb
13
 
14
+ This model is a fine-tuned version of [alon-albalak/bert-base-multilingual-xquad](https://huggingface.co/alon-albalak/bert-base-multilingual-xquad) on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Train Loss: 5.9549
17
+ - Epoch: 0
18
 
19
  ## Model description
20
 
 
40
 
41
  | Train Loss | Epoch |
42
  |:----------:|:-----:|
43
+ | 5.9549 | 0 |
 
 
 
 
 
 
 
44
 
45
 
46
  ### Framework versions
47
 
48
+ - Transformers 4.30.0
49
  - TensorFlow 2.12.0
50
  - Datasets 2.12.0
51
  - Tokenizers 0.13.3
config.json CHANGED
@@ -1,11 +1,12 @@
1
  {
2
- "_name_or_path": "bert-base-multilingual-uncased",
3
  "architectures": [
4
  "BertForQuestionAnswering"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
  "directionality": "bidi",
 
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
@@ -23,7 +24,7 @@
23
  "pooler_size_per_head": 128,
24
  "pooler_type": "first_token_transform",
25
  "position_embedding_type": "absolute",
26
- "transformers_version": "4.29.2",
27
  "type_vocab_size": 2,
28
  "use_cache": true,
29
  "vocab_size": 105879
 
1
  {
2
+ "_name_or_path": "alon-albalak/bert-base-multilingual-xquad",
3
  "architectures": [
4
  "BertForQuestionAnswering"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
  "directionality": "bidi",
9
+ "gradient_checkpointing": false,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
 
24
  "pooler_size_per_head": 128,
25
  "pooler_type": "first_token_transform",
26
  "position_embedding_type": "absolute",
27
+ "transformers_version": "4.30.0",
28
  "type_vocab_size": 2,
29
  "use_cache": true,
30
  "vocab_size": 105879
tf_model.h5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aff3729e311f72630613f3df49b436b1972a4cd394fd5ea04592958edd5384b0
3
  size 667338704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1512574c243da9578d9b7586146c7ceb1249726a201a0b51b10b60bbe101fed
3
  size 667338704
tokenizer.json CHANGED
@@ -1,7 +1,21 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 384,
6
+ "strategy": "OnlySecond",
7
+ "stride": 128
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 384
12
+ },
13
+ "direction": "Right",
14
+ "pad_to_multiple_of": null,
15
+ "pad_id": 0,
16
+ "pad_type_id": 0,
17
+ "pad_token": "[PAD]"
18
+ },
19
  "added_tokens": [
20
  {
21
  "id": 0,