aner committed on
Commit
cca1c77
1 Parent(s): a5b3245

Model save

Browse files
Files changed (3) hide show
  1. README.md +49 -0
  2. config.json +3 -3
  3. model.safetensors +2 -2
README.md ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: cc-by-4.0
3
+ base_model: deepset/minilm-uncased-squad2
4
+ tags:
5
+ - generated_from_trainer
6
+ model-index:
7
+ - name: qa_finetuned
8
+ results: []
9
+ ---
10
+
11
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
12
+ should probably proofread and complete it, then remove this comment. -->
13
+
14
+ # qa_finetuned
15
+
16
+ This model is a fine-tuned version of [deepset/minilm-uncased-squad2](https://huggingface.co/deepset/minilm-uncased-squad2) on an unspecified dataset (the Trainer was not given a dataset name).
17
+
18
+ ## Model description
19
+
20
+ More information needed
21
+
22
+ ## Intended uses & limitations
23
+
24
+ More information needed
25
+
26
+ ## Training and evaluation data
27
+
28
+ More information needed
29
+
30
+ ## Training procedure
31
+
32
+ ### Training hyperparameters
33
+
34
+ The following hyperparameters were used during training:
35
+ - learning_rate: 2e-05
36
+ - train_batch_size: 8
37
+ - eval_batch_size: 8
38
+ - seed: 42
39
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
+ - lr_scheduler_type: linear
41
+ - num_epochs: 3
42
+ - mixed_precision_training: Native AMP
43
+
44
+ ### Framework versions
45
+
46
+ - Transformers 4.35.2
47
+ - PyTorch 2.1.0+cu121
48
+ - Datasets 2.16.0
49
+ - Tokenizers 0.15.0
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "bert-base-uncased",
3
  "architectures": [
4
  "BertForQuestionAnswering"
5
  ],
@@ -8,9 +8,9 @@
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
  "initializer_range": 0.02,
13
- "intermediate_size": 3072,
14
  "layer_norm_eps": 1e-12,
15
  "max_position_embeddings": 512,
16
  "model_type": "bert",
 
1
  {
2
+ "_name_or_path": "deepset/minilm-uncased-squad2",
3
  "architectures": [
4
  "BertForQuestionAnswering"
5
  ],
 
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 384,
12
  "initializer_range": 0.02,
13
+ "intermediate_size": 1536,
14
  "layer_norm_eps": 1e-12,
15
  "max_position_embeddings": 512,
16
  "model_type": "bert",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f212bffb8242b06dbae543e3aa6641e35bc2ef7fd5e54f8141cb6d899892853d
3
- size 435596088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:588733eba6f8458a138cefa233691fcbdf6f75882f378087e6cb45cb16f4cf92
3
+ size 132874824