vikp committed on
Commit
db657d7
·
verified ·
1 Parent(s): 6aaffb1

Model save

Browse files
Files changed (4) hide show
  1. README.md +53 -2
  2. config.json +4 -4
  3. model.safetensors +2 -2
  4. training_args.bin +3 -0
README.md CHANGED
@@ -1,5 +1,56 @@
1
  ---
2
- license: cc-by-nc-sa-4.0
 
 
 
 
 
3
  ---
4
 
5
- Specialized math model for [surya](https://github.com/VikParuchuri/surya).
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ base_model: vikp/line_detector_clean
3
+ tags:
4
+ - generated_from_trainer
5
+ model-index:
6
+ - name: line_detector_math
7
+ results: []
8
  ---
9
 
10
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
11
+ should probably proofread and complete it, then remove this comment. -->
12
+
13
+ # line_detector_math
14
+
15
+ This model is a fine-tuned version of [vikp/line_detector_clean](https://huggingface.co/vikp/line_detector_clean) on an unknown dataset.
16
+
17
+ ## Model description
18
+
19
+ More information needed
20
+
21
+ ## Intended uses & limitations
22
+
23
+ More information needed
24
+
25
+ ## Training and evaluation data
26
+
27
+ More information needed
28
+
29
+ ## Training procedure
30
+
31
+ ### Training hyperparameters
32
+
33
+ The following hyperparameters were used during training:
34
+ - learning_rate: 6e-05
35
+ - train_batch_size: 8
36
+ - eval_batch_size: 8
37
+ - seed: 42
38
+ - distributed_type: multi-GPU
39
+ - gradient_accumulation_steps: 8
40
+ - total_train_batch_size: 64
41
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
+ - lr_scheduler_type: cosine
43
+ - lr_scheduler_warmup_ratio: 0.1
44
+ - num_epochs: 8
45
+ - mixed_precision_training: Native AMP
46
+
47
+ ### Training results
48
+
49
+
50
+
51
+ ### Framework versions
52
+
53
+ - Transformers 4.36.2
54
+ - PyTorch 2.2.0+cu121
55
+ - Datasets 2.16.1
56
+ - Tokenizers 0.15.0
config.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "_name_or_path": "line_detector_math/checkpoint-4000",
3
  "architectures": [
4
  "SegformerForRegressionMask"
5
  ],
6
  "attention_probs_dropout_prob": 0.0,
7
  "classifier_dropout_prob": 0.1,
8
- "decoder_hidden_size": 768,
9
- "decoder_layer_hidden_size": 192,
10
  "decoder_upsample_rate": 2,
11
  "depths": [
12
  3,
@@ -76,5 +76,5 @@
76
  2
77
  ],
78
  "torch_dtype": "float32",
79
- "transformers_version": "4.36.0"
80
  }
 
1
  {
2
+ "_name_or_path": "vikp/line_detector_clean",
3
  "architectures": [
4
  "SegformerForRegressionMask"
5
  ],
6
  "attention_probs_dropout_prob": 0.0,
7
  "classifier_dropout_prob": 0.1,
8
+ "decoder_hidden_size": 512,
9
+ "decoder_layer_hidden_size": 128,
10
  "decoder_upsample_rate": 2,
11
  "depths": [
12
  3,
 
76
  2
77
  ],
78
  "torch_dtype": "float32",
79
+ "transformers_version": "4.36.2"
80
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5db3424351c0ea83b0707baea44a87125e010924df0a8050b8f6872b2721ae8a
3
- size 119881240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fd328b31e077aaa33f293d7b53ea3dec682ed143b4a754b93f44a9cd37ffee0
3
+ size 118301152
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:065444b2c0a4b8e4f7aec04feea41bbe8267e80d2931844d095c76a8726f3937
3
+ size 4728