logasja committed on
Commit
c98ba92
·
verified ·
1 Parent(s): f76f45e

Upload README.md with huggingface_hub

Browse files
Files changed (1) hide show
  1. README.md +78 -9
README.md CHANGED
@@ -1,17 +1,86 @@
1
-
2
  ---
3
  library_name: keras
4
  ---
 
 
 
5
 
6
- This model has been uploaded using the Keras library and can be used with JAX,
7
- TensorFlow, and PyTorch backends.
8
 
9
- This model card has been generated automatically and should be completed by the
10
- model author.
11
- See [Model Cards documentation](https://huggingface.co/docs/hub/model-cards) for
12
- more information.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
 
14
- For more details about the model architecture, check out
15
- [config.json](./config.json).
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
 
 
17
  ![](./assets/summary_plot.png)
 
 
1
  ---
2
  library_name: keras
3
  ---
4
+ <Gallery />
5
+
6
+ Training logs are available [here](https://wandb.ai/spuds/auramask/runs/c7f3f8c1813cc1ea9727ea45501e3ce1).
7
 
8
+ # Model Description
9
+ This model uses a modified V-Net adapted for 2D input/output, implemented [here](https://github.com/logasja/keras3-unets), with the following configuration.
10
 
11
+ ```json
12
+ {
13
+ "activation": "ReLU",
14
+ "batch_norm": false,
15
+ "filter_num": [
16
+ 64,
17
+ 128,
18
+ 256,
19
+ 512,
20
+ 512
21
+ ],
22
+ "n_labels": 3,
23
+ "output_activation": "tanh",
24
+ "pool": false,
25
+ "res_num_ini": 1,
26
+ "res_num_max": 3,
27
+ "unpool": false
28
+ }
29
+ ```
30
 
31
+ ```json
32
+ {
33
+ "alpha": 0.0001,
34
+ "batch": 64,
35
+ "epochs": 500,
36
+ "epsilon": 1,
37
+ "input": "(256, 256)",
38
+ "losses": {
39
+ "FEAT_ArcFace": {
40
+ "d": "cosine_similarity",
41
+ "f": "ArcFace",
42
+ "name": "FEAT_ArcFace",
43
+ "reduction": "sum_over_batch_size",
44
+ "threshold": 0.68,
45
+ "weight": 0.1
46
+ },
47
+ "TopIQ": {
48
+ "full_ref": true,
49
+ "lower_better": false,
50
+ "name": "TopIQ",
51
+ "reduction": "sum_over_batch_size",
52
+ "score_range": "~0, ~1",
53
+ "weight": 0.9
54
+ },
55
+ "mean_squared_error": {
56
+ "name": "mean_squared_error",
57
+ "reduction": "sum_over_batch_size",
58
+ "weight": 0.1
59
+ }
60
+ },
61
+ "mixed_precision": true,
62
+ "optimizer": {
63
+ "amsgrad": false,
64
+ "beta_1": 0.9,
65
+ "beta_2": 0.999,
66
+ "clipnorm": null,
67
+ "clipvalue": null,
68
+ "ema_momentum": 0.99,
69
+ "ema_overwrite_frequency": null,
70
+ "epsilon": 1e-07,
71
+ "global_clipnorm": null,
72
+ "gradient_accumulation_steps": null,
73
+ "learning_rate": 9.999999747378752e-05,
74
+ "loss_scale_factor": null,
75
+ "name": "adamw",
76
+ "use_ema": false,
77
+ "weight_decay": 0.004
78
+ },
79
+ "seed": "BIIIIIGSTRETCH",
80
+ "testing": 0.01,
81
+ "training": 0.99
82
+ }
83
+ ```
84
 
85
+ ## Model Architecture Plot
86
  ![](./assets/summary_plot.png)