Spaces:

peterkros
/

COFOG-Bert-AutoClassifier

Sleeping

App Files Files Community

peterkros committed on Dec 13, 2023

Commit

0f6885b

1 Parent(s): b9a616c

Update app.py

Browse files

Files changed (1) hide show

app.py +61 -39

app.py CHANGED Viewed

@@ -27,46 +27,68 @@ markdown_text = """
 - Input one budget line per time.
 - Accuracy of the model is ~88%.
 """
-# HTML formatted table
 html_table = """
-<table>
-  <tr>
-    <th>Epoch</th>
-    <th>Training Loss</th>
-    <th>Validation Loss</th>
-    <th>Accuracy</th>
-  </tr>
-  <tr>
-    <td>1</td>
-    <td>No log</td>
-    <td>2.095209</td>
-    <td>0.340764</td>
-  </tr>
-  <tr>
-    <td>2</td>
-    <td>No log</td>
-    <td>1.419945</td>
-    <td>0.662420</td>
-  </tr>
-  <tr>
-    <td>3</td>
-    <td>No log</td>
-    <td>0.683810</td>
-    <td>0.850318</td>
-  </tr>
-  <tr>
-    <td>4</td>
-    <td>No log</td>
-    <td>0.460408</td>
-    <td>0.872611</td>
-  </tr>
-  <tr>
-    <td>5</td>
-    <td>No log</td>
-    <td>0.422096</td>
-    <td>0.888535</td>
-  </tr>
-</table>
 """
 iface = gr.Interface(

 - Input one budget line per time.
 - Accuracy of the model is ~88%.
 """
 html_table = """
+<div>
+  <h2 style="text-align: center;">COFOG Budget Classification</h2>
+  <p style='text-align: justify'>
+    This classifier was developed utilizing the pre-trained BERT
+    (Bidirectional Encoder Representations from Transformers) model
+    with an uncased configuration, together with a manually labeled
+    dataset of over 1500 budget line items extracted from
+    various budgetary documents. To balance the data, additional data
+    was generated using GPT-4 where categories were not available
+    in budget documents. The model training was executed
+    on a Google Colab environment, specifically utilizing a Tesla T4 GPU.
+    Detailed metrics of the training process are as follows:
+    <code>TrainOutput(global_step=395, training_loss=1.1497593360611156,
+    metrics={'train_runtime': 650.0119, 'train_samples_per_second':
+      9.638, 'train_steps_per_second': 0.608, 'total_flos': 1648509163714560.0,
+      'train_loss': 1.1497593360611156, 'epoch': 5.0})</code>. The model
+    is designed to predict the primary classification level
+    of the Classification of the Functions of Government (COFOG),
+    with the predictions from the first level serving as contextual
+    input for subsequent second-level classification. The project
+    is conducted with an exclusive focus on academic and research
+    objectives.
+  </p>
+  <table style="margin-left: auto; margin-right: auto;">
+    <tr>
+      <th>Epoch</th>
+      <th>Training Loss</th>
+      <th>Validation Loss</th>
+      <th>Accuracy</th>
+    </tr>
+    <tr>
+      <td>1</td>
+      <td>No log</td>
+      <td>2.095209</td>
+      <td>0.340764</td>
+    </tr>
+    <tr>
+      <td>2</td>
+      <td>No log</td>
+      <td>1.419945</td>
+      <td>0.662420</td>
+    </tr>
+    <tr>
+      <td>3</td>
+      <td>No log</td>
+      <td>0.683810</td>
+      <td>0.850318</td>
+    </tr>
+    <tr>
+      <td>4</td>
+      <td>No log</td>
+      <td>0.460408</td>
+      <td>0.872611</td>
+    </tr>
+    <tr>
+      <td>5</td>
+      <td>No log</td>
+      <td>0.422096</td>
+      <td>0.888535</td>
+    </tr>
+  </table>
+</div>
 """
 iface = gr.Interface(