Model save

Browse files

Files changed (7) hide show

README.md +16 -17
eval_results.json +5 -5
logs/events.out.tfevents.1722463228.nathan.173807.0 +3 -0
logs/events.out.tfevents.1722465205.nathan.173807.1 +3 -0
model.safetensors +1 -1
run_config.json +4 -3
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [docketanalyzer/docket-lm-xs](https://huggingface.co/docketanalyzer/docket-lm-xs) on an unspecified dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.0064
-- F1: 0.9987
 ## Model description
@@ -38,32 +38,31 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 5e-05
-- train_batch_size: 8
 - eval_batch_size: 16
 - seed: 42
-- gradient_accumulation_steps: 2
-- total_train_batch_size: 16
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_ratio: 0.02
 - num_epochs: 1
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | F1     |
 |:-------------:|:-----:|:----:|:---------------:|:------:|
-| 0.016         | 0.08  | 380  | 0.0157          | 0.9965 |
-| 0.0006        | 0.16  | 760  | 0.0150          | 0.9975 |
-| 0.0007        | 0.24  | 1140 | 0.0136          | 0.9977 |
-| 0.0003        | 0.32  | 1520 | 0.0128          | 0.9982 |
-| 0.0005        | 0.4   | 1900 | 0.0110          | 0.9985 |
-| 0.0004        | 0.48  | 2280 | 0.0053          | 0.9987 |
-| 0.0004        | 0.56  | 2660 | 0.0035          | 0.9995 |
-| 0.0003        | 0.64  | 3040 | 0.0049          | 0.9987 |
-| 0.0004        | 0.72  | 3420 | 0.0080          | 0.9985 |
-| 0.0577        | 0.8   | 3800 | 0.0081          | 0.9982 |
-| 0.0002        | 0.88  | 4180 | 0.0077          | 0.9987 |
-| 0.0002        | 0.96  | 4560 | 0.0063          | 0.9987 |
 ### Framework versions

 This model is a fine-tuned version of [docketanalyzer/docket-lm-xs](https://huggingface.co/docketanalyzer/docket-lm-xs) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.0015
+- F1: 0.9995
 ## Model description
 The following hyperparameters were used during training:
 - learning_rate: 5e-05
+- train_batch_size: 16
 - eval_batch_size: 16
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_ratio: 0.02
 - num_epochs: 1
+- mixed_precision_training: Native AMP
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | F1     |
 |:-------------:|:-----:|:----:|:---------------:|:------:|
+| 0.0013        | 0.08  | 380  | 0.0054          | 0.9983 |
+| 0.0007        | 0.16  | 760  | 0.0139          | 0.9976 |
+| 0.0003        | 0.24  | 1140 | 0.0061          | 0.9985 |
+| 0.0002        | 0.32  | 1520 | 0.0109          | 0.9981 |
+| 0.0005        | 0.4   | 1900 | 0.0093          | 0.9985 |
+| 0.0002        | 0.48  | 2280 | 0.0080          | 0.9988 |
+| 0.0004        | 0.56  | 2660 | 0.0099          | 0.9978 |
+| 0.0004        | 0.64  | 3040 | 0.0024          | 0.9990 |
+| 0.0002        | 0.72  | 3420 | 0.0037          | 0.9988 |
+| 0.0003        | 0.8   | 3800 | 0.0013          | 0.9998 |
+| 0.0003        | 0.88  | 4180 | 0.0034          | 0.9993 |
+| 0.0002        | 0.96  | 4560 | 0.0017          | 0.9993 |
 ### Framework versions

eval_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-    "eval_loss": 0.0064284102991223335,
-    "eval_f1": 0.9987344975955453,
-    "eval_runtime": 40.1494,
-    "eval_samples_per_second": 99.628,
-    "eval_steps_per_second": 6.227,
     "epoch": 1.0
 }

 {
+    "eval_loss": 0.0014596829423680902,
+    "eval_f1": 0.9995131450827653,
+    "eval_runtime": 8.2463,
+    "eval_samples_per_second": 485.069,
+    "eval_steps_per_second": 30.317,
     "epoch": 1.0
 }

logs/events.out.tfevents.1722463228.nathan.173807.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62e8708557de010a167899eb5d5e54a4960bf8ed5e9b084c3dffc66f4c703bf3
+size 510331

logs/events.out.tfevents.1722465205.nathan.173807.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f985d34adea2e9a1d80da94c3239daa4d1945bbf531e2934080619656a049ae5
+size 405

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6f2de238ced3864b54a6be60056b08d535489fec6bf3a5ee54b5e9aaa702d890
 size 283347432

 version https://git-lfs.github.com/spec/v1
+oid sha256:0566ceb185a37aceb7b77f0d65402f1449a3d7df5c6688cfc268627f2c4ab89b
 size 283347432

run_config.json CHANGED Viewed

@@ -5,16 +5,17 @@
     },
     "training_args": {
         "num_train_epochs": 1,
-        "per_device_train_batch_size": 8,
         "per_device_eval_batch_size": 16,
-        "gradient_accumulation_steps": 2,
         "learning_rate": 5e-05,
         "weight_decay": 0.1,
         "warmup_ratio": 0.02,
         "evaluation_strategy": "steps",
         "eval_steps": 0.08,
         "save_steps": 0.08,
-        "save_total_limit": 2
     },
     "run_name": "complaint",
     "run_type": "ClassificationRoutine"

     },
     "training_args": {
         "num_train_epochs": 1,
+        "per_device_train_batch_size": 16,
         "per_device_eval_batch_size": 16,
+        "gradient_accumulation_steps": 1,
         "learning_rate": 5e-05,
         "weight_decay": 0.1,
         "warmup_ratio": 0.02,
         "evaluation_strategy": "steps",
         "eval_steps": 0.08,
         "save_steps": 0.08,
+        "save_total_limit": 2,
+        "fp16": true
     },
     "run_name": "complaint",
     "run_type": "ClassificationRoutine"

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66ef2207833c0afa403c72448d2b06f189c7278d0be4661827287b01ffc17100
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:30d3579d075a2b7dcef799631a3bf63aed51391f5e3e930601890e8d9c6c88eb
 size 5240