eskayML
/

interview_electra

@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [mrm8488/electra-small-finetuned-squadv2](https://huggingface.co/mrm8488/electra-small-finetuned-squadv2) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.4590
-- Accuracy: 0.6164
 ## Model description
@@ -42,7 +42,7 @@ The following hyperparameters were used during training:
 - train_batch_size: 2
 - eval_batch_size: 2
 - seed: 42
-- optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: linear
 - num_epochs: 10
@@ -50,16 +50,16 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
-| 2.782         | 1.0   | 579  | 2.6037          | 0.1983   |
-| 2.5903        | 2.0   | 1158 | 2.4794          | 0.1983   |
-| 2.5114        | 3.0   | 1737 | 2.3349          | 0.2586   |
-| 2.3676        | 4.0   | 2316 | 2.1538          | 0.4569   |
-| 2.2466        | 5.0   | 2895 | 1.9574          | 0.4526   |
-| 2.0461        | 6.0   | 3474 | 1.7796          | 0.5690   |
-| 1.7791        | 7.0   | 4053 | 1.6913          | 0.5776   |
-| 1.7205        | 8.0   | 4632 | 1.5485          | 0.5733   |
-| 1.59          | 9.0   | 5211 | 1.4805          | 0.6121   |
-| 1.5614        | 10.0  | 5790 | 1.4590          | 0.6164   |
 ### Framework versions

 This model is a fine-tuned version of [mrm8488/electra-small-finetuned-squadv2](https://huggingface.co/mrm8488/electra-small-finetuned-squadv2) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 2.2729
+- Accuracy: 0.1111
 ## Model description
 - train_batch_size: 2
 - eval_batch_size: 2
 - seed: 42
+- optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: linear
 - num_epochs: 10
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
+| No log        | 1.0   | 54   | 2.2936          | 0.0370   |
+| No log        | 2.0   | 108  | 2.2872          | 0.1111   |
+| No log        | 3.0   | 162  | 2.2796          | 0.0741   |
+| No log        | 4.0   | 216  | 2.2798          | 0.0741   |
+| No log        | 5.0   | 270  | 2.2775          | 0.0741   |
+| No log        | 6.0   | 324  | 2.2780          | 0.1111   |
+| No log        | 7.0   | 378  | 2.2801          | 0.0370   |
+| No log        | 8.0   | 432  | 2.2741          | 0.1111   |
+| No log        | 9.0   | 486  | 2.2733          | 0.0370   |
+| 2.2069        | 10.0  | 540  | 2.2729          | 0.1111   |
 ### Framework versions

config.json CHANGED Viewed

@@ -10,50 +10,30 @@
   "hidden_dropout_prob": 0.1,
   "hidden_size": 256,
   "id2label": {
-    "0": 0,
-    "1": 1,
-    "2": 2,
-    "3": 3,
-    "4": 4,
-    "5": 5,
-    "6": 6,
-    "7": 7,
-    "8": 8,
-    "9": 9,
-    "10": 10,
-    "11": 11,
-    "12": 12,
-    "13": 13,
-    "14": 14,
-    "15": 15,
-    "16": 16,
-    "17": 17,
-    "18": 18,
-    "19": 19
   },
   "initializer_range": 0.02,
   "intermediate_size": 1024,
   "label2id": {
-    "0": 0,
-    "1": 1,
-    "2": 2,
-    "3": 3,
-    "4": 4,
-    "5": 5,
-    "6": 6,
-    "7": 7,
-    "8": 8,
-    "9": 9,
-    "10": 10,
-    "11": 11,
-    "12": 12,
-    "13": 13,
-    "14": 14,
-    "15": 15,
-    "16": 16,
-    "17": 17,
-    "18": 18,
-    "19": 19
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,

   "hidden_dropout_prob": 0.1,
   "hidden_size": 256,
   "id2label": {
+    "0": "Provider Characteristics",
+    "1": "Financial Impact",
+    "2": "Imaging modalities in general",
+    "3": "Clinical utility & efficiency-Provider perspective",
+    "4": "Health System Characteristics",
+    "5": "Training",
+    "6": "Value equation",
+    "7": "Workflow related problems",
+    "8": "Credentialing / Quality Assurance Infrastructure",
+    "9": "Patient/Physician interaction in LUS"
   },
   "initializer_range": 0.02,
   "intermediate_size": 1024,
   "label2id": {
+    "Clinical utility & efficiency-Provider perspective": 3,
+    "Credentialing / Quality Assurance Infrastructure": 8,
+    "Financial Impact": 1,
+    "Health System Characteristics": 4,
+    "Imaging modalities in general": 2,
+    "Patient/Physician interaction in LUS": 9,
+    "Provider Characteristics": 0,
+    "Training": 5,
+    "Value equation": 6,
+    "Workflow related problems": 7
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5678dd28a6ad932eda4117ba2efc7a01bb83e3a55364844c3a361908bb1a5748
-size 54239712

 version https://git-lfs.github.com/spec/v1
+oid sha256:e39f45a0be0b095f4c30756e3d98ef4c1f7ceb03f2f6f0652863ceb8ac226767
+size 54229432

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:696c8c84281637804e271799054d0fb3f501144c057011eeb79843e891e858f0
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:1f90cb18423480090e5952f92b4845315772b669a221438661b8ddad1ce0062b
 size 5304