Commit 038b51a

updated readme

1 parent 8191412 commit 038b51a

File tree

6 files changed: +48 -16 lines

README.md

Lines changed: 18 additions & 0 deletions

@@ -45,3 +45,21 @@ The model is built on top of DistilBERT and has been adapted for question answer
 3. Answer Type: Linear layer to classify the type of answer
 
 The model takes a question-answer pair as input, processes it through DistilBERT, and then uses these three linear layers to make predictions.
+
+## Hyperparameters
+
+Best performing configuration:
+- Learning rate: 0.00003882259533696199
+- Number of epochs: 2
+- Number of workers: 4
+- Random seed: 42
+- Weight decay: 0
+
+## Model Performance
+
+Final metrics achieved:
+- Precision: 0.6131
+- Recall: 0.4786
+- F1: 0.5376
+
+For detailed training logs and complete output, refer to the output.log and output1.log files generated during training.
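The README describes DistilBERT with three linear heads; given the numbered list, the first two presumably predict answer start and end positions, with the third classifying the answer type. A minimal sketch of that architecture follows — the class and attribute names are hypothetical illustrations, not the repository's actual model code:

```python
# Hypothetical sketch of the model the README describes: DistilBERT plus
# three linear heads. All names here are illustrative, not the repo's own.
import torch.nn as nn
from transformers import DistilBertModel

class DistilBertQA(nn.Module):
    def __init__(self, num_answer_types: int = 3):
        super().__init__()
        self.encoder = DistilBertModel.from_pretrained("distilbert-base-uncased")
        hidden = self.encoder.config.dim           # 768 for distilbert-base
        self.start_head = nn.Linear(hidden, 1)     # 1. answer start position
        self.end_head = nn.Linear(hidden, 1)       # 2. answer end position
        self.type_head = nn.Linear(hidden, num_answer_types)  # 3. answer type

    def forward(self, input_ids, attention_mask):
        h = self.encoder(input_ids=input_ids,
                         attention_mask=attention_mask).last_hidden_state
        start_logits = self.start_head(h).squeeze(-1)   # (batch, seq_len)
        end_logits = self.end_head(h).squeeze(-1)       # (batch, seq_len)
        type_logits = self.type_head(h[:, 0])           # classify from first token
        return start_logits, end_logits, type_logits
```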
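Likewise, a hedged sketch of how the best configuration above might be wired into training; everything except the five reported values is an assumption (the actual argument names live in train.py, and the batch size is not reported):

```python
# Illustrative use of the reported hyperparameters; the dataset and all
# names other than the five values themselves are placeholders.
import torch
from torch.utils.data import DataLoader

torch.manual_seed(42)                             # Random seed: 42

model = DistilBertQA()                            # sketch class from above
optimizer = torch.optim.AdamW(
    model.parameters(),
    lr=0.00003882259533696199,                    # Learning rate
    weight_decay=0.0,                             # Weight decay: 0
)

# train_dataset is a placeholder; batch size is not reported in the README.
# loader = DataLoader(train_dataset, num_workers=4, shuffle=True)  # workers: 4
# for epoch in range(2):                          # Number of epochs: 2
#     ...train one epoch over loader...
```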

__pycache__/data.cpython-39.pyc (-22 Bytes; binary file not shown)

__pycache__/loss.cpython-39.pyc (0 Bytes; binary file not shown)

__pycache__/train.cpython-39.pyc (586 Bytes; binary file not shown)

output1.log

Lines changed: 15 additions & 1 deletion (large diff not rendered by default)

train.py

Lines changed: 15 additions & 15 deletions

@@ -283,7 +283,7 @@ def train(args, data, tokenizer, use_wandb=False):
         criterion=criterion,
         tokenizer=tokenizer,
         device=device,
-        max_answer_length=30
+        max_answer_length=100000000000
     )

     # Print detailed metrics
@@ -299,21 +299,21 @@ def train(args, data, tokenizer, use_wandb=False):
     print(f"Recall: {eval_metrics['recall']:.4f}")
     print(f"F1: {eval_metrics['f1']:.4f}")

-    # print("\nDetailed Token Statistics:")
-    # print(f"True Positives: {eval_metrics['true_positives']}")
-    # print(f"False Positives: {eval_metrics['false_positives']}")
-    # print(f"False Negatives: {eval_metrics['false_negatives']}")
+    print("\nDetailed Token Statistics:")
+    print(f"True Positives: {eval_metrics['true_positives']}")
+    print(f"False Positives: {eval_metrics['false_positives']}")
+    print(f"False Negatives: {eval_metrics['false_negatives']}")

-    # print("\nOverprediction Analysis:")
-    # print(f"Total Questions: {eval_metrics['total_questions']}")
-    # print(f"Overprediction Cases: {eval_metrics['overprediction_cases']}")
-    # if eval_metrics['overprediction_cases'] > 0:
-    #     overpred_percentage = (eval_metrics['overprediction_cases'] / eval_metrics['total_questions']) * 100
-    #     print(f"Overprediction Percentage: {overpred_percentage:.1f}%")
-    #     print(f"Average Predicted Length: {eval_metrics['avg_overprediction_length']:.1f} tokens")
-    #     print(f"Average True Length: {eval_metrics['avg_true_length']:.1f} tokens")
-    #     avg_extra = eval_metrics['avg_overprediction_length'] - eval_metrics['avg_true_length']
-    #     print(f"Average Extra Tokens: {avg_extra:.1f}")
+    print("\nOverprediction Analysis:")
+    print(f"Total Questions: {eval_metrics['total_questions']}")
+    print(f"Overprediction Cases: {eval_metrics['overprediction_cases']}")
+    if eval_metrics['overprediction_cases'] > 0:
+        overpred_percentage = (eval_metrics['overprediction_cases'] / eval_metrics['total_questions']) * 100
+        print(f"Overprediction Percentage: {overpred_percentage:.1f}%")
+        print(f"Average Predicted Length: {eval_metrics['avg_overprediction_length']:.1f} tokens")
+        print(f"Average True Length: {eval_metrics['avg_true_length']:.1f} tokens")
+        avg_extra = eval_metrics['avg_overprediction_length'] - eval_metrics['avg_true_length']
+        print(f"Average Extra Tokens: {avg_extra:.1f}")

     if use_wandb:
         wandb.log({