Skip to content
Snippets Groups Projects
Commit 9f712c09 authored by Thomas Wolf's avatar Thomas Wolf
Browse files

Merge remote-tracking branch 'origin/master'

parents 8774a58f 8c7c8819
No related branches found
No related tags found
No related merge requests found
......@@ -108,5 +108,5 @@ def read_NEC_metrics(directory):
print(f"Model: {model}, Dataset: {dataset}, Accuracy: {avg_accuracy:.2f}%")
#run_NEC_tests_all()
# run_NEC_tests_all()
read_NEC_metrics("results")
......@@ -15,7 +15,7 @@ def plot_loss_curve(logfile, title):
eval_losses.append(float(match.group(1)))
plt.figure(figsize=(10,5))
plt.plot(eval_losses)
plt.plot(eval_losses, label="Eval Loss")
plt.xlabel("Epoch")
plt.ylabel("Eval Loss")
......@@ -23,7 +23,7 @@ def plot_loss_curve(logfile, title):
plt.legend()
plt.grid(True)
plt.savefig(f"eval_loss_{os.path.basename(logfile)}.pdf")
plt.savefig(f"eval_loss_{os.path.basename(logfile)}.svg")
plot_loss_curve("logs/finetune_T5_MLM_entity_427082.txt", "T5 Finetuning - MLM Entity Masking")
plot_loss_curve("logs/finetune_T5_MLM_label_427081.txt", "T5 Finetuning - MLM Label Masking")
......
......@@ -7,10 +7,23 @@ from datasets import Dataset, DatasetDict
model_name = "google-t5/t5-base"
print("Loading model: T5 MLM entity")
tokenizer = T5Tokenizer.from_pretrained(model_name)
model = T5ForConditionalGeneration.from_pretrained(model_name)
print("Finished loading model: T5 MLM entity")
def load_base():
    """Load the base `model_name` checkpoint, replacing the module-level
    `model` and `tokenizer` globals used by the rest of this module."""
    global model, tokenizer
    print("Loading model: T5 MLM entity")
    model = T5ForConditionalGeneration.from_pretrained(model_name)
    tokenizer = T5Tokenizer.from_pretrained(model_name)
    print("Finished loading model: T5 MLM entity")
def load_finetuned(input_dir):
    """Load a fine-tuned checkpoint into the module-level globals.

    Parameters
    ----------
    input_dir : str
        Directory previously written by ``save_pretrained`` (contains both
        the tokenizer files and the model weights).
    """
    global model, tokenizer
    print(f"Loading model: T5 MLM entity finetuned ({input_dir})")
    tokenizer = T5Tokenizer.from_pretrained(input_dir)
    model = T5ForConditionalGeneration.from_pretrained(input_dir)
    # Fix: original used an f-string with no placeholders (Ruff F541).
    print("Finished loading model: T5 MLM entity finetuned")
def set_label_dict(label_dict):
global label_representatives
......@@ -113,3 +126,6 @@ def finetune_model(sentences, entities, labels, output_dir, epochs=10):
model.save_pretrained(output_dir)
tokenizer.save_pretrained(output_dir)
load_base()
# load_finetuned("./src/models/t5_mlm_entity_finetuned_model/checkpoints/checkpoint-12200")
......@@ -6,10 +6,23 @@ from datasets import Dataset, DatasetDict
model_name = "google-t5/t5-base"
print("Loading model: T5 MLM label")
tokenizer = T5Tokenizer.from_pretrained(model_name)
model = T5ForConditionalGeneration.from_pretrained(model_name)
print("Finished loading model: T5 MLM label")
def load_base():
    """Load the base `model_name` checkpoint, replacing the module-level
    `model` and `tokenizer` globals used by the rest of this module."""
    global model, tokenizer
    print("Loading model: T5 MLM label")
    model = T5ForConditionalGeneration.from_pretrained(model_name)
    tokenizer = T5Tokenizer.from_pretrained(model_name)
    print("Finished loading model: T5 MLM label")
def load_finetuned(input_dir):
    """Load a fine-tuned checkpoint into the module-level globals.

    Parameters
    ----------
    input_dir : str
        Directory previously written by ``save_pretrained`` (contains both
        the tokenizer files and the model weights).
    """
    global model, tokenizer
    print(f"Loading model: T5 MLM label finetuned ({input_dir})")
    tokenizer = T5Tokenizer.from_pretrained(input_dir)
    model = T5ForConditionalGeneration.from_pretrained(input_dir)
    # Fix: original used an f-string with no placeholders (Ruff F541).
    print("Finished loading model: T5 MLM label finetuned")
def classify_entity(sentence, entity, labels):
sentence_with_masked_hypothesis = f"{sentence} {entity} is a <extra_id_0>."
......@@ -89,3 +102,6 @@ def finetune_model(sentences, entities, labels, output_dir, epochs=10):
model.save_pretrained(output_dir)
tokenizer.save_pretrained(output_dir)
load_base()
# load_finetuned("./src/models/t5_mlm_label_finetuned_model/checkpoints/checkpoint-9638")
......@@ -139,4 +139,4 @@ def finetune_model(premises, hypotheses, entailment, output_dir, epochs=10):
tokenizer.save_pretrained(output_dir)
load_base()
# load_finetuned("./src/models/t5_nli_finetuned_model/pretrained_CoNLL_epoch20")
# load_finetuned("./src/models/t5_nli_finetuned_model/checkpoints/checkpoint-85500")
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment