From bd6e799262660976fb4e424ec90181e6aca6a582 Mon Sep 17 00:00:00 2001 From: Utaemon Toyota <toyota@cl.uni-heidelberg.de> Date: Tue, 26 Feb 2019 18:34:20 +0100 Subject: [PATCH] add some stopwords --- Senseval_Prep/senseval_preprocessing.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/Senseval_Prep/senseval_preprocessing.py b/Senseval_Prep/senseval_preprocessing.py index 4389e11..c24bf89 100644 --- a/Senseval_Prep/senseval_preprocessing.py +++ b/Senseval_Prep/senseval_preprocessing.py @@ -29,6 +29,9 @@ def get_stopword_list(stop_path): stopli = [] for line in f: stopli.append(line[:-1]) + stopli.append("n't") + stopli.append("'m") + stopli.append("whether") return stopli def get_infos(tree_path): -- GitLab