From 6bae7a216848055dafd43e45ddbf6b311a99070b Mon Sep 17 00:00:00 2001 From: Henry Dowd Date: Tue, 18 Nov 2025 14:53:32 +0000 Subject: [PATCH] sample notebooks and test files --- .gitignore | 1 + config.yaml | 18 ++++++++++++++++++ notebooks/01_data_exploration.ipynb | 0 notebooks/02_baseline_experiments.ipynb | 0 notebooks/03_semantic_methods.ipynb | 0 notebooks/04_fusion_model.ipynb | 0 notebooks/05_final_evaluation.ipynb | 0 tests/test_lexical_features.py | 0 tests/test_models.py | 0 tests/test_semantic_features.py | 0 10 files changed, 19 insertions(+) create mode 100644 notebooks/01_data_exploration.ipynb create mode 100644 notebooks/02_baseline_experiments.ipynb create mode 100644 notebooks/03_semantic_methods.ipynb create mode 100644 notebooks/04_fusion_model.ipynb create mode 100644 notebooks/05_final_evaluation.ipynb create mode 100644 tests/test_lexical_features.py create mode 100644 tests/test_models.py create mode 100644 tests/test_semantic_features.py diff --git a/.gitignore b/.gitignore index 0e1491f..45b6519 100644 --- a/.gitignore +++ b/.gitignore @@ -1,4 +1,5 @@ venv +.venv .vscode .idea __pycache__ diff --git a/config.yaml b/config.yaml index e69de29..dce57ff 100644 --- a/config.yaml +++ b/config.yaml @@ -0,0 +1,18 @@ +#Basic config, MUST CHANGE +#CHANGE +similarity_thresholds: + jaccard: 99 + semantic: 99 + syntactic: 99 + +semantic_methods: + use_weighted_average: true + use_sif: true + pos_weights: + NOUN: 99 + VERB: 99 + OTHER: 99 + +model: + fusion_classifier: "logistic_regression" + test_size: 0.2 \ No newline at end of file diff --git a/notebooks/01_data_exploration.ipynb b/notebooks/01_data_exploration.ipynb new file mode 100644 index 0000000..e69de29 diff --git a/notebooks/02_baseline_experiments.ipynb b/notebooks/02_baseline_experiments.ipynb new file mode 100644 index 0000000..e69de29 diff --git a/notebooks/03_semantic_methods.ipynb b/notebooks/03_semantic_methods.ipynb new file mode 100644 index 0000000..e69de29 diff --git a/notebooks/04_fusion_model.ipynb b/notebooks/04_fusion_model.ipynb new file mode 100644 index 0000000..e69de29 diff --git a/notebooks/05_final_evaluation.ipynb b/notebooks/05_final_evaluation.ipynb new file mode 100644 index 0000000..e69de29 diff --git a/tests/test_lexical_features.py b/tests/test_lexical_features.py new file mode 100644 index 0000000..e69de29 diff --git a/tests/test_models.py b/tests/test_models.py new file mode 100644 index 0000000..e69de29 diff --git a/tests/test_semantic_features.py b/tests/test_semantic_features.py new file mode 100644 index 0000000..e69de29