about | summary | refs | log | tree | commit | diff | homepage
path: root/src/sec_certs/model
diff options
context:
space:
mode:
author adamjanovsky 2023-11-23 09:23:11 +0100
committer adamjanovsky 2023-11-23 09:23:11 +0100
commit 14df232736e43dde9de47d3bbe506bdaae6fa53d (patch)
tree 3695d40bbd69a372e0f5b6d1ab441829bc0d5eb5 /src/sec_certs/model
parent 68b1c2d504657069a7b698b4a28112fde3789890 (diff)
download sec-certs-14df232736e43dde9de47d3bbe506bdaae6fa53d.tar.gz
sec-certs-14df232736e43dde9de47d3bbe506bdaae6fa53d.tar.zst
sec-certs-14df232736e43dde9de47d3bbe506bdaae6fa53d.zip
hardcode optimal hyperparams for embeddings
Diffstat (limited to 'src/sec_certs/model')
-rw-r--r-- src/sec_certs/model/references_nlp/feature_extraction.py 8
1 file changed, 4 insertions, 4 deletions
diff --git a/src/sec_certs/model/references_nlp/feature_extraction.py b/src/sec_certs/model/references_nlp/feature_extraction.py
index eed90959..c875cfab 100644
--- a/src/sec_certs/model/references_nlp/feature_extraction.py
+++ b/src/sec_certs/model/references_nlp/feature_extraction.py
@@ -155,11 +155,11 @@ def _build_transformer_embeddings(
segments,
prec_recall_metric,
mode=mode,
- n_iterations=34,
- n_epochs=1,
- learning_rate=0.01,
+ n_iterations=8,
+ n_epochs=2,
+ learning_rate=1.23e-5,
batch_size=16,
- segmenter_metric="f1",
+ segmenter_metric="balanced_accuracy",
ensemble_soft_voting_power=2,
show_progress_bar=False,
)