diff --git a/annif/backend/xtransformer.py b/annif/backend/xtransformer.py index a914b082..bc75198e 100644 --- a/annif/backend/xtransformer.py +++ b/annif/backend/xtransformer.py @@ -93,7 +93,7 @@ class XTransformerBackend(mixins.TfidfVectorizerMixin, backend.AnnifBackend): "imbalanced_depth": 100, "max_match_clusters": 32768, "do_fine_tune": True, - "model_shortcut": "bert-base-multilingual-uncased", + "model_shortcut": "distilbert-base-multilingual-uncased", "beam_size": 20, "limit": 100, "post_processor": "sigmoid", diff --git a/tests/test_backend_xtransformer.py b/tests/test_backend_xtransformer.py index 78628f47..2d4b1bc6 100644 --- a/tests/test_backend_xtransformer.py +++ b/tests/test_backend_xtransformer.py @@ -41,8 +41,8 @@ def test_xtransformer_default_params(project): "imbalanced_depth": 100, "max_match_clusters": 32768, "do_fine_tune": True, - # 'model_shortcut': 'distilbert-base-multilingual-cased', - "model_shortcut": "bert-base-multilingual-uncased", + 'model_shortcut': 'distilbert-base-multilingual-uncased', + # "model_shortcut": "bert-base-multilingual-uncased", "beam_size": 20, "limit": 100, "post_processor": "sigmoid", @@ -144,8 +144,8 @@ def test_xtransformer_train(datadir, document_corpus, project, mocked_xtransform "max_leaf_size": 100, "imbalanced_ratio": 0.0, "imbalanced_depth": 100, - "model_shortcut": "bert-base-multilingual-uncased", - # 'model_shortcut': 'distilbert-base-multilingual-cased', + # "model_shortcut": "bert-base-multilingual-uncased", + 'model_shortcut': 'distilbert-base-multilingual-uncased', "post_processor": "sigmoid", "negative_sampling": "tfn", "ensemble_method": "transformer-only",