|
a |
|
b/resources/bioner.yml |
|
|
1 |
#@meta {desc: 'configure the SciSpacy BioNLP parser', date: '2024-04-06'} |
|
|
2 |
#@meta {doc: 'A spaCy NER model trained on the BIONLP13CG corpus.'} |
|
|
3 |
#@meta {url: 'https://allenai.github.io/scispacy/'} |
|
|
4 |
|
|
|
5 |
|
|
|
6 |
## Natural language |
|
|
7 |
# |
|
|
8 |
# use the scispaCy biomedical NER model |
|
|
9 |
mednlp_biomed_doc_parser: |
|
|
10 |
model_name: en_ner_bionlp13cg_md |
|
|
11 |
|
|
|
12 |
# register the model so it is downloaded and installed automatically |
|
|
13 |
medcat_resource: |
|
|
14 |
auto_install_models: |
|
|
15 |
- ${mednlp_biomed_doc_parser:model_name} |
|
|
16 |
|
|
|
17 |
|
|
|
18 |
## Vectorization |
|
|
19 |
# |
|
|
20 |
medent_spacy_feature_vectorizer: |
|
|
21 |
class_name: zensols.deepnlp.vectorize.spacy.SpacyFeatureVectorizer |
|
|
22 |
feature_id: medent |
|
|
23 |
description: medical named entity recognition |
|
|
24 |
torch_config: 'instance: gpu_torch_config' |
|
|
25 |
model: >- |
|
|
26 |
call({'param': {'attribute': 'model'}}): mednlp_biomed_doc_parser |
|
|
27 |
symbols: ner |
|
|
28 |
|
|
|
29 |
# uncomment to add `medent_spacy_feature_vectorizer` to the default vectorizers configured in `vectorizer.conf` |
|
|
30 |
# language_vectorizer_manager: |
|
|
31 |
# configured_spacy_vectorizers: >- |
|
|
32 |
# instance: tuple: |
|
|
33 |
# ner_spacy_feature_vectorizer, |
|
|
34 |
# dep_spacy_feature_vectorizer, |
|
|
35 |
# pos_spacy_feature_vectorizer, |
|
|
36 |
# medent_spacy_feature_vectorizer |