Diff of /resources/bioner.yml [000000] .. [ca4dac]

Switch to side-by-side view

--- a
+++ b/resources/bioner.yml
@@ -0,0 +1,36 @@
+#@meta {desc: 'configure the SciSpacy BioNLP parser', date: '2024-04-06'}
+#@meta {doc: 'A spaCy NER model trained on the BIONLP13CG corpus.'}
+#@meta {url: 'https://allenai.github.io/scispacy/'}
+
+
+## Natural language
+#
+# use the biomedical NER
+mednlp_biomed_doc_parser:
+  model_name: en_ner_bionlp13cg_md
+
+# configure the model for download
+medcat_resource:
+  auto_install_models:
+    - ${mednlp_biomed_doc_parser:model_name}
+
+
+## Vectorization
+#
+medent_spacy_feature_vectorizer:
+  class_name: zensols.deepnlp.vectorize.spacy.SpacyFeatureVectorizer
+  feature_id: medent
+  description: medical named entity recognition
+  torch_config: 'instance: gpu_torch_config'
+  model: >-
+    call({'param': {'attribute': 'model'}}): mednlp_biomed_doc_parser
+  symbols: ner
+
+# uncomment to add the vectorizer to the default configuration in `vectorizer.conf`
+# language_vectorizer_manager:
+#   configured_spacy_vectorizers: >-
+#     instance: tuple:
+#       ner_spacy_feature_vectorizer,
+#       dep_spacy_feature_vectorizer,
+#       pos_spacy_feature_vectorizer,
+#       medent_spacy_feature_vectorizer