Source code for construe.gliner

"""
GLiNER named entity discovery benchmark runner
"""

from .exceptions import DatasetsError
from .models import load_gliner, cleanup_gliner
from .benchmark import Benchmark, limit_generator
from .datasets import load_essays, cleanup_essays, DATASETS


[docs] class GLiNER(Benchmark):
[docs] @staticmethod def total(**kwargs): # Return the number of essays from the manifest use_sample = kwargs.pop("use_sample", True) name = "essays-sample" if use_sample else "essays" if name not in DATASETS: raise DatasetsError("essays dataset not found in manifest") return DATASETS[name]["instances"]
@property def description(self): return ( "applies the GLiNER model to identify and classify " "named entities in long-form essays" )
[docs] def before(self): model, processor = load_gliner(model_home=self.model_home) self.model = model self.processor = processor
[docs] def after(self, cleanup=True): if cleanup: cleanup_gliner(model_home=self.model_home) cleanup_essays(data_home=self.data_home, sample=self.use_sample)
[docs] def instances(self, limit=None): dataset = load_essays(data_home=self.data_home, sample=self.use_sample) return limit_generator(dataset, limit)
[docs] def preprocess(self, instance): raise NotImplementedError("GLiNER preprocess not implemented")
[docs] def inference(self, instance): raise NotImplementedError("GLiNER inference not implemented")