Source code for construe.offensive

"""
Offensive speech benchmark runner
"""

from .exceptions import DatasetsError
from .benchmark import Benchmark, limit_generator
from .models import load_offensive, cleanup_offensive
from .datasets import load_aegis, cleanup_aegis, DATASETS


[docs] class Offensive(Benchmark):
[docs] @staticmethod def total(**kwargs): ## Return the number of aegis comments from the manifest use_sample = kwargs.pop("use_sample", True) name = "aegis-sample" if use_sample else "aegis" if name not in DATASETS: raise DatasetsError("aegis dataset not found in manifest") return DATASETS[name]["instances"]
@property def description(self): return ( "applies the offensive speech detection model " "to the aegis content safety dataset" )
[docs] def before(self): model, processor = load_offensive(model_home=self.model_home) self.model = model self.processor = processor
[docs] def after(self, cleanup=True): if cleanup: cleanup_offensive(model_home=self.model_home) cleanup_aegis(data_home=self.data_home, sample=self.use_sample)
[docs] def instances(self, limit=None): dataset = load_aegis(data_home=self.data_home, sample=self.use_sample) return limit_generator(dataset, limit)
[docs] def preprocess(self, instance): raise NotImplementedError("Offensive preprocess not implemented")
[docs] def inference(self, instance): raise NotImplementedError("Offensive inference not implemented")