Source code for malaya.jawi

from malaya.supervised.huggingface import load
from malaya.torch_model.huggingface import Translation

available_huggingface = {
    'mesolitica/jawi-nanot5-tiny-malaysian-cased': {
        'Size (MB)': 205,
        'Suggested length': 2048,
        'jawi-rumi chrF2++': 97.72,
        'rumi-jawi chrF2++': 98.57,
        'from lang': ['jawi', 'rumi'],
        'to lang': ['jawi', 'rumi'],
    },
    'mesolitica/jawi-nanot5-small-malaysian-cased': {
        'Size (MB)': 358,
        'Suggested length': 2048,
        'jawi-rumi chrF2++': 98.01,
        'rumi-jawi chrF2++': 98.97,
        'from lang': ['jawi', 'rumi'],
        'to lang': ['jawi', 'rumi'],
    },
}


info = """
tested on first 10k Rumi-Jawi test set, dataset at https://huggingface.co/datasets/mesolitica/rumi-jawi
""".strip()


[docs]def huggingface( model: str = 'mesolitica/jawi-nanot5-small-malaysian-cased', force_check: bool = True, **kwargs, ): """ Load HuggingFace model to translate. Parameters ---------- model: str, optional (default='mesolitica/jawi-nanot5-small-malaysian-cased') Check available models at `malaya.jawi.available_huggingface`. force_check: bool, optional (default=True) Force check model one of malaya model. Set to False if you have your own huggingface model. Returns ------- result: malaya.torch_model.huggingface.Translation """ return load( model=model, class_model=Translation, available_huggingface=available_huggingface, force_check=force_check, path=__name__, **kwargs, )