# Source code for pykeen.datasets.wordnet

# -*- coding: utf-8 -*-

"""WordNet datasets."""

import os

from .base import TarFileRemoteDataset

__all__ = [
    'WN18',
    'WN18RR',
]


class WN18(TarFileRemoteDataset):
    """The WN18 dataset.

    The archive URL and the relative paths of the training, testing, and
    validation files are fixed in :meth:`__init__` and forwarded to
    :class:`pykeen.datasets.base.TarFileRemoteDataset`.

    .. warning:: This dataset contains testing leakage. Use :class:`WN18RR` instead.
    """

    def __init__(self, create_inverse_triples: bool = False, **kwargs):
        """Initialize the WordNet-18 dataset.

        :param create_inverse_triples: Should inverse triples be created? Defaults to false.
        :param kwargs: keyword arguments passed to :class:`pykeen.datasets.base.TarFileRemoteDataset`.

        .. warning:: This dataset contains testing leakage. Use :class:`WN18RR` instead.
        """
        # All three split files are addressed under the ``wordnet-mlj12``
        # directory; the paths are built with ``os.path.join`` so they use the
        # separator of the running platform.
        super().__init__(
            url='https://everest.hds.utc.fr/lib/exe/fetch.php?media=en:wordnet-mlj12.tar.gz',
            relative_training_path=os.path.join('wordnet-mlj12', 'wordnet-mlj12-train.txt'),
            relative_testing_path=os.path.join('wordnet-mlj12', 'wordnet-mlj12-test.txt'),
            relative_validation_path=os.path.join('wordnet-mlj12', 'wordnet-mlj12-valid.txt'),
            create_inverse_triples=create_inverse_triples,
            **kwargs,
        )
class WN18RR(TarFileRemoteDataset):
    """The WN18-RR dataset.

    The archive URL and the relative paths of the training, testing, and
    validation files are fixed in :meth:`__init__` and forwarded to
    :class:`pykeen.datasets.base.TarFileRemoteDataset`.
    """

    def __init__(self, create_inverse_triples: bool = False, **kwargs):
        """Initialize the WordNet-18 (RR) dataset.

        :param create_inverse_triples: Should inverse triples be created? Defaults to false.
        :param kwargs: keyword arguments passed to :class:`pykeen.datasets.base.TarFileRemoteDataset`.
        """
        # The split files are referenced by bare file name, i.e. without a
        # sub-directory component in the relative paths.
        super().__init__(
            url='https://github.com/TimDettmers/ConvE/raw/master/WN18RR.tar.gz',
            relative_training_path='train.txt',
            relative_testing_path='test.txt',
            relative_validation_path='valid.txt',
            create_inverse_triples=create_inverse_triples,
            **kwargs,
        )