# Source code for pykeen.datasets.db100k

# -*- coding: utf-8 -*-

"""The DB100K dataset."""

from docdata import parse_docdata

from .base import UnpackedRemoteDataset

# Base URL of the DB100K directory in the iieir-km/ComplEx-NNE_AER GitHub
# repository (raw file view); the per-split file names are appended to it
# when the dataset class builds its training/testing/validation URLs.
BASE_URL = "https://raw.githubusercontent.com/iieir-km/ComplEx-NNE_AER/master/datasets/DB100K"

# Names exported by ``from <this module> import *``.
__all__ = [
    "DB100K",
]


# NOTE: the YAML block following ``---`` in the class docstring is structured
# metadata intended for the ``parse_docdata`` decorator, so its keys, values,
# and nesting must stay intact when editing the docstring.
@parse_docdata
class DB100K(UnpackedRemoteDataset):
    """The DB100K dataset from [ding2018]_.

    ---
    name: DB100K
    citation:
        author: Ding
        year: 2018
        link: https://arxiv.org/abs/1805.02408
        github: iieir-km/ComplEx-NNE_AER
    statistics:
        entities: 99604
        relations: 470
        training: 597482
        testing: 50000
        validation: 49997
        triples: 697479
    """

    def __init__(self, **kwargs):
        """Initialize the DB100K dataset.

        The training, testing, and validation URLs handed to the parent class
        point at the ``_train.txt``, ``_test.txt``, and ``_valid.txt`` files
        located under ``BASE_URL``.

        :param kwargs: keyword arguments passed to :class:`pykeen.datasets.base.UnpackedRemoteDataset`.
        """
        super().__init__(
            training_url=f"{BASE_URL}/_train.txt",
            testing_url=f"{BASE_URL}/_test.txt",
            validation_url=f"{BASE_URL}/_valid.txt",
            **kwargs,
        )
# Script entry point: invoke ``DB100K.cli()`` only when this module is
# executed directly, never on import.
if __name__ == "__main__":
    DB100K.cli()