lama

مراجع:

trex

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:lama/trex')
  • توضیحات :
LAMA is a dataset used to probe and analyze the factual and commonsense knowledge contained in pretrained language models. See https://github.com/facebookresearch/LAMA.
بخش (Split) و تعداد نمونه‌ها:
'train' 1304391
  • ویژگی ها :
{
    "uuid": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_uri": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub_uri": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub_label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "predicate_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub_surface": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_surface": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "masked_sentence": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "template": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "template_negated": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "description": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "type": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    }
}

squad

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:lama/squad')
  • توضیحات :
LAMA is a dataset used to probe and analyze the factual and commonsense knowledge contained in pretrained language models. See https://github.com/facebookresearch/LAMA.
بخش (Split) و تعداد نمونه‌ها:
'train' 305
  • ویژگی ها :
{
    "id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub_label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "negated": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "masked_sentence": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    }
}

google_re

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:lama/google_re')
  • توضیحات :
LAMA is a dataset used to probe and analyze the factual and commonsense knowledge contained in pretrained language models. See https://github.com/facebookresearch/LAMA.
بخش (Split) و تعداد نمونه‌ها:
'train' 6106
  • ویژگی ها :
{
    "pred": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "evidences": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "judgments": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub_w": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub_label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub_aliases": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_w": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_aliases": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "uuid": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "masked_sentence": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "template": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "template_negated": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    }
}

conceptnet

برای بارگذاری این مجموعه داده در TFDS از دستور زیر استفاده کنید:

ds = tfds.load('huggingface:lama/conceptnet')
  • توضیحات :
LAMA is a dataset used to probe and analyze the factual and commonsense knowledge contained in pretrained language models. See https://github.com/facebookresearch/LAMA.
بخش (Split) و تعداد نمونه‌ها:
'train' 29774
  • ویژگی ها :
{
    "uuid": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "sub": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "pred": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "obj_label": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "masked_sentence": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "negated": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    }
}