WikiSQL

参考文献:

次のコマンドを使用して、このデータセットを TFDS にロードします。

ds = tfds.load('huggingface:wikisql')
  • 説明:
A large crowd-sourced dataset for developing natural language interfaces for relational databases
  • ライセンス: 既知のライセンスはありません
  • バージョン: 0.1.0
  • 分割:
スプリット 例の数
'test' 15878
'train' 56355
'validation' 8421
  • 特徴:
{
    "phase": {
        "dtype": "int32",
        "id": null,
        "_type": "Value"
    },
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "table": {
        "header": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "page_title": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "page_id": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "types": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "id": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "section_title": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "caption": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "rows": {
            "feature": {
                "feature": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "length": -1,
                "id": null,
                "_type": "Sequence"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    },
    "sql": {
        "human_readable": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "sel": {
            "dtype": "int32",
            "id": null,
            "_type": "Value"
        },
        "agg": {
            "dtype": "int32",
            "id": null,
            "_type": "Value"
        },
        "conds": {
            "feature": {
                "column_index": {
                    "dtype": "int32",
                    "id": null,
                    "_type": "Value"
                },
                "operator_index": {
                    "dtype": "int32",
                    "id": null,
                    "_type": "Value"
                },
                "condition": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                }
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        }
    }
}