mkqa

Referências:

mkqa

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:mkqa/mkqa')
  • Descrição :
We introduce MKQA, an open-domain question answering evaluation set comprising 10k question-answer pairs aligned across 26 typologically diverse languages (260k question-answer pairs in total). The goal of this dataset is to provide a challenging benchmark for question answering quality across a wide set of languages.
  • Licença : CC BY-SA 3.0
  • Versão : 1.0.0
  • Divisões :
Dividir Exemplos
'train' 10.000
  • Características :
{
    "example_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "queries": {
        "ar": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "da": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "de": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "en": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "es": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "fi": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "fr": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "he": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "hu": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "it": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "ja": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "ko": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "km": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "ms": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "nl": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "no": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "pl": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "pt": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "ru": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "sv": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "th": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "tr": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "vi": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "zh_cn": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "zh_hk": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "zh_tw": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    },
    "query": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "answers": {
        "ar": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "da": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "de": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "en": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "es": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "fi": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "fr": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "he": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "hu": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "it": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "ja": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "ko": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "km": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "ms": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "nl": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "no": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "pl": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "pt": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "ru": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "sv": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "th": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "tr": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "vi": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "zh_cn": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "zh_hk": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ],
        "zh_tw": [
            {
                "type": {
                    "num_classes": 8,
                    "names": [
                        "entity",
                        "long_answer",
                        "unanswerable",
                        "date",
                        "number",
                        "number_with_unit",
                        "short_phrase",
                        "binary"
                    ],
                    "names_file": null,
                    "id": null,
                    "_type": "ClassLabel"
                },
                "entity": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "text": {
                    "dtype": "string",
                    "id": null,
                    "_type": "Value"
                },
                "aliases": [
                    {
                        "dtype": "string",
                        "id": null,
                        "_type": "Value"
                    }
                ]
            }
        ]
    }
}