trivia_qa

Referências:

rc

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/rc')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 17210
'train' 138384
'validation' 17944
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

rc.nocontext

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/rc.nocontext')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 17210
'train' 138384
'validation' 17944
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

unfiltered

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/unfiltered')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 10832
'train' 87622
'validation' 11313
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

unfiltered.nocontext

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/unfiltered.nocontext')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 10832
'train' 87622
'validation' 11313
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

rc.web

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/rc.web')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 9509
'train' 76496
'validation' 9951
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

rc.web.nocontext

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/rc.web.nocontext')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 9509
'train' 76496
'validation' 9951
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

unfiltered.web

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/unfiltered.web')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 0
'train' 0
'validation' 0
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

unfiltered.web.nocontext

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/unfiltered.web.nocontext')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 0
'train' 0
'validation' 0
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

rc.wikipedia

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/rc.wikipedia')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high-quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 7701
'train' 61888
'validation' 7993
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

rc.wikipedia.nocontext

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/rc.wikipedia.nocontext')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 7701
'train' 61888
'validation' 7993
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

unfiltered.wikipedia

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/unfiltered.wikipedia')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 0
'train' 0
'validation' 0
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}

unfiltered.wikipedia.nocontext

Use o seguinte comando para carregar esse conjunto de dados no TFDS:

ds = tfds.load('huggingface:trivia_qa/unfiltered.wikipedia.nocontext')
  • Descrição :
TriviaQA is a reading comprehension dataset containing over 650K
question-answer-evidence triples. TriviaQA includes 95K question-answer
pairs authored by trivia enthusiasts and independently gathered evidence
documents, six per question on average, that provide high quality distant
supervision for answering the questions.
  • Licença : Nenhuma licença conhecida
  • Versão : 1.2.0
  • Divisões :
Divisão Exemplos
'test' 0
'train' 0
'validation' 0
  • Características :
{
    "question": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_id": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "question_source": {
        "dtype": "string",
        "id": null,
        "_type": "Value"
    },
    "entity_pages": {
        "feature": {
            "doc_source": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "wiki_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "search_results": {
        "feature": {
            "description": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "filename": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "rank": {
                "dtype": "int32",
                "id": null,
                "_type": "Value"
            },
            "title": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "url": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "search_context": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            }
        },
        "length": -1,
        "id": null,
        "_type": "Sequence"
    },
    "answer": {
        "aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "normalized_aliases": {
            "feature": {
                "dtype": "string",
                "id": null,
                "_type": "Value"
            },
            "length": -1,
            "id": null,
            "_type": "Sequence"
        },
        "matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_matched_wiki_entity_name": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "normalized_value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "type": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        },
        "value": {
            "dtype": "string",
            "id": null,
            "_type": "Value"
        }
    }
}