Create dataset xnli
albertvillanova opened this issue · comments
Albert Villanova del Moral commented
- uid: xnli
- type: primary
- description:
- name: XNLI
- description: It is a Cross-lingual Natural Language Inference corpus.
- homepage: https://github.com/facebookresearch/XNLI
- validated: True
- languages:
- language_names:
- English
- French
- Spanish
- Arabic
- Vietnamese
- Chinese
- ar-MSA
- German
- Greek languages
- Bulgarian
- Russian
- Arabic
- Turkish
- Thai
- Hindi
- Swahili (macrolanguage)
- Urdu
- language_comments:
- language_locations:
- validated: False
- language_names:
- custodian:
- name:
- in_catalogue:
- type:
- location:
- contact_name: XNLI
- contact_email:
- contact_submitter: False
- additional:
- validated: False
- availability:
- procurement:
- for_download: Yes - it has a direct download link or links
- download_url: https://dl.fbaipublicfiles.com/XNLI/XNLI-MT-1.0.zip
- download_email:
- licensing:
- has_licenses: Yes
- license_text:
- license_properties:
- open license
- public domain
- license_list:
- pii:
- has_pii: Unclear
- generic_pii_likely:
- generic_pii_list:
- numeric_pii_likely:
- numeric_pii_list:
- sensitive_pii_likely:
- sensitive_pii_list:
- no_pii_justification_class: general knowledge not written by or referring to private persons
- no_pii_justification_text:
- validated: False
- procurement:
- source_category:
- category_type: collection
- category_web:
- category_media:
- validated: False
- media:
- category:
- text
- text_format:
- .CSV
- audiovisual_format:
- image_format:
- database_format:
- .ZIP
- text_is_transcribed: Yes - audiovisual
- instance_type:
- instance_count: 100K<n<1M
- instance_size: 10<n<100
- validated: False
- category:
- fname: xnli.json