Skip to content

Commit

Permalink
add the splits to the only card that needs them, and a smallie for make docs-serve
Browse files Browse the repository at this point in the history

Signed-off-by: dafnapension <[email protected]>
  • Loading branch information
dafnapension committed Feb 13, 2025
1 parent 8d06b62 commit 5cd66bb
Show file tree
Hide file tree
Showing 48 changed files with 308 additions and 77 deletions.
2 changes: 1 addition & 1 deletion prepare/cards/xlsum.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@

for lang in langs:
card = TaskCard(
loader=LoadHF(path="GEM/xlsum", name=lang),
loader=LoadHF(path="GEM/xlsum", name=lang, splits=["test", "train", "validation"]),
preprocess_steps=[
Rename(field_to_field={"text": "document"}),
Wrap(field="target", inside="list", to_field="summaries"),
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/amharic.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "amharic"
"name": "amharic",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/arabic.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "arabic"
"name": "arabic",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/azerbaijani.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "azerbaijani"
"name": "azerbaijani",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/bengali.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "bengali"
"name": "bengali",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/burmese.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "burmese"
"name": "burmese",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/chinese_simplified.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "chinese_simplified"
"name": "chinese_simplified",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/chinese_traditional.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "chinese_traditional"
"name": "chinese_traditional",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/english.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "english"
"name": "english",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/french.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "french"
"name": "french",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/gujarati.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "gujarati"
"name": "gujarati",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/hausa.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "hausa"
"name": "hausa",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/hindi.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "hindi"
"name": "hindi",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/igbo.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "igbo"
"name": "igbo",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/indonesian.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "indonesian"
"name": "indonesian",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/japanese.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "japanese"
"name": "japanese",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/kirundi.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "kirundi"
"name": "kirundi",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/korean.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "korean"
"name": "korean",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/kyrgyz.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "kyrgyz"
"name": "kyrgyz",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/marathi.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "marathi"
"name": "marathi",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/nepali.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "nepali"
"name": "nepali",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/oromo.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "oromo"
"name": "oromo",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/pashto.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "pashto"
"name": "pashto",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/persian.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "persian"
"name": "persian",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/pidgin.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "pidgin"
"name": "pidgin",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/portuguese.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "portuguese"
"name": "portuguese",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/punjabi.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "punjabi"
"name": "punjabi",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
7 changes: 6 additions & 1 deletion src/unitxt/catalog/cards/xlsum/russian.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,12 @@
"loader": {
"__type__": "load_hf",
"path": "GEM/xlsum",
"name": "russian"
"name": "russian",
"splits": [
"test",
"train",
"validation"
]
},
"preprocess_steps": [
{
Expand Down
Loading

0 comments on commit 5cd66bb

Please sign in to comment.