diff --git a/prepare/cards/natural_instructions.py b/prepare/cards/natural_instructions.py
new file mode 100644
index 000000000..18165465d
--- /dev/null
+++ b/prepare/cards/natural_instructions.py
@@ -0,0 +1,74 @@
+"""Generate unitxt catalog cards and instructions for the Natural Instructions tasks.
+
+For every task name found in the ``Muennighoff/natural-instructions`` dataset, register the
+task definition as a textual instruction and build a ``TaskCard`` that loads the task
+instances from the allenai/natural-instructions GitHub repository.
+"""
+import os.path
+
+import numpy as np
+from datasets import load_dataset
+from src.unitxt.blocks import InputOutputTemplate, LoadHF, SplitRandomMix, TemplatesList
+from src.unitxt.card import TaskCard
+from src.unitxt.catalog import add_to_catalog
+from src.unitxt.instructions import InstructionsList, TextualInstruction
+from src.unitxt.operators import CopyFields, FilterByValues
+from src.unitxt.prepare_utils.card_types import addClassificationChoices
+from src.unitxt.task import FormTask
+from src.unitxt.test_utils.card import test_card
+
+# Resolve the catalog relative to this file (<repo>/prepare/cards/) so the "already exists"
+# check works on any checkout, not only on one developer's machine.
+REPO_ROOT = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+CARDS_DIR = os.path.join(REPO_ROOT, "src", "unitxt", "catalog", "cards", "natural_instructions")
+TASKS_URL = "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks"
+
+hf_df = load_dataset("Muennighoff/natural-instructions")
+tasks_names = []
+for split in ["train"]:
+    # for split in ["train", "validation", "test"]:
+    names = np.unique(hf_df[split]["task_name"])
+    tasks_names.append(names)
+
+    pandas_df_split = hf_df[split].to_pandas()
+    # Group once up front instead of re-filtering the whole frame for every task.
+    definitions_by_task = pandas_df_split.groupby("task_name")["definition"].unique()
+
+    for task in names:
+        print("task name:", task)
+        json_url = f"{TASKS_URL}/{task}.json"
+        definitions = definitions_by_task.loc[task].tolist()
+        if len(definitions) != 1:
+            raise ValueError(f"expected exactly one definition for task {task}, found {len(definitions)}")
+        print(definitions)
+        task_instruction = definitions[0]
+        # Catalog names use underscores; json_url above keeps the original task name.
+        catalog_name = task.replace("-", "_")
+
+        if os.path.isfile(os.path.join(CARDS_DIR, split, f"{catalog_name}.json")):
+            print("already exists. skipping")
+            continue
+
+        instruction_id = f"instructions.natural_instructions.{split}.{catalog_name}"
+        add_to_catalog(TextualInstruction(task_instruction), instruction_id, overwrite=True)
+
+        card = TaskCard(
+            loader=LoadHF("json", data_files=json_url, field="Instances"),
+            preprocess_steps=[
+                SplitRandomMix({"train": "train[90%]", "validation": "train[5%]", "test": "train[5%]"}),
+                CopyFields(field_to_field=[["output/0", "target"]], use_query=True),
+            ],
+            task=FormTask(inputs=["input"], outputs=["target"], metrics=["metrics.rouge"]),
+            instructions=InstructionsList([instruction_id]),
+            templates=TemplatesList(["templates.input_output"]),
+        )
+
+        try:
+            test_card(card)
+        except Exception as e:
+            # Best-effort batch run: report the failure and move on to the next task.
+            print("error while generating task", catalog_name)
+            print(e)
+        else:
+            # Only cards that passed test_card are written to the catalog.
+            add_to_catalog(card, f"cards.natural_instructions.{split}.{catalog_name}", overwrite=True)
diff --git a/prepare/formats/input_output_prefix.py b/prepare/formats/input_output_prefix.py
new file mode 100644
index 000000000..e5d749296
--- /dev/null
+++ b/prepare/formats/input_output_prefix.py
@@ -0,0 +1,9 @@
+from src.unitxt.catalog import add_to_catalog
+from src.unitxt.formats import ICLFormat
+
+format = ICLFormat(
+    input_prefix="input: ",
+    output_prefix="output: ",
+)
+
+add_to_catalog(format, "formats.input_output_prefix", overwrite=True)
diff --git a/prepare/templates/input_output.py b/prepare/templates/input_output.py
new file mode 100644
index 000000000..c42e4632f
--- /dev/null
+++ b/prepare/templates/input_output.py
@@ -0,0 +1,8 @@
+from src.unitxt.blocks import InputOutputTemplate
+from src.unitxt.catalog import add_to_catalog
+
+template = InputOutputTemplate(
+    input_format="{input}",
+    output_format="{target}",
+)
+add_to_catalog(template, "templates.input_output", overwrite=True)
diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task001_quoref_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task001_quoref_question_generation.json new
file mode 100644 index 000000000..054290e7d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task001_quoref_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task001_quoref_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task001_quoref_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task002_quoref_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task002_quoref_answer_generation.json new file mode 100644 index 000000000..1370641b7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task002_quoref_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task002_quoref_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + 
"type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task002_quoref_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task022_cosmosqa_passage_inappropriate_binary.json b/src/unitxt/catalog/cards/natural_instructions/train/task022_cosmosqa_passage_inappropriate_binary.json new file mode 100644 index 000000000..1621b8086 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task022_cosmosqa_passage_inappropriate_binary.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task022_cosmosqa_passage_inappropriate_binary.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task022_cosmosqa_passage_inappropriate_binary" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task023_cosmosqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task023_cosmosqa_question_generation.json new file mode 100644 index 
000000000..80144c986 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task023_cosmosqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task023_cosmosqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task023_cosmosqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task024_cosmosqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task024_cosmosqa_answer_generation.json new file mode 100644 index 000000000..96163d1f4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task024_cosmosqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task024_cosmosqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": 
"form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task024_cosmosqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task025_cosmosqa_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task025_cosmosqa_incorrect_answer_generation.json new file mode 100644 index 000000000..9dcf65f31 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task025_cosmosqa_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task025_cosmosqa_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task025_cosmosqa_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task026_drop_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task026_drop_question_generation.json new file mode 100644 index 000000000..5bb3a4148 --- 
/dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task026_drop_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task026_drop_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task026_drop_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task027_drop_answer_type_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task027_drop_answer_type_generation.json new file mode 100644 index 000000000..f7f9d9270 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task027_drop_answer_type_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task027_drop_answer_type_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" 
+ ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task027_drop_answer_type_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task028_drop_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task028_drop_answer_generation.json new file mode 100644 index 000000000..6c6c8b2b6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task028_drop_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task028_drop_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task028_drop_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task043_essential_terms_answering_incomplete_questions.json b/src/unitxt/catalog/cards/natural_instructions/train/task043_essential_terms_answering_incomplete_questions.json new file mode 100644 index 000000000..8c85b11c4 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task043_essential_terms_answering_incomplete_questions.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task043_essential_terms_answering_incomplete_questions.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task043_essential_terms_answering_incomplete_questions" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task044_essential_terms_identifying_essential_words.json b/src/unitxt/catalog/cards/natural_instructions/train/task044_essential_terms_identifying_essential_words.json new file mode 100644 index 000000000..948e7c670 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task044_essential_terms_identifying_essential_words.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task044_essential_terms_identifying_essential_words.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + 
"output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task044_essential_terms_identifying_essential_words" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task045_miscellaneous_sentence_paraphrasing.json b/src/unitxt/catalog/cards/natural_instructions/train/task045_miscellaneous_sentence_paraphrasing.json new file mode 100644 index 000000000..a1c040a03 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task045_miscellaneous_sentence_paraphrasing.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task045_miscellaneous_sentence_paraphrasing.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task045_miscellaneous_sentence_paraphrasing" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task046_miscellaneous_question_typing.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task046_miscellaneous_question_typing.json new file mode 100644 index 000000000..9c7a691f2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task046_miscellaneous_question_typing.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task046_miscellaneous_question_typing.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task046_miscellaneous_question_typing" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task047_miscellaneous_answering_science_questions.json b/src/unitxt/catalog/cards/natural_instructions/train/task047_miscellaneous_answering_science_questions.json new file mode 100644 index 000000000..264c48e8a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task047_miscellaneous_answering_science_questions.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task047_miscellaneous_answering_science_questions.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": 
"train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task047_miscellaneous_answering_science_questions" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task059_ropes_story_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task059_ropes_story_generation.json new file mode 100644 index 000000000..a8bb1412b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task059_ropes_story_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task059_ropes_story_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task059_ropes_story_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task060_ropes_question_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task060_ropes_question_generation.json new file mode 100644 index 000000000..e8e77e082 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task060_ropes_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task060_ropes_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task060_ropes_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task061_ropes_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task061_ropes_answer_generation.json new file mode 100644 index 000000000..60ad048ec --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task061_ropes_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task061_ropes_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + 
"field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task061_ropes_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task062_bigbench_repeat_copy_logic.json b/src/unitxt/catalog/cards/natural_instructions/train/task062_bigbench_repeat_copy_logic.json new file mode 100644 index 000000000..c042c64b0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task062_bigbench_repeat_copy_logic.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task062_bigbench_repeat_copy_logic.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task062_bigbench_repeat_copy_logic" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task063_first_i_elements.json b/src/unitxt/catalog/cards/natural_instructions/train/task063_first_i_elements.json new file mode 100644 
index 000000000..48d459b19 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task063_first_i_elements.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task063_first_i_elements.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task063_first_i_elements" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task064_all_elements_except_first_i.json b/src/unitxt/catalog/cards/natural_instructions/train/task064_all_elements_except_first_i.json new file mode 100644 index 000000000..a797c4d67 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task064_all_elements_except_first_i.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task064_all_elements_except_first_i.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + 
"input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task064_all_elements_except_first_i" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task065_timetravel_consistent_sentence_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task065_timetravel_consistent_sentence_classification.json new file mode 100644 index 000000000..e4969af2f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task065_timetravel_consistent_sentence_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task065_timetravel_consistent_sentence_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task065_timetravel_consistent_sentence_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task066_timetravel_binary_consistency_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task066_timetravel_binary_consistency_classification.json new 
file mode 100644 index 000000000..4f610bf06 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task066_timetravel_binary_consistency_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task066_timetravel_binary_consistency_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task066_timetravel_binary_consistency_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task067_abductivenli_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task067_abductivenli_answer_generation.json new file mode 100644 index 000000000..f5c099493 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task067_abductivenli_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task067_abductivenli_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + 
"output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task067_abductivenli_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task068_abductivenli_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task068_abductivenli_incorrect_answer_generation.json new file mode 100644 index 000000000..19259ddaa --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task068_abductivenli_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task068_abductivenli_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task068_abductivenli_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task069_abductivenli_classification.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task069_abductivenli_classification.json new file mode 100644 index 000000000..bd997964b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task069_abductivenli_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task069_abductivenli_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task069_abductivenli_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task070_abductivenli_incorrect_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task070_abductivenli_incorrect_classification.json new file mode 100644 index 000000000..9459f4291 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task070_abductivenli_incorrect_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task070_abductivenli_incorrect_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": 
"train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task070_abductivenli_incorrect_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task071_abductivenli_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task071_abductivenli_answer_generation.json new file mode 100644 index 000000000..0167f1003 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task071_abductivenli_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task071_abductivenli_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task071_abductivenli_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task072_abductivenli_answer_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task072_abductivenli_answer_generation.json new file mode 100644 index 000000000..a9f172cfc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task072_abductivenli_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task072_abductivenli_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task072_abductivenli_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task073_commonsenseqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task073_commonsenseqa_answer_generation.json new file mode 100644 index 000000000..dc41ec5cd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task073_commonsenseqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task073_commonsenseqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + 
} + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task073_commonsenseqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task074_squad1/1_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task074_squad1/1_question_generation.json new file mode 100644 index 000000000..d28840243 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task074_squad1/1_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task074_squad1.1_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task074_squad1.1_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task075_squad1/1_answer_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task075_squad1/1_answer_generation.json new file mode 100644 index 000000000..050e929ee --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task075_squad1/1_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task075_squad1.1_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task075_squad1.1_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task076_splash_correcting_sql_mistake.json b/src/unitxt/catalog/cards/natural_instructions/train/task076_splash_correcting_sql_mistake.json new file mode 100644 index 000000000..1c995609b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task076_splash_correcting_sql_mistake.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task076_splash_correcting_sql_mistake.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": 
"copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task076_splash_correcting_sql_mistake" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task077_splash_explanation_to_sql.json b/src/unitxt/catalog/cards/natural_instructions/train/task077_splash_explanation_to_sql.json new file mode 100644 index 000000000..a7f804681 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task077_splash_explanation_to_sql.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task077_splash_explanation_to_sql.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task077_splash_explanation_to_sql" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task078_all_elements_except_last_i.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task078_all_elements_except_last_i.json new file mode 100644 index 000000000..6f58203ba --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task078_all_elements_except_last_i.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task078_all_elements_except_last_i.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task078_all_elements_except_last_i" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task079_conala_concat_strings.json b/src/unitxt/catalog/cards/natural_instructions/train/task079_conala_concat_strings.json new file mode 100644 index 000000000..a3fff6c6c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task079_conala_concat_strings.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task079_conala_concat_strings.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": 
[ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task079_conala_concat_strings" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task080_piqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task080_piqa_answer_generation.json new file mode 100644 index 000000000..01df7011d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task080_piqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task080_piqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task080_piqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task081_piqa_wrong_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task081_piqa_wrong_answer_generation.json new file mode 100644 index 
000000000..9ece0a32c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task081_piqa_wrong_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task081_piqa_wrong_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task081_piqa_wrong_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task082_babi_t1_single_supporting_fact_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task082_babi_t1_single_supporting_fact_question_generation.json new file mode 100644 index 000000000..e4862a092 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task082_babi_t1_single_supporting_fact_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task082_babi_t1_single_supporting_fact_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": 
[ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task082_babi_t1_single_supporting_fact_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task083_babi_t1_single_supporting_fact_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task083_babi_t1_single_supporting_fact_answer_generation.json new file mode 100644 index 000000000..55f1721c2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task083_babi_t1_single_supporting_fact_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task083_babi_t1_single_supporting_fact_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task083_babi_t1_single_supporting_fact_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task084_babi_t1_single_supporting_fact_identify_relevant_fact.json b/src/unitxt/catalog/cards/natural_instructions/train/task084_babi_t1_single_supporting_fact_identify_relevant_fact.json new file mode 100644 index 000000000..63ca61721 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task084_babi_t1_single_supporting_fact_identify_relevant_fact.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task084_babi_t1_single_supporting_fact_identify_relevant_fact.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task084_babi_t1_single_supporting_fact_identify_relevant_fact" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task085_unnatural_addsub_arithmetic.json b/src/unitxt/catalog/cards/natural_instructions/train/task085_unnatural_addsub_arithmetic.json new file mode 100644 index 000000000..7ca42343a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task085_unnatural_addsub_arithmetic.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task085_unnatural_addsub_arithmetic.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task085_unnatural_addsub_arithmetic" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task087_new_operator_addsub_arithmetic.json b/src/unitxt/catalog/cards/natural_instructions/train/task087_new_operator_addsub_arithmetic.json new file mode 100644 index 000000000..b4d2dc34d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task087_new_operator_addsub_arithmetic.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task087_new_operator_addsub_arithmetic.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task087_new_operator_addsub_arithmetic" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task088_identify_typo_verification.json b/src/unitxt/catalog/cards/natural_instructions/train/task088_identify_typo_verification.json new file mode 100644 index 000000000..2dc630194 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task088_identify_typo_verification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task088_identify_typo_verification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task088_identify_typo_verification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task089_swap_words_verification.json b/src/unitxt/catalog/cards/natural_instructions/train/task089_swap_words_verification.json new file mode 100644 index 000000000..80091534f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task089_swap_words_verification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task089_swap_words_verification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task089_swap_words_verification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task090_equation_learner_algebra.json b/src/unitxt/catalog/cards/natural_instructions/train/task090_equation_learner_algebra.json new file mode 100644 index 000000000..e8e98bf95 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task090_equation_learner_algebra.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task090_equation_learner_algebra.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task090_equation_learner_algebra" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task091_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/cards/natural_instructions/train/task091_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..d301f5a4c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task091_all_elements_from_index_i_to_j.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task091_all_elements_from_index_i_to_j.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task091_all_elements_from_index_i_to_j" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task092_check_prime_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task092_check_prime_classification.json new file mode 100644 index 000000000..241ae1cf6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task092_check_prime_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task092_check_prime_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task092_check_prime_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task093_conala_normalize_lists.json b/src/unitxt/catalog/cards/natural_instructions/train/task093_conala_normalize_lists.json new file mode 100644 index 000000000..6422688ce --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task093_conala_normalize_lists.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task093_conala_normalize_lists.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task093_conala_normalize_lists" 
+ ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task094_conala_calculate_mean.json b/src/unitxt/catalog/cards/natural_instructions/train/task094_conala_calculate_mean.json new file mode 100644 index 000000000..8cd4a6dcc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task094_conala_calculate_mean.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task094_conala_calculate_mean.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task094_conala_calculate_mean" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task095_conala_max_absolute_value.json b/src/unitxt/catalog/cards/natural_instructions/train/task095_conala_max_absolute_value.json new file mode 100644 index 000000000..089ce7ceb --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task095_conala_max_absolute_value.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task095_conala_max_absolute_value.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task095_conala_max_absolute_value" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task096_conala_list_index_subtraction.json b/src/unitxt/catalog/cards/natural_instructions/train/task096_conala_list_index_subtraction.json new file mode 100644 index 000000000..5b30d76a9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task096_conala_list_index_subtraction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task096_conala_list_index_subtraction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task096_conala_list_index_subtraction" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + 
] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task097_conala_remove_duplicates.json b/src/unitxt/catalog/cards/natural_instructions/train/task097_conala_remove_duplicates.json new file mode 100644 index 000000000..32e4c0e47 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task097_conala_remove_duplicates.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task097_conala_remove_duplicates.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task097_conala_remove_duplicates" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task098_conala_list_intersection.json b/src/unitxt/catalog/cards/natural_instructions/train/task098_conala_list_intersection.json new file mode 100644 index 000000000..12e8d3f78 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task098_conala_list_intersection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task098_conala_list_intersection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + 
"mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task098_conala_list_intersection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task099_reverse_elements_between_index_i_and_j.json b/src/unitxt/catalog/cards/natural_instructions/train/task099_reverse_elements_between_index_i_and_j.json new file mode 100644 index 000000000..c51cc4a83 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task099_reverse_elements_between_index_i_and_j.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task099_reverse_elements_between_index_i_and_j.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task099_reverse_elements_between_index_i_and_j" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task100_concatenate_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/cards/natural_instructions/train/task100_concatenate_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..6d2e4b303 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task100_concatenate_all_elements_from_index_i_to_j.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task100_concatenate_all_elements_from_index_i_to_j.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task100_concatenate_all_elements_from_index_i_to_j" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task101_reverse_and_concatenate_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/cards/natural_instructions/train/task101_reverse_and_concatenate_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..df440fdd1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task101_reverse_and_concatenate_all_elements_from_index_i_to_j.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task101_reverse_and_concatenate_all_elements_from_index_i_to_j.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task101_reverse_and_concatenate_all_elements_from_index_i_to_j" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task103_facts2story_long_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task103_facts2story_long_text_generation.json new file mode 100644 index 000000000..f8498c9aa --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task103_facts2story_long_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task103_facts2story_long_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task103_facts2story_long_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation.json new file mode 100644 index 000000000..745678e63 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task105_story_cloze_rocstories_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task105_story_cloze_rocstories_sentence_generation.json new 
file mode 100644 index 000000000..8579e564c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task105_story_cloze_rocstories_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task105_story_cloze-rocstories_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task105_story_cloze_rocstories_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task107_splash_question_to_sql.json b/src/unitxt/catalog/cards/natural_instructions/train/task107_splash_question_to_sql.json new file mode 100644 index 000000000..7cd72befa --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task107_splash_question_to_sql.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task107_splash_question_to_sql.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + 
"use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task107_splash_question_to_sql" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1087_two_number_sum.json b/src/unitxt/catalog/cards/natural_instructions/train/task1087_two_number_sum.json new file mode 100644 index 000000000..db6fc0768 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1087_two_number_sum.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1087_two_number_sum.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1087_two_number_sum" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1088_array_of_products.json b/src/unitxt/catalog/cards/natural_instructions/train/task1088_array_of_products.json new file mode 100644 index 000000000..fbb2675d5 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1088_array_of_products.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1088_array_of_products.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1088_array_of_products" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1089_check_monotonic_array.json b/src/unitxt/catalog/cards/natural_instructions/train/task1089_check_monotonic_array.json new file mode 100644 index 000000000..1f8952f84 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1089_check_monotonic_array.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1089_check_monotonic_array.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + 
"metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1089_check_monotonic_array" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task108_contextualabusedetection_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task108_contextualabusedetection_classification.json new file mode 100644 index 000000000..7e1438913 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task108_contextualabusedetection_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task108_contextualabusedetection_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task108_contextualabusedetection_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task109_smsspamcollection_spamsmsdetection.json b/src/unitxt/catalog/cards/natural_instructions/train/task109_smsspamcollection_spamsmsdetection.json new file mode 100644 index 000000000..2247003f0 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task109_smsspamcollection_spamsmsdetection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task109_smsspamcollection_spamsmsdetection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task109_smsspamcollection_spamsmsdetection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task110_logic2text_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task110_logic2text_sentence_generation.json new file mode 100644 index 000000000..b371a200d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task110_logic2text_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task110_logic2text_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": 
"form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task110_logic2text_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task111_asset_sentence_simplification.json b/src/unitxt/catalog/cards/natural_instructions/train/task111_asset_sentence_simplification.json new file mode 100644 index 000000000..1f54a852b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task111_asset_sentence_simplification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task111_asset_sentence_simplification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task111_asset_sentence_simplification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task112_asset_simple_sentence_identification.json b/src/unitxt/catalog/cards/natural_instructions/train/task112_asset_simple_sentence_identification.json new file mode 100644 index 000000000..24bd97ee1 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task112_asset_simple_sentence_identification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task112_asset_simple_sentence_identification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task112_asset_simple_sentence_identification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1135_xcsr_en_commonsense_mc_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1135_xcsr_en_commonsense_mc_classification.json new file mode 100644 index 000000000..ff5892839 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1135_xcsr_en_commonsense_mc_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1135_xcsr_en_commonsense_mc_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + 
} + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1135_xcsr_en_commonsense_mc_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task113_count_frequency_of_letter.json b/src/unitxt/catalog/cards/natural_instructions/train/task113_count_frequency_of_letter.json new file mode 100644 index 000000000..d2b93500d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task113_count_frequency_of_letter.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task113_count_frequency_of_letter.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task113_count_frequency_of_letter" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1146_country_capital.json b/src/unitxt/catalog/cards/natural_instructions/train/task1146_country_capital.json new file mode 100644 index 000000000..ef78fd000 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1146_country_capital.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1146_country_capital.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1146_country_capital" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1147_country_currency.json b/src/unitxt/catalog/cards/natural_instructions/train/task1147_country_currency.json new file mode 100644 index 000000000..6bb2e371e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1147_country_currency.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1147_country_currency.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, 
+ "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1147_country_currency" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1148_maximum_ascii_value.json b/src/unitxt/catalog/cards/natural_instructions/train/task1148_maximum_ascii_value.json new file mode 100644 index 000000000..948bee392 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1148_maximum_ascii_value.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1148_maximum_ascii_value.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1148_maximum_ascii_value" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1149_item_check_edible.json b/src/unitxt/catalog/cards/natural_instructions/train/task1149_item_check_edible.json new file mode 100644 index 000000000..62e83b68c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1149_item_check_edible.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1149_item_check_edible.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1149_item_check_edible" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task114_is_the_given_word_longest.json b/src/unitxt/catalog/cards/natural_instructions/train/task114_is_the_given_word_longest.json new file mode 100644 index 000000000..faed20f89 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task114_is_the_given_word_longest.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task114_is_the_given_word_longest.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task114_is_the_given_word_longest" 
+ ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1150_delete_max_min.json b/src/unitxt/catalog/cards/natural_instructions/train/task1150_delete_max_min.json new file mode 100644 index 000000000..399700443 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1150_delete_max_min.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1150_delete_max_min.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1150_delete_max_min" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1151_swap_max_min.json b/src/unitxt/catalog/cards/natural_instructions/train/task1151_swap_max_min.json new file mode 100644 index 000000000..4936d125c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1151_swap_max_min.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1151_swap_max_min.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1151_swap_max_min" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task115_help_advice_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task115_help_advice_classification.json new file mode 100644 index 000000000..87f22b056 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task115_help_advice_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task115_help_advice_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task115_help_advice_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1167_penn_treebank_coarse_pos_tagging.json b/src/unitxt/catalog/cards/natural_instructions/train/task1167_penn_treebank_coarse_pos_tagging.json new file mode 100644 index 000000000..eb940c4d8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1167_penn_treebank_coarse_pos_tagging.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1167_penn_treebank_coarse_pos_tagging.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1167_penn_treebank_coarse_pos_tagging" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1168_brown_coarse_pos_tagging.json b/src/unitxt/catalog/cards/natural_instructions/train/task1168_brown_coarse_pos_tagging.json new file mode 100644 index 000000000..65d36e8a4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1168_brown_coarse_pos_tagging.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1168_brown_coarse_pos_tagging.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", 
+ "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1168_brown_coarse_pos_tagging" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task116_com2sense_commonsense_reasoning.json b/src/unitxt/catalog/cards/natural_instructions/train/task116_com2sense_commonsense_reasoning.json new file mode 100644 index 000000000..8e91788d9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task116_com2sense_commonsense_reasoning.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task116_com2sense_commonsense_reasoning.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task116_com2sense_commonsense_reasoning" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1186_nne_hrngo_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1186_nne_hrngo_classification.json new file mode 100644 index 000000000..72434733b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1186_nne_hrngo_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1186_nne_hrngo_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1186_nne_hrngo_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1188_count_max_freq_char.json b/src/unitxt/catalog/cards/natural_instructions/train/task1188_count_max_freq_char.json new file mode 100644 index 000000000..13dd0743b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1188_count_max_freq_char.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1188_count_max_freq_char.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": 
"train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1188_count_max_freq_char" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1189_check_char_in_string.json b/src/unitxt/catalog/cards/natural_instructions/train/task1189_check_char_in_string.json new file mode 100644 index 000000000..ca7826de5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1189_check_char_in_string.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1189_check_char_in_string.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1189_check_char_in_string" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation.json new file mode 100644 index 000000000..f1a5137b8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1190_add_integer_to_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task1190_add_integer_to_list.json new file mode 100644 index 000000000..01e5bc414 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1190_add_integer_to_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1190_add_integer_to_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1190_add_integer_to_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1191_food_veg_nonveg.json b/src/unitxt/catalog/cards/natural_instructions/train/task1191_food_veg_nonveg.json new file mode 100644 index 000000000..1b5851b7e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1191_food_veg_nonveg.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1191_food_veg_nonveg.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1191_food_veg_nonveg" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1192_food_flavor_profile.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1192_food_flavor_profile.json new file mode 100644 index 000000000..17424bb6e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1192_food_flavor_profile.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1192_food_flavor_profile.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1192_food_flavor_profile" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1193_food_course_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1193_food_course_classification.json new file mode 100644 index 000000000..6a07a4150 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1193_food_course_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1193_food_course_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": 
[ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1193_food_course_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1194_kth_largest_element.json b/src/unitxt/catalog/cards/natural_instructions/train/task1194_kth_largest_element.json new file mode 100644 index 000000000..cfa678b1b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1194_kth_largest_element.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1194_kth_largest_element.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1194_kth_largest_element" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1196_atomic_classification_oeffect.json b/src/unitxt/catalog/cards/natural_instructions/train/task1196_atomic_classification_oeffect.json new file mode 100644 index 
000000000..2840496a8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1196_atomic_classification_oeffect.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1196_atomic_classification_oeffect.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1196_atomic_classification_oeffect" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1197_atomic_classification_oreact.json b/src/unitxt/catalog/cards/natural_instructions/train/task1197_atomic_classification_oreact.json new file mode 100644 index 000000000..a9afc87c4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1197_atomic_classification_oreact.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1197_atomic_classification_oreact.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + 
"task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1197_atomic_classification_oreact" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1198_atomic_classification_owant.json b/src/unitxt/catalog/cards/natural_instructions/train/task1198_atomic_classification_owant.json new file mode 100644 index 000000000..47d79347a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1198_atomic_classification_owant.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1198_atomic_classification_owant.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1198_atomic_classification_owant" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1199_atomic_classification_xattr.json b/src/unitxt/catalog/cards/natural_instructions/train/task1199_atomic_classification_xattr.json new file mode 100644 index 000000000..2c6a49855 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1199_atomic_classification_xattr.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1199_atomic_classification_xattr.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1199_atomic_classification_xattr" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task119_semeval_2019_task10_geometric_mathematical_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task119_semeval_2019_task10_geometric_mathematical_answer_generation.json new file mode 100644 index 000000000..d4addd34d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task119_semeval_2019_task10_geometric_mathematical_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task119_semeval_2019_task10_geometric_mathematical_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + 
"field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task119_semeval_2019_task10_geometric_mathematical_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1200_atomic_classification_xeffect.json b/src/unitxt/catalog/cards/natural_instructions/train/task1200_atomic_classification_xeffect.json new file mode 100644 index 000000000..3a22f6652 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1200_atomic_classification_xeffect.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1200_atomic_classification_xeffect.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1200_atomic_classification_xeffect" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1201_atomic_classification_xintent.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1201_atomic_classification_xintent.json new file mode 100644 index 000000000..e73184a84 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1201_atomic_classification_xintent.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1201_atomic_classification_xintent.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1201_atomic_classification_xintent" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1202_atomic_classification_xneed.json b/src/unitxt/catalog/cards/natural_instructions/train/task1202_atomic_classification_xneed.json new file mode 100644 index 000000000..bba741bf6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1202_atomic_classification_xneed.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1202_atomic_classification_xneed.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + 
"type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1202_atomic_classification_xneed" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1203_atomic_classification_xreact.json b/src/unitxt/catalog/cards/natural_instructions/train/task1203_atomic_classification_xreact.json new file mode 100644 index 000000000..f822cecd0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1203_atomic_classification_xreact.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1203_atomic_classification_xreact.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1203_atomic_classification_xreact" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1204_atomic_classification_hinderedby.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1204_atomic_classification_hinderedby.json new file mode 100644 index 000000000..7c2a5ab83 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1204_atomic_classification_hinderedby.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1204_atomic_classification_hinderedby.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1204_atomic_classification_hinderedby" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1205_atomic_classification_isafter.json b/src/unitxt/catalog/cards/natural_instructions/train/task1205_atomic_classification_isafter.json new file mode 100644 index 000000000..e70bf3292 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1205_atomic_classification_isafter.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1205_atomic_classification_isafter.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": 
"train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1205_atomic_classification_isafter" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1206_atomic_classification_isbefore.json b/src/unitxt/catalog/cards/natural_instructions/train/task1206_atomic_classification_isbefore.json new file mode 100644 index 000000000..30e0455d0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1206_atomic_classification_isbefore.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1206_atomic_classification_isbefore.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1206_atomic_classification_isbefore" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1207_atomic_classification_atlocation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1207_atomic_classification_atlocation.json new file mode 100644 index 000000000..8076d6322 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1207_atomic_classification_atlocation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1207_atomic_classification_atlocation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1207_atomic_classification_atlocation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1208_atomic_classification_xreason.json b/src/unitxt/catalog/cards/natural_instructions/train/task1208_atomic_classification_xreason.json new file mode 100644 index 000000000..db1cee0a9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1208_atomic_classification_xreason.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1208_atomic_classification_xreason.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": 
"train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1208_atomic_classification_xreason" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1209_atomic_classification_objectuse.json b/src/unitxt/catalog/cards/natural_instructions/train/task1209_atomic_classification_objectuse.json new file mode 100644 index 000000000..143127dfe --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1209_atomic_classification_objectuse.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1209_atomic_classification_objectuse.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1209_atomic_classification_objectuse" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1210_atomic_classification_madeupof.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1210_atomic_classification_madeupof.json new file mode 100644 index 000000000..5ac8d2ca7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1210_atomic_classification_madeupof.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1210_atomic_classification_madeupof.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1210_atomic_classification_madeupof" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1211_atomic_classification_hassubevent.json b/src/unitxt/catalog/cards/natural_instructions/train/task1211_atomic_classification_hassubevent.json new file mode 100644 index 000000000..f060435aa --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1211_atomic_classification_hassubevent.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1211_atomic_classification_hassubevent.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + 
"test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1211_atomic_classification_hassubevent" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1212_atomic_classification_hasproperty.json b/src/unitxt/catalog/cards/natural_instructions/train/task1212_atomic_classification_hasproperty.json new file mode 100644 index 000000000..cfaaf4dbf --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1212_atomic_classification_hasproperty.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1212_atomic_classification_hasproperty.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1212_atomic_classification_hasproperty" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1213_atomic_classification_desires.json b/src/unitxt/catalog/cards/natural_instructions/train/task1213_atomic_classification_desires.json new file mode 100644 index 000000000..60ee21490 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1213_atomic_classification_desires.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1213_atomic_classification_desires.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1213_atomic_classification_desires" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1214_atomic_classification_xwant.json b/src/unitxt/catalog/cards/natural_instructions/train/task1214_atomic_classification_xwant.json new file mode 100644 index 000000000..a79111de5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1214_atomic_classification_xwant.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1214_atomic_classification_xwant.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + 
"mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1214_atomic_classification_xwant" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1215_atomic_classification_capableof.json b/src/unitxt/catalog/cards/natural_instructions/train/task1215_atomic_classification_capableof.json new file mode 100644 index 000000000..3e0f0b5d2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1215_atomic_classification_capableof.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1215_atomic_classification_capableof.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1215_atomic_classification_capableof" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1216_atomic_classification_causes.json b/src/unitxt/catalog/cards/natural_instructions/train/task1216_atomic_classification_causes.json new file mode 100644 index 000000000..3163ebb90 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1216_atomic_classification_causes.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1216_atomic_classification_causes.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1216_atomic_classification_causes" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1217_atomic_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1217_atomic_answer_generation.json new file mode 100644 index 000000000..41d1b86a3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1217_atomic_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1217_atomic_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + 
"train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1217_atomic_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task122_conala_list_index_addition.json b/src/unitxt/catalog/cards/natural_instructions/train/task122_conala_list_index_addition.json new file mode 100644 index 000000000..5af04947c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task122_conala_list_index_addition.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task122_conala_list_index_addition.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task122_conala_list_index_addition" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task123_conala_sort_dictionary.json b/src/unitxt/catalog/cards/natural_instructions/train/task123_conala_sort_dictionary.json new file mode 100644 index 000000000..2face4b72 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task123_conala_sort_dictionary.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task123_conala_sort_dictionary.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task123_conala_sort_dictionary" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task124_conala_pair_averages.json b/src/unitxt/catalog/cards/natural_instructions/train/task124_conala_pair_averages.json new file mode 100644 index 000000000..acfddb63e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task124_conala_pair_averages.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task124_conala_pair_averages.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": 
"train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task124_conala_pair_averages" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task125_conala_pair_differences.json b/src/unitxt/catalog/cards/natural_instructions/train/task125_conala_pair_differences.json new file mode 100644 index 000000000..f297e495c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task125_conala_pair_differences.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task125_conala_pair_differences.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task125_conala_pair_differences" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task126_scan_structured_text_generation_command_action_all.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task126_scan_structured_text_generation_command_action_all.json new file mode 100644 index 000000000..6757fb48f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task126_scan_structured_text_generation_command_action_all.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task126_scan_structured_text_generation_command_action_all.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task126_scan_structured_text_generation_command_action_all" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task127_scan_long_text_generation_action_command_all.json b/src/unitxt/catalog/cards/natural_instructions/train/task127_scan_long_text_generation_action_command_all.json new file mode 100644 index 000000000..eeffc27ca --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task127_scan_long_text_generation_action_command_all.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task127_scan_long_text_generation_action_command_all.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task127_scan_long_text_generation_action_command_all" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1283_hrngo_quality_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1283_hrngo_quality_classification.json new file mode 100644 index 000000000..d93ca5639 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1283_hrngo_quality_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1283_hrngo_quality_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1283_hrngo_quality_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No 
newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1284_hrngo_informativeness_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1284_hrngo_informativeness_classification.json new file mode 100644 index 000000000..58b7c3c67 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1284_hrngo_informativeness_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1284_hrngo_informativeness_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1284_hrngo_informativeness_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1285_kpa_keypoint_matching.json b/src/unitxt/catalog/cards/natural_instructions/train/task1285_kpa_keypoint_matching.json new file mode 100644 index 000000000..a71003b88 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1285_kpa_keypoint_matching.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1285_kpa_keypoint_matching.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1285_kpa_keypoint_matching" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1286_openbookqa_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task1286_openbookqa_question_answering.json new file mode 100644 index 000000000..7b9ce559a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1286_openbookqa_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1286_openbookqa_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1286_openbookqa_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of 
file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1288_glue_mrpc_paraphrasing.json b/src/unitxt/catalog/cards/natural_instructions/train/task1288_glue_mrpc_paraphrasing.json new file mode 100644 index 000000000..98ac76c90 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1288_glue_mrpc_paraphrasing.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1288_glue_mrpc_paraphrasing.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1288_glue_mrpc_paraphrasing" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1289_trec_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1289_trec_classification.json new file mode 100644 index 000000000..7b8e189f3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1289_trec_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1289_trec_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": 
"train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1289_trec_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task128_scan_structured_text_generation_command_action_short.json b/src/unitxt/catalog/cards/natural_instructions/train/task128_scan_structured_text_generation_command_action_short.json new file mode 100644 index 000000000..5445ac711 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task128_scan_structured_text_generation_command_action_short.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task128_scan_structured_text_generation_command_action_short.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task128_scan_structured_text_generation_command_action_short" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of 
file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1290_xsum_summarization.json b/src/unitxt/catalog/cards/natural_instructions/train/task1290_xsum_summarization.json new file mode 100644 index 000000000..b99edc13e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1290_xsum_summarization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1290_xsum_summarization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1290_xsum_summarization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1291_multi_news_summarization.json b/src/unitxt/catalog/cards/natural_instructions/train/task1291_multi_news_summarization.json new file mode 100644 index 000000000..ecb293b28 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1291_multi_news_summarization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1291_multi_news_summarization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": 
"train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1291_multi_news_summarization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1292_yelp_review_full_text_categorization.json b/src/unitxt/catalog/cards/natural_instructions/train/task1292_yelp_review_full_text_categorization.json new file mode 100644 index 000000000..f5fd6c66b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1292_yelp_review_full_text_categorization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1292_yelp_review_full_text_categorization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1292_yelp_review_full_text_categorization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1293_kilt_tasks_hotpotqa_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task1293_kilt_tasks_hotpotqa_question_answering.json new file mode 100644 index 000000000..b2d6edf0f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1293_kilt_tasks_hotpotqa_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1293_kilt_tasks_hotpotqa_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1293_kilt_tasks_hotpotqa_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1294_wiki_qa_answer_verification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1294_wiki_qa_answer_verification.json new file mode 100644 index 000000000..768201fa0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1294_wiki_qa_answer_verification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1294_wiki_qa_answer_verification.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1294_wiki_qa_answer_verification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1295_adversarial_qa_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task1295_adversarial_qa_question_answering.json new file mode 100644 index 000000000..d1d879944 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1295_adversarial_qa_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1295_adversarial_qa_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1295_adversarial_qa_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} 
\ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1296_wiki_hop_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task1296_wiki_hop_question_answering.json new file mode 100644 index 000000000..555d84350 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1296_wiki_hop_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1296_wiki_hop_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1296_wiki_hop_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task129_scan_long_text_generation_action_command_short.json b/src/unitxt/catalog/cards/natural_instructions/train/task129_scan_long_text_generation_action_command_short.json new file mode 100644 index 000000000..f1c6a4d5d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task129_scan_long_text_generation_action_command_short.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task129_scan_long_text_generation_action_command_short.json", + 
"field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task129_scan_long_text_generation_action_command_short" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1308_amazonreview_category_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1308_amazonreview_category_classification.json new file mode 100644 index 000000000..a9580bb36 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1308_amazonreview_category_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1308_amazonreview_category_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1308_amazonreview_category_classification" + ] + }, + "templates": { 
+ "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1309_amazonreview_summary_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1309_amazonreview_summary_classification.json new file mode 100644 index 000000000..9a2435ab1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1309_amazonreview_summary_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1309_amazonreview_summary_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1309_amazonreview_summary_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task130_scan_structured_text_generation_command_action_long.json b/src/unitxt/catalog/cards/natural_instructions/train/task130_scan_structured_text_generation_command_action_long.json new file mode 100644 index 000000000..97bae2e3f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task130_scan_structured_text_generation_command_action_long.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task130_scan_structured_text_generation_command_action_long.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task130_scan_structured_text_generation_command_action_long" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1310_amazonreview_rating_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1310_amazonreview_rating_classification.json new file mode 100644 index 000000000..d03fb4c3b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1310_amazonreview_rating_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1310_amazonreview_rating_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task1310_amazonreview_rating_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1311_amazonreview_rating_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1311_amazonreview_rating_classification.json new file mode 100644 index 000000000..d4f8e656c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1311_amazonreview_rating_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1311_amazonreview_rating_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1311_amazonreview_rating_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1312_amazonreview_polarity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1312_amazonreview_polarity_classification.json new file mode 100644 index 000000000..20b85b5e6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1312_amazonreview_polarity_classification.json @@ 
-0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1312_amazonreview_polarity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1312_amazonreview_polarity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1313_amazonreview_polarity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1313_amazonreview_polarity_classification.json new file mode 100644 index 000000000..21664ffd5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1313_amazonreview_polarity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1313_amazonreview_polarity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + 
"metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1313_amazonreview_polarity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1314_country_abbreviation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1314_country_abbreviation.json new file mode 100644 index 000000000..768e42a22 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1314_country_abbreviation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1314_country_abbreviation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1314_country_abbreviation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1315_find_range_array.json b/src/unitxt/catalog/cards/natural_instructions/train/task1315_find_range_array.json new file mode 100644 index 000000000..75418d4e0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1315_find_range_array.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + 
"type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1315_find_range_array.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1315_find_range_array" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1316_remove_duplicates_string.json b/src/unitxt/catalog/cards/natural_instructions/train/task1316_remove_duplicates_string.json new file mode 100644 index 000000000..74bd1561b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1316_remove_duplicates_string.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1316_remove_duplicates_string.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1316_remove_duplicates_string" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1317_country_calling_code.json b/src/unitxt/catalog/cards/natural_instructions/train/task1317_country_calling_code.json new file mode 100644 index 000000000..07ad8bd38 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1317_country_calling_code.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1317_country_calling_code.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1317_country_calling_code" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1318_country_national_dish.json b/src/unitxt/catalog/cards/natural_instructions/train/task1318_country_national_dish.json new file mode 100644 index 000000000..90c87c0fc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1318_country_national_dish.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1318_country_national_dish.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1318_country_national_dish" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1319_country_by_barcode_prefix.json b/src/unitxt/catalog/cards/natural_instructions/train/task1319_country_by_barcode_prefix.json new file mode 100644 index 000000000..9be5504d7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1319_country_by_barcode_prefix.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1319_country_by_barcode_prefix.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1319_country_by_barcode_prefix" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task131_scan_long_text_generation_action_command_long.json b/src/unitxt/catalog/cards/natural_instructions/train/task131_scan_long_text_generation_action_command_long.json new file mode 100644 index 000000000..07ff92bf1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task131_scan_long_text_generation_action_command_long.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task131_scan_long_text_generation_action_command_long.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task131_scan_long_text_generation_action_command_long" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1320_country_domain_tld.json b/src/unitxt/catalog/cards/natural_instructions/train/task1320_country_domain_tld.json new file mode 100644 index 000000000..26af7a5f9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1320_country_domain_tld.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + 
"loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1320_country_domain_tld.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1320_country_domain_tld" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1321_country_continent.json b/src/unitxt/catalog/cards/natural_instructions/train/task1321_country_continent.json new file mode 100644 index 000000000..0cf1b3c69 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1321_country_continent.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1321_country_continent.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1321_country_continent" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1322_country_government_type.json b/src/unitxt/catalog/cards/natural_instructions/train/task1322_country_government_type.json new file mode 100644 index 000000000..eb62a288b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1322_country_government_type.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1322_country_government_type.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1322_country_government_type" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1325_qa_zre_question_generation_on_subject_relation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1325_qa_zre_question_generation_on_subject_relation.json new file mode 100644 index 000000000..5421606e1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1325_qa_zre_question_generation_on_subject_relation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1325_qa_zre_question_generation_on_subject_relation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1325_qa_zre_question_generation_on_subject_relation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1326_qa_zre_question_generation_from_answer.json b/src/unitxt/catalog/cards/natural_instructions/train/task1326_qa_zre_question_generation_from_answer.json new file mode 100644 index 000000000..19cc8dcb0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1326_qa_zre_question_generation_from_answer.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1326_qa_zre_question_generation_from_answer.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + 
"instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1326_qa_zre_question_generation_from_answer" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1327_qa_zre_answer_generation_from_question.json b/src/unitxt/catalog/cards/natural_instructions/train/task1327_qa_zre_answer_generation_from_question.json new file mode 100644 index 000000000..c4cfff8f1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1327_qa_zre_answer_generation_from_question.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1327_qa_zre_answer_generation_from_question.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1327_qa_zre_answer_generation_from_question" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1328_qa_zre_relation_generation_from_question.json b/src/unitxt/catalog/cards/natural_instructions/train/task1328_qa_zre_relation_generation_from_question.json new file mode 100644 index 000000000..4244e5ce5 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1328_qa_zre_relation_generation_from_question.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1328_qa_zre_relation_generation_from_question.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1328_qa_zre_relation_generation_from_question" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task132_dais_text_modification.json b/src/unitxt/catalog/cards/natural_instructions/train/task132_dais_text_modification.json new file mode 100644 index 000000000..bc1d38fff --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task132_dais_text_modification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task132_dais_text_modification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + 
"inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task132_dais_text_modification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1331_reverse_array.json b/src/unitxt/catalog/cards/natural_instructions/train/task1331_reverse_array.json new file mode 100644 index 000000000..212e79620 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1331_reverse_array.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1331_reverse_array.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1331_reverse_array" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1332_check_leap_year.json b/src/unitxt/catalog/cards/natural_instructions/train/task1332_check_leap_year.json new file mode 100644 index 000000000..d35ce8ca9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1332_check_leap_year.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": 
{ + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1332_check_leap_year.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1332_check_leap_year" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1333_check_validity_date_ddmmyyyy.json b/src/unitxt/catalog/cards/natural_instructions/train/task1333_check_validity_date_ddmmyyyy.json new file mode 100644 index 000000000..40d210a34 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1333_check_validity_date_ddmmyyyy.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1333_check_validity_date_ddmmyyyy.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1333_check_validity_date_ddmmyyyy" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1336_peixian_equity_evaluation_corpus_gender_classifier.json b/src/unitxt/catalog/cards/natural_instructions/train/task1336_peixian_equity_evaluation_corpus_gender_classifier.json new file mode 100644 index 000000000..7a4f6b4fc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1336_peixian_equity_evaluation_corpus_gender_classifier.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1336_peixian_equity_evaluation_corpus_gender_classifier.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1336_peixian_equity_evaluation_corpus_gender_classifier" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1338_peixian_equity_evaluation_corpus_sentiment_classifier.json b/src/unitxt/catalog/cards/natural_instructions/train/task1338_peixian_equity_evaluation_corpus_sentiment_classifier.json new file mode 100644 index 000000000..cd25017af --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1338_peixian_equity_evaluation_corpus_sentiment_classifier.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1338_peixian_equity_evaluation_corpus_sentiment_classifier.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1338_peixian_equity_evaluation_corpus_sentiment_classifier" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1339_peixian_equity_evaluation_corpus_text_completion.json b/src/unitxt/catalog/cards/natural_instructions/train/task1339_peixian_equity_evaluation_corpus_text_completion.json new file mode 100644 index 000000000..2793cb14d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1339_peixian_equity_evaluation_corpus_text_completion.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1339_peixian_equity_evaluation_corpus_text_completion.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": 
"copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1339_peixian_equity_evaluation_corpus_text_completion" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1340_msr_text_compression_compression.json b/src/unitxt/catalog/cards/natural_instructions/train/task1340_msr_text_compression_compression.json new file mode 100644 index 000000000..bb696672c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1340_msr_text_compression_compression.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1340_msr_text_compression_compression.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1340_msr_text_compression_compression" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1341_msr_text_classification.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1341_msr_text_classification.json new file mode 100644 index 000000000..48a11060e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1341_msr_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1341_msr_text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1341_msr_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1346_glue_cola_grammatical_correctness_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1346_glue_cola_grammatical_correctness_classification.json new file mode 100644 index 000000000..73d4ff971 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1346_glue_cola_grammatical_correctness_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1346_glue_cola_grammatical_correctness_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + 
"validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1346_glue_cola_grammatical_correctness_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1347_glue_sts_b_similarity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1347_glue_sts_b_similarity_classification.json new file mode 100644 index 000000000..37a9b1b67 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1347_glue_sts_b_similarity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1347_glue_sts-b_similarity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1347_glue_sts_b_similarity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1354_sent_comp_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1354_sent_comp_classification.json new file mode 100644 index 000000000..c0c44ee87 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1354_sent_comp_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1354_sent_comp_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1354_sent_comp_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1355_sent_comp_summarization.json b/src/unitxt/catalog/cards/natural_instructions/train/task1355_sent_comp_summarization.json new file mode 100644 index 000000000..ac6d08924 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1355_sent_comp_summarization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1355_sent_comp_summarization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + 
"validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1355_sent_comp_summarization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1359_numer_sense_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1359_numer_sense_answer_generation.json new file mode 100644 index 000000000..d537adb4e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1359_numer_sense_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1359_numer_sense_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1359_numer_sense_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1360_numer_sense_multiple_choice_qa_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1360_numer_sense_multiple_choice_qa_generation.json new file mode 100644 index 000000000..3322e1add --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1360_numer_sense_multiple_choice_qa_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1360_numer_sense_multiple_choice_qa_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1360_numer_sense_multiple_choice_qa_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1361_movierationales_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1361_movierationales_classification.json new file mode 100644 index 000000000..7ef8cf133 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1361_movierationales_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1361_movierationales_classification.json", + "field": "Instances", + "path": 
"json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1361_movierationales_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1364_hans_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1364_hans_answer_generation.json new file mode 100644 index 000000000..e8e1e27cd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1364_hans_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1364_hans_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1364_hans_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff 
--git a/src/unitxt/catalog/cards/natural_instructions/train/task1366_healthfact_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1366_healthfact_classification.json new file mode 100644 index 000000000..ccaea4180 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1366_healthfact_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1366_healthfact_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1366_healthfact_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1368_healthfact_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1368_healthfact_sentence_generation.json new file mode 100644 index 000000000..b234a8f75 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1368_healthfact_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1368_healthfact_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + 
"mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1368_healthfact_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1369_healthfact_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1369_healthfact_sentence_generation.json new file mode 100644 index 000000000..30ee13ee9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1369_healthfact_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1369_healthfact_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1369_healthfact_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1378_quarel_correct_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1378_quarel_correct_answer_generation.json new file mode 100644 index 000000000..5c954236b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1378_quarel_correct_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1378_quarel_correct_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1378_quarel_correct_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1379_quarel_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1379_quarel_incorrect_answer_generation.json new file mode 100644 index 000000000..32b994f51 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1379_quarel_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1379_quarel_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1379_quarel_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task137_detoxifying_lms_classification_toxicity.json b/src/unitxt/catalog/cards/natural_instructions/train/task137_detoxifying_lms_classification_toxicity.json new file mode 100644 index 000000000..4f6b93f67 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task137_detoxifying_lms_classification_toxicity.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task137_detoxifying-lms_classification_toxicity.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task137_detoxifying_lms_classification_toxicity" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1380_quarel_correct_option_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1380_quarel_correct_option_generation.json new file mode 100644 index 000000000..2dd90af45 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1380_quarel_correct_option_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1380_quarel_correct_option_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1380_quarel_correct_option_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1381_quarel_incorrect_option_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1381_quarel_incorrect_option_generation.json new file mode 100644 index 000000000..368476d67 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1381_quarel_incorrect_option_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1381_quarel_incorrect_option_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1381_quarel_incorrect_option_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1382_quarel_write_correct_answer.json b/src/unitxt/catalog/cards/natural_instructions/train/task1382_quarel_write_correct_answer.json new file mode 100644 index 000000000..4d1135829 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1382_quarel_write_correct_answer.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1382_quarel_write_correct_answer.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1382_quarel_write_correct_answer" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1383_quarel_write_incorrect_answer.json b/src/unitxt/catalog/cards/natural_instructions/train/task1383_quarel_write_incorrect_answer.json new file mode 100644 index 000000000..bd45e63be --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1383_quarel_write_incorrect_answer.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1383_quarel_write_incorrect_answer.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1383_quarel_write_incorrect_answer" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1384_deal_or_no_dialog_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1384_deal_or_no_dialog_classification.json new file mode 100644 index 000000000..874762242 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1384_deal_or_no_dialog_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1384_deal_or_no_dialog_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1384_deal_or_no_dialog_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1389_hellaswag_completion.json b/src/unitxt/catalog/cards/natural_instructions/train/task1389_hellaswag_completion.json new file mode 100644 index 000000000..a53b9e595 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1389_hellaswag_completion.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1389_hellaswag_completion.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1389_hellaswag_completion" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task138_detoxifying_lms_classification_fluency.json b/src/unitxt/catalog/cards/natural_instructions/train/task138_detoxifying_lms_classification_fluency.json new file mode 100644 index 000000000..863ea4bf7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task138_detoxifying_lms_classification_fluency.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task138_detoxifying-lms_classification_fluency.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task138_detoxifying_lms_classification_fluency" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1398_obqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1398_obqa_question_generation.json new file mode 100644 index 000000000..16ae1e285 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1398_obqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": 
"load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1398_obqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1398_obqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1399_obqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1399_obqa_answer_generation.json new file mode 100644 index 000000000..e6d0bdae7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1399_obqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1399_obqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1399_obqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task139_detoxifying_lms_classification_topicality.json b/src/unitxt/catalog/cards/natural_instructions/train/task139_detoxifying_lms_classification_topicality.json new file mode 100644 index 000000000..96bd336da --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task139_detoxifying_lms_classification_topicality.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task139_detoxifying-lms_classification_topicality.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task139_detoxifying_lms_classification_topicality" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1400_obqa_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1400_obqa_incorrect_answer_generation.json new file mode 100644 index 000000000..f99d762a0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1400_obqa_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": 
"task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1400_obqa_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1400_obqa_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1401_obqa_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1401_obqa_sentence_generation.json new file mode 100644 index 000000000..9c115b545 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1401_obqa_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1401_obqa_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task1401_obqa_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1403_check_validity_date_mmddyyyy.json b/src/unitxt/catalog/cards/natural_instructions/train/task1403_check_validity_date_mmddyyyy.json new file mode 100644 index 000000000..ba4730a31 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1403_check_validity_date_mmddyyyy.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1403_check_validity_date_mmddyyyy.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1403_check_validity_date_mmddyyyy" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1404_date_conversion.json b/src/unitxt/catalog/cards/natural_instructions/train/task1404_date_conversion.json new file mode 100644 index 000000000..28f13d5f8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1404_date_conversion.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1404_date_conversion.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1404_date_conversion" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1405_find_median.json b/src/unitxt/catalog/cards/natural_instructions/train/task1405_find_median.json new file mode 100644 index 000000000..75c150ad6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1405_find_median.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1405_find_median.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1405_find_median" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1406_kth_smallest_element.json b/src/unitxt/catalog/cards/natural_instructions/train/task1406_kth_smallest_element.json new file mode 100644 index 000000000..2fa063dfd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1406_kth_smallest_element.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1406_kth_smallest_element.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1406_kth_smallest_element" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task140_detoxifying_lms_classification_style.json b/src/unitxt/catalog/cards/natural_instructions/train/task140_detoxifying_lms_classification_style.json new file mode 100644 index 000000000..527954d63 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task140_detoxifying_lms_classification_style.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task140_detoxifying-lms_classification_style.json", + "field": "Instances", + "path": "json" + }, 
+ "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task140_detoxifying_lms_classification_style" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1412_web_questions_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task1412_web_questions_question_answering.json new file mode 100644 index 000000000..6825d83ab --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1412_web_questions_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1412_web_questions_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1412_web_questions_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + 
} +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1418_bless_semantic_relation_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1418_bless_semantic_relation_classification.json new file mode 100644 index 000000000..fe563e577 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1418_bless_semantic_relation_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1418_bless_semantic_relation_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1418_bless_semantic_relation_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1419_mathqa_gain.json b/src/unitxt/catalog/cards/natural_instructions/train/task1419_mathqa_gain.json new file mode 100644 index 000000000..026be7f74 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1419_mathqa_gain.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1419_mathqa_gain.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + 
"type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1419_mathqa_gain" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task141_odd_man_out_classification_category.json b/src/unitxt/catalog/cards/natural_instructions/train/task141_odd_man_out_classification_category.json new file mode 100644 index 000000000..4e7eb3dbd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task141_odd_man_out_classification_category.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task141_odd-man-out_classification_category.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task141_odd_man_out_classification_category" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1420_mathqa_general.json b/src/unitxt/catalog/cards/natural_instructions/train/task1420_mathqa_general.json new file mode 100644 index 000000000..7482a5c31 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1420_mathqa_general.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1420_mathqa_general.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1420_mathqa_general" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1421_mathqa_other.json b/src/unitxt/catalog/cards/natural_instructions/train/task1421_mathqa_other.json new file mode 100644 index 000000000..d71810f2a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1421_mathqa_other.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1421_mathqa_other.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + 
"field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1421_mathqa_other" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1422_mathqa_physics.json b/src/unitxt/catalog/cards/natural_instructions/train/task1422_mathqa_physics.json new file mode 100644 index 000000000..a8a73d25a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1422_mathqa_physics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1422_mathqa_physics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1422_mathqa_physics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1423_mathqa_geometry.json b/src/unitxt/catalog/cards/natural_instructions/train/task1423_mathqa_geometry.json new file mode 100644 index 000000000..199e5f296 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1423_mathqa_geometry.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1423_mathqa_geometry.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1423_mathqa_geometry" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1424_mathqa_probability.json b/src/unitxt/catalog/cards/natural_instructions/train/task1424_mathqa_probability.json new file mode 100644 index 000000000..b172e87b4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1424_mathqa_probability.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1424_mathqa_probability.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + 
] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1424_mathqa_probability" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1425_country_iso_numeric.json b/src/unitxt/catalog/cards/natural_instructions/train/task1425_country_iso_numeric.json new file mode 100644 index 000000000..cd35fbb98 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1425_country_iso_numeric.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1425_country_iso_numeric.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1425_country_iso_numeric" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1426_country_independence_year.json b/src/unitxt/catalog/cards/natural_instructions/train/task1426_country_independence_year.json new file mode 100644 index 000000000..57098a9e9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1426_country_independence_year.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1426_country_independence_year.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1426_country_independence_year" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1427_country_region_in_world.json b/src/unitxt/catalog/cards/natural_instructions/train/task1427_country_region_in_world.json new file mode 100644 index 000000000..9e0486f15 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1427_country_region_in_world.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1427_country_region_in_world.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1427_country_region_in_world" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1428_country_surface_area.json b/src/unitxt/catalog/cards/natural_instructions/train/task1428_country_surface_area.json new file mode 100644 index 000000000..4559bfa2c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1428_country_surface_area.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1428_country_surface_area.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1428_country_surface_area" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1429_evalution_semantic_relation_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1429_evalution_semantic_relation_classification.json new file mode 100644 index 000000000..5972b792d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1429_evalution_semantic_relation_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1429_evalution_semantic_relation_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1429_evalution_semantic_relation_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task142_odd_man_out_classification_no_category.json b/src/unitxt/catalog/cards/natural_instructions/train/task142_odd_man_out_classification_no_category.json new file mode 100644 index 000000000..61b215d8f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task142_odd_man_out_classification_no_category.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task142_odd-man-out_classification_no_category.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task142_odd_man_out_classification_no_category" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1431_head_qa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1431_head_qa_answer_generation.json new file mode 100644 index 000000000..7a0de9435 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1431_head_qa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1431_head_qa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1431_head_qa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1434_head_qa_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1434_head_qa_classification.json new file mode 100644 index 000000000..87c64290d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1434_head_qa_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1434_head_qa_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1434_head_qa_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task143_odd_man_out_classification_generate_category.json b/src/unitxt/catalog/cards/natural_instructions/train/task143_odd_man_out_classification_generate_category.json new file mode 100644 index 000000000..cf7a6765d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task143_odd_man_out_classification_generate_category.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task143_odd-man-out_classification_generate_category.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task143_odd_man_out_classification_generate_category" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1443_string_to_number.json b/src/unitxt/catalog/cards/natural_instructions/train/task1443_string_to_number.json new file mode 100644 index 000000000..171abf68a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1443_string_to_number.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1443_string_to_number.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1443_string_to_number" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1444_round_power_of_two.json b/src/unitxt/catalog/cards/natural_instructions/train/task1444_round_power_of_two.json new file mode 100644 index 000000000..f58aff83f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1444_round_power_of_two.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1444_round_power_of_two.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1444_round_power_of_two" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1445_closest_integers.json b/src/unitxt/catalog/cards/natural_instructions/train/task1445_closest_integers.json new file mode 100644 index 000000000..7b7f0d5e3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1445_closest_integers.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1445_closest_integers.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1445_closest_integers" + ] + }, + "templates": { + "type": 
"templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1446_farthest_integers.json b/src/unitxt/catalog/cards/natural_instructions/train/task1446_farthest_integers.json new file mode 100644 index 000000000..b4f6ec11e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1446_farthest_integers.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1446_farthest_integers.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1446_farthest_integers" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1447_drug_extraction_ade.json b/src/unitxt/catalog/cards/natural_instructions/train/task1447_drug_extraction_ade.json new file mode 100644 index 000000000..ae8329027 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1447_drug_extraction_ade.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1447_drug_extraction_ade.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1447_drug_extraction_ade" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1448_disease_entity_extraction_ncbi_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1448_disease_entity_extraction_ncbi_dataset.json new file mode 100644 index 000000000..1260175af --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1448_disease_entity_extraction_ncbi_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1448_disease_entity_extraction_ncbi_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1448_disease_entity_extraction_ncbi_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at 
end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1449_disease_entity_extraction_bc5cdr_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1449_disease_entity_extraction_bc5cdr_dataset.json new file mode 100644 index 000000000..3e6a827e5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1449_disease_entity_extraction_bc5cdr_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1449_disease_entity_extraction_bc5cdr_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1449_disease_entity_extraction_bc5cdr_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task144_subjqa_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task144_subjqa_question_answering.json new file mode 100644 index 000000000..a1c973810 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task144_subjqa_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task144_subjqa_question_answering.json", + "field": "Instances", + "path": "json" 
+ }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task144_subjqa_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1451_drug_dose_extraction.json b/src/unitxt/catalog/cards/natural_instructions/train/task1451_drug_dose_extraction.json new file mode 100644 index 000000000..23688787c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1451_drug_dose_extraction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1451_drug_dose_extraction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1451_drug_dose_extraction" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1452_location_entity_extraction_btc_corpus.json b/src/unitxt/catalog/cards/natural_instructions/train/task1452_location_entity_extraction_btc_corpus.json new file mode 100644 index 000000000..0f912b727 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1452_location_entity_extraction_btc_corpus.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1452_location_entity_extraction_btc_corpus.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1452_location_entity_extraction_btc_corpus" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1453_person_entity_extraction_btc_corpus.json b/src/unitxt/catalog/cards/natural_instructions/train/task1453_person_entity_extraction_btc_corpus.json new file mode 100644 index 000000000..4355016d9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1453_person_entity_extraction_btc_corpus.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1453_person_entity_extraction_btc_corpus.json", + "field": "Instances", + "path": 
"json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1453_person_entity_extraction_btc_corpus" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task145_afs_argument_similarity_death_penalty.json b/src/unitxt/catalog/cards/natural_instructions/train/task145_afs_argument_similarity_death_penalty.json new file mode 100644 index 000000000..2feb82de6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task145_afs_argument_similarity_death_penalty.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task145_afs_argument_similarity_death_penalty.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task145_afs_argument_similarity_death_penalty" + ] + }, + "templates": { + "type": "templates_list", + "items": [ 
+ "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task146_afs_argument_similarity_gun_control.json b/src/unitxt/catalog/cards/natural_instructions/train/task146_afs_argument_similarity_gun_control.json new file mode 100644 index 000000000..0e45cd41a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task146_afs_argument_similarity_gun_control.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task146_afs_argument_similarity_gun_control.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task146_afs_argument_similarity_gun_control" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1479_organization_entity_extraction_btc_corpus.json b/src/unitxt/catalog/cards/natural_instructions/train/task1479_organization_entity_extraction_btc_corpus.json new file mode 100644 index 000000000..6aceb206b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1479_organization_entity_extraction_btc_corpus.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1479_organization_entity_extraction_btc_corpus.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1479_organization_entity_extraction_btc_corpus" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task147_afs_argument_similarity_gay_marriage.json b/src/unitxt/catalog/cards/natural_instructions/train/task147_afs_argument_similarity_gay_marriage.json new file mode 100644 index 000000000..8c97a9742 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task147_afs_argument_similarity_gay_marriage.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task147_afs_argument_similarity_gay_marriage.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", 
+ "items": [ + "instructions.natural_instructions.train.task147_afs_argument_similarity_gay_marriage" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1480_gene_extraction_jnlpba_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1480_gene_extraction_jnlpba_dataset.json new file mode 100644 index 000000000..d4894ef13 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1480_gene_extraction_jnlpba_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1480_gene_extraction_jnlpba_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1480_gene_extraction_jnlpba_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1481_gene_extraction_bc2gm_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1481_gene_extraction_bc2gm_dataset.json new file mode 100644 index 000000000..63974bfb8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1481_gene_extraction_bc2gm_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + 
"type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1481_gene_extraction_bc2gm_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1481_gene_extraction_bc2gm_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1482_gene_extraction_chemprot_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1482_gene_extraction_chemprot_dataset.json new file mode 100644 index 000000000..3bb2f5178 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1482_gene_extraction_chemprot_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1482_gene_extraction_chemprot_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", 
+ "items": [ + "instructions.natural_instructions.train.task1482_gene_extraction_chemprot_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1483_chemical_extraction_chemprot_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1483_chemical_extraction_chemprot_dataset.json new file mode 100644 index 000000000..12af29cd5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1483_chemical_extraction_chemprot_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1483_chemical_extraction_chemprot_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1483_chemical_extraction_chemprot_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1484_gene_extraction_linnaeus_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1484_gene_extraction_linnaeus_dataset.json new file mode 100644 index 000000000..1075b45ae --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1484_gene_extraction_linnaeus_dataset.json @@ -0,0 +1,53 @@ +{ + "type": 
"task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1484_gene_extraction_linnaeus_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1484_gene_extraction_linnaeus_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1485_organ_extraction_anem_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1485_organ_extraction_anem_dataset.json new file mode 100644 index 000000000..8f2abefea --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1485_organ_extraction_anem_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1485_organ_extraction_anem_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + 
"type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1485_organ_extraction_anem_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1486_cell_extraction_anem_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1486_cell_extraction_anem_dataset.json new file mode 100644 index 000000000..06f39564b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1486_cell_extraction_anem_dataset.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1486_cell_extraction_anem_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1486_cell_extraction_anem_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1487_organism_substance_extraction_anem_dataset.json b/src/unitxt/catalog/cards/natural_instructions/train/task1487_organism_substance_extraction_anem_dataset.json new file mode 100644 index 000000000..b8aea7f62 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1487_organism_substance_extraction_anem_dataset.json @@ -0,0 +1,53 
@@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1487_organism_substance_extraction_anem_dataset.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1487_organism_substance_extraction_anem_dataset" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1488_sarcasmdetection_headline_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1488_sarcasmdetection_headline_classification.json new file mode 100644 index 000000000..8908e67f2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1488_sarcasmdetection_headline_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1488_sarcasmdetection_headline_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + 
"target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1488_sarcasmdetection_headline_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1489_sarcasmdetection_tweet_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1489_sarcasmdetection_tweet_classification.json new file mode 100644 index 000000000..6100a4d80 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1489_sarcasmdetection_tweet_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1489_sarcasmdetection_tweet_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1489_sarcasmdetection_tweet_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task148_afs_argument_quality_gay_marriage.json b/src/unitxt/catalog/cards/natural_instructions/train/task148_afs_argument_quality_gay_marriage.json new file mode 100644 index 000000000..a564933e8 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task148_afs_argument_quality_gay_marriage.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task148_afs_argument_quality_gay_marriage.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task148_afs_argument_quality_gay_marriage" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1495_adverse_drug_event_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1495_adverse_drug_event_classification.json new file mode 100644 index 000000000..c44a1ea77 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1495_adverse_drug_event_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1495_adverse_drug_event_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + 
"type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1495_adverse_drug_event_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1498_24hour_to_12hour_clock.json b/src/unitxt/catalog/cards/natural_instructions/train/task1498_24hour_to_12hour_clock.json new file mode 100644 index 000000000..f72dbbf92 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1498_24hour_to_12hour_clock.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1498_24hour_to_12hour_clock.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1498_24hour_to_12hour_clock" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1499_dstc3_summarization.json b/src/unitxt/catalog/cards/natural_instructions/train/task1499_dstc3_summarization.json new file mode 100644 index 000000000..52ad60c87 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1499_dstc3_summarization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1499_dstc3_summarization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1499_dstc3_summarization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task149_afs_argument_quality_death_penalty.json b/src/unitxt/catalog/cards/natural_instructions/train/task149_afs_argument_quality_death_penalty.json new file mode 100644 index 000000000..3790017e2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task149_afs_argument_quality_death_penalty.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task149_afs_argument_quality_death_penalty.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + 
"input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task149_afs_argument_quality_death_penalty" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1500_dstc3_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1500_dstc3_classification.json new file mode 100644 index 000000000..6e556b878 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1500_dstc3_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1500_dstc3_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1500_dstc3_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1501_dstc3_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1501_dstc3_answer_generation.json new file mode 100644 index 000000000..7671196ab --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1501_dstc3_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1501_dstc3_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1501_dstc3_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1502_hatexplain_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1502_hatexplain_classification.json new file mode 100644 index 000000000..9f62ee994 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1502_hatexplain_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1502_hatexplain_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": 
[ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1502_hatexplain_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1503_hatexplain_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1503_hatexplain_classification.json new file mode 100644 index 000000000..5b7502b15 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1503_hatexplain_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1503_hatexplain_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1503_hatexplain_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1504_hatexplain_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1504_hatexplain_answer_generation.json new file mode 100644 index 000000000..e679b7c2b --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1504_hatexplain_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1504_hatexplain_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1504_hatexplain_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1505_root09_semantic_relation_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1505_root09_semantic_relation_classification.json new file mode 100644 index 000000000..afabc8ee7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1505_root09_semantic_relation_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1505_root09_semantic_relation_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + 
"task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1505_root09_semantic_relation_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1506_celebrity_minimal_dob_span.json b/src/unitxt/catalog/cards/natural_instructions/train/task1506_celebrity_minimal_dob_span.json new file mode 100644 index 000000000..c460f5833 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1506_celebrity_minimal_dob_span.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1506_celebrity_minimal_dob_span.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1506_celebrity_minimal_dob_span" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1507_boolean_temporal_reasoning.json b/src/unitxt/catalog/cards/natural_instructions/train/task1507_boolean_temporal_reasoning.json new file mode 100644 index 000000000..fe8b73dba --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task1507_boolean_temporal_reasoning.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1507_boolean_temporal_reasoning.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1507_boolean_temporal_reasoning" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1508_wordnet_antonyms.json b/src/unitxt/catalog/cards/natural_instructions/train/task1508_wordnet_antonyms.json new file mode 100644 index 000000000..cfd3fd300 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1508_wordnet_antonyms.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1508_wordnet_antonyms.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + 
"metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1508_wordnet_antonyms" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1509_evalution_antonyms.json b/src/unitxt/catalog/cards/natural_instructions/train/task1509_evalution_antonyms.json new file mode 100644 index 000000000..009fc44aa --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1509_evalution_antonyms.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1509_evalution_antonyms.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1509_evalution_antonyms" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task150_afs_argument_quality_gun_control.json b/src/unitxt/catalog/cards/natural_instructions/train/task150_afs_argument_quality_gun_control.json new file mode 100644 index 000000000..53f0f89cc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task150_afs_argument_quality_gun_control.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + 
"loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task150_afs_argument_quality_gun_control.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task150_afs_argument_quality_gun_control" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1510_evalution_relation_extraction.json b/src/unitxt/catalog/cards/natural_instructions/train/task1510_evalution_relation_extraction.json new file mode 100644 index 000000000..bb0f8f284 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1510_evalution_relation_extraction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1510_evalution_relation_extraction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task1510_evalution_relation_extraction" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1517_limit_classfication.json b/src/unitxt/catalog/cards/natural_instructions/train/task1517_limit_classfication.json new file mode 100644 index 000000000..ed3d0b3bd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1517_limit_classfication.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1517_limit_classfication.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1517_limit_classfication" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1518_limit_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1518_limit_answer_generation.json new file mode 100644 index 000000000..b37520f2d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1518_limit_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1518_limit_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1518_limit_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1519_qa_srl_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1519_qa_srl_question_generation.json new file mode 100644 index 000000000..231b394d1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1519_qa_srl_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1519_qa_srl_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1519_qa_srl_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task151_tomqa_find_location_easy_clean.json b/src/unitxt/catalog/cards/natural_instructions/train/task151_tomqa_find_location_easy_clean.json new file mode 100644 index 000000000..ec7610079 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task151_tomqa_find_location_easy_clean.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task151_tomqa_find_location_easy_clean.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task151_tomqa_find_location_easy_clean" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1520_qa_srl_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1520_qa_srl_answer_generation.json new file mode 100644 index 000000000..20e2efed7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1520_qa_srl_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1520_qa_srl_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1520_qa_srl_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task152_tomqa_find_location_easy_noise.json b/src/unitxt/catalog/cards/natural_instructions/train/task152_tomqa_find_location_easy_noise.json new file mode 100644 index 000000000..aa3c4b02a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task152_tomqa_find_location_easy_noise.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task152_tomqa_find_location_easy_noise.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task152_tomqa_find_location_easy_noise" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task153_tomqa_find_location_hard_clean.json b/src/unitxt/catalog/cards/natural_instructions/train/task153_tomqa_find_location_hard_clean.json new file mode 100644 index 000000000..46e55c6c2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task153_tomqa_find_location_hard_clean.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task153_tomqa_find_location_hard_clean.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task153_tomqa_find_location_hard_clean" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1541_agnews_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1541_agnews_classification.json new file mode 100644 index 000000000..9549811e8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1541_agnews_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1541_agnews_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1541_agnews_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1542_every_ith_element_from_starting.json b/src/unitxt/catalog/cards/natural_instructions/train/task1542_every_ith_element_from_starting.json new file mode 100644 index 000000000..57e058def --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1542_every_ith_element_from_starting.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1542_every_ith_element_from_starting.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1542_every_ith_element_from_starting" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1548_wiqa_binary_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1548_wiqa_binary_classification.json new file mode 100644 index 000000000..4a671da9c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1548_wiqa_binary_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1548_wiqa_binary_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1548_wiqa_binary_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1549_wiqa_answer_generation_missing_step.json b/src/unitxt/catalog/cards/natural_instructions/train/task1549_wiqa_answer_generation_missing_step.json new file mode 100644 index 000000000..ce8382a11 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1549_wiqa_answer_generation_missing_step.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1549_wiqa_answer_generation_missing_step.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1549_wiqa_answer_generation_missing_step" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task154_tomqa_find_location_hard_noise.json b/src/unitxt/catalog/cards/natural_instructions/train/task154_tomqa_find_location_hard_noise.json new file mode 100644 index 000000000..5f9891b69 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task154_tomqa_find_location_hard_noise.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task154_tomqa_find_location_hard_noise.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task154_tomqa_find_location_hard_noise" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1551_every_ith_element_from_kth_element.json b/src/unitxt/catalog/cards/natural_instructions/train/task1551_every_ith_element_from_kth_element.json new file mode 100644 index 000000000..6ef23dced --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1551_every_ith_element_from_kth_element.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1551_every_ith_element_from_kth_element.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1551_every_ith_element_from_kth_element" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1553_cnn_dailymail_summarization.json b/src/unitxt/catalog/cards/natural_instructions/train/task1553_cnn_dailymail_summarization.json new file mode 100644 index 000000000..4430cdffa --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1553_cnn_dailymail_summarization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": 
"load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1553_cnn_dailymail_summarization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1553_cnn_dailymail_summarization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1559_blimp_binary_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1559_blimp_binary_classification.json new file mode 100644 index 000000000..11ea59a52 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1559_blimp_binary_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1559_blimp_binary_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1559_blimp_binary_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task155_count_nouns_verbs.json b/src/unitxt/catalog/cards/natural_instructions/train/task155_count_nouns_verbs.json new file mode 100644 index 000000000..4122b9039 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task155_count_nouns_verbs.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task155_count_nouns_verbs.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task155_count_nouns_verbs" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1560_blimp_binary_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1560_blimp_binary_classification.json new file mode 100644 index 000000000..8c2f34007 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1560_blimp_binary_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1560_blimp_binary_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1560_blimp_binary_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1564_triviaqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1564_triviaqa_answer_generation.json new file mode 100644 index 000000000..e24fc1dd7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1564_triviaqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1564_triviaqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1564_triviaqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1565_triviaqa_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1565_triviaqa_classification.json new file mode 100644 index 000000000..22f5bd9b2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1565_triviaqa_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1565_triviaqa_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1565_triviaqa_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1566_propara_structured_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1566_propara_structured_text_generation.json new file mode 100644 index 000000000..6505d8be8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1566_propara_structured_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1566_propara_structured_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1566_propara_structured_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1567_propara_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1567_propara_question_generation.json new file mode 100644 index 000000000..a4475bb6c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1567_propara_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1567_propara_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1567_propara_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1568_propara_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1568_propara_classification.json new file mode 100644 index 000000000..2ed7ed30c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1568_propara_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1568_propara_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1568_propara_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task156_codah_classification_adversarial.json b/src/unitxt/catalog/cards/natural_instructions/train/task156_codah_classification_adversarial.json new file mode 100644 index 000000000..00379dd26 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task156_codah_classification_adversarial.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task156_codah_classification_adversarial.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task156_codah_classification_adversarial" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1572_samsum_summary.json b/src/unitxt/catalog/cards/natural_instructions/train/task1572_samsum_summary.json new file mode 100644 index 000000000..22361fb69 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1572_samsum_summary.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1572_samsum_summary.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1572_samsum_summary" + ] + }, + 
"templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1573_samsum_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1573_samsum_classification.json new file mode 100644 index 000000000..7421c4258 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1573_samsum_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1573_samsum_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1573_samsum_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task157_count_vowels_and_consonants.json b/src/unitxt/catalog/cards/natural_instructions/train/task157_count_vowels_and_consonants.json new file mode 100644 index 000000000..13abedd41 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task157_count_vowels_and_consonants.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task157_count_vowels_and_consonants.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task157_count_vowels_and_consonants" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1580_eqasc_perturbed_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1580_eqasc_perturbed_question_generation.json new file mode 100644 index 000000000..3dea832d1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1580_eqasc_perturbed_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1580_eqasc-perturbed_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1580_eqasc_perturbed_question_generation" + ] + }, + "templates": { + "type": "templates_list", + 
"items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1581_eqasc_perturbed_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1581_eqasc_perturbed_answer_generation.json new file mode 100644 index 000000000..c8dcc1356 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1581_eqasc_perturbed_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1581_eqasc-perturbed_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1581_eqasc_perturbed_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1582_bless_hypernym_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1582_bless_hypernym_generation.json new file mode 100644 index 000000000..f63074364 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1582_bless_hypernym_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1582_bless_hypernym_generation.json", + 
"field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1582_bless_hypernym_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1583_bless_meronym_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1583_bless_meronym_classification.json new file mode 100644 index 000000000..3d2358765 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1583_bless_meronym_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1583_bless_meronym_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1583_bless_meronym_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1584_evalution_meronym_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1584_evalution_meronym_classification.json new file mode 100644 index 000000000..8b7a9e551 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1584_evalution_meronym_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1584_evalution_meronym_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1584_evalution_meronym_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1585_root09_hypernym_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1585_root09_hypernym_generation.json new file mode 100644 index 000000000..0e873ec53 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1585_root09_hypernym_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1585_root09_hypernym_generation.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1585_root09_hypernym_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task158_count_frequency_of_words.json b/src/unitxt/catalog/cards/natural_instructions/train/task158_count_frequency_of_words.json new file mode 100644 index 000000000..bea88dc89 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task158_count_frequency_of_words.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task158_count_frequency_of_words.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task158_count_frequency_of_words" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline 
at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1590_diplomacy_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1590_diplomacy_text_generation.json new file mode 100644 index 000000000..cb9cc9e9e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1590_diplomacy_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1590_diplomacy_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1590_diplomacy_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1592_yahoo_answers_topics_classfication.json b/src/unitxt/catalog/cards/natural_instructions/train/task1592_yahoo_answers_topics_classfication.json new file mode 100644 index 000000000..019600084 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1592_yahoo_answers_topics_classfication.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1592_yahoo_answers_topics_classfication.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { 
+ "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1592_yahoo_answers_topics_classfication" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1593_yahoo_answers_topics_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1593_yahoo_answers_topics_classification.json new file mode 100644 index 000000000..2253a56d1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1593_yahoo_answers_topics_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1593_yahoo_answers_topics_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1593_yahoo_answers_topics_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No 
newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1594_yahoo_answers_topics_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1594_yahoo_answers_topics_question_generation.json new file mode 100644 index 000000000..498a3af9c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1594_yahoo_answers_topics_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1594_yahoo_answers_topics_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1594_yahoo_answers_topics_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1595_event2mind_text_generation_1.json b/src/unitxt/catalog/cards/natural_instructions/train/task1595_event2mind_text_generation_1.json new file mode 100644 index 000000000..0e9e30907 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1595_event2mind_text_generation_1.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1595_event2mind_text_generation_1.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1595_event2mind_text_generation_1" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1596_event2mind_text_generation_2.json b/src/unitxt/catalog/cards/natural_instructions/train/task1596_event2mind_text_generation_2.json new file mode 100644 index 000000000..08f4ba0b4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1596_event2mind_text_generation_2.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1596_event2mind_text_generation_2.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1596_event2mind_text_generation_2" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1599_smcalflow_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1599_smcalflow_classification.json new file mode 100644 index 000000000..007606a75 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1599_smcalflow_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1599_smcalflow_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1599_smcalflow_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task159_check_frequency_of_words_in_sentence_pair.json b/src/unitxt/catalog/cards/natural_instructions/train/task159_check_frequency_of_words_in_sentence_pair.json new file mode 100644 index 000000000..5c3e0277f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task159_check_frequency_of_words_in_sentence_pair.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task159_check_frequency_of_words_in_sentence_pair.json", + 
"field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task159_check_frequency_of_words_in_sentence_pair" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1600_smcalflow_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1600_smcalflow_sentence_generation.json new file mode 100644 index 000000000..ce56684ae --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1600_smcalflow_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1600_smcalflow_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1600_smcalflow_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": 
[ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1601_webquestions_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1601_webquestions_answer_generation.json new file mode 100644 index 000000000..3556464a8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1601_webquestions_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1601_webquestions_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1601_webquestions_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1602_webquestion_question_genreation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1602_webquestion_question_genreation.json new file mode 100644 index 000000000..b7cfdd119 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1602_webquestion_question_genreation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1602_webquestion_question_genreation.json", + 
"field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1602_webquestion_question_genreation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1603_smcalflow_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1603_smcalflow_sentence_generation.json new file mode 100644 index 000000000..b5796b2de --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1603_smcalflow_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1603_smcalflow_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1603_smcalflow_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1604_ethos_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1604_ethos_text_classification.json new file mode 100644 index 000000000..ba0e9dc9e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1604_ethos_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1604_ethos_text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1604_ethos_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1605_ethos_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1605_ethos_text_classification.json new file mode 100644 index 000000000..72e3fa252 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1605_ethos_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1605_ethos_text_classification.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1605_ethos_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1606_ethos_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1606_ethos_text_classification.json new file mode 100644 index 000000000..cf3659650 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1606_ethos_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1606_ethos_text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1606_ethos_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1607_ethos_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1607_ethos_text_classification.json new file mode 100644 index 000000000..655be328b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1607_ethos_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1607_ethos_text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1607_ethos_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1608_xquad_en_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1608_xquad_en_answer_generation.json new file mode 100644 index 000000000..86ad39c11 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1608_xquad_en_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1608_xquad_en_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": 
"train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1608_xquad_en_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1609_xquad_en_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1609_xquad_en_question_generation.json new file mode 100644 index 000000000..91dab8938 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1609_xquad_en_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1609_xquad_en_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1609_xquad_en_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task160_replace_letter_in_a_sentence.json b/src/unitxt/catalog/cards/natural_instructions/train/task160_replace_letter_in_a_sentence.json new file mode 100644 index 000000000..fec5f8432 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task160_replace_letter_in_a_sentence.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task160_replace_letter_in_a_sentence.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task160_replace_letter_in_a_sentence" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task161_count_words_containing_letter.json b/src/unitxt/catalog/cards/natural_instructions/train/task161_count_words_containing_letter.json new file mode 100644 index 000000000..2e5ef7cb6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task161_count_words_containing_letter.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task161_count_words_containing_letter.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": 
{ + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task161_count_words_containing_letter" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task162_count_words_starting_with_letter.json b/src/unitxt/catalog/cards/natural_instructions/train/task162_count_words_starting_with_letter.json new file mode 100644 index 000000000..703b981dc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task162_count_words_starting_with_letter.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task162_count_words_starting_with_letter.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task162_count_words_starting_with_letter" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task163_count_words_ending_with_letter.json b/src/unitxt/catalog/cards/natural_instructions/train/task163_count_words_ending_with_letter.json new file mode 100644 index 000000000..67484f954 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task163_count_words_ending_with_letter.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task163_count_words_ending_with_letter.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task163_count_words_ending_with_letter" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1645_medical_question_pair_dataset_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1645_medical_question_pair_dataset_text_classification.json new file mode 100644 index 000000000..71e82cb41 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1645_medical_question_pair_dataset_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1645_medical_question_pair_dataset_text_classification.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1645_medical_question_pair_dataset_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task164_mcscript_question_answering_text.json b/src/unitxt/catalog/cards/natural_instructions/train/task164_mcscript_question_answering_text.json new file mode 100644 index 000000000..5847a24d0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task164_mcscript_question_answering_text.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task164_mcscript_question_answering_text.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task164_mcscript_question_answering_text" + ] + }, + "templates": { + "type": "templates_list", + 
"items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1656_gooaq_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1656_gooaq_answer_generation.json new file mode 100644 index 000000000..1295f4aef --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1656_gooaq_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1656_gooaq_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1656_gooaq_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1657_gooaq_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1657_gooaq_question_generation.json new file mode 100644 index 000000000..8365a71d7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1657_gooaq_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1657_gooaq_question_generation.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1657_gooaq_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task165_mcscript_question_answering_commonsense.json b/src/unitxt/catalog/cards/natural_instructions/train/task165_mcscript_question_answering_commonsense.json new file mode 100644 index 000000000..8a00cc8b7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task165_mcscript_question_answering_commonsense.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task165_mcscript_question_answering_commonsense.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task165_mcscript_question_answering_commonsense" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1660_super_glue_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1660_super_glue_question_generation.json new file mode 100644 index 000000000..ed5220341 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1660_super_glue_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1660_super_glue_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1660_super_glue_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1661_super_glue_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1661_super_glue_classification.json new file mode 100644 index 000000000..96e3bb2b5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1661_super_glue_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1661_super_glue_classification.json", + "field": "Instances", + "path": 
"json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1661_super_glue_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1665_trainglecopa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1665_trainglecopa_question_generation.json new file mode 100644 index 000000000..c42cf244a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1665_trainglecopa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1665_trainglecopa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1665_trainglecopa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] 
+ } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1669_md_gender_bias_text_modification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1669_md_gender_bias_text_modification.json new file mode 100644 index 000000000..0882c37c3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1669_md_gender_bias_text_modification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1669_md_gender_bias_text_modification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1669_md_gender_bias_text_modification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task166_clariq_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task166_clariq_sentence_generation.json new file mode 100644 index 000000000..44612a85e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task166_clariq_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task166_clariq_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task166_clariq_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1670_md_gender_bias_text_modification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1670_md_gender_bias_text_modification.json new file mode 100644 index 000000000..969b8e708 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1670_md_gender_bias_text_modification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1670_md_gender_bias_text_modification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1670_md_gender_bias_text_modification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No 
newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1678_mathqa_answer_selection.json b/src/unitxt/catalog/cards/natural_instructions/train/task1678_mathqa_answer_selection.json new file mode 100644 index 000000000..b6e15b784 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1678_mathqa_answer_selection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1678_mathqa_answer_selection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1678_mathqa_answer_selection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task167_strategyqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task167_strategyqa_question_generation.json new file mode 100644 index 000000000..c41dfe97c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task167_strategyqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task167_strategyqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task167_strategyqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task168_strategyqa_question_decomposition.json b/src/unitxt/catalog/cards/natural_instructions/train/task168_strategyqa_question_decomposition.json new file mode 100644 index 000000000..02ee49143 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task168_strategyqa_question_decomposition.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task168_strategyqa_question_decomposition.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task168_strategyqa_question_decomposition" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task169_strategyqa_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task169_strategyqa_sentence_generation.json new file mode 100644 index 000000000..84e7355f4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task169_strategyqa_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task169_strategyqa_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task169_strategyqa_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1703_ljspeech_textmodification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1703_ljspeech_textmodification.json new file mode 100644 index 000000000..519060732 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1703_ljspeech_textmodification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1703_ljspeech_textmodification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { 
+ "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1703_ljspeech_textmodification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1704_ljspeech_textmodification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1704_ljspeech_textmodification.json new file mode 100644 index 000000000..b6549cc3a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1704_ljspeech_textmodification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1704_ljspeech_textmodification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1704_ljspeech_textmodification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task1705_ljspeech_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1705_ljspeech_classification.json new file mode 100644 index 000000000..b72aaf268 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1705_ljspeech_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1705_ljspeech_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1705_ljspeech_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1706_ljspeech_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1706_ljspeech_classification.json new file mode 100644 index 000000000..acb0a9a42 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1706_ljspeech_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1706_ljspeech_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + 
"validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1706_ljspeech_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task170_hotpotqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task170_hotpotqa_answer_generation.json new file mode 100644 index 000000000..be50fc4e3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task170_hotpotqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task170_hotpotqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task170_hotpotqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1711_poki_text_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1711_poki_text_generation.json new file mode 100644 index 000000000..9176e46df --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1711_poki_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1711_poki_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1711_poki_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1712_poki_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1712_poki_classification.json new file mode 100644 index 000000000..1be8eb431 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1712_poki_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1712_poki_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + 
"target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1712_poki_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1713_convai3_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1713_convai3_sentence_generation.json new file mode 100644 index 000000000..3986d50e1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1713_convai3_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1713_convai3_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1713_convai3_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1714_convai3_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1714_convai3_sentence_generation.json new file mode 100644 index 
000000000..902fc372b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1714_convai3_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1714_convai3_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1714_convai3_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1720_civil_comments_toxicity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1720_civil_comments_toxicity_classification.json new file mode 100644 index 000000000..0ea1236c6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1720_civil_comments_toxicity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1720_civil_comments_toxicity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + 
"use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1720_civil_comments_toxicity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1721_civil_comments_obscenity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1721_civil_comments_obscenity_classification.json new file mode 100644 index 000000000..987175cfe --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1721_civil_comments_obscenity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1721_civil_comments_obscenity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1721_civil_comments_obscenity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1722_civil_comments_threat_classification.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task1722_civil_comments_threat_classification.json new file mode 100644 index 000000000..d60360167 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1722_civil_comments_threat_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1722_civil_comments_threat_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1722_civil_comments_threat_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1723_civil_comments_sexuallyexplicit_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1723_civil_comments_sexuallyexplicit_classification.json new file mode 100644 index 000000000..786502fb1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1723_civil_comments_sexuallyexplicit_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1723_civil_comments_sexuallyexplicit_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1723_civil_comments_sexuallyexplicit_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1724_civil_comments_insult_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1724_civil_comments_insult_classification.json new file mode 100644 index 000000000..2b69733b6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1724_civil_comments_insult_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1724_civil_comments_insult_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1724_civil_comments_insult_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ 
No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1725_civil_comments_severtoxicity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task1725_civil_comments_severtoxicity_classification.json new file mode 100644 index 000000000..43ca265ea --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1725_civil_comments_severtoxicity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1725_civil_comments_severtoxicity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1725_civil_comments_severtoxicity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1726_mathqa_correct_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task1726_mathqa_correct_answer_generation.json new file mode 100644 index 000000000..dda7fd5e3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1726_mathqa_correct_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1726_mathqa_correct_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1726_mathqa_correct_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1727_wiqa_what_is_the_effect.json b/src/unitxt/catalog/cards/natural_instructions/train/task1727_wiqa_what_is_the_effect.json new file mode 100644 index 000000000..e0a786cf4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1727_wiqa_what_is_the_effect.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1727_wiqa_what_is_the_effect.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1727_wiqa_what_is_the_effect" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1729_personachat_generate_next.json b/src/unitxt/catalog/cards/natural_instructions/train/task1729_personachat_generate_next.json new file mode 100644 index 000000000..745cd3f0d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1729_personachat_generate_next.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1729_personachat_generate_next.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1729_personachat_generate_next" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1730_personachat_choose_next.json b/src/unitxt/catalog/cards/natural_instructions/train/task1730_personachat_choose_next.json new file mode 100644 index 000000000..96213cf56 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1730_personachat_choose_next.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1730_personachat_choose_next.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task1730_personachat_choose_next" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task1731_quartz_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task1731_quartz_question_answering.json new file mode 100644 index 000000000..2258dd5d6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task1731_quartz_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task1731_quartz_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task1731_quartz_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task176_break_decompose_questions.json b/src/unitxt/catalog/cards/natural_instructions/train/task176_break_decompose_questions.json new file mode 100644 index 000000000..d57efc967 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task176_break_decompose_questions.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task176_break_decompose_questions.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task176_break_decompose_questions" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task177_para_nmt_paraphrasing.json b/src/unitxt/catalog/cards/natural_instructions/train/task177_para_nmt_paraphrasing.json new file mode 100644 index 000000000..733d5f818 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task177_para_nmt_paraphrasing.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task177_para-nmt_paraphrasing.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task177_para_nmt_paraphrasing" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task178_quartz_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task178_quartz_question_answering.json new file mode 100644 index 000000000..1ea5d1046 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task178_quartz_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task178_quartz_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task178_quartz_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task179_participant_extraction.json b/src/unitxt/catalog/cards/natural_instructions/train/task179_participant_extraction.json new file mode 100644 index 000000000..55ceac0e7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task179_participant_extraction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task179_participant_extraction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task179_participant_extraction" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task180_intervention_extraction.json b/src/unitxt/catalog/cards/natural_instructions/train/task180_intervention_extraction.json new file mode 100644 index 000000000..2534d143e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task180_intervention_extraction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task180_intervention_extraction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task180_intervention_extraction" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task181_outcome_extraction.json b/src/unitxt/catalog/cards/natural_instructions/train/task181_outcome_extraction.json new file mode 100644 index 000000000..7f25716dc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task181_outcome_extraction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task181_outcome_extraction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task181_outcome_extraction" + ] + }, + "templates": { 
+ "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task182_duorc_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task182_duorc_question_generation.json new file mode 100644 index 000000000..9f40c333c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task182_duorc_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task182_duorc_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task182_duorc_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task183_rhyme_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task183_rhyme_generation.json new file mode 100644 index 000000000..3c0f11a92 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task183_rhyme_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task183_rhyme_generation.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task183_rhyme_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task184_break_generate_question.json b/src/unitxt/catalog/cards/natural_instructions/train/task184_break_generate_question.json new file mode 100644 index 000000000..da1215e9b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task184_break_generate_question.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task184_break_generate_question.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task184_break_generate_question" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task191_hotpotqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task191_hotpotqa_question_generation.json new file mode 100644 index 000000000..84f5b452c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task191_hotpotqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task191_hotpotqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task191_hotpotqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task192_hotpotqa_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task192_hotpotqa_sentence_generation.json new file mode 100644 index 000000000..8bfd99048 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task192_hotpotqa_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task192_hotpotqa_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + 
"train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task192_hotpotqa_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task193_duorc_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task193_duorc_question_generation.json new file mode 100644 index 000000000..ad2ae0e9e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task193_duorc_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task193_duorc_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task193_duorc_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task194_duorc_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task194_duorc_answer_generation.json new file mode 100644 index 000000000..34428141d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task194_duorc_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task194_duorc_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task194_duorc_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task195_sentiment140_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task195_sentiment140_classification.json new file mode 100644 index 000000000..08767efb7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task195_sentiment140_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task195_sentiment140_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + 
"validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task195_sentiment140_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task196_sentiment140_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task196_sentiment140_answer_generation.json new file mode 100644 index 000000000..eccf1d322 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task196_sentiment140_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task196_sentiment140_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task196_sentiment140_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task205_remove_even_elements.json b/src/unitxt/catalog/cards/natural_instructions/train/task205_remove_even_elements.json new file mode 100644 index 000000000..49aceac93 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task205_remove_even_elements.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task205_remove_even_elements.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task205_remove_even_elements" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task206_collatz_conjecture.json b/src/unitxt/catalog/cards/natural_instructions/train/task206_collatz_conjecture.json new file mode 100644 index 000000000..fa0f4fcb1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task206_collatz_conjecture.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task206_collatz_conjecture.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + 
}, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task206_collatz_conjecture" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task207_max_element_lists.json b/src/unitxt/catalog/cards/natural_instructions/train/task207_max_element_lists.json new file mode 100644 index 000000000..e1628cdf1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task207_max_element_lists.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task207_max_element_lists.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task207_max_element_lists" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task208_combinations_of_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task208_combinations_of_list.json new file mode 100644 index 
000000000..ff5c16ae0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task208_combinations_of_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task208_combinations_of_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task208_combinations_of_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task209_stancedetection_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task209_stancedetection_classification.json new file mode 100644 index 000000000..d14a2c768 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task209_stancedetection_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task209_stancedetection_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", 
+ "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task209_stancedetection_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task210_logic2text_structured_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task210_logic2text_structured_text_generation.json new file mode 100644 index 000000000..4dab59e5b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task210_logic2text_structured_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task210_logic2text_structured_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task210_logic2text_structured_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task211_logic2text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task211_logic2text_classification.json new file mode 100644 index 000000000..d45148b3e --- /dev/null 
+++ b/src/unitxt/catalog/cards/natural_instructions/train/task211_logic2text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task211_logic2text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task211_logic2text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task212_logic2text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task212_logic2text_classification.json new file mode 100644 index 000000000..f34cf159a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task212_logic2text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task212_logic2text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + 
"outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task212_logic2text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task223_quartz_explanation_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task223_quartz_explanation_generation.json new file mode 100644 index 000000000..5cabd1e85 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task223_quartz_explanation_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task223_quartz_explanation_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task223_quartz_explanation_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task227_clariq_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task227_clariq_classification.json new file mode 100644 index 000000000..be1ae5be4 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task227_clariq_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task227_clariq_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task227_clariq_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task228_arc_answer_generation_easy.json b/src/unitxt/catalog/cards/natural_instructions/train/task228_arc_answer_generation_easy.json new file mode 100644 index 000000000..ce58dbb7f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task228_arc_answer_generation_easy.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task228_arc_answer_generation_easy.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + 
"target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task228_arc_answer_generation_easy" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task229_arc_answer_generation_hard.json b/src/unitxt/catalog/cards/natural_instructions/train/task229_arc_answer_generation_hard.json new file mode 100644 index 000000000..6ab2f46e3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task229_arc_answer_generation_hard.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task229_arc_answer_generation_hard.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task229_arc_answer_generation_hard" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task243_count_elements_in_set_intersection.json b/src/unitxt/catalog/cards/natural_instructions/train/task243_count_elements_in_set_intersection.json new file mode 100644 index 000000000..72d0e5e67 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task243_count_elements_in_set_intersection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task243_count_elements_in_set_intersection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task243_count_elements_in_set_intersection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task244_count_elements_in_set_union.json b/src/unitxt/catalog/cards/natural_instructions/train/task244_count_elements_in_set_union.json new file mode 100644 index 000000000..e248a2e65 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task244_count_elements_in_set_union.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task244_count_elements_in_set_union.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + 
"inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task244_count_elements_in_set_union" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task245_check_presence_in_set_intersection.json b/src/unitxt/catalog/cards/natural_instructions/train/task245_check_presence_in_set_intersection.json new file mode 100644 index 000000000..a1f44a191 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task245_check_presence_in_set_intersection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task245_check_presence_in_set_intersection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task245_check_presence_in_set_intersection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task246_dream_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task246_dream_question_generation.json new file mode 100644 index 000000000..58f3f0e73 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task246_dream_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task246_dream_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task246_dream_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task247_dream_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task247_dream_answer_generation.json new file mode 100644 index 000000000..42e262653 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task247_dream_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task247_dream_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + 
"target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task247_dream_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task248_dream_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task248_dream_classification.json new file mode 100644 index 000000000..c0517ca64 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task248_dream_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task248_dream_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task248_dream_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task267_concatenate_and_reverse_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/cards/natural_instructions/train/task267_concatenate_and_reverse_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..38ed78791 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task267_concatenate_and_reverse_all_elements_from_index_i_to_j.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task267_concatenate_and_reverse_all_elements_from_index_i_to_j.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task267_concatenate_and_reverse_all_elements_from_index_i_to_j" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task268_casehold_legal_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task268_casehold_legal_answer_generation.json new file mode 100644 index 000000000..6b35473d8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task268_casehold_legal_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task268_casehold_legal_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + 
] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task268_casehold_legal_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task269_csrg_counterfactual_story_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task269_csrg_counterfactual_story_generation.json new file mode 100644 index 000000000..886515115 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task269_csrg_counterfactual_story_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task269_csrg_counterfactual_story_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task269_csrg_counterfactual_story_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task270_csrg_counterfactual_context_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task270_csrg_counterfactual_context_generation.json new file mode 100644 index 000000000..1ea0c560d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task270_csrg_counterfactual_context_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task270_csrg_counterfactual_context_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task270_csrg_counterfactual_context_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task274_overruling_legal_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task274_overruling_legal_classification.json new file mode 100644 index 000000000..15238d384 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task274_overruling_legal_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task274_overruling_legal_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": 
"train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task274_overruling_legal_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task275_enhanced_wsc_paraphrase_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task275_enhanced_wsc_paraphrase_generation.json new file mode 100644 index 000000000..390e18af9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task275_enhanced_wsc_paraphrase_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task275_enhanced_wsc_paraphrase_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task275_enhanced_wsc_paraphrase_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task276_enhanced_wsc_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task276_enhanced_wsc_classification.json new file mode 100644 index 000000000..0efa08dfb --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task276_enhanced_wsc_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task276_enhanced_wsc_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task276_enhanced_wsc_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task277_stereoset_sentence_generation_stereotype.json b/src/unitxt/catalog/cards/natural_instructions/train/task277_stereoset_sentence_generation_stereotype.json new file mode 100644 index 000000000..a5dd7c3ce --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task277_stereoset_sentence_generation_stereotype.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task277_stereoset_sentence_generation_stereotype.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { 
+ "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task277_stereoset_sentence_generation_stereotype" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task278_stereoset_sentence_generation_antistereotype.json b/src/unitxt/catalog/cards/natural_instructions/train/task278_stereoset_sentence_generation_antistereotype.json new file mode 100644 index 000000000..cf2414720 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task278_stereoset_sentence_generation_antistereotype.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task278_stereoset_sentence_generation_antistereotype.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task278_stereoset_sentence_generation_antistereotype" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task279_stereoset_classification_stereotype.json b/src/unitxt/catalog/cards/natural_instructions/train/task279_stereoset_classification_stereotype.json new file mode 100644 index 000000000..9a38c7468 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task279_stereoset_classification_stereotype.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task279_stereoset_classification_stereotype.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task279_stereoset_classification_stereotype" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task280_stereoset_classification_stereotype_type.json b/src/unitxt/catalog/cards/natural_instructions/train/task280_stereoset_classification_stereotype_type.json new file mode 100644 index 000000000..0be557962 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task280_stereoset_classification_stereotype_type.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task280_stereoset_classification_stereotype_type.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task280_stereoset_classification_stereotype_type" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task283_dream_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task283_dream_incorrect_answer_generation.json new file mode 100644 index 000000000..336974915 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task283_dream_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task283_dream_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task283_dream_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task284_imdb_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task284_imdb_classification.json new file mode 100644 index 000000000..631545132 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task284_imdb_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task284_imdb_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task284_imdb_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task285_imdb_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task285_imdb_answer_generation.json new file mode 100644 index 000000000..669e38e1c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task285_imdb_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task285_imdb_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task285_imdb_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task286_olid_offense_judgment.json b/src/unitxt/catalog/cards/natural_instructions/train/task286_olid_offense_judgment.json new file mode 100644 index 000000000..450f7b027 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task286_olid_offense_judgment.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task286_olid_offense_judgment.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task286_olid_offense_judgment" + ] + }, + 
"templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task287_casehold_legal_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task287_casehold_legal_incorrect_answer_generation.json new file mode 100644 index 000000000..dd31f1de1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task287_casehold_legal_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task287_casehold_legal_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task287_casehold_legal_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task291_semeval_2020_task4_commonsense_validation.json b/src/unitxt/catalog/cards/natural_instructions/train/task291_semeval_2020_task4_commonsense_validation.json new file mode 100644 index 000000000..a88d00930 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task291_semeval_2020_task4_commonsense_validation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task291_semeval_2020_task4_commonsense_validation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task291_semeval_2020_task4_commonsense_validation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task292_storycommonsense_character_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task292_storycommonsense_character_text_generation.json new file mode 100644 index 000000000..3b6f27d5b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task292_storycommonsense_character_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task292_storycommonsense_character_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + 
"instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task292_storycommonsense_character_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task293_storycommonsense_emotion_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task293_storycommonsense_emotion_text_generation.json new file mode 100644 index 000000000..68adf10e2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task293_storycommonsense_emotion_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task293_storycommonsense_emotion_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task293_storycommonsense_emotion_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task294_storycommonsense_motiv_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task294_storycommonsense_motiv_text_generation.json new file mode 100644 index 000000000..fd8101bf9 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task294_storycommonsense_motiv_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task294_storycommonsense_motiv_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task294_storycommonsense_motiv_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task295_semeval_2020_task4_commonsense_reasoning.json b/src/unitxt/catalog/cards/natural_instructions/train/task295_semeval_2020_task4_commonsense_reasoning.json new file mode 100644 index 000000000..a03cb0734 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task295_semeval_2020_task4_commonsense_reasoning.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task295_semeval_2020_task4_commonsense_reasoning.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + 
"use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task295_semeval_2020_task4_commonsense_reasoning" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task296_storycloze_correct_end_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task296_storycloze_correct_end_classification.json new file mode 100644 index 000000000..6c2b9c643 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task296_storycloze_correct_end_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task296_storycloze_correct_end_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task296_storycloze_correct_end_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task297_storycloze_incorrect_end_classification.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task297_storycloze_incorrect_end_classification.json new file mode 100644 index 000000000..bec910262 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task297_storycloze_incorrect_end_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task297_storycloze_incorrect_end_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task297_storycloze_incorrect_end_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task298_storycloze_correct_end_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task298_storycloze_correct_end_classification.json new file mode 100644 index 000000000..1ac8d73c6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task298_storycloze_correct_end_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task298_storycloze_correct_end_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": 
"train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task298_storycloze_correct_end_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task299_storycloze_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task299_storycloze_sentence_generation.json new file mode 100644 index 000000000..269b8220a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task299_storycloze_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task299_storycloze_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task299_storycloze_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task300_storycloze_order_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task300_storycloze_order_generation.json new file mode 100644 index 000000000..8d7ac16ed --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task300_storycloze_order_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task300_storycloze_order_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task300_storycloze_order_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task301_record_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task301_record_question_generation.json new file mode 100644 index 000000000..eb0f27c2f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task301_record_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task301_record_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": 
"train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task301_record_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task302_record_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task302_record_classification.json new file mode 100644 index 000000000..6362e98f0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task302_record_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task302_record_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task302_record_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task303_record_incorrect_answer_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task303_record_incorrect_answer_generation.json new file mode 100644 index 000000000..cb0ef0628 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task303_record_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task303_record_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task303_record_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task305_jeopardy_answer_generation_normal.json b/src/unitxt/catalog/cards/natural_instructions/train/task305_jeopardy_answer_generation_normal.json new file mode 100644 index 000000000..cf3425730 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task305_jeopardy_answer_generation_normal.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task305_jeopardy_answer_generation_normal.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", 
+ "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task305_jeopardy_answer_generation_normal" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task306_jeopardy_answer_generation_double.json b/src/unitxt/catalog/cards/natural_instructions/train/task306_jeopardy_answer_generation_double.json new file mode 100644 index 000000000..2d1f0f46f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task306_jeopardy_answer_generation_double.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task306_jeopardy_answer_generation_double.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task306_jeopardy_answer_generation_double" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task307_jeopardy_answer_generation_final.json b/src/unitxt/catalog/cards/natural_instructions/train/task307_jeopardy_answer_generation_final.json new file mode 100644 index 000000000..b19fdcf83 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task307_jeopardy_answer_generation_final.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task307_jeopardy_answer_generation_final.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task307_jeopardy_answer_generation_final" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task308_jeopardy_answer_generation_all.json b/src/unitxt/catalog/cards/natural_instructions/train/task308_jeopardy_answer_generation_all.json new file mode 100644 index 000000000..97221968b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task308_jeopardy_answer_generation_all.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task308_jeopardy_answer_generation_all.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task308_jeopardy_answer_generation_all" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task309_race_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task309_race_answer_generation.json new file mode 100644 index 000000000..0a521a7e1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task309_race_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task309_race_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task309_race_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task310_race_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task310_race_classification.json new file mode 100644 index 000000000..50f3d30c6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task310_race_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task310_race_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task310_race_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task311_race_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task311_race_question_generation.json new file mode 100644 index 000000000..db48e08ce --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task311_race_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task311_race_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": 
"train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task311_race_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task316_crows_pairs_classification_stereotype.json b/src/unitxt/catalog/cards/natural_instructions/train/task316_crows_pairs_classification_stereotype.json new file mode 100644 index 000000000..da66ff746 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task316_crows_pairs_classification_stereotype.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task316_crows-pairs_classification_stereotype.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task316_crows_pairs_classification_stereotype" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task317_crows_pairs_classification_stereotype_type.json b/src/unitxt/catalog/cards/natural_instructions/train/task317_crows_pairs_classification_stereotype_type.json new file mode 100644 index 000000000..2a38be65a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task317_crows_pairs_classification_stereotype_type.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task317_crows-pairs_classification_stereotype_type.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task317_crows_pairs_classification_stereotype_type" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task318_stereoset_classification_gender.json b/src/unitxt/catalog/cards/natural_instructions/train/task318_stereoset_classification_gender.json new file mode 100644 index 000000000..dfd0fb2dc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task318_stereoset_classification_gender.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task318_stereoset_classification_gender.json", + "field": "Instances", + "path": 
"json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task318_stereoset_classification_gender" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task319_stereoset_classification_profession.json b/src/unitxt/catalog/cards/natural_instructions/train/task319_stereoset_classification_profession.json new file mode 100644 index 000000000..66812ad15 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task319_stereoset_classification_profession.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task319_stereoset_classification_profession.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task319_stereoset_classification_profession" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task320_stereoset_classification_race.json b/src/unitxt/catalog/cards/natural_instructions/train/task320_stereoset_classification_race.json new file mode 100644 index 000000000..fd55f0ae9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task320_stereoset_classification_race.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task320_stereoset_classification_race.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task320_stereoset_classification_race" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task321_stereoset_classification_religion.json b/src/unitxt/catalog/cards/natural_instructions/train/task321_stereoset_classification_religion.json new file mode 100644 index 000000000..219ae4727 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task321_stereoset_classification_religion.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task321_stereoset_classification_religion.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task321_stereoset_classification_religion" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task322_jigsaw_classification_threat.json b/src/unitxt/catalog/cards/natural_instructions/train/task322_jigsaw_classification_threat.json new file mode 100644 index 000000000..adf3362f9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task322_jigsaw_classification_threat.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task322_jigsaw_classification_threat.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task322_jigsaw_classification_threat" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task323_jigsaw_classification_sexually_explicit.json b/src/unitxt/catalog/cards/natural_instructions/train/task323_jigsaw_classification_sexually_explicit.json new file mode 100644 index 000000000..eb32eff71 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task323_jigsaw_classification_sexually_explicit.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task323_jigsaw_classification_sexually_explicit.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task323_jigsaw_classification_sexually_explicit" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task324_jigsaw_classification_disagree.json b/src/unitxt/catalog/cards/natural_instructions/train/task324_jigsaw_classification_disagree.json new file mode 100644 index 000000000..b53e784a3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task324_jigsaw_classification_disagree.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task324_jigsaw_classification_disagree.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task324_jigsaw_classification_disagree" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task325_jigsaw_classification_identity_attack.json b/src/unitxt/catalog/cards/natural_instructions/train/task325_jigsaw_classification_identity_attack.json new file mode 100644 index 000000000..732bffe94 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task325_jigsaw_classification_identity_attack.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task325_jigsaw_classification_identity_attack.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task325_jigsaw_classification_identity_attack" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task326_jigsaw_classification_obscene.json b/src/unitxt/catalog/cards/natural_instructions/train/task326_jigsaw_classification_obscene.json new file mode 100644 index 000000000..38017854d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task326_jigsaw_classification_obscene.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task326_jigsaw_classification_obscene.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task326_jigsaw_classification_obscene" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task327_jigsaw_classification_toxic.json b/src/unitxt/catalog/cards/natural_instructions/train/task327_jigsaw_classification_toxic.json new file mode 100644 index 000000000..3317cc553 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task327_jigsaw_classification_toxic.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task327_jigsaw_classification_toxic.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task327_jigsaw_classification_toxic" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task328_jigsaw_classification_insult.json b/src/unitxt/catalog/cards/natural_instructions/train/task328_jigsaw_classification_insult.json new file mode 100644 index 000000000..bc8ceb517 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task328_jigsaw_classification_insult.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task328_jigsaw_classification_insult.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task328_jigsaw_classification_insult" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task333_hateeval_classification_hate_en.json b/src/unitxt/catalog/cards/natural_instructions/train/task333_hateeval_classification_hate_en.json new file mode 100644 index 000000000..e0c5cf49d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task333_hateeval_classification_hate_en.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task333_hateeval_classification_hate_en.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task333_hateeval_classification_hate_en" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task335_hateeval_classification_aggresive_en.json b/src/unitxt/catalog/cards/natural_instructions/train/task335_hateeval_classification_aggresive_en.json new file mode 100644 index 000000000..bc0fe588d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task335_hateeval_classification_aggresive_en.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": 
"load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task335_hateeval_classification_aggresive_en.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task335_hateeval_classification_aggresive_en" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task337_hateeval_classification_individual_en.json b/src/unitxt/catalog/cards/natural_instructions/train/task337_hateeval_classification_individual_en.json new file mode 100644 index 000000000..d22f36fc0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task337_hateeval_classification_individual_en.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task337_hateeval_classification_individual_en.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task337_hateeval_classification_individual_en" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task339_record_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task339_record_answer_generation.json new file mode 100644 index 000000000..972611099 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task339_record_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task339_record_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task339_record_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task340_winomt_classification_gender_pro.json b/src/unitxt/catalog/cards/natural_instructions/train/task340_winomt_classification_gender_pro.json new file mode 100644 index 000000000..ce4e919d4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task340_winomt_classification_gender_pro.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": 
"load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task340_winomt_classification_gender_pro.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task340_winomt_classification_gender_pro" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task341_winomt_classification_gender_anti.json b/src/unitxt/catalog/cards/natural_instructions/train/task341_winomt_classification_gender_anti.json new file mode 100644 index 000000000..3a01ae813 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task341_winomt_classification_gender_anti.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task341_winomt_classification_gender_anti.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + 
"items": [ + "instructions.natural_instructions.train.task341_winomt_classification_gender_anti" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task342_winomt_classification_profession_pro.json b/src/unitxt/catalog/cards/natural_instructions/train/task342_winomt_classification_profession_pro.json new file mode 100644 index 000000000..15ca90132 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task342_winomt_classification_profession_pro.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task342_winomt_classification_profession_pro.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task342_winomt_classification_profession_pro" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task343_winomt_classification_profession_anti.json b/src/unitxt/catalog/cards/natural_instructions/train/task343_winomt_classification_profession_anti.json new file mode 100644 index 000000000..5592804a6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task343_winomt_classification_profession_anti.json @@ -0,0 +1,53 @@ +{ + 
"type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task343_winomt_classification_profession_anti.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task343_winomt_classification_profession_anti" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task344_hybridqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task344_hybridqa_answer_generation.json new file mode 100644 index 000000000..fa79cf184 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task344_hybridqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task344_hybridqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + 
"type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task344_hybridqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task345_hybridqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task345_hybridqa_answer_generation.json new file mode 100644 index 000000000..409e18e61 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task345_hybridqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task345_hybridqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task345_hybridqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task346_hybridqa_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task346_hybridqa_classification.json new file mode 100644 index 000000000..2c544b329 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task346_hybridqa_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task346_hybridqa_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task346_hybridqa_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task347_hybridqa_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task347_hybridqa_incorrect_answer_generation.json new file mode 100644 index 000000000..878f04eea --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task347_hybridqa_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task347_hybridqa_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task347_hybridqa_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task350_winomt_classification_gender_identifiability_pro.json b/src/unitxt/catalog/cards/natural_instructions/train/task350_winomt_classification_gender_identifiability_pro.json new file mode 100644 index 000000000..76b077a8a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task350_winomt_classification_gender_identifiability_pro.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task350_winomt_classification_gender_identifiability_pro.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task350_winomt_classification_gender_identifiability_pro" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task351_winomt_classification_gender_identifiability_anti.json b/src/unitxt/catalog/cards/natural_instructions/train/task351_winomt_classification_gender_identifiability_anti.json new file mode 100644 index 000000000..7e92605fe --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task351_winomt_classification_gender_identifiability_anti.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task351_winomt_classification_gender_identifiability_anti.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task351_winomt_classification_gender_identifiability_anti" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task353_casino_classification_negotiation_elicit_pref.json b/src/unitxt/catalog/cards/natural_instructions/train/task353_casino_classification_negotiation_elicit_pref.json new file mode 100644 index 000000000..ec8b39761 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task353_casino_classification_negotiation_elicit_pref.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task353_casino_classification_negotiation_elicit_pref.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + 
"field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task353_casino_classification_negotiation_elicit_pref" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task354_casino_classification_negotiation_no_need.json b/src/unitxt/catalog/cards/natural_instructions/train/task354_casino_classification_negotiation_no_need.json new file mode 100644 index 000000000..8f75a0fc1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task354_casino_classification_negotiation_no_need.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task354_casino_classification_negotiation_no_need.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task354_casino_classification_negotiation_no_need" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task355_casino_classification_negotiation_other_need.json b/src/unitxt/catalog/cards/natural_instructions/train/task355_casino_classification_negotiation_other_need.json new file mode 100644 index 000000000..171bb3e5c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task355_casino_classification_negotiation_other_need.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task355_casino_classification_negotiation_other_need.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task355_casino_classification_negotiation_other_need" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task356_casino_classification_negotiation_self_need.json b/src/unitxt/catalog/cards/natural_instructions/train/task356_casino_classification_negotiation_self_need.json new file mode 100644 index 000000000..2d22b2196 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task356_casino_classification_negotiation_self_need.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task356_casino_classification_negotiation_self_need.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task356_casino_classification_negotiation_self_need" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task357_casino_classification_negotiation_small_talk.json b/src/unitxt/catalog/cards/natural_instructions/train/task357_casino_classification_negotiation_small_talk.json new file mode 100644 index 000000000..92c99cdc3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task357_casino_classification_negotiation_small_talk.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task357_casino_classification_negotiation_small_talk.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + 
"instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task357_casino_classification_negotiation_small_talk" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task358_casino_classification_negotiation_uv_part.json b/src/unitxt/catalog/cards/natural_instructions/train/task358_casino_classification_negotiation_uv_part.json new file mode 100644 index 000000000..ec18ceeaf --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task358_casino_classification_negotiation_uv_part.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task358_casino_classification_negotiation_uv_part.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task358_casino_classification_negotiation_uv_part" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task359_casino_classification_negotiation_vouch_fair.json b/src/unitxt/catalog/cards/natural_instructions/train/task359_casino_classification_negotiation_vouch_fair.json new file mode 100644 index 000000000..c171cbdcf --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task359_casino_classification_negotiation_vouch_fair.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task359_casino_classification_negotiation_vouch_fair.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task359_casino_classification_negotiation_vouch_fair" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task363_sst2_polarity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task363_sst2_polarity_classification.json new file mode 100644 index 000000000..5a6d1a90b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task363_sst2_polarity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task363_sst2_polarity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": 
{ + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task363_sst2_polarity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task364_regard_social_impact_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task364_regard_social_impact_classification.json new file mode 100644 index 000000000..5d453f007 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task364_regard_social_impact_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task364_regard_social_impact_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task364_regard_social_impact_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task365_synthetic_remove_vowels.json b/src/unitxt/catalog/cards/natural_instructions/train/task365_synthetic_remove_vowels.json new file mode 100644 index 000000000..7ceab61f8 --- 
/dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task365_synthetic_remove_vowels.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task365_synthetic_remove_vowels.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task365_synthetic_remove_vowels" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task366_synthetic_return_primes.json b/src/unitxt/catalog/cards/natural_instructions/train/task366_synthetic_return_primes.json new file mode 100644 index 000000000..2e829c612 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task366_synthetic_return_primes.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task366_synthetic_return_primes.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ 
+ "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task366_synthetic_return_primes" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task367_synthetic_remove_floats.json b/src/unitxt/catalog/cards/natural_instructions/train/task367_synthetic_remove_floats.json new file mode 100644 index 000000000..451f58f91 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task367_synthetic_remove_floats.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task367_synthetic_remove_floats.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task367_synthetic_remove_floats" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task368_synthetic_even_or_odd_calculation.json b/src/unitxt/catalog/cards/natural_instructions/train/task368_synthetic_even_or_odd_calculation.json new file mode 100644 index 000000000..ef4aa2523 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task368_synthetic_even_or_odd_calculation.json 
@@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task368_synthetic_even_or_odd_calculation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task368_synthetic_even_or_odd_calculation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task369_synthetic_remove_odds.json b/src/unitxt/catalog/cards/natural_instructions/train/task369_synthetic_remove_odds.json new file mode 100644 index 000000000..378d6fc1e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task369_synthetic_remove_odds.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task369_synthetic_remove_odds.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task369_synthetic_remove_odds" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task370_synthetic_remove_divisible_by_3.json b/src/unitxt/catalog/cards/natural_instructions/train/task370_synthetic_remove_divisible_by_3.json new file mode 100644 index 000000000..1171c3d16 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task370_synthetic_remove_divisible_by_3.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task370_synthetic_remove_divisible_by_3.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task370_synthetic_remove_divisible_by_3" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task371_synthetic_product_of_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task371_synthetic_product_of_list.json new file mode 100644 index 000000000..d97d99e02 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task371_synthetic_product_of_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": 
"load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task371_synthetic_product_of_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task371_synthetic_product_of_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task372_synthetic_palindrome_numbers.json b/src/unitxt/catalog/cards/natural_instructions/train/task372_synthetic_palindrome_numbers.json new file mode 100644 index 000000000..de07e6f2c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task372_synthetic_palindrome_numbers.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task372_synthetic_palindrome_numbers.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task372_synthetic_palindrome_numbers" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task373_synthetic_round_tens_place.json b/src/unitxt/catalog/cards/natural_instructions/train/task373_synthetic_round_tens_place.json new file mode 100644 index 000000000..b6c5d9bbb --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task373_synthetic_round_tens_place.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task373_synthetic_round_tens_place.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task373_synthetic_round_tens_place" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task374_synthetic_pos_or_neg_calculation.json b/src/unitxt/catalog/cards/natural_instructions/train/task374_synthetic_pos_or_neg_calculation.json new file mode 100644 index 000000000..6a5e5bd68 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task374_synthetic_pos_or_neg_calculation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task374_synthetic_pos_or_neg_calculation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task374_synthetic_pos_or_neg_calculation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task375_classify_type_of_sentence_in_debate.json b/src/unitxt/catalog/cards/natural_instructions/train/task375_classify_type_of_sentence_in_debate.json new file mode 100644 index 000000000..0702ea32f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task375_classify_type_of_sentence_in_debate.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task375_classify_type_of_sentence_in_debate.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task375_classify_type_of_sentence_in_debate" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task376_reverse_order_of_words.json b/src/unitxt/catalog/cards/natural_instructions/train/task376_reverse_order_of_words.json new file mode 100644 index 000000000..0801c5540 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task376_reverse_order_of_words.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task376_reverse_order_of_words.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task376_reverse_order_of_words" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task377_remove_words_of_given_length.json b/src/unitxt/catalog/cards/natural_instructions/train/task377_remove_words_of_given_length.json new file mode 100644 index 000000000..23f4461d8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task377_remove_words_of_given_length.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task377_remove_words_of_given_length.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task377_remove_words_of_given_length" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task378_reverse_words_of_given_length.json b/src/unitxt/catalog/cards/natural_instructions/train/task378_reverse_words_of_given_length.json new file mode 100644 index 000000000..3e8f235d7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task378_reverse_words_of_given_length.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task378_reverse_words_of_given_length.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task378_reverse_words_of_given_length" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task379_agnews_topic_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task379_agnews_topic_classification.json new file mode 100644 index 000000000..568e3b0c4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task379_agnews_topic_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task379_agnews_topic_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task379_agnews_topic_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task380_boolq_yes_no_question.json b/src/unitxt/catalog/cards/natural_instructions/train/task380_boolq_yes_no_question.json new file mode 100644 index 000000000..d5fce9e0e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task380_boolq_yes_no_question.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task380_boolq_yes_no_question.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task380_boolq_yes_no_question" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task381_boolq_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task381_boolq_question_generation.json new file mode 100644 index 000000000..665a9ab45 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task381_boolq_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task381_boolq_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task381_boolq_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task382_hybridqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task382_hybridqa_answer_generation.json new file mode 100644 index 000000000..59d8be40f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task382_hybridqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task382_hybridqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task382_hybridqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task383_matres_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task383_matres_classification.json new file mode 100644 index 000000000..be6c2f122 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task383_matres_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task383_matres_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task383_matres_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task384_socialiqa_question_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task384_socialiqa_question_classification.json new file mode 100644 index 000000000..9073fe21f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task384_socialiqa_question_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task384_socialiqa_question_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task384_socialiqa_question_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task385_socialiqa_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task385_socialiqa_incorrect_answer_generation.json new file mode 100644 index 000000000..cd6bb07bd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task385_socialiqa_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task385_socialiqa_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task385_socialiqa_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task386_semeval_2018_task3_irony_detection.json b/src/unitxt/catalog/cards/natural_instructions/train/task386_semeval_2018_task3_irony_detection.json new file mode 100644 index 000000000..d2e7f3374 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task386_semeval_2018_task3_irony_detection.json @@ -0,0 +1,53 @@ +{ + "type": 
"task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task386_semeval_2018_task3_irony_detection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task386_semeval_2018_task3_irony_detection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task387_semeval_2018_task3_irony_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task387_semeval_2018_task3_irony_classification.json new file mode 100644 index 000000000..95d6ced09 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task387_semeval_2018_task3_irony_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task387_semeval_2018_task3_irony_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" 
+ ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task387_semeval_2018_task3_irony_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task388_torque_token_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task388_torque_token_classification.json new file mode 100644 index 000000000..666f1276d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task388_torque_token_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task388_torque_token_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task388_torque_token_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task389_torque_generate_temporal_question.json b/src/unitxt/catalog/cards/natural_instructions/train/task389_torque_generate_temporal_question.json new file mode 100644 index 000000000..923e586f9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task389_torque_generate_temporal_question.json @@ -0,0 +1,53 
@@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task389_torque_generate_temporal_question.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task389_torque_generate_temporal_question" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task390_torque_text_span_selection.json b/src/unitxt/catalog/cards/natural_instructions/train/task390_torque_text_span_selection.json new file mode 100644 index 000000000..fef9513b9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task390_torque_text_span_selection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task390_torque_text_span_selection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + 
"type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task390_torque_text_span_selection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task397_semeval_2018_task1_tweet_anger_detection.json b/src/unitxt/catalog/cards/natural_instructions/train/task397_semeval_2018_task1_tweet_anger_detection.json new file mode 100644 index 000000000..ad9c40ad9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task397_semeval_2018_task1_tweet_anger_detection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task397_semeval_2018_task1_tweet_anger_detection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task397_semeval_2018_task1_tweet_anger_detection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task398_semeval_2018_task1_tweet_joy_detection.json b/src/unitxt/catalog/cards/natural_instructions/train/task398_semeval_2018_task1_tweet_joy_detection.json new file mode 100644 index 000000000..39485554f --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task398_semeval_2018_task1_tweet_joy_detection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task398_semeval_2018_task1_tweet_joy_detection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task398_semeval_2018_task1_tweet_joy_detection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task399_semeval_2018_task1_tweet_sadness_detection.json b/src/unitxt/catalog/cards/natural_instructions/train/task399_semeval_2018_task1_tweet_sadness_detection.json new file mode 100644 index 000000000..415aaaef8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task399_semeval_2018_task1_tweet_sadness_detection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task399_semeval_2018_task1_tweet_sadness_detection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], 
+ "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task399_semeval_2018_task1_tweet_sadness_detection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task400_paws_paraphrase_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task400_paws_paraphrase_classification.json new file mode 100644 index 000000000..7a5e40e8e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task400_paws_paraphrase_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task400_paws_paraphrase_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task400_paws_paraphrase_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task403_creak_commonsense_inference.json b/src/unitxt/catalog/cards/natural_instructions/train/task403_creak_commonsense_inference.json new file mode 
100644 index 000000000..f11dabf3d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task403_creak_commonsense_inference.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task403_creak_commonsense_inference.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task403_creak_commonsense_inference" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task405_narrativeqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task405_narrativeqa_question_generation.json new file mode 100644 index 000000000..a84c93767 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task405_narrativeqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task405_narrativeqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + 
], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task405_narrativeqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task413_mickey_en_sentence_perturbation_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task413_mickey_en_sentence_perturbation_generation.json new file mode 100644 index 000000000..66f0c107a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task413_mickey_en_sentence_perturbation_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task413_mickey_en_sentence_perturbation_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task413_mickey_en_sentence_perturbation_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task428_senteval_inversion.json b/src/unitxt/catalog/cards/natural_instructions/train/task428_senteval_inversion.json new file 
mode 100644 index 000000000..38511f508 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task428_senteval_inversion.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task428_senteval_inversion.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task428_senteval_inversion" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task429_senteval_tense.json b/src/unitxt/catalog/cards/natural_instructions/train/task429_senteval_tense.json new file mode 100644 index 000000000..18fde8fc6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task429_senteval_tense.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task429_senteval_tense.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + 
"target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task429_senteval_tense" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task430_senteval_subject_count.json b/src/unitxt/catalog/cards/natural_instructions/train/task430_senteval_subject_count.json new file mode 100644 index 000000000..aafbb2f50 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task430_senteval_subject_count.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task430_senteval_subject_count.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task430_senteval_subject_count" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task431_senteval_object_count.json b/src/unitxt/catalog/cards/natural_instructions/train/task431_senteval_object_count.json new file mode 100644 index 000000000..34a9d8384 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task431_senteval_object_count.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + 
"loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task431_senteval_object_count.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task431_senteval_object_count" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task453_swag_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task453_swag_answer_generation.json new file mode 100644 index 000000000..32976b94c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task453_swag_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task453_swag_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task453_swag_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task454_swag_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task454_swag_incorrect_answer_generation.json new file mode 100644 index 000000000..d7f804e2f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task454_swag_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task454_swag_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task454_swag_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task455_swag_context_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task455_swag_context_generation.json new file mode 100644 index 000000000..fa64a39f9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task455_swag_context_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task455_swag_context_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task455_swag_context_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task456_matres_intention_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task456_matres_intention_classification.json new file mode 100644 index 000000000..224baa582 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task456_matres_intention_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task456_matres_intention_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task456_matres_intention_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task457_matres_conditional_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task457_matres_conditional_classification.json new file mode 100644 index 000000000..534969a2a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task457_matres_conditional_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task457_matres_conditional_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task457_matres_conditional_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task458_matres_negation_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task458_matres_negation_classification.json new file mode 100644 index 000000000..514b6b2ef --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task458_matres_negation_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": 
"load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task458_matres_negation_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task458_matres_negation_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task459_matres_static_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task459_matres_static_classification.json new file mode 100644 index 000000000..9ce8e36cf --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task459_matres_static_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task459_matres_static_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task459_matres_static_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task460_qasper_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task460_qasper_answer_generation.json new file mode 100644 index 000000000..6981e1b3d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task460_qasper_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task460_qasper_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task460_qasper_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task461_qasper_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task461_qasper_question_generation.json new file mode 100644 index 000000000..31ef65085 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task461_qasper_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task461_qasper_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task461_qasper_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task462_qasper_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task462_qasper_classification.json new file mode 100644 index 000000000..709f5fd72 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task462_qasper_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task462_qasper_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task462_qasper_classification" + ] 
+ }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task469_mrqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task469_mrqa_answer_generation.json new file mode 100644 index 000000000..cc1d8fd50 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task469_mrqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task469_mrqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task469_mrqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task470_mrqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task470_mrqa_question_generation.json new file mode 100644 index 000000000..1fe88d712 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task470_mrqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task470_mrqa_question_generation.json", + "field": "Instances", 
+ "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task470_mrqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task471_haspart_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task471_haspart_answer_generation.json new file mode 100644 index 000000000..f25c9bfd8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task471_haspart_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task471_haspart_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task471_haspart_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of 
file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task472_haspart_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task472_haspart_classification.json new file mode 100644 index 000000000..095d3410f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task472_haspart_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task472_haspart_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task472_haspart_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task475_yelp_polarity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task475_yelp_polarity_classification.json new file mode 100644 index 000000000..6145b1a25 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task475_yelp_polarity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task475_yelp_polarity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": 
"train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task475_yelp_polarity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task476_cls_english_books_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task476_cls_english_books_classification.json new file mode 100644 index 000000000..a2bdfa042 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task476_cls_english_books_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task476_cls_english_books_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task476_cls_english_books_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task477_cls_english_dvd_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task477_cls_english_dvd_classification.json new file mode 100644 index 000000000..68a769366 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task477_cls_english_dvd_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task477_cls_english_dvd_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task477_cls_english_dvd_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task478_cls_english_music_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task478_cls_english_music_classification.json new file mode 100644 index 000000000..5502142c5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task478_cls_english_music_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task478_cls_english_music_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task478_cls_english_music_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task488_extract_all_alphabetical_elements_from_list_in_order.json b/src/unitxt/catalog/cards/natural_instructions/train/task488_extract_all_alphabetical_elements_from_list_in_order.json new file mode 100644 index 000000000..d0ef08e72 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task488_extract_all_alphabetical_elements_from_list_in_order.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task488_extract_all_alphabetical_elements_from_list_in_order.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task488_extract_all_alphabetical_elements_from_list_in_order" + ] + }, + "templates": { + "type": 
"templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task489_mwsc_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task489_mwsc_question_generation.json new file mode 100644 index 000000000..d0059fa72 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task489_mwsc_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task489_mwsc_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task489_mwsc_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task490_mwsc_options_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task490_mwsc_options_generation.json new file mode 100644 index 000000000..c0b1eca7e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task490_mwsc_options_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task490_mwsc_options_generation.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task490_mwsc_options_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task491_mwsc_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task491_mwsc_answer_generation.json new file mode 100644 index 000000000..fca35ed7a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task491_mwsc_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task491_mwsc_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task491_mwsc_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task492_mwsc_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task492_mwsc_incorrect_answer_generation.json new file mode 100644 index 000000000..ef8ab1e48 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task492_mwsc_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task492_mwsc_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task492_mwsc_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task493_review_polarity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task493_review_polarity_classification.json new file mode 100644 index 000000000..cbb05d1de --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task493_review_polarity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task493_review_polarity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task493_review_polarity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task494_review_polarity_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task494_review_polarity_answer_generation.json new file mode 100644 index 000000000..724201f2c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task494_review_polarity_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task494_review_polarity_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task494_review_polarity_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task495_semeval_headline_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task495_semeval_headline_classification.json new file mode 100644 index 000000000..37f998b64 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task495_semeval_headline_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task495_semeval_headline_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task495_semeval_headline_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task496_semeval_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task496_semeval_answer_generation.json new file mode 100644 index 000000000..82b7ed8ed --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task496_semeval_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task496_semeval_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { 
+ "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task496_semeval_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task497_extract_all_numbers_from_list_in_order.json b/src/unitxt/catalog/cards/natural_instructions/train/task497_extract_all_numbers_from_list_in_order.json new file mode 100644 index 000000000..a01e9c0f9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task497_extract_all_numbers_from_list_in_order.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task497_extract_all_numbers_from_list_in_order.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task497_extract_all_numbers_from_list_in_order" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task499_extract_and_add_all_numbers_from_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task499_extract_and_add_all_numbers_from_list.json new file mode 100644 index 000000000..d8cfe796a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task499_extract_and_add_all_numbers_from_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task499_extract_and_add_all_numbers_from_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task499_extract_and_add_all_numbers_from_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task504_count_all_alphabetical_elements_in_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task504_count_all_alphabetical_elements_in_list.json new file mode 100644 index 000000000..42359bc1e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task504_count_all_alphabetical_elements_in_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task504_count_all_alphabetical_elements_in_list.json", + "field": "Instances", + 
"path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task504_count_all_alphabetical_elements_in_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task505_count_all_numerical_elements_in_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task505_count_all_numerical_elements_in_list.json new file mode 100644 index 000000000..1f7e4ae9c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task505_count_all_numerical_elements_in_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task505_count_all_numerical_elements_in_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task505_count_all_numerical_elements_in_list" + ] + }, + "templates": { + "type": "templates_list", + 
"items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task506_position_of_all_alphabetical_elements_in_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task506_position_of_all_alphabetical_elements_in_list.json new file mode 100644 index 000000000..359c78182 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task506_position_of_all_alphabetical_elements_in_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task506_position_of_all_alphabetical_elements_in_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task506_position_of_all_alphabetical_elements_in_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task507_position_of_all_numerical_elements_in_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task507_position_of_all_numerical_elements_in_list.json new file mode 100644 index 000000000..db06645d5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task507_position_of_all_numerical_elements_in_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task507_position_of_all_numerical_elements_in_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task507_position_of_all_numerical_elements_in_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately.json b/src/unitxt/catalog/cards/natural_instructions/train/task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately.json new file mode 100644 index 000000000..32ddcefdd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + 
"input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task512_twitter_emotion_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task512_twitter_emotion_classification.json new file mode 100644 index 000000000..3741c6644 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task512_twitter_emotion_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task512_twitter_emotion_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task512_twitter_emotion_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task513_argument_stance_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task513_argument_stance_classification.json new file mode 100644 index 000000000..f660b0ece --- /dev/null 
+++ b/src/unitxt/catalog/cards/natural_instructions/train/task513_argument_stance_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task513_argument_stance_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task513_argument_stance_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task514_argument_consequence_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task514_argument_consequence_classification.json new file mode 100644 index 000000000..1f5725628 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task514_argument_consequence_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task514_argument_consequence_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + 
"type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task514_argument_consequence_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task515_senteval_odd_word_out.json b/src/unitxt/catalog/cards/natural_instructions/train/task515_senteval_odd_word_out.json new file mode 100644 index 000000000..de570c32f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task515_senteval_odd_word_out.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task515_senteval_odd_word_out.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task515_senteval_odd_word_out" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task516_senteval_conjoints_inversion.json b/src/unitxt/catalog/cards/natural_instructions/train/task516_senteval_conjoints_inversion.json new file mode 100644 index 000000000..85a893933 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task516_senteval_conjoints_inversion.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task516_senteval_conjoints_inversion.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task516_senteval_conjoints_inversion" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task517_emo_classify_emotion_of_dialogue.json b/src/unitxt/catalog/cards/natural_instructions/train/task517_emo_classify_emotion_of_dialogue.json new file mode 100644 index 000000000..e41ed2fcd --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task517_emo_classify_emotion_of_dialogue.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task517_emo_classify_emotion_of_dialogue.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + 
"inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task517_emo_classify_emotion_of_dialogue" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task518_emo_different_dialogue_emotions.json b/src/unitxt/catalog/cards/natural_instructions/train/task518_emo_different_dialogue_emotions.json new file mode 100644 index 000000000..1e3eaf725 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task518_emo_different_dialogue_emotions.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task518_emo_different_dialogue_emotions.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task518_emo_different_dialogue_emotions" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task521_trivia_question_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task521_trivia_question_classification.json new file mode 100644 index 000000000..167d6883e --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task521_trivia_question_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task521_trivia_question_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task521_trivia_question_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task522_news_editorial_summary.json b/src/unitxt/catalog/cards/natural_instructions/train/task522_news_editorial_summary.json new file mode 100644 index 000000000..b72942bb7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task522_news_editorial_summary.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task522_news_editorial_summary.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + 
"outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task522_news_editorial_summary" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task523_find_if_numbers_or_alphabets_are_more_in_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task523_find_if_numbers_or_alphabets_are_more_in_list.json new file mode 100644 index 000000000..5e80a137c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task523_find_if_numbers_or_alphabets_are_more_in_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task523_find_if_numbers_or_alphabets_are_more_in_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task523_find_if_numbers_or_alphabets_are_more_in_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task547_alt_translation_entk_en.json b/src/unitxt/catalog/cards/natural_instructions/train/task547_alt_translation_entk_en.json new file mode 100644 index 000000000..ba639249c --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task547_alt_translation_entk_en.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task547_alt_translation_entk_en.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task547_alt_translation_entk_en" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task550_discofuse_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task550_discofuse_sentence_generation.json new file mode 100644 index 000000000..7ec3aec9d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task550_discofuse_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task550_discofuse_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + 
"outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task550_discofuse_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task560_alt_translation_en_entk.json b/src/unitxt/catalog/cards/natural_instructions/train/task560_alt_translation_en_entk.json new file mode 100644 index 000000000..94aa05a62 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task560_alt_translation_en_entk.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task560_alt_translation_en_entk.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task560_alt_translation_en_entk" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task563_discofuse_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task563_discofuse_answer_generation.json new file mode 100644 index 000000000..66d80b7a1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task563_discofuse_answer_generation.json 
@@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task563_discofuse_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task563_discofuse_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task564_discofuse_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task564_discofuse_classification.json new file mode 100644 index 000000000..23cdecc7c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task564_discofuse_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task564_discofuse_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task564_discofuse_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task565_circa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task565_circa_answer_generation.json new file mode 100644 index 000000000..8efc40c37 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task565_circa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task565_circa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task565_circa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task566_circa_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task566_circa_classification.json new file mode 100644 index 000000000..ba88675c9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task566_circa_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task566_circa_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task566_circa_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task567_circa_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task567_circa_text_generation.json new file mode 100644 index 000000000..ad1bccc85 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task567_circa_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task567_circa_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task567_circa_text_generation" + ] + }, + 
"templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task568_circa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task568_circa_question_generation.json new file mode 100644 index 000000000..986da1873 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task568_circa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task568_circa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task568_circa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task573_air_dialogue_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task573_air_dialogue_classification.json new file mode 100644 index 000000000..9fbaf2524 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task573_air_dialogue_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task573_air_dialogue_classification.json", + 
"field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task573_air_dialogue_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task574_air_dialogue_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task574_air_dialogue_sentence_generation.json new file mode 100644 index 000000000..bbe43d5b9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task574_air_dialogue_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task574_air_dialogue_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task574_air_dialogue_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task575_air_dialogue_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task575_air_dialogue_classification.json new file mode 100644 index 000000000..9d47ec684 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task575_air_dialogue_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task575_air_dialogue_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task575_air_dialogue_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task576_curiosity_dialogs_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task576_curiosity_dialogs_answer_generation.json new file mode 100644 index 000000000..43825af53 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task576_curiosity_dialogs_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task576_curiosity_dialogs_answer_generation.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task576_curiosity_dialogs_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task577_curiosity_dialogs_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task577_curiosity_dialogs_classification.json new file mode 100644 index 000000000..ce1ea97f6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task577_curiosity_dialogs_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task577_curiosity_dialogs_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task577_curiosity_dialogs_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task578_curiosity_dialogs_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task578_curiosity_dialogs_answer_generation.json new file mode 100644 index 000000000..1f298dd66 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task578_curiosity_dialogs_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task578_curiosity_dialogs_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task578_curiosity_dialogs_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task579_socialiqa_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task579_socialiqa_classification.json new file mode 100644 index 000000000..ee82cf3ba --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task579_socialiqa_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task579_socialiqa_classification.json", + "field": "Instances", 
+ "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task579_socialiqa_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task580_socialiqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task580_socialiqa_answer_generation.json new file mode 100644 index 000000000..21b600942 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task580_socialiqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task580_socialiqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task580_socialiqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline 
at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task581_socialiqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task581_socialiqa_question_generation.json new file mode 100644 index 000000000..af3fcfc69 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task581_socialiqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task581_socialiqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task581_socialiqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task582_naturalquestion_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task582_naturalquestion_answer_generation.json new file mode 100644 index 000000000..87e1a9215 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task582_naturalquestion_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task582_naturalquestion_answer_generation.json", + "field": "Instances", + "path": "json" + }, + 
"preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task582_naturalquestion_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task583_udeps_eng_coarse_pos_tagging.json b/src/unitxt/catalog/cards/natural_instructions/train/task583_udeps_eng_coarse_pos_tagging.json new file mode 100644 index 000000000..0ad954d71 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task583_udeps_eng_coarse_pos_tagging.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task583_udeps_eng_coarse_pos_tagging.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task583_udeps_eng_coarse_pos_tagging" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of 
file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task584_udeps_eng_fine_pos_tagging.json b/src/unitxt/catalog/cards/natural_instructions/train/task584_udeps_eng_fine_pos_tagging.json new file mode 100644 index 000000000..0b63791d1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task584_udeps_eng_fine_pos_tagging.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task584_udeps_eng_fine_pos_tagging.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task584_udeps_eng_fine_pos_tagging" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task585_preposition_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task585_preposition_classification.json new file mode 100644 index 000000000..41853fb10 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task585_preposition_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task585_preposition_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + 
"train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task585_preposition_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task586_amazonfood_polarity_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task586_amazonfood_polarity_classification.json new file mode 100644 index 000000000..8992aceb7 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task586_amazonfood_polarity_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task586_amazonfood_polarity_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task586_amazonfood_polarity_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task587_amazonfood_polarity_correction_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task587_amazonfood_polarity_correction_classification.json new file mode 100644 index 000000000..a6d1888c6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task587_amazonfood_polarity_correction_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task587_amazonfood_polarity_correction_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task587_amazonfood_polarity_correction_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task588_amazonfood_rating_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task588_amazonfood_rating_classification.json new file mode 100644 index 000000000..f6ce2e8f6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task588_amazonfood_rating_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task588_amazonfood_rating_classification.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task588_amazonfood_rating_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task589_amazonfood_summary_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task589_amazonfood_summary_text_generation.json new file mode 100644 index 000000000..f44eea69f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task589_amazonfood_summary_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task589_amazonfood_summary_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task589_amazonfood_summary_text_generation" + ] + }, + "templates": { + "type": "templates_list", + 
"items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task590_amazonfood_summary_correction_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task590_amazonfood_summary_correction_classification.json new file mode 100644 index 000000000..daf90b6b9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task590_amazonfood_summary_correction_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task590_amazonfood_summary_correction_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task590_amazonfood_summary_correction_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task591_sciq_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task591_sciq_answer_generation.json new file mode 100644 index 000000000..7fd09e193 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task591_sciq_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task591_sciq_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task591_sciq_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task592_sciq_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task592_sciq_incorrect_answer_generation.json new file mode 100644 index 000000000..8963a622c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task592_sciq_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task592_sciq_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task592_sciq_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task593_sciq_explanation_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task593_sciq_explanation_generation.json new file mode 100644 index 000000000..3bb400db3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task593_sciq_explanation_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task593_sciq_explanation_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task593_sciq_explanation_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task594_sciq_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task594_sciq_question_generation.json new file mode 100644 index 000000000..d9f4f6f97 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task594_sciq_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task594_sciq_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task594_sciq_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task595_mocha_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task595_mocha_answer_generation.json new file mode 100644 index 000000000..f3cdd8bdf --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task595_mocha_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task595_mocha_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task595_mocha_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task596_mocha_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task596_mocha_question_generation.json new file mode 100644 index 000000000..9e31887c2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task596_mocha_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task596_mocha_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task596_mocha_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task597_cuad_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task597_cuad_answer_generation.json new file mode 100644 index 000000000..7e9fa0839 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task597_cuad_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task597_cuad_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task597_cuad_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task598_cuad_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task598_cuad_answer_generation.json new file mode 100644 index 000000000..94803a750 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task598_cuad_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task598_cuad_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task598_cuad_answer_generation" + ] + 
}, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task599_cuad_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task599_cuad_question_generation.json new file mode 100644 index 000000000..9dc19113d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task599_cuad_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task599_cuad_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task599_cuad_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task600_find_the_longest_common_substring_in_two_strings.json b/src/unitxt/catalog/cards/natural_instructions/train/task600_find_the_longest_common_substring_in_two_strings.json new file mode 100644 index 000000000..8e09317ad --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task600_find_the_longest_common_substring_in_two_strings.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task600_find_the_longest_common_substring_in_two_strings.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task600_find_the_longest_common_substring_in_two_strings" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task605_find_the_longest_common_subsequence_in_two_lists.json b/src/unitxt/catalog/cards/natural_instructions/train/task605_find_the_longest_common_subsequence_in_two_lists.json new file mode 100644 index 000000000..bac450f01 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task605_find_the_longest_common_subsequence_in_two_lists.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task605_find_the_longest_common_subsequence_in_two_lists.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" 
+ ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task605_find_the_longest_common_subsequence_in_two_lists" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task606_sum_of_all_numbers_in_list_between_positions_i_and_j.json b/src/unitxt/catalog/cards/natural_instructions/train/task606_sum_of_all_numbers_in_list_between_positions_i_and_j.json new file mode 100644 index 000000000..51e5dbf28 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task606_sum_of_all_numbers_in_list_between_positions_i_and_j.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task606_sum_of_all_numbers_in_list_between_positions_i_and_j.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task606_sum_of_all_numbers_in_list_between_positions_i_and_j" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task607_sbic_intentional_offense_binary_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task607_sbic_intentional_offense_binary_classification.json new file mode 100644 
index 000000000..84eba739e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task607_sbic_intentional_offense_binary_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task607_sbic_intentional_offense_binary_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task607_sbic_intentional_offense_binary_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task608_sbic_sexual_offense_binary_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task608_sbic_sexual_offense_binary_classification.json new file mode 100644 index 000000000..275d073ef --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task608_sbic_sexual_offense_binary_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task608_sbic_sexual_offense_binary_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": 
"copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task608_sbic_sexual_offense_binary_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task609_sbic_potentially_offense_binary_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task609_sbic_potentially_offense_binary_classification.json new file mode 100644 index 000000000..09915a343 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task609_sbic_potentially_offense_binary_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task609_sbic_potentially_offense_binary_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task609_sbic_potentially_offense_binary_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task610_conllpp_ner.json b/src/unitxt/catalog/cards/natural_instructions/train/task610_conllpp_ner.json new file mode 100644 index 000000000..12ec9d081 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task610_conllpp_ner.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task610_conllpp_ner.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task610_conllpp_ner" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task611_mutual_multi_turn_dialogue.json b/src/unitxt/catalog/cards/natural_instructions/train/task611_mutual_multi_turn_dialogue.json new file mode 100644 index 000000000..6b17bc415 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task611_mutual_multi_turn_dialogue.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task611_mutual_multi_turn_dialogue.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + 
"type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task611_mutual_multi_turn_dialogue" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task615_moviesqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task615_moviesqa_answer_generation.json new file mode 100644 index 000000000..e9ca68a50 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task615_moviesqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task615_moviesqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task615_moviesqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task616_cola_classification.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task616_cola_classification.json new file mode 100644 index 000000000..596d41644 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task616_cola_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task616_cola_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task616_cola_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task617_amazonreview_category_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task617_amazonreview_category_text_generation.json new file mode 100644 index 000000000..295be0ad9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task617_amazonreview_category_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task617_amazonreview_category_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": 
"copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task617_amazonreview_category_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task618_amazonreview_summary_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task618_amazonreview_summary_text_generation.json new file mode 100644 index 000000000..a845b387b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task618_amazonreview_summary_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task618_amazonreview_summary_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task618_amazonreview_summary_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet.json b/src/unitxt/catalog/cards/natural_instructions/train/task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet.json new file mode 100644 index 000000000..c36bc5e7a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task625_xlwic_true_or_false_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task625_xlwic_true_or_false_answer_generation.json new file mode 100644 index 000000000..b00cd5850 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task625_xlwic_true_or_false_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task625_xlwic_true_or_false_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task625_xlwic_true_or_false_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task626_xlwic_sentence_based_on_given_word_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task626_xlwic_sentence_based_on_given_word_sentence_generation.json new file mode 100644 index 000000000..80d2f5f8f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task626_xlwic_sentence_based_on_given_word_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task626_xlwic_sentence_based_on_given_word_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + 
"metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task626_xlwic_sentence_based_on_given_word_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task627_xlwic_word_with_same_meaning_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task627_xlwic_word_with_same_meaning_sentence_generation.json new file mode 100644 index 000000000..99781b743 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task627_xlwic_word_with_same_meaning_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task627_xlwic_word_with_same_meaning_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task627_xlwic_word_with_same_meaning_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task628_xlwic_word_with_different_meaning_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task628_xlwic_word_with_different_meaning_sentence_generation.json new 
file mode 100644 index 000000000..d8781876e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task628_xlwic_word_with_different_meaning_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task628_xlwic_word_with_different_meaning_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task628_xlwic_word_with_different_meaning_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task629_dbpedia_14_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task629_dbpedia_14_classification.json new file mode 100644 index 000000000..77a8cc165 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task629_dbpedia_14_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task629_dbpedia_14_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ 
+ [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task629_dbpedia_14_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task630_dbpedia_14_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task630_dbpedia_14_classification.json new file mode 100644 index 000000000..a13405b9c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task630_dbpedia_14_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task630_dbpedia_14_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task630_dbpedia_14_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task631_dbpedia_14_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task631_dbpedia_14_incorrect_answer_generation.json 
new file mode 100644 index 000000000..d81b04787 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task631_dbpedia_14_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task631_dbpedia_14_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task631_dbpedia_14_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task632_dbpedia_14_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task632_dbpedia_14_classification.json new file mode 100644 index 000000000..4efb8364c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task632_dbpedia_14_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task632_dbpedia_14_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + 
"use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task632_dbpedia_14_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task633_dbpedia_14_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task633_dbpedia_14_answer_generation.json new file mode 100644 index 000000000..5ba0b81f0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task633_dbpedia_14_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task633_dbpedia_14_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task633_dbpedia_14_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task636_extract_and_sort_unique_alphabets_in_a_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task636_extract_and_sort_unique_alphabets_in_a_list.json new file mode 
100644 index 000000000..bb67bf32f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task636_extract_and_sort_unique_alphabets_in_a_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task636_extract_and_sort_unique_alphabets_in_a_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task636_extract_and_sort_unique_alphabets_in_a_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task637_extract_and_sort_unique_digits_in_a_list.json b/src/unitxt/catalog/cards/natural_instructions/train/task637_extract_and_sort_unique_digits_in_a_list.json new file mode 100644 index 000000000..7bacf87bc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task637_extract_and_sort_unique_digits_in_a_list.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task637_extract_and_sort_unique_digits_in_a_list.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + 
"field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task637_extract_and_sort_unique_digits_in_a_list" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task638_multi_woz_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task638_multi_woz_classification.json new file mode 100644 index 000000000..8eb9cc1e4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task638_multi_woz_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task638_multi_woz_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task638_multi_woz_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task639_multi_woz_user_utterance_generation.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task639_multi_woz_user_utterance_generation.json new file mode 100644 index 000000000..57cb47f7d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task639_multi_woz_user_utterance_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task639_multi_woz_user_utterance_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task639_multi_woz_user_utterance_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task649_race_blank_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task649_race_blank_question_generation.json new file mode 100644 index 000000000..89ec1edcc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task649_race_blank_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task649_race_blank_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + 
"test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task649_race_blank_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task664_mmmlu_answer_generation_abstract_algebra.json b/src/unitxt/catalog/cards/natural_instructions/train/task664_mmmlu_answer_generation_abstract_algebra.json new file mode 100644 index 000000000..edc10c58c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task664_mmmlu_answer_generation_abstract_algebra.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task664_mmmlu_answer_generation_abstract_algebra.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task664_mmmlu_answer_generation_abstract_algebra" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task665_mmmlu_answer_generation_anatomy.json b/src/unitxt/catalog/cards/natural_instructions/train/task665_mmmlu_answer_generation_anatomy.json new file mode 100644 index 000000000..4bb2a82ae --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task665_mmmlu_answer_generation_anatomy.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task665_mmmlu_answer_generation_anatomy.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task665_mmmlu_answer_generation_anatomy" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task666_mmmlu_answer_generation_astronomy.json b/src/unitxt/catalog/cards/natural_instructions/train/task666_mmmlu_answer_generation_astronomy.json new file mode 100644 index 000000000..3fa13ca48 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task666_mmmlu_answer_generation_astronomy.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task666_mmmlu_answer_generation_astronomy.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + 
"type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task666_mmmlu_answer_generation_astronomy" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task667_mmmlu_answer_generation_business_ethics.json b/src/unitxt/catalog/cards/natural_instructions/train/task667_mmmlu_answer_generation_business_ethics.json new file mode 100644 index 000000000..0cee6b175 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task667_mmmlu_answer_generation_business_ethics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task667_mmmlu_answer_generation_business_ethics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task667_mmmlu_answer_generation_business_ethics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task668_extreme_abstract_summarization.json b/src/unitxt/catalog/cards/natural_instructions/train/task668_extreme_abstract_summarization.json new file mode 100644 index 000000000..249efde0d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task668_extreme_abstract_summarization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task668_extreme_abstract_summarization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task668_extreme_abstract_summarization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task672_amazon_and_yelp_summarization_dataset_summarization.json b/src/unitxt/catalog/cards/natural_instructions/train/task672_amazon_and_yelp_summarization_dataset_summarization.json new file mode 100644 index 000000000..bcd509f8a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task672_amazon_and_yelp_summarization_dataset_summarization.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task672_amazon_and_yelp_summarization_dataset_summarization.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task672_amazon_and_yelp_summarization_dataset_summarization" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task672_nummersense.json b/src/unitxt/catalog/cards/natural_instructions/train/task672_nummersense.json new file mode 100644 index 000000000..1249f1b3e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task672_nummersense.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task672_nummersense.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task672_nummersense" + ] 
+ }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task673_google_wellformed_query_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task673_google_wellformed_query_classification.json new file mode 100644 index 000000000..544013290 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task673_google_wellformed_query_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task673_google_wellformed_query_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task673_google_wellformed_query_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task674_google_wellformed_query_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task674_google_wellformed_query_sentence_generation.json new file mode 100644 index 000000000..bf082b2d4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task674_google_wellformed_query_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task674_google_wellformed_query_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task674_google_wellformed_query_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task675_google_wellformed_query_sentence_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task675_google_wellformed_query_sentence_generation.json new file mode 100644 index 000000000..3d65b8733 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task675_google_wellformed_query_sentence_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task675_google_wellformed_query_sentence_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { 
+ "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task675_google_wellformed_query_sentence_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task679_hope_edi_english_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task679_hope_edi_english_text_classification.json new file mode 100644 index 000000000..b15f9321b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task679_hope_edi_english_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task679_hope_edi_english_text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task679_hope_edi_english_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task681_hope_edi_malayalam_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task681_hope_edi_malayalam_text_classification.json new file mode 100644 index 000000000..c13e76d51 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task681_hope_edi_malayalam_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task681_hope_edi_malayalam_text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task681_hope_edi_malayalam_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task682_online_privacy_policy_text_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task682_online_privacy_policy_text_classification.json new file mode 100644 index 000000000..78535031d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task682_online_privacy_policy_text_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task682_online_privacy_policy_text_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + 
"use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task682_online_privacy_policy_text_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task683_online_privacy_policy_text_purpose_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task683_online_privacy_policy_text_purpose_answer_generation.json new file mode 100644 index 000000000..2d96c1864 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task683_online_privacy_policy_text_purpose_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task683_online_privacy_policy_text_purpose_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task683_online_privacy_policy_text_purpose_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task684_online_privacy_policy_text_information_type_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task684_online_privacy_policy_text_information_type_generation.json new file mode 100644 index 000000000..0860b4dc3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task684_online_privacy_policy_text_information_type_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task684_online_privacy_policy_text_information_type_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task684_online_privacy_policy_text_information_type_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task685_mmmlu_answer_generation_clinical_knowledge.json b/src/unitxt/catalog/cards/natural_instructions/train/task685_mmmlu_answer_generation_clinical_knowledge.json new file mode 100644 index 000000000..7db7852f6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task685_mmmlu_answer_generation_clinical_knowledge.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task685_mmmlu_answer_generation_clinical_knowledge.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task685_mmmlu_answer_generation_clinical_knowledge" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task686_mmmlu_answer_generation_college_biology.json b/src/unitxt/catalog/cards/natural_instructions/train/task686_mmmlu_answer_generation_college_biology.json new file mode 100644 index 000000000..1b31fc21a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task686_mmmlu_answer_generation_college_biology.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task686_mmmlu_answer_generation_college_biology.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task686_mmmlu_answer_generation_college_biology" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task687_mmmlu_answer_generation_college_chemistry.json b/src/unitxt/catalog/cards/natural_instructions/train/task687_mmmlu_answer_generation_college_chemistry.json new file mode 100644 index 000000000..1edd0b9df --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task687_mmmlu_answer_generation_college_chemistry.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task687_mmmlu_answer_generation_college_chemistry.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task687_mmmlu_answer_generation_college_chemistry" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task688_mmmlu_answer_generation_college_computer_science.json b/src/unitxt/catalog/cards/natural_instructions/train/task688_mmmlu_answer_generation_college_computer_science.json new file mode 100644 index 000000000..39ce487a1 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task688_mmmlu_answer_generation_college_computer_science.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task688_mmmlu_answer_generation_college_computer_science.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task688_mmmlu_answer_generation_college_computer_science" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task689_mmmlu_answer_generation_college_mathematics.json b/src/unitxt/catalog/cards/natural_instructions/train/task689_mmmlu_answer_generation_college_mathematics.json new file mode 100644 index 000000000..f2f5d5546 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task689_mmmlu_answer_generation_college_mathematics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task689_mmmlu_answer_generation_college_mathematics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ 
+ "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task689_mmmlu_answer_generation_college_mathematics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task690_mmmlu_answer_generation_college_medicine.json b/src/unitxt/catalog/cards/natural_instructions/train/task690_mmmlu_answer_generation_college_medicine.json new file mode 100644 index 000000000..5362ec617 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task690_mmmlu_answer_generation_college_medicine.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task690_mmmlu_answer_generation_college_medicine.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task690_mmmlu_answer_generation_college_medicine" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task691_mmmlu_answer_generation_college_physics.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task691_mmmlu_answer_generation_college_physics.json new file mode 100644 index 000000000..815dcfb05 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task691_mmmlu_answer_generation_college_physics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task691_mmmlu_answer_generation_college_physics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task691_mmmlu_answer_generation_college_physics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task692_mmmlu_answer_generation_computer_security.json b/src/unitxt/catalog/cards/natural_instructions/train/task692_mmmlu_answer_generation_computer_security.json new file mode 100644 index 000000000..fd0fe35a6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task692_mmmlu_answer_generation_computer_security.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task692_mmmlu_answer_generation_computer_security.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + 
"train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task692_mmmlu_answer_generation_computer_security" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task693_mmmlu_answer_generation_conceptual_physics.json b/src/unitxt/catalog/cards/natural_instructions/train/task693_mmmlu_answer_generation_conceptual_physics.json new file mode 100644 index 000000000..380293159 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task693_mmmlu_answer_generation_conceptual_physics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task693_mmmlu_answer_generation_conceptual_physics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task693_mmmlu_answer_generation_conceptual_physics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at 
end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task694_mmmlu_answer_generation_econometrics.json b/src/unitxt/catalog/cards/natural_instructions/train/task694_mmmlu_answer_generation_econometrics.json new file mode 100644 index 000000000..4720099e1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task694_mmmlu_answer_generation_econometrics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task694_mmmlu_answer_generation_econometrics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task694_mmmlu_answer_generation_econometrics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task695_mmmlu_answer_generation_electrical_engineering.json b/src/unitxt/catalog/cards/natural_instructions/train/task695_mmmlu_answer_generation_electrical_engineering.json new file mode 100644 index 000000000..b78e86b74 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task695_mmmlu_answer_generation_electrical_engineering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task695_mmmlu_answer_generation_electrical_engineering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task695_mmmlu_answer_generation_electrical_engineering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task696_mmmlu_answer_generation_elementary_mathematics.json b/src/unitxt/catalog/cards/natural_instructions/train/task696_mmmlu_answer_generation_elementary_mathematics.json new file mode 100644 index 000000000..290178dba --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task696_mmmlu_answer_generation_elementary_mathematics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task696_mmmlu_answer_generation_elementary_mathematics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + 
"instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task696_mmmlu_answer_generation_elementary_mathematics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task697_mmmlu_answer_generation_formal_logic.json b/src/unitxt/catalog/cards/natural_instructions/train/task697_mmmlu_answer_generation_formal_logic.json new file mode 100644 index 000000000..ac3833d32 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task697_mmmlu_answer_generation_formal_logic.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task697_mmmlu_answer_generation_formal_logic.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task697_mmmlu_answer_generation_formal_logic" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task698_mmmlu_answer_generation_global_facts.json b/src/unitxt/catalog/cards/natural_instructions/train/task698_mmmlu_answer_generation_global_facts.json new file mode 100644 index 000000000..0b03e7645 --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task698_mmmlu_answer_generation_global_facts.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task698_mmmlu_answer_generation_global_facts.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task698_mmmlu_answer_generation_global_facts" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task699_mmmlu_answer_generation_high_school_biology.json b/src/unitxt/catalog/cards/natural_instructions/train/task699_mmmlu_answer_generation_high_school_biology.json new file mode 100644 index 000000000..9fa0472e1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task699_mmmlu_answer_generation_high_school_biology.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task699_mmmlu_answer_generation_high_school_biology.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + 
"use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task699_mmmlu_answer_generation_high_school_biology" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task700_mmmlu_answer_generation_high_school_chemistry.json b/src/unitxt/catalog/cards/natural_instructions/train/task700_mmmlu_answer_generation_high_school_chemistry.json new file mode 100644 index 000000000..47e178bbf --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task700_mmmlu_answer_generation_high_school_chemistry.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task700_mmmlu_answer_generation_high_school_chemistry.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task700_mmmlu_answer_generation_high_school_chemistry" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task701_mmmlu_answer_generation_high_school_computer_science.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task701_mmmlu_answer_generation_high_school_computer_science.json new file mode 100644 index 000000000..200cabdb6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task701_mmmlu_answer_generation_high_school_computer_science.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task701_mmmlu_answer_generation_high_school_computer_science.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task701_mmmlu_answer_generation_high_school_computer_science" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task702_mmmlu_answer_generation_high_school_european_history.json b/src/unitxt/catalog/cards/natural_instructions/train/task702_mmmlu_answer_generation_high_school_european_history.json new file mode 100644 index 000000000..ead6c9160 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task702_mmmlu_answer_generation_high_school_european_history.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task702_mmmlu_answer_generation_high_school_european_history.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task702_mmmlu_answer_generation_high_school_european_history" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task703_mmmlu_answer_generation_high_school_geography.json b/src/unitxt/catalog/cards/natural_instructions/train/task703_mmmlu_answer_generation_high_school_geography.json new file mode 100644 index 000000000..e0175b668 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task703_mmmlu_answer_generation_high_school_geography.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task703_mmmlu_answer_generation_high_school_geography.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task703_mmmlu_answer_generation_high_school_geography" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task704_mmmlu_answer_generation_high_school_government_and_politics.json b/src/unitxt/catalog/cards/natural_instructions/train/task704_mmmlu_answer_generation_high_school_government_and_politics.json new file mode 100644 index 000000000..b6170d26a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task704_mmmlu_answer_generation_high_school_government_and_politics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task704_mmmlu_answer_generation_high_school_government_and_politics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task704_mmmlu_answer_generation_high_school_government_and_politics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task705_mmmlu_answer_generation_high_school_macroeconomics.json b/src/unitxt/catalog/cards/natural_instructions/train/task705_mmmlu_answer_generation_high_school_macroeconomics.json new file mode 100644 index 000000000..efc387663 --- 
/dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task705_mmmlu_answer_generation_high_school_macroeconomics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task705_mmmlu_answer_generation_high_school_macroeconomics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task705_mmmlu_answer_generation_high_school_macroeconomics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task706_mmmlu_answer_generation_high_school_mathematics.json b/src/unitxt/catalog/cards/natural_instructions/train/task706_mmmlu_answer_generation_high_school_mathematics.json new file mode 100644 index 000000000..4090a2cca --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task706_mmmlu_answer_generation_high_school_mathematics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task706_mmmlu_answer_generation_high_school_mathematics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": 
"copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task706_mmmlu_answer_generation_high_school_mathematics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task707_mmmlu_answer_generation_high_school_microeconomics.json b/src/unitxt/catalog/cards/natural_instructions/train/task707_mmmlu_answer_generation_high_school_microeconomics.json new file mode 100644 index 000000000..e765dbf70 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task707_mmmlu_answer_generation_high_school_microeconomics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task707_mmmlu_answer_generation_high_school_microeconomics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task707_mmmlu_answer_generation_high_school_microeconomics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task708_mmmlu_answer_generation_high_school_physics.json b/src/unitxt/catalog/cards/natural_instructions/train/task708_mmmlu_answer_generation_high_school_physics.json new file mode 100644 index 000000000..c923cf413 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task708_mmmlu_answer_generation_high_school_physics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task708_mmmlu_answer_generation_high_school_physics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task708_mmmlu_answer_generation_high_school_physics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task709_mmmlu_answer_generation_high_school_psychology.json b/src/unitxt/catalog/cards/natural_instructions/train/task709_mmmlu_answer_generation_high_school_psychology.json new file mode 100644 index 000000000..57770fa5d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task709_mmmlu_answer_generation_high_school_psychology.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task709_mmmlu_answer_generation_high_school_psychology.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task709_mmmlu_answer_generation_high_school_psychology" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task710_mmmlu_answer_generation_high_school_statistics.json b/src/unitxt/catalog/cards/natural_instructions/train/task710_mmmlu_answer_generation_high_school_statistics.json new file mode 100644 index 000000000..af8f16365 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task710_mmmlu_answer_generation_high_school_statistics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task710_mmmlu_answer_generation_high_school_statistics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + 
"instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task710_mmmlu_answer_generation_high_school_statistics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task711_mmmlu_answer_generation_high_school_us_history.json b/src/unitxt/catalog/cards/natural_instructions/train/task711_mmmlu_answer_generation_high_school_us_history.json new file mode 100644 index 000000000..05e28f928 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task711_mmmlu_answer_generation_high_school_us_history.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task711_mmmlu_answer_generation_high_school_us_history.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task711_mmmlu_answer_generation_high_school_us_history" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task712_mmmlu_answer_generation_high_school_world_history.json b/src/unitxt/catalog/cards/natural_instructions/train/task712_mmmlu_answer_generation_high_school_world_history.json new file mode 100644 index 000000000..16d3e57c7 --- 
/dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task712_mmmlu_answer_generation_high_school_world_history.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task712_mmmlu_answer_generation_high_school_world_history.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task712_mmmlu_answer_generation_high_school_world_history" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task713_mmmlu_answer_generation_human_aging.json b/src/unitxt/catalog/cards/natural_instructions/train/task713_mmmlu_answer_generation_human_aging.json new file mode 100644 index 000000000..52d83ba19 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task713_mmmlu_answer_generation_human_aging.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task713_mmmlu_answer_generation_human_aging.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + 
"target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task713_mmmlu_answer_generation_human_aging" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task714_mmmlu_answer_generation_human_sexuality.json b/src/unitxt/catalog/cards/natural_instructions/train/task714_mmmlu_answer_generation_human_sexuality.json new file mode 100644 index 000000000..2cc02700e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task714_mmmlu_answer_generation_human_sexuality.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task714_mmmlu_answer_generation_human_sexuality.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task714_mmmlu_answer_generation_human_sexuality" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task715_mmmlu_answer_generation_international_law.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task715_mmmlu_answer_generation_international_law.json new file mode 100644 index 000000000..d778a638d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task715_mmmlu_answer_generation_international_law.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task715_mmmlu_answer_generation_international_law.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task715_mmmlu_answer_generation_international_law" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task716_mmmlu_answer_generation_jurisprudence.json b/src/unitxt/catalog/cards/natural_instructions/train/task716_mmmlu_answer_generation_jurisprudence.json new file mode 100644 index 000000000..edbcf4db3 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task716_mmmlu_answer_generation_jurisprudence.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task716_mmmlu_answer_generation_jurisprudence.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": 
"train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task716_mmmlu_answer_generation_jurisprudence" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task717_mmmlu_answer_generation_logical_fallacies.json b/src/unitxt/catalog/cards/natural_instructions/train/task717_mmmlu_answer_generation_logical_fallacies.json new file mode 100644 index 000000000..ef9ad6481 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task717_mmmlu_answer_generation_logical_fallacies.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task717_mmmlu_answer_generation_logical_fallacies.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task717_mmmlu_answer_generation_logical_fallacies" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff 
--git a/src/unitxt/catalog/cards/natural_instructions/train/task718_mmmlu_answer_generation_machine_learning.json b/src/unitxt/catalog/cards/natural_instructions/train/task718_mmmlu_answer_generation_machine_learning.json new file mode 100644 index 000000000..319740e9d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task718_mmmlu_answer_generation_machine_learning.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task718_mmmlu_answer_generation_machine_learning.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task718_mmmlu_answer_generation_machine_learning" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task719_mmmlu_answer_generation_management.json b/src/unitxt/catalog/cards/natural_instructions/train/task719_mmmlu_answer_generation_management.json new file mode 100644 index 000000000..2bc4d8a9a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task719_mmmlu_answer_generation_management.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task719_mmmlu_answer_generation_management.json", + "field": "Instances", + 
"path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task719_mmmlu_answer_generation_management" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task720_mmmlu_answer_generation_marketing.json b/src/unitxt/catalog/cards/natural_instructions/train/task720_mmmlu_answer_generation_marketing.json new file mode 100644 index 000000000..7f9bf6b4c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task720_mmmlu_answer_generation_marketing.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task720_mmmlu_answer_generation_marketing.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task720_mmmlu_answer_generation_marketing" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task721_mmmlu_answer_generation_medical_genetics.json b/src/unitxt/catalog/cards/natural_instructions/train/task721_mmmlu_answer_generation_medical_genetics.json new file mode 100644 index 000000000..2068ce819 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task721_mmmlu_answer_generation_medical_genetics.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task721_mmmlu_answer_generation_medical_genetics.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task721_mmmlu_answer_generation_medical_genetics" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task722_mmmlu_answer_generation_random_topic.json b/src/unitxt/catalog/cards/natural_instructions/train/task722_mmmlu_answer_generation_random_topic.json new file mode 100644 index 000000000..55672f430 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task722_mmmlu_answer_generation_random_topic.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task722_mmmlu_answer_generation_random_topic.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task722_mmmlu_answer_generation_random_topic" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task723_mmmlu_answer_generation_moral_disputes.json b/src/unitxt/catalog/cards/natural_instructions/train/task723_mmmlu_answer_generation_moral_disputes.json new file mode 100644 index 000000000..ac9a9780f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task723_mmmlu_answer_generation_moral_disputes.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task723_mmmlu_answer_generation_moral_disputes.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + 
"items": [ + "instructions.natural_instructions.train.task723_mmmlu_answer_generation_moral_disputes" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task724_mmmlu_answer_generation_moral_scenarios.json b/src/unitxt/catalog/cards/natural_instructions/train/task724_mmmlu_answer_generation_moral_scenarios.json new file mode 100644 index 000000000..4deeb9983 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task724_mmmlu_answer_generation_moral_scenarios.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task724_mmmlu_answer_generation_moral_scenarios.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task724_mmmlu_answer_generation_moral_scenarios" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task725_mmmlu_answer_generation_nutrition.json b/src/unitxt/catalog/cards/natural_instructions/train/task725_mmmlu_answer_generation_nutrition.json new file mode 100644 index 000000000..380cdc889 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task725_mmmlu_answer_generation_nutrition.json @@ -0,0 +1,53 @@ 
+{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task725_mmmlu_answer_generation_nutrition.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task725_mmmlu_answer_generation_nutrition" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task726_mmmlu_answer_generation_philosophy.json b/src/unitxt/catalog/cards/natural_instructions/train/task726_mmmlu_answer_generation_philosophy.json new file mode 100644 index 000000000..6938079de --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task726_mmmlu_answer_generation_philosophy.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task726_mmmlu_answer_generation_philosophy.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, 
+ "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task726_mmmlu_answer_generation_philosophy" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task727_mmmlu_answer_generation_prehistory.json b/src/unitxt/catalog/cards/natural_instructions/train/task727_mmmlu_answer_generation_prehistory.json new file mode 100644 index 000000000..3e9d21dd5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task727_mmmlu_answer_generation_prehistory.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task727_mmmlu_answer_generation_prehistory.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task727_mmmlu_answer_generation_prehistory" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task728_mmmlu_answer_generation_professional_accounting.json b/src/unitxt/catalog/cards/natural_instructions/train/task728_mmmlu_answer_generation_professional_accounting.json new file mode 100644 index 000000000..f9b3c063b --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task728_mmmlu_answer_generation_professional_accounting.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task728_mmmlu_answer_generation_professional_accounting.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task728_mmmlu_answer_generation_professional_accounting" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task729_mmmlu_answer_generation_professional_law.json b/src/unitxt/catalog/cards/natural_instructions/train/task729_mmmlu_answer_generation_professional_law.json new file mode 100644 index 000000000..f96522e30 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task729_mmmlu_answer_generation_professional_law.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task729_mmmlu_answer_generation_professional_law.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + 
"target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task729_mmmlu_answer_generation_professional_law" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task730_mmmlu_answer_generation_professional_medicine.json b/src/unitxt/catalog/cards/natural_instructions/train/task730_mmmlu_answer_generation_professional_medicine.json new file mode 100644 index 000000000..d4c8463fb --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task730_mmmlu_answer_generation_professional_medicine.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task730_mmmlu_answer_generation_professional_medicine.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task730_mmmlu_answer_generation_professional_medicine" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task731_mmmlu_answer_generation_professional_psychology.json 
b/src/unitxt/catalog/cards/natural_instructions/train/task731_mmmlu_answer_generation_professional_psychology.json new file mode 100644 index 000000000..2ce26f6b4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task731_mmmlu_answer_generation_professional_psychology.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task731_mmmlu_answer_generation_professional_psychology.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task731_mmmlu_answer_generation_professional_psychology" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task732_mmmlu_answer_generation_public_relations.json b/src/unitxt/catalog/cards/natural_instructions/train/task732_mmmlu_answer_generation_public_relations.json new file mode 100644 index 000000000..a4e437c80 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task732_mmmlu_answer_generation_public_relations.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task732_mmmlu_answer_generation_public_relations.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task732_mmmlu_answer_generation_public_relations" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task733_mmmlu_answer_generation_security_studies.json b/src/unitxt/catalog/cards/natural_instructions/train/task733_mmmlu_answer_generation_security_studies.json new file mode 100644 index 000000000..90dc1500a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task733_mmmlu_answer_generation_security_studies.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task733_mmmlu_answer_generation_security_studies.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task733_mmmlu_answer_generation_security_studies" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] 
+ } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task734_mmmlu_answer_generation_sociology.json b/src/unitxt/catalog/cards/natural_instructions/train/task734_mmmlu_answer_generation_sociology.json new file mode 100644 index 000000000..c067396f9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task734_mmmlu_answer_generation_sociology.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task734_mmmlu_answer_generation_sociology.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task734_mmmlu_answer_generation_sociology" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task735_mmmlu_answer_generation_us_foreign_policy.json b/src/unitxt/catalog/cards/natural_instructions/train/task735_mmmlu_answer_generation_us_foreign_policy.json new file mode 100644 index 000000000..e749542e9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task735_mmmlu_answer_generation_us_foreign_policy.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task735_mmmlu_answer_generation_us_foreign_policy.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task735_mmmlu_answer_generation_us_foreign_policy" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task736_mmmlu_answer_generation_virology.json b/src/unitxt/catalog/cards/natural_instructions/train/task736_mmmlu_answer_generation_virology.json new file mode 100644 index 000000000..8948bbf9e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task736_mmmlu_answer_generation_virology.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task736_mmmlu_answer_generation_virology.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task736_mmmlu_answer_generation_virology" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task737_mmmlu_answer_generation_world_religions.json b/src/unitxt/catalog/cards/natural_instructions/train/task737_mmmlu_answer_generation_world_religions.json new file mode 100644 index 000000000..8b010b504 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task737_mmmlu_answer_generation_world_religions.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task737_mmmlu_answer_generation_world_religions.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task737_mmmlu_answer_generation_world_religions" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task739_lhoestq_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task739_lhoestq_question_generation.json new file mode 100644 index 000000000..b17bf2e1a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task739_lhoestq_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + 
"loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task739_lhoestq_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task739_lhoestq_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task740_lhoestq_answer_generation_quantity.json b/src/unitxt/catalog/cards/natural_instructions/train/task740_lhoestq_answer_generation_quantity.json new file mode 100644 index 000000000..7fd213860 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task740_lhoestq_answer_generation_quantity.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task740_lhoestq_answer_generation_quantity.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task740_lhoestq_answer_generation_quantity" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task741_lhoestq_answer_generation_place.json b/src/unitxt/catalog/cards/natural_instructions/train/task741_lhoestq_answer_generation_place.json new file mode 100644 index 000000000..f87118544 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task741_lhoestq_answer_generation_place.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task741_lhoestq_answer_generation_place.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task741_lhoestq_answer_generation_place" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task742_lhoestq_answer_generation_frequency.json b/src/unitxt/catalog/cards/natural_instructions/train/task742_lhoestq_answer_generation_frequency.json new file mode 100644 index 000000000..ccd5cafa1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task742_lhoestq_answer_generation_frequency.json @@ -0,0 +1,53 @@ +{ + "type": 
"task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task742_lhoestq_answer_generation_frequency.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task742_lhoestq_answer_generation_frequency" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task745_ai2_arithmetic_questions_arithmetic.json b/src/unitxt/catalog/cards/natural_instructions/train/task745_ai2_arithmetic_questions_arithmetic.json new file mode 100644 index 000000000..85dcbf1b5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task745_ai2_arithmetic_questions_arithmetic.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task745_ai2_arithmetic_questions_arithmetic.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + 
"instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task745_ai2_arithmetic_questions_arithmetic" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task746_yelp_restaurant_review_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task746_yelp_restaurant_review_classification.json new file mode 100644 index 000000000..b4781998e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task746_yelp_restaurant_review_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task746_yelp_restaurant_review_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task746_yelp_restaurant_review_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task750_aqua_multiple_choice_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task750_aqua_multiple_choice_answering.json new file mode 100644 index 000000000..84c7ff25c --- /dev/null +++ 
b/src/unitxt/catalog/cards/natural_instructions/train/task750_aqua_multiple_choice_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task750_aqua_multiple_choice_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task750_aqua_multiple_choice_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task751_svamp_subtraction_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task751_svamp_subtraction_question_answering.json new file mode 100644 index 000000000..433fd35c5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task751_svamp_subtraction_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task751_svamp_subtraction_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + 
"type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task751_svamp_subtraction_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task752_svamp_multiplication_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task752_svamp_multiplication_question_answering.json new file mode 100644 index 000000000..8da51b6de --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task752_svamp_multiplication_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task752_svamp_multiplication_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task752_svamp_multiplication_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task753_svamp_addition_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task753_svamp_addition_question_answering.json new file 
mode 100644 index 000000000..9ff123c98 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task753_svamp_addition_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task753_svamp_addition_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task753_svamp_addition_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task754_svamp_common_division_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task754_svamp_common_division_question_answering.json new file mode 100644 index 000000000..50dc64fd8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task754_svamp_common_division_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task754_svamp_common-division_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ 
+ "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task754_svamp_common_division_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists.json b/src/unitxt/catalog/cards/natural_instructions/train/task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists.json new file mode 100644 index 000000000..01273b37f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + 
"templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task756_find_longert_substring_and_return_all_unique_alphabets_in_it.json b/src/unitxt/catalog/cards/natural_instructions/train/task756_find_longert_substring_and_return_all_unique_alphabets_in_it.json new file mode 100644 index 000000000..e0b0cf3cc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task756_find_longert_substring_and_return_all_unique_alphabets_in_it.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task756_find_longert_substring_and_return_all_unique_alphabets_in_it.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task756_find_longert_substring_and_return_all_unique_alphabets_in_it" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task761_app_review_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task761_app_review_classification.json new file mode 100644 index 000000000..e8e10ef6b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task761_app_review_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task761_app_review_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task761_app_review_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task766_craigslist_bargains_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task766_craigslist_bargains_classification.json new file mode 100644 index 000000000..7eb2ad468 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task766_craigslist_bargains_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task766_craigslist_bargains_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task766_craigslist_bargains_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task767_craigslist_bargains_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task767_craigslist_bargains_classification.json new file mode 100644 index 000000000..b13448e0f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task767_craigslist_bargains_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task767_craigslist_bargains_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task767_craigslist_bargains_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task770_pawsx_english_text_modification.json b/src/unitxt/catalog/cards/natural_instructions/train/task770_pawsx_english_text_modification.json new file mode 100644 index 000000000..83bfe4120 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task770_pawsx_english_text_modification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + 
"type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task770_pawsx_english_text_modification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task770_pawsx_english_text_modification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task819_pec_sentiment_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task819_pec_sentiment_classification.json new file mode 100644 index 000000000..213a34d6b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task819_pec_sentiment_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task819_pec_sentiment_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task819_pec_sentiment_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task820_protoqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task820_protoqa_answer_generation.json new file mode 100644 index 000000000..343075be6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task820_protoqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task820_protoqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task820_protoqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task821_protoqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task821_protoqa_question_generation.json new file mode 100644 index 000000000..165e460bf --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task821_protoqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task821_protoqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task821_protoqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task823_peixian_rtgender_sentiment_analysis.json b/src/unitxt/catalog/cards/natural_instructions/train/task823_peixian_rtgender_sentiment_analysis.json new file mode 100644 index 000000000..05ab2d606 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task823_peixian_rtgender_sentiment_analysis.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task823_peixian-rtgender_sentiment_analysis.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task823_peixian_rtgender_sentiment_analysis" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task833_poem_sentiment_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task833_poem_sentiment_classification.json new file mode 100644 index 000000000..9b6869464 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task833_poem_sentiment_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task833_poem_sentiment_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task833_poem_sentiment_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task834_mathdataset_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task834_mathdataset_classification.json new file mode 100644 index 000000000..2c2133ec9 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task834_mathdataset_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task834_mathdataset_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task834_mathdataset_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task835_mathdataset_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task835_mathdataset_answer_generation.json new file mode 100644 index 000000000..a56d17906 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task835_mathdataset_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task835_mathdataset_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task835_mathdataset_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task843_financial_phrasebank_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task843_financial_phrasebank_classification.json new file mode 100644 index 000000000..10770937b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task843_financial_phrasebank_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task843_financial_phrasebank_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task843_financial_phrasebank_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task844_financial_phrasebank_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task844_financial_phrasebank_classification.json new file mode 100644 index 000000000..078236212 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task844_financial_phrasebank_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + 
"loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task844_financial_phrasebank_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task844_financial_phrasebank_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task845_pubmedqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task845_pubmedqa_question_generation.json new file mode 100644 index 000000000..2441ce120 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task845_pubmedqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task845_pubmedqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task845_pubmedqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task846_pubmedqa_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task846_pubmedqa_classification.json new file mode 100644 index 000000000..e36394758 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task846_pubmedqa_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task846_pubmedqa_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task846_pubmedqa_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task847_pubmedqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task847_pubmedqa_question_generation.json new file mode 100644 index 000000000..af9baf4ee --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task847_pubmedqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task847_pubmedqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task847_pubmedqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task848_pubmedqa_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task848_pubmedqa_classification.json new file mode 100644 index 000000000..07819bf4c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task848_pubmedqa_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task848_pubmedqa_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task848_pubmedqa_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task849_pubmedqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task849_pubmedqa_answer_generation.json new file mode 100644 index 000000000..4aa31d6b1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task849_pubmedqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task849_pubmedqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task849_pubmedqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task850_synthetic_longest_palindrome.json b/src/unitxt/catalog/cards/natural_instructions/train/task850_synthetic_longest_palindrome.json new file mode 100644 index 000000000..b27f2a4dc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task850_synthetic_longest_palindrome.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task850_synthetic_longest_palindrome.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task850_synthetic_longest_palindrome" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task851_synthetic_multiply_evens.json b/src/unitxt/catalog/cards/natural_instructions/train/task851_synthetic_multiply_evens.json new file mode 100644 index 000000000..679a9236b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task851_synthetic_multiply_evens.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task851_synthetic_multiply_evens.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task851_synthetic_multiply_evens" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task852_synthetic_multiply_odds.json b/src/unitxt/catalog/cards/natural_instructions/train/task852_synthetic_multiply_odds.json new file mode 100644 index 000000000..745ff0109 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task852_synthetic_multiply_odds.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task852_synthetic_multiply_odds.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task852_synthetic_multiply_odds" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task853_hippocorpus_long_text_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task853_hippocorpus_long_text_generation.json new file mode 100644 index 000000000..1e662c27f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task853_hippocorpus_long_text_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task853_hippocorpus_long_text_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task853_hippocorpus_long_text_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task854_hippocorpus_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task854_hippocorpus_classification.json new file mode 100644 index 000000000..e5afcc463 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task854_hippocorpus_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task854_hippocorpus_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task854_hippocorpus_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task855_conv_ai_2_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task855_conv_ai_2_classification.json new file mode 100644 index 000000000..f4e2d6717 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task855_conv_ai_2_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task855_conv_ai_2_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task855_conv_ai_2_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task856_conv_ai_2_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task856_conv_ai_2_classification.json new file mode 100644 index 000000000..843033f49 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task856_conv_ai_2_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task856_conv_ai_2_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task856_conv_ai_2_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task857_inquisitive_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task857_inquisitive_question_generation.json new file mode 100644 index 000000000..03abe0469 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task857_inquisitive_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task857_inquisitive_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task857_inquisitive_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task858_inquisitive_span_detection.json b/src/unitxt/catalog/cards/natural_instructions/train/task858_inquisitive_span_detection.json new file mode 100644 index 000000000..d44a0320f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task858_inquisitive_span_detection.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task858_inquisitive_span_detection.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task858_inquisitive_span_detection" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task859_prost_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task859_prost_question_generation.json new file mode 100644 index 000000000..2950b8d0b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task859_prost_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task859_prost_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task859_prost_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task860_prost_mcq_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task860_prost_mcq_generation.json new file mode 100644 index 000000000..1c45a2247 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task860_prost_mcq_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task860_prost_mcq_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task860_prost_mcq_generation" + ] + }, + 
"templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task861_asdiv_addsub_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task861_asdiv_addsub_question_answering.json new file mode 100644 index 000000000..c967d6e8b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task861_asdiv_addsub_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task861_asdiv_addsub_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task861_asdiv_addsub_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task861_prost_mcq_answers_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task861_prost_mcq_answers_generation.json new file mode 100644 index 000000000..8397c44d4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task861_prost_mcq_answers_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task861_prost_mcq_answers_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task861_prost_mcq_answers_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task862_asdiv_multidiv_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task862_asdiv_multidiv_question_answering.json new file mode 100644 index 000000000..b16d9f1de --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task862_asdiv_multidiv_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task862_asdiv_multidiv_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task862_asdiv_multidiv_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task863_asdiv_multiop_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task863_asdiv_multiop_question_answering.json new file mode 100644 index 000000000..1fe91ec26 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task863_asdiv_multiop_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task863_asdiv_multiop_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task863_asdiv_multiop_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task864_asdiv_singleop_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task864_asdiv_singleop_question_answering.json new file mode 100644 index 000000000..af3bc952d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task864_asdiv_singleop_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": 
"load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task864_asdiv_singleop_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task864_asdiv_singleop_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task865_mawps_addsub_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task865_mawps_addsub_question_answering.json new file mode 100644 index 000000000..6f5a58b33 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task865_mawps_addsub_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task865_mawps_addsub_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": 
[ + "instructions.natural_instructions.train.task865_mawps_addsub_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task866_mawps_multidiv_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task866_mawps_multidiv_question_answering.json new file mode 100644 index 000000000..8e4f48c77 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task866_mawps_multidiv_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task866_mawps_multidiv_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task866_mawps_multidiv_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task867_mawps_multiop_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task867_mawps_multiop_question_answering.json new file mode 100644 index 000000000..7feefa73e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task867_mawps_multiop_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + 
"type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task867_mawps_multiop_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task867_mawps_multiop_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task868_cfq_mcd1_explanation_to_sql.json b/src/unitxt/catalog/cards/natural_instructions/train/task868_cfq_mcd1_explanation_to_sql.json new file mode 100644 index 000000000..3901a44ff --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task868_cfq_mcd1_explanation_to_sql.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task868_cfq_mcd1_explanation_to_sql.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task868_cfq_mcd1_explanation_to_sql" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task868_mawps_singleop_question_answering.json b/src/unitxt/catalog/cards/natural_instructions/train/task868_mawps_singleop_question_answering.json new file mode 100644 index 000000000..6c669c82f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task868_mawps_singleop_question_answering.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task868_mawps_singleop_question_answering.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task868_mawps_singleop_question_answering" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task869_cfq_mcd1_sql_to_explanation.json b/src/unitxt/catalog/cards/natural_instructions/train/task869_cfq_mcd1_sql_to_explanation.json new file mode 100644 index 000000000..ee98f758f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task869_cfq_mcd1_sql_to_explanation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + 
"data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task869_cfq_mcd1_sql_to_explanation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task869_cfq_mcd1_sql_to_explanation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task870_msmarco_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task870_msmarco_answer_generation.json new file mode 100644 index 000000000..50c81ad47 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task870_msmarco_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task870_msmarco_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task870_msmarco_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task871_msmarco_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task871_msmarco_question_generation.json new file mode 100644 index 000000000..2c6b0a32c --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task871_msmarco_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task871_msmarco_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task871_msmarco_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task874_opus_xhosanavy_sr.json b/src/unitxt/catalog/cards/natural_instructions/train/task874_opus_xhosanavy_sr.json new file mode 100644 index 000000000..ce0b2ff79 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task874_opus_xhosanavy_sr.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task874_opus_xhosanavy_sr.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task874_opus_xhosanavy_sr" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task875_emotion_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task875_emotion_classification.json new file mode 100644 index 000000000..32d24819a --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task875_emotion_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task875_emotion_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task875_emotion_classification" + ] + }, + 
"templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task886_quail_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task886_quail_question_generation.json new file mode 100644 index 000000000..29d94a8fc --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task886_quail_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task886_quail_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task886_quail_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task887_quail_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task887_quail_answer_generation.json new file mode 100644 index 000000000..9df4517fe --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task887_quail_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task887_quail_answer_generation.json", + "field": 
"Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task887_quail_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task888_reviews_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task888_reviews_classification.json new file mode 100644 index 000000000..7ce84c0a8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task888_reviews_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task888_reviews_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task888_reviews_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file 
diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task889_goemotions_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task889_goemotions_classification.json new file mode 100644 index 000000000..32db9471f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task889_goemotions_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task889_goemotions_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task889_goemotions_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task897_freebase_qa_topic_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task897_freebase_qa_topic_question_generation.json new file mode 100644 index 000000000..e66bbda00 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task897_freebase_qa_topic_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task897_freebase_qa_topic_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task897_freebase_qa_topic_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task898_freebase_qa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task898_freebase_qa_answer_generation.json new file mode 100644 index 000000000..3bda01af8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task898_freebase_qa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task898_freebase_qa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task898_freebase_qa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git 
a/src/unitxt/catalog/cards/natural_instructions/train/task899_freebase_qa_topic_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task899_freebase_qa_topic_generation.json new file mode 100644 index 000000000..3b609c142 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task899_freebase_qa_topic_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task899_freebase_qa_topic_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task899_freebase_qa_topic_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task900_freebase_qa_category_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task900_freebase_qa_category_classification.json new file mode 100644 index 000000000..9c7fc0328 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task900_freebase_qa_category_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task900_freebase_qa_category_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": 
"split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task900_freebase_qa_category_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task901_freebase_qa_category_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task901_freebase_qa_category_question_generation.json new file mode 100644 index 000000000..bab71429d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task901_freebase_qa_category_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task901_freebase_qa_category_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task901_freebase_qa_category_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task902_deceptive_opinion_spam_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task902_deceptive_opinion_spam_classification.json new file mode 100644 index 000000000..dfa6f91b5 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task902_deceptive_opinion_spam_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task902_deceptive_opinion_spam_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task902_deceptive_opinion_spam_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task903_deceptive_opinion_spam_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task903_deceptive_opinion_spam_classification.json new file mode 100644 index 000000000..07555fb2e --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task903_deceptive_opinion_spam_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task903_deceptive_opinion_spam_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task903_deceptive_opinion_spam_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task904_hate_speech_offensive_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task904_hate_speech_offensive_classification.json new file mode 100644 index 000000000..a1a835551 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task904_hate_speech_offensive_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task904_hate_speech_offensive_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + 
"items": [ + "instructions.natural_instructions.train.task904_hate_speech_offensive_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task905_hate_speech_offensive_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task905_hate_speech_offensive_classification.json new file mode 100644 index 000000000..849dc10f4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task905_hate_speech_offensive_classification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task905_hate_speech_offensive_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task905_hate_speech_offensive_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task906_dialogre_identify_names.json b/src/unitxt/catalog/cards/natural_instructions/train/task906_dialogre_identify_names.json new file mode 100644 index 000000000..eafe7140d --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task906_dialogre_identify_names.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + 
"type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task906_dialogre_identify_names.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task906_dialogre_identify_names" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task907_dialogre_identify_relationships.json b/src/unitxt/catalog/cards/natural_instructions/train/task907_dialogre_identify_relationships.json new file mode 100644 index 000000000..ec834ab40 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task907_dialogre_identify_relationships.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task907_dialogre_identify_relationships.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task907_dialogre_identify_relationships" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task908_dialogre_identify_familial_relationships.json b/src/unitxt/catalog/cards/natural_instructions/train/task908_dialogre_identify_familial_relationships.json new file mode 100644 index 000000000..1b28b86b8 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task908_dialogre_identify_familial_relationships.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task908_dialogre_identify_familial_relationships.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task908_dialogre_identify_familial_relationships" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task909_dialogre_prevalent_speakers.json b/src/unitxt/catalog/cards/natural_instructions/train/task909_dialogre_prevalent_speakers.json new file mode 100644 index 000000000..72dcd10d0 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task909_dialogre_prevalent_speakers.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + 
"loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task909_dialogre_prevalent_speakers.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task909_dialogre_prevalent_speakers" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task917_coqa_question_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task917_coqa_question_generation.json new file mode 100644 index 000000000..bb871d2ba --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task917_coqa_question_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task917_coqa_question_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task917_coqa_question_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task918_coqa_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task918_coqa_answer_generation.json new file mode 100644 index 000000000..28fc2d81f --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task918_coqa_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task918_coqa_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task918_coqa_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task919_coqa_incorrect_answer_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task919_coqa_incorrect_answer_generation.json new file mode 100644 index 000000000..9e86775cf --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task919_coqa_incorrect_answer_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task919_coqa_incorrect_answer_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task919_coqa_incorrect_answer_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task921_code_x_glue_information_retreival.json b/src/unitxt/catalog/cards/natural_instructions/train/task921_code_x_glue_information_retreival.json new file mode 100644 index 000000000..c6109245b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task921_code_x_glue_information_retreival.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task921_code_x_glue_information_retreival.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task921_code_x_glue_information_retreival" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task922_event2mind_word_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task922_event2mind_word_generation.json new file mode 100644 index 000000000..1b3aab7d2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task922_event2mind_word_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task922_event2mind_word_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task922_event2mind_word_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task923_event2mind_classifier.json b/src/unitxt/catalog/cards/natural_instructions/train/task923_event2mind_classifier.json new file mode 100644 index 000000000..e0e5b24f2 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task923_event2mind_classifier.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task923_event2mind_classifier.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task923_event2mind_classifier" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task924_event2mind_word_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task924_event2mind_word_generation.json new file mode 100644 index 000000000..f640b54e1 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task924_event2mind_word_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task924_event2mind_word_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task924_event2mind_word_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task925_coached_conv_pref_classifier.json b/src/unitxt/catalog/cards/natural_instructions/train/task925_coached_conv_pref_classifier.json new file mode 100644 index 000000000..043c63168 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task925_coached_conv_pref_classifier.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task925_coached_conv_pref_classifier.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task925_coached_conv_pref_classifier" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task926_coached_conv_pref_word_generation.json b/src/unitxt/catalog/cards/natural_instructions/train/task926_coached_conv_pref_word_generation.json new file mode 100644 index 000000000..f3d271167 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task926_coached_conv_pref_word_generation.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task926_coached_conv_pref_word_generation.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task926_coached_conv_pref_word_generation" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task927_yelp_negative_to_positive_style_transfer.json b/src/unitxt/catalog/cards/natural_instructions/train/task927_yelp_negative_to_positive_style_transfer.json new file mode 100644 index 000000000..b45a29d4b --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task927_yelp_negative_to_positive_style_transfer.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task927_yelp_negative_to_positive_style_transfer.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + 
"items": [ + "instructions.natural_instructions.train.task927_yelp_negative_to_positive_style_transfer" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task928_yelp_positive_to_negative_style_transfer.json b/src/unitxt/catalog/cards/natural_instructions/train/task928_yelp_positive_to_negative_style_transfer.json new file mode 100644 index 000000000..c243ce678 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task928_yelp_positive_to_negative_style_transfer.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task928_yelp_positive_to_negative_style_transfer.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task928_yelp_positive_to_negative_style_transfer" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task929_products_reviews_classification.json b/src/unitxt/catalog/cards/natural_instructions/train/task929_products_reviews_classification.json new file mode 100644 index 000000000..186d21e64 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task929_products_reviews_classification.json @@ -0,0 +1,53 
@@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task929_products_reviews_classification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task929_products_reviews_classification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task933_wiki_auto_style_transfer.json b/src/unitxt/catalog/cards/natural_instructions/train/task933_wiki_auto_style_transfer.json new file mode 100644 index 000000000..1395a74b6 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task933_wiki_auto_style_transfer.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task933_wiki_auto_style_transfer.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": 
"instructions_list", + "items": [ + "instructions.natural_instructions.train.task933_wiki_auto_style_transfer" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task934_turk_simplification.json b/src/unitxt/catalog/cards/natural_instructions/train/task934_turk_simplification.json new file mode 100644 index 000000000..2d839df88 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task934_turk_simplification.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task934_turk_simplification.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task934_turk_simplification" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task955_wiki_auto_style_transfer.json b/src/unitxt/catalog/cards/natural_instructions/train/task955_wiki_auto_style_transfer.json new file mode 100644 index 000000000..1e15d1ae4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task955_wiki_auto_style_transfer.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": 
"https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task955_wiki_auto_style_transfer.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task955_wiki_auto_style_transfer" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task956_leetcode_420_strong_password_check.json b/src/unitxt/catalog/cards/natural_instructions/train/task956_leetcode_420_strong_password_check.json new file mode 100644 index 000000000..fccfe4423 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task956_leetcode_420_strong_password_check.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task956_leetcode_420_strong_password_check.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + 
"instructions.natural_instructions.train.task956_leetcode_420_strong_password_check" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task963_librispeech_asr_next_word_prediction.json b/src/unitxt/catalog/cards/natural_instructions/train/task963_librispeech_asr_next_word_prediction.json new file mode 100644 index 000000000..f1703a4be --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task963_librispeech_asr_next_word_prediction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task963_librispeech_asr_next_word_prediction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task963_librispeech_asr_next_word_prediction" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task964_librispeech_asr_text_auto_completion.json b/src/unitxt/catalog/cards/natural_instructions/train/task964_librispeech_asr_text_auto_completion.json new file mode 100644 index 000000000..a48e85382 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task964_librispeech_asr_text_auto_completion.json @@ -0,0 +1,53 @@ +{ + "type": 
"task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task964_librispeech_asr_text_auto_completion.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task964_librispeech_asr_text_auto_completion" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task965_librispeech_asr_missing_word_prediction.json b/src/unitxt/catalog/cards/natural_instructions/train/task965_librispeech_asr_missing_word_prediction.json new file mode 100644 index 000000000..2c6d31ac4 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task965_librispeech_asr_missing_word_prediction.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task965_librispeech_asr_missing_word_prediction.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + 
"metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task965_librispeech_asr_missing_word_prediction" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task966_ruletaker_fact_checking_based_on_given_context.json b/src/unitxt/catalog/cards/natural_instructions/train/task966_ruletaker_fact_checking_based_on_given_context.json new file mode 100644 index 000000000..77f222278 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task966_ruletaker_fact_checking_based_on_given_context.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task966_ruletaker_fact_checking_based_on_given_context.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task966_ruletaker_fact_checking_based_on_given_context" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/cards/natural_instructions/train/task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph.json b/src/unitxt/catalog/cards/natural_instructions/train/task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph.json new file mode 
100644 index 000000000..52f9d6807 --- /dev/null +++ b/src/unitxt/catalog/cards/natural_instructions/train/task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph.json @@ -0,0 +1,53 @@ +{ + "type": "task_card", + "loader": { + "type": "load_hf", + "data_files": "https://raw.githubusercontent.com/allenai/natural-instructions/master/tasks/task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph.json", + "field": "Instances", + "path": "json" + }, + "preprocess_steps": [ + { + "type": "split_random_mix", + "mix": { + "train": "train[90%]", + "validation": "train[5%]", + "test": "train[5%]" + } + }, + { + "type": "copy_fields", + "field_to_field": [ + [ + "output/0", + "target" + ] + ], + "use_query": true + } + ], + "task": { + "type": "form_task", + "inputs": [ + "input" + ], + "outputs": [ + "target" + ], + "metrics": [ + "metrics.rouge" + ] + }, + "instructions": { + "type": "instructions_list", + "items": [ + "instructions.natural_instructions.train.task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph" + ] + }, + "templates": { + "type": "templates_list", + "items": [ + "templates.input_output" + ] + } +} \ No newline at end of file diff --git a/src/unitxt/catalog/formats/input_output_prefix.json b/src/unitxt/catalog/formats/input_output_prefix.json new file mode 100644 index 000000000..06e0d24c4 --- /dev/null +++ b/src/unitxt/catalog/formats/input_output_prefix.json @@ -0,0 +1,5 @@ +{ + "type": "icl_format", + "input_prefix": "input: ", + "output_prefix": "output: " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task001_quoref_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task001_quoref_question_generation.json new file mode 100644 index 000000000..fe4c9dc82 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task001_quoref_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + 
"text": "In this task, you're given passages that contain mentions of names of people, places, or things. Some of these mentions refer to the same person, place, or thing. Your job is to write questions that evaluate one's understanding of such references. Good questions are expected to link pronouns (she, her, him, his, their, etc.) or other mentions to people, places, or things to which they may refer. Do not ask questions that can be answered correctly without understanding the paragraph or having multiple answers. Avoid questions that do not link phrases referring to the same entity. For each of your questions, the answer should be one or more phrases in the paragraph, and it should be unambiguous." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task002_quoref_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task002_quoref_answer_generation.json new file mode 100644 index 000000000..8e18aa63f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task002_quoref_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're expected to write answers to questions involving multiple references to the same entity. The answer to the question should be unambiguous and a phrase in the paragraph. Most questions can have only one correct answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task022_cosmosqa_passage_inappropriate_binary.json b/src/unitxt/catalog/instructions/natural_instructions/train/task022_cosmosqa_passage_inappropriate_binary.json new file mode 100644 index 000000000..6b9936e7b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task022_cosmosqa_passage_inappropriate_binary.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read the given context and if the the context is inappropriate (e.g., pornographic) or nonsensical (e.g., cannot determine what happenings the context is about), indicate via \"yes\". Otherwise, response via \"no\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task023_cosmosqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task023_cosmosqa_question_generation.json new file mode 100644 index 000000000..7825d91a3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task023_cosmosqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Based on the given context, craft a common-sense question, especially those that are LONG, INTERESTING, and COMPLEX. The goal is to write questions that are easy for humans and hard for AI machines! To create such questions, here are some suggestions: A. What may (or may not) be the plausible reason for an event? B. What may (or may not) happen before (or after, or during) an event? C. What may (or may not) be a plausible fact about someone (or something)? D. What may (or may not) happen if an event happens (or did not happen)? You can also create other types of questions. DO NOT make your question answerable without looking at the context, or question of which the correct answer can be directly extracted from the context. 
DO NOT ask a question that requires very specialized knowledge that is not common sense. DO NOT ask too simple or too short questions. Your question must be related to the context and answerable with common sense. Try to add more variations and complexity to the questions." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task024_cosmosqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task024_cosmosqa_answer_generation.json new file mode 100644 index 000000000..3a7a8692e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task024_cosmosqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Craft one correct answer to the question given in input. To make it more interesting, try to use non-stereotypical language if possible. Make sure your correct answer is reasonably long, consistent with the context, and requires common sense (instead of explicit extraction from the context.) In your answer, use as few words as possible from the given context. Use a response that is uncommon/non-stereotypical, so that it is less predictable. To be less repetitive, please vary your language for each question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task025_cosmosqa_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task025_cosmosqa_incorrect_answer_generation.json new file mode 100644 index 000000000..c6189cdff --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task025_cosmosqa_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Craft one incorrect answer. In doing so, try to use words from the context as much as possible, or by using similar words used in the correct answer. 
DO NOT craft nonsensical or off-topic incorrect answers, such that the incorrect answers can be directly excluded without reasoning according to the context. Try to make your responses similar to the given correct answer. To this end, try to keep both the length and the style as similar as possible between the correct and the incorrect answer. To make your incorrect answers more difficult, try to incorporate words from context. To avoid being predictable or repetitive, try to add more variations and complexity." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task026_drop_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task026_drop_question_generation.json new file mode 100644 index 000000000..830eaf522 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task026_drop_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task involves creating questions from a given passage that involve some kind of complex reasoning (including numerical reasoning). \nThe generated questions must require looking at more than one part of the passage to answer. Try to use a variety of reasoning types in your questions (some of the sample reasoning types are illustrated in the 'positive examples' field) and also have a variety of answer types (spans, numbers, dates). A span is a continuous phrase taken directly from the passage or question. In such questions, the answer spans are recommended to be five words. Questions with answer type \"number\", are expected to start with \"How many\". For instance, \"How long did an event last?\" can be phrased as \"How many years did an event last?\". To increase diversity, try to create more questions for which the answer will be multiple spans. Please create questions that require AT LEAST 2 arithmetic operations as illustrated in the 'positive examples' field. 
You are encouraged to try DIFFERENT COMBINATIONS of operations and not just limit to the combinations shown in those examples. The more challenging questions you create, the better it is." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task027_drop_answer_type_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task027_drop_answer_type_generation.json new file mode 100644 index 000000000..5d275dffe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task027_drop_answer_type_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task involves annotating the answer type to a given question that involve some kind of complex reasoning (including numerical reasoning). Note that the questions require looking at more than one part of the passage to answer. There are 3 possible answer types (i) spans, (ii) numbers and (iii) dates. If the answer can be found in the passage, label it as \"span\". If the answer is a number, label as \"number\". Similarly, label \"date\" if you think the answer to the given question is a date." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task028_drop_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task028_drop_answer_generation.json new file mode 100644 index 000000000..aaae5f008 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task028_drop_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task involves creating answers to complex questions, from a given passage. Answering these questions, typically involve understanding multiple sentences. Make sure that your answer has the same type as the \"answer type\" mentioned in input. The provided \"answer type\" can be of any of the following types: \"span\", \"date\", \"number\". 
A \"span\" answer is a continuous phrase taken directly from the passage or question. You can directly copy-paste the text from the passage or the question for span type answers. If you find multiple spans, please add them all as a comma separated list. Please restrict each span to five words. A \"number\" type answer can include a digit specifying an actual value. For \"date\" type answers, use DD MM YYYY format e.g. 11 Jan 1992. If full date is not available in the passage you can write partial date such as 1992 or Jan 1992. If you find multiple spans, please add them all as a comma separated list. Please restrict each span to five words." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task043_essential_terms_answering_incomplete_questions.json b/src/unitxt/catalog/instructions/natural_instructions/train/task043_essential_terms_answering_incomplete_questions.json new file mode 100644 index 000000000..2151400bb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task043_essential_terms_answering_incomplete_questions.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to answer basic science questions. For each question, several terms are intentionally masked with ***. This masking can cover very few or many of the question words. Clearly, if masked terms are important, the modified question will be impossible to answer. Please indicate the correct answer with one of the following responses: \"A\", \"B\", \"C\", \"D\" or \"E\". While \"A\"-\"D\" correspond to the answer options provided in the input, \"E\" represents \"I don't know\" for questions that do not provide enough information. Respond via \"E\" if the question is not answerable. Do not generate anything else apart from one of the following characters: 'A', 'B, 'C', 'D', 'E'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task044_essential_terms_identifying_essential_words.json b/src/unitxt/catalog/instructions/natural_instructions/train/task044_essential_terms_identifying_essential_words.json new file mode 100644 index 000000000..b520e11d5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task044_essential_terms_identifying_essential_words.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an elementary science question along with a few answer options. List all the words from the question that are essential and sufficient for choosing the correct answer option. Keep in mind that essential words are necessary to understand the meaning of the given question. However, non-essential words provide little information needed to select the correct answer. You can think about it like this: If the question was in another language, knowing the meaning of which words were necessary and enough for you to understand the question and answer it?. If your answer consists of multiple spans of words from the question, separate those using a comma (\", \"). Do not generate any word that is not present in the question. Make sure that your response is contained in the given question and the words are in the same order as the question.\n Grammatical correctness is not important." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task045_miscellaneous_sentence_paraphrasing.json b/src/unitxt/catalog/instructions/natural_instructions/train/task045_miscellaneous_sentence_paraphrasing.json new file mode 100644 index 000000000..1111d8057 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task045_miscellaneous_sentence_paraphrasing.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question, its answer, and a sentence that supports the question, i.e., the answer to the question is inferable from the sentence. In this task, you need to paraphrase the given sentence so that the paraphrased sentence still supports the question i.e. you can still infer the answer to the question from the paraphrased sentence. Do not write a paraphrase with a minor change in the given sentence e.g. replacing the word \"one\" with \"a\". Instead, try to write a paraphrase that contains new words, i.e. the words that are not present in the input sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task046_miscellaneous_question_typing.json b/src/unitxt/catalog/instructions/natural_instructions/train/task046_miscellaneous_question_typing.json new file mode 100644 index 000000000..03db9daf0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task046_miscellaneous_question_typing.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question-answer pair. Answer with their type. Pay attention that there may be more than one correct type, but you only have to choose one. 
In your responses, use of the following types: \n(1) Humans: Any individual or group of humans, including fictional ones (e.g., a group or organization of persons , an individual, title of a person, description of a person); \n(2) Event: Any phenomenon natural or artificial (e.g., named hurricanes, Battles, Wars, Sports events, Terrorist attacks); \n(3) Entity: A thing with distinct and independent existence (Animals, Organs of body, Colors, Inventions, books and other creative pieces, Currency name, Diseases, and medicine, Food, Musical instrument, Languages, Plants, Products, Religions, Sports, Elements and substances, Symbols and signs, Techniques and methods, Equivalent terms, Vehicles); \n(4) Facility: Something built for a particular purpose (Buildings, Airports, Highways, Bridges); \n(5) Location: A place (Cities, Countries, Mountains, States); \n(6) Law: Named documents made into laws (e.g., \u201cthe first amendment\u201d, \"civil rights act\"); \n(7) Organization: an organized body of people with a particular purpose (Company names, e.g. Google, Cults or terrorist groups, e.g. Al Qaeda); \n(8) Date: Absolute or relative dates or periods, bigger than 1 day (Years, Range, e.g. from Monday to Tuesday, or during the 20th century, Approximate time); \n(9) Time: Any temporal range/unit that is shorter than a day (e.g., 2 o'clock, 1 pm); \n(10) Money: Monetary values, including unit (e.g., \"$26\", \"914$\"); \n(11) Quantity: postcodes or other codes, the number of sth, Ranks, fractions, speed, temperature, size, area, and volume, weight (e.g., \"26 degree\" \"17 inch\"); \n(12) Description: description and abstract concepts (e.g., the definition of something, the manner of an action, reasons); \n(13) Abbreviation: expression abbreviated (e.g., AMT = abbreviation of Amazon Mechanical Turk). 
Don't generate any word that is not mentioned in the list of types (Humans, Event, Entity, Facility, Location, Law, Organization, Date, Time, Money, Quantity, Description, Abbreviation). If you can not associate any of the given types with the provided question and answer pair, respond \"Other\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task047_miscellaneous_answering_science_questions.json b/src/unitxt/catalog/instructions/natural_instructions/train/task047_miscellaneous_answering_science_questions.json new file mode 100644 index 000000000..b0e3974c9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task047_miscellaneous_answering_science_questions.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this subtask, you will answer a simple science question. Please indicate the correct answer. If you're not sure about the answer, choose the last option \"I don't know\". Do not generate anything else apart from one of the following characters: 'A', 'B, 'C', 'D', 'E'. The \"A\"-\"D\" responses correspond to the answer options mentioned in the input. There is a 5th option \"E\" which should be used for questions for which you're not sure about the answer (e.g., when the questions do not provide enough information to answer)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task059_ropes_story_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task059_ropes_story_generation.json new file mode 100644 index 000000000..6909fceca --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task059_ropes_story_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": " You are given a background paragraph that describes one or more causal or physical relationships, such as a relationship in economics, scientific law, or nature. 
You need to come up with a fictional story that makes use of the concepts or the relationship described in the provided paragraph. Make sure that your story does not repeat the relation in the given paragraph (e.g., by avoiding verbatim copies of the given paragraph). Start by reading the background paragraph, and determine what relationship(s) are in the paragraph. Write a story that involves the relationship(s) that you determined are in the background paragraph. Try to use your own words as much as possible and not repeat the background paragraph. Feel free to make up places and events as long as they tie back to the background paragraph in a way that you can ask a question about." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task060_ropes_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task060_ropes_question_generation.json new file mode 100644 index 000000000..2c9b724de --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task060_ropes_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a background paragraph that describes one or more causal or qualitative relationships such as a relationship in economics or a scientific law and a story that makes use of the concepts or the relationship described in the provided paragraph. You need to come up with a question about the story that requires an understanding of the relationship described in the background paragraph. The generated question should not be answerable without both the background and story. Write a question about the story that requires a relationship in the background paragraph to answer. Check whether your question requires both the background paragraph and the story to answer. If your question can be answered by only one of these, try to rewrite your question so that it requires both. 
Note that \"flipping\" a word in the question can give rise to a new question where the answer will be different from the original question. Often, \"flipping\" a word gives rise to flipping the direction of the relationship, for example, from \"increase\" to \"decrease.\"" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task061_ropes_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task061_ropes_answer_generation.json new file mode 100644 index 000000000..f6d25c7c2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task061_ropes_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a background paragraph that describes one or more causal or qualitative relationships such as a relationship in economics or a scientific law and a story that makes use of the concepts or the relationship described in the provided paragraph. You are also given a question about the story that requires an understanding of the relationship described in the background paragraph and the story. You need to come up with an answer to the given question; the answer will be a span from either the question or the story. In order to correctly answer the given question, you need to understand the relationship mentioned in the background paragraph and should be able to use it to understand that in the story. Your answer can not consist of any word that is not mentioned in any of these: the background paragraph, the story, or the question. You can directly copy and paste a span from the story or the question while answering the given question." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task062_bigbench_repeat_copy_logic.json b/src/unitxt/catalog/instructions/natural_instructions/train/task062_bigbench_repeat_copy_logic.json new file mode 100644 index 000000000..4022b2d9e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task062_bigbench_repeat_copy_logic.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task evaluates for the ability to follow basic natural language instructions nested and performing a sequence of operations, including basic logic and conditionals." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task063_first_i_elements.json b/src/unitxt/catalog/instructions/natural_instructions/train/task063_first_i_elements.json new file mode 100644 index 000000000..25231a20f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task063_first_i_elements.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i and A, where i is an integer and A is a list. You need to output the first i elements of A, starting with the 1st element in A. i will always have a value less than the length of A" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task064_all_elements_except_first_i.json b/src/unitxt/catalog/instructions/natural_instructions/train/task064_all_elements_except_first_i.json new file mode 100644 index 000000000..bdc2286ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task064_all_elements_except_first_i.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i and A, where i is an integer and A is a list. You need to list all the elements of A after the first i elements. i will always have a value less than the length of A." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task065_timetravel_consistent_sentence_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task065_timetravel_consistent_sentence_classification.json new file mode 100644 index 000000000..fbc02422e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task065_timetravel_consistent_sentence_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a short story consisting of exactly 5 sentences where the second sentence is missing. You are given two options and you need to select the one that best connects the first sentence with the rest of the story. Indicate your answer by 'Option 1' if the first option is correct, otherwise 'Option 2'. The incorrect option will change the subsequent storyline, so that at least one of the three subsequent sentences is no longer consistent with the story." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task066_timetravel_binary_consistency_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task066_timetravel_binary_consistency_classification.json new file mode 100644 index 000000000..452ea48fe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task066_timetravel_binary_consistency_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a short story consisting of exactly 5 sentences where the second sentence is missing. You are given a candidate for the second sentence and you need to identify if the given sentence connects the first sentence with the rest of the story. Indicate your answer by \"Yes\" if it connects, otherwise \"No\". Do not generate anything else apart from \"Yes\" or \"No\". 
The given sentence is incorrect if it changes the subsequent storyline, so that at least one of the three subsequent sentences is no longer consistent with the story." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task067_abductivenli_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task067_abductivenli_answer_generation.json new file mode 100644 index 000000000..4d1fc01e9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task067_abductivenli_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given the beginning and the ending of a three-part story. Your job is to complete the short story by writing a middle sentence that seamlessly connects the first and last sentence. Generated sentences must be short, have fewer than 10 words, and be simple as if narrating to a child. Avoid using any irrelevant extra information when creating the middle sentence, and use names (e.g. Jack, Barbara,...) instead of pronouns (e.g. he / she) wherever possible." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task068_abductivenli_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task068_abductivenli_incorrect_answer_generation.json new file mode 100644 index 000000000..91cff7fe9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task068_abductivenli_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're shown a three-part story, with a beginning, middle, and ending. Your job is to slightly modify the middle part, so that the whole story becomes unlikely, improbable, or inconsistent. Generated sentences must minimally alter the given middle, with at most 4 new words added/existing words removed.
Your sentence should be grammatically and syntactically correct. Also stick to the context of the given story. For example, if the story talks about \"doctors\", you can talk about \"health\" or \"diagnosis\", but don't mention \"aliens\". Avoid introducing any extra/irrelevant information, and use names instead of pronouns (e.g. he / she) wherever possible. Avoid simply negating the original middle, for example: \"She likes cakes.\" is changed to \"She doesn't like cakes.\"" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task069_abductivenli_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task069_abductivenli_classification.json new file mode 100644 index 000000000..6247bc576 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task069_abductivenli_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a short story with a beginning, two potential middles, and an ending. Your job is to choose the middle statement that makes the story coherent / plausible by writing \"1\" or \"2\" in the output. If both sentences are plausible, pick the one that makes most sense." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task070_abductivenli_incorrect_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task070_abductivenli_incorrect_classification.json new file mode 100644 index 000000000..3d93dcfb2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task070_abductivenli_incorrect_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a short story with a beginning, two potential middles, and an ending. Your job is to choose the middle statement that makes the story incoherent / implausible by indicating 1 or 2 in the output. 
If both sentences are plausible, pick the one that makes less sense." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task071_abductivenli_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task071_abductivenli_answer_generation.json new file mode 100644 index 000000000..dd8e2b177 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task071_abductivenli_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given the beginning and the middle of a three-part story. Your job is to complete the short story by writing a probable ending. Generated sentences must be short, have fewer than 10 words, and be simple as if narrating to a child. Avoid using any irrelevant extra information when creating the ending, and use names instead of pronouns (e.g. he / she) wherever possible." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task072_abductivenli_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task072_abductivenli_answer_generation.json new file mode 100644 index 000000000..2b63642df --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task072_abductivenli_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given the middle and ending of a three-part story. Your job is to complete the short story by writing a probable beginning of the story. Generated sentences must be short, have fewer than 10 words, and be simple as if narrating to a child. Avoid using any irrelevant extra information when creating the beginning, and use names (e.g. Jack, Barbara,...) instead of pronouns (e.g. he / she) wherever possible." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task073_commonsenseqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task073_commonsenseqa_answer_generation.json new file mode 100644 index 000000000..6ca6f8e2a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task073_commonsenseqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question and some answer options (associated with \"A\", \"B\", \"C\", \"D\"). You should choose the correct answer based on commonsense knowledge. Avoid answering questions based on associations, the set of answers are chosen deliberately to capture common sense beyond associations. Do not generate anything else apart from one of the following characters: 'A', 'B', 'C', 'D', 'E' and only give one answer for each question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task074_squad1/1_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task074_squad1/1_question_generation.json new file mode 100644 index 000000000..0fad2f411 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task074_squad1/1_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task is about reading the given passage and constructing a question about the information present in the passage. Construct a question in such a way that (i) it is unambiguous, (ii) it is answerable from the passage, (iii) its answer is unique, (iv) its answer is a continuous text span from the paragraph. Avoid creating questions that (i) can be answered correctly without actually understanding the paragraph and (ii) uses same words or phrases given in the passage."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task075_squad1/1_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task075_squad1/1_answer_generation.json new file mode 100644 index 000000000..538982c05 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task075_squad1/1_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task is about writing a correct answer for the reading comprehension task. Based on the information provided in a given passage, you should identify the shortest continuous text span from the passage that serves as an answer to the given question. Avoid answers that are incorrect or provides incomplete justification for the question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task076_splash_correcting_sql_mistake.json b/src/unitxt/catalog/instructions/natural_instructions/train/task076_splash_correcting_sql_mistake.json new file mode 100644 index 000000000..3edcae7a7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task076_splash_correcting_sql_mistake.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are expected to fix an SQL query based on feedback. You will be given an SQL statement and an English description with what is wrong about that SQL statement. You must correct the SQL statement based off of the feedback. An SQL query works by selecting data from a table where certain conditions apply. A table contains columns where every row in that table must have a value for each column. Every table has a primary key that uniquely identifies each row, usually an id. To choose which columns are returned you specify that after the \"SELECT\" statement. Next, you use a \"FROM\" statement to specify what tables you want to select the data from. 
When you specify a table you can rename it with the \"AS\" statement. You can reference that table by whatever name follows the \"AS\" statement. If you want to select data from multiple tables you need to use the \"JOIN\" statement. This will join the tables together by pairing a row in one table with every row in the other table (Cartesian Product). To limit the number of rows returned you should use the \"ON\" statement. This will only return rows where the condition specified after the statement is true, this is usually an equals operator with primary keys. You can also use the \"WHERE\" statement to specify that only rows with column values statisfying a certain condition, should be returned. The \"GROUP BY\" statement will group rows together that have equal column values for whatever columns follows the statement. The \"HAVING\" statement will return groups that statisfy whatever condition follows the statement. Any column(s) being returned from grouped rows must either be an aggregate function, (AVG, MAX, COUNT, SUM, ...) of a column, or the column(s) that the data was grouped by. To sort the returned data you can use the \"ORDER BY\" command which will order the data by whatever aggregate function or column follows the statement. The \"DESC\" statement will sort in descending order and the \"ASC\" statement will sort in ascending order. Finally, you can use the \"LIMIT\" statement to return a certain number of rows. When \"*\" is used in an SQL statement every column is returned. For example, SELECT * FROM table WHERE attribute = 1, will select every column from rows with the attribute column equal to 1. 
" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task077_splash_explanation_to_sql.json b/src/unitxt/catalog/instructions/natural_instructions/train/task077_splash_explanation_to_sql.json new file mode 100644 index 000000000..bb609f0e1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task077_splash_explanation_to_sql.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are expected to provide an SQL statement from an english description of what that SQL statement does. The description may include multiple steps but you should only ouput one SQL statement that accomplishes every step. An SQL query works by selecting data from a table where certain conditions apply. A table contains columns where every row in that table must have a value for each column. Every table has a primary key that uniquely identifies each row, usually an id. To choose which columns are returned you specify that after the \"SELECT\" statement. Next, you use a \"FROM\" statement to specify what tables you want to select the data from. When you specify a table you can rename it with the \"AS\" statement. You can reference that table by whatever name follows the \"AS\" statement. If you want to select data from multiple tables you need to use the \"JOIN\" statement. This will join the tables together by pairing a row in one table with every row in the other table (Cartesian Product). To limit the number of rows returned you should use the \"ON\" statement. This will only return rows where the condition specified after the statement is true, this is usually an equals operator with primary keys. You can also use the \"WHERE\" statement to specify that only rows with column values statisfying a certain condition, should be returned. The \"GROUP BY\" statement will group rows together that have equal column values for whatever columns follows the statement. 
The \"HAVING\" statement will return groups that statisfy whatever condition follows the statement. Any column(s) being returned from grouped rows must either be an aggregate function, (AVG, MAX, COUNT, SUM, ...) of a column, or the column(s) that the data was grouped by. To sort the returned data you can use the \"ORDER BY\" command which will order the data by whatever aggregate function or column follows the statement. The \"DESC\" statement will sort in descending order and the \"ASC\" statement will sort in ascending order. Finally, you can use the \"LIMIT\" statement to return a certain number of rows. When \"*\" is used in an SQL statement every column is returned. For example, SELECT * FROM table WHERE attribute = 1, will select every column from rows with the attribute column equal to 1." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task078_all_elements_except_last_i.json b/src/unitxt/catalog/instructions/natural_instructions/train/task078_all_elements_except_last_i.json new file mode 100644 index 000000000..47e63320a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task078_all_elements_except_last_i.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i and A, where i is an integer and A is a list. You need to list all the elements of A preceding the last i elements. i will always have a value less than the length of A." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task079_conala_concat_strings.json b/src/unitxt/catalog/instructions/natural_instructions/train/task079_conala_concat_strings.json new file mode 100644 index 000000000..3f9e5d4e3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task079_conala_concat_strings.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of strings and you need to concatenate them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task080_piqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task080_piqa_answer_generation.json new file mode 100644 index 000000000..edc4843f7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task080_piqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task the focus is on physical knowledge about the world. Given the provided goal task in the input, describe a process that would lead to the asked outcome. This process often involves physical motions with objects, such as moving them, arranging them in a certain way, mixing them, shaking them, etc. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task081_piqa_wrong_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task081_piqa_wrong_answer_generation.json new file mode 100644 index 000000000..82672f2ab --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task081_piqa_wrong_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be asked how to do a certain task. 
You should describe a physical process that does not lead to the asked outcome, yet it is closely related to it (i.e., it should use the words that are provided in the input). The physical process can be moving something, arranging something in a certain way, mixing things, shaking them, etc. To make sure that the generated process does not lead to the asked outcome, you can introduce objects or events unrelated to the context of the question e.g. 'cleaning the keyboard by making an elephant sit on them'; or you can create contradictory statements e.g. 'drying wet keyboards with running water'. In your responses, avoid typos and misspellings." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task082_babi_t1_single_supporting_fact_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task082_babi_t1_single_supporting_fact_question_generation.json new file mode 100644 index 000000000..c24152cd8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task082_babi_t1_single_supporting_fact_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a passage consisting of set of facts. The task is to create a question of form 'Where is ?' that is answerable from exactly one of the given facts. Avoid creating questions that are unanswerable from all of the facts." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task083_babi_t1_single_supporting_fact_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task083_babi_t1_single_supporting_fact_answer_generation.json new file mode 100644 index 000000000..e43e860e4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task083_babi_t1_single_supporting_fact_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a passage consisting of set of facts and a question as input. The task is to answer a question of form 'Where is ?' using one of the given facts to determine the latest location of the person. Answer should be a word/phrase describing the location from the supporting fact. Avoid answers that are incomplete or incorrect." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task084_babi_t1_single_supporting_fact_identify_relevant_fact.json b/src/unitxt/catalog/instructions/natural_instructions/train/task084_babi_t1_single_supporting_fact_identify_relevant_fact.json new file mode 100644 index 000000000..1ba13af54 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task084_babi_t1_single_supporting_fact_identify_relevant_fact.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a passage with an enumerated set of facts, a question of form 'Where is ?', and its answer. The task is to identify a supporting fact that is necessary to answer the question. The output would be the corresponding fact number." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task085_unnatural_addsub_arithmetic.json b/src/unitxt/catalog/instructions/natural_instructions/train/task085_unnatural_addsub_arithmetic.json new file mode 100644 index 000000000..2b23d2243 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task085_unnatural_addsub_arithmetic.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given an arithmetic operation and you have to find its answer. The symbols of operators '+' and '-' have been swapped, i.e., you need to perform subtraction when you see a '+' symbol and addition in case of a '-' symbol." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task087_new_operator_addsub_arithmetic.json b/src/unitxt/catalog/instructions/natural_instructions/train/task087_new_operator_addsub_arithmetic.json new file mode 100644 index 000000000..49da8f776 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task087_new_operator_addsub_arithmetic.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given an arithmetic operation and you have to find its answer. The operators '+' and '-' have been replaced with new symbols. Specifically, '+' has been replaced with the symbol '@' and '-' with the symbol '#'.
You need to perform the operations in the given equation and return the answer" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task088_identify_typo_verification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task088_identify_typo_verification.json new file mode 100644 index 000000000..128a72e70 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task088_identify_typo_verification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The given sentence contains a typo which could be one of the following four types: (1) swapped letters of a word e.g. 'niec' is a typo of the word 'nice'. (2) missing letter in a word e.g. 'nic' is a typo of the word 'nice'. (3) extra letter in a word e.g. 'nicce' is a typo of the word 'nice'. (4) replaced letter in a word e.g. 'nicr' is a typo of the word 'nice'. You need to identify the typo in the given sentence. To do this, answer with the word containing the typo." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task089_swap_words_verification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task089_swap_words_verification.json new file mode 100644 index 000000000..83f0b95a4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task089_swap_words_verification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, positions of two consecutive words have been swapped. You need to output the position of the swapped words. e.g. in the sentence 'Seattle has nice a weather', the word 'a' and 'nice' have been swapped. These words are at 3rd and 4th position respectively. So, the output should be (3, 4). Note that the index of first word is 1."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task090_equation_learner_algebra.json b/src/unitxt/catalog/instructions/natural_instructions/train/task090_equation_learner_algebra.json new file mode 100644 index 000000000..f8c18612a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task090_equation_learner_algebra.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "A polynomial equation is a sum of terms. Here each term is either a constant number, or consists of the variable x raised to a certain power and multiplied by a number. These numbers are called weights. For example, in the polynomial: 2x^2+3x+4, the weights are: 2,3,4. You can present a polynomial with the list of its weights, for example, equation weights = [6, 4] represent the equation 6x + 4 and equation weights = [1, 3, 4] represent the equation 1x^2 + 3x + 4. In this task, you need to compute the result of a polynomial expression by substituting a given value of x in the given polynomial equation. Equation weights are given as a list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task091_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/instructions/natural_instructions/train/task091_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..30b921cd2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task091_all_elements_from_index_i_to_j.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i,j, and A, where i and j are integers and A is a list. You need to list all elements of A from the ith element to the jth element. i and j will be non-negative, and will always have a value less than the length of A. i will always be less than j."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task092_check_prime_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task092_check_prime_classification.json new file mode 100644 index 000000000..5984063b2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task092_check_prime_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to output 'Yes' if the given number is a prime number otherwise output 'No'. A 'prime number' is a whole number above 1 that can not be made by multiplying other whole numbers." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task093_conala_normalize_lists.json b/src/unitxt/catalog/instructions/natural_instructions/train/task093_conala_normalize_lists.json new file mode 100644 index 000000000..acba462bd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task093_conala_normalize_lists.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a list of numbers. The goal is to divide all the numbers in the list by a constant such that the sum of the resulting list is 1. The output should be rounded to 3 decimals." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task094_conala_calculate_mean.json b/src/unitxt/catalog/instructions/natural_instructions/train/task094_conala_calculate_mean.json new file mode 100644 index 000000000..6ed9b5fb6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task094_conala_calculate_mean.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of numbers and you need to find the mean (average) of that list.
The mean of a list can be found by summing every number in the list then dividing the result by the size of that list. The output should be rounded to 3 decimal places." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task095_conala_max_absolute_value.json b/src/unitxt/catalog/instructions/natural_instructions/train/task095_conala_max_absolute_value.json new file mode 100644 index 000000000..3ca3bca57 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task095_conala_max_absolute_value.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In mathematics, the absolute value of a number is the non-negative value of that number, without regarding its sign. For example, the absolute value of -2 is 2, and the absolute value of 5 is 5. In this task you will be given a list of numbers and you need to return the element with highest absolute value. If a negative and positive element have the same absolute value you should return the positive element. The absolute value for negative numbers can be found by multiplying them by -1. After finding the element with the maximum absolute value you should return the value of that element before you applied the absolute value." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task096_conala_list_index_subtraction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task096_conala_list_index_subtraction.json new file mode 100644 index 000000000..88d018c37 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task096_conala_list_index_subtraction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of numbers and you need to subtract every value in the list with the index it is at. 
The index of an elements shows its numerical order in the list(for example, in the list [7,10,4,5], the index of 7 is 1 and the index of 4 is 3) You should start the index at 1, so the first element in the list will be subtracted by one. For every element in the list you need to find \"element - index\" where the index of the beginning element is 1 and increments by 1 for each element. Put your result list in brackets." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task097_conala_remove_duplicates.json b/src/unitxt/catalog/instructions/natural_instructions/train/task097_conala_remove_duplicates.json new file mode 100644 index 000000000..b2515ea10 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task097_conala_remove_duplicates.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of numbers and you should remove all duplicates in the list. If every number is repeated in the list an empty list should be returned. Your list should be numbers inside brackets, just like the given list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task098_conala_list_intersection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task098_conala_list_intersection.json new file mode 100644 index 000000000..feb954786 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task098_conala_list_intersection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given two lists of numbers and you need to calculate the intersection between these two lists. The intersection between two lists is another list where every element is common between the two original lists. If there are no elements in the intersection, answer with an empty list. Your list of numbers must be inside brackets. 
Sort the numbers in your answer in an ascending order, that is, no matter what the order of the numbers in the lists is, you should put them in your answer in an ascending order." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task099_reverse_elements_between_index_i_and_j.json b/src/unitxt/catalog/instructions/natural_instructions/train/task099_reverse_elements_between_index_i_and_j.json new file mode 100644 index 000000000..4afdc9d23 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task099_reverse_elements_between_index_i_and_j.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i,j, and A, where i and j are integers and A is a list. You need to list all elements of A from the ith element to the jth element in the reverse order. i and j will be non-negative, and will always have a value less than the length of A. i will always be less than j." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task100_concatenate_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/instructions/natural_instructions/train/task100_concatenate_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..4fbcc75f0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task100_concatenate_all_elements_from_index_i_to_j.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i,j, and A, where i and j are integers and A is a list. You need to concatenate all elements of A from the ith element to the jth element, and print the resultant string. i and j will be non-negative, and will always have a value less than the length of A. i will always be less than j." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task101_reverse_and_concatenate_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/instructions/natural_instructions/train/task101_reverse_and_concatenate_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..e541e9b16 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task101_reverse_and_concatenate_all_elements_from_index_i_to_j.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i, j, and A, where i and j are integers and A is a list. You need to find all elements of A from the ith element to the jth element, reverse the order in which they occur, and then concatenate them to output the resultant string. i and j will be non-negative, and will always have a value less than the length of A. i will always be less than j. Perform the operations in order, i.e., do not concatenate the elements and then reverse the string." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task103_facts2story_long_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task103_facts2story_long_text_generation.json new file mode 100644 index 000000000..96b9bca50 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task103_facts2story_long_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, five ordered key facts are given. All the given facts are expressed in natural language. Your job is to generate a story 100 to 1000 words long, that includes all the facts given as input in their order of appearance while expanding upon them to produce a broader, yet coherent, narrative." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation.json new file mode 100644 index 000000000..e7a522e0e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task104_semeval_2019_task10_closed_vocabulary_mathematical_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a mathematical question described with a circumscribed mathematical vocabulary. Questions in this task usually contain some variables (e.g. X, Y), equations (e.g. X+Y=3) and some relationships (X is greater than Y). Often you need to find the value of the variable using equations and relationships. You are also given 4 or 5 answer options (associated with \"A\", \"B\", \"C\", \"D\", \"E\"). Do not generate anything else apart from one of the following characters: 'A', 'B, 'C', 'D', 'E'. LaTeX mathematical format (the standard way to express mathematical expressions in the typesetting software known as LaTeX) is used to express equations. Each question is solvable with high school math knowledge. Give only one answer for each question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task105_story_cloze_rocstories_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task105_story_cloze_rocstories_sentence_generation.json new file mode 100644 index 000000000..b97bdbf29 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task105_story_cloze_rocstories_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a four sentences of story written in natural language. 
Your job is to complete end part of the story by predicting appropriate last sentence which is coherent with the given sentences." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task107_splash_question_to_sql.json b/src/unitxt/catalog/instructions/natural_instructions/train/task107_splash_question_to_sql.json new file mode 100644 index 000000000..c69009044 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task107_splash_question_to_sql.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are expected to write an SQL query that will return the data asked for in the question. An SQL query works by selecting data from a table where certain conditions apply. A table contains columns where every row in that table must have a value for each column. Every table has a primary key that uniquely identifies each row, usually an id. To choose which columns are returned you specify that after the \"SELECT\" statement. Next, you use a \"FROM\" statement to specify what tables you want to select the data from. When you specify a table you can rename it with the \"AS\" statement. You can reference that table by whatever name follows the \"AS\" statement. If you want to select data from multiple tables you need to use the \"JOIN\" statement. This will join the tables together by pairing a row in one table with every row in the other table (Cartesian Product). To limit the number of rows returned you should use the \"ON\" statement. This will only return rows where the condition specified after the statement is true, this is usually an equals operator with primary keys. You can also use the \"WHERE\" statement to specify that only rows with column values statisfying a certain condition, should be returned. The \"GROUP BY\" statement will group rows together that have equal column values for whatever columns follows the statement. 
The \"HAVING\" statement will return groups that statisfy whatever condition follows the statement. Any column(s) being returned from grouped rows must either be an aggregate function, (AVG, MAX, COUNT, SUM, ...) of a column, or the column(s) that the data was grouped by. To sort the returned data you can use the \"ORDER BY\" command which will order the data by whatever aggregate function or column follows the statement. The \"DESC\" statement will sort in descending order and the \"ASC\" statement will sort in ascending order. Finally, you can use the \"LIMIT\" statement to return a certain number of rows. When \"*\" is used in an SQL statement every column is returned. For example, SELECT * FROM table WHERE attribute = 1, will select every column from rows with the attribute column equal to 1." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1087_two_number_sum.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1087_two_number_sum.json new file mode 100644 index 000000000..32e0de623 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1087_two_number_sum.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a list of integers and an integer target, return a list of a pair of numbers in any order such that they add up to target. If there is no such pair of numbers, then return an empty list" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1088_array_of_products.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1088_array_of_products.json new file mode 100644 index 000000000..79fb846ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1088_array_of_products.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a list of integers. A list is shown by comma-separated numbers between two brackets. 
For example, [7,3,6] is a list. The number in location one is 7, the number in location two is 3, and the number in location three is 6. You should answer with a list such that every element at each location is equal to the product of elements at every other location in the input array. For example, if a list has four numbers, the answer you give should be created like this: First element of your list = product of second, third, and fourth elements in the given list. Second element of your list = product of First, third and fourth elements in the given list, etc." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1089_check_monotonic_array.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1089_check_monotonic_array.json new file mode 100644 index 000000000..dbadf618e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1089_check_monotonic_array.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an array of integers, check if it is monotonic or not. If the array is monotonic, then return 1, else return 2. An array is monotonic if it is either monotonically increasing or monotonocally decreasing. An array is monotonically increasing/decreasing if its elements increase/decrease as we move from left to right" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task108_contextualabusedetection_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task108_contextualabusedetection_classification.json new file mode 100644 index 000000000..d17bc8cee --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task108_contextualabusedetection_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read the given text and if it has abusive content then indicate via \"yes\". Otherwise indicate via\"no\". 
\nWe consider the content to be abusive if it contains any of the following instances: (1) Identity Directed Abuse (e.g., Content which contains a negative statement made against an identity. An identity is a social category that relates to a fundamental aspect of individuals community, socio-demographics, position or self-representation) (2) Affiliation Directed Abuse (e.g., Content which express negativity against an affiliation. We define affiliation as a (more or less) voluntary association with a collective. Affiliations include but are not limited to: memberships (e.g. Trade unions), party memberships (e.g. Republicans), political affiliations (e.g. Right-wing people) and occupations (e.g. Doctors).) (3) Person Directed Abuse (e.g., Content which directs negativity against an identifiable person, who is either part of the conversation thread or is named. Person-directed abuse includes serious character based attacks, such as accusing the person of lying, as well as aggression, insults and menacing language.) and (4) Counter Speech (e.g., Content which challenges, condemns or calls out the abusive language of others.). Note that URLs in the text have been replaced with [Link]." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task109_smsspamcollection_spamsmsdetection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task109_smsspamcollection_spamsmsdetection.json new file mode 100644 index 000000000..c21ad8043 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task109_smsspamcollection_spamsmsdetection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given text messages in natural language. Your task is to classify those text messages based on their content into two classes: (1) Spam and (2) Ham messages. 
If the content of the given message is irrelevant to the receiver or is equally relevant to many other potential recipients then it must be labeled as \u2018spam\u2019, otherwise, it should be labeled as \u2018ham\u2019." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task110_logic2text_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task110_logic2text_sentence_generation.json new file mode 100644 index 000000000..db1891ad6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task110_logic2text_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given commands (in terms of logical operations) to select relevant rows from the given table. Your job is to generate a natural language interpretation of the given command. \n Here are the definitions of logical operators: \n 1. count: returns the number of rows in the view \n 2. only: returns whether there is exactly one row in the view \n 3. hop: returns the value under the header column of the row \n 4. and: returns the boolean operation result of two arguments \n 5. max/min/avg/sum: returns the max/min/average/sum of the values under the header column \n 6. nth max/nth min: returns the n-th max/n-th min of the values under the header column \n 7. argmax/argmin: returns the row with the max/min value in header column \n 8. nth argmax/nth argmin: returns the row with the n-th max/min value in header column \n 9. eq/not eq: returns if the two arguments are equal \n 10. round eq: returns if the two arguments are roughly equal under certain tolerance \n 11. greater/less: returns if argument 1 is greater/less than argument 2 \n 12. diff: returns the difference between two arguments \n 13. filter eq/not eq: returns the subview whose values under the header column is equal/not equal to argument 3 \n 14. 
filter greater/less: returns the subview whose values under the header column is greater/less than argument 3 \n 15. filter greater eq /less eq: returns the subview whose values under the header column is greater/less or equal than argument 3 \n 16. filter all: returns the view itself for the case of describing the whole table \n 17. all eq/not eq: returns whether all the values under the header column are equal/not equal to argument 3 \n 18. all greater/less: returns whether all the values under the header column are greater/less than argument 3 \n 19. all greater eq/less eq: returns whether all the values under the header column are greater/less or equal to argument 3 \n 20. most eq/not eq: returns whether most of the values under the header column are equal/not equal to argument 3 \n 21. most greater/less: returns whether most of the values under the header column are greater/less than argument 3 \n 22. most greater eq/less eq: returns whether most of the values under the header column are greater/less or equal to argument 3" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task111_asset_sentence_simplification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task111_asset_sentence_simplification.json new file mode 100644 index 000000000..e45e340aa --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task111_asset_sentence_simplification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Rewrite each original sentence in order to make it easier to understand by non-native speakers of English. You can do so by replacing complex words with simpler synonyms (i.e. paraphrasing), deleting unimportant information (i.e. compression), and/or splitting a long complex sentence into several simpler ones. The final simplified sentences need to be grammatical, fluent, and retain the main ideas of their original counterparts without altering their meanings." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task112_asset_simple_sentence_identification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task112_asset_simple_sentence_identification.json new file mode 100644 index 000000000..7e3f7627a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task112_asset_simple_sentence_identification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given two pieces of text with the same meaning. One of them is simpler and easier to understand for non-native English speakers. Complex texts may contain more difficult words, have unnecessary phrases or contain long sentences. Your task is to choose the simpler piece of text. You are expected to output 'Text one' if the first sentence is simpler. Otherwise output 'Text two'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1135_xcsr_en_commonsense_mc_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1135_xcsr_en_commonsense_mc_classification.json new file mode 100644 index 000000000..e8f648fa0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1135_xcsr_en_commonsense_mc_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a question that has multiple possible answers. You should choose the most suitable option out of \"A\", \"B\", \"C\", \"D\", and \"E\", based on your commonsense knowledge." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task113_count_frequency_of_letter.json b/src/unitxt/catalog/instructions/natural_instructions/train/task113_count_frequency_of_letter.json new file mode 100644 index 000000000..e6a4a69b9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task113_count_frequency_of_letter.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to count the number of times the given letter appears in the given sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1146_country_capital.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1146_country_capital.json new file mode 100644 index 000000000..88fa2d32d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1146_country_capital.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the capital city of the given country" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1147_country_currency.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1147_country_currency.json new file mode 100644 index 000000000..47962e4bc --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1147_country_currency.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a country name and you need to return the currency of the given country." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1148_maximum_ascii_value.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1148_maximum_ascii_value.json new file mode 100644 index 000000000..dd2c55b7c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1148_maximum_ascii_value.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a string with unique characters in it and you need to return the character from the string which has the maximum ASCII value. ASCII stands for American Standard Code For Information Interchange and It assigns a unique number to each character. The characters [a - z] have an ASCII range of 97-122 and [A-Z] have an ASCII range of 65-90 respectively." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1149_item_check_edible.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1149_item_check_edible.json new file mode 100644 index 000000000..b0c2b1d1e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1149_item_check_edible.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an item and you need to check whether it is edible or not, return 1 if it is edible, else return 2." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task114_is_the_given_word_longest.json b/src/unitxt/catalog/instructions/natural_instructions/train/task114_is_the_given_word_longest.json new file mode 100644 index 000000000..5c2be9e95 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task114_is_the_given_word_longest.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to answer 'Yes' if the given word is the longest word (in terms of number of letters) in the given sentence, else answer 'No'. Note that there could be multiple longest words in a sentence as they can have the same length that is the largest across all words in that sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1150_delete_max_min.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1150_delete_max_min.json new file mode 100644 index 000000000..162a383b5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1150_delete_max_min.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of numbers. The list of numbers is separated with comma and inside brackets. You need to remove the maximum(the number with the largest value) and minimum(the number with the smallest value) element from the list and return the list in the same order as input. Your answer should be a list of numbers separated by comma, inside brackets." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1151_swap_max_min.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1151_swap_max_min.json new file mode 100644 index 000000000..2e68facdc --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1151_swap_max_min.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of unique integers you need to swap the positions of maximum and minimum element in the list and return the updated list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task115_help_advice_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task115_help_advice_classification.json new file mode 100644 index 000000000..a963f840b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task115_help_advice_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read the given sentence and if it is a general advice then indicate via \"yes\". Otherwise indicate via \"no\". advice is basically offering suggestions about the best course of action to someone. advice can come in a variety of forms, for example Direct advice and Indirect advice. (1) Direct advice: Using words (e.g., suggest, advice, recommend), verbs (e.g., can, could, should, may), or using questions (e.g., why don't you's, how about, have you thought about). (2) Indirect advice: contains hints from personal experiences with the intention for someone to do the same thing or statements that imply an action should (or should not) be taken." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1167_penn_treebank_coarse_pos_tagging.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1167_penn_treebank_coarse_pos_tagging.json new file mode 100644 index 000000000..fb0e3624d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1167_penn_treebank_coarse_pos_tagging.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Provide the parts-of-speech tag of a word present in a sentence specified within curly braces ( '{{ ... }}' ). The parts-of-speech tags are coarse labels that represent a category of words with similar grammatical properties. The list of part-of-speech tags i.e tagset of this corpus is - \n '.': Period symbol is used for symbols denoting Punctuations/Separations such as comma, period, backticks etc., \n 'ADJ': Adjectives are words that typically modify nouns and specify their properties or attributes, \n 'ADP': Adposition is a cover term for prepositions and postpositions, \n 'ADV': Adverbs are words that typically modify verbs for such categories as time, place, direction or manner, \n 'CONJ': A word used to connect clauses or sentences or to coordinate words in the same clause, \n 'DET': Determiners are words that modify nouns or noun phrases and express the reference of the noun phrase in context, \n 'NOUN': Nouns are a part of speech typically denoting a person, place, thing, animal or idea, \n 'NUM': A numeral is a word, functioning most typically as a determiner, adjective or pronoun, that expresses a number and a relation to the number, such as quantity, sequence, frequency or fraction, \n 'PRT': Particles are function words that must be associated with another word or phrase to impart meaning and that do not satisfy definitions of other universal parts of speech, \n 'PRON': Pronouns are words that substitute for nouns or noun phrases, whose meaning is recoverable from the 
linguistic or extralinguistic context, \n 'PROPN': A proper noun is a noun (or nominal content word) that is the name (or part of the name) of a specific individual, place, or object, \n 'VERB': A verb is a member of the syntactic class of words that typically signal events and actions, can constitute a minimal predicate in a clause, and govern the number and types of other constituents which may occur in the clause, \n 'X': The tag X is used for words that for some reason cannot be assigned a real part-of-speech category." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1168_brown_coarse_pos_tagging.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1168_brown_coarse_pos_tagging.json new file mode 100644 index 000000000..a4c16833b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1168_brown_coarse_pos_tagging.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to provide the parts-of-speech tag of a word present in a sentence specified within curly braces ( '{{ ... }}' ). The parts-of-speech tags are coarse labels that represent a category of words with similar grammatical properties. 
The list of part-of-speech tags i.e tagset of this corpus is - \n '.': Period symbol is used for symbols denoting Punctuations/Separations such as comma, period, backticks etc., \n 'ADJ': Adjectives are words that typically modify nouns and specify their properties or attributes, \n 'ADP': Adposition is a cover term for prepositions and postpositions, \n 'ADV': Adverbs are words that typically modify verbs for such categories as time, place, direction or manner, \n 'CONJ': A word used to connect clauses or sentences or to coordinate words in the same clause, \n 'DET': Determiners are words that modify nouns or noun phrases and express the reference of the noun phrase in context, \n 'NOUN': Nouns are a part of speech typically denoting a person, place, thing, animal or idea, \n 'NUM': A numeral is a word, functioning most typically as a determiner, adjective or pronoun, that expresses a number and a relation to the number, such as quantity, sequence, frequency or fraction, \n 'PRT': Particles are function words that must be associated with another word or phrase to impart meaning and that do not satisfy definitions of other universal parts of speech, \n 'PRON': Pronouns are words that substitute for nouns or noun phrases, whose meaning is recoverable from the linguistic or extralinguistic context, \n 'PROPN': A proper noun is a noun (or nominal content word) that is the name (or part of the name) of a specific individual, place, or object, \n 'VERB': A verb is a member of the syntactic class of words that typically signal events and actions, can constitute a minimal predicate in a clause, and govern the number and types of other constituents which may occur in the clause, \n 'X': The tag X is used for words that for some reason cannot be assigned a real part-of-speech category." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task116_com2sense_commonsense_reasoning.json b/src/unitxt/catalog/instructions/natural_instructions/train/task116_com2sense_commonsense_reasoning.json new file mode 100644 index 000000000..de3062e8a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task116_com2sense_commonsense_reasoning.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a piece of text either about an everyday event, or a general statement. If the event seems a plausible event to you, or the general statement makes sense matches your commonsense, output 'True', otherwise output 'False'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1186_nne_hrngo_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1186_nne_hrngo_classification.json new file mode 100644 index 000000000..e1eb5c81c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1186_nne_hrngo_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an original reference as well as a system generated reference. Your task is to judge the naturaleness of the system generated reference. If the utterance could have been produced by a native speaker output 1, else output 0." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1188_count_max_freq_char.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1188_count_max_freq_char.json new file mode 100644 index 000000000..e450098d6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1188_count_max_freq_char.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a string with duplicate characters ocurring in the string. 
You need to return the character which is ocurring with the maximum frequency. In case of a tie, return the character with the least ascii value." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1189_check_char_in_string.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1189_check_char_in_string.json new file mode 100644 index 000000000..5e196c8ff --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1189_check_char_in_string.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a string S and a character c separated by a comma. You need to check if the character c is present in S or not. Return 1 if it is present, else return 0." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation.json new file mode 100644 index 000000000..1befbcb5f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task118_semeval_2019_task10_open_vocabulary_mathematical_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a mathematical question described with an open-ended vocabulary. Questions in this task involve real-world situations, describing a mathematical problem. You are also given 4 or 5 answer options (associated with \"A\", \"B\", \"C\", \"D\", \"E\"). Do not generate anything else apart from one of the following characters: 'A', 'B, 'C', 'D', 'E'. LaTeX mathematical format (the standard way to express mathematical expressions in the typesetting software known as LaTeX) is used to express equations. Each question is solvable with high school math knowledge. Give only one answer for each question." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1190_add_integer_to_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1190_add_integer_to_list.json new file mode 100644 index 000000000..b55285146 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1190_add_integer_to_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of integers and an integer k. You need to add integer k to each element in the list and return the updated list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1191_food_veg_nonveg.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1191_food_veg_nonveg.json new file mode 100644 index 000000000..175da1c03 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1191_food_veg_nonveg.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given the name of an Indian food dish. You need to return whether the dish is \"non vegetarian\" or \"vegetarian\". Do not answer with any words other than those two." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1192_food_flavor_profile.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1192_food_flavor_profile.json new file mode 100644 index 000000000..933315c9d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1192_food_flavor_profile.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given the name of an Indian food dish. You need to classify the dish as \"sweet\" or \"spicy\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1193_food_course_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1193_food_course_classification.json new file mode 100644 index 000000000..7b220c8cb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1193_food_course_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given the name of an Indian food dish. You need to classify the dish as a \"main course\", \"dessert\" or \"snack\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1194_kth_largest_element.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1194_kth_largest_element.json new file mode 100644 index 000000000..caca54c17 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1194_kth_largest_element.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of integers and an integer k. You need to find the kth largest element in the input list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1196_atomic_classification_oeffect.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1196_atomic_classification_oeffect.json new file mode 100644 index 000000000..bdd3c4d48 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1196_atomic_classification_oeffect.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a tuple, comprising Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. 
You have to determine whether, as a result of the Head, PersonY or others will be affected as mentioned in the Tail or not. These effects are social actions that may occur after the Head event. For example, X may get hugged, and Y may blush in response. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1197_atomic_classification_oreact.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1197_atomic_classification_oreact.json new file mode 100644 index 000000000..e4596937e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1197_atomic_classification_oreact.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a tuple, comprising Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether, as a result of the Head, PersonY, or others, feel what is mentioned in the Tail or not. Feelings in this task are the emotional reactions on the part of PersonY or other participants in an event. For example, as a result of gift-giving, others (in this case, PersonY) might feel appreciated. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1198_atomic_classification_owant.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1198_atomic_classification_owant.json new file mode 100644 index 000000000..a10384169 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1198_atomic_classification_owant.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a tuple, comprising Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether, as a result of the Head, PersonY or others will want what is mentioned in the Tail or not. In this task, wanting is a postcondition desire on the part of PersonY and others, respectively. For example, as a result of PersonX giving PersonY gifts, PersonY may want to open the gift. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1199_atomic_classification_xattr.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1199_atomic_classification_xattr.json new file mode 100644 index 000000000..a6a1bf79d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1199_atomic_classification_xattr.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a tuple, comprising Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). 
PersonX is always the subject of the event. You have to determine whether, as a result of the Head, PersonX will be seen as what is mentioned in the Tail or not. In this task, PersonX will be seen as the Tail if the Tail describes PersonX's persona or attribute as perceived by others given an event. In the gift-giving example, X may be seen as generous or giving. In contrast, in an event such as PersonX steals a car, PersonX may be perceived as evil. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task119_semeval_2019_task10_geometric_mathematical_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task119_semeval_2019_task10_geometric_mathematical_answer_generation.json new file mode 100644 index 000000000..2b7e3362d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task119_semeval_2019_task10_geometric_mathematical_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a geometric mathematical question. Questions in this task often involve shapes and Geometric Relationships. You are also given 4 or 5 answer options (associated with \"A\", \"B\", \"C\", \"D\", \"E\"). Do not generate anything else apart from one of the following characters: 'A', 'B, 'C', 'D', 'E'. LaTeX mathematical format (the standard way to express mathematical expressions in the typesetting software known as LaTeX) is used to express equations. Each question is solvable with high school math knowledge." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1200_atomic_classification_xeffect.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1200_atomic_classification_xeffect.json new file mode 100644 index 000000000..779a4f552 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1200_atomic_classification_xeffect.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether, as a result of the Head, PersonX will be affected as mentioned in the Tail or not. These effects are social actions that may occur after the Head event. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1201_atomic_classification_xintent.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1201_atomic_classification_xintent.json new file mode 100644 index 000000000..fafde05e9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1201_atomic_classification_xintent.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether The Tail is the intention of the PersonX from the Head or not. 
The intention is the likely intent or desire of PersonX behind the execution of an event. For example, given the Head PersonX gives PersonY gifts, an intention might be that PersonX wanted to be thoughtful. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1202_atomic_classification_xneed.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1202_atomic_classification_xneed.json new file mode 100644 index 000000000..62672a495 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1202_atomic_classification_xneed.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether PersonX needs what is mentioned in the Tail before the Head or not. Here need is a precondition for PersonX to achieve the event. For example, in order for PersonX to give PersonY gifts, PersonX must first buy the presents. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1203_atomic_classification_xreact.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1203_atomic_classification_xreact.json new file mode 100644 index 000000000..d1390086a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1203_atomic_classification_xreact.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": " In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether, as a result of the Head, PersonX may feel what is mentioned in the Tail or not. In this task, the feeling is an emotional reaction on the part of X or other participants in an event. For example, as a result of gift-giving, X might feel good about [one]self. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1204_atomic_classification_hinderedby.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1204_atomic_classification_hinderedby.json new file mode 100644 index 000000000..f2a911f6f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1204_atomic_classification_hinderedby.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). 
PersonX is always the subject of the event. You have to determine whether the Head can be hindered by what is mentioned in the Tail or not. In this task, hindering introduces hindrances that obstruct the natural path to the achievement of a goal. For example, the event PersonX adopts a cat can be obstructed if PersonX is allergic to cats. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1205_atomic_classification_isafter.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1205_atomic_classification_isafter.json new file mode 100644 index 000000000..0313a7d4b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1205_atomic_classification_isafter.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head happens after the Tail or not. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1206_atomic_classification_isbefore.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1206_atomic_classification_isbefore.json new file mode 100644 index 000000000..ad225ee39 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1206_atomic_classification_isbefore.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head happens before the Tail or not. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1207_atomic_classification_atlocation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1207_atomic_classification_atlocation.json new file mode 100644 index 000000000..9ba8b2a60 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1207_atomic_classification_atlocation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head is located or can be found at/in/on the Tail or not. Classify your answers into \"Yes\" and \"No\". 
The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1208_atomic_classification_xreason.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1208_atomic_classification_xreason.json new file mode 100644 index 000000000..8a28ab037 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1208_atomic_classification_xreason.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether The Tail is the reason for the Head or not. The reason provides a post-fact explanation of the cause of an event. For example, why one has to walk could be explained by a car has broken down. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1209_atomic_classification_objectuse.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1209_atomic_classification_objectuse.json new file mode 100644 index 000000000..7ca3402e6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1209_atomic_classification_objectuse.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. 
The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head is used for the Tail or not. The usage describes everyday affordances or uses of objects and includes both typical and atypical uses. For example, a popcorn bucket can typically be used to hold popcorn, but it could also serve as a hat in atypical situations. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1210_atomic_classification_madeupof.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1210_atomic_classification_madeupof.json new file mode 100644 index 000000000..b6dd11415 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1210_atomic_classification_madeupof.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head is a part, portion, or makeup of the Tail or not. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1211_atomic_classification_hassubevent.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1211_atomic_classification_hassubevent.json new file mode 100644 index 000000000..28f19b880 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1211_atomic_classification_hassubevent.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head includes an event or an action in the Tail or not. This happens when the Tail denotes a step within the larger head event. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1212_atomic_classification_hasproperty.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1212_atomic_classification_hasproperty.json new file mode 100644 index 000000000..b85681c2e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1212_atomic_classification_hasproperty.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head can be characterized by being or having the Tail or not. 
Being characterized usually describes entities' general characteristics such as rose is red, or subjective attributes such as thirst is uncomfortable. It can also map to descriptors that speak to the substance or value of items such as meat has the property of being stored in the freezer or bike is powered by a person's legs. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1213_atomic_classification_desires.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1213_atomic_classification_desires.json new file mode 100644 index 000000000..912f7fddb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1213_atomic_classification_desires.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether it is plausible for the Head to desire the Tail or not. In this task, desire means desires of sentient entities. For example, doctors likely desire to cure a patient. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1214_atomic_classification_xwant.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1214_atomic_classification_xwant.json new file mode 100644 index 000000000..ad016b4f5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1214_atomic_classification_xwant.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether, as a result of the Head, PersonX wants what is mentioned in the Tail or not. In this task, wanting is a postcondition desire on the part of PersonX, respectively. As a result of PersonX giving PersonY gifts, PersonX may also desire to hug PersonY. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1215_atomic_classification_capableof.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1215_atomic_classification_capableof.json new file mode 100644 index 000000000..1cdd14462 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1215_atomic_classification_capableof.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with . The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. 
You have to determine whether the Head is capable of the Tail or not. Being capable of something includes general capabilities, such as a human is capable of thinking and reasoning or drinking coffee. It also includes specialized capabilities such as a surgeon is capable of operating on a patient. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1216_atomic_classification_causes.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1216_atomic_classification_causes.json new file mode 100644 index 000000000..f2fc34bb2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1216_atomic_classification_causes.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two phrases: Head and Tail, separated with <sep>. The Head and the Tail events are short phrases possibly involving participants. The names of specific people have been replaced by generic words (e.g., PersonX, PersonY, PersonZ). PersonX is always the subject of the event. You have to determine whether the Head causes the Tail or not. Classify your answers into \"Yes\" and \"No\". The phrase may also contain \"___\", a placeholder that can be an object, a person, and/or an action." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1217_atomic_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1217_atomic_answer_generation.json new file mode 100644 index 000000000..431a23396 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1217_atomic_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence with a missing word that can be an object, a person, and/or an action. Fill in the blank with a plausible word. Although each sentence has many correct answers, you only have to write one answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task122_conala_list_index_addition.json b/src/unitxt/catalog/instructions/natural_instructions/train/task122_conala_list_index_addition.json new file mode 100644 index 000000000..6366825ff --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task122_conala_list_index_addition.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list, of lists, of numbers. Each list is presented with brackets and comma-separated values. For example, a list of numbers is [1,2,3] and a list of two lists of numbers is [[1,2],[3,4,6]]. You should sum up the values at every position of every inner list and put it as an element of your answer, that is, you should sum the first members of each inner list together and put it as the first element of the list, then sum the second members of each inner list together and put it as the second element of your list, etc. The output should be a list of numbers with the same length as the longest inner list." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task123_conala_sort_dictionary.json b/src/unitxt/catalog/instructions/natural_instructions/train/task123_conala_sort_dictionary.json new file mode 100644 index 000000000..7d34c1154 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task123_conala_sort_dictionary.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of dictionaries. A dictionary is a set of key-value pairs, where each key is unique and has a value associated with that key. You should sort the list of dictionaries from smallest to largest by their 'first' key. If there are two dictionaries with the same 'first' value then sort them by their 'second' key. Negative numbers should come before positive numbers." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task124_conala_pair_averages.json b/src/unitxt/catalog/instructions/natural_instructions/train/task124_conala_pair_averages.json new file mode 100644 index 000000000..5943fa447 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task124_conala_pair_averages.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a list of numbers and you need to find the average of each two consecutive values. The average of two numbers a and b is calculated as: (a + b) /2. The output should be a list of the averages of each two consecutive values. A list is presented with two brackets and comma-separated values, like: [1,2,3]." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task125_conala_pair_differences.json b/src/unitxt/catalog/instructions/natural_instructions/train/task125_conala_pair_differences.json new file mode 100644 index 000000000..75e3cfe00 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task125_conala_pair_differences.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a list of integers and you need to find the absolute value of the difference between each two consecutive values. The output should be a list of the absolute value of the differences of each two consecutive values." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task126_scan_structured_text_generation_command_action_all.json b/src/unitxt/catalog/instructions/natural_instructions/train/task126_scan_structured_text_generation_command_action_all.json new file mode 100644 index 000000000..f9a9769a8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task126_scan_structured_text_generation_command_action_all.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a command in a limited form of natural language, provide the correct sequence of actions that executes the command to thus navigate an agent in its environment. A command can be broken down into many different actions. Actions are uppercase and are individual steps that serve as the building blocks for a command. For commands, 'left' and 'right' are used to denote the direction of an action. The word 'opposite' turns the agent backward in the specified direction. The word 'around' makes the agent execute an action while turning around in the specified direction. The word 'and' means to execute the next scope of the command following the previous scope of the command. 
The word 'after' signifies to execute the previous scope of the command following the next scope of the command. The words 'twice' and 'thrice' trigger repetition of a command that they scope over two times or three times, respectively. There are only six actions: 'I_LOOK', 'I_WALK', 'I_RUN', 'I_JUMP', 'I_TURN_LEFT', and 'I_TURN_RIGHT'. These actions respectively align with the commands 'look', 'walk', 'run', 'jump', 'turn left', and 'turn right'. Actions and commands do not have quotations in the input and output." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task127_scan_long_text_generation_action_command_all.json b/src/unitxt/catalog/instructions/natural_instructions/train/task127_scan_long_text_generation_action_command_all.json new file mode 100644 index 000000000..ed76240e0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task127_scan_long_text_generation_action_command_all.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sequence of actions to navigate an agent in its environment, provide the correct command in a limited form of natural language that matches the sequence of actions when executed. Commands are lowercase and encapsulate the logic of the sequence of actions. Actions are individual steps that serve as the building blocks for a command. There are only six actions: 'I_LOOK', 'I_WALK', 'I_RUN', 'I_JUMP', 'I_TURN_LEFT', and 'I_TURN_RIGHT'. These actions respectively align with the commands 'look', 'walk', 'run', 'jump', 'turn left', and 'turn right'. For commands, 'left' and 'right' are used to denote the direction of an action. opposite turns the agent backward in the specified direction. The word 'around' makes the agent execute an action while turning around in the specified direction. The word 'and' means to execute the next scope of the command following the previous scope of the command. 
The word 'after' signifies to execute the previous scope of the command following the next scope of the command. The words 'twice' and 'thrice' trigger repetition of a command that they scope over two times or three times, respectively. Actions and commands do not have quotations in the input and output." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1283_hrngo_quality_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1283_hrngo_quality_classification.json new file mode 100644 index 000000000..d7c0b283d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1283_hrngo_quality_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an original reference as well as a system reference. Your task is to judge the quality of the system reference. If the utterance is grammatically correct and fluent output 1, else output 0." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1284_hrngo_informativeness_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1284_hrngo_informativeness_classification.json new file mode 100644 index 000000000..be6d62cfe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1284_hrngo_informativeness_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an original reference as well as a system reference. Your task is to judge the informativeness of the system reference. If the utterance provides all the useful information from the meaning representation output 1, else output 0." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1285_kpa_keypoint_matching.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1285_kpa_keypoint_matching.json new file mode 100644 index 000000000..53ad67072 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1285_kpa_keypoint_matching.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input contains a debate topic, an argument on the topic and a keypoint, separated by \"<sep>\". Your task is to answer if the keypoint matches the argument and summarizes exactly what the argument means, in the context of the given topic." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1286_openbookqa_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1286_openbookqa_question_answering.json new file mode 100644 index 000000000..fcb4dd79d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1286_openbookqa_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a multiple-choice question and you have to pick the correct option. Answer with option indexes (i.e., \"A\", \"B\", \"C\", and \"D\")." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1288_glue_mrpc_paraphrasing.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1288_glue_mrpc_paraphrasing.json new file mode 100644 index 000000000..a0040889c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1288_glue_mrpc_paraphrasing.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given two sentences(Sentence1 and Sentence2). Answer \"Yes\" if these sentences are a paraphrase of one another, otherwise answer \"No\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1289_trec_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1289_trec_classification.json new file mode 100644 index 000000000..af9a4ca59 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1289_trec_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question. You need to detect which category better describes the question. A question belongs to the description category if it asks about description and abstract concepts. Entity questions are about entities such as animals, colors, sports, etc. Abbreviation questions ask about abbreviations and expressions abbreviated. Questions regarding human beings, description of a person, and a group or organization of persons are categorized as Human. Quantity questions are asking about numeric values and Location questions ask about locations, cities, and countries. Answer with \"Description\", \"Entity\", \"Abbreviation\", \"Person\", \"Quantity\", and \"Location\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task128_scan_structured_text_generation_command_action_short.json b/src/unitxt/catalog/instructions/natural_instructions/train/task128_scan_structured_text_generation_command_action_short.json new file mode 100644 index 000000000..f9a9769a8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task128_scan_structured_text_generation_command_action_short.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a command in a limited form of natural language, provide the correct sequence of actions that executes the command to thus navigate an agent in its environment. A command can be broken down into many different actions. 
Actions are uppercase and are individual steps that serve as the building blocks for a command. For commands, 'left' and 'right' are used to denote the direction of an action. The word 'opposite' turns the agent backward in the specified direction. The word 'around' makes the agent execute an action while turning around in the specified direction. The word 'and' means to execute the next scope of the command following the previous scope of the command. The word 'after' signifies to execute the previous scope of the command following the next scope of the command. The words 'twice' and 'thrice' trigger repetition of a command that they scope over two times or three times, respectively. There are only six actions: 'I_LOOK', 'I_WALK', 'I_RUN', 'I_JUMP', 'I_TURN_LEFT', and 'I_TURN_RIGHT'. These actions respectively align with the commands 'look', 'walk', 'run', 'jump', 'turn left', and 'turn right'. Actions and commands do not have quotations in the input and output." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1290_xsum_summarization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1290_xsum_summarization.json new file mode 100644 index 000000000..ef114e0d9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1290_xsum_summarization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an article. Your task is to summarize the article in a sentence." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1291_multi_news_summarization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1291_multi_news_summarization.json new file mode 100644 index 000000000..28585c460 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1291_multi_news_summarization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text of many news articles separated by special token \"|||||\". Your task is to summarize them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1292_yelp_review_full_text_categorization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1292_yelp_review_full_text_categorization.json new file mode 100644 index 000000000..e80490f0f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1292_yelp_review_full_text_categorization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a review about a place. You need to provide a rating from \"1 star\" to \"5 stars\" for this place." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1293_kilt_tasks_hotpotqa_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1293_kilt_tasks_hotpotqa_question_answering.json new file mode 100644 index 000000000..1b1fe7e84 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1293_kilt_tasks_hotpotqa_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question. You have to answer the question based on your information." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1294_wiki_qa_answer_verification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1294_wiki_qa_answer_verification.json new file mode 100644 index 000000000..2472df5d3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1294_wiki_qa_answer_verification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question and an answer. Answer \"Yes\" if the given answer correctly answers the question, otherwise answer \"No\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1295_adversarial_qa_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1295_adversarial_qa_question_answering.json new file mode 100644 index 000000000..01ae0371a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1295_adversarial_qa_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question and a context passage. You have to answer the question based on the given passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1296_wiki_hop_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1296_wiki_hop_question_answering.json new file mode 100644 index 000000000..ef8d93a72 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1296_wiki_hop_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a context, a subject, a relation, and many options. Based on the context, from the options select the object entity that has the given relation with the subject. Answer with text (not indexes)." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task129_scan_long_text_generation_action_command_short.json b/src/unitxt/catalog/instructions/natural_instructions/train/task129_scan_long_text_generation_action_command_short.json new file mode 100644 index 000000000..ed76240e0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task129_scan_long_text_generation_action_command_short.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sequence of actions to navigate an agent in its environment, provide the correct command in a limited form of natural language that matches the sequence of actions when executed. Commands are lowercase and encapsulate the logic of the sequence of actions. Actions are individual steps that serve as the building blocks for a command. There are only six actions: 'I_LOOK', 'I_WALK', 'I_RUN', 'I_JUMP', 'I_TURN_LEFT', and 'I_TURN_RIGHT'. These actions respectively align with the commands 'look', 'walk', 'run', 'jump', 'turn left', and 'turn right'. For commands, 'left' and 'right' are used to denote the direction of an action. opposite turns the agent backward in the specified direction. The word 'around' makes the agent execute an action while turning around in the specified direction. The word 'and' means to execute the next scope of the command following the previous scope of the command. The word 'after' signifies to execute the previous scope of the command following the next scope of the command. The words 'twice' and 'thrice' trigger repetition of a command that they scope over two times or three times, respectively. Actions and commands do not have quotations in the input and output." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1308_amazonreview_category_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1308_amazonreview_category_classification.json new file mode 100644 index 000000000..1188a2486 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1308_amazonreview_category_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a review from Amazon and category of the product based on the review given by the user and your task is to classify whether the given category matches the review. Generate \"True\" if given review and its category match, otherwise generate \"False\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1309_amazonreview_summary_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1309_amazonreview_summary_classification.json new file mode 100644 index 000000000..3f1f6debf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1309_amazonreview_summary_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given reviews from Amazon's food products and a summary of that review. Your task is to classify whether the given summary matches the original review. Generate \"True\" if the given review and its summary match, otherwise generate \"False\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task130_scan_structured_text_generation_command_action_long.json b/src/unitxt/catalog/instructions/natural_instructions/train/task130_scan_structured_text_generation_command_action_long.json new file mode 100644 index 000000000..f9a9769a8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task130_scan_structured_text_generation_command_action_long.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a command in a limited form of natural language, provide the correct sequence of actions that executes the command to thus navigate an agent in its environment. A command can be broken down into many different actions. Actions are uppercase and are individual steps that serve as the building blocks for a command. For commands, 'left' and 'right' are used to denote the direction of an action. The word 'opposite' turns the agent backward in the specified direction. The word 'around' makes the agent execute an action while turning around in the specified direction. The word 'and' means to execute the next scope of the command following the previous scope of the command. The word 'after' signifies to execute the previous scope of the command following the next scope of the command. The words 'twice' and 'thrice' trigger repetition of a command that they scope over two times or three times, respectively. There are only six actions: 'I_LOOK', 'I_WALK', 'I_RUN', 'I_JUMP', 'I_TURN_LEFT', and 'I_TURN_RIGHT'. These actions respectively align with the commands 'look', 'walk', 'run', 'jump', 'turn left', and 'turn right'. Actions and commands do not have quotations in the input and output." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1310_amazonreview_rating_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1310_amazonreview_rating_classification.json new file mode 100644 index 000000000..40e9c90e4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1310_amazonreview_rating_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a review from Amazon. Your task is to generate a rating for the product on a scale of 1-5 based on the review. The rating means 1: extremely poor, 2: poor, 3: neutral, 4: good, 5: extremely good." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1311_amazonreview_rating_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1311_amazonreview_rating_classification.json new file mode 100644 index 000000000..afb79dd53 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1311_amazonreview_rating_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a review from Amazon and rating for the product on a scale of 1-5 based on the review. The rating means 1: extremely poor, 2: poor, 3: neutral, 4: good, 5: extremely good. Your task is to generate whether the rating matches the review or not. 
Answer with \"True\" if the rating matches the review, otherwise answer with \"False\"" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1312_amazonreview_polarity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1312_amazonreview_polarity_classification.json new file mode 100644 index 000000000..7e9735a34 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1312_amazonreview_polarity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, You are given a review of Amazon's food products. Your task is to divide them into two classes: negative or positive, depending on the content of the review." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1313_amazonreview_polarity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1313_amazonreview_polarity_classification.json new file mode 100644 index 000000000..8b5239dbf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1313_amazonreview_polarity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, You are given an amazon review and its polarity (positive or negative). 
Your task is to answer \"True\" if the specified sentence and its polarity match; otherwise, answer \"False\"" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1314_country_abbreviation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1314_country_abbreviation.json new file mode 100644 index 000000000..434428ecd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1314_country_abbreviation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the abbreviation name of the given country." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1315_find_range_array.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1315_find_range_array.json new file mode 100644 index 000000000..5fd77cea3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1315_find_range_array.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of integers you need to calculate and return the range of the integers which is the difference between maximum and minimum element in the list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1316_remove_duplicates_string.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1316_remove_duplicates_string.json new file mode 100644 index 000000000..536342b61 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1316_remove_duplicates_string.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a string of characters. You need to remove duplicate characters from the string if any, and return the resulting string." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1317_country_calling_code.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1317_country_calling_code.json new file mode 100644 index 000000000..2c1c7c022 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1317_country_calling_code.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the calling code of the given country. Your output must be formatted as a plus sign (+), followed by the calling code number" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1318_country_national_dish.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1318_country_national_dish.json new file mode 100644 index 000000000..590c4d4f6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1318_country_national_dish.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the national dish of the given country. Some countries have multiple national dishes, in which case any one of those dishes will be considered a valid output." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1319_country_by_barcode_prefix.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1319_country_by_barcode_prefix.json new file mode 100644 index 000000000..cba169c86 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1319_country_by_barcode_prefix.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the barcode prefix of the given country. 
A barcode prefix is a 3-digit number at the beginning of all the barcodes on products from a company or country. Some countries have ranges of barcode prefixes such as, 730 - 739; in such a case, a number from within that range will be considered as a valid output." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task131_scan_long_text_generation_action_command_long.json b/src/unitxt/catalog/instructions/natural_instructions/train/task131_scan_long_text_generation_action_command_long.json new file mode 100644 index 000000000..ed76240e0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task131_scan_long_text_generation_action_command_long.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sequence of actions to navigate an agent in its environment, provide the correct command in a limited form of natural language that matches the sequence of actions when executed. Commands are lowercase and encapsulate the logic of the sequence of actions. Actions are individual steps that serve as the building blocks for a command. There are only six actions: 'I_LOOK', 'I_WALK', 'I_RUN', 'I_JUMP', 'I_TURN_LEFT', and 'I_TURN_RIGHT'. These actions respectively align with the commands 'look', 'walk', 'run', 'jump', 'turn left', and 'turn right'. For commands, 'left' and 'right' are used to denote the direction of an action. opposite turns the agent backward in the specified direction. The word 'around' makes the agent execute an action while turning around in the specified direction. The word 'and' means to execute the next scope of the command following the previous scope of the command. The word 'after' signifies to execute the previous scope of the command following the next scope of the command. The words 'twice' and 'thrice' trigger repetition of a command that they scope over two times or three times, respectively. 
Actions and commands do not have quotations in the input and output." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1320_country_domain_tld.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1320_country_domain_tld.json new file mode 100644 index 000000000..ca105b0de --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1320_country_domain_tld.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the Top Level Domain (TLD) of the given country. The TLD is the part that follows immediately after the \"dot\" symbol in a website's address. The output, TLD is represented by a \".\", followed by the domain." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1321_country_continent.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1321_country_continent.json new file mode 100644 index 000000000..e3d9af11f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1321_country_continent.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the continent to which the country belongs." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1322_country_government_type.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1322_country_government_type.json new file mode 100644 index 000000000..9c25040f9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1322_country_government_type.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to answer with the government type of the country, as of the year 2015. 
The following are possible government types that are considered valid answers: Republic, Parliamentary Coprincipality, Federal Republic, Monarchy, Islamic Republic, Constitutional Monarchy, Parlementary Monarchy, Federation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1325_qa_zre_question_generation_on_subject_relation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1325_qa_zre_question_generation_on_subject_relation.json new file mode 100644 index 000000000..91716c280 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1325_qa_zre_question_generation_on_subject_relation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a context, a subject and a relation. Your task is to generate a question based on the subject and relation. The generated question should include the given subject. Try to use a minimum number of words that are not present in either context, subject or relation while generating question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1326_qa_zre_question_generation_from_answer.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1326_qa_zre_question_generation_from_answer.json new file mode 100644 index 000000000..f6a4e46cc --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1326_qa_zre_question_generation_from_answer.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Generate a question which can yield the answer mentioned in the input. Generated question must be answered by the answer provided in input, without using any extra knowledge." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1327_qa_zre_answer_generation_from_question.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1327_qa_zre_answer_generation_from_question.json new file mode 100644 index 000000000..795e51317 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1327_qa_zre_answer_generation_from_question.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Generate a correct and concise answer for the question based on the words in the context." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1328_qa_zre_relation_generation_from_question.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1328_qa_zre_relation_generation_from_question.json new file mode 100644 index 000000000..d0f5efb90 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1328_qa_zre_relation_generation_from_question.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Classify the relation of question with context to one of these categories: 1) award received, 2) based on, collection, 3) conflict, 4) constellation, 5) convicted of, 6) date of death, 7) director, 8) drafted by, 9) educated at, 10) medical condition, 11) military branch, 12) narrative location, 13) occupation, 14) original network, 15) parent company, 16) point in time, 17) production company, 18) residence, 19) series, 20) service entry, 21) sex or gender, 22) spouse, 23) standards body question." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task132_dais_text_modification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task132_dais_text_modification.json new file mode 100644 index 000000000..2c03a5779 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task132_dais_text_modification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Languages typically provide more than one grammatical construction to express certain types of messages. Your task is to generate a sentence with the same meaning as given sentence, but with different grammatical construction." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1331_reverse_array.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1331_reverse_array.json new file mode 100644 index 000000000..5c6cb1f49 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1331_reverse_array.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of integers in a random order. You need to return the same list of integers in the reverse order." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1332_check_leap_year.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1332_check_leap_year.json new file mode 100644 index 000000000..cdac582a7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1332_check_leap_year.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a year. You need to check if it is a leap year or not. A year may be a leap year if it is evenly divisible by 4. Years that are divisible by 100 (century years such as 1900 or 2000) cannot be leap years unless they are also divisible by 400. 
Return 1 if it is a leap year, else return 0." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1333_check_validity_date_ddmmyyyy.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1333_check_validity_date_ddmmyyyy.json new file mode 100644 index 000000000..5a02dd69d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1333_check_validity_date_ddmmyyyy.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a date in \"dd/mm/yyyy\" format. You need to check if the date is valid or not. Return 1 if it is valid, else return 0. A date is valid if the components day(\"dd\"), month(\"mm\") and year(\"yyyy\") are all valid individually. A day(dd) is valid if it: a) lies between 1 and 31 for the months of January, March, May, July, August, October, December, b) lies between 1 and 28 for February on non-leap years and between 1-29 on leap years, c) lies between 1-30 for all other months. A month(mm) is valid if it lies in the range from 1 to 12 as there are 12 months in a year. A year is always valid if it is expressed in the form of \"yyyy\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1336_peixian_equity_evaluation_corpus_gender_classifier.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1336_peixian_equity_evaluation_corpus_gender_classifier.json new file mode 100644 index 000000000..5e1e71a12 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1336_peixian_equity_evaluation_corpus_gender_classifier.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a sentence containing a pronoun/person name and an emotion. From these implicit parameters, the main goal is to find the gender of the person (male / female)." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1338_peixian_equity_evaluation_corpus_sentiment_classifier.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1338_peixian_equity_evaluation_corpus_sentiment_classifier.json new file mode 100644 index 000000000..868726bbb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1338_peixian_equity_evaluation_corpus_sentiment_classifier.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a sentence. The sentence includes an emotion. The goal of the task is to classify the emotion in the sentence to one of the classes: 'fear', 'joy', 'anger', 'sadness'. The emotion mainly depends on the adverb within the sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1339_peixian_equity_evaluation_corpus_text_completion.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1339_peixian_equity_evaluation_corpus_text_completion.json new file mode 100644 index 000000000..bf3f4f700 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1339_peixian_equity_evaluation_corpus_text_completion.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a sentence with a missed word and an emotion. Your task is to fill in the blank with a word that matches the emotion and rewrite the completed sentence. The emotion is one of ['fear', 'joy', 'anger', 'sadness']." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1340_msr_text_compression_compression.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1340_msr_text_compression_compression.json new file mode 100644 index 000000000..b689df49b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1340_msr_text_compression_compression.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a text, write a compressed version of it in a single sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1341_msr_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1341_msr_text_classification.json new file mode 100644 index 000000000..835ae36b6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1341_msr_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence, judge the quality of this sentence by indicating \"Good\" and \"Bad\". The quality depends on the grammar and the meaning of the sentence. If a sentence is easily understandable, and doesn't have grammatical errors, answer with \"Good\", otherwise answer with \"Bad\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1346_glue_cola_grammatical_correctness_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1346_glue_cola_grammatical_correctness_classification.json new file mode 100644 index 000000000..2be46ec33 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1346_glue_cola_grammatical_correctness_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a sentence. Check whether the sentence is grammatically correct and is meaningful. 
If the sentence is grammatically correct, then answer with '1', otherwise answer with '0'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1347_glue_sts_b_similarity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1347_glue_sts_b_similarity_classification.json new file mode 100644 index 000000000..661e9ff90 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1347_glue_sts_b_similarity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Evaluate the similarity between them and classify them into classes from 0-5 as follows:\n0 : The two sentences are completely dissimilar.\n1 : The two sentences are not equivalent, but are on the same topic.\n2 : The two sentences are not equivalent, but share some details.\n3 : The two sentences are roughly equivalent, but some important information differs/missing.\n4 : The two sentences are mostly equivalent, but some unimportant details differ.\n5 : The two sentences are completely equivalent, as they mean the same thing." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1354_sent_comp_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1354_sent_comp_classification.json new file mode 100644 index 000000000..aca270f38 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1354_sent_comp_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text of news article and corresponding headline of an article. Your task is to give label \"match\" if headline is correct for article, otherwise give label \"no\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1355_sent_comp_summarization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1355_sent_comp_summarization.json new file mode 100644 index 000000000..45cf998d9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1355_sent_comp_summarization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a piece of an article. Your task is to generate a short summary of the text. Try to give the summary in just one sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1359_numer_sense_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1359_numer_sense_answer_generation.json new file mode 100644 index 000000000..a31d277f6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1359_numer_sense_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence, fill out the missing word with a 'no' or a number (between zero and ten). You should write the numbers with english alphabet, like: four instead of 4." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1360_numer_sense_multiple_choice_qa_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1360_numer_sense_multiple_choice_qa_generation.json new file mode 100644 index 000000000..489b35a35 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1360_numer_sense_multiple_choice_qa_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence with a missing word, pick the answer option that best fills out the missing word in the sentence. Indicate each answer with its index ('a', 'b', 'c', 'd')." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1361_movierationales_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1361_movierationales_classification.json new file mode 100644 index 000000000..0c0a53822 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1361_movierationales_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you must classify if a given review is positive/negative, indicating your answer as P or N." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1364_hans_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1364_hans_answer_generation.json new file mode 100644 index 000000000..87fe5471a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1364_hans_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a premise sentence. Your task is to write a new sentence by substituting the subject and object (i.e., the input's subject should be output's object and vice versa.). The generated sentence must be fluent and shouldn't change the voice (i.e., passive or active) of the input." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1366_healthfact_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1366_healthfact_classification.json new file mode 100644 index 000000000..ba768f1bb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1366_healthfact_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a paragraph and a claim, classify it this way: If the claim contradicts the evidence present in the paragraph, classify the claim as '0'. 
If the claim has multiple supporting *AND* contradicting evidences, classify the claim as '1'. If the claim has supporting evidence and the paragraph is in overall favor of the claim, then classify the claim as '2'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1368_healthfact_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1368_healthfact_sentence_generation.json new file mode 100644 index 000000000..0ac89c1db --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1368_healthfact_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a paragraph, generate a claim that is supported by the given paragraph. 1) The claim must contain information from within the paragraph. 2) A sentence within the paragraph can be used as a claim. 3) The claim should not have contradictions within the paragraph. 4) The claim should be at most one sentence long." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1369_healthfact_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1369_healthfact_sentence_generation.json new file mode 100644 index 000000000..9553df0b0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1369_healthfact_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Generate an explanation for the given claim using the provided supporting material from the paragraph. Please consider the following points while generating an output. 1) The claim will always have supporting proof in the paragraph, and the paragraph will have a clear point of view supporting the claim. 2) There can be instances where direct correlation to the claim is not available. Make use of the sentences in the paragraph to provide a corresponding output supporting the claim. 
3) The explanation should be at least one and at most twelve sentences long." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1378_quarel_correct_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1378_quarel_correct_answer_generation.json new file mode 100644 index 000000000..49445b493 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1378_quarel_correct_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a sentence, a question and two answer options ('A' and 'B'). Your task is to find the correct answer (return the string of the correct option, not 'A' or 'B') for the given question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1379_quarel_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1379_quarel_incorrect_answer_generation.json new file mode 100644 index 000000000..2a2431893 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1379_quarel_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a sentence, a question and two answer options ('A' and 'B'). Your task is to find the **incorrect** answer (return the string of the incorrect option, not A/B)." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task137_detoxifying_lms_classification_toxicity.json b/src/unitxt/catalog/instructions/natural_instructions/train/task137_detoxifying_lms_classification_toxicity.json new file mode 100644 index 000000000..3bee971c4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task137_detoxifying_lms_classification_toxicity.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a prompt and two completions from a language model, select the completion that is the least toxic with respect to continuing the prompt. Toxicity is defined as a rude, disrespectful, or unreasonable statement that is likely to make you leave a discussion. Generate either Completion A or Completion B." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1380_quarel_correct_option_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1380_quarel_correct_option_generation.json new file mode 100644 index 000000000..4a3dd7c31 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1380_quarel_correct_option_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a sentence, a question and two answer options ('A' and 'B'). Your task is to find the correct option for the given question. Write down the answer index: 'A' or 'B'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1381_quarel_incorrect_option_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1381_quarel_incorrect_option_generation.json new file mode 100644 index 000000000..b934b00e0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1381_quarel_incorrect_option_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a sentence, a question and two answer options. Your task is to write down the index ('A' or 'B') of the **incorrect** option for the given question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1382_quarel_write_correct_answer.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1382_quarel_write_correct_answer.json new file mode 100644 index 000000000..c18b3a011 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1382_quarel_write_correct_answer.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a sentence and a question. You're expected to write the correct answer based on the sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1383_quarel_write_incorrect_answer.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1383_quarel_write_incorrect_answer.json new file mode 100644 index 000000000..bdfef7e1e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1383_quarel_write_incorrect_answer.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a sentence and a question. You're expected to write an **incorrect** answer to the given question, such that it is relevant to the given sentence. Your answer should not be completely out of context. 
Try to write short answers with one or two words." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1384_deal_or_no_dialog_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1384_deal_or_no_dialog_classification.json new file mode 100644 index 000000000..69dc1a513 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1384_deal_or_no_dialog_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a negotiation between two participants, answer 'Yes' if both participants agree to the deal, otherwise answer 'No'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1389_hellaswag_completion.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1389_hellaswag_completion.json new file mode 100644 index 000000000..34bff290d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1389_hellaswag_completion.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a context and four options. Each option is a suggested ending for the context. You should read the context and pick the best ending for the context. Please answer with \"A\", \"B\", \"C\", and \"D\". 
" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task138_detoxifying_lms_classification_fluency.json b/src/unitxt/catalog/instructions/natural_instructions/train/task138_detoxifying_lms_classification_fluency.json new file mode 100644 index 000000000..6026dd634 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task138_detoxifying_lms_classification_fluency.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a prompt and two completions from a language model, select the completion that is the most fluent with respect to continuing the prompt. Fluency is defined by coherency and ease of understanding, not necessarily grammatical correctness. Generate either Completion A or Completion B." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1398_obqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1398_obqa_question_generation.json new file mode 100644 index 000000000..0ed8bb41c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1398_obqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a fact, create a question that can be answered using the fact. Construct the question such that it is unambiguous, has a unique answer and the answer can be given using the fact." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1399_obqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1399_obqa_answer_generation.json new file mode 100644 index 000000000..4bfb61802 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1399_obqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a fact statement and question based on the fact. Your task is to generate the correct answer for the question. The answer needs to be generated using the context fact statement." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task139_detoxifying_lms_classification_topicality.json b/src/unitxt/catalog/instructions/natural_instructions/train/task139_detoxifying_lms_classification_topicality.json new file mode 100644 index 000000000..f2bf1e275 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task139_detoxifying_lms_classification_topicality.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a prompt and two completions from a language model, select the completion that is more topical with respect to continuing the prompt. A prompt-completion pair is defined to be topical if the completion maintains relevance and logical succession (i.e. stays on topic) with the prompt. The flow from the prompt to the completion should be as reasonable as possible. Generate either Completion A or Completion B." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1400_obqa_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1400_obqa_incorrect_answer_generation.json new file mode 100644 index 000000000..6064f4ddf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1400_obqa_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task is about generating an incorrect answer to a question given the question and a true statement related to the question. The answer must be related to the question, but incorrectly answer it given the context." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1401_obqa_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1401_obqa_sentence_generation.json new file mode 100644 index 000000000..99df335dd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1401_obqa_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question and a corresponding answer. Your task is to generate a fact statement that is useful in answering the given question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1403_check_validity_date_mmddyyyy.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1403_check_validity_date_mmddyyyy.json new file mode 100644 index 000000000..f5e4ee306 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1403_check_validity_date_mmddyyyy.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a date in \"mm/dd/yyyy\" format. You need to check if the date is valid or not. Return 1 if it is valid, else return 0. 
A date is valid if the components month(\"mm\"), day(\"dd\") and year(\"yyyy\") are all valid individually. A day(dd) is valid if it is greater than or equal to 1 and less than 30 or 31 depending upon the month(mm). Months which have 31 days are January, March, May, July, August, October, December. Rest of the months have 30 days except February which has 28 days if it is not a leap year and 29 days if it is a leap year. A month(mm) is valid if it lies in the range from 1 to 12 as there are 12 months in a year. A year is always valid if it is expressed in the form of \"yyyy\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1404_date_conversion.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1404_date_conversion.json new file mode 100644 index 000000000..1e2629a2d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1404_date_conversion.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a date in a particular format and you need to convert to another format. If given format is \"dd/mm/yyyy\" then convert to \"mm/dd/yyyy\". If given format is \"mm/dd/yyyy\" then convert to \"dd/mm/yyyy\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1405_find_median.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1405_find_median.json new file mode 100644 index 000000000..b3d173973 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1405_find_median.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of integers. You need to find the median of the list of integers and return that as the output. The median is the middle value in the list of numbers such that half of the elements are less than the median and the other half of elements are greater than the median." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1406_kth_smallest_element.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1406_kth_smallest_element.json new file mode 100644 index 000000000..7c6707694 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1406_kth_smallest_element.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list of integers and an integer k. You need to find the kth smallest element in the input list and return that." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task140_detoxifying_lms_classification_style.json b/src/unitxt/catalog/instructions/natural_instructions/train/task140_detoxifying_lms_classification_style.json new file mode 100644 index 000000000..d8d35774c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task140_detoxifying_lms_classification_style.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a prompt and two completions from a language model, select the completion that has the most similar style to the prompt. Style is defined as the tone, word choice, grammar, and sentence structure throughout the prompt-completion pair. If a prompt is colloquial, then the completion should also be colloquial, as opposed to a completion that is encyclopedic or overly formal. Generate either Completion A or Completion B." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1412_web_questions_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1412_web_questions_question_answering.json new file mode 100644 index 000000000..af0eceac9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1412_web_questions_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "A question is presented to you in this task, and your job is to write a potentially correct answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1418_bless_semantic_relation_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1418_bless_semantic_relation_classification.json new file mode 100644 index 000000000..041f05262 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1418_bless_semantic_relation_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a pair of words, generate the relation between them. The first word is called the 'concept' and the second word is called the 'relatum'. The relation must be one of the following: co-hyponym (coordinate), hypernym, meronym, attribute, event, or random. A coordinate relation indicates that the concept and relatum belong to the same semantic class. A hypernym relation indicates that the relatum is a category of which the concept is a specific instance. A meronym relation implies that relatum is a part/component/organ/member of the concept. An attribute relation is when the relatum is an adjective expressing an attribute of the concept. An event relation holds when the relatum is a verb referring to an action/activity/happening/event that is performed by or with the concept. If the relatum and concept are unrelated, the relation between them is 'random'.
Classify your answers into coord, hyper, mero, attri, event, and random." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1419_mathqa_gain.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1419_mathqa_gain.json new file mode 100644 index 000000000..cfc3068ec --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1419_mathqa_gain.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to answer the given multiple-choice question on the gain. Gain is the value by which to multiply the input. Classify your answers into 'a', 'b', 'c', 'd', and 'e'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task141_odd_man_out_classification_category.json b/src/unitxt/catalog/instructions/natural_instructions/train/task141_odd_man_out_classification_category.json new file mode 100644 index 000000000..1731921e3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task141_odd_man_out_classification_category.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a category and a set of five words, find the word from the set that does not belong (i.e. is the least relevant) with the other words in the category. Words are separated by commas." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1420_mathqa_general.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1420_mathqa_general.json new file mode 100644 index 000000000..c4dd94136 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1420_mathqa_general.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to answer the given multiple-choice question on the general math. Classify your answers into 'a', 'b', 'c', 'd', and 'e'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1421_mathqa_other.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1421_mathqa_other.json new file mode 100644 index 000000000..3937fd9fe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1421_mathqa_other.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to provide the correct option for a given problem from the provided options." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1422_mathqa_physics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1422_mathqa_physics.json new file mode 100644 index 000000000..beb6a36f4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1422_mathqa_physics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to answer the given multiple-choice question on the physics. Classify your answers into 'a', 'b', 'c', 'd', and 'e'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1423_mathqa_geometry.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1423_mathqa_geometry.json new file mode 100644 index 000000000..e20257908 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1423_mathqa_geometry.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to answer the given multiple-choice question on geometry. Classify your answers into 'a', 'b', 'c', 'd', and 'e'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1424_mathqa_probability.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1424_mathqa_probability.json new file mode 100644 index 000000000..9b84c72f4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1424_mathqa_probability.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to provide the correct option for a given problem on probability from the provided options." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1425_country_iso_numeric.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1425_country_iso_numeric.json new file mode 100644 index 000000000..ebeda047c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1425_country_iso_numeric.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name, and you need to return the numeric International Organization for Standardization (ISO) code of the given country. The codes are three-digit numbers defined by the ISO to represent countries, dependent territories, and special areas of geographical interest." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1426_country_independence_year.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1426_country_independence_year.json new file mode 100644 index 000000000..ebf86dd2a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1426_country_independence_year.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name, and you need to return the year in which the country became independent. 
Independence is a nation's independence or statehood, usually after ceasing to be a group or part of another nation or state, or more rarely after the end of military occupation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1427_country_region_in_world.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1427_country_region_in_world.json new file mode 100644 index 000000000..84f13b793 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1427_country_region_in_world.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name and you need to return the region of the world map that the country is located in. The possible regions that are considered valid answers are: Caribbean, Southern Europe, Eastern Europe, Western Europe, South America, North America, Central America, Antarctica, Australia and New Zealand, Central Africa, Northern Africa, Eastern Africa, Western Africa, Southern Africa, Eastern Asia, Southern and Central Asia, Southeast Asia, Middle East, Melanesia, Polynesia, British Isles, Micronesia, Nordic Countries, Baltic Countries." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1428_country_surface_area.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1428_country_surface_area.json new file mode 100644 index 000000000..4c889df42 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1428_country_surface_area.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a country name, and you need to return the country's surface area in terms of square kilometers. Up to two decimal places are allowed in your answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1429_evalution_semantic_relation_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1429_evalution_semantic_relation_classification.json new file mode 100644 index 000000000..f6d21dc97 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1429_evalution_semantic_relation_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a pair of words, deduce the type of relationship between them. The various types of relations are: 'Entails, HasProperty, Synonym, Antonym, HasA, MemberOf, PartOf, MadeOf, IsA'. Let's denote the first word by X and the second word by Y. An 'IsA' relation holds when 'X is a kind of Y'. An 'Antonym' relation holds when 'X can be used as the opposite of Y'. A 'Synonym' relation applies when 'X can be used in place of Y, without changing the meaning'. A 'PartOf' relation holds when 'X is a part of Y'. A 'MemberOf' relation holds when 'X is a member of Y'. A 'MadeOf' relation holds when 'X is made of Y'. An 'Entailment' relation holds when 'If X is true, then Y is true as well'. A 'HasA' relation holds when 'X can have or contain Y'. A 'HasProperty' relation holds when 'Y is to specify X'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task142_odd_man_out_classification_no_category.json b/src/unitxt/catalog/instructions/natural_instructions/train/task142_odd_man_out_classification_no_category.json new file mode 100644 index 000000000..6580abc23 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task142_odd_man_out_classification_no_category.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a set of five words, generate the word from the set that does not belong (i.e. is the least relevant) with the other words. Words are separated by commas." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1431_head_qa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1431_head_qa_answer_generation.json new file mode 100644 index 000000000..ba0ec4a22 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1431_head_qa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a multiple-choice question about healthcare. Answer the question based on your information and classify your answers into '1', '2', '3', and '4'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1434_head_qa_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1434_head_qa_classification.json new file mode 100644 index 000000000..95ec59900 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1434_head_qa_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question and answer options for that question. Using this information, you have to classify each text into different topics: medicine, nursery, psychology, chemistry, pharmacology, biology." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task143_odd_man_out_classification_generate_category.json b/src/unitxt/catalog/instructions/natural_instructions/train/task143_odd_man_out_classification_generate_category.json new file mode 100644 index 000000000..7fd232941 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task143_odd_man_out_classification_generate_category.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a set of four words, generate the category that the words belong to. Words are separated by commas. 
The possible categories are social gathering, accomodation, physical property, measurement unit, corporate, nutritional value, boats, police punishment, location (proximity), card games, outdoor sport activity, military rank, baby animals, weather, consumer product, animals, boxing terminology, food, chocolate food, bird, type of sandwich, date status, body part, ocean, employment activity, moral characteristic, elements, poker, computers, construction, guitar part, shady activities, physical activity, kitchenware, temperature, type of rigidity, emotional status, season, mode of transportation, window material, activity, emotional display, geographical property, fried food, store status, widespread, aesthetic characteristic, alcoholic drinks, secretary duty, direction, personal characteristic, and animal." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1443_string_to_number.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1443_string_to_number.json new file mode 100644 index 000000000..95b0f40da --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1443_string_to_number.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a string that only contains single digit numbers spelled out. The input string will not contain spaces between the different numbers. Your task is to return the number that the string spells out. The string will spell out each digit of the number for example '1726' will be 'oneseventwosix' instead of 'one thousand seven hundred twenty-six'."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1444_round_power_of_two.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1444_round_power_of_two.json new file mode 100644 index 000000000..8b0d6b43b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1444_round_power_of_two.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. A list contains numbers separated by a comma. You need to round every integer to the closest power of 2. A power of 2 is a number in the form '2^n', it is a number that is the result of multiplying by 2 n times. The following are all powers of 2, '2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096'. If an integer is exactly equally far from two different powers of 2 then you should output the larger power of 2. The output should be a list of integers that is the result of rounding each integer in the input list to the closest power of 2. The output should include a '[' to denote the start of the output list and ']' to denote the end of the output list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1445_closest_integers.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1445_closest_integers.json new file mode 100644 index 000000000..87d3b031b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1445_closest_integers.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. You should find the minimum absolute difference between 2 integers in the list. The absolute difference is the absolute value of one integer subtracted by another. The output should be a single integer which is the smallest possible absolute distance."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1446_farthest_integers.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1446_farthest_integers.json new file mode 100644 index 000000000..99a088159 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1446_farthest_integers.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. You should find the maximum absolute difference between 2 integers in the list. The absolute difference is the absolute value of one integer subtracted by another. The output should be a single integer which is the largest possible absolute distance." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1447_drug_extraction_ade.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1447_drug_extraction_ade.json new file mode 100644 index 000000000..413651f79 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1447_drug_extraction_ade.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given sentences in which your task is to recognize the name of the drug or medicine. Drugs are substances that change a person's mental or physical state. They can affect how your brain works, how you feel and behave, your understanding, and your senses. Although there might be several correct answers, you need to write one of them." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1448_disease_entity_extraction_ncbi_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1448_disease_entity_extraction_ncbi_dataset.json new file mode 100644 index 000000000..67fbabbd2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1448_disease_entity_extraction_ncbi_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a sentence. You need to recognize the name of the disorder or disease. Disease is a disorder of structure or function in a human, animal, or plant, especially one that produces specific symptoms or that affects a specific location and is not simply a direct result of physical injury. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1449_disease_entity_extraction_bc5cdr_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1449_disease_entity_extraction_bc5cdr_dataset.json new file mode 100644 index 000000000..a7d0b3c10 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1449_disease_entity_extraction_bc5cdr_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a single sentence or a set of sentences. You have to recognize the name of the disorder or disease. Disease is a disorder of structure or function in a human, animal, or plant, especially one that produces specific symptoms or that affects a specific location and is not simply a direct result of physical injury. Although there might be several correct answers, you need to write one of them."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task144_subjqa_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task144_subjqa_question_answering.json new file mode 100644 index 000000000..1c805aee3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task144_subjqa_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a review about a book, an item, a place or a movie. After that, a question is given that you should answer using a certain span of the review. Your answer should be from the review itself and should not contain extra words, and should not be a combination of different spans. If there's no direct answer to the question, answer with a part of the text that is the most relevant to the question. See the examples for clarification." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1451_drug_dose_extraction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1451_drug_dose_extraction.json new file mode 100644 index 000000000..39544d37c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1451_drug_dose_extraction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given sentences and a drug name in which your task is to indicate the doses of intake of that particular drug. A dose refers to a specified amount of medication taken at one time. Although there might be several correct answers, you need to write one of them." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1452_location_entity_extraction_btc_corpus.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1452_location_entity_extraction_btc_corpus.json new file mode 100644 index 000000000..a575f43d1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1452_location_entity_extraction_btc_corpus.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given sentences in which your task is to recognize the name of the location or place. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1453_person_entity_extraction_btc_corpus.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1453_person_entity_extraction_btc_corpus.json new file mode 100644 index 000000000..d4b1ec793 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1453_person_entity_extraction_btc_corpus.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given sentences in which your task is to recognize the name of a person. Note that Twitter names shouldn't be considered as people's names. Although there might be several correct answers, you need to write one of them." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task145_afs_argument_similarity_death_penalty.json b/src/unitxt/catalog/instructions/natural_instructions/train/task145_afs_argument_similarity_death_penalty.json new file mode 100644 index 000000000..289a92d8b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task145_afs_argument_similarity_death_penalty.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "We would like you to classify each of the following sets of argument pairs (discussing Death Penalty) into either SIMILAR or NOT SIMILAR. A pair of arguments is considered SIMILAR if the arguments are about the same FACET (making the same argument), and is considered NOT SIMILAR if they do not have the same FACET. A FACET is a low level issue that often reoccurs in many arguments in support of the author's stance or in attacking the other author's position." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task146_afs_argument_similarity_gun_control.json b/src/unitxt/catalog/instructions/natural_instructions/train/task146_afs_argument_similarity_gun_control.json new file mode 100644 index 000000000..a6e50ba97 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task146_afs_argument_similarity_gun_control.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "We would like you to classify each of the following sets of argument pairs (discussing Gun Control) into either SIMILAR or NOT SIMILAR. A pair of arguments is considered SIMILAR if the arguments are about the same FACET (making the same argument), and is considered NOT SIMILAR if they do not have the same FACET. A FACET is a low level issue that often reoccurs in many arguments in support of the author's stance or in attacking the other author's position." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1479_organization_entity_extraction_btc_corpus.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1479_organization_entity_extraction_btc_corpus.json new file mode 100644 index 000000000..f87d20e41 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1479_organization_entity_extraction_btc_corpus.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You are expected to recognize the name of company or organization. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task147_afs_argument_similarity_gay_marriage.json b/src/unitxt/catalog/instructions/natural_instructions/train/task147_afs_argument_similarity_gay_marriage.json new file mode 100644 index 000000000..0363c2f23 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task147_afs_argument_similarity_gay_marriage.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "We would like you to classify each of the following sets of argument pairs (discussing Gay Marriage) into either SIMILAR or NOT SIMILAR. A pair of arguments is considered SIMILAR if the arguments are about the same FACET (making the same argument), and is considered NOT SIMILAR if they do not have the same FACET. A FACET is a low level issue that often reoccurs in many arguments in support of the author's stance or in attacking the other author's position." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1480_gene_extraction_jnlpba_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1480_gene_extraction_jnlpba_dataset.json new file mode 100644 index 000000000..a78b876e4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1480_gene_extraction_jnlpba_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You are expected to recognize the name of gene or protein. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1481_gene_extraction_bc2gm_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1481_gene_extraction_bc2gm_dataset.json new file mode 100644 index 000000000..a78b876e4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1481_gene_extraction_bc2gm_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You are expected to recognize the name of gene or protein. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1482_gene_extraction_chemprot_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1482_gene_extraction_chemprot_dataset.json new file mode 100644 index 000000000..a78b876e4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1482_gene_extraction_chemprot_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You are expected to recognize the name of gene or protein. 
Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1483_chemical_extraction_chemprot_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1483_chemical_extraction_chemprot_dataset.json new file mode 100644 index 000000000..ed6aacdbd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1483_chemical_extraction_chemprot_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You are expected to recognize the name of any form of chemical substances. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1484_gene_extraction_linnaeus_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1484_gene_extraction_linnaeus_dataset.json new file mode 100644 index 000000000..a78b876e4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1484_gene_extraction_linnaeus_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You are expected to recognize the name of gene or protein. Although there might be several correct answers, you need to write one of them." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1485_organ_extraction_anem_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1485_organ_extraction_anem_dataset.json new file mode 100644 index 000000000..3d6c52ccb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1485_organ_extraction_anem_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given sentences in which your task is to recognize the name of the organ of the body. An organ is a collection of tissues that structurally form a functional unit specialized to perform a particular function. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1486_cell_extraction_anem_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1486_cell_extraction_anem_dataset.json new file mode 100644 index 000000000..a84c669d3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1486_cell_extraction_anem_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given sentences in which you have to recognize the name of the body cells. A cell is a mass of cytoplasm that is bound externally by a cell membrane. Usually microscopic in size, cells are the smallest structural units of living matter and compose all living things. Although there might be several correct answers, you need to write one of them." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1487_organism_substance_extraction_anem_dataset.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1487_organism_substance_extraction_anem_dataset.json new file mode 100644 index 000000000..a55629c82 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1487_organism_substance_extraction_anem_dataset.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You are expected to write the name of the organism substances in the body mentioned in the input. Although there might be several correct answers, you need to write one of them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1488_sarcasmdetection_headline_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1488_sarcasmdetection_headline_classification.json new file mode 100644 index 000000000..29ff36893 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1488_sarcasmdetection_headline_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a news headline in English. You are expected to classify the post into two classes: sarcastic or non-sarcastic. A sarcastic sentence is one that refers to the use of words that mean the opposite of what you really want to say, especially in order to insult someone, or to show irritation, or just to be funny." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1489_sarcasmdetection_tweet_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1489_sarcasmdetection_tweet_classification.json new file mode 100644 index 000000000..d4b1b52ef --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1489_sarcasmdetection_tweet_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a tweet in English. You are expected to classify the post into two classes: sarcastic or non-sarcastic. A sarcastic sentence is one that refers to the use of words that mean the opposite of what you really want to say, especially in order to insult someone, or to show irritation, or just to be funny." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task148_afs_argument_quality_gay_marriage.json b/src/unitxt/catalog/instructions/natural_instructions/train/task148_afs_argument_quality_gay_marriage.json new file mode 100644 index 000000000..6231adaf7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task148_afs_argument_quality_gay_marriage.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "We would like you to assess the QUALITY of each of the following argument (discussing Gay Marriage) and determine if the argument is Valid or Invalid. A valid argument is clearly interpretable and either expresses an argument, or a premise or a conclusion that can be used in an argument for the topic of gay marriage. An invalid argument is a phrase that cannot be interpreted as an argument or not on the topic of gay marriage." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1495_adverse_drug_event_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1495_adverse_drug_event_classification.json new file mode 100644 index 000000000..62c2845fb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1495_adverse_drug_event_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Adverse drug reactions are appreciably harmful or unpleasant reactions resulting from an intervention related to the use of medical products, which predicts hazard from future administration and warrants prevention or specific treatment, or alteration of the dosage regimen, or withdrawal of the product. Given medical case reports extracted from MEDLINE, the task is to classify whether the case report mentions the presence of any adverse drug reaction. Classify your answers into non-adverse drug event and adverse drug event." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1498_24hour_to_12hour_clock.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1498_24hour_to_12hour_clock.json new file mode 100644 index 000000000..507f21e1f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1498_24hour_to_12hour_clock.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a time in 24-Hours format, and you need to convert it to time in the 12-Hours format. For a 24-Hours format time larger than 12:00, subtract 12 hours from the given time, then add 'PM'. For example, if you have 14:30 hours, subtract 12 hours, and the result is 2:30 PM. If the 24-Hours format time is less than or equal to 12:00, add 'AM'. For example, say you have 10:15 hours, add the 'AM' to the end, here we get 10:15 AM. 
Note that 00:00 Hrs in 24-Hours format is 12:00 AM in 12-Hours format and 12:00 Hrs in 24-Hours format would be 12:00 PM in 12-Hours format." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1499_dstc3_summarization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1499_dstc3_summarization.json new file mode 100644 index 000000000..798af6377 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1499_dstc3_summarization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a conversation between an automated system and a user looking for suggestions for pubs, restaurants and coffee shops in Cambridge. In the dialogue, the user may provide some criteria for the type of place they want such as price range, cuisine, etc. Similarly, the user may ask details of the place suggested by the system such as phone number, address, etc. Given such a dialogue, output a summary of the dialogue stating the criteria provided and details sought by the user in this dialogue. The summary should strictly be in second person point of view. The summary should not contain any information that was not present in the conversation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task149_afs_argument_quality_death_penalty.json b/src/unitxt/catalog/instructions/natural_instructions/train/task149_afs_argument_quality_death_penalty.json new file mode 100644 index 000000000..da66f6d89 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task149_afs_argument_quality_death_penalty.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "We would like you to assess the QUALITY of each of the following argument (discussing Death Penalty) and determine if the argument is Valid or Invalid.
A valid argument is clearly interpretable and either expresses an argument, or a premise or a conclusion that can be used in an argument for the topic of death penalty. An invalid argument is a phrase that cannot be interpreted as an argument or not on the topic of death penalty." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1500_dstc3_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1500_dstc3_classification.json new file mode 100644 index 000000000..b311741d3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1500_dstc3_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a conversation between an automated system and a user looking for suggestions for pubs, restaurants and coffee shops in Cambridge. In the dialogue, the user may provide some criteria for the type of place they want such as price range, cuisine, etc. Given such a dialogue, output the price range the user is looking for which can take one of four values: Cheap, Moderate, Expensive and Don't Care. Output cannot be any other value than the four values. Note that if the user asks for the prices of items provided at a pub, restaurant or coffee shop but doesn't mention the price range they are looking for then the correct classification will be Don't Care. If the user does not mention a particular price, the correct classification will be Don't Care."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1501_dstc3_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1501_dstc3_answer_generation.json new file mode 100644 index 000000000..3b75dee87 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1501_dstc3_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a conversation between an automated system and a user, followed by a question. The user is looking for suggestions for pubs, restaurants and coffee shops in Cambridge. In the dialogue, the user may provide some criteria for the type of place they want such as price range, cuisine, etc. Similarly, the user may ask details of the place suggested by the system such as phone number, address, etc. The answer of the question has to be a Yes or a No. Given such a dialogue, answer the given question based on the information present in the dialogue." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1502_hatexplain_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1502_hatexplain_classification.json new file mode 100644 index 000000000..fd22f8c2f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1502_hatexplain_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a tweet which can be classified as Hate Speech, Offensive or Normal. Given such a tweet, output the class the tweet belongs to. Hate Speech will contain threatening language towards the community targeted. Offensive language will contain abusive or discriminatory language towards the community targeted." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1503_hatexplain_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1503_hatexplain_classification.json new file mode 100644 index 000000000..dc50f64b4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1503_hatexplain_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a tweet which can be Hate Speech, Offensive or Normal tweet. Hate Speech and Offensive tweets target one community. Given such a tweet, output the community targeted in the tweet. The community will be one of the nine values: 'African', 'Islam', 'Jewish', 'Women', 'Refugee', 'Arab', 'Caucasian', 'Hispanic' or 'Asian'. Output 'None' if the tweet does not target any community. A tweet targets only one community." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1504_hatexplain_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1504_hatexplain_answer_generation.json new file mode 100644 index 000000000..9d4b198ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1504_hatexplain_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is a tweet which can be Hate Speech or Offensive. Given such a tweet, output a phrase from the tweet that makes it hate speech or offensive. The output should contain only one such phrase. The output has to be from within the tweet itself. Do not generate words or phrases not present in the tweet." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1505_root09_semantic_relation_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1505_root09_semantic_relation_classification.json new file mode 100644 index 000000000..c366dadea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1505_root09_semantic_relation_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a pair of words, deduce the type of relationship between them. The various types of relations are: 'HYPER', 'COORD' and 'RANDOM'. Let's denote the first word by X and the second word by Y. A COORD relationship holds when X and Y belong to the same semantic class. A HYPER relationship applies when X is a specific instance of Y. If neither COORD nor HYPER are applicable then the relationship is RANDOM." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1506_celebrity_minimal_dob_span.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1506_celebrity_minimal_dob_span.json new file mode 100644 index 000000000..cc4cd570b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1506_celebrity_minimal_dob_span.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a short bio of a person, find the minimal text span containing the date of birth of the person. The output must be the minimal text span that contains the birth date, month and year as long as they are present. For instance, given a bio like 'I was born on 27th of December 1990, and graduated high school on 23rd October 2008.' the output should be '27th of December 1990'."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1507_boolean_temporal_reasoning.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1507_boolean_temporal_reasoning.json new file mode 100644 index 000000000..cf9ab15e6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1507_boolean_temporal_reasoning.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a statement about date and time, state whether the statement is true or false. The number of date/time operands in the statement ranges between 2 and 3. Let's say the values are denoted by t1, t2 and t3. The statements follow one of the following ten templates: 't1 occurs before t2, t1 doesn't occur before t2, t1 occurs after t2, t1 doesn't occur after t2, t1 occurs between t2 and t3, t1 doesn't occur between t2 and t3, t1 occured before t2 but after t3, t1 occured after t2 but before t3, t1 didn't occur before t2 but after t3, t1 didn't occur after t2 but before t3'. The output should be either 'True' or 'False'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1508_wordnet_antonyms.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1508_wordnet_antonyms.json new file mode 100644 index 000000000..b0342d9ef --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1508_wordnet_antonyms.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given an adjective, generate its antonym. An antonym of a word is a word opposite in meaning to it." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1509_evalution_antonyms.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1509_evalution_antonyms.json new file mode 100644 index 000000000..008d56325 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1509_evalution_antonyms.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an adjective, and your job is to generate its antonym. An antonym of a word is a word opposite in meaning to it." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task150_afs_argument_quality_gun_control.json b/src/unitxt/catalog/instructions/natural_instructions/train/task150_afs_argument_quality_gun_control.json new file mode 100644 index 000000000..83518e906 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task150_afs_argument_quality_gun_control.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "We would like you to assess the QUALITY of each of the following argument (discussing Gun Control) and determine if the argument is Valid or Invalid. A valid argument is clearly interpretable and either expresses an argument, or a premise or a conclusion that can be used in an argument for the topic of gun control. An invalid argument is a phrase that cannot be interpreted as an argument or not on the topic of gun control." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1510_evalution_relation_extraction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1510_evalution_relation_extraction.json new file mode 100644 index 000000000..fc05a71bd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1510_evalution_relation_extraction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a phrase describing the relationship between two words, extract the words and the lexical relationship between them. The relation has to be of the type 'MemberOf', 'MadeOf', 'Synonym', 'Entails', 'HasA', 'HasProperty', 'PartOf', 'Antonym' or 'IsA'. The output should have the format: word1 relation word2." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1517_limit_classfication.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1517_limit_classfication.json new file mode 100644 index 000000000..de820dd3c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1517_limit_classfication.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and your task is to identify whether the sentence contains motion or not, by classifying the sentence into Yes or No. The sentence belongs to the 'Yes' category if there is an occurrence of a motion of a physical entity otherwise the sentence belongs to the 'No' category. The sentence contains motion if it (i) involves the movement of a physical object. (ii) contains verb in present tense indicating the action performed. 
Sometimes there can be verb which indicates a motion but the motion might have happened in the past and the answers to such sentences is 'No'" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1518_limit_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1518_limit_answer_generation.json new file mode 100644 index 000000000..90f6e6083 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1518_limit_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence which contains a motion and your task is to identify the physical entities involved in the motion. The input sentence can have more than one entity and also there is at least one entity that takes part in physical motion. There are two types of entities which are animate (beings that are alive) and inanimate entities (beings that are not alive)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1519_qa_srl_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1519_qa_srl_question_generation.json new file mode 100644 index 000000000..686ac79a2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1519_qa_srl_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and a verb from the sentence. Your task is to generate a set of wh-questions starting with who, what, when, where, why, how, how much. The generated questions must contain the verb and the answers to these questions are phrases in the input sentence. The answer to the questions is associated with a specific semantic role. The answer to these questions is associated with a specific semantic role. 
The questions must use pronouns instead of direct nouns that could be used to refer to various roles present in the sentence. Construct a question in such a way that (i) it is unambiguous, (ii) its answer is unique (iii) its answer is a continuous text span from the paragraph." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task151_tomqa_find_location_easy_clean.json b/src/unitxt/catalog/instructions/natural_instructions/train/task151_tomqa_find_location_easy_clean.json new file mode 100644 index 000000000..8cfaca024 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task151_tomqa_find_location_easy_clean.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a story, answer the question about the story. The question is the last sentence in the input. The story has one of the three following scenarios: (1) when the individual's belief matches reality, (2) when the individual's belief does not match reality, (3) is when an individual has a false belief about another individual's beliefs. The question will ask about the location of an object in the story with respect to either none or one of the three scenarios." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1520_qa_srl_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1520_qa_srl_answer_generation.json new file mode 100644 index 000000000..8e0014bd3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1520_qa_srl_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and question which can be answered using the sentence. Your task is to answer the question using the information from the sentence. The answer to the question is unique and it is a continuous text span from the sentence." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task152_tomqa_find_location_easy_noise.json b/src/unitxt/catalog/instructions/natural_instructions/train/task152_tomqa_find_location_easy_noise.json new file mode 100644 index 000000000..c7c5a86a6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task152_tomqa_find_location_easy_noise.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a story, answer the question about the story. The question is the last sentence in the input. The story has one of the three following scenarios: the first is when the individual's belief matches reality, the second is when the individual's belief does not match reality, and the third is when an individual has a false belief about another individual's beliefs. The question will ask about the location of an object in the story with respect to either none or one of the three scenarios. Note that there are distractor sentences in each story that are unrelated to the question and are designed to confuse the reader." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task153_tomqa_find_location_hard_clean.json b/src/unitxt/catalog/instructions/natural_instructions/train/task153_tomqa_find_location_hard_clean.json new file mode 100644 index 000000000..44a8b3d7b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task153_tomqa_find_location_hard_clean.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a story, answer the question about the story. The question is the last sentence in the input. 
These stories can be difficult due to their length and how each story has at least one of the three following scenarios: the first is when the individual's belief matches reality, the second is when the individual's belief does not match reality, and the third is when an individual has a false belief about another individual's beliefs. The question will ask about the location of an object in the story with respect to either none or one of the three scenarios." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1541_agnews_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1541_agnews_classification.json new file mode 100644 index 000000000..ed1379252 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1541_agnews_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a short article. Your job is to classify the article based on its category. Use the following classification labels, 0. World, 1. Sports, 2. Business, 3. Science or Technical. Label the text \"0\" if it contains information related to world. Label the text \"1\" if it contains information related to sports. Label the text \"2\" if it contains information related business. Label the text \"3\" if it contains science or technical related information. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1542_every_ith_element_from_starting.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1542_every_ith_element_from_starting.json new file mode 100644 index 000000000..62dd8574d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1542_every_ith_element_from_starting.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input i,A where i is an integer and A is an array. 
You need to find every ith element of A starting with the 1st element." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1548_wiqa_binary_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1548_wiqa_binary_classification.json new file mode 100644 index 000000000..2ceb403d5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1548_wiqa_binary_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You need to answer the question 'Are the given steps in order?', given a set of steps describing a process. Your answer must be either Yes or No. If the answer is No, that means the steps are out of order and do not make sense in the order they are in. If the answer is Yes, that means the steps are in order and make sense in the order that they are in. A set of steps are not in order if the steps reference information that is introduced in a later step" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1549_wiqa_answer_generation_missing_step.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1549_wiqa_answer_generation_missing_step.json new file mode 100644 index 000000000..50160eb7b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1549_wiqa_answer_generation_missing_step.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a list of steps and an additional step, determine where the step fits into the original list of steps. A correct answer, correctly places the given step into the set of steps so that it creates a new plausible set of steps. Output must be formatted as 'After step n', where n is the step number after which the given additional step is to be inserted." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task154_tomqa_find_location_hard_noise.json b/src/unitxt/catalog/instructions/natural_instructions/train/task154_tomqa_find_location_hard_noise.json new file mode 100644 index 000000000..10ea01b60 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task154_tomqa_find_location_hard_noise.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a story, answer the question about the story. The question is the last sentence in the input. These stories can be difficult due to their length and how each story has at least one of the three following scenarios: the first is when the individual's belief matches reality, the second is when the individual's belief does not match reality, and the third is when an individual has a false belief about another individual's beliefs. The question will ask about the location of an object in the story with respect to either none or one of the three scenarios. Note that there are distractor sentences in each story that are unrelated to the question and are designed to confuse the reader." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1551_every_ith_element_from_kth_element.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1551_every_ith_element_from_kth_element.json new file mode 100644 index 000000000..ad4437d38 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1551_every_ith_element_from_kth_element.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs k, i, and A, where k and i are integers and A is a list. You need to find every ith element of A starting from the kth element. The process stops when the position of the next ith element exceeds the length of the list." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1553_cnn_dailymail_summarization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1553_cnn_dailymail_summarization.json new file mode 100644 index 000000000..e06acf4e2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1553_cnn_dailymail_summarization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given news articles and you need to generate a highlight, i.e., a short summary, with a maximum length of 10 lines." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1559_blimp_binary_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1559_blimp_binary_classification.json new file mode 100644 index 000000000..d3b18902c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1559_blimp_binary_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown an English sentence. You need to classify the sentence as either a representation of an adjunct island or as an incorrect representation. A correct representation should be denoted as 'good' while everything else should be denoted as 'bad'. A correct representation of an adjunct island will be a grammatically correct instance of a sentence using an adjunct island. An incorrect representation will be everything else." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task155_count_nouns_verbs.json b/src/unitxt/catalog/instructions/natural_instructions/train/task155_count_nouns_verbs.json new file mode 100644 index 000000000..0b9d90f9d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task155_count_nouns_verbs.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to count the number of nouns/verbs in the given sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1560_blimp_binary_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1560_blimp_binary_classification.json new file mode 100644 index 000000000..41fc29e22 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1560_blimp_binary_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown an English sentence. You need to classify the sentence as either a representation of an anaphor number agreement or as an incorrect representation. An anaphor is an expression whose interpretation depends upon another expression. Anaphor number agreement is a restriction where a phrase agrees with the preceding expression: plurals match plurals or singular expressions match singular expressions. In this task a valid representation of anaphor number agreement should be denoted as 'good' while everything else should be denoted as 'bad'. A correct representation of an anaphor number agreement will be a grammatically correct instance of a sentence where the subject and self-referencing nouns match plurality. An incorrect representation is a sentence in which the subject and self-referencing noun's plurality do not match."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1564_triviaqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1564_triviaqa_answer_generation.json new file mode 100644 index 000000000..fd7f16561 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1564_triviaqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a question. You need to generate an answer to the question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1565_triviaqa_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1565_triviaqa_classification.json new file mode 100644 index 000000000..dc5f3c779 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1565_triviaqa_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task involves asking a question, providing a set of 2 options. You are expected to choose the best answer to the question. The output will be in the form of A or B, corresponding to which option is chosen." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1566_propara_structured_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1566_propara_structured_text_generation.json new file mode 100644 index 000000000..df3f7c776 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1566_propara_structured_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a paragraph, and your job is to generate comma-separated entities present in the given paragraph. 
Generate entities from a given passage in such a way that (i) they are present in the paragraph, (ii) they are non-duplicate, (iii) they underwent a state change during the process. Avoid creating entities that (i) aren't present in the process paragraph and (ii) aren't significant. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1567_propara_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1567_propara_question_generation.json new file mode 100644 index 000000000..5ebd07d43 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1567_propara_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a paragraph, and your task is to construct a question from the given passage. Construct question in such a way that (i) it is well explained in the paragraph, (ii) the words may/may not be present in the paragraph, (iii) it should start with what/how/describe. Avoid creating a question that (i) is just relevant to one or two sentences, and (ii) not relevant to passage. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1568_propara_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1568_propara_classification.json new file mode 100644 index 000000000..500ace915 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1568_propara_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a paragraph, event and an entity. The event is part of the given paragraph and it changes the state of the entity. Your task is to classify the state of the entity into three classes: 1) not exist, 2) unknown location and 3) known location. \"not exist\" means the entity doesn't exist in that state anymore. 
\"unknown location\" means the entity exists in that state but location is unknown. \"known location\" means the entity exists and location is known. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task156_codah_classification_adversarial.json b/src/unitxt/catalog/instructions/natural_instructions/train/task156_codah_classification_adversarial.json new file mode 100644 index 000000000..c8ddb209c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task156_codah_classification_adversarial.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a prompt and four completions, select the completion that is the most plausible in continuing or answering the prompt. This task is designed to test common sense and has various categories ranging between idioms, negated statements, polysemy, subject referencing, and quantitative reasoning. Generate either Completion A, Completion B, Completion C, or Completion D." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1572_samsum_summary.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1572_samsum_summary.json new file mode 100644 index 000000000..94a7eae62 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1572_samsum_summary.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a conversation, and your task is to generate a summary from the information present in the given conversation. Generate a summary in such a way that the context should be present in the conversation. It should cover the complete context of the conversation. 
" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1573_samsum_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1573_samsum_classification.json new file mode 100644 index 000000000..ba4272e5a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1573_samsum_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two sentences taken from a conversation, and your job is to classify whether these given sentences are sequential or not. We will mark the given sentence pair as 'True' if it's sequential, otherwise 'False'. The two sentences are spoken by two different people. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task157_count_vowels_and_consonants.json b/src/unitxt/catalog/instructions/natural_instructions/train/task157_count_vowels_and_consonants.json new file mode 100644 index 000000000..1e968f709 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task157_count_vowels_and_consonants.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to count the number of vowels (letters 'a', 'e', 'i', 'o', 'u') / consonants (all letters other than vowels) in the given sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1580_eqasc_perturbed_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1580_eqasc_perturbed_question_generation.json new file mode 100644 index 000000000..cb84c9391 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1580_eqasc_perturbed_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a statement, generate a question such that the answer is contained in that statement." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1581_eqasc_perturbed_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1581_eqasc_perturbed_answer_generation.json new file mode 100644 index 000000000..0625796d5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1581_eqasc_perturbed_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a statement and question, generate the answer to the question such that the answer is contained in the statement." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1582_bless_hypernym_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1582_bless_hypernym_generation.json new file mode 100644 index 000000000..01a1ecc17 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1582_bless_hypernym_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a concept word, generate a hypernym for it. A hypernym is a superordinate, i.e., a word with a broad meaning constituting a category, that generalizes another word. For example, color is a hypernym of red. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1583_bless_meronym_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1583_bless_meronym_classification.json new file mode 100644 index 000000000..489c65add --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1583_bless_meronym_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given an object and a part, decide whether the object has that part. 
For example if you are asked 'gun has barrel?', you need to decide if a gun has a barrel as one of its components or parts, indicating 1 or 0 as your answer respectively. All sentences strictly follow the template 'object has part?.'" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1584_evalution_meronym_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1584_evalution_meronym_classification.json new file mode 100644 index 000000000..374fc28d1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1584_evalution_meronym_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given an object and a part, decide whether the object has that part. For example if you are asked 'gun has barrel', you need to decide if a gun has a barrel as one of its components or parts. All sentences strictly follow the template 'object has part?.' The answer should be 1 or 0, 1 means the object has the given part, while 0 means it doesn't have the part." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1585_root09_hypernym_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1585_root09_hypernym_generation.json new file mode 100644 index 000000000..16f5bb4d1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1585_root09_hypernym_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a concept word, generate a hypernym for it. A hypernym is a superordinate, i.e. a word with a broad meaning constituting a category, that generalizes another word. For example, color is a hypernym of red."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task158_count_frequency_of_words.json b/src/unitxt/catalog/instructions/natural_instructions/train/task158_count_frequency_of_words.json new file mode 100644 index 000000000..8150fa48d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task158_count_frequency_of_words.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to count the occurrences of the given word in the given sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1590_diplomacy_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1590_diplomacy_text_generation.json new file mode 100644 index 000000000..28da6a636 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1590_diplomacy_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given first 5 messages from a series of message exchanges between 2 persons playing the game of Diplomacy which is an American strategic board game. You need to generate the next message. The message should be generated such that it fits the context seen so far. Avoid the text that is (i) tangent to the context, (ii) repeats the context." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1592_yahoo_answers_topics_classfication.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1592_yahoo_answers_topics_classfication.json new file mode 100644 index 000000000..9cfa3e4c3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1592_yahoo_answers_topics_classfication.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question title. 
You need to classify it into one of the 10 topics: 0 - 'Society & Culture', 1 - 'Science & Mathematics', 2 - 'Health', 3 - 'Education & Reference', 4 - 'Computers & Internet', 5 - 'Sports', 6 - 'Business & Finance', 7 - 'Entertainment & Music', 8 - 'Family & Relationships', 9 - 'Politics & Government'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1593_yahoo_answers_topics_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1593_yahoo_answers_topics_classification.json new file mode 100644 index 000000000..bd4c71bbf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1593_yahoo_answers_topics_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a passage. Using the information present in the passage, you need to classify it into one of the 10 topics: 0 - 'Society & Culture', 1 - 'Science & Mathematics', 2 - 'Health', 3 - 'Education & Reference', 4 - 'Computers & Internet', 5 - 'Sports', 6 - 'Business & Finance', 7 - 'Entertainment & Music', 8 - 'Family & Relationships', 9 - 'Politics & Government'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1594_yahoo_answers_topics_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1594_yahoo_answers_topics_question_generation.json new file mode 100644 index 000000000..40fb18e80 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1594_yahoo_answers_topics_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a passage. You need to construct a question about the information present in the passage. Construct a question in such a way that (i) it is unambiguous, (ii) its answer is the whole paragraph. 
Avoid creating questions that can be answered correctly without actually understanding the paragraph." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1595_event2mind_text_generation_1.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1595_event2mind_text_generation_1.json new file mode 100644 index 000000000..d03d2db9b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1595_event2mind_text_generation_1.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is to generate text based off of an event. For the given event, there will be a person who does the action in the event (usually PersonX). Your task is to write that person's emotional reaction to the event, i.e. how that person feels after doing the action." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1596_event2mind_text_generation_2.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1596_event2mind_text_generation_2.json new file mode 100644 index 000000000..36414e86c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1596_event2mind_text_generation_2.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is to generate text based off of an event. For the given event, there will be a person who does the action in the event (usually PersonX). Your task is to write that person's intent behind doing the event, i.e. why did the person do that action."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1599_smcalflow_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1599_smcalflow_classification.json new file mode 100644 index 000000000..953f00884 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1599_smcalflow_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an utterance, which is a part of a conversation between a user and an agent. Your job is to detect the speaker. The user usually commands the agent to schedule events, retrieve event information, and check the schedule. While the agent's response is an answer to the user's questions or follow-up questions on the user's command. Answer with \"User\" or \"Agent\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task159_check_frequency_of_words_in_sentence_pair.json b/src/unitxt/catalog/instructions/natural_instructions/train/task159_check_frequency_of_words_in_sentence_pair.json new file mode 100644 index 000000000..133579071 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task159_check_frequency_of_words_in_sentence_pair.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, answer 'Yes' if the frequency of the given word in the two sentences is equal, else answer 'No'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1600_smcalflow_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1600_smcalflow_sentence_generation.json new file mode 100644 index 000000000..16e606a00 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1600_smcalflow_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you have given an input which is agent's reply, based on that you have to identify what will be users' command for that reply. The user generally asks a question related to event scheduling or information of the scheduled events. Agent reply based on the available information or do the task as per user command." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1601_webquestions_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1601_webquestions_answer_generation.json new file mode 100644 index 000000000..a59a10e73 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1601_webquestions_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Based on the given question and topic, give an answer. The answer is available on the internet. The questions are mostly centered around a single named entity."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1602_webquestion_question_genreation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1602_webquestion_question_genreation.json new file mode 100644 index 000000000..e24843b37 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1602_webquestion_question_genreation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a concept, and a list of answers. You should generate a question about the concept that leads to the given answer(s)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1603_smcalflow_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1603_smcalflow_sentence_generation.json new file mode 100644 index 000000000..44616409c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1603_smcalflow_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you have given an input which is user's command or question, based on that you have to return what will be Agent's response/reply for that particular user's command or question" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1604_ethos_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1604_ethos_text_classification.json new file mode 100644 index 000000000..6e0dfc7aa --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1604_ethos_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a comment, classify it into a 'hate' speech or 'not hate' speech. Answer using 'hate' or 'not hate'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1605_ethos_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1605_ethos_text_classification.json new file mode 100644 index 000000000..503a1e840 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1605_ethos_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you should classify the given text as 'violence' if there is inhumanity associated with it. Otherwise, classify it as 'not violence'. Mentioning killing people, or hurting them in any way is considered violent." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1606_ethos_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1606_ethos_text_classification.json new file mode 100644 index 000000000..f89cd4f47 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1606_ethos_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a piece of text. You should find out if there are any gender specific criticized comments. Label the text as 'gender criticism' or 'not gender criticism'" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1607_ethos_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1607_ethos_text_classification.json new file mode 100644 index 000000000..8b49f5f16 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1607_ethos_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a piece of text. Your task is to classify the text based on whether a religion or a person/group of people are receiving hate based on religion. 
If there is a hate based on religion in the text, answer with 'religious hate', otherwise, answer with 'not religious hate'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1608_xquad_en_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1608_xquad_en_answer_generation.json new file mode 100644 index 000000000..0da5538d1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1608_xquad_en_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Answer the question from the given passage. Your answer should be directly extracted from the passage, and it should be a single entity, name, or number, not a sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1609_xquad_en_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1609_xquad_en_question_generation.json new file mode 100644 index 000000000..7f0a4e758 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1609_xquad_en_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a paragraph, your job is to generate a question that can be answered from the passage. The answer to your question should be a single entity, person, time, etc. that can be extracted from the passage." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task160_replace_letter_in_a_sentence.json b/src/unitxt/catalog/instructions/natural_instructions/train/task160_replace_letter_in_a_sentence.json new file mode 100644 index 000000000..c97bc8ce1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task160_replace_letter_in_a_sentence.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to replace a letter in the sentence with another given letter." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task161_count_words_containing_letter.json b/src/unitxt/catalog/instructions/natural_instructions/train/task161_count_words_containing_letter.json new file mode 100644 index 000000000..e17b2b3f7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task161_count_words_containing_letter.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to count the number of words in a sentence that contain the given letter" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task162_count_words_starting_with_letter.json b/src/unitxt/catalog/instructions/natural_instructions/train/task162_count_words_starting_with_letter.json new file mode 100644 index 000000000..87df1bb9b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task162_count_words_starting_with_letter.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to count the number of words in a sentence that start with the given letter. Answer with numbers and not words." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task163_count_words_ending_with_letter.json b/src/unitxt/catalog/instructions/natural_instructions/train/task163_count_words_ending_with_letter.json new file mode 100644 index 000000000..20ff1d3c2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task163_count_words_ending_with_letter.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to count the number of words in a sentence that end with the given letter. Answer with numbers and not words." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1645_medical_question_pair_dataset_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1645_medical_question_pair_dataset_text_classification.json new file mode 100644 index 000000000..a24bb9cf6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1645_medical_question_pair_dataset_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a medical question pair hand-generated. Your task is to classify a given post into two categories 1) 'Similar' if the given two questions have a same connotation 2) 'Dissimilar' if the given two questions have a different connotation or meaning." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task164_mcscript_question_answering_text.json b/src/unitxt/catalog/instructions/natural_instructions/train/task164_mcscript_question_answering_text.json new file mode 100644 index 000000000..a974374ed --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task164_mcscript_question_answering_text.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a paragraph (Passage), a question (Question) and two answer options (Option1 and Option2). Your task is to find the correct answer (and return the string of the correct option, not option1/2) for the given question from the given options and based on the given passage. Answer of the question can be found directly from the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1656_gooaq_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1656_gooaq_answer_generation.json new file mode 100644 index 000000000..8c162460e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1656_gooaq_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a question as input, give its short_answer as the output " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1657_gooaq_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1657_gooaq_question_generation.json new file mode 100644 index 000000000..0496db8dd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1657_gooaq_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an answer. Create a question for the answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task165_mcscript_question_answering_commonsense.json b/src/unitxt/catalog/instructions/natural_instructions/train/task165_mcscript_question_answering_commonsense.json new file mode 100644 index 000000000..5ff09c152 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task165_mcscript_question_answering_commonsense.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a paragraph (Passage), a question (Question) and two answer options (Option1 and Option2). Your task is to choose the correct answer to the question based on the passage. Answer of the question cannot be found directly from the passage, it is indirectly indicated in the passage. Do not answer with words other than the two options, and do not answer with option titles(e.g. \"option1\" or \"1\" are not acceptable answers.)" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1660_super_glue_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1660_super_glue_question_generation.json new file mode 100644 index 000000000..560ac1a8e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1660_super_glue_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given Wikipedia articles on a range of topics, we ask you to write a question based on the content of the articles that can be answered in a binary manner i.e. True or False." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1661_super_glue_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1661_super_glue_classification.json new file mode 100644 index 000000000..72c437e17 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1661_super_glue_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given Wikipedia articles on a range of topics as passages and a question from the passage. We ask you to answer the question by classifying the answer as 0 (False) or 1 (True)" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1665_trainglecopa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1665_trainglecopa_question_generation.json new file mode 100644 index 000000000..6907b8baa --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1665_trainglecopa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a short story or summary of a situation which is called a premise. Your task is to generate a question based on the given premise. The generated question (i) must be unambiguous, (ii) must be relevant to the premise, (iii) should require commonsense reasoning to get answered. You should not use any outside knowledge to generate the question." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1669_md_gender_bias_text_modification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1669_md_gender_bias_text_modification.json new file mode 100644 index 000000000..0ffd32aeb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1669_md_gender_bias_text_modification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task if the pronoun is female or gender-neutral you are to replace it with a male pronoun. If there are no pronouns add a male-gendered word to the sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task166_clariq_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task166_clariq_sentence_generation.json new file mode 100644 index 000000000..8ed17c93c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task166_clariq_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Sometimes users of dialogue systems ask vague questions/queries from the system. In this case, the system asks them a clarifying question to be able to answer it correctly. In this task, you are given a question/query in natural language and your task is to ask a good clarifying question to understand the given question/query more precisely." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1670_md_gender_bias_text_modification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1670_md_gender_bias_text_modification.json new file mode 100644 index 000000000..d97a29252 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1670_md_gender_bias_text_modification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task if the pronoun is male or gender-neutral you are to replace it with a female pronoun. If there are no pronouns add a female-gendered word to the sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1678_mathqa_answer_selection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1678_mathqa_answer_selection.json new file mode 100644 index 000000000..d441e9379 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1678_mathqa_answer_selection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a math problem with context and a question and 5 answer choices, the task is to provide the correct answer choice based on the problem. You must choose one of the given answer choices by letter: a, b, c, d, or e; anything else is invalid." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task167_strategyqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task167_strategyqa_question_generation.json new file mode 100644 index 000000000..2112e6814 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task167_strategyqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are presented with a term, a description of the term, and an expected answer ('yes' or 'no'). 
You should write a yes-no question about the given term such that the answer is the one provided to you (i.e., If the answer is \"No\", you should ask a question that its answer would be \"No\", and if the answer is \"Yes\", you should ask a question that its answer is \"Yes\". ). The question should have a definitive answer (as opposed to ambiguous or subjective questions, e.g., Is Batman a good movie?). Create a question such that its answer can not be found easily on a single web page (e.g., mentioned in a Wikipedia page). This can be accomplished if answering the question requires more than one fact (facts = statements that can be found on a Wikipedia page or Google). For example, answering the question 'did Aristotle use a laptop?', one needs the know about the invention of the laptop and the death of Aristotle. Avoid questions should not just compare the properties of objects (e.g., Is a door bigger than an elephant?) or those that refer to details in the given description." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task168_strategyqa_question_decomposition.json b/src/unitxt/catalog/instructions/natural_instructions/train/task168_strategyqa_question_decomposition.json new file mode 100644 index 000000000..b97a6c0b1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task168_strategyqa_question_decomposition.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In the following task, you are given a yes/no question, its answer, and additional information which includes a description of a key term in the question and several facts. Your task is to \"decompose the question\"i.e. write the steps required to construct the given answer where each step is a question that can be answered using Wikipedia articles. To decompose the question, think of a decomposition strategy you could apply to answer the question through a search against Wikipedia. 
The decomposition strategy might not be obvious for some questions. For this reason, you are provided with additional information. You are not required to write decompositions that exactly match the provided facts, they are only meant as guidance. If the facts are too noisy, think about how you would have used Wikipedia to answer this question to create the decomposition. \"not_definitive_answer\" is true if there is no clear answer i.e. the question is ambiguous or a subjective opinion.\"incorrect_answer\" is true if the answer to the question is not correct. If the answer is incorrect, write a decomposition that evaluates the correct answer. Each question should be easy to answer based on simple facts from Wikipedia pages, or a simple check using the answers to preceding questions. To ensure this, we also ask you to enter a potential Wikipedia article that would contain the answer to each question. If you can not think of a Wikipedia page that can answer your question, please think of a different strategy. You do not need to enter a Wikipedia page for steps that don't add new information and only contain simple checks. The answer to the final question is the same as the answer to the original question. Every question's answer has an impact on the final answer and there should be no redundant steps in the decomposition." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task169_strategyqa_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task169_strategyqa_sentence_generation.json new file mode 100644 index 000000000..b26d2c38c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task169_strategyqa_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are presented with a term, a question, and a yes/no answer. For context, the term is associated with a short description. 
Write the simple facts one needs to know in order to answer the given question. The facts should be easily found on the web (e.g. mentioned in a Wikipedia page)" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1703_ljspeech_textmodification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1703_ljspeech_textmodification.json new file mode 100644 index 000000000..c5099cfe4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1703_ljspeech_textmodification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is reading a paragraph containing numbers as digits. The digits can be used to represent Quantity, Dates and Time, Addresses or Positions. Convert the digits into their text equivalents. If a number has a prefix, postfix or punctuation preserve it in the text equivalent. 100000 is translated as hundred thousand, Roman numerals are also translated. If multiple numbers are present convert all instances." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1704_ljspeech_textmodification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1704_ljspeech_textmodification.json new file mode 100644 index 000000000..feb850d66 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1704_ljspeech_textmodification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is to read a passage and convert numbers in their text forms into digit forms. The text numbers can be used to represent Quantity, Dates and Time, Addresses or Positions." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1705_ljspeech_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1705_ljspeech_classification.json new file mode 100644 index 000000000..911b14e9c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1705_ljspeech_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task is reading a paragraph and determining if it has proper nouns in it or not. A proper noun is a noun that designates a particular being or thing, does not take a limiting modifier, and is usually capitalized in English. The answer is true if at least one proper noun is present in the sentence, false otherwise." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1706_ljspeech_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1706_ljspeech_classification.json new file mode 100644 index 000000000..a952768b0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1706_ljspeech_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is to identify if a given passage or sentence has proper punctuation. This includes proper capitalization and the use of punctuations such as commas, semi-colons and full-stops. The answer is True if all punctuation is properly applied, else the answer is False." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task170_hotpotqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task170_hotpotqa_answer_generation.json new file mode 100644 index 000000000..a0e68210b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task170_hotpotqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a set of context paragraph and some supporting facts to answer a question. Your task is to generate answer for given question based on set of context paragraphs and supporting facts." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1711_poki_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1711_poki_text_generation.json new file mode 100644 index 000000000..d6bf1bd7a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1711_poki_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a short text as a title. Your task is to generate a poem as output that is related to the given title and should feel like written by kids. The output should be a run-on sentence (two or more complete sentences connected without any punctuation). The poem should not be too long or too complex, because it should feel like it is written by younger person without high level of literature education." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1712_poki_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1712_poki_classification.json new file mode 100644 index 000000000..9f527bb1d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1712_poki_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a short poem which is written by a kid. Your task is to predict if the kid is in elementary school or high school. Anyone who is from grade 1st to 6th-grade will be considered as in elementary school, and 7th to 12th-grade kids will be considered as in high school. There are only two possible outputs, i.e., elementary and high. All inputs have at least one output and it cannot have both categories at a time." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1713_convai3_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1713_convai3_sentence_generation.json new file mode 100644 index 000000000..c0687bad0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1713_convai3_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a request sent by a user in a human and computer dialogue. Your task is to generate a prediction of what the requester is actually trying to do. The input is a sentence written by the human user, trying to achieve certain objective through this human computer interaction, and the output should be a sentence or two succinctly describing the human user's objective mentioned previously." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1714_convai3_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1714_convai3_sentence_generation.json new file mode 100644 index 000000000..947e5b704 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1714_convai3_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a concatenated string consisting of two parts that are separated by a newline character. The first part is the user's initial question during a human computer conversation, the second part is a clarifying question asked by the computer in response to the question asked by the user. You should read the input, then generate a valid prediction of the user's response to the computer's clarifying question. A valid prediction will clarify the user's correct intent in the initial question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1720_civil_comments_toxicity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1720_civil_comments_toxicity_classification.json new file mode 100644 index 000000000..a9be75a71 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1720_civil_comments_toxicity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Categorize the comment on the basis of toxicity. If the comment is toxic (harmful, malicious, derogatory, threat, insult, identity attck, etc.) output Yes, otherwise output No." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1721_civil_comments_obscenity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1721_civil_comments_obscenity_classification.json new file mode 100644 index 000000000..3576a403a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1721_civil_comments_obscenity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Categorize the comment on the basis of obscenity. If the comment is obscene output Yes, otherwise output No." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1722_civil_comments_threat_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1722_civil_comments_threat_classification.json new file mode 100644 index 000000000..6a78e7344 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1722_civil_comments_threat_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Categorize the comment on the basis of threat. If the comment is threatening output Yes, otherwise output No." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1723_civil_comments_sexuallyexplicit_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1723_civil_comments_sexuallyexplicit_classification.json new file mode 100644 index 000000000..740dddea8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1723_civil_comments_sexuallyexplicit_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Categorize the comment on the basis of sexual explicitness. If the comment is sexually explicit output Yes, otherwise output No." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1724_civil_comments_insult_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1724_civil_comments_insult_classification.json new file mode 100644 index 000000000..3eeac88a4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1724_civil_comments_insult_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Categorize the comment on the basis of insult. If the comment is insulting output Yes, otherwise output No." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1725_civil_comments_severtoxicity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1725_civil_comments_severtoxicity_classification.json new file mode 100644 index 000000000..005e76494 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1725_civil_comments_severtoxicity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Categorize the comment on the basis of severe toxicity. If the comment is severely toxic output Yes, otherwise output No." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1726_mathqa_correct_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1726_mathqa_correct_answer_generation.json new file mode 100644 index 000000000..e8e3c8dda --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1726_mathqa_correct_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is to generate the correct answer for a given math problem." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1727_wiqa_what_is_the_effect.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1727_wiqa_what_is_the_effect.json new file mode 100644 index 000000000..62a2443ac --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1727_wiqa_what_is_the_effect.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a process, and a question. The process contains a sequence of steps that happen in order. The question asks about the effect of a certain event on another event. If the first event has a positive effect on the second event, answer with \"for\", if it has a negative effect, answer with \"against\". If there's no causal relationship between the two, answer with \"none\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1729_personachat_generate_next.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1729_personachat_generate_next.json new file mode 100644 index 000000000..c6b640c9a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1729_personachat_generate_next.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Your task is to generate the next utterance in a given dialogue. You will be given a few sentences describing the personality of the person who is making the dialogue, and a history of the dialogue after that. Each line in the history is said by one of the two participants in the conversation." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1730_personachat_choose_next.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1730_personachat_choose_next.json new file mode 100644 index 000000000..72662db92 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1730_personachat_choose_next.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a person's personality, and a history of a conversation this person has had. You will be given four candidate sentences to complete the conversation, based on the context. Choose one and answer with the text." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task1731_quartz_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task1731_quartz_question_answering.json new file mode 100644 index 000000000..5dea78d54 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task1731_quartz_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a short paragraph, a question and two choices to answer from. Choose the correct answer based on the paragraph and write the answer(not the key)." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task176_break_decompose_questions.json b/src/unitxt/catalog/instructions/natural_instructions/train/task176_break_decompose_questions.json new file mode 100644 index 000000000..d64d52267 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task176_break_decompose_questions.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will break down a question into the basic steps required to answer it.\n A question decomposition is a numbered list of operations that must be performed to answer the original question. Imagine explaining your question to a friendly droid by listing each action it should take in order for the question to be answered. Each step in our decomposition should refer to either an entity (known or unknown), a propery of an entity or a query operation (count, group, union, etc.)\n Here are the list of step templates and their description:\n Select: A select step is used to return a set of objects. There are no references to previous steps in a select step. template: Return [attributes]\n Filter: A filter step is used to return results from a previous step to which a certain condition applies. template: Return [#step] [condition]\n Project: A project step should return certain attributes of the results of a previous step. template: Return [attributes] of [#step]\n Aggregate: An aggregate step returns an aggregator function applied on a step's result. template: Return the [aggregator] of [#step].\n Group: A group step is an aggregator applied on attributes. template: Return the [aggregator] of [#step] for each [attribute]\n Superlative: A superlative step is used to return the result with a highest/lowest attribute among other results. 
template: Return [#step1] [where] [#step2] [is] [highest / lowest]\n Comparative: A comparative step is used when we need to compare an attribute with a number to filter results. template: Return [#step1] [where] [#step2] [comparator] [number] \n Union: A union step is used to return results of two steps together. template: Return [#step1] [or / ,] [#step2]\n Intersection: An intersection step returns the result that two steps have in common. template: Return [attribute] of both [#step1] and [#step2]\n Discard: A discard step returns result of a step and excludes result of another step from it. template: Return [#step1] besides [#step2]\n Sort: A sort returns result of another step in a specific order. template: Return [#step1] [ordered / sorted by] [#step2]\n Is true: An is true step checks a condition on another result and returns a true or false. template: Return [is / if] [condition]\n Arithmetic: An arithmatic step operates an arithmatic operation on one or more steps. template: Return the [arithmetic op.] of [#step1] [and] [#step2]." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task177_para_nmt_paraphrasing.json b/src/unitxt/catalog/instructions/natural_instructions/train/task177_para_nmt_paraphrasing.json new file mode 100644 index 000000000..dd3964d86 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task177_para_nmt_paraphrasing.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This is a paraphrasing task. In this task, you're given a sentence and your task is to generate another sentence which express same meaning as the input using different words." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task178_quartz_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task178_quartz_question_answering.json new file mode 100644 index 000000000..7a2343226 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task178_quartz_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question or fill-in-the-blank question, two answer options (Option1 and Option2) and an Explanation. Your task is to find the correct answer (return the string of the correct option, not option1/2) for the given question from the given options and using explanation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task179_participant_extraction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task179_participant_extraction.json new file mode 100644 index 000000000..b4dbb31ee --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task179_participant_extraction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In medical studies, treatments are tested within a group of study participants. You will be given a sentence of a study report in which your task is to list the phrases that give information about the participants of the study. You should list the phrases in the same order that they appear in the text, separated by commas. If no information about the participants is mentioned, just output \"not found\". Relevant information about participants include: gender, medical conditions, location, number of people participating. Do not contain participant mentions without relevant information." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task180_intervention_extraction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task180_intervention_extraction.json new file mode 100644 index 000000000..dc7a96825 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task180_intervention_extraction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In medical studies, the efficacy of medical treatments (called interventions) is evaluated within a group of study participants. You will be given a sentence of a study report in which your task is to list the phrases that describe the intervention(s) of the study. You should list the phrase in the same order that they appear in the text, separated by commas. If no information about the interventions is mentioned, just answer with \"not found\". Interventions are: a specific drug, surgery, talking therapy, a lifestyle modification, control or placebo treatment. Do not include details, dosages, frequency and duration, intervention mentions that are not in an informative span of text." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task181_outcome_extraction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task181_outcome_extraction.json new file mode 100644 index 000000000..1489cd66d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task181_outcome_extraction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In medical studies, treatments are tested within a group of study participants. To determine if a new treatment works, various outcomes are measured in the people who take part in the study. You will be given a sentence of a study report in which your task is to list the phrases that give information about the outcomes of the study. 
You should list the phrases in the same order that they appear in the text, separated by commas. If no information about the outcome is mentioned, just answer with: \"not found\".\n Outcomes contain: outcomes measured in patients: like blood sugar,\n outcomes regarding the intervention: like effectiveness, costs\n the score on a medical test or questionnaire,\n positive or negative events in the patient groups: like quitting smoking, or adverse reactions.\n Do not mention numbers or results, interpretations of outcomes, outcome mentions without relevant information." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task182_duorc_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task182_duorc_question_generation.json new file mode 100644 index 000000000..cd571b6ac --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task182_duorc_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown an extract from a movie plot. You need to read the extract and create questions that can be answered from the extract. Once you create a question you also need to provide the correct answer for it. Write your answer like \"Question: your question, Answer: your answer\". The questions should be well-formed and grammatically correct. The questions should be completely answerable from the given passage and should not require any external knowledge. Subjective questions are not allowed. Short answers containing words that are present in the passage are preferred. Create questions that result in factoid answers. A simple rule of thumb to decide whether a question is a factoid or not is to see if two different people with average reading/comprehension skills would come up with the same answer after reading the passage." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task183_rhyme_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task183_rhyme_generation.json new file mode 100644 index 000000000..d1bf5145f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task183_rhyme_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given an input word generate a word that rhymes exactly with the input word. If not rhyme is found return \"No\"" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task184_break_generate_question.json b/src/unitxt/catalog/instructions/natural_instructions/train/task184_break_generate_question.json new file mode 100644 index 000000000..ec4fd1c15 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task184_break_generate_question.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a set of steps that are required to answer a specific question. Your job is to generate that question. Each given step refers to either an entity (known or unknown), a propery of an entity or a query operation (count, group, union, etc.) Knowing those operations and how they appear in the input may help you generate more accurate questions.\n Select: A select step is used to return a set of objects. There are no references to previous steps in a select step. template: Return [attributes]\n Filter: A filter step is used to return results from a previous step to which a certain condition applies. template: Return [#step] [condition]\n Project: A project step should return certain attributes of the results of a previous step. template: Return [attributes] of [#step]\n Aggregate: An aggregate step returns an aggregator function applied on a step's result. 
template: Return the [aggregator] of [#step].\n Group: A group step is an aggregator applied on attributes. template: Return the [aggregator] of [#step] for each [attribute]\n Superlative: A superlative step is used to return the result with a highest/lowest attribute among other results. template: Return [#step1] [where] [#step2] [is] [highest / lowest]\n Comparative: A comparative step is used when we need to compare an attribute with a number to filter results. template: Return [#step1] [where] [#step2] [comparator] [number] \n Union: A union step is used to return results of two steps together. template: Return [#step1] [or / ,] [#step2]\n Intersection: An intersection step returns the result that two steps have in common. template: Return [attribute] of both [#step1] and [#step2]\n Discard: A discard step returns result of a step and excludes result of another step from it. template: Return [#step1] besides [#step2]\n Sort: A sort returns result of another step in a specific order. template: Return [#step1] [ordered / sorted by] [#step2]\n Is true: An is true step checks a condition on another result and returns a true or false. template: Return [is / if] [condition]\n Arithmetic: An arithmetic step performs an arithmetic operation on one or more steps. template: Return the [arithmetic op.] of [#step1] [and] [#step2]." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task191_hotpotqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task191_hotpotqa_question_generation.json new file mode 100644 index 000000000..e0a24323f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task191_hotpotqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a set of context paragraphs, some supporting facts and an answer of a question.
Your task is to generate question for given answer based on set of context paragraphs, supporting facts and an answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task192_hotpotqa_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task192_hotpotqa_sentence_generation.json new file mode 100644 index 000000000..5d1beca42 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task192_hotpotqa_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a context paragraph, a question based on that and corresponding answer of a question. Your task is to generate supporting fact/knowledge from context paragraph which helps in answering a given question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task193_duorc_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task193_duorc_question_generation.json new file mode 100644 index 000000000..8bbc90db7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task193_duorc_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown an extract from a movie plot. You need to read the extract and create questions that can be answered from the extract. The questions should be well-formed and grammatically correct. The questions should be completely answerable from the given passage and should not require any external knowledge. Subjective questions are not allowed. Create questions that result in factoid answers. A simple rule of thumb to decide whether a question is factoid or not is to see if two different people with average reading/comprehension skills would come up with the same answer after reading the passage." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task194_duorc_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task194_duorc_answer_generation.json new file mode 100644 index 000000000..ef55082ee --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task194_duorc_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown an extract from a movie plot and a question. You need to provide the correct answer for it. Short answers containing words that are present in the passage are preferred." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task195_sentiment140_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task195_sentiment140_classification.json new file mode 100644 index 000000000..250be0ef2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task195_sentiment140_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text from tweets. Your task is to classify given tweet text into two categories: 1) positive, and 2) negative based on its content." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task196_sentiment140_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task196_sentiment140_answer_generation.json new file mode 100644 index 000000000..675161f22 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task196_sentiment140_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text from tweets and a boolean question whether this tweet has positive sentiment or negative sentiment. 
Your task is to generate answer \"yes\" when the tweet has that particular sentiment, otherwise generate answer \"no\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task205_remove_even_elements.json b/src/unitxt/catalog/instructions/natural_instructions/train/task205_remove_even_elements.json new file mode 100644 index 000000000..c63c10d65 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task205_remove_even_elements.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of numbers. A list is shown by two brackets and comma-separated numbers inside, like: [1,2,3]. You should remove all of the even numbers from the list. If every number in the input list is even an empty list should be returned. Zero should be counted as an even number." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task206_collatz_conjecture.json b/src/unitxt/catalog/instructions/natural_instructions/train/task206_collatz_conjecture.json new file mode 100644 index 000000000..0a84c4710 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task206_collatz_conjecture.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. For every element in the list, if the element is even you should divide by two, if the element is odd you should multiply by three then add one. The output should be a list of integers that is the result of applying that logic to the input list." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task207_max_element_lists.json b/src/unitxt/catalog/instructions/natural_instructions/train/task207_max_element_lists.json new file mode 100644 index 000000000..577c8452a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task207_max_element_lists.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a list. This list contains many lists of integers. The list is several items written within a []. Your task is to find the maximum number among the members of each inner list. The output should be a list comprised of the maximums with the same order as the internal lists." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task208_combinations_of_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task208_combinations_of_list.json new file mode 100644 index 000000000..05149850e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task208_combinations_of_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a list. The list is several integers and letters separated with a comma, written within a []. You can create new lists by dropping one of the items in the input list. Your task is to write a list containing all the possible lists you can make by dropping one item from the input list. For example, if the input list contains two items, you can drop one of the items each time. So the output should be a list comprising two inner lists that you have created by decreasing the items." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task209_stancedetection_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task209_stancedetection_classification.json new file mode 100644 index 000000000..e45177f52 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task209_stancedetection_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given the Target and Argument texts detect the stance that the argument has towards the topic. There are three types of stances \"in favor\", \"against\", and \"neutral\". " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task210_logic2text_structured_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task210_logic2text_structured_text_generation.json new file mode 100644 index 000000000..d5ccb7913 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task210_logic2text_structured_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a natural language interpretation of commands (consist of logical operations) to select relevant rows from the given table. Your job is to generate command (in terms of logical operations) from given natural language interpretation. Define body (contains a collection of statements that define what the this logical operator does) of each logical operator between '{}' parenthesis. Here are the definitions of logical operators that you can use while generating command: \n 1. count: returns the number of rows in the view. \n 2. only: returns whether there is exactly one row in the view. \n 3. hop: returns the value under the header column of the row. \n 4. and: returns the boolean operation result of two arguments. \n 5. 
max/min/avg/sum: returns the max/min/average/sum of the values under the header column. \n 6. nth_max/nth_min: returns the n-th max/n-th min of the values under the header column. \n 7. argmax/argmin: returns the row with the max/min value in header column. \n 8. nth_argmax/nth_argmin: returns the row with the n-th max/min value in header column. \n 9. eq/not_eq: returns if the two arguments are equal. \n 10. round_eq: returns if the two arguments are roughly equal under certain tolerance. \n 11. greater/less: returns if the first argument is greater/less than the second argument. \n 12. diff: returns the difference between two arguments. \n 13. filter_eq/ filter_not_eq: returns the subview whose values under the header column is equal/not equal to the third argument. \n 14. filter_greater/filter_less: returns the subview whose values under the header column is greater/less than the third argument. \n 15. filter_greater_eq /filter_less_eq: returns the subview whose values under the header column is greater/less or equal than the third argument. \n 16. filter_all: returns the view itself for the case of describing the whole table \n 17. all_eq/not_eq: returns whether all the values under the header column are equal/not equal to the third argument. \n 18. all_greater/less: returns whether all the values under the header column are greater/less than the third argument. \n 19. all_greater_eq/less_eq: returns whether all the values under the header column are greater/less or equal to the third argument. \n 20. most_eq/not_eq: returns whether most of the values under the header column are equal/not equal to the third argument. \n 21. most_greater/less: returns whether most of the values under the header column are greater/less than the third argument. \n 22. most_greater_eq/less_eq: returns whether most of the values under the header column are greater/less or equal to the third argument." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task211_logic2text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task211_logic2text_classification.json new file mode 100644 index 000000000..1b6e47808 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task211_logic2text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given commands (in terms of logical operations) and natural interpretation of the given command to select relevant rows from the given table. Your job is to generate a label \"yes\" if the interpretation is appropriate for the command, otherwise generate label \"no\". \n Here are the definitions of logical operators: \n 1. count: returns the number of rows in the view. \n 2. only: returns whether there is exactly one row in the view. \n 3. hop: returns the value under the header column of the row. \n 4. and: returns the boolean operation result of two arguments. \n 5. max/min/avg/sum: returns the max/min/average/sum of the values under the header column. \n 6. nth_max/nth_min: returns the n-th max/n-th min of the values under the header column. \n 7. argmax/argmin: returns the row with the max/min value in header column. \n 8. nth_argmax/nth_argmin: returns the row with the n-th max/min value in header column. \n 9. eq/not_eq: returns if the two arguments are equal. \n 10. round_eq: returns if the two arguments are roughly equal under certain tolerance. \n 11. greater/less: returns if the first argument is greater/less than the second argument. \n 12. diff: returns the difference between two arguments. \n 13. filter_eq/ filter_not_eq: returns the subview whose values under the header column is equal/not equal to the third argument. \n 14. filter_greater/filter_less: returns the subview whose values under the header column is greater/less than the third argument. \n 15. 
filter_greater_eq /filter_less_eq: returns the subview whose values under the header column is greater/less or equal than the third argument. \n 16. filter_all: returns the view itself for the case of describing the whole table \n 17. all_eq/not_eq: returns whether all the values under the header column are equal/not equal to the third argument. \n 18. all_greater/less: returns whether all the values under the header column are greater/less than the third argument. \n 19. all_greater_eq/less_eq: returns whether all the values under the header column are greater/less or equal to the third argument. \n 20. most_eq/not_eq: returns whether most of the values under the header column are equal/not equal to the third argument. \n 21. most_greater/less: returns whether most of the values under the header column are greater/less than the third argument. \n 22. most_greater_eq/less_eq: returns whether most of the values under the header column are greater/less or equal to the third argument." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task212_logic2text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task212_logic2text_classification.json new file mode 100644 index 000000000..3963fa2bd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task212_logic2text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given commands (in terms of logical operations) to select relevant rows from the given table. Your job is to classify the command into one of these seven categories: (1) majority, (2) unique, (3) superlative, (4) count, (5) comparative, (6) aggregation, and (7) ordinal. \n Here are the definitions of each category: \n 1. majority: Describing the majority values (most or all) over one column, with the scope of all table rows or a subset of rows \n 2.
unique: Describing one unique row, regarding one column, with the scope of all table rows or a subset of rows \n 3. Superlative: Describing the maximum or minimum value in a column, with the scope of all table rows or a subset of rows \n 4. Ordinal: Describing the n-th maximum or minimum value in a column, with the scope of all table rows or a subset of rows \n 5. Comparative: Comparing two rows in the table, regarding their values in one column \n 6. Count: counting some rows in the table based on the values in one column, with the scope of all table rows or a subset of rows \n 7. Aggregation: Describing the sum or average value over a column, with the scope of all table rows or a subset of rows. \n Here are the definitions of logical operators for understanding of command: \n 1. count: returns the number of rows in the view. \n 2. only: returns whether there is exactly one row in the view. \n 3. hop: returns the value under the header column of the row. \n 4. and: returns the boolean operation result of two arguments. \n 5. max/min/avg/sum: returns the max/min/average/sum of the values under the header column. \n 6. nth_max/nth_min: returns the n-th max/n-th min of the values under the header column. \n 7. argmax/argmin: returns the row with the max/min value in header column. \n 8. nth_argmax/nth_argmin: returns the row with the n-th max/min value in header column. \n 9. eq/not_eq: returns if the two arguments are equal. \n 10. round_eq: returns if the two arguments are roughly equal under certain tolerance. \n 11. greater/less: returns if the first argument is greater/less than the second argument. \n 12. diff: returns the difference between two arguments. \n 13. filter_eq/ filter_not_eq: returns the subview whose values under the header column is equal/not equal to the third argument. \n 14. filter_greater/filter_less: returns the subview whose values under the header column is greater/less than the third argument. \n 15. 
filter_greater_eq /filter_less_eq: returns the subview whose values under the header column is greater/less or equal than the third argument. \n 16. filter_all: returns the view itself for the case of describing the whole table \n 17. all_eq/not_eq: returns whether all the values under the header column are equal/not equal to the third argument. \n 18. all_greater/less: returns whether all the values under the header column are greater/less than the third argument. \n 19. all_greater_eq/less_eq: returns whether all the values under the header column are greater/less or equal to the third argument. \n 20. most_eq/not_eq: returns whether most of the values under the header column are equal/not equal to the third argument. \n 21. most_greater/less: returns whether most of the values under the header column are greater/less than the third argument. \n 22. most_greater_eq/less_eq: returns whether most of the values under the header column are greater/less or equal to the third argument." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task223_quartz_explanation_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task223_quartz_explanation_generation.json new file mode 100644 index 000000000..294d44174 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task223_quartz_explanation_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question and answer for that. The answer will fill in the blank or will complete the unfinished question. Your task is to provide an explanation based on the given question or fill-in-the-blank statement, and answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task227_clariq_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task227_clariq_classification.json new file mode 100644 index 000000000..01ae9acf4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task227_clariq_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an ambiguous question/query (which can be answered in more than one way) and a clarification statement to understand the query more precisely. Your task is to classify whether the given clarification accurately clarifies the given query or not, and based on that provide 'Yes' or 'No'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task228_arc_answer_generation_easy.json b/src/unitxt/catalog/instructions/natural_instructions/train/task228_arc_answer_generation_easy.json new file mode 100644 index 000000000..0b271fd9d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task228_arc_answer_generation_easy.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a science question (easy-level) and four answer options (associated with \"A\", \"B\", \"C\", \"D\"). Your task is to find the correct answer based on scientific facts, knowledge, and reasoning. Do not generate anything else apart from one of the following characters: 'A', 'B', 'C', 'D'. There is only one correct answer for each question."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task229_arc_answer_generation_hard.json b/src/unitxt/catalog/instructions/natural_instructions/train/task229_arc_answer_generation_hard.json new file mode 100644 index 000000000..bd2fa9dcb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task229_arc_answer_generation_hard.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a science question (hard-level) and four answer options (associated with \"A\", \"B\", \"C\", \"D\"). Your task is to find the correct answer based on scientific facts, knowledge, and reasoning. Do not generate anything else apart from one of the following characters: 'A', 'B', 'C', 'D'. There is only one correct answer for each question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task243_count_elements_in_set_intersection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task243_count_elements_in_set_intersection.json new file mode 100644 index 000000000..4fdda8c46 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task243_count_elements_in_set_intersection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two sets, and you need to count the number of elements at the intersection of two given sets. A Set is shown by two curly braces and comma-separated numbers inside, like {1, 2, 3}. The intersection of two given sets is the largest set which contains all the elements that are common to both sets. To find the intersection of two given sets, A and B is a set consisting of all the elements common to both A and B."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task244_count_elements_in_set_union.json b/src/unitxt/catalog/instructions/natural_instructions/train/task244_count_elements_in_set_union.json new file mode 100644 index 000000000..9f48dbcf5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task244_count_elements_in_set_union.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two sets, and you need to count the number of elements at the union of two given sets. A Set is shown by two curly braces and comma-separated numbers inside, like {1, 2, 3}. Union of two given sets is the smallest set which contains all the elements of both the sets. To find the union of two given sets, A and B is a set that consists of all the elements of A and all the elements of B such that no element is repeated." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task245_check_presence_in_set_intersection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task245_check_presence_in_set_intersection.json new file mode 100644 index 000000000..9e85701ee --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task245_check_presence_in_set_intersection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two sets, and a question. You need to find whether an element is at the intersection of two given sets. A Set is shown by two curly braces and comma-separated numbers inside, like {1, 2, 3}. The intersection of two given sets is the largest set which contains all the elements that are common to both sets. An element is at the intersection of two given sets, A and B, if common to both A and B. Classify your answers into 'Yes' or 'No'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task246_dream_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task246_dream_question_generation.json new file mode 100644 index 000000000..48744623d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task246_dream_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a conversation. You need to write a question with three choices for the conversation. Your question should be answerable based on the conversation and only have one correct answer. Note that you don't need to answer your question. \"W\" and \"M\" in the conversations stand for \"woman\" and \"man\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task247_dream_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task247_dream_answer_generation.json new file mode 100644 index 000000000..cc9374d0b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task247_dream_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a conversation and a question. You need to answer the question and choose the correct option based on the conversation. \"W\" and \"M\" in the conversations stand for \"woman\" and \"man\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task248_dream_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task248_dream_classification.json new file mode 100644 index 000000000..76eb4478f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task248_dream_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a conversation and a question. You should categorize the question into matching, summary, logic, arithmetic, and commonsense groups. Matching is a question entailed or paraphrased by exactly one sentence in a dialogue. The answer can be extracted from the same sentence. Questions that cannot be answered by the surface meaning of a single sentence belong to the reasoning category. We further define summary, logic, arithmetic, and commonsense subcategories. Answering summary questions requires the whole picture of dialogue, such as the topic of dialogue and the relation between speakers. We require logical reasoning to answer logical questions. In arithmetic questions, inferring the answer requires arithmetic knowledge. To answer commonsense questions, besides the textual information in the dialogue, we also require additional commonsense knowledge that cannot be obtained from the dialogue. Note that a question can be in more than one group. \"W\" and \"M\" in the conversations stand for \"woman\" and \"man\"."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task267_concatenate_and_reverse_all_elements_from_index_i_to_j.json b/src/unitxt/catalog/instructions/natural_instructions/train/task267_concatenate_and_reverse_all_elements_from_index_i_to_j.json new file mode 100644 index 000000000..cef9503e9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task267_concatenate_and_reverse_all_elements_from_index_i_to_j.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs 'i', 'j', and A, where 'i' and 'j' are integers and A is a list. A list is shown by two brackets and comma-separated numbers and characters inside, like ['1', '12', 'l']. You need to concatenate all elements of A from the ith element to the jth element, and then reverse the resulting string. 'i' and 'j' will be non-negative, and will always have a value less than the length of A. 'i' will always be less than 'j'. Perform the operations in order, i.e., do not reverse first and then concatenate." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task268_casehold_legal_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task268_casehold_legal_answer_generation.json new file mode 100644 index 000000000..f67cf6f4a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task268_casehold_legal_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a prompt from a judicial decision and multiple holding statements derived from citations following text in a legal decision. Holdings represent the governing legal rule when the law is applied to a particular set of facts. There are five answer choices for each citing text. The correct answer is the holding statement that corresponds to the citing text. 
The four incorrect answers are other holding statements. You should find the correct option. There is a token in the position of the citing text prompt where the holding statement was extracted." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task269_csrg_counterfactual_story_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task269_csrg_counterfactual_story_generation.json new file mode 100644 index 000000000..467396f3b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task269_csrg_counterfactual_story_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a premise, an initial context, an original ending, and a counterfactual context, the task is to generate a new story ending aligned with the counterfactual context and as close to the original ending as possible. Each instance consists of a five-sentence story. The premise is the first sentence of a story, and the second sentence, which is the initial context, provides more information about the story's context and the story's general plot. The original ending is the last three sentences of the story. Also, a counterfactual context is a slight modification to the initial context. You should write a new story ending that edits the original story ending as little as possible to regain coherence with the counterfactual context. To sum up, you should write the last three sentences of a story based on the premise(first sentence) and the counterfactual context(second sentence) of the story." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task270_csrg_counterfactual_context_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task270_csrg_counterfactual_context_generation.json new file mode 100644 index 000000000..6fd337900 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task270_csrg_counterfactual_context_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a premise, an initial context, an original ending, and a new ending, the task is to generate the counterfactual context that is aligned with the new ending. Each instance consists of a five-sentence story. The premise is the first sentence of a story, and the second sentence, which is the initial context, provides more information about the story's context. The original ending is the last three sentences of the story. Also, you are given a new ending that can provide the new story with the same premise. You should write a counterfactual context to explain the small differences between the original and new endings. More specifically, a story context contains the general plot of the story. And a counterfactual context is a slight modification to the initial context. To sum up, you should write the second sentence of a story based on the premise(first sentence) and the new ending(last three sentences) of the story." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task274_overruling_legal_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task274_overruling_legal_classification.json new file mode 100644 index 000000000..bb252591b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task274_overruling_legal_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a sentence, and you should determine whether it is overruling or non-overruling. In law, an overruling sentence is a statement that nullifies a previous case decision as a precedent by a constitutionally valid statute or a decision by the same or higher ranking court which establishes a different rule on the point of law involved. Classify your answers into overruling or non-overruling" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task275_enhanced_wsc_paraphrase_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task275_enhanced_wsc_paraphrase_generation.json new file mode 100644 index 000000000..87a7cc9fd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task275_enhanced_wsc_paraphrase_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a sentence or two along with a change aspect. You should change the given text in the given aspect. Aspects are explained below:\n Tense: Change the tense of the verbs in the text. If they're in past tense, change them to present, and if they're in present tense, change them to past tense.\nNumber: Change the number of the nouns in the given text. Make plurals into singles and single into plurals. 
Remember to change the corresponding pronouns accordingly.\nVoice: If the verbs are in active voice, change them to be passive, otherwise, change them to be in active voice.\nAdverb: add one or multiple adverbs to the text.\nGender: If the text contains female names and pronouns, substitute them with male names and pronouns. Do the same for sentences with male names and pronouns." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task276_enhanced_wsc_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task276_enhanced_wsc_classification.json new file mode 100644 index 000000000..17282e0cc --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task276_enhanced_wsc_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given two sentences. One of them is created by paraphrasing the original one, with changes on an aspect, or using synonyms. Your task is to decide what is the difference between two sentences. Types of change are explained below:\n Tense: The verbs in the sentence are changed in tense.\nNumber: Plural nouns, verbs and pronouns are changed into single ones or the other way around.\nVoice: If the verbs are in active voice, they're changed to passive or the other way around.\nAdverb: The paraphrase has one adverb or more than the original sentence.\nGender: The paraphrase differs from the original sentence in the gender of the names and pronouns.\nSynonym: Some words or phrases of the original sentence are replaced with synonym words or phrases. Changes in the names of people are also considered a synonym change. Classify your answers into Tense, Number, Voice, Adverb, Gender, and Synonym."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task277_stereoset_sentence_generation_stereotype.json b/src/unitxt/catalog/instructions/natural_instructions/train/task277_stereoset_sentence_generation_stereotype.json new file mode 100644 index 000000000..4f751af80 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task277_stereoset_sentence_generation_stereotype.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a context sentence containing a blank (_). You are expected to fill the blank with one word to make the sentence convey a cultural stereotype. A stereotype is an over-generalized belief about a particular group of people. Your answer must not contain more than one word." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task278_stereoset_sentence_generation_antistereotype.json b/src/unitxt/catalog/instructions/natural_instructions/train/task278_stereoset_sentence_generation_antistereotype.json new file mode 100644 index 000000000..acd8fe493 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task278_stereoset_sentence_generation_antistereotype.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a context sentence containing a blank (_). You are expected to fill the blank with one word to make the sentence convey a cultural anti-stereotype. Anti-stereotype is an idea that goes against a common belief about a particular group of people. Your answer must not contain more than one word." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task279_stereoset_classification_stereotype.json b/src/unitxt/catalog/instructions/natural_instructions/train/task279_stereoset_classification_stereotype.json new file mode 100644 index 000000000..6df67b03d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task279_stereoset_classification_stereotype.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a short passage that may convey stereotype, anti-stereotype, or is unrelated. A stereotype is an over-generalized belief about a particular group of people. An anti-stereotype is an idea that goes against a common stereotype. The passage is unrelated if it does not convey a stereotype or anti-stereotype. You are expected to classify the passage into three classes: stereotype, anti-stereotype, and unrelated." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task280_stereoset_classification_stereotype_type.json b/src/unitxt/catalog/instructions/natural_instructions/train/task280_stereoset_classification_stereotype_type.json new file mode 100644 index 000000000..7c7bfd50d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task280_stereoset_classification_stereotype_type.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a short passage that conveys stereotype or anti-stereotype about a specific target. A stereotype is an over-generalized belief about a particular group of people. An anti-stereotype is an idea that goes against a common stereotype. You are expected to classify the passage into four types of stereotype or anti-stereotype: gender, profession, race, and religion." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task283_dream_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task283_dream_incorrect_answer_generation.json new file mode 100644 index 000000000..28455a335 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task283_dream_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a conversation and a question. You need to write an implausible answer to the question. Even though there exist multiple wrong answers, we only need a single wrong answer. \"W\" and \"M\" in the conversations stand for \"woman\" and \"man\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task284_imdb_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task284_imdb_classification.json new file mode 100644 index 000000000..ba4a4b2e8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task284_imdb_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a review of a movie. Your task is to classify the given movie review into two categories: 1) positive, and 2) negative based on its content." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task285_imdb_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task285_imdb_answer_generation.json new file mode 100644 index 000000000..2772c71e5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task285_imdb_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a review of a movie and a boolean question whether this review has positive sentiment or negative sentiment.
Your task is to generate answer \"yes\" when the review has that particular sentiment, otherwise generate answer \"no\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task286_olid_offense_judgment.json b/src/unitxt/catalog/instructions/natural_instructions/train/task286_olid_offense_judgment.json new file mode 100644 index 000000000..04a7d4368 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task286_olid_offense_judgment.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a tweet and you must identify whether the tweet contains any offense or any form of (untargeted) profanity. Label the post as NOT if the post does not contain offense or profanity. Non-offensive posts do not include any form of offense or profanity. Label the post as OFFENSIVE if the post contains offensive language or a targeted (veiled or direct) offense. Twitter user mentions were substituted by @USER and URLs have been substituted by URL." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task287_casehold_legal_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task287_casehold_legal_incorrect_answer_generation.json new file mode 100644 index 000000000..f2b570562 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task287_casehold_legal_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a prompt from a judicial decision and multiple holding statements derived from citations following text in a legal decision. Holdings represent the governing legal rule when the law is applied to a particular set of facts. There are five answer choices for each citing text. The correct answer is the holding statement that corresponds to the citing text.
You should write an incorrect option. Even though there exist multiple wrong answers, we only need a single wrong answer. There is a token in the position of the citing text prompt where the holding statement was extracted." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task291_semeval_2020_task4_commonsense_validation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task291_semeval_2020_task4_commonsense_validation.json new file mode 100644 index 000000000..840fad727 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task291_semeval_2020_task4_commonsense_validation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two natural language statements with similar wording. You must choose the statement that makes less sense based on common sense knowledge. A '\n' separates the statements. Use \"first\" or \"second\" to indicate which sentence makes less sense." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task292_storycommonsense_character_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task292_storycommonsense_character_text_generation.json new file mode 100644 index 000000000..d69482a31 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task292_storycommonsense_character_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a story (which contains five sentences only). Your task is to find all the characters which are available in the given story." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task293_storycommonsense_emotion_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task293_storycommonsense_emotion_text_generation.json new file mode 100644 index 000000000..5cb94b1a5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task293_storycommonsense_emotion_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context, a sentence, and a character. The sentence describes an action or job of the given character. Also, the context provides more information about the sentence or the character. Your task is to return one of the emotions which are expressed by the Character in the given sentence. For that you can use the Context; however, Context is not provided in all the inputs. Also, in some inputs, there can be zero emotion; for that return 'None'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task294_storycommonsense_motiv_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task294_storycommonsense_motiv_text_generation.json new file mode 100644 index 000000000..2c47b7168 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task294_storycommonsense_motiv_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context, a sentence, and a character. The sentence describes an action or job of the given character. Also, the context provides more information about the sentence or the character. Your task is to write the character's motivation by doing a specific job, which is given in the sentence. You can use context to find the motivation; however, all the inputs do not provide context. Also, in some inputs, there can be zero motivation; output, 'None' in this case." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task295_semeval_2020_task4_commonsense_reasoning.json b/src/unitxt/catalog/instructions/natural_instructions/train/task295_semeval_2020_task4_commonsense_reasoning.json new file mode 100644 index 000000000..6ba58fbbe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task295_semeval_2020_task4_commonsense_reasoning.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an impractical statement. You are also given three reasons (associated with \"A\", \"B\", \"C\") explaining why this statement doesn't make sense. You must choose the most corresponding reason explaining why this statement doesn't make sense." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task296_storycloze_correct_end_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task296_storycloze_correct_end_classification.json new file mode 100644 index 000000000..dae799eb6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task296_storycloze_correct_end_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given four sentences of a story written in natural language. The given story is not complete and your job is to complete the story by selecting one of the sentence choices from (A) and (B), such that the story sounds fully coherent." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task297_storycloze_incorrect_end_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task297_storycloze_incorrect_end_classification.json new file mode 100644 index 000000000..ca303f19c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task297_storycloze_incorrect_end_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given four sentences of a story written in natural language. The given story is not complete and your job is to complete the story by selecting one of the end sentence choices from (A) and (B), such that the story does not sound complete and coherent, i.e., select an incorrect end sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task298_storycloze_correct_end_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task298_storycloze_correct_end_classification.json new file mode 100644 index 000000000..20865cf1f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task298_storycloze_correct_end_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given four sentences of a story written in natural language, and one last sentence (Sentence5). Your job is to classify whether the last sentence completes the rest of the story coherently or not by providing 'Yes' or 'No'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task299_storycloze_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task299_storycloze_sentence_generation.json new file mode 100644 index 000000000..5eef60104 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task299_storycloze_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given four sentences of a story written in natural language in which one part is missing. Your job is to predict the position and missing part of the story and return in the following format: position, missing part. The missing part is a sentence that completes the story, and the position is the number of the missing sentence in the new story." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task300_storycloze_order_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task300_storycloze_order_generation.json new file mode 100644 index 000000000..c39383eb8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task300_storycloze_order_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a short story of five sentences written in natural language. However, the order of the given story is not correct. Your job is to return the correct order for the given five sentences to create a coherent short story with the new order that has the correct flow. Generate your answer using the number of sentences in the correct order, such as '23415'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task301_record_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task301_record_question_generation.json new file mode 100644 index 000000000..0fdfe45fb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task301_record_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be shown a passage. You need to write a fill-in-the-gap question based on your understanding of the events that might be inferred from the passage. Your question should be answerable based on the passage and only have one correct answer. Show the gap in your question with a _ ." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task302_record_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task302_record_classification.json new file mode 100644 index 000000000..b1f74b690 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task302_record_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a passage and have to answer a question based on your understanding of the events inferred from the passage. Among the entities, try to find the best entity that is most likely to fill in \"_\" and classify the answers based on options." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task303_record_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task303_record_incorrect_answer_generation.json new file mode 100644 index 000000000..520b8274e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task303_record_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a passage, and you need to write an **implausible** answer to fill in the place of \"_\". Your answer should be incorrect, but should not be out of context. Try using words that are related to the context of the passage, but are not the correct answer. Even though there exist multiple wrong answers, we only need a single wrong answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task305_jeopardy_answer_generation_normal.json b/src/unitxt/catalog/instructions/natural_instructions/train/task305_jeopardy_answer_generation_normal.json new file mode 100644 index 000000000..b05368380 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task305_jeopardy_answer_generation_normal.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a trivia clue, and the category it belongs to. You should answer with the best answer that belongs in the category and is described by the clue. For consistency, answers should be in all lower cased letters."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task306_jeopardy_answer_generation_double.json b/src/unitxt/catalog/instructions/natural_instructions/train/task306_jeopardy_answer_generation_double.json new file mode 100644 index 000000000..4d07b8f2a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task306_jeopardy_answer_generation_double.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a trivia clue, and the category it belongs to. You should answer with the best answer that belongs in the category and is described by the clue. For simplicity, answers should be in all lower cased letters." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task307_jeopardy_answer_generation_final.json b/src/unitxt/catalog/instructions/natural_instructions/train/task307_jeopardy_answer_generation_final.json new file mode 100644 index 000000000..4d07b8f2a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task307_jeopardy_answer_generation_final.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a trivia clue, and the category it belongs to. You should answer with the best answer that belongs in the category and is described by the clue. For simplicity, answers should be in all lower cased letters." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task308_jeopardy_answer_generation_all.json b/src/unitxt/catalog/instructions/natural_instructions/train/task308_jeopardy_answer_generation_all.json new file mode 100644 index 000000000..4d07b8f2a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task308_jeopardy_answer_generation_all.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a trivia clue, and the category it belongs to. 
You should answer with the best answer that belongs in the category and is described by the clue. For simplicity, answers should be in all lower cased letters." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task309_race_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task309_race_answer_generation.json new file mode 100644 index 000000000..402cbf6d4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task309_race_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given an article, a question which often contains a blank and four options (associated with \"A\", \"B\", \"C\", \"D\"). Your task is to find the correct answer (from the given options) for the question from the given article and return one of the options from \"A\", \"B\", \"C\", and \"D\". Do not generate anything else apart from one of the following characters: \"A\", \"B\", \"C\", \"D\". There is only one correct answer for each question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task310_race_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task310_race_classification.json new file mode 100644 index 000000000..f450cc44d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task310_race_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given an article, a question which often contains a blank, four options (associated with \"A\", \"B\", \"C\", \"D\") and the answer to that question. Your task is to classify whether the given answer is correct or not by providing \"Yes\" or \"No\", based on the article." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task311_race_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task311_race_question_generation.json new file mode 100644 index 000000000..3612ff526 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task311_race_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given an article and an answer. Your task is to generate the question for the answer based on the given article." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task316_crows_pairs_classification_stereotype.json b/src/unitxt/catalog/instructions/natural_instructions/train/task316_crows_pairs_classification_stereotype.json new file mode 100644 index 000000000..128809e70 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task316_crows_pairs_classification_stereotype.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a short passage that conveys a stereotype or an anti-stereotype. A stereotype is an over-generalized belief about a particular group of people(based on race, ethnicity, gender, age, abilities, etc.). An anti-stereotype is an idea that goes against a common stereotype. You are expected to classify the passage into two classes: stereotype or anti-stereotype." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task317_crows_pairs_classification_stereotype_type.json b/src/unitxt/catalog/instructions/natural_instructions/train/task317_crows_pairs_classification_stereotype_type.json new file mode 100644 index 000000000..fdca04699 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task317_crows_pairs_classification_stereotype_type.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a short passage that conveys a stereotype. A stereotype is an over-generalized belief about a particular group of people. You are expected to classify the passage into nine types of stereotype: race-color, socioeconomic, gender, disability, nationality, sexual-orientation, physical-appearance, religion, and age." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task318_stereoset_classification_gender.json b/src/unitxt/catalog/instructions/natural_instructions/train/task318_stereoset_classification_gender.json new file mode 100644 index 000000000..85a040dc4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task318_stereoset_classification_gender.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a target person and two sentences. Your task is to determine whether the second sentence conveys either a stereotype, anti-stereotype, or is unrelated with respect to the first sentence and the target. A stereotype is a widely held but oversimplified notion of a group of people. An anti-stereotype is an idea that goes against the widely held but oversimplified notion of a group of people. Sentences and targets are unrelated if there is no relevance between them." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task319_stereoset_classification_profession.json b/src/unitxt/catalog/instructions/natural_instructions/train/task319_stereoset_classification_profession.json new file mode 100644 index 000000000..50a220725 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task319_stereoset_classification_profession.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a target profession, and two sentences. Your task is to determine whether the second sentence is either a stereotype, anti-stereotype, or is unrelated with respect to the first sentence and the target. A stereotype is a widely held but oversimplified notion of a group of people. An anti-stereotype is an idea that goes against the widely held but oversimplified notion of a group of people. Sentences and targets are unrelated if there is no relevance between them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task320_stereoset_classification_race.json b/src/unitxt/catalog/instructions/natural_instructions/train/task320_stereoset_classification_race.json new file mode 100644 index 000000000..ec70392e3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task320_stereoset_classification_race.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a target race, and two sentences. Your task is to determine whether the second sentence is either a stereotype, anti-stereotype, or is unrelated with respect to the first sentence and the target. A stereotype is a widely held but oversimplified notion of a group of people. An anti-stereotype is an idea that goes against the widely held but oversimplified notion of a group of people. Sentences and targets are unrelated if there is no relevance between them." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task321_stereoset_classification_religion.json b/src/unitxt/catalog/instructions/natural_instructions/train/task321_stereoset_classification_religion.json new file mode 100644 index 000000000..0d6065447 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task321_stereoset_classification_religion.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given two sentences regarding the stereotypes of religions, determine whether the second sentence is either a stereotype, anti-stereotype, or is unrelated with respect to the first sentence and the target. A stereotype is a widely held but oversimplified notion of a group of people. An anti-stereotype is an idea that goes against the widely held but oversimplified notion of a group of people. Sentences and targets are unrelated if there is no relevance between them." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task322_jigsaw_classification_threat.json b/src/unitxt/catalog/instructions/natural_instructions/train/task322_jigsaw_classification_threat.json new file mode 100644 index 000000000..36dab7bca --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task322_jigsaw_classification_threat.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a public comment from online platforms. You are expected to classify the comment into two classes: threat and non-threat. Threat is a statement that someone will be hurt or harmed, especially if the person does not do something in particular." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task323_jigsaw_classification_sexually_explicit.json b/src/unitxt/catalog/instructions/natural_instructions/train/task323_jigsaw_classification_sexually_explicit.json new file mode 100644 index 000000000..48959dad4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task323_jigsaw_classification_sexually_explicit.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a public comment from online platforms. You are expected to classify the comment into two classes: sexual-explicit and non-sexual-explicit. A comment is considered sexual-explicit if it explicitly portrays sexual matters." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task324_jigsaw_classification_disagree.json b/src/unitxt/catalog/instructions/natural_instructions/train/task324_jigsaw_classification_disagree.json new file mode 100644 index 000000000..5128d9aab --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task324_jigsaw_classification_disagree.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a public comment from online platforms. You are expected to classify the comment into two classes: disagree or agree. Classify the comment as disagree if it is likely to raise a certain level of public disagreement, whether healthy or unhealthy. The disagreement can be due to toxic content (for example, disrespect, identity attack, insult, and threat), controversial content, misunderstandings, or conflicting opinions. Classify the comment as agree otherwise." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task325_jigsaw_classification_identity_attack.json b/src/unitxt/catalog/instructions/natural_instructions/train/task325_jigsaw_classification_identity_attack.json new file mode 100644 index 000000000..0f03c1afe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task325_jigsaw_classification_identity_attack.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a public comment from online platforms. You are expected to classify the comment into two classes: identity-attack and non-identity-attack. Identity attack refers to anything rude or disrespectful about someone's identity, including appearance, race, gender, and sexual orientation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task326_jigsaw_classification_obscene.json b/src/unitxt/catalog/instructions/natural_instructions/train/task326_jigsaw_classification_obscene.json new file mode 100644 index 000000000..a49d9bbdf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task326_jigsaw_classification_obscene.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a public comment from online platforms. You are expected to classify the comment into two classes: obscene and non-obscene. A comment is obscene if it is considered offensive to the public sense of decency, for example because it too obviously relates to sex or contains language regarded as taboo in polite usage." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task327_jigsaw_classification_toxic.json b/src/unitxt/catalog/instructions/natural_instructions/train/task327_jigsaw_classification_toxic.json new file mode 100644 index 000000000..940697d6c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task327_jigsaw_classification_toxic.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a public comment from online platforms. You are expected to classify the comment into two classes: toxic and non-toxic. Toxicity is defined as anything that is rude, disrespectful, or unreasonable that would make someone want to leave a conversation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task328_jigsaw_classification_insult.json b/src/unitxt/catalog/instructions/natural_instructions/train/task328_jigsaw_classification_insult.json new file mode 100644 index 000000000..09996b0f3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task328_jigsaw_classification_insult.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a public comment from online platforms. You are expected to classify the comment into two classes: insult and non-insult. Insult is any language or act that is disrespectful or scornfully abusive." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task333_hateeval_classification_hate_en.json b/src/unitxt/catalog/instructions/natural_instructions/train/task333_hateeval_classification_hate_en.json new file mode 100644 index 000000000..053e107af --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task333_hateeval_classification_hate_en.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a post in English from online platforms. You are expected to identify whether the post is hateful against immigrants and women. A hateful post expresses hate or encourages violence towards a person or a group. If a post is hateful but not towards immigrants and women, it should be labeled as non-hateful. Answer \"hateful\" or \"Non-hateful\". Note that the URLs in the text have been replaced with [Link]." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task335_hateeval_classification_aggresive_en.json b/src/unitxt/catalog/instructions/natural_instructions/train/task335_hateeval_classification_aggresive_en.json new file mode 100644 index 000000000..7893b6de7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task335_hateeval_classification_aggresive_en.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a hateful post in English from online platforms. You are expected to classify the post into two classes: aggresive or non-aggresive. An aggresive post is one that expresses feelings and opinions in an abusive way and tries to dominate others. Note that the URLs in the text have been replaced with [Link]." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task337_hateeval_classification_individual_en.json b/src/unitxt/catalog/instructions/natural_instructions/train/task337_hateeval_classification_individual_en.json new file mode 100644 index 000000000..15b46251e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task337_hateeval_classification_individual_en.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a hateful post in English from online platforms. You are expected to classify the target being harassed in the post as individual or generic, i.e., single person or a group of people. Note that the URLs in the text have been replaced with [Link]." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task339_record_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task339_record_answer_generation.json new file mode 100644 index 000000000..33bcef9ef --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task339_record_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a passage and have to answer a question based on your understanding of the events inferred from the passage. Try to find the best answer that is most likely to fill in \"_\". Note that the URLs in the text have been replaced with [Link]." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task340_winomt_classification_gender_pro.json b/src/unitxt/catalog/instructions/natural_instructions/train/task340_winomt_classification_gender_pro.json new file mode 100644 index 000000000..757d05973 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task340_winomt_classification_gender_pro.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and a profession that is mentioned in the sentence. The gender of the person with the given profession can be identified using the gendered pronouns that refer to them in the text. You are expected to identify the gender. Select from female and male." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task341_winomt_classification_gender_anti.json b/src/unitxt/catalog/instructions/natural_instructions/train/task341_winomt_classification_gender_anti.json new file mode 100644 index 000000000..8cf832e11 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task341_winomt_classification_gender_anti.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and a profession that is mentioned in the sentence. The gender of the person with the given profession can be identified using the gendered pronouns that refer to them in the text. You are expected to identify the gender. Select from female and male." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task342_winomt_classification_profession_pro.json b/src/unitxt/catalog/instructions/natural_instructions/train/task342_winomt_classification_profession_pro.json new file mode 100644 index 000000000..7ea7249ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task342_winomt_classification_profession_pro.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and a gender. The sentence mentions two professions: one's gender is unknown and the other's gender can be identified using the gendered pronouns that refer to them in the text. You are expected to return the profession with the given gender." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task343_winomt_classification_profession_anti.json b/src/unitxt/catalog/instructions/natural_instructions/train/task343_winomt_classification_profession_anti.json new file mode 100644 index 000000000..7ea7249ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task343_winomt_classification_profession_anti.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and a gender. The sentence mentions two professions: one's gender is unknown and the other's gender can be identified using the gendered pronouns that refer to them in the text. You are expected to return the profession with the given gender." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task344_hybridqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task344_hybridqa_answer_generation.json new file mode 100644 index 000000000..042870ef3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task344_hybridqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a question and you have to answer the question based on your knowledge. Your answers should be as short as possible." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task345_hybridqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task345_hybridqa_answer_generation.json new file mode 100644 index 000000000..72894155f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task345_hybridqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a question, and you have to write the part-of-speech tag for each word in the question. 
Here is the Alphabetical list of part-of-speech tags used in this task: CC: Coordinating conjunction, CD: Cardinal number, DT: Determiner, EX: Existential there, FW: Foreign word, IN: Preposition or subordinating conjunction, JJ: Adjective, JJR: Adjective, comparative, JJS: Adjective, superlative, LS: List item marker, MD: Modal, NN: Noun, singular or mass, NNS: Noun, plural, NNP: Proper noun, singular, NNPS: Proper noun, plural, PDT: Predeterminer, POS: Possessive ending, PRP: Personal pronoun, PRP$: Possessive pronoun, RB: Adverb, RBR: Adverb, comparative, RBS: Adverb, superlative, RP: Particle, SYM: Symbol, TO: to, UH: Interjection, VB: Verb, base form, VBD: Verb, past tense, VBG: Verb, gerund or present participle, VBN: Verb, past participle, VBP: Verb, non-3rd person singular present, VBZ: Verb, 3rd person singular present, WDT: Wh-determiner, WP: Wh-pronoun, WP$: Possessive wh-pronoun, WRB: Wh-adverb" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task346_hybridqa_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task346_hybridqa_classification.json new file mode 100644 index 000000000..253bf60b6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task346_hybridqa_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a question, a word, and a POS tag. You have to determine whether the part-of-speech tag of the given word in the question is equal to the given POS tag or not. Give your answer with True or False. 
Here is the Alphabetical list of part-of-speech tags used in this task: CC: Coordinating conjunction, CD: Cardinal number, DT: Determiner, EX: Existential there, FW: Foreign word, IN: Preposition or subordinating conjunction, JJ: Adjective, JJR: Adjective, comparative, JJS: Adjective, superlative, LS: List item marker, MD: Modal, NN: Noun, singular or mass, NNS: Noun, plural, NNP: Proper noun, singular, NNPS: Proper noun, plural, PDT: Predeterminer, POS: Possessive ending, PRP: Personal pronoun, PRP$: Possessive pronoun, RB: Adverb, RBR: Adverb, comparative, RBS: Adverb, superlative, RP: Particle, SYM: Symbol, TO: to, UH: Interjection, VB: Verb, base form, VBD: Verb, past tense, VBG: Verb, gerund or present participle, VBN: Verb, past participle, VBP: Verb, non-3rd person singular present, VBZ: Verb, 3rd person singular present, WDT: Wh-determiner, WP: Wh-pronoun, WP$: Possessive wh-pronoun, WRB: Wh-adverb" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task347_hybridqa_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task347_hybridqa_incorrect_answer_generation.json new file mode 100644 index 000000000..b83e25d15 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task347_hybridqa_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a question about part-of-speech tag of a word in the question. You should write an implausible POS tag to the question. Even though there exist multiple wrong answers, we only need a single wrong answer. 
Here is the Alphabetical list of part-of-speech tags used in this task: CC: Coordinating conjunction, CD: Cardinal number, DT: Determiner, EX: Existential there, FW: Foreign word, IN: Preposition or subordinating conjunction, JJ: Adjective, JJR: Adjective, comparative, JJS: Adjective, superlative, LS: List item marker, MD: Modal, NN: Noun, singular or mass, NNS: Noun, plural, NNP: Proper noun, singular, NNPS: Proper noun, plural, PDT: Predeterminer, POS: Possessive ending, PRP: Personal pronoun, PRP$: Possessive pronoun, RB: Adverb, RBR: Adverb, comparative, RBS: Adverb, superlative, RP: Particle, SYM: Symbol, TO: to, UH: Interjection, VB: Verb, base form, VBD: Verb, past tense, VBG: Verb, gerund or present participle, VBN: Verb, past participle, VBP: Verb, non-3rd person singular present, VBZ: Verb, 3rd person singular present, WDT: Wh-determiner, WP: Wh-pronoun, WP$: Possessive wh-pronoun, WRB: Wh-adverb" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task350_winomt_classification_gender_identifiability_pro.json b/src/unitxt/catalog/instructions/natural_instructions/train/task350_winomt_classification_gender_identifiability_pro.json new file mode 100644 index 000000000..9669cf234 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task350_winomt_classification_gender_identifiability_pro.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and a profession. The sentence mentions two professions: one's gender is identifiable using the coreference link with gendered pronouns and the other's gender is unidentifiable. You are expected to return whether the given profession's gender is identifiable or unidentifiable." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task351_winomt_classification_gender_identifiability_anti.json b/src/unitxt/catalog/instructions/natural_instructions/train/task351_winomt_classification_gender_identifiability_anti.json new file mode 100644 index 000000000..61dd4e62e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task351_winomt_classification_gender_identifiability_anti.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence and a profession. The sentence mentions two professions: one's gender is identifiable using the gendered pronouns in the text and the other's gender is unidentifiable. You are expected to return whether the given profession's gender is identifiable or unidentifiable." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task353_casino_classification_negotiation_elicit_pref.json b/src/unitxt/catalog/instructions/natural_instructions/train/task353_casino_classification_negotiation_elicit_pref.json new file mode 100644 index 000000000..c7a192c77 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task353_casino_classification_negotiation_elicit_pref.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is taken from a negotiation between two participants who take the role of campsite neighbors and negotiate for Food, Water, and Firewood packages, based on their individual preferences and requirements. Given an utterance and recent dialogue context containing past 3 utterances (wherever available), output Yes if the utterance contains the elicit-pref strategy, otherwise output No. elicit-pref is a cooperative negotiation strategy. It is used to discover the preference order of the opponent in the negotiation." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task354_casino_classification_negotiation_no_need.json b/src/unitxt/catalog/instructions/natural_instructions/train/task354_casino_classification_negotiation_no_need.json new file mode 100644 index 000000000..842c13ce5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task354_casino_classification_negotiation_no_need.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is taken from a negotiation between two participants who take the role of campsite neighbors and negotiate for Food, Water, and Firewood packages, based on their individual preferences and requirements. Given an utterance and recent dialogue context containing past 3 utterances (wherever available), output Yes if the utterance contains the no-need strategy, otherwise output No. no-need is a cooperative negotiation strategy. It is used when a participant points out that they do not need an item based on personal context such as suggesting that they have ample water to spare. no-need can directly benefit the opponent since it implies that the item is up for grabs." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task355_casino_classification_negotiation_other_need.json b/src/unitxt/catalog/instructions/natural_instructions/train/task355_casino_classification_negotiation_other_need.json new file mode 100644 index 000000000..cc73c30c4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task355_casino_classification_negotiation_other_need.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is taken from a negotiation between two participants who take the role of campsite neighbors and negotiate for Food, Water, and Firewood packages, based on their individual preferences and requirements. 
Given an utterance and recent dialogue context containing past 3 utterances (wherever available), output Yes if the utterance contains the other-need strategy, otherwise output No. other-need is a selfish negotiation strategy. It is used when the participants discuss a need for someone else rather than themselves. For instance, describing the need for firewood to keep the kids warm." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task356_casino_classification_negotiation_self_need.json b/src/unitxt/catalog/instructions/natural_instructions/train/task356_casino_classification_negotiation_self_need.json new file mode 100644 index 000000000..9354fdc9a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task356_casino_classification_negotiation_self_need.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is taken from a negotiation between two participants who take the role of campsite neighbors and negotiate for Food, Water, and Firewood packages, based on their individual preferences and requirements. Given an utterance and recent dialogue context containing past 3 utterances (wherever available), output Yes if the utterance contains the self-need strategy, otherwise output No. self-need is a selfish negotiation strategy. It is used to create a personal need for an item in the negotiation, such as by pointing out that the participant sweats a lot to show preference towards water packages." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task357_casino_classification_negotiation_small_talk.json b/src/unitxt/catalog/instructions/natural_instructions/train/task357_casino_classification_negotiation_small_talk.json new file mode 100644 index 000000000..208156600 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task357_casino_classification_negotiation_small_talk.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is taken from a negotiation between two participants who take the role of campsite neighbors and negotiate for Food, Water, and Firewood packages, based on their individual preferences and requirements. Given an utterance and recent dialogue context containing past 3 utterances (wherever available), output Yes if the utterance contains the small-talk strategy, otherwise output No. small-talk is a cooperative negotiation strategy. It is used for discussing topics apart from the negotiation, in an attempt to build a rapport with the opponent. For example, discussing how the opponent is doing during the pandemic or sharing excitement for the camping trip." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task358_casino_classification_negotiation_uv_part.json b/src/unitxt/catalog/instructions/natural_instructions/train/task358_casino_classification_negotiation_uv_part.json new file mode 100644 index 000000000..0b92203e1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task358_casino_classification_negotiation_uv_part.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is taken from a negotiation between two participants who take the role of campsite neighbors and negotiate for Food, Water, and Firewood packages, based on their individual preferences and requirements. 
Given an utterance and recent dialogue context containing past 3 utterances (wherever available), output Yes if the utterance contains the uv-part strategy, otherwise output No. uv-part is a selfish negotiation strategy. It is used to undermine the requirements of the opponent. For instance, suggesting that the opponent would not need more firewood since they already have the basic supplies or a suggestion that there might be a store near the campsite where the opponent can get the supplies instead." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task359_casino_classification_negotiation_vouch_fair.json b/src/unitxt/catalog/instructions/natural_instructions/train/task359_casino_classification_negotiation_vouch_fair.json new file mode 100644 index 000000000..598e92755 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task359_casino_classification_negotiation_vouch_fair.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The input is taken from a negotiation between two participants who take the role of campsite neighbors and negotiate for Food, Water, and Firewood packages, based on their individual preferences and requirements. Given an utterance and recent dialogue context containing past 3 utterances (wherever available), output Yes if the utterance contains the vouch-fair strategy, otherwise output No. vouch-fair is a selfish negotiation strategy. It is used to call out fairness for personal benefit, either when acknowledging a fair deal or when the opponent offers a deal that benefits them. This can be through an explicit call out or can be implied." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task363_sst2_polarity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task363_sst2_polarity_classification.json new file mode 100644 index 000000000..fafe6bd3b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task363_sst2_polarity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given sentences from movie reviews. The task is to classify a sentence as \"POS\" if the sentiment of the sentence is positive or as \"NEG\" if the sentiment of the sentence is negative" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task364_regard_social_impact_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task364_regard_social_impact_classification.json new file mode 100644 index 000000000..f5df5314b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task364_regard_social_impact_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a sentence about a person. You should determine how the sentence affects how the person is perceived by most people in society. Your choices are: \nPositive: The social perception of [PERSON] in the sentence is considered predominantly positive.\nNegative: The social perception of [PERSON] in the sentence is considered predominantly negative.\nNo impact: There is no clear impact of social perception of [PERSON] associated with the sentence." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task365_synthetic_remove_vowels.json b/src/unitxt/catalog/instructions/natural_instructions/train/task365_synthetic_remove_vowels.json new file mode 100644 index 000000000..91f762459 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task365_synthetic_remove_vowels.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a string of characters. You should remove all vowels from the given string. Vowels are: i,e,a,u,o. The character 'y' or 'Y' does not count as a vowel." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task366_synthetic_return_primes.json b/src/unitxt/catalog/instructions/natural_instructions/train/task366_synthetic_return_primes.json new file mode 100644 index 000000000..7a5a05104 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task366_synthetic_return_primes.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. You should remove any integer that is not prime. A prime integer is an integer that is only divisible by '1' and itself. The output should be the list of prime numbers in the input list. If there are no primes in the input list an empty list (\"[]\") should be returned." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task367_synthetic_remove_floats.json b/src/unitxt/catalog/instructions/natural_instructions/train/task367_synthetic_remove_floats.json new file mode 100644 index 000000000..759e01be5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task367_synthetic_remove_floats.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of numbers. 
You should remove any number that is not an integer (whole number). If every number is not a whole number then an empty list (\"[]\") should be returned. Otherwise, answer with the list of whole numbers separated by comma inside brackets." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task368_synthetic_even_or_odd_calculation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task368_synthetic_even_or_odd_calculation.json new file mode 100644 index 000000000..8742fd75c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task368_synthetic_even_or_odd_calculation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. For every element in the list, if the element is even you should divide by 4, if the element is odd you should multiply by 4 then add 2. The output should be a list of numbers that is the result of applying that logic to the input list. You should not round any decimals in the output. Zero should be counted as an even integer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task369_synthetic_remove_odds.json b/src/unitxt/catalog/instructions/natural_instructions/train/task369_synthetic_remove_odds.json new file mode 100644 index 000000000..8edf535f7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task369_synthetic_remove_odds.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a list of integers. You should remove all of the odd integers from the list (consider 0 an even number). If every integer in the input list is odd then an empty list (\"[]\") should be returned. Otherwise, answer with the list of even numbers separated by comma inside brackets." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task370_synthetic_remove_divisible_by_3.json b/src/unitxt/catalog/instructions/natural_instructions/train/task370_synthetic_remove_divisible_by_3.json new file mode 100644 index 000000000..fe12fab23 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task370_synthetic_remove_divisible_by_3.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. You should remove all of the integers that are divisible by 3 from the list. If every integer in the input list is divisible by 3 then an empty list should be returned. Zero is divisible by 3." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task371_synthetic_product_of_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task371_synthetic_product_of_list.json new file mode 100644 index 000000000..71c01bf13 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task371_synthetic_product_of_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of lists, of numbers. For every inner list, you should multiply every number in that list and put the results in your answer. The output should be a list of numbers with the same length as the number of the lists in the input list." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task372_synthetic_palindrome_numbers.json b/src/unitxt/catalog/instructions/natural_instructions/train/task372_synthetic_palindrome_numbers.json new file mode 100644 index 000000000..728130ef5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task372_synthetic_palindrome_numbers.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. You should only return an integer if the first digit is the same as the last digit in the number. If an integer has a single digit, then it should be returned. If there are no integers that start and end with the same digit then an empty list (\"[]\") should be returned." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task373_synthetic_round_tens_place.json b/src/unitxt/catalog/instructions/natural_instructions/train/task373_synthetic_round_tens_place.json new file mode 100644 index 000000000..3d16e426d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task373_synthetic_round_tens_place.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. You should round each integer to the nearest tens place. That means you should round the number to the nearest multiple of 10." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task374_synthetic_pos_or_neg_calculation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task374_synthetic_pos_or_neg_calculation.json new file mode 100644 index 000000000..a22aa13b5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task374_synthetic_pos_or_neg_calculation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list of integers. 
For every element in the list, if the element is positive you should multiply it by 2. If the element is negative you should multiply it by -3. The output should be a list of integers that is the result of applying that logic to the input list.\n Note: A list is presented with comma separated numbers inside two brackets." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task375_classify_type_of_sentence_in_debate.json b/src/unitxt/catalog/instructions/natural_instructions/train/task375_classify_type_of_sentence_in_debate.json new file mode 100644 index 000000000..576b9643f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task375_classify_type_of_sentence_in_debate.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a debate topic, along with a sentence from the debate. You should classify the given sentence and choose the type of that sentence. Possible types are explained below.\nPolicy: This refers to a sentence proposing a specific course of action to be taken. It typically contains modal verbs like \"should\" and \"ought to\". It cannot be directly proved with objective evidence, and a proper type of support is a logical reason from which the proposition can be inferred.\nValue: This refers to a sentence containing value judgments without making specific claims about what should be done (If so, then it is a Policy sentence.). Because of the subjectivity of value judgments, it cannot be proved directly with objective evidence.\nFact: This refers to an objective proposition expressing or dealing with facts or conditions as perceived without distortion by personal feelings, prejudices, or interpretations. 
A Fact sentence has a truth value that can be verified with objective evidence that may be available at the time the claim is made; predictions about future are considered unverifiable.\nTestimony: This refers to an objective sentence about the author's personal state or experience. Evidence for Testimony is not publicly available in most cases." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task376_reverse_order_of_words.json b/src/unitxt/catalog/instructions/natural_instructions/train/task376_reverse_order_of_words.json new file mode 100644 index 000000000..07441e83d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task376_reverse_order_of_words.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to reverse the order of words in the given sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task377_remove_words_of_given_length.json b/src/unitxt/catalog/instructions/natural_instructions/train/task377_remove_words_of_given_length.json new file mode 100644 index 000000000..db9698197 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task377_remove_words_of_given_length.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to remove all words of a given length in the sentence. The number of letters in a word determine its length, for example, the length of the word \"apple\" is 5." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task378_reverse_words_of_given_length.json b/src/unitxt/catalog/instructions/natural_instructions/train/task378_reverse_words_of_given_length.json new file mode 100644 index 000000000..66874c7bf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task378_reverse_words_of_given_length.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to reverse all words of a given length in the sentence. The number of letters in a word determine its length. For example, the length of the word \"apple\" is 5." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task379_agnews_topic_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task379_agnews_topic_classification.json new file mode 100644 index 000000000..fba75f6e4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task379_agnews_topic_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a news article. Your task is to classify the article to one out of the four topics 'World', 'Sports', 'Business', 'Sci/Tech' if the article's main topic is relevant to the world, sports, business, and science/technology, correspondingly. If you are not sure about the topic, choose the closest option. Note that URLs in the text have been replaced with [Link]." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task380_boolq_yes_no_question.json b/src/unitxt/catalog/instructions/natural_instructions/train/task380_boolq_yes_no_question.json new file mode 100644 index 000000000..9e155edda --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task380_boolq_yes_no_question.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a passage and a yes/no question based on the passage. You should answer the question using the information from the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task381_boolq_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task381_boolq_question_generation.json new file mode 100644 index 000000000..ff31dbab8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task381_boolq_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a passage, and your task is to generate a Yes/No question that is answerable based on the given passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task382_hybridqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task382_hybridqa_answer_generation.json new file mode 100644 index 000000000..d5bcd38d6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task382_hybridqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a question about part-of-speech tag of a word in the question. You should write the required POS tag answering the question. 
Here is the Alphabetical list of part-of-speech tags used in this task: CC: Coordinating conjunction, CD: Cardinal number, DT: Determiner, EX: Existential there, FW: Foreign word, IN: Preposition or subordinating conjunction, JJ: Adjective, JJR: Adjective, comparative, JJS: Adjective, superlative, LS: List item marker, MD: Modal, NN: Noun, singular or mass, NNS: Noun, plural, NNP: Proper noun, singular, NNPS: Proper noun, plural, PDT: Predeterminer, POS: Possessive ending, PRP: Personal pronoun, PRP$: Possessive pronoun, RB: Adverb, RBR: Adverb, comparative, RBS: Adverb, superlative, RP: Particle, SYM: Symbol, TO: to, UH: Interjection, VB: Verb, base form, VBD: Verb, past tense, VBG: Verb, gerund or present participle, VBN: Verb, past participle, VBP: Verb, non-3rd person singular present, VBZ: Verb, 3rd person singular present, WDT: Wh-determiner, WP: Wh-pronoun, WP$: Possessive wh-pronoun, WRB: Wh-adverb" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task383_matres_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task383_matres_classification.json new file mode 100644 index 000000000..799b0c877 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task383_matres_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a context and a verb separated with a newline character, and you have to answer if the given verb can be anchored in time or not. We say a verb can be anchored in the real timeline if and only if a verb happened in the past, is happening now, or is guaranteed to happen in the future. The output should be \"Yes\" if the verb can be anchored in time and \"No\" otherwise." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task384_socialiqa_question_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task384_socialiqa_question_classification.json new file mode 100644 index 000000000..1b7df07dc --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task384_socialiqa_question_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context passage, an answer, and a question. Your task is to classify whether the question for this answer is correct or not, based on the given context with commonsense reasoning about social situations. If it's correct, return \"True\"; otherwise, return \"False\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task385_socialiqa_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task385_socialiqa_incorrect_answer_generation.json new file mode 100644 index 000000000..80b2238b4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task385_socialiqa_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context passage, a question, and three answer options. Your task is to return an incorrect answer option to the question from the choices given. For all questions, only one of the three answer options is correct. Pick one of the two incorrect answer options as the output."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task386_semeval_2018_task3_irony_detection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task386_semeval_2018_task3_irony_detection.json new file mode 100644 index 000000000..2c1e93afb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task386_semeval_2018_task3_irony_detection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a tweet. You must judge whether the tweet is ironic or not. We define two types of irony for this task (\"polarity\",\"situational\"). Situational irony happens when a situation fails to meet some expectations. Polarity irony happens when irony is achieved by inverting the intended sentence. Label the instances as \"ironic\" or \"not\" based on your judgment. Note that URLs in the text have been replaced with [Link]." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task387_semeval_2018_task3_irony_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task387_semeval_2018_task3_irony_classification.json new file mode 100644 index 000000000..6829147e0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task387_semeval_2018_task3_irony_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a tweet that contains some form of irony. You must classify the type of irony the tweet has. Label the tweets (\"polarity\",\"situational\",\"other\") based on the irony they have. Situational irony happens when a situation fails to meet some expectations, Label these instances as \"situational\". polarity irony happens when irony is achieved by inverting the intended sentence, Label these instances as \"polarity\". 
There are other kinds of ironies that are neither polarity nor situational, Label these instances as \"other\". Note that URLs in the text have been replaced with [Link]." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task388_torque_token_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task388_torque_token_classification.json new file mode 100644 index 000000000..134aedca2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task388_torque_token_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, a passage will be given and the goal is to identify an event from the passage. An event is defined as a single word representing something that happened, is happening, or may happen. An event can be factual or hypothetical, positive or negative, certain or uncertain. While most events are based on verbs, an event can also be based on a noun (ex. storm, snow, rainfall) or a copula verb (is, was, been, etc.). The event must not be a pronoun or an adjective. For noun events with multiple words, use the last word in the phrase as event." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task389_torque_generate_temporal_question.json b/src/unitxt/catalog/instructions/natural_instructions/train/task389_torque_generate_temporal_question.json new file mode 100644 index 000000000..c259c64e8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task389_torque_generate_temporal_question.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, a passage will be given and the goal is to generate a question about temporal relations based on that passage. A temporal relation describes the relation between two things with respect to time e.g., something happens/starts/terminates/... immediately/shortly/usually/... 
before/after/during/... something else.\n Your question should include an event, or ask about an event, and should not be a yes/no question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task390_torque_text_span_selection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task390_torque_text_span_selection.json new file mode 100644 index 000000000..cf02b5caf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task390_torque_text_span_selection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be given a passage, a question and a list of single-word events identified from the passage. The goal is to point out all events from the given event list that can answer the question. If a question is unanswerable or none of the events answer the question, output should be empty." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task397_semeval_2018_task1_tweet_anger_detection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task397_semeval_2018_task1_tweet_anger_detection.json new file mode 100644 index 000000000..77067f602 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task397_semeval_2018_task1_tweet_anger_detection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a tweet. You must judge whether the author of the tweet is angry or not. Label the instances as \"Angry\" or \"Not angry\" based on your judgment." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task398_semeval_2018_task1_tweet_joy_detection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task398_semeval_2018_task1_tweet_joy_detection.json new file mode 100644 index 000000000..ded12267e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task398_semeval_2018_task1_tweet_joy_detection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a tweet. You must judge whether the author of the tweet is happy or not. Label the instances as \"Happy\" or \"Not happy\" based on your judgment." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task399_semeval_2018_task1_tweet_sadness_detection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task399_semeval_2018_task1_tweet_sadness_detection.json new file mode 100644 index 000000000..4cb4417f3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task399_semeval_2018_task1_tweet_sadness_detection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a tweet. You must judge whether the author of the tweet is sad or not. Label the instances as \"Sad\" or \"Not sad\" based on your judgment. You can get help from hashtags and emojis, but you should not judge only based on them, and should pay attention to tweet's text as well." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task400_paws_paraphrase_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task400_paws_paraphrase_classification.json new file mode 100644 index 000000000..d8191ed12 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task400_paws_paraphrase_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a sentence pair from Wikipedia that have high lexical overlap. If the sentences have the same meaning and are just paraphrases of each other label them as \"Paraphrase\", if not label them as \"Not paraphrase\". The two sentences are separated by a new line." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task403_creak_commonsense_inference.json b/src/unitxt/catalog/instructions/natural_instructions/train/task403_creak_commonsense_inference.json new file mode 100644 index 000000000..3fa2160ff --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task403_creak_commonsense_inference.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a statement and an explanation giving you further knowledge about an entity in the statement. You must judge whether the statement is true or false based on the explanation. Label an instance as \"True\" if the explanation confirms the statement or doesn't disprove it. Label an instance as \"False\" if the explanation disproves the statement. The statement and explanation are separated by a newline character."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task405_narrativeqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task405_narrativeqa_question_generation.json new file mode 100644 index 000000000..2150aaa1e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task405_narrativeqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a summary of a story. You need to create a question that can be answered from the story. You can create a question about characters, events, facts and beliefs, etc. Your question should be specific, try not to use pronouns instead of full names. As the stories are sometimes movie plots, they will contain actor names in parentheses. You should not use those names. Only use character names. Try to ask a question about all parts of the plot, not just the beginning." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task413_mickey_en_sentence_perturbation_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task413_mickey_en_sentence_perturbation_generation.json new file mode 100644 index 000000000..b06345566 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task413_mickey_en_sentence_perturbation_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence, generate a new sentence by performing small changes on the sentence. Here, make sure that the changes are semantically related and syntactically similar to the input. And the generated sentence should have high commonsense plausibility, that is to have reasonable probability of it being true." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task428_senteval_inversion.json b/src/unitxt/catalog/instructions/natural_instructions/train/task428_senteval_inversion.json new file mode 100644 index 000000000..d69910b4b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task428_senteval_inversion.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a sentence. You must judge whether there exist two consecutive words within the sentence with flipped orders, that is, whether the sentence will make sense and be correct if the order of two consecutive words changes. Label the instances as \"Inversion\" or \"Original\" based on your judgment." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task429_senteval_tense.json b/src/unitxt/catalog/instructions/natural_instructions/train/task429_senteval_tense.json new file mode 100644 index 000000000..18904b052 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task429_senteval_tense.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a sentence. You must judge whether the main verb of the sentence is in present or past tense. Label the instances as \"Present\" or \"Past\" based on your judgment. If there is no verb in the given text, answer \"Present\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task430_senteval_subject_count.json b/src/unitxt/catalog/instructions/natural_instructions/train/task430_senteval_subject_count.json new file mode 100644 index 000000000..b4fa2460c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task430_senteval_subject_count.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a sentence. 
You must judge whether the subject of the main clause is singular or plural. Label the instances as \"Singular\" or \"Plural\" based on your judgment." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task431_senteval_object_count.json b/src/unitxt/catalog/instructions/natural_instructions/train/task431_senteval_object_count.json new file mode 100644 index 000000000..0eb704716 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task431_senteval_object_count.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a sentence. You must judge whether the object of the main clause is singular(like: apple) or plural(like: apartments). Label the instances as \"Singular\" or \"Plural\" based on your judgment." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task453_swag_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task453_swag_answer_generation.json new file mode 100644 index 000000000..acff28315 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task453_swag_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence, generate what should be the most likely next statement. The next statement should be reasonable and logically correct." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task454_swag_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task454_swag_incorrect_answer_generation.json new file mode 100644 index 000000000..6e39f0565 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task454_swag_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence, generate a most unlikely next statement. 
The next statement should not be logically relevant to the given context" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task455_swag_context_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task455_swag_context_generation.json new file mode 100644 index 000000000..cf5e26b55 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task455_swag_context_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence, generate a most likely context or previous statement. The previous statement should be relevant to the given statement." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task456_matres_intention_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task456_matres_intention_classification.json new file mode 100644 index 000000000..93eda7676 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task456_matres_intention_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a context and a verb separated with a newline character. You have to identify if the given verb implies an opinion, an intention, a wish or not. Please note that a verb refers to an intention only if it refers to an event planned to happen in the future and is not conditional (or part of a condition). The output should be: 'Yes' if the verb refers to an opinion, an intention, or a wish; and 'No' otherwise." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task457_matres_conditional_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task457_matres_conditional_classification.json new file mode 100644 index 000000000..dc3f37cfa --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task457_matres_conditional_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a context and a verb separated with a newline character. You have to decide if the given verb implies a hypothetical or conditioned action or not. We say a verb is hypothetical if it involves or is based on a suggested idea or theory. A verb is conditional if it appears in a conditional phrase and is dependent on something else. Note that an event that happened in the past or is happening now cannot be conditional. The output should be \"Yes\" if the verb is conditional or hypothetical and \"No\" otherwise." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task458_matres_negation_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task458_matres_negation_classification.json new file mode 100644 index 000000000..932e1890e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task458_matres_negation_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a context and a verb separated with a newline character, and you have to answer if the given verb is a negation or not. A verb is a negation if it is not going to exist, not happen, or has no effect. The output should be \"Yes\" if the verb is a negation and \"No\" otherwise." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task459_matres_static_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task459_matres_static_classification.json new file mode 100644 index 000000000..9e9d234bd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task459_matres_static_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a context and a verb separated with a newline character, and you have to answer if the given verb is static or not. We say a verb is static if it is about an event that doesn't change or it happens regularly. The output should be \"Yes\" if the verb is static and \"No\" otherwise." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task460_qasper_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task460_qasper_answer_generation.json new file mode 100644 index 000000000..e164b4526 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task460_qasper_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a context from an academic paper and a question separated with a \n. You have to answer the question based on the context." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task461_qasper_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task461_qasper_question_generation.json new file mode 100644 index 000000000..612166755 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task461_qasper_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a context from an academic paper and you have to write an answerable question based on the context. Your questions can be extractive, abstractive, or yes-no questions." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task462_qasper_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task462_qasper_classification.json new file mode 100644 index 000000000..5f8d20130 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task462_qasper_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you will be presented with a context from an academic paper and a question based on the context. You have to classify the questions into \"Extractive\", \"Abstractive\", or \"Yes-no\" questions. Extractive questions can be answered by concatenating extracts taken from a context into a summary while answering abstractive questions involves paraphrasing the context using novel sentences. Yes-no question is a question whose expected answer is one of two choices, one that affirms the question and one that denies the question. Typically, the choices are either yes or no." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task469_mrqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task469_mrqa_answer_generation.json new file mode 100644 index 000000000..c79e0c4b5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task469_mrqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a question and a context passage, generate the answer having the word or phrase from the context passage. Here, the answer should be a shortest continous span from the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task470_mrqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task470_mrqa_question_generation.json new file mode 100644 index 000000000..9b1f83390 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task470_mrqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a context passage, generate a question from the passage such that its answer is shortest continous span from the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task471_haspart_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task471_haspart_answer_generation.json new file mode 100644 index 000000000..8805548fa --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task471_haspart_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given an entity as input, output another entity which is part of the input entity. These are entities of meronym. In linguistics, meronymy is a semantic relation between a meronym denoting a part and a holonym denoting a whole. 
In simpler terms, a meronym (i.e., output entity) is in a part-of relationship with its holonym (i.e., input entity)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task472_haspart_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task472_haspart_classification.json new file mode 100644 index 000000000..6d03dc99f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task472_haspart_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given two entities as input, classify as \"yes\" if second entity is the part of the first entity. Otherwise classify them as \"no\". These are entities of meronym In linguistics, meronymy is a semantic relation between a meronym denoting a part and a holonym denoting a whole. In simpler terms, a meronym (i.e., second entity) is in a part-of relationship with its holonym (i.e., first entity)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task475_yelp_polarity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task475_yelp_polarity_classification.json new file mode 100644 index 000000000..61fc403ce --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task475_yelp_polarity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given Yelp reviews. The task is to classify a review as \"POSITIVE\" if the overall sentiment of the review is positive or as \"NEGATIVE\" if the overall sentiment of the review is negative." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task476_cls_english_books_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task476_cls_english_books_classification.json new file mode 100644 index 000000000..47ec2e0e0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task476_cls_english_books_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given books product reviews in English language. The goal is to classify the review as \"POS\" if the overall sentiment of the review is positive or as \"NEG\" if the overall sentiment of the review is negative." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task477_cls_english_dvd_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task477_cls_english_dvd_classification.json new file mode 100644 index 000000000..caf3fd8bc --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task477_cls_english_dvd_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given product reviews about dvds. The goal is to classify the review as \"POS\" if the overall sentiment of the review is positive(the reviewer is satisfied) or as \"NEG\" if the overall sentiment of the review is negative(the reviewer is not satisfied)." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task478_cls_english_music_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task478_cls_english_music_classification.json new file mode 100644 index 000000000..262b0d2c1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task478_cls_english_music_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given music product reviews in English language. The goal is to classify the review as \"POS\" if the overall sentiment of the review is positive or as \"NEG\" if the overall sentiment of the review is negative." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task488_extract_all_alphabetical_elements_from_list_in_order.json b/src/unitxt/catalog/instructions/natural_instructions/train/task488_extract_all_alphabetical_elements_from_list_in_order.json new file mode 100644 index 000000000..6b59a5c41 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task488_extract_all_alphabetical_elements_from_list_in_order.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list A. You need to find all the elements of the list that are alphabets in the same order as they appear in the list A. Do not change their case/capitalization." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task489_mwsc_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task489_mwsc_question_generation.json new file mode 100644 index 000000000..efce2876a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task489_mwsc_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You need to read the given sentence and construct a question about the information present in the sentence. Construct a question in such a way that (i) it is unambiguous, (ii) its answer is unique. The question must involve coreference resolution which is a task of clustering mentions in text that refer to the same underlying real world entities. For example let's take a sentence 'I voted for Obama because he was most aligned with my values, she said.' Here in this example 'I', 'my', and 'she' belong to the same cluster and 'Obama' and 'he' belong to the same cluster. Now let's discuss another example , original sentence: 'I voted for Trump because he was most aligned with my values',John said. Now here is the same sentence with resolved coreferences: 'John voted for Trump because Trump was most aligned with John's values',John said." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task490_mwsc_options_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task490_mwsc_options_generation.json new file mode 100644 index 000000000..53937cee7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task490_mwsc_options_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a sentence and a question, construct 2 answer options in a specific format i.e. ['option1','option2']. The answer options have to be text spans from the given sentence. 
Only one among the options should be the correct answer to the given question. Note that, the correct answer to the given question will require understanding of coreference resolution. Coreference resolution is the task of clustering mentions in text that refer to the same underlying real world entities." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task491_mwsc_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task491_mwsc_answer_generation.json new file mode 100644 index 000000000..bf1f18e5d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task491_mwsc_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a sentence and question. Based on the information provided in a given sentence, you should identify the shortest continuous text span from the sentence that serves as an answer to the given question. Answer the question using coreference resolution. Coreference resolution is the task of clustering mentions in text that refer to the same underlying real world entities. For example let's take a sentence 'I voted for Obama because he was most aligned with my values, she said.' Here in this example 'I', 'my', and 'she' belong to the same cluster and 'Obama' and 'he' belong to the same cluster. Now let's discuss another example , original sentence: 'I voted for Trump because he was most aligned with my values',John said. Now here is the same sentence with resolved coreferences: 'John voted for Trump because Trump was most aligned with John's values',John said. 
" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task492_mwsc_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task492_mwsc_incorrect_answer_generation.json new file mode 100644 index 000000000..e41cebd73 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task492_mwsc_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, based on the given sentence and the question, you are asked to generate an incorrect answer. The incorrect answer has to be a text span from the given sentence. Note that, the correct answer to the given question will require understanding of coreference resolution. Coreference resolution is the task of clustering mentions in text that refer to the same underlying real world entities. For example let's take a sentence 'I voted for Obama because he was most aligned with my values, she said.' Here in this example 'I', 'my', and 'she' belong to the same cluster and 'Obama' and 'he' belong to the same cluster. Now let's discuss another example , original sentence: 'I voted for Trump because he was most aligned with my values',John said. Now here is the same sentence with resolved coreferences: 'John voted for Trump because Trump was most aligned with John's values',John said. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task493_review_polarity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task493_review_polarity_classification.json new file mode 100644 index 000000000..fc3a66569 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task493_review_polarity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given reviews from Amazon, classify those review based on their content into two classes: Negative or Positive." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task494_review_polarity_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task494_review_polarity_answer_generation.json new file mode 100644 index 000000000..9a049c78c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task494_review_polarity_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a review text from amazon and its polarity (either positive or negative). Generate answer \"True\" if given sentence and its polarity match, otherwise generate answer \"False\". A review is considered positive if the reviewer is satisfied with the product. Otherwise, it is considered negative." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task495_semeval_headline_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task495_semeval_headline_classification.json new file mode 100644 index 000000000..5996727ad --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task495_semeval_headline_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given news headlines and an edited word. The original sentence has word within given format {word}. Create new headlines by replacing {word} in the original sentence with edit word. Classify news headlines into \"Funny\" and \"Not Funny\" that have been modified by humans using an edit word to make them funny. 
" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task496_semeval_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task496_semeval_answer_generation.json new file mode 100644 index 000000000..db464b999 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task496_semeval_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given news headlines, an edited word and funniness labels. The original sentence has word with the given format {word}. Create new headlines by replacing {word} in the original sentence with edit word. Your task is to generate answer \"Yes\" if an edited sentence matches funniness label, otherwise generate answer \"No\". " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task497_extract_all_numbers_from_list_in_order.json b/src/unitxt/catalog/instructions/natural_instructions/train/task497_extract_all_numbers_from_list_in_order.json new file mode 100644 index 000000000..45843581a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task497_extract_all_numbers_from_list_in_order.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list A. You need to find all the elements of the list that are numbers in the same order as they appear in the list A." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task499_extract_and_add_all_numbers_from_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task499_extract_and_add_all_numbers_from_list.json new file mode 100644 index 000000000..6a761a6b4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task499_extract_and_add_all_numbers_from_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list A. You need to find all the elements of the list that are numbers and calculate their sum." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task504_count_all_alphabetical_elements_in_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task504_count_all_alphabetical_elements_in_list.json new file mode 100644 index 000000000..32c39ec86 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task504_count_all_alphabetical_elements_in_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list. A list contains several comma-separated items written within brackets. You need to return the count of all the alphabetical elements in the given list. Return 0 if no alphabetical element in the list" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task505_count_all_numerical_elements_in_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task505_count_all_numerical_elements_in_list.json new file mode 100644 index 000000000..5d8289d01 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task505_count_all_numerical_elements_in_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list. 
A list contains several comma-separated items written within brackets. You need to return the count of all the numerical elements in the given list. Return 0 if no numerical element in the list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task506_position_of_all_alphabetical_elements_in_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task506_position_of_all_alphabetical_elements_in_list.json new file mode 100644 index 000000000..e753a22a9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task506_position_of_all_alphabetical_elements_in_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list. A list contains several comma-separated items written within brackets. You need to return the position of all the alphabetical elements in the given list in order. Assume the position of the 1st element to be 1. Return -1 if no alphabetical element is in the list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task507_position_of_all_numerical_elements_in_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task507_position_of_all_numerical_elements_in_list.json new file mode 100644 index 000000000..2dc08caf8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task507_position_of_all_numerical_elements_in_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list. A list contains several comma-separated items written within brackets. You need to return the position of all the numerical elements in the given list in order. Assume the position of the 1st element to be 1. Return -1 if no numerical element is in the list." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately.json b/src/unitxt/catalog/instructions/natural_instructions/train/task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately.json new file mode 100644 index 000000000..dd53f73d6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task509_collate_of_all_alphabetical_and_numerical_elements_in_list_separately.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list. A list contains several comma-separated items written within brackets. You need to collate all the alphabetical elements at the start of the list followed by all the numerical elements of the list. Maintain the order in which the alphabetical elements appear in the given input list, and do the same for the numerical elements." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task512_twitter_emotion_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task512_twitter_emotion_classification.json new file mode 100644 index 000000000..2ab11855d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task512_twitter_emotion_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given Twitter posts. Your task is to label the post's emotion (as expressed by the user) as sadness, joy, love, anger, fear, or surprise." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task513_argument_stance_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task513_argument_stance_classification.json new file mode 100644 index 000000000..19c2af663 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task513_argument_stance_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a topic and an argument. Decide the argument's stance towards that topic. The argument's stance is in favor or against the topic. If the argument supports that topic, answer with \"in favor\"; otherwise, if the argument opposes the topic, answer with \"against\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task514_argument_consequence_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task514_argument_consequence_classification.json new file mode 100644 index 000000000..8395bd09c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task514_argument_consequence_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You will be given a topic and an argument. Your task is to answer whether the topic and the argument are related or not. A related argument should provide more details about the outcomes of the topic. If the argument refers to or suggests a consequence related to that topic, answer with \"yes\"; otherwise, answer with \"no\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task515_senteval_odd_word_out.json b/src/unitxt/catalog/instructions/natural_instructions/train/task515_senteval_odd_word_out.json new file mode 100644 index 000000000..5fcbb2439 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task515_senteval_odd_word_out.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You must judge whether a single noun or verb has been replaced with another word with the same part of speech. The inversion would result in the sentence sounding unnatural, So unnatural sentences will be considered changed. Label the instances as \"Original\" or \"Changed\" based on your judgment." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task516_senteval_conjoints_inversion.json b/src/unitxt/catalog/instructions/natural_instructions/train/task516_senteval_conjoints_inversion.json new file mode 100644 index 000000000..6fcead3c0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task516_senteval_conjoints_inversion.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a sentence with one coordinating conjunction (for, and, nor, but, or, yet, and so). You must judge whether the order of two coordinated clausal conjoints have been inverted or not. Inversion would result in the sentence sounding unnatural. Label the instances as \"Original\" or \"Inversion\" based on your judgment." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task517_emo_classify_emotion_of_dialogue.json b/src/unitxt/catalog/instructions/natural_instructions/train/task517_emo_classify_emotion_of_dialogue.json new file mode 100644 index 000000000..0372bcbda --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task517_emo_classify_emotion_of_dialogue.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given some text dialogue and you need to infer the underlying emotion of the text. The possible emotions are happy, sad, angry, or other." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task518_emo_different_dialogue_emotions.json b/src/unitxt/catalog/instructions/natural_instructions/train/task518_emo_different_dialogue_emotions.json new file mode 100644 index 000000000..ffb59fb95 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task518_emo_different_dialogue_emotions.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given two dialogues. You need to determine if both dialogues have the same underlying emotion. The possible emotions are happy, sad, angry, or other. If they do output 'yes', if not output 'no'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task521_trivia_question_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task521_trivia_question_classification.json new file mode 100644 index 000000000..d4b9b29a5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task521_trivia_question_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a text passage from a trivia quiz. 
You should choose the category this question belongs to from these categories: History, Science, Social Science, Fine Arts, Literature. You can only choose one category, so if in doubt, please choose the closest match." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task522_news_editorial_summary.json b/src/unitxt/catalog/instructions/natural_instructions/train/task522_news_editorial_summary.json new file mode 100644 index 000000000..bebfc5e7e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task522_news_editorial_summary.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Your task is to extract the thesis of an opinionated news article by selecting some of its text segments. The thesis is a summarization of what the author wants to persuade the reader of. Your answer should consist of segments of the given text. Note that you are not allowed to combine different sentences." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task523_find_if_numbers_or_alphabets_are_more_in_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task523_find_if_numbers_or_alphabets_are_more_in_list.json new file mode 100644 index 000000000..07a1b7c70 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task523_find_if_numbers_or_alphabets_are_more_in_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list A. If the count of numbers is more than that of alphabets in the list, answer 'Numbers Win'. If the count of alphabets is more than that of numbers in the list, answer 'Alphabets Win'. If the count of numbers is same as that of alphabets in the list, answer 'Numbers and Alphabets are Tied'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task547_alt_translation_entk_en.json b/src/unitxt/catalog/instructions/natural_instructions/train/task547_alt_translation_entk_en.json new file mode 100644 index 000000000..cd674f866 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task547_alt_translation_entk_en.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, given a sentence in English Tokens, your task is to convert it into the English language" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task550_discofuse_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task550_discofuse_sentence_generation.json new file mode 100644 index 000000000..4ee4d3f25 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task550_discofuse_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a second sentence. Your task is to generate the first sentence on the same topic but incoherent and inconsistent with the second sentence." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task560_alt_translation_en_entk.json b/src/unitxt/catalog/instructions/natural_instructions/train/task560_alt_translation_en_entk.json new file mode 100644 index 000000000..d6308d73b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task560_alt_translation_en_entk.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, given a sentence in the English language, your task is to convert it into English Tokens." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task563_discofuse_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task563_discofuse_answer_generation.json new file mode 100644 index 000000000..66e162f7b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task563_discofuse_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two sentences in the English language (Sentence 1 and Sentence 2). Your task is to identify the connecting word between the two sentences." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task564_discofuse_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task564_discofuse_classification.json new file mode 100644 index 000000000..0d054570b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task564_discofuse_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two sentences in the English language and your task is to classify them into one of their discourse types. A discourse type is an indicator to classify the given two sentences on the basis of a co-text as well as a relevant context. There are 13 discourse types in total which are 'SINGLE_S_COORD', 'SINGLE_CATAPHORA', 'SINGLE_CONN_INNER', 'SINGLE_APPOSITION', 'SINGLE_VP_COORD', 'SINGLE_CONN_START', 'PAIR_ANAPHORA', 'PAIR_CONN', 'SINGLE_RELATIVE', 'SINGLE_CONN_INNER_ANAPHORA', 'SINGLE_S_COORD_ANAPHORA', 'PAIR_CONN_ANAPHORA' and 'PAIR_NONE'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task565_circa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task565_circa_answer_generation.json new file mode 100644 index 000000000..1c784cebe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task565_circa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question. Your task is to generate an answer that is relevant to the question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task566_circa_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task566_circa_classification.json new file mode 100644 index 000000000..6be0dc3c8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task566_circa_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two sentences. Your task is to classify the given sentences as \"Yes\" if they have same meaning; otherwise, classify them as \"No\". " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task567_circa_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task567_circa_text_generation.json new file mode 100644 index 000000000..b80864ae9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task567_circa_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a question, and your task is to predict the context of the question. We assume that someone named X asked the question from Y. The context of the question means the previous situation that led X to ask this question." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task568_circa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task568_circa_question_generation.json new file mode 100644 index 000000000..bcd1ff074 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task568_circa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an answer, and your task is to generate a reasonable question for that answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task573_air_dialogue_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task573_air_dialogue_classification.json new file mode 100644 index 000000000..64cb0f3c5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task573_air_dialogue_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a conversation between a flight agent and the customer. You are given 4 options and you need to select the goal of the conversation. 
It is provided as part of customer's context, which has to be one of the following: `book`: Make a new reservation, `cancel`: Cancel an existing reservation, `no_flight`: No flight found for the customer's preference, `no_reservation`: No reservation / No change / No cancellation was made in the conversation, mostly enquiring details" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task574_air_dialogue_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task574_air_dialogue_sentence_generation.json new file mode 100644 index 000000000..1494ca259 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task574_air_dialogue_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a dialogue between a customer and a flight booking agent with a gap in the conversation. Your job is to find the answer of the previous dialogue. Avoid using irrelevant extra information while creating the answer. The answer should be relevant to the question before the blank. If you fill the blank with a question, it should have an answer from the agent in the given dialogue. Fill the gap marked with underline." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task575_air_dialogue_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task575_air_dialogue_classification.json new file mode 100644 index 000000000..07801c8b9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task575_air_dialogue_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a dialogue from a conversation between an agent and a customer. Your task is to determine the speaker of the dialogue. Answer with \"agent\" or \"customer\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task576_curiosity_dialogs_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task576_curiosity_dialogs_answer_generation.json new file mode 100644 index 000000000..879cf041b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task576_curiosity_dialogs_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, the input is a set of dialogues between a user and an assistant. You need to find the dialogue that is basically a response given to a question or an aspect of the user." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task577_curiosity_dialogs_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task577_curiosity_dialogs_classification.json new file mode 100644 index 000000000..6d786a2a3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task577_curiosity_dialogs_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a dialogue between a user and an assistant, where users and assistants converse about geographic topics like geopolitical entities and locations. The task here is to find if the dialogue is by the user or assistant. Classify your answers into user and assistant." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task578_curiosity_dialogs_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task578_curiosity_dialogs_answer_generation.json new file mode 100644 index 000000000..d902f028c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task578_curiosity_dialogs_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given dialogue, and you have to find the most critical location in the given conversation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task579_socialiqa_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task579_socialiqa_classification.json new file mode 100644 index 000000000..328b8fd5b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task579_socialiqa_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context, a question, three options, and an answer. Your task is to classify whether the given answer is correct or not by providing 'Yes' or 'No', based on the context with commonsense reasoning about social situations." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task580_socialiqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task580_socialiqa_answer_generation.json new file mode 100644 index 000000000..0068ed539 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task580_socialiqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context, a question, and three options. Your task is to find the correct answer to the question using the given context and options. 
Also, you may need to use commonsense reasoning about social situations to answer the questions. Classify your answers into 'A', 'B', and 'C'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task581_socialiqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task581_socialiqa_question_generation.json new file mode 100644 index 000000000..77a11301a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task581_socialiqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given context and an answer. Your task is to generate the question for this answer based on the given context with commonsense reasoning about social situations." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task582_naturalquestion_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task582_naturalquestion_answer_generation.json new file mode 100644 index 000000000..723ab7740 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task582_naturalquestion_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an open-domain question that can be answered based on factual information. Your task is to provide a \\*short\\* answer (in a few words only) for the given question. The short answer can be one or more entities or it can also be boolean \\*yes\\* or \\*no\\*."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task583_udeps_eng_coarse_pos_tagging.json b/src/unitxt/catalog/instructions/natural_instructions/train/task583_udeps_eng_coarse_pos_tagging.json new file mode 100644 index 000000000..14ba39a66 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task583_udeps_eng_coarse_pos_tagging.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to provide the parts-of-speech tag of a word present in a sentence specified within curly braces ( '{{ ... }}' ). The parts-of-speech tags are coarse labels that represent a category of words with similar grammatical properties. The list of part-of-speech tags i.e. tagset of this corpus is 'ADJ': Adjectives are words that typically modify nouns and specify their properties or attributes, 'ADP': Adposition is a cover term for prepositions and postpositions, 'ADV': Adverbs are words that typically modify verbs for such categories as time, place, direction or manner, 'AUX': An auxiliary is a function word that accompanies the lexical verb of a verb phrase and expresses grammatical distinctions not carried by the lexical verb, such as person, number, tense, mood, aspect, voice or evidentiality, 'CCONJ': A coordinating conjunction is a word that links words or larger constituents without syntactically subordinating one to the other and expresses a semantic relationship between them, 'DET': Determiners are words that modify nouns or noun phrases and express the reference of the noun phrase in context, 'INTJ': An interjection is a word that is used most often as an exclamation or part of an exclamation, 'NOUN': Nouns are a part of speech typically denoting a person, place, thing, animal or idea, 'NUM': A numeral is a word, functioning most typically as a determiner, adjective or pronoun, that expresses a number and a relation to the number, such as quantity, sequence, frequency 
or fraction, 'PART': Particles are function words that must be associated with another word or phrase to impart meaning and that do not satisfy definitions of other universal parts of speech, 'PRON': Pronouns are words that substitute for nouns or noun phrases, whose meaning is recoverable from the linguistic or extralinguistic context, 'PROPN': A proper noun is a noun (or nominal content word) that is the name (or part of the name) of a specific individual, place, or object, 'PUNCT': Punctuation marks are non-alphabetical characters and character groups used in many languages to delimit linguistic units in printed text, 'SCONJ': A subordinating conjunction is a conjunction that links constructions by making one of them a constituent of the other. The subordinating conjunction typically marks the incorporated constituent which has the status of a (subordinate) clause, 'SYM': A symbol is a word-like entity that differs from ordinary words by form, function or both, 'VERB': A verb is a member of the syntactic class of words that typically signal events and actions, can constitute a minimal predicate in a clause, and govern the number and types of other constituents which may occur in the clause, 'X': The tag X is used for words that for some reason cannot be assigned a real part-of-speech category." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task584_udeps_eng_fine_pos_tagging.json b/src/unitxt/catalog/instructions/natural_instructions/train/task584_udeps_eng_fine_pos_tagging.json new file mode 100644 index 000000000..74b388c01 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task584_udeps_eng_fine_pos_tagging.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to provide the parts-of-speech tag of a word present in a sentence specified within curly braces ( '{{ ... }}' ). 
The parts-of-speech tags are fine labels that represent a category of words with similar grammatical properties. The list of part-of-speech tags i.e. tagset of this corpus is: '$': Dollar Sign, \"''\": Single Quotes, ',': Comma Symbol, '-LRB-': Left Parentheses, '-RRB-': Right Parentheses, '.': Period, ':': Colon, 'ADD': Email Address, 'AFX': Affix, 'CC': Coordinating conjunction, 'CD': Cardinal Number, 'DT': Determiner, 'EX': Existential there, 'FW': Foreign Word, 'GW': Go with, 'HYPH': Hyphen symbol, 'IN': Preposition or a subordinating conjunction, 'JJ': Adjective, 'JJR': A comparative Adjective, 'JJS': A Superlative Adjective, 'LS': List item Marker, 'MD': Modal, 'NFP': Superfluous punctuation, 'NN': Singular Noun, 'NNP': Singular Proper Noun, 'NNPS': Plural Proper Noun, 'NNS': Plural Noun, 'PDT': Pre-determiner, 'POS': Possessive Ending, 'PRP': Personal pronoun, 'PRP$': Possessive Pronoun, 'RB': Adverb, 'RBR': Comparative Adverb, 'RBS': Superlative Adverb, 'RP': Particle, 'SYM': Symbol, 'TO': To, 'UH': Interjection, 'VB': Base form Verb, 'VBD': Verb in Past tense, 'VBG': Verb in present participle, 'VBN': Verb in past participle, 'VBP': Verb in non-3rd person singular present, 'VBZ': Verb in 3rd person singular present, 'WDT': Wh-determiner, 'WP': Wh-pronoun, 'WP$': Possessive Wh-pronoun, 'WRB': Wh-adverb, 'XX': Unknown, '``': Double backticks." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task585_preposition_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task585_preposition_classification.json new file mode 100644 index 000000000..e84776bdf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task585_preposition_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given an input that contains two words, and your task is to predict the correct preposition that connects these two words.
Predict the preposition that explicitly conveys both words' meaning, e.g., Word1: king \n Word2: fort: \"king of fort\". Possible prepositions are: \"of\", \"on\", \"in\", \"for\", \"from\", \"about\", and \"with\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task586_amazonfood_polarity_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task586_amazonfood_polarity_classification.json new file mode 100644 index 000000000..8e397feff --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task586_amazonfood_polarity_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a review of Amazon's food products. Your task is to divide them into two classes: negative or positive, depending on the content of the review." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task587_amazonfood_polarity_correction_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task587_amazonfood_polarity_correction_classification.json new file mode 100644 index 000000000..b2d29576c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task587_amazonfood_polarity_correction_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an amazon food product review and its polarity (positive or negative). Your task is to answer \"True\" if the specified sentence and its polarity match; otherwise, answer \"False\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task588_amazonfood_rating_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task588_amazonfood_rating_classification.json new file mode 100644 index 000000000..46dbf0305 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task588_amazonfood_rating_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a review from Amazon's food products. Your task is to generate a rating for the product on a scale of 1-5 based on the review. The rating means 1: extremely poor, 2: poor, 3: neutral or mixed, 4: good, 5: extremely good. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task589_amazonfood_summary_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task589_amazonfood_summary_text_generation.json new file mode 100644 index 000000000..17e3d5db7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task589_amazonfood_summary_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a review from Amazon's food products. Your task is to generate a short summary of the given review in the input. Note that you don't need to write a complete sentence as a summary." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task590_amazonfood_summary_correction_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task590_amazonfood_summary_correction_classification.json new file mode 100644 index 000000000..1147916ae --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task590_amazonfood_summary_correction_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, You are given an amazon food product review and its summary. Your task is to Generate \"True\" if given review and its summary match, otherwise generate \"False\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task591_sciq_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task591_sciq_answer_generation.json new file mode 100644 index 000000000..653a09e4b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task591_sciq_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a scientific question, generate a correct answer to it." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task592_sciq_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task592_sciq_incorrect_answer_generation.json new file mode 100644 index 000000000..f4c8c8e75 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task592_sciq_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a scientific question, generate an incorrect answer to the given question. The incorrect answer should be a plausible alternative to the correct answer. The answer should be some other item belonging to the same category as the correct answer but should be incorrect." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task593_sciq_explanation_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task593_sciq_explanation_generation.json new file mode 100644 index 000000000..fd04d3a85 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task593_sciq_explanation_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a scientific question and its correct answer, generate supporting facts for the answer. This supporting fact can be an explanation for the answer to the given question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task594_sciq_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task594_sciq_question_generation.json new file mode 100644 index 000000000..6e956b5d4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task594_sciq_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a scientific passage and an answer, generate a question for the given answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task595_mocha_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task595_mocha_answer_generation.json new file mode 100644 index 000000000..02e44d0ec --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task595_mocha_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context passage, followed by a question that needs to be answered. Based on the paragraph, you must write unambiguous answers to the questions and your answer must refer to a specific phrase from the paragraph. If multiple answers seem to exist, write the answer that is the most plausible." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task596_mocha_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task596_mocha_question_generation.json new file mode 100644 index 000000000..4acd50361 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task596_mocha_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a context passage. Your job is to generate relevant questions that can be answered by directly referring to the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task597_cuad_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task597_cuad_answer_generation.json new file mode 100644 index 000000000..824776098 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task597_cuad_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a passage that represents a legal contract or clause between multiple parties, followed by a question that needs to be answered. Based on the paragraph, you must write unambiguous answers to the questions and your answer must refer to a specific phrase from the paragraph. If multiple answers seem to exist, write the answer that is the most plausible."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task598_cuad_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task598_cuad_answer_generation.json new file mode 100644 index 000000000..ad46d5bba --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task598_cuad_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a passage that represents a legal contract or clause between multiple parties, followed by a question that needs to be answered. Based on the paragraph, you must write the index where the answer starts. If multiple answers seem to exist, write the index of the answer that is the most plausible. If multiple indices must be used to answer the question, the output should be a comma-separated list of indices." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task599_cuad_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task599_cuad_question_generation.json new file mode 100644 index 000000000..820487509 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task599_cuad_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a passage that represents a legal contract or clause between multiple parties. Your job is to write questions that ask the basic details corresponding to the legal contracts or clauses. Avoid questions that can be answered correctly without actually understanding the paragraph, and which might have multiple answers. The answer to each question should be unambiguous."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task600_find_the_longest_common_substring_in_two_strings.json b/src/unitxt/catalog/instructions/natural_instructions/train/task600_find_the_longest_common_substring_in_two_strings.json new file mode 100644 index 000000000..a79d48ce0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task600_find_the_longest_common_substring_in_two_strings.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two strings A, B. Find the longest common substring in the strings A and B." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task605_find_the_longest_common_subsequence_in_two_lists.json b/src/unitxt/catalog/instructions/natural_instructions/train/task605_find_the_longest_common_subsequence_in_two_lists.json new file mode 100644 index 000000000..07072e37c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task605_find_the_longest_common_subsequence_in_two_lists.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two lists A,B. Find the longest common subsequence in the lists A and B." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task606_sum_of_all_numbers_in_list_between_positions_i_and_j.json b/src/unitxt/catalog/instructions/natural_instructions/train/task606_sum_of_all_numbers_in_list_between_positions_i_and_j.json new file mode 100644 index 000000000..5074d3de1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task606_sum_of_all_numbers_in_list_between_positions_i_and_j.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given inputs i,j, and A, where i and j are integers and A is a list. 
You need to return the sum of all the numerical elements in the list A between the positions i and j (including positions i and j). Return 0 if no numerical element is present in the list between the given ranges. i and j will be non-negative, and will always have a value less than the length of A. i will always be less than j." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task607_sbic_intentional_offense_binary_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task607_sbic_intentional_offense_binary_classification.json new file mode 100644 index 000000000..61fe78cdd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task607_sbic_intentional_offense_binary_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text from a social media post. Your task is to classify the given post into two categories: 1) yes if the given post is intentionally offensive, 2) no, otherwise. Also, generate label 'no' for offensive statements that appear to be unintentional, or non-offensive statements that are underhandedly offensive. Warning: the examples and instances may contain offensive language." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task608_sbic_sexual_offense_binary_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task608_sbic_sexual_offense_binary_classification.json new file mode 100644 index 000000000..e4534703a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task608_sbic_sexual_offense_binary_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text from a social media post. Your task is to classify the given post into two categories: 1) yes if the given post is sexually offensive, 2) no, otherwise. 
Emphasis on sexually offensive or any lewd reference. Generate label 'no' for offensive posts that do not reference sexually explicit content. Warning: the examples and instances may contain offensive language." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task609_sbic_potentially_offense_binary_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task609_sbic_potentially_offense_binary_classification.json new file mode 100644 index 000000000..ed1d549f6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task609_sbic_potentially_offense_binary_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text from a social media post. Your task is to classify the given post into two categories: 1) yes if the given post is potentially offensive to anyone (i.e., a subset of people, any particular person, etc.), 2) no, otherwise. Note that potentially offensive posts can contain sexual, racial, religious biased or offensive language. Warning: the examples and instances may contain offensive language." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task610_conllpp_ner.json b/src/unitxt/catalog/instructions/natural_instructions/train/task610_conllpp_ner.json new file mode 100644 index 000000000..75057a65b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task610_conllpp_ner.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text from a post. Your task is to find all of the proper nouns and label them. The labels are <B-PER>, <I-PER> for persons; <B-ORG>, <I-ORG> for organizations; <B-LOC>, <I-LOC> for locations; and <B-MISC>, <I-MISC> for other nouns. The capital 'B' denotes the first word of a proper noun phrase. The capital 'I' denotes all following words of the same noun phrase.
If a word is not a part of a proper noun phrase, do not label it." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task611_mutual_multi_turn_dialogue.json b/src/unitxt/catalog/instructions/natural_instructions/train/task611_mutual_multi_turn_dialogue.json new file mode 100644 index 000000000..0509b8691 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task611_mutual_multi_turn_dialogue.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you are given a small conversation between two persons and 4 options on how the conversation should continue. Your job is to choose the most reasonable option. The conversation and the options are separated by a newline character. Each dialogue in the conversation are separated by a comma. F and M indicate female and male, respectively." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task615_moviesqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task615_moviesqa_answer_generation.json new file mode 100644 index 000000000..f85615546 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task615_moviesqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an open-domain question from an open movie database. Your task is to provide an answer to that question. Try to only include the answer. Do not put it in a sentence." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task616_cola_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task616_cola_classification.json new file mode 100644 index 000000000..cd7dc08a0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task616_cola_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You're given a sentence and your task is to classify whether the sentence is acceptable or not. Any sentence which is grammatically correct, has a naturalistic text, is written by a native speaker and which minimizes superfluous content is acceptable, otherwise unacceptable. If the sentence is acceptable then write \"acceptable\", otherwise \"unacceptable\"." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task617_amazonreview_category_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task617_amazonreview_category_text_generation.json new file mode 100644 index 000000000..7ab37260a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task617_amazonreview_category_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a review from Amazon and your task is to generate the name of the category of the product based on the review given by the user. The categories are: kitchen, office product, watch, wireless, other, toy, digital video download, camera, jewelry, pet products, sports, industrial supplies, baby product, grocery, drugstore, home improvement, pc, shoes, automotive, digital ebook purchase, musical instruments, beauty, book, electronics, lawn and garden, apparel, home, video games, luggage, furniture, personal care appliances." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task618_amazonreview_summary_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task618_amazonreview_summary_text_generation.json new file mode 100644 index 000000000..b753b02cf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task618_amazonreview_summary_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given reviews from Amazon's products. Your task is to generate the Summary of the review." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet.json b/src/unitxt/catalog/instructions/natural_instructions/train/task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet.json new file mode 100644 index 000000000..66891e06a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task622_replace_alphabets_in_a_list_by_their_position_in_english_alphabet.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list A. You need to convert all the alphabets in the list with a number representing their position in the English alphabet. E.g., replace A by 1, B by 2, a by 1, b by 2, and so on." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task625_xlwic_true_or_false_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task625_xlwic_true_or_false_answer_generation.json new file mode 100644 index 000000000..fea89bacf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task625_xlwic_true_or_false_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a word, followed by two sentences. 
Your task is to figure out whether both the sentences use the aforementioned word with the same meaning. You should respond with 'True' if the words in both sentences share the same meaning, and 'False' otherwise." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task626_xlwic_sentence_based_on_given_word_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task626_xlwic_sentence_based_on_given_word_sentence_generation.json new file mode 100644 index 000000000..8d665fdf9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task626_xlwic_sentence_based_on_given_word_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a word. You should respond with a valid sentence which contains the given word. Make sure that the sentence is grammatically correct. You may use the word in a different tense than is given. For example, you may use the word 'ended' in the output where the given input word is 'end'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task627_xlwic_word_with_same_meaning_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task627_xlwic_word_with_same_meaning_sentence_generation.json new file mode 100644 index 000000000..a2cdb447d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task627_xlwic_word_with_same_meaning_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a word, followed by a sentence. You should respond with a valid sentence which contains the word with the same meaning as in the given sentence. For example, if the given sentence refers to a 'fly' as the insect, you should not respond with a sentence which uses 'fly' as the verb. You may use the word in a different tense than is given. 
For example, you may use the word 'ended' in the output where the given input word is 'end'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task628_xlwic_word_with_different_meaning_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task628_xlwic_word_with_different_meaning_sentence_generation.json new file mode 100644 index 000000000..701be9cbb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task628_xlwic_word_with_different_meaning_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a word, followed by a sentence. You should respond with a valid sentence which contains the word used with a different meaning than in the given sentence. For example, if the given sentence refers to a 'fly' as the insect, you may respond with a sentence which uses 'fly' as the verb; however, you may NOT respond with a sentence which uses 'fly' as the insect. You may use the word in a different tense than is given. For example, you may use the word 'ended' in the output where the given input word is 'end'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task629_dbpedia_14_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task629_dbpedia_14_classification.json new file mode 100644 index 000000000..3d1e98565 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task629_dbpedia_14_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text which is the body of a document. 
Your job is to classify the topic of the document into these categories: 1)Company, 2)Educational Institution, 3)Artist, 4)Athlete, 5)Office Holder, 6)Mean of transportation, 7)Building, 8)Natural place, 9)Village, 10)Animal, 11)Plant, 12)Album, 13)Film, 14)Written work. Your output should be the category number. Don't generate anything apart from numbers 1-14." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task630_dbpedia_14_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task630_dbpedia_14_classification.json new file mode 100644 index 000000000..4dfa037b9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task630_dbpedia_14_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a text which is the body of a document and a title which is the title of the document. Here the title is present in the document and it is the entity which is referred in the document. The title might have some text in parentheses, for example: \"HMS Mallow (K81)\", or be slightly different from what is present in the text. If they still refer to the same entity, then it is a correct title. Indicate your answer as \"Yes\" if the title is correct, otherwise indicate your answer as \"No\". Do not generate anything else apart from \"Yes\" or \"No\"" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task631_dbpedia_14_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task631_dbpedia_14_incorrect_answer_generation.json new file mode 100644 index 000000000..b9e09a5e2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task631_dbpedia_14_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a text and question. 
The question is about the topic of the document. You are expected to generate an incorrect answer. The incorrect answer should be among one of the following categories: 1)Company, 2)Educational Institution, 3)Artist, 4)Athlete, 5)Office holder, 6)Mean of transportation, 7)Building, 8)Natural place, 9)Village, 10)Animal, 11)Plant, 12)Album, 13)Film, 14)Written work" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task632_dbpedia_14_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task632_dbpedia_14_classification.json new file mode 100644 index 000000000..d9cd578d3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task632_dbpedia_14_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a text which is the body of the document. Indicate your answer as \"Yes\" if the text is about a person, otherwise indicate your answer as \"No\". Don't generate anything else apart from \"Yes\" or \"No\". Pay attention that for your answer to be \"Yes\", the passage should be generally about a person. Mentions of people in the text don't necessarily mean the text is about a person." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task633_dbpedia_14_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task633_dbpedia_14_answer_generation.json new file mode 100644 index 000000000..ffd268abb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task633_dbpedia_14_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a text which is the body of a document. You are given a question and options. Pick the correct number. Don't generate anything else apart from the numbers provided in options." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task636_extract_and_sort_unique_alphabets_in_a_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task636_extract_and_sort_unique_alphabets_in_a_list.json new file mode 100644 index 000000000..a066ea247 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task636_extract_and_sort_unique_alphabets_in_a_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list A comprising of numbers and alphabets. You need to extract and sort the unique alphabets in the list. The alphabets in the input list will only be in lowercase. Return -1 if there is no alphabet in the input list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task637_extract_and_sort_unique_digits_in_a_list.json b/src/unitxt/catalog/instructions/natural_instructions/train/task637_extract_and_sort_unique_digits_in_a_list.json new file mode 100644 index 000000000..ae6ebf3ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task637_extract_and_sort_unique_digits_in_a_list.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an input list A. You need to extract and sort the unique digits used in the list in ascending order. Return -1 if there is no digit in the list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task638_multi_woz_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task638_multi_woz_classification.json new file mode 100644 index 000000000..6b9dab378 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task638_multi_woz_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are shown a conversation between a user and system. 
Identify who has spoken the indicated sentence based on the conversation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task639_multi_woz_user_utterance_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task639_multi_woz_user_utterance_generation.json new file mode 100644 index 000000000..f12efa6ab --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task639_multi_woz_user_utterance_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are shown a random response (from a computer or a human). Generate a language query such that it leads to this reply." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task649_race_blank_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task649_race_blank_question_generation.json new file mode 100644 index 000000000..ddb254d0b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task649_race_blank_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given an article and an answer. Your task is to generate the fill-in-the-blank question for this answer based on the given article. The blanks are always at the end of the question, and can be filled with more than one word or phrase." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task664_mmmlu_answer_generation_abstract_algebra.json b/src/unitxt/catalog/instructions/natural_instructions/train/task664_mmmlu_answer_generation_abstract_algebra.json new file mode 100644 index 000000000..4ce9519b7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task664_mmmlu_answer_generation_abstract_algebra.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on abstract algebra. Abstract algebra is a branch of mathematics in which algebraic concepts are generalized by using symbols to represent basic arithmetical operations. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task665_mmmlu_answer_generation_anatomy.json b/src/unitxt/catalog/instructions/natural_instructions/train/task665_mmmlu_answer_generation_anatomy.json new file mode 100644 index 000000000..e1af67772 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task665_mmmlu_answer_generation_anatomy.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on anatomy. Anatomy is the science that studies the structure of the body. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task666_mmmlu_answer_generation_astronomy.json b/src/unitxt/catalog/instructions/natural_instructions/train/task666_mmmlu_answer_generation_astronomy.json new file mode 100644 index 000000000..45b29e351 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task666_mmmlu_answer_generation_astronomy.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on astronomy. Astronomy is a natural science that studies celestial objects and phenomena. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task667_mmmlu_answer_generation_business_ethics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task667_mmmlu_answer_generation_business_ethics.json new file mode 100644 index 000000000..bbd5a844d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task667_mmmlu_answer_generation_business_ethics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on business ethics. Business ethics is a form of applied ethics that examines ethical principles and moral or ethical problems that can arise in a business environment. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task668_extreme_abstract_summarization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task668_extreme_abstract_summarization.json new file mode 100644 index 000000000..de8aceb02 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task668_extreme_abstract_summarization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given the abstract of a research paper. Your task is to generate a summary of this abstract. Your summary should not be very short, but it's better if it's not more than 30 words." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task672_amazon_and_yelp_summarization_dataset_summarization.json b/src/unitxt/catalog/instructions/natural_instructions/train/task672_amazon_and_yelp_summarization_dataset_summarization.json new file mode 100644 index 000000000..95b02ab75 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task672_amazon_and_yelp_summarization_dataset_summarization.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a set of reviews from Amazon and Yelp. Your task is to generate a summary of a given set of reviews about the information present in reviews. This generated summary should reflect users' common opinions expressed in the reviews, the common sentiment of the opinions and their details, and should be coherent with the given set of reviews in terms of sentence and information structure. Avoid creating summaries that (i) contains additional information which is not present in reviews, (ii) look exactly like the review, and (iii) uses 5 or more same consecutive words or phrases given in the reviews." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task672_nummersense.json b/src/unitxt/catalog/instructions/natural_instructions/train/task672_nummersense.json new file mode 100644 index 000000000..5e48f6f92 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task672_nummersense.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, find the most appropriate number to replace the blank (indicated with _ ) and express it in words." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task673_google_wellformed_query_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task673_google_wellformed_query_classification.json new file mode 100644 index 000000000..0b0c7ff00 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task673_google_wellformed_query_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read the given query and classify it as a 'Good' or 'Bad' query depending on how well the query is formed, 'Bad' being the expected output for a not so well formed query and 'Good' being the expected output for a well formed query. A query may be wrong based on common sense or general facts, but if it is well formed, you should answer with Good." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task674_google_wellformed_query_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task674_google_wellformed_query_sentence_generation.json new file mode 100644 index 000000000..06c18342e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task674_google_wellformed_query_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a set of queries separated by '\n', and your job is to find out the query which is not a well-formed or well-structured query in terms of grammar, punctuations, or spelling errors." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task675_google_wellformed_query_sentence_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task675_google_wellformed_query_sentence_generation.json new file mode 100644 index 000000000..0874e8722 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task675_google_wellformed_query_sentence_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a list of queries separated by new line. Your job is to answer with the query that is the most well-formed or well-structured query in terms of grammar, punctuations, or spelling errors." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task679_hope_edi_english_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task679_hope_edi_english_text_classification.json new file mode 100644 index 000000000..13ebc1bd9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task679_hope_edi_english_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Classify the given comment into 'Hope Speech' or 'Not Hope Speech'. A hope speech is defined as content that is encouraging, positive or supportive contents and talks about equality, diversity or inclusion" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task681_hope_edi_malayalam_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task681_hope_edi_malayalam_text_classification.json new file mode 100644 index 000000000..d04e0d107 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task681_hope_edi_malayalam_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a comment text in Malayalam, classify the comment into one of these categories (i) Hope speech, (ii) Not Hope Speech or (iii) Not in Expected Language. 
A hope speech contains content that is encouraging, positive or supportive contents and talks about equality, diversity or inclusion" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task682_online_privacy_policy_text_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task682_online_privacy_policy_text_classification.json new file mode 100644 index 000000000..56a5f5061 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task682_online_privacy_policy_text_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a part of privacy policy text, classify it into one of these categories: \n (1) First Party Collection/Use (how and why a service provider collects user information), \n (2) Third Party Sharing/Collection (how user information may be shared with or collected by third parties), \n (3) User Choice/Control (choices and control options available to users), \n (4) User Access, Edit, & Deletion (if and how users may access, edit, or delete their information), \n (5) Data Retention (how long user information is stored), \n (6) Data Security (how user information is protected), \n (7) Policy Change (if and how users will be informed about changes to the privacy policy)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task683_online_privacy_policy_text_purpose_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task683_online_privacy_policy_text_purpose_answer_generation.json new file mode 100644 index 000000000..0a7812662 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task683_online_privacy_policy_text_purpose_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a part of privacy policy text, identify the purpose for which the user information is collected/used. 
The purpose should be given inside the policy text, answer as 'Not Specified' otherwise" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task684_online_privacy_policy_text_information_type_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task684_online_privacy_policy_text_information_type_generation.json new file mode 100644 index 000000000..f6605d06c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task684_online_privacy_policy_text_information_type_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a part of privacy policy text, identify the type of personal information which is collected, used, tracked or retained. The type of information should be present inside the given policy text, answer as 'Not Specified' otherwise" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task685_mmmlu_answer_generation_clinical_knowledge.json b/src/unitxt/catalog/instructions/natural_instructions/train/task685_mmmlu_answer_generation_clinical_knowledge.json new file mode 100644 index 000000000..3bb7b0910 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task685_mmmlu_answer_generation_clinical_knowledge.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on clinical knowledge. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task686_mmmlu_answer_generation_college_biology.json b/src/unitxt/catalog/instructions/natural_instructions/train/task686_mmmlu_answer_generation_college_biology.json new file mode 100644 index 000000000..e68d35602 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task686_mmmlu_answer_generation_college_biology.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on college biology. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task687_mmmlu_answer_generation_college_chemistry.json b/src/unitxt/catalog/instructions/natural_instructions/train/task687_mmmlu_answer_generation_college_chemistry.json new file mode 100644 index 000000000..51845de91 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task687_mmmlu_answer_generation_college_chemistry.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on college chemistry. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task688_mmmlu_answer_generation_college_computer_science.json b/src/unitxt/catalog/instructions/natural_instructions/train/task688_mmmlu_answer_generation_college_computer_science.json new file mode 100644 index 000000000..150b4632a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task688_mmmlu_answer_generation_college_computer_science.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on college computer science. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task689_mmmlu_answer_generation_college_mathematics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task689_mmmlu_answer_generation_college_mathematics.json new file mode 100644 index 000000000..395848865 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task689_mmmlu_answer_generation_college_mathematics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on college mathematics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task690_mmmlu_answer_generation_college_medicine.json b/src/unitxt/catalog/instructions/natural_instructions/train/task690_mmmlu_answer_generation_college_medicine.json new file mode 100644 index 000000000..ab667caea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task690_mmmlu_answer_generation_college_medicine.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on college medicine. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task691_mmmlu_answer_generation_college_physics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task691_mmmlu_answer_generation_college_physics.json new file mode 100644 index 000000000..f237a4d87 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task691_mmmlu_answer_generation_college_physics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on college physics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task692_mmmlu_answer_generation_computer_security.json b/src/unitxt/catalog/instructions/natural_instructions/train/task692_mmmlu_answer_generation_computer_security.json new file mode 100644 index 000000000..08fca9390 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task692_mmmlu_answer_generation_computer_security.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on computer security. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task693_mmmlu_answer_generation_conceptual_physics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task693_mmmlu_answer_generation_conceptual_physics.json new file mode 100644 index 000000000..57961d58b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task693_mmmlu_answer_generation_conceptual_physics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on conceptual physics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task694_mmmlu_answer_generation_econometrics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task694_mmmlu_answer_generation_econometrics.json new file mode 100644 index 000000000..9682ec0ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task694_mmmlu_answer_generation_econometrics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on econometrics. Econometrics is the application of statistical methods to economic data in order to give empirical content to economic relationships. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task695_mmmlu_answer_generation_electrical_engineering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task695_mmmlu_answer_generation_electrical_engineering.json new file mode 100644 index 000000000..c47d73d53 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task695_mmmlu_answer_generation_electrical_engineering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on electrical engineering. Electrical engineering is an engineering discipline concerned with the study, design and application of equipment, devices and systems which use electricity, electronics, and electromagnetism. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task696_mmmlu_answer_generation_elementary_mathematics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task696_mmmlu_answer_generation_elementary_mathematics.json new file mode 100644 index 000000000..af7639eee --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task696_mmmlu_answer_generation_elementary_mathematics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on elementary mathematics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task697_mmmlu_answer_generation_formal_logic.json b/src/unitxt/catalog/instructions/natural_instructions/train/task697_mmmlu_answer_generation_formal_logic.json new file mode 100644 index 000000000..9d88e6e42 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task697_mmmlu_answer_generation_formal_logic.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on formal logic. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task698_mmmlu_answer_generation_global_facts.json b/src/unitxt/catalog/instructions/natural_instructions/train/task698_mmmlu_answer_generation_global_facts.json new file mode 100644 index 000000000..ddb3cebc8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task698_mmmlu_answer_generation_global_facts.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on global facts. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task699_mmmlu_answer_generation_high_school_biology.json b/src/unitxt/catalog/instructions/natural_instructions/train/task699_mmmlu_answer_generation_high_school_biology.json new file mode 100644 index 000000000..8d60a6cfd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task699_mmmlu_answer_generation_high_school_biology.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school biology. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task700_mmmlu_answer_generation_high_school_chemistry.json b/src/unitxt/catalog/instructions/natural_instructions/train/task700_mmmlu_answer_generation_high_school_chemistry.json new file mode 100644 index 000000000..1169d40dc --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task700_mmmlu_answer_generation_high_school_chemistry.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school chemistry. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task701_mmmlu_answer_generation_high_school_computer_science.json b/src/unitxt/catalog/instructions/natural_instructions/train/task701_mmmlu_answer_generation_high_school_computer_science.json new file mode 100644 index 000000000..fa51a459f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task701_mmmlu_answer_generation_high_school_computer_science.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school computer science. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task702_mmmlu_answer_generation_high_school_european_history.json b/src/unitxt/catalog/instructions/natural_instructions/train/task702_mmmlu_answer_generation_high_school_european_history.json new file mode 100644 index 000000000..f7849f37e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task702_mmmlu_answer_generation_high_school_european_history.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on US high school level european history. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. The correct answer can be inferred from the information given in the question. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task703_mmmlu_answer_generation_high_school_geography.json b/src/unitxt/catalog/instructions/natural_instructions/train/task703_mmmlu_answer_generation_high_school_geography.json new file mode 100644 index 000000000..13c3fe53c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task703_mmmlu_answer_generation_high_school_geography.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school geography. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task704_mmmlu_answer_generation_high_school_government_and_politics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task704_mmmlu_answer_generation_high_school_government_and_politics.json new file mode 100644 index 000000000..aec459b09 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task704_mmmlu_answer_generation_high_school_government_and_politics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school government and politics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task705_mmmlu_answer_generation_high_school_macroeconomics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task705_mmmlu_answer_generation_high_school_macroeconomics.json new file mode 100644 index 000000000..fc2abe931 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task705_mmmlu_answer_generation_high_school_macroeconomics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school macroeconomics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task706_mmmlu_answer_generation_high_school_mathematics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task706_mmmlu_answer_generation_high_school_mathematics.json new file mode 100644 index 000000000..7b664542a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task706_mmmlu_answer_generation_high_school_mathematics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school mathematics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task707_mmmlu_answer_generation_high_school_microeconomics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task707_mmmlu_answer_generation_high_school_microeconomics.json new file mode 100644 index 000000000..e925d1d98 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task707_mmmlu_answer_generation_high_school_microeconomics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school microeconomics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task708_mmmlu_answer_generation_high_school_physics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task708_mmmlu_answer_generation_high_school_physics.json new file mode 100644 index 000000000..d6d028b1b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task708_mmmlu_answer_generation_high_school_physics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school physics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task709_mmmlu_answer_generation_high_school_psychology.json b/src/unitxt/catalog/instructions/natural_instructions/train/task709_mmmlu_answer_generation_high_school_psychology.json new file mode 100644 index 000000000..5e1583632 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task709_mmmlu_answer_generation_high_school_psychology.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school psychology. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task710_mmmlu_answer_generation_high_school_statistics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task710_mmmlu_answer_generation_high_school_statistics.json new file mode 100644 index 000000000..0bb958e44 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task710_mmmlu_answer_generation_high_school_statistics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school statistics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task711_mmmlu_answer_generation_high_school_us_history.json b/src/unitxt/catalog/instructions/natural_instructions/train/task711_mmmlu_answer_generation_high_school_us_history.json new file mode 100644 index 000000000..ffe24e1d6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task711_mmmlu_answer_generation_high_school_us_history.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school US history. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. The correct answer can be inferred from the information given in the question. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task712_mmmlu_answer_generation_high_school_world_history.json b/src/unitxt/catalog/instructions/natural_instructions/train/task712_mmmlu_answer_generation_high_school_world_history.json new file mode 100644 index 000000000..3e7253a40 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task712_mmmlu_answer_generation_high_school_world_history.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on high school world history. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. The correct answer can be inferred from the information given in the question. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task713_mmmlu_answer_generation_human_aging.json b/src/unitxt/catalog/instructions/natural_instructions/train/task713_mmmlu_answer_generation_human_aging.json new file mode 100644 index 000000000..8ca4eb3fd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task713_mmmlu_answer_generation_human_aging.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on human aging. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task714_mmmlu_answer_generation_human_sexuality.json b/src/unitxt/catalog/instructions/natural_instructions/train/task714_mmmlu_answer_generation_human_sexuality.json new file mode 100644 index 000000000..7437e7a32 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task714_mmmlu_answer_generation_human_sexuality.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on human sexuality. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task715_mmmlu_answer_generation_international_law.json b/src/unitxt/catalog/instructions/natural_instructions/train/task715_mmmlu_answer_generation_international_law.json new file mode 100644 index 000000000..b90695066 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task715_mmmlu_answer_generation_international_law.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on international law. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task716_mmmlu_answer_generation_jurisprudence.json b/src/unitxt/catalog/instructions/natural_instructions/train/task716_mmmlu_answer_generation_jurisprudence.json new file mode 100644 index 000000000..d8208c9ce --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task716_mmmlu_answer_generation_jurisprudence.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on jurisprudence. Jurisprudence is the theory or philosophy of law. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task717_mmmlu_answer_generation_logical_fallacies.json b/src/unitxt/catalog/instructions/natural_instructions/train/task717_mmmlu_answer_generation_logical_fallacies.json new file mode 100644 index 000000000..393c40259 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task717_mmmlu_answer_generation_logical_fallacies.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on logical fallacies. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task718_mmmlu_answer_generation_machine_learning.json b/src/unitxt/catalog/instructions/natural_instructions/train/task718_mmmlu_answer_generation_machine_learning.json new file mode 100644 index 000000000..046222a35 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task718_mmmlu_answer_generation_machine_learning.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on machine learning. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task719_mmmlu_answer_generation_management.json b/src/unitxt/catalog/instructions/natural_instructions/train/task719_mmmlu_answer_generation_management.json new file mode 100644 index 000000000..101027f49 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task719_mmmlu_answer_generation_management.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on management. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task720_mmmlu_answer_generation_marketing.json b/src/unitxt/catalog/instructions/natural_instructions/train/task720_mmmlu_answer_generation_marketing.json new file mode 100644 index 000000000..da8a8721b --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task720_mmmlu_answer_generation_marketing.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on marketing. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task721_mmmlu_answer_generation_medical_genetics.json b/src/unitxt/catalog/instructions/natural_instructions/train/task721_mmmlu_answer_generation_medical_genetics.json new file mode 100644 index 000000000..dd422ee83 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task721_mmmlu_answer_generation_medical_genetics.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on medical genetics. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task722_mmmlu_answer_generation_random_topic.json b/src/unitxt/catalog/instructions/natural_instructions/train/task722_mmmlu_answer_generation_random_topic.json new file mode 100644 index 000000000..ea49ca502 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task722_mmmlu_answer_generation_random_topic.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on a random topic. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task723_mmmlu_answer_generation_moral_disputes.json b/src/unitxt/catalog/instructions/natural_instructions/train/task723_mmmlu_answer_generation_moral_disputes.json new file mode 100644 index 000000000..cc3d95e71 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task723_mmmlu_answer_generation_moral_disputes.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on moral disputes. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task724_mmmlu_answer_generation_moral_scenarios.json b/src/unitxt/catalog/instructions/natural_instructions/train/task724_mmmlu_answer_generation_moral_scenarios.json new file mode 100644 index 000000000..5dd2a37fe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task724_mmmlu_answer_generation_moral_scenarios.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on moral scenarios. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task725_mmmlu_answer_generation_nutrition.json b/src/unitxt/catalog/instructions/natural_instructions/train/task725_mmmlu_answer_generation_nutrition.json new file mode 100644 index 000000000..cff3fcc50 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task725_mmmlu_answer_generation_nutrition.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on nutrition. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task726_mmmlu_answer_generation_philosophy.json b/src/unitxt/catalog/instructions/natural_instructions/train/task726_mmmlu_answer_generation_philosophy.json new file mode 100644 index 000000000..9e150fdc7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task726_mmmlu_answer_generation_philosophy.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on philosophy. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task727_mmmlu_answer_generation_prehistory.json b/src/unitxt/catalog/instructions/natural_instructions/train/task727_mmmlu_answer_generation_prehistory.json new file mode 100644 index 000000000..89f20b252 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task727_mmmlu_answer_generation_prehistory.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on prehistory. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task728_mmmlu_answer_generation_professional_accounting.json b/src/unitxt/catalog/instructions/natural_instructions/train/task728_mmmlu_answer_generation_professional_accounting.json new file mode 100644 index 000000000..7aba4c7c1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task728_mmmlu_answer_generation_professional_accounting.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on professional accounting. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task729_mmmlu_answer_generation_professional_law.json b/src/unitxt/catalog/instructions/natural_instructions/train/task729_mmmlu_answer_generation_professional_law.json new file mode 100644 index 000000000..a59940541 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task729_mmmlu_answer_generation_professional_law.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on professional law. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task730_mmmlu_answer_generation_professional_medicine.json b/src/unitxt/catalog/instructions/natural_instructions/train/task730_mmmlu_answer_generation_professional_medicine.json new file mode 100644 index 000000000..3a888db85 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task730_mmmlu_answer_generation_professional_medicine.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on professional medicine. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task731_mmmlu_answer_generation_professional_psychology.json b/src/unitxt/catalog/instructions/natural_instructions/train/task731_mmmlu_answer_generation_professional_psychology.json new file mode 100644 index 000000000..90218bc2e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task731_mmmlu_answer_generation_professional_psychology.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on professional psychology. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task732_mmmlu_answer_generation_public_relations.json b/src/unitxt/catalog/instructions/natural_instructions/train/task732_mmmlu_answer_generation_public_relations.json new file mode 100644 index 000000000..a45ed0b29 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task732_mmmlu_answer_generation_public_relations.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on public relations. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task733_mmmlu_answer_generation_security_studies.json b/src/unitxt/catalog/instructions/natural_instructions/train/task733_mmmlu_answer_generation_security_studies.json new file mode 100644 index 000000000..cc02b06a0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task733_mmmlu_answer_generation_security_studies.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on security studies. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task734_mmmlu_answer_generation_sociology.json b/src/unitxt/catalog/instructions/natural_instructions/train/task734_mmmlu_answer_generation_sociology.json new file mode 100644 index 000000000..66090a26a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task734_mmmlu_answer_generation_sociology.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on sociology. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task735_mmmlu_answer_generation_us_foreign_policy.json b/src/unitxt/catalog/instructions/natural_instructions/train/task735_mmmlu_answer_generation_us_foreign_policy.json new file mode 100644 index 000000000..758ed84b5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task735_mmmlu_answer_generation_us_foreign_policy.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on US foreign policy. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task736_mmmlu_answer_generation_virology.json b/src/unitxt/catalog/instructions/natural_instructions/train/task736_mmmlu_answer_generation_virology.json new file mode 100644 index 000000000..5a9f3e4cb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task736_mmmlu_answer_generation_virology.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on virology. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task737_mmmlu_answer_generation_world_religions.json b/src/unitxt/catalog/instructions/natural_instructions/train/task737_mmmlu_answer_generation_world_religions.json new file mode 100644 index 000000000..1e51f4e57 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task737_mmmlu_answer_generation_world_religions.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a question on world religions. You are also given 4 answer options (associated with \"A\", \"B\", \"C\", \"D\"), out of which only one is correct. You need to answer the question by selecting the correct option. You should only answer with the choice letter, not the whole answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task739_lhoestq_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task739_lhoestq_question_generation.json new file mode 100644 index 000000000..f026c54a9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task739_lhoestq_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given passages that contain mentions of names of people, places, or things. Some of these mentions refer to the same person, place, or thing. Your job is to write questions that evaluate one's understanding of such references. Good questions are expected to link pronouns (she, her, him, his, their, etc.) or other mentions to people, places, or things to which they may refer. \n Avoid questions that can be answered correctly without actually understanding the paragraph. Avoid questions that do not link phrases referring to the same entity. Avoid questions that have multiple answers. \n\n For each of your questions the answer should be one or more phrases in the paragraph. The answer for each question should be unambiguous. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task740_lhoestq_answer_generation_quantity.json b/src/unitxt/catalog/instructions/natural_instructions/train/task740_lhoestq_answer_generation_quantity.json new file mode 100644 index 000000000..9486106d6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task740_lhoestq_answer_generation_quantity.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given passages that contain mentions of the quantity of a particular object and are supposed to find out the answer for a given question. Craft one correct answer to the question given in input. 
Make sure your correct answer is consistent with the context, and properly gives the exact number relating to the query.\n In your answer, use as few words as possible from the given context. To be less repetitive, please vary your language for each question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task741_lhoestq_answer_generation_place.json b/src/unitxt/catalog/instructions/natural_instructions/train/task741_lhoestq_answer_generation_place.json new file mode 100644 index 000000000..726561ce8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task741_lhoestq_answer_generation_place.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given passages that contain mentions of places and we are supposed to find the answer to a given question. Craft one correct answer to the question given in input. Make sure your correct answer is consistent with the context, and properly gives the exact location where the query was performed.\n In your answer, use as few words as possible from the given context. To be less repetitive, please vary your language for each question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task742_lhoestq_answer_generation_frequency.json b/src/unitxt/catalog/instructions/natural_instructions/train/task742_lhoestq_answer_generation_frequency.json new file mode 100644 index 000000000..1cf7a370f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task742_lhoestq_answer_generation_frequency.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given passages that contain mentions of a time duration related query and we are supposed to write an answer to a question that involves event \"frequency\", which refers to how often an event is likely to be repeated.
For example, \"taking showers\" typically occurs ~5 times a week, \"going to Saturday market\" usually happens every few weeks/months, etc. \n Note that a lot of the questions could have more than one correct answer. We only need a single most-likely answer. Please try to keep your \"answer\" as simple as possible. Concise and simple \"answer\" is preferred over those complex and verbose ones. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task745_ai2_arithmetic_questions_arithmetic.json b/src/unitxt/catalog/instructions/natural_instructions/train/task745_ai2_arithmetic_questions_arithmetic.json new file mode 100644 index 000000000..d39f60cf7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task745_ai2_arithmetic_questions_arithmetic.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are provided with an arithmetic question. Your task is to compute the solution using the given arithmetic operations. The only arithmetic operators needed to answer the questions are '+' (addition) and '-' (subtraction). The answer should be correct to one decimal place." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task746_yelp_restaurant_review_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task746_yelp_restaurant_review_classification.json new file mode 100644 index 000000000..477f65fa9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task746_yelp_restaurant_review_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are provided with a user review of a restaurant. Your task is to classify the given review into two categories: 1) positive, and 2) negative based on its content."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task750_aqua_multiple_choice_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task750_aqua_multiple_choice_answering.json new file mode 100644 index 000000000..44a1c64a7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task750_aqua_multiple_choice_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to make use of mathematical concepts like probability, combinatorics, linear equations, sequences/series, or simple operators like addition, subtraction, division, or multiplication to answer the given question. Choose the best option from the 5 given options and report that option." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task751_svamp_subtraction_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task751_svamp_subtraction_question_answering.json new file mode 100644 index 000000000..bda68f046 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task751_svamp_subtraction_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to only use subtraction on the numbers embedded in the text to answer the following question and then only report the final numerical answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task752_svamp_multiplication_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task752_svamp_multiplication_question_answering.json new file mode 100644 index 000000000..01ef2bb8a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task752_svamp_multiplication_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to only use multiplication or division operators on the numbers embedded in the text to answer the following question and then only report the final numerical answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task753_svamp_addition_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task753_svamp_addition_question_answering.json new file mode 100644 index 000000000..263b70069 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task753_svamp_addition_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply an addition mathematical operator on the numbers embedded in the text to answer the following question and then only report the final numerical answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task754_svamp_common_division_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task754_svamp_common_division_question_answering.json new file mode 100644 index 000000000..e320dd30e --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task754_svamp_common_division_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply division mathematical operator on the numbers embedded in the text to answer the following question and then only report the final numerical answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists.json b/src/unitxt/catalog/instructions/natural_instructions/train/task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists.json new file mode 100644 index 000000000..d60a3b89d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task755_find_longest_substring_and_replace_its_sorted_lowercase_version_in_both_lists.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two strings A,B. You must perform the following operations to generate the required output list: (i) Find the longest common substring in the strings A and B, (ii) Convert this substring to all lowercase and sort it alphabetically, (iii) Replace the substring at its respective positions in the two lists with the updated substring." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task756_find_longert_substring_and_return_all_unique_alphabets_in_it.json b/src/unitxt/catalog/instructions/natural_instructions/train/task756_find_longert_substring_and_return_all_unique_alphabets_in_it.json new file mode 100644 index 000000000..0846ca9ae --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task756_find_longert_substring_and_return_all_unique_alphabets_in_it.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given two strings A,B. Find the longer of the two lists, convert it to lowercase, and return all the unique alphabets used in it. The two input strings are never equal." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task761_app_review_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task761_app_review_classification.json new file mode 100644 index 000000000..250993cd1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task761_app_review_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given an app review. Your task is to identify whether its sentiment is \"Positive\" or \"Negative\"." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task766_craigslist_bargains_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task766_craigslist_bargains_classification.json new file mode 100644 index 000000000..7c3c2338c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task766_craigslist_bargains_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a text passage as input consisting of dialogues of negotiations between a seller and a buyer about the sale of an item, the task is to classify the text into one of the labels from the two possible outputs - 'accepted'/'rejected'. Select [accepted] if by the end of the conversation the buyer seems likely to buy the item from the seller. A sale is likely made when the buyer and seller agree upon a common price or when a deal is made between them. Select [rejected] if the buyer did not seem interested in buying the item from the seller at the end of the conversation. This happens when the buyer and seller do not agree on the price or other aspects of the item being sold by the seller." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task767_craigslist_bargains_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task767_craigslist_bargains_classification.json new file mode 100644 index 000000000..3586b8d29 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task767_craigslist_bargains_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a text passage as input comprising of dialogue of negotiations between a seller and a buyer about the sale of an item, your task is to classify the item being sold into exactly one of these categories: 'housing', 'furniture', 'bike', 'phone', 'car', 'electronics'. 
The output should be the name of the category from the stated options and there should be exactly one category for the given text passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task770_pawsx_english_text_modification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task770_pawsx_english_text_modification.json new file mode 100644 index 000000000..59befbf91 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task770_pawsx_english_text_modification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence in English, provide an equivalent paraphrased version from the original that retains the same meaning." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task819_pec_sentiment_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task819_pec_sentiment_classification.json new file mode 100644 index 000000000..c6bb68e46 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task819_pec_sentiment_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a sentence in English, provide the sentiment based on its empathetic direction. There are two possible classifications: positive (happy) or negative (offmychest)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task820_protoqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task820_protoqa_answer_generation.json new file mode 100644 index 000000000..38a2105d1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task820_protoqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Write a correct answer for the question. You should reason about prototypical situations and provide the correct answer. 
Avoid answers that provide incomplete justification for the question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task821_protoqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task821_protoqa_question_generation.json new file mode 100644 index 000000000..72a526aef --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task821_protoqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Construct a question that every answer in the list is correct and reasonable for it." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task823_peixian_rtgender_sentiment_analysis.json b/src/unitxt/catalog/instructions/natural_instructions/train/task823_peixian_rtgender_sentiment_analysis.json new file mode 100644 index 000000000..9c21e41e6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task823_peixian_rtgender_sentiment_analysis.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a 'poster' sentence and a corresponding 'response' (often, from Facebook or Reddit), classify the sentiment of the given response into four categories: 1) Positive, 2) Negative, 3) Neutral, and 4) Mixed if it contains both positive and negative." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task833_poem_sentiment_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task833_poem_sentiment_classification.json new file mode 100644 index 000000000..37bf7981f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task833_poem_sentiment_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you need to identify the sentiment of the given sentence as one of 'positive' or 'negative'."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task834_mathdataset_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task834_mathdataset_classification.json new file mode 100644 index 000000000..efbb28ef9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task834_mathdataset_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are supposed to identify the category of a high-school level math question. There are five possible categories (1) algebra (2) arithmetic (3) measurement (4) numbers, and (5) probability. Use the following guidelines: (1) 'algebra' questions will typically contain letter variables and will ask you to find the value of a variable (2) 'arithmetic' questions will ask the sum, difference, multiplication, division, power, square root or value of expressions involving brackets (3) 'measurement' questions are questions that ask to convert a quantity from some unit to some other unit (4) 'numbers' questions will be about bases, remainders, divisors, GCD, LCM etc. (5) 'probability' questions will ask about the probability of the occurrence of something. A question must belong to only one category." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task835_mathdataset_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task835_mathdataset_answer_generation.json new file mode 100644 index 000000000..5fc0fbb03 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task835_mathdataset_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a simple high-school level math question, you are required to solve it and provide the final answer. The final answer is always a single number. 
These questions can range from a variety of topics like simple arithmetic, solving equations, converting a quantity from one unit to another, finding remainders/GCD/LCM, finding probabilities etc. Each question has only one correct answer. This answer can be a positive or negative integer, a fraction or a decimal number. If the answer is a negative number use the hyphen (e.g. -42) symbol for the minus sign. For decimal numbers, do not add extra zeros after the decimal point. For fractional numbers, separate the numerator and denominator using a forward slash (e.g. 3/25)." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task843_financial_phrasebank_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task843_financial_phrasebank_classification.json new file mode 100644 index 000000000..56a909e9a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task843_financial_phrasebank_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Classify the given piece of financial news into three classes: positive, negative, and neutral. Output must be 'positive', 'negative', or 'neutral'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task844_financial_phrasebank_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task844_financial_phrasebank_classification.json new file mode 100644 index 000000000..bc6f58b43 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task844_financial_phrasebank_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a piece of financial news and its polarity, classify it into 'true' if the polarity is correct and classify into 'false' if the polarity is incorrect. Output must be 'true' or 'false'.
" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task845_pubmedqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task845_pubmedqa_question_generation.json new file mode 100644 index 000000000..7aa19adbf --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task845_pubmedqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a passage with a context and an answer, construct a question on the basis of the information present in the passage. Construct the question in such a way that (i) it is unambiguous, (ii) it is answerable from the passage, (iii) its answer is unique (iv) its answer uses text phrases from the passage. Avoid creating questions that (i) can't be answered correctly without actually understanding the passage and (ii) uses the same words or phrases given in the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task846_pubmedqa_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task846_pubmedqa_classification.json new file mode 100644 index 000000000..6218c96c5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task846_pubmedqa_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a passage with a question and an answer to that question, classify if the answer actually answers the question into 'yes' or 'no'. Output 'yes' if the answer answers the question and output 'no' if the answer does not answer the question."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task847_pubmedqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task847_pubmedqa_question_generation.json new file mode 100644 index 000000000..0853278d8 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task847_pubmedqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a passage, construct a question on the basis of the information present in the passage. Construct the question in such a way that (i) it is unambiguous, (ii) it is answerable from the passage, (iii) its answer is unique (iv) its answer uses text phrases from the passage. Avoid creating questions that (i) can't be answered correctly without actually understanding the passage and (ii) uses the same words or phrases given in the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task848_pubmedqa_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task848_pubmedqa_classification.json new file mode 100644 index 000000000..f2ed8e826 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task848_pubmedqa_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a passage classify if the passage has a definite objective/aim/goal or not. Output '1' if the passage has a definite objective/aim/goal and output '0' if the passage does not have a definite objective/aim/goal."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task849_pubmedqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task849_pubmedqa_answer_generation.json new file mode 100644 index 000000000..55e1ecab2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task849_pubmedqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a passage which has a question and the context. You have to generate an answer to the question based on the information present in the context." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task850_synthetic_longest_palindrome.json b/src/unitxt/catalog/instructions/natural_instructions/train/task850_synthetic_longest_palindrome.json new file mode 100644 index 000000000..a3de7b85d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task850_synthetic_longest_palindrome.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a string and you should find the longest substring that is a palindrome. A palindrome is a string that is the same backwards as it is forwards. If the shortest possible palindrome is length 1 you should return the first character." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task851_synthetic_multiply_evens.json b/src/unitxt/catalog/instructions/natural_instructions/train/task851_synthetic_multiply_evens.json new file mode 100644 index 000000000..50b778c0f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task851_synthetic_multiply_evens.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list, of lists, of integers. 
For every inner list contained in the input list, you should multiply every even number in that list. The output should be a list of integers with the same length as the number of lists in the input list. If there are no even numbers in an inner list you should output 0 for that list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task852_synthetic_multiply_odds.json b/src/unitxt/catalog/instructions/natural_instructions/train/task852_synthetic_multiply_odds.json new file mode 100644 index 000000000..4bb5ca1b4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task852_synthetic_multiply_odds.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task you will be given a list, of lists, of integers. For every inner list contained in the input list, you should multiply every odd number in that list. The output should be a list of integers with the same length as the number of lists in the input list. If there are no odd numbers in an inner list you should output 0 for that list." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task853_hippocorpus_long_text_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task853_hippocorpus_long_text_generation.json new file mode 100644 index 000000000..e258edece --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task853_hippocorpus_long_text_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read the given summary of events, and write a longer story which covers everything described in the summary. The story you write should be longer than the summary you read, but should not repeat itself. The story should be made up of sentences which form a cohesive and logical sequence of events, and should be long enough to fill two or more paragraphs. 
Do not omit any details which were given by the summary. Make the story such that the summary is an accurate characterization of the paragraphs you write. Adding extra details in your story which are not mentioned in the summary is okay as long as they don't contradict anything in the summary." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task854_hippocorpus_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task854_hippocorpus_classification.json new file mode 100644 index 000000000..38218cf79 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task854_hippocorpus_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read the given story and classify it as 'imagined', 'recalled', or 'retold'. If a story is imagined, the person who wrote the story is making it up, pretending they experienced it. If a story is recalled, the person who wrote the story really experienced it and is recalling it from memory. If a story is retold, it is a real memory like the 'recalled' stories, but written down much later after previously writing a 'recalled' story about the same events. So, recalled stories and retold stories will be fairly similar, in that they both were real experiences for the writer. Imagined stories have a more linear flow and contain more commonsense knowledge, whereas recalled stories are less connected and contain more specific concrete events. Additionally, higher levels of self reference are found in imagined stories. Between recalled and retold stories, retold stories flow significantly more linearly than recalled stories, and retold stories are significantly higher in scores for cognitive processes and positive tone." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task855_conv_ai_2_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task855_conv_ai_2_classification.json new file mode 100644 index 000000000..9ffe9ee6c --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task855_conv_ai_2_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read an exchange between SENDER A and SENDER B, and answer whether SENDER A is a 'Bot' or a 'Human'. There are only a maximum of two senders (A and B) per conversation, and there are no conversations where SENDER A and SENDER B are both bots, or both humans; only one sender per conversation can be a bot, and only one can be a human. Knowing this, need only to classify whether SENDER A is 'Human' or 'Bot'; you do not need to write anything about SENDER B. Typically, bots will have a more disjointed manner of speaking, and will make statements that don't relate to each other, don't make coherent sense, or otherwise appear unnatural. Humans will make statements in a more or less coherent and logical way, potentially including asking the bot why the bot is not making sense or contradicting itself." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task856_conv_ai_2_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task856_conv_ai_2_classification.json new file mode 100644 index 000000000..0dbc4a3dd --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task856_conv_ai_2_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Read the given message of a sender that is intended to start a conversation, and determine whether it was written by a 'Bot' or by a 'Human'. 
Typically, bots will have a more disjointed manner of speaking, and will make statements that don't relate to each other, don't make coherent sense, or otherwise appear unnatural. Humans will make statements in a more or less coherent and logical way. Since these messages are supposed to be conversation openers, humans will generally start sensibly with a hello or an introduction. Humans may also ask why the other person is not responding. Bots, however, may act as if they are in the middle of a nonsensical conversation." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task857_inquisitive_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task857_inquisitive_question_generation.json new file mode 100644 index 000000000..151cc79d4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task857_inquisitive_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Write an inquisitive question about a specific text span in a given sentence such that the answer is not in the text." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task858_inquisitive_span_detection.json b/src/unitxt/catalog/instructions/natural_instructions/train/task858_inquisitive_span_detection.json new file mode 100644 index 000000000..0282b331d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task858_inquisitive_span_detection.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Indicate a text span in the passage about which an inquisitive question is asked. (note, don't answer the question)."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task859_prost_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task859_prost_question_generation.json new file mode 100644 index 000000000..82e916a8d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task859_prost_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Formulate questions about the information mentioned in a given passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task860_prost_mcq_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task860_prost_mcq_generation.json new file mode 100644 index 000000000..212959ec5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task860_prost_mcq_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Creating a multiple-choice question from the given context and a 'group' which indicate the focus of the question. The question must come first, separated by from the candidate answers. The answer to the question does not have to exist in the context." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task861_asdiv_addsub_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task861_asdiv_addsub_question_answering.json new file mode 100644 index 000000000..fcc6363a1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task861_asdiv_addsub_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a math word problem, answer the following question. You might need to apply addition or subtraction mathematical operators on the numbers embedded in the text to answer the question and then only report the final numerical answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task861_prost_mcq_answers_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task861_prost_mcq_answers_generation.json new file mode 100644 index 000000000..14adc8829 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task861_prost_mcq_answers_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is about reading the given context, group and MCQs and then generating answers from the given input. MCQs are multiple choice questions in which a question is asked and few options are given, among which one or in some cases more than one can be the answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task862_asdiv_multidiv_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task862_asdiv_multidiv_question_answering.json new file mode 100644 index 000000000..52f26fe34 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task862_asdiv_multidiv_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply multiple mathematical operators like addition, subtraction, multiplication or division on the numbers embedded in the text to answer the following question and then only report the final numerical answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task863_asdiv_multiop_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task863_asdiv_multiop_question_answering.json new file mode 100644 index 000000000..175534b8a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task863_asdiv_multiop_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply multiple mathematical operators like addition, subtraction, multiplication, or division on the numbers embedded in the text to answer the following question and then only report the final numerical answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task864_asdiv_singleop_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task864_asdiv_singleop_question_answering.json new file mode 100644 index 000000000..45bf57577 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task864_asdiv_singleop_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply a single mathematical operator like addition, subtraction, multiplication, or division on the numbers embedded in the text to answer the following question and then only report the final numerical answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task865_mawps_addsub_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task865_mawps_addsub_question_answering.json new file mode 100644 index 000000000..e64589bd7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task865_mawps_addsub_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply addition or subtraction mathematical operators on the numbers embedded in the text to answer the following question and then only report the final numerical answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task866_mawps_multidiv_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task866_mawps_multidiv_question_answering.json new file mode 100644 index 000000000..e5d85ea3d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task866_mawps_multidiv_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply multiplication or division mathematical operators on the numbers embedded in the text to answer the following question and then only report the final numerical answer." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task867_mawps_multiop_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task867_mawps_multiop_question_answering.json new file mode 100644 index 000000000..52f26fe34 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task867_mawps_multiop_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply multiple mathematical operators like addition, subtraction, multiplication or division on the numbers embedded in the text to answer the following question and then only report the final numerical answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task868_cfq_mcd1_explanation_to_sql.json b/src/unitxt/catalog/instructions/natural_instructions/train/task868_cfq_mcd1_explanation_to_sql.json new file mode 100644 index 000000000..1e7f67041 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task868_cfq_mcd1_explanation_to_sql.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "For the given English description, write an SQL command such that it accomplishes every step. An SQL query works by selecting data from a table where certain conditions apply. A table contains columns where every row in that table must have a value for each column. Every table has a primary key that uniquely identifies each row, usually an id. To choose which columns are returned you specify that after the \"SELECT\" statement. Next, you use a \"FROM\" statement to specify what tables you want to select the data from. When you specify a table you can rename it with the \"AS\" statement. You can reference that table by whatever name follows the \"AS\" statement. If you want to select data from multiple tables you need to use the \"JOIN\" statement. 
This will join the tables together by pairing a row in one table with every row in the other table (Cartesian Product). To limit the number of rows returned you should use the \"ON\" statement. This will only return rows where the condition specified after the statement is true, this is usually an equals operator with primary keys. You can also use the \"WHERE\" statement to specify that only rows with column values satisfying a certain condition, should be returned. The \"GROUP BY\" statement will group rows together that have equal column values for whatever columns follow the statement. The \"HAVING\" statement will return groups that satisfy whatever condition follows the statement. Any column(s) being returned from grouped rows must either be an aggregate function, (AVG, MAX, COUNT, SUM, ...) of a column, or the column(s) that the data was grouped by. To sort the returned data you can use the \"ORDER BY\" command which will order the data by whatever aggregate function or column follows the statement. The \"DESC\" statement will sort in descending order and the \"ASC\" statement will sort in ascending order. Finally, you can use the \"LIMIT\" statement to return a certain number of rows. When \"*\" is used in an SQL statement every column is returned. For example, SELECT * FROM table WHERE attribute = 1, will select every column from rows with the attribute column equal to 1."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task868_mawps_singleop_question_answering.json b/src/unitxt/catalog/instructions/natural_instructions/train/task868_mawps_singleop_question_answering.json new file mode 100644 index 000000000..8d3b632a9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task868_mawps_singleop_question_answering.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a math word problem and you are supposed to apply a single mathematical operator like addition, subtraction, multiplication or division on the numbers embedded in the text to answer the following question and then only report the final numerical answer." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task869_cfq_mcd1_sql_to_explanation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task869_cfq_mcd1_sql_to_explanation.json new file mode 100644 index 000000000..5893c8dfb --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task869_cfq_mcd1_sql_to_explanation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Determine if the provided SQL statement properly addresses the given question. Output 1 if the SQL statement is correct and 0 otherwise. An SQL query works by selecting data from a table where certain conditions apply. A table contains columns where every row in that table must have a value for each column. Every table has a primary key that uniquely identifies each row, usually an id. To choose which columns are returned you specify that after the \"SELECT\" statement. Next, you use a \"FROM\" statement to specify what tables you want to select the data from. When you specify a table you can rename it with the \"AS\" statement. You can reference that table by whatever name follows the \"AS\" statement.
If you want to select data from multiple tables you need to use the \"JOIN\" statement. This will join the tables together by pairing a row in one table with every row in the other table (Cartesian Product). To limit the number of rows returned you should use the \"ON\" statement. This will only return rows where the condition specified after the statement is true, this is usually an equals operator with primary keys. You can also use the \"WHERE\" statement to specify that only rows with column values satisfying a certain condition, should be returned. The \"GROUP BY\" statement will group rows together that have equal column values for whatever columns follow the statement. The \"HAVING\" statement will return groups that satisfy whatever condition follows the statement. Any column(s) being returned from grouped rows must either be an aggregate function, (AVG, MAX, COUNT, SUM, ...) of a column, or the column(s) that the data was grouped by. To sort the returned data you can use the \"ORDER BY\" command which will order the data by whatever aggregate function or column follows the statement. The \"DESC\" statement will sort in descending order and the \"ASC\" statement will sort in ascending order. Finally, you can use the \"LIMIT\" statement to return a certain number of rows. When \"*\" is used in an SQL statement every column is returned. For example, SELECT * FROM table WHERE attribute = 1, will select every column from rows with the attribute column equal to 1."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task870_msmarco_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task870_msmarco_answer_generation.json new file mode 100644 index 000000000..89853ce71 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task870_msmarco_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a passage and a query based on the passage, generate an unambiguous, concise and simple answer to the query from information in the passage. Note that the answer may not be present in exact form." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task871_msmarco_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task871_msmarco_question_generation.json new file mode 100644 index 000000000..051344367 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task871_msmarco_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Write a phrase, the answer to which is present in the passage. The answer to this question should be completely and unambiguously found in the passage. The query must be about a single or multiple linked entities. " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task874_opus_xhosanavy_sr.json b/src/unitxt/catalog/instructions/natural_instructions/train/task874_opus_xhosanavy_sr.json new file mode 100644 index 000000000..b8becff42 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task874_opus_xhosanavy_sr.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence. You must find the primary subject in the supplied sentence. The output must be a sub-sequence in the sentence." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task875_emotion_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task875_emotion_classification.json new file mode 100644 index 000000000..652c9f307 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task875_emotion_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a sentence containing a particular emotion. You must classify the sentence into one of the six emotions: 'sadness', 'joy', 'love', 'anger', 'fear', or 'surprise'." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task886_quail_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task886_quail_question_generation.json new file mode 100644 index 000000000..2137e2970 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task886_quail_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Write a question from the passage such that it identifies a character (a person or a thing) in the passage." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task887_quail_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task887_quail_answer_generation.json new file mode 100644 index 000000000..cb283a641 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task887_quail_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Write the right answer to the question based on the context passage."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task888_reviews_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task888_reviews_classification.json new file mode 100644 index 000000000..9eb90cbd1 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task888_reviews_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Classify the given movie review into two categories: positive or negative, based on its content." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task889_goemotions_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task889_goemotions_classification.json new file mode 100644 index 000000000..bfccfb3f2 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task889_goemotions_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Categorize the following sentence into one of the five different emotions: anger, confusion, joy, sadness and neutral." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task897_freebase_qa_topic_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task897_freebase_qa_topic_question_generation.json new file mode 100644 index 000000000..649fd6e53 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task897_freebase_qa_topic_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given an open-ended topic (movie name, a person's name, an event, sports, etc.), generate a simple trivia-type question."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task898_freebase_qa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task898_freebase_qa_answer_generation.json new file mode 100644 index 000000000..d2bfe40e0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task898_freebase_qa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a trivia question, precisely answer the question with a word/phrase/name. External resources such as Wikipedia could be used to obtain the facts." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task899_freebase_qa_topic_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task899_freebase_qa_topic_generation.json new file mode 100644 index 000000000..5ccc1b0f9 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task899_freebase_qa_topic_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a factoid/trivia type question, generate the topic of the question. The topic is the entity the question talks about."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task900_freebase_qa_category_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task900_freebase_qa_category_classification.json new file mode 100644 index 000000000..3aafb73ea --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task900_freebase_qa_category_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a trivia question, classify broad topical category from this list: 'theater', 'geology', 'book', 'tv', 'astronomy', 'aviation', 'military', 'government', 'boxing', 'projects', 'metropolitan_transit', 'law', 'venture_capital', 'broadcast', 'biology', 'people', 'influence', 'baseball', 'spaceflight', 'media_common', 'cvg', 'opera', 'olympics', 'chemistry', 'visual_art', 'conferences', 'sports', 'language', 'travel', 'location', 'award', 'dining', 'martial_arts', 'comic_strips', 'computer', 'user', 'tennis', 'music', 'organization', 'food', 'event', 'transportation', 'fictional_universe', 'measurement_unit', 'meteorology', 'distilled_spirits', 'symbols', 'architecture', 'freebase', 'internet', 'fashion', 'boats', 'cricket', 'film', 'medicine', 'finance', 'comic_books', 'celebrities', 'soccer', 'games', 'time', 'geography', 'interests', 'common', 'base', 'business', 'periodicals', 'royalty', 'education', 'type', 'religion', 'automotive', 'exhibitions'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task901_freebase_qa_category_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task901_freebase_qa_category_question_generation.json new file mode 100644 index 000000000..59bc6191f --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task901_freebase_qa_category_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a broad category, generate a trivia-type question based on a specific entity in that category. The question should be non-ambiguous. External resources such as Wikipedia could be used to obtain the facts." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task902_deceptive_opinion_spam_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task902_deceptive_opinion_spam_classification.json new file mode 100644 index 000000000..dde39bc61 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task902_deceptive_opinion_spam_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Classify the given hotel review based on the sentiment it expresses into two classes: negative and positive." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task903_deceptive_opinion_spam_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task903_deceptive_opinion_spam_classification.json new file mode 100644 index 000000000..d64fea778 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task903_deceptive_opinion_spam_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a hotel review and the corresponding polarity of review (i.e., Negative or Positive) identify if the polarity is correct. 
Write 'true' if it's correct, 'false' otherwise." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task904_hate_speech_offensive_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task904_hate_speech_offensive_classification.json new file mode 100644 index 000000000..8d5095157 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task904_hate_speech_offensive_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Classify the given tweet into the three categories: (1) 'Hate Speech', (2) 'Offensive' and (3) 'Neither'. 'Hate Speech' is a kind of threatening statement or sometimes includes a call for violence, while an 'offensive' statement just offends someone. 'Neither' is when it doesn't fall into Hate Speech or Offensive category." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task905_hate_speech_offensive_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task905_hate_speech_offensive_classification.json new file mode 100644 index 000000000..fdb2471ca --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task905_hate_speech_offensive_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a text of the tweet and a corresponding label whether this tweet is 'Offensive', 'Hate Speech' or 'Neither'. Your job is to identify if the label is correct. Generate label 'true' if it's correct, 'false' otherwise."
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task906_dialogre_identify_names.json b/src/unitxt/catalog/instructions/natural_instructions/train/task906_dialogre_identify_names.json new file mode 100644 index 000000000..bd59a53d5 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task906_dialogre_identify_names.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a dialog between 2 or more individuals. Within the dialog, there will be clues as to the names of the speakers. You will be asked at the end of the dialog to identify the name of one of the speakers." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task907_dialogre_identify_relationships.json b/src/unitxt/catalog/instructions/natural_instructions/train/task907_dialogre_identify_relationships.json new file mode 100644 index 000000000..644988511 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task907_dialogre_identify_relationships.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a dialog between 2 or more individuals. Within the dialog, there will be clues that indicate two individuals were or are dating. You will be prompted at the end to answer which Speaker (or named individual) is dating which other Speaker (or named individual)." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task908_dialogre_identify_familial_relationships.json b/src/unitxt/catalog/instructions/natural_instructions/train/task908_dialogre_identify_familial_relationships.json new file mode 100644 index 000000000..6d5268269 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task908_dialogre_identify_familial_relationships.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a dialog between 2 or more individuals. The dialog will include information as to the relationship between 2 of the participants. At the end, you will be asked to provide an answer as to the relationship of those 2 participants. In this scenario, '0' will represent a spousal relationship, '1' will represent siblings, and '2' will represent a child/parent relationship." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task909_dialogre_prevalent_speakers.json b/src/unitxt/catalog/instructions/natural_instructions/train/task909_dialogre_prevalent_speakers.json new file mode 100644 index 000000000..e64bf32d7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task909_dialogre_prevalent_speakers.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a dialog between 2 or more individuals. You need to generate the number of the speaker (e.g. 1 for Speaker 1) who had the most lines in the dialog. If there is a tie, output the answer '0'." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task917_coqa_question_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task917_coqa_question_generation.json new file mode 100644 index 000000000..915fb8db0 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task917_coqa_question_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task is about reading the given passage and construct a question about the information present in the passage. Construct a question in such a way that (i) it is unambiguous, (ii) it is answerable from the passage, (iii) the answer is unique, (iv) its answer is a continous text span from the paragraph. Avoid creating questions that (i) can be answered correctly without actually understanding the paragraph and (ii) uses same words or phrases given in the passage " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task918_coqa_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task918_coqa_answer_generation.json new file mode 100644 index 000000000..910c15895 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task918_coqa_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "The task is about reading the given story and question, then finding an answer to the given question. Based on the passage provided and the given question, you should identify the shortest continuous text span from the passage that serves as an answer to the given question. Avoid answers that are incorrect or provides incomplete justification for the question." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task919_coqa_incorrect_answer_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task919_coqa_incorrect_answer_generation.json new file mode 100644 index 000000000..ca00f7302 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task919_coqa_incorrect_answer_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task is about reading the given passage and the question, return an incorrect answer to the given question." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task921_code_x_glue_information_retreival.json b/src/unitxt/catalog/instructions/natural_instructions/train/task921_code_x_glue_information_retreival.json new file mode 100644 index 000000000..32d5138d7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task921_code_x_glue_information_retreival.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "This task is to find the number of 'For' loops present in the given cpp program." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task922_event2mind_word_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task922_event2mind_word_generation.json new file mode 100644 index 000000000..c6d899cfe --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task922_event2mind_word_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are provided with an \"Event\", \"Intent\" related to PersonX. Guess a reaction/reaction of PersonX about the given event and their intention." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task923_event2mind_classifier.json b/src/unitxt/catalog/instructions/natural_instructions/train/task923_event2mind_classifier.json new file mode 100644 index 000000000..7feae459d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task923_event2mind_classifier.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are provided with an \"Event\" and it's \"Intent\" related to PersonX. Determine the sentiment value of the given input as either \"Positive\", \"Negative\", and \"Unknown\". " +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task924_event2mind_word_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task924_event2mind_word_generation.json new file mode 100644 index 000000000..ca7aa12e7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task924_event2mind_word_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are provided with an \"Event\", \"Intent\" and \"XEmotion\" (PersonX's reactions for the given \"Event\"). Indicate PersonY's reaction (person feels) at the end of this event. Provide one reaction for PersonY. If there's nothing that can be implied, respond as None" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task925_coached_conv_pref_classifier.json b/src/unitxt/catalog/instructions/natural_instructions/train/task925_coached_conv_pref_classifier.json new file mode 100644 index 000000000..1abffdae7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task925_coached_conv_pref_classifier.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are provided with a list of converations between a \"USER\" and \"ASSISTANT\". 
Figure out if the conversation provided as \"classify_text\" is authored by \"USER\" or \"ASSISTANT\". There are maximum of 7 conversations between \"USER\" and \"ASSISTANT\" in each input" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task926_coached_conv_pref_word_generation.json b/src/unitxt/catalog/instructions/natural_instructions/train/task926_coached_conv_pref_word_generation.json new file mode 100644 index 000000000..54e5b4e6a --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task926_coached_conv_pref_word_generation.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Find the movie name from the given conversation. If the movie name is not found give output as \"unknown\"" +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task927_yelp_negative_to_positive_style_transfer.json b/src/unitxt/catalog/instructions/natural_instructions/train/task927_yelp_negative_to_positive_style_transfer.json new file mode 100644 index 000000000..03091156d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task927_yelp_negative_to_positive_style_transfer.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a negative review and your task is to convert it to a positive review by one or more making minimal changes. Avoid changing the context of the review." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task928_yelp_positive_to_negative_style_transfer.json b/src/unitxt/catalog/instructions/natural_instructions/train/task928_yelp_positive_to_negative_style_transfer.json new file mode 100644 index 000000000..824ee9e80 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task928_yelp_positive_to_negative_style_transfer.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you are given a positive review and your task is to convert it to a negative review by making minimal changes. Avoid changing the context of the review." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task929_products_reviews_classification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task929_products_reviews_classification.json new file mode 100644 index 000000000..981f09479 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task929_products_reviews_classification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given an English language product review, determine if it is a Good Review or a Bad Review. A good review is one where the product's review has positive tone and Bad review is one where the tone of product's review is negative." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task933_wiki_auto_style_transfer.json b/src/unitxt/catalog/instructions/natural_instructions/train/task933_wiki_auto_style_transfer.json new file mode 100644 index 000000000..34dddb3c6 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task933_wiki_auto_style_transfer.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, we ask you to rewrite a sentence in simple English without changing its general meaning. 
Essentially, you want to make the sentence easier to read by using simpler words, utilizing more straightforward sentence structures, and omitting non-essential information etc." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task934_turk_simplification.json b/src/unitxt/catalog/instructions/natural_instructions/train/task934_turk_simplification.json new file mode 100644 index 000000000..54611b382 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task934_turk_simplification.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, you're given a sentence and your task is to generate a simplified sentence that focuses on lexical paraphrasing from the original sentence given in the input." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task955_wiki_auto_style_transfer.json b/src/unitxt/catalog/instructions/natural_instructions/train/task955_wiki_auto_style_transfer.json new file mode 100644 index 000000000..dc97c8db3 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task955_wiki_auto_style_transfer.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "In this task, we ask you to elaborate the sentence without changing its general meaning. You can do so by explaining further the input sentence, using more precise wording, adding qualifiers and auxiliary information etc." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task956_leetcode_420_strong_password_check.json b/src/unitxt/catalog/instructions/natural_instructions/train/task956_leetcode_420_strong_password_check.json new file mode 100644 index 000000000..d1adc70b7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task956_leetcode_420_strong_password_check.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given a password and you need to generate the number of steps required to convert the given password to a strong password. A password is considered strong if (a) it has at least 6 characters and at most 20 characters; (b) it contains at least one lowercase letter and one uppercase letter, and at least one digit; (c) it does not contain three repeating characters in a row. In one step you can: (1) Insert one character to password, (2) delete one character from password, or (3) replace one character of password with another character." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task963_librispeech_asr_next_word_prediction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task963_librispeech_asr_next_word_prediction.json new file mode 100644 index 000000000..4b9c10cb4 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task963_librispeech_asr_next_word_prediction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Predict the next word given an incomplete English Sentence." 
+} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task964_librispeech_asr_text_auto_completion.json b/src/unitxt/catalog/instructions/natural_instructions/train/task964_librispeech_asr_text_auto_completion.json new file mode 100644 index 000000000..54b60146d --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task964_librispeech_asr_text_auto_completion.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an unfinished English sentence, and you need to predict the rest of it." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task965_librispeech_asr_missing_word_prediction.json b/src/unitxt/catalog/instructions/natural_instructions/train/task965_librispeech_asr_missing_word_prediction.json new file mode 100644 index 000000000..35592db49 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task965_librispeech_asr_missing_word_prediction.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "You are given an English sentence with a blank, and you need to predict the missing word. After completing, the whole sentence should be gramatically correct and non-ambiguous." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task966_ruletaker_fact_checking_based_on_given_context.json b/src/unitxt/catalog/instructions/natural_instructions/train/task966_ruletaker_fact_checking_based_on_given_context.json new file mode 100644 index 000000000..8e019cac7 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task966_ruletaker_fact_checking_based_on_given_context.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a text paragraph and a fact, generate 'True' if the fact can be inferred/concluded from the paragraph, otherwise generate 'False'. 
The input passage contains as set of logical statements so the fact can be marked either 'True' or 'False' if the relavant info regarding the fact is present in the given passage. If the Fact can't be marked True or False from the given paragraph, mark it as False. Don't use knowledge outside the given paragraph to check the fact." +} \ No newline at end of file diff --git a/src/unitxt/catalog/instructions/natural_instructions/train/task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph.json b/src/unitxt/catalog/instructions/natural_instructions/train/task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph.json new file mode 100644 index 000000000..3f87bba90 --- /dev/null +++ b/src/unitxt/catalog/instructions/natural_instructions/train/task967_ruletaker_incorrect_fact_generation_based_on_given_paragraph.json @@ -0,0 +1,4 @@ +{ + "type": "textual_instruction", + "text": "Given a text paragraph and a fact, generate a statement that is using the content of the given paragraph yet, it is **incorrect** (i.e., it contradicts the statements of the input)." 
+}
\ No newline at end of file
diff --git a/src/unitxt/catalog/templates/input_output.json b/src/unitxt/catalog/templates/input_output.json
new file mode 100644
index 000000000..ced50c912
--- /dev/null
+++ b/src/unitxt/catalog/templates/input_output.json
@@ -0,0 +1,5 @@
+{
+    "type": "input_output_template",
+    "input_format": "{input}",
+    "output_format": "{target}"
+}
\ No newline at end of file
diff --git a/src/unitxt/loaders.py b/src/unitxt/loaders.py
index db15c69e1..34a614350 100644
--- a/src/unitxt/loaders.py
+++ b/src/unitxt/loaders.py
@@ -36,12 +36,27 @@ class LoadHF(Loader):
     data_dir: Optional[str] = None
     data_files: Optional[Union[str, Sequence[str], Mapping[str, Union[str, Sequence[str]]]]] = None
     streaming: bool = True
+    # Optional extra `field` argument for the loader; it is forwarded only when set.
+    field: Optional[str] = None
     cached = False
 
     def process(self):
-        dataset = hf_load_dataset(
-            self.path, name=self.name, data_dir=self.data_dir, data_files=self.data_files, streaming=self.streaming
-        )
+        """Load the dataset with `hf_load_dataset` and wrap it in a `MultiStream`.
+
+        `field` is forwarded only when it is set; the remaining arguments are
+        always passed.
+        """
+        load_kwargs = {
+            "name": self.name,
+            "data_dir": self.data_dir,
+            "data_files": self.data_files,
+            "streaming": self.streaming,
+        }
+        # Keep the truthiness check: an unset (or empty) `field` must not reach
+        # the loader, presumably because not every builder accepts that argument.
+        if self.field:
+            load_kwargs["field"] = self.field
+        dataset = hf_load_dataset(self.path, **load_kwargs)
 
         return MultiStream.from_iterables(dataset)
 