From e63d93c49f896698a030bd30309812ca883b9fd6 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E9=98=BF=E5=BD=AA?= Date: Tue, 18 Jan 2022 20:27:35 +0800 Subject: [PATCH 1/5] =?UTF-8?q?=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20?= =?UTF-8?q?=20=20parlai/tasks/xpersona/=5F=5Finit=5F=5F.py=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/agent?= =?UTF-8?q?s.py=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/t?= =?UTF-8?q?asks/xpersona/build.py=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test.py=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5FEn=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/xpersona=5FEn=5Ftr?= =?UTF-8?q?ain.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parla?= =?UTF-8?q?i/tasks/xpersona/test/xpersona=5FEn=5Fvalid.yml=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5FFr=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/xpersona=5FFr=5Ftr?= =?UTF-8?q?ain.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parla?= =?UTF-8?q?i/tasks/xpersona/test/xpersona=5FFr=5Fvalid.yml=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5FId=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/xpersona=5FId=5Ftr?= =?UTF-8?q?ain.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parla?= =?UTF-8?q?i/tasks/xpersona/test/xpersona=5FId=5Fvalid.yml=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5FIt=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/xpersona=5FIt=5Ftr?= =?UTF-8?q?ain.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parla?= =?UTF-8?q?i/tasks/xpersona/test/xpersona=5FIt=5Fvalid.yml=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5FJp=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/xpersona=5FJp=5Ftr?= =?UTF-8?q?ain.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parla?= =?UTF-8?q?i/tasks/xpersona/test/xpersona=5FJp=5Fvalid.yml=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5FKo=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/xpersona=5FKo=5Ftr?= =?UTF-8?q?ain.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parla?= =?UTF-8?q?i/tasks/xpersona/test/xpersona=5FKo=5Fvalid.yml=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5FZh=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6?= =?UTF-8?q?=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/xpersona=5FZh=5Ftr?= =?UTF-8?q?ain.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parla?= =?UTF-8?q?i/tasks/xpersona/test/xpersona=5FZh=5Fvalid.yml=20=09=E6=96=B0?= =?UTF-8?q?=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpersona/test/?= =?UTF-8?q?xpersona=5Ftest.yml=20=09=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A?= =?UTF-8?q?=20=20=20parlai/tasks/xpersona/test/xpersona=5Ftrain.yml=20=09?= =?UTF-8?q?=E6=96=B0=E6=96=87=E4=BB=B6=EF=BC=9A=20=20=20parlai/tasks/xpers?= =?UTF-8?q?ona/test/xpersona=5Fvalid.yml?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- parlai/tasks/xpersona/__init__.py | 5 + parlai/tasks/xpersona/agents.py | 70 ++++++ parlai/tasks/xpersona/build.py | 200 ++++++++++++++++++ parlai/tasks/xpersona/test.py | 39 ++++ .../tasks/xpersona/test/xpersona_En_test.yml | 42 ++++ .../tasks/xpersona/test/xpersona_En_train.yml | 43 ++++ .../tasks/xpersona/test/xpersona_En_valid.yml | 46 ++++ .../tasks/xpersona/test/xpersona_Fr_test.yml | 42 ++++ .../tasks/xpersona/test/xpersona_Fr_train.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Fr_valid.yml | 42 ++++ .../tasks/xpersona/test/xpersona_Id_test.yml | 44 ++++ .../tasks/xpersona/test/xpersona_Id_train.yml | 44 ++++ .../tasks/xpersona/test/xpersona_Id_valid.yml | 43 ++++ .../tasks/xpersona/test/xpersona_It_test.yml | 42 ++++ .../tasks/xpersona/test/xpersona_It_train.yml | 43 ++++ .../tasks/xpersona/test/xpersona_It_valid.yml | 43 ++++ .../tasks/xpersona/test/xpersona_Jp_test.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Jp_train.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Jp_valid.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Ko_test.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Ko_train.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Ko_valid.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Zh_test.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Zh_train.yml | 41 ++++ .../tasks/xpersona/test/xpersona_Zh_valid.yml | 41 ++++ parlai/tasks/xpersona/test/xpersona_test.yml | 42 ++++ parlai/tasks/xpersona/test/xpersona_train.yml | 43 ++++ parlai/tasks/xpersona/test/xpersona_valid.yml | 46 ++++ 28 files changed, 1329 insertions(+) create mode 100644 parlai/tasks/xpersona/__init__.py create mode 100644 parlai/tasks/xpersona/agents.py create mode 100644 parlai/tasks/xpersona/build.py create mode 100644 parlai/tasks/xpersona/test.py create mode 100644 parlai/tasks/xpersona/test/xpersona_En_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_En_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_En_valid.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Fr_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Fr_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Fr_valid.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Id_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Id_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Id_valid.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_It_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_It_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_It_valid.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Jp_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Jp_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Jp_valid.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Ko_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Ko_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Ko_valid.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Zh_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Zh_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_Zh_valid.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_test.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_train.yml create mode 100644 parlai/tasks/xpersona/test/xpersona_valid.yml diff --git a/parlai/tasks/xpersona/__init__.py b/parlai/tasks/xpersona/__init__.py new file mode 100644 index 00000000000..240697e3247 --- /dev/null +++ b/parlai/tasks/xpersona/__init__.py @@ -0,0 +1,5 @@ +#!/usr/bin/env python3 + +# Copyright (c) Facebook, Inc. and its affiliates. +# This source code is licensed under the MIT license found in the +# LICENSE file in the root directory of this source tree. diff --git a/parlai/tasks/xpersona/agents.py b/parlai/tasks/xpersona/agents.py new file mode 100644 index 00000000000..ab5b2bbb6cd --- /dev/null +++ b/parlai/tasks/xpersona/agents.py @@ -0,0 +1,70 @@ +#!/usr/bin/env python3 + +# Copyright (c) Facebook, Inc. and its affiliates. +# This source code is licensed under the MIT license found in the +# LICENSE file in the root directory of this source tree. + +import copy +import os +from .build import build +from parlai.core.teachers import FbDeprecatedDialogTeacher + +'''This dataset is available in seven different languages. +To use the dataset in the specified language, use the task flag to specify it. + +--task xpersona:{LANGUAGE} + +The default language is English. +''' + + +def _path(opt): + # build the data if it does not exist + build(opt) + + # set up path to data (specific to each dataset) + dt = opt['datatype'].split(':')[0] + if ':' in opt['task']: + language = opt['task'].split(':')[1] + else: + language = 'En' + return os.path.join(opt['datapath'], 'XPersona', language + '_' + dt + '.txt') + + +class XPersonaTeacher(FbDeprecatedDialogTeacher): + def __init__(self, opt, shared=None): + opt = copy.deepcopy(opt) + opt['datafile'] = _path(opt) + super().__init__(opt, shared) + + +class DefaultTeacher(XPersonaTeacher): + pass + + +class EnTeacher(XPersonaTeacher): + pass + + +class ItTeacher(XPersonaTeacher): + pass + + +class ZhTeacher(XPersonaTeacher): + pass + + +class IdTeacher(XPersonaTeacher): + pass + + +class FrTeacher(XPersonaTeacher): + pass + + +class JpTeacher(XPersonaTeacher): + pass + + +class KoTeacher(XPersonaTeacher): + pass diff --git a/parlai/tasks/xpersona/build.py b/parlai/tasks/xpersona/build.py new file mode 100644 index 00000000000..8050106ad50 --- /dev/null +++ b/parlai/tasks/xpersona/build.py @@ -0,0 +1,200 @@ +#!/usr/bin/env python3 + +# Copyright (c) Facebook, Inc. and its affiliates. +# This source code is licensed under the MIT license found in the +# LICENSE file in the root directory of this source tree. +# Download and build the data if it does not exist. + +import parlai.core.build_data as build_data +import os +from parlai.core.build_data import DownloadableFile +import json +from parlai.utils.io import PathManager + +RESOURCES = [ + ########En######## + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/En_persona_test.json', + 'En_test_tmp.json', + '8baa09a8064a22967544f501821aa114393a59339c0559da8afa160966ba87c9', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/En_persona_train.json', + 'En_train_tmp.json', + 'e23112bba7320f798b07afb4c5acc3edad2a2ccb7df5cc46f141a0c79ff4665c', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/En_persona_valid.json', + 'En_valid_tmp.json', + '08ed3d41c5b0681c2d125a5312b43d926a8a5aa1d10a5df655d17f4c56dab635', + zipped=False, + ), + #######Fr######## + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Fr_persona_train_corrected.json', + 'Fr_train_tmp.json', + '40e66e91aa6360eeda642c2c674f03c52854626eaf35da50084d26ff42f61292', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Fr_persona_split_test_human_annotated.json', + 'Fr_test_tmp.json', + '0783fcf01bdf4c27ec28120a9b23bf4f0248e97ae476e03cd7e759cb2667ab23', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Fr_persona_split_valid_human_annotated.json', + 'Fr_valid_tmp.json', + '8ad86b05aabfadedba7863828b1cc4fdff0926ebf476121268089ac7ed9af149', + zipped=False, + ), + ########Id######## + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Id_persona_train_corrected.json', + 'Id_train_tmp.json', + 'fee1a9769fe707fd09401c33bdf3b3cd4f7b5fd100998577f3f179c42423bc4f', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Id_persona_split_test_human_annotated.json', + 'Id_test_tmp.json', + 'e0bcd3c02f318f4381c42798a2ce6e0a10237b6998793076fbf97f633a9f2563', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Id_persona_split_valid_human_annotated.json', + 'Id_valid_tmp.json', + '8f70cab662f082ae3ee2abce9e9cac619ebc632a2820d93414a59005dbf75d7e', + zipped=False, + ), + ########It######## + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/It_persona_train_corrected.json', + 'It_train_tmp.json', + '9636893050ad16dc2daabfe8bde6979c9c780c5da9d0790f5668e198aac18b8f', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/It_persona_split_test_human_annotated.json', + 'It_test_tmp.json', + '690103031791fd5c6763176a074cdb65e249adc784e2d577110c2d9430a02a87', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/It_persona_split_valid_human_annotated.json', + 'It_valid_tmp.json', + '720dc91d3f9bc6a56ac229c6800cde63c71677a3db8d0ace7a59a7f94d89df3d', + zipped=False, + ), + ########Jp######## + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Jp_persona_train_corrected.json', + 'Jp_train_tmp.json', + '808ee29c79303e1300b38aceee79111ffe1fd2a2facb09a0956615a61d840738', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Jp_persona_split_test_human_annotated.json', + 'Jp_test_tmp.json', + '682fed16148517097437942088d225bd728cb7b41aa390559681ae73e5e6848f', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Jp_persona_split_valid_human_annotated.json', + 'Jp_valid_tmp.json', + 'a86bb811364d100bc77ddc8038265df1e01bbc3be095e56c6ec8f179e6365d75', + zipped=False, + ), + ########Ko######## + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Ko_persona_train_corrected.json', + 'Ko_train_tmp.json', + '105d6a08d02e76f1d006edb1819b96a8b5fa8d94b3ed278936bcf171368809b7', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Ko_persona_split_test_human_annotated.json', + 'Ko_test_tmp.json', + 'f7ac6bd2aec7014a28d34bb34dceed653b389ce25d21ca770e77142578dc70a6', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Ko_persona_split_valid_human_annotated.json', + 'Ko_valid_tmp.json', + '188470f863f639946bc8248a9f6aa1e589b41ec61792b88b81e7a95c72deeae0', + zipped=False, + ), + ########Zh######## + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Zh_persona_train_corrected.json', + 'Zh_train_tmp.json', + 'e07899fa91edd127ec77502bd604693c40e264b60225976e2ac6ed145d080323', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Zh_persona_split_test_human_annotated.json', + 'Zh_test_tmp.json', + '0767a4a27c765277792597502f57ea8bb80bf7be94613b0d833107f66a7d3512', + zipped=False, + ), + DownloadableFile( + 'https://raw.githubusercontent.com/HLTCHKUST/Xpersona/master/dataset/Zh_persona_split_valid_human_annotated.json', + 'Zh_valid_tmp.json', + 'cfa90117d73fe294a1b776b2d1c7b53711bfcd724f5833204726c910dad5482d', + zipped=False, + ), +] + + +def build(opt): + dpath = os.path.join(opt['datapath'], 'XPersona') + version = None + + if not build_data.built(dpath, version_string=version): + print('[building data: ' + dpath + ']') + if build_data.built(dpath): + # An older version exists, so remove these outdated files. + build_data.remove_dir(dpath) + build_data.make_dir(dpath) + + # Download the data. + for downloadable_file in RESOURCES: + downloadable_file.download_file(dpath) + _create_parlai_format(dpath) + + # Mark the data as built. + build_data.mark_done(dpath, version_string=version) + + +def _create_parlai_format(dpath: str): + datatypes = ['train', 'valid', 'test'] + languages = ['En_', 'Zh_', 'Fr_', 'Ko_', 'Id_', 'Jp_', 'It_'] + for language in languages: + for datatype in datatypes: + datatype_full = language + datatype + '_tmp' + datatype_rename = language + datatype + load_path = os.path.join(dpath, f'{datatype_full}.json') + save_path = os.path.join(dpath, f'{datatype_rename}.txt') + with PathManager.open(load_path, 'r', encoding='utf8') as f_read: + data = json.load(f_read) + with PathManager.open(save_path, 'w', encoding='utf8') as f_write: + for content in data: + line_num = 0 + personas = content['persona'] + dialogs = content['dialogue'] + for persona in personas: + line_num += 1 + f_write.write(str(line_num) + ' your persona:' + persona + '\n') + for utterance_A, utterance_B in dialogs: + line_num += 1 + f_write.write( + str(line_num) + + ' ' + + utterance_A + + '\t' + + utterance_B + + '\n' + ) + os.remove(load_path) diff --git a/parlai/tasks/xpersona/test.py b/parlai/tasks/xpersona/test.py new file mode 100644 index 00000000000..52048a82bcf --- /dev/null +++ b/parlai/tasks/xpersona/test.py @@ -0,0 +1,39 @@ +#!/usr/bin/env python3 + +# Copyright (c) Facebook, Inc. and its affiliates. +# This source code is licensed under the MIT license found in the +# LICENSE file in the root directory of this source tree. + +from parlai.utils.testing import AutoTeacherTest # noqa: F401 + + +class TestDefaultTeacher(AutoTeacherTest): + task = 'xpersona' + + +class TestEnTeacher(AutoTeacherTest): + task = 'xpersona:En' + + +class TestZhTeacher(AutoTeacherTest): + task = 'xpersona:Zh' + + +class TestFrTeacher(AutoTeacherTest): + task = 'xpersona:Fr' + + +class TestIdTeacher(AutoTeacherTest): + task = 'xpersona:Id' + + +class TestItTeacher(AutoTeacherTest): + task = 'xpersona:It' + + +class TestKoTeacher(AutoTeacherTest): + task = 'xpersona:Ko' + + +class TestJpTeacher(AutoTeacherTest): + task = 'xpersona:Jp' diff --git a/parlai/tasks/xpersona/test/xpersona_En_test.yml b/parlai/tasks/xpersona/test/xpersona_En_test.yml new file mode 100644 index 00000000000..65ab619a4ab --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_En_test.yml @@ -0,0 +1,42 @@ +acts: +- - episode_done: false + eval_labels: + - i am good , i just got off work and tired , i have two jobs . + id: xpersona:En + reward: 0 + text: 'your persona:i read twenty books a year. + + your persona:i''m a stunt double as my second job. + + your persona:i only eat kosher. + + your persona:i was raised in a single parent household. + + hello what are doing today ?' +- - episode_done: false + eval_labels: + - i rather read , i've read about 20 books this year . + id: xpersona:En + reward: 0 + text: i just got done watching a horror movie +- - episode_done: false + eval_labels: + - but a good movie is always good . + id: xpersona:En + reward: 0 + text: wow ! i do love a good horror movie . loving this cooler weather +- - episode_done: false + eval_labels: + - i work in the movies as well . + id: xpersona:En + reward: 0 + text: yes ! my son is in junior high and i just started letting him watch them + too +- - episode_done: false + eval_labels: + - yes it is neat , i stunt double , it is so much fun and hard work . + id: xpersona:En + reward: 0 + text: neat ! ! i used to work in the human services field +num_episodes: 1000 +num_examples: 7801 diff --git a/parlai/tasks/xpersona/test/xpersona_En_train.yml b/parlai/tasks/xpersona/test/xpersona_En_train.yml new file mode 100644 index 00000000000..bce680ac2cf --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_En_train.yml @@ -0,0 +1,43 @@ +acts: +- - episode_done: false + id: xpersona:En + labels: + - you must be very fast . hunting is one of my favorite hobbies . + reward: 0 + text: 'your persona:i like to remodel homes. + + your persona:i like to go hunting. + + your persona:i like to shoot a bow. + + your persona:my favorite holiday is halloween. + + hi , how are you doing ? i''m getting ready to do some cheetah chasing to stay + in shape .' +- - episode_done: false + id: xpersona:En + labels: + - i also remodel homes when i am not out bow hunting . + reward: 0 + text: i am ! for my hobby i like to do canning or some whittling . +- - episode_done: false + id: xpersona:En + labels: + - that's awesome . do you have a favorite season or time of year ? + reward: 0 + text: that's neat . when i was in high school i placed 6th in 100m dash ! +- - episode_done: false + id: xpersona:En + labels: + - what is your favorite meat to eat ? + reward: 0 + text: i do not . but i do have a favorite meat since that is all i eat exclusively + . +- - episode_done: false + id: xpersona:En + labels: + - i like chicken or macaroni and cheese . + reward: 0 + text: i would have to say its prime rib . do you have any favorite foods ? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_En_valid.yml b/parlai/tasks/xpersona/test/xpersona_En_valid.yml new file mode 100644 index 00000000000..13807c4ed44 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_En_valid.yml @@ -0,0 +1,46 @@ +acts: +- - episode_done: false + eval_labels: + - hey there ! i'm just taking a break from baking . whats up ? + id: xpersona:En + reward: 0 + text: 'your persona:i''m a nurse. + + your persona:i am a great baker. + + your persona:i surf often. + + your persona:i was an army brat. + + __SILENCE__' +- - episode_done: false + eval_labels: + - how romantic ! just some cupcakes for the surf a thon . gotta feed my fellow + surfers + id: xpersona:En + reward: 0 + text: finishing plans for my wedding in the park next week ! what are you baking + ? +- - episode_done: false + eval_labels: + - wow sounds so sweet ! so we both love the water huh ? + id: xpersona:En + reward: 0 + text: gnarly ! reminds me of the niagra falls where we are taking our honeymoon + . +- - episode_done: false + eval_labels: + - haha its sweet you compromised . have you been together long ? + id: xpersona:En + reward: 0 + text: yeah , although i'd prefer the beach . the falls are her idea . +- - episode_done: false + eval_labels: + - i get it . . . i grew up an army brat and my family is so disapproving of me + too . + id: xpersona:En + reward: 0 + text: 7 years . you would think my family would like her by now but they don't + . +num_episodes: 1000 +num_examples: 7316 diff --git a/parlai/tasks/xpersona/test/xpersona_Fr_test.yml b/parlai/tasks/xpersona/test/xpersona_Fr_test.yml new file mode 100644 index 00000000000..5bafbd6ebb9 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Fr_test.yml @@ -0,0 +1,42 @@ +acts: +- - episode_done: false + eval_labels: + - je vais bien, je viens de quitter le travail et je suis fatigué, j'ai deux emplois. + id: xpersona:Fr + reward: 0 + text: 'your persona:je lis vingt livres par an. + + your persona:je suis un cascadeur comme deuxième travail. + + your persona:je ne mange que casher. + + your persona:j''ai été élevé dans une famille monoparentale. + + bonjour que fais tu aujourd''hui?' +- - episode_done: false + eval_labels: + - j'ai plutôt lu, j'ai lu environ 20 livres cette année. + id: xpersona:Fr + reward: 0 + text: je viens de finir de regarder un film d'horreur +- - episode_done: false + eval_labels: + - mais un bon film est toujours bon. + id: xpersona:Fr + reward: 0 + text: Hou la la ! j'aime un bon film d'horreur. aimer ce temps plus frais +- - episode_done: false + eval_labels: + - je travaille aussi dans les films. + id: xpersona:Fr + reward: 0 + text: Oui ! mon fils est au premier cycle du secondaire et je viens de le laisser + le regarder aussi +- - episode_done: false + eval_labels: + - oui c'est soigné, je stunt double, c'est tellement amusant et dur de travailler. + id: xpersona:Fr + reward: 0 + text: bon ! ! j'ai travaillé dans le domaine des services à la personne +num_episodes: 249 +num_examples: 1950 diff --git a/parlai/tasks/xpersona/test/xpersona_Fr_train.yml b/parlai/tasks/xpersona/test/xpersona_Fr_train.yml new file mode 100644 index 00000000000..47db8cb25e7 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Fr_train.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + id: xpersona:Fr + labels: + - vous devez être très rapide. la chasse est l'un de mes passe-temps préférés. + reward: 0 + text: 'your persona:j''aime remodeler des maisons. + + your persona:j''aime aller chasser. + + your persona:j''aime tirer un arc. + + your persona:ma fête préférée est Halloween. + + salut comment vas-tu ? Je me prépare à faire du guépard pour rester en forme.' +- - episode_done: false + id: xpersona:Fr + labels: + - je remodèle aussi des maisons quand je ne suis pas à la chasse à l'arc. + reward: 0 + text: je suis ! pour mon hobby j'aime faire la mise en conserve ou un peu tailler. +- - episode_done: false + id: xpersona:Fr + labels: + - c'est génial . avez-vous une saison ou une période préférée de l'année? + reward: 0 + text: c'est bien. quand j'étais au lycée, je me suis placé 6ème au 100m dash! +- - episode_done: false + id: xpersona:Fr + labels: + - quelle est votre viande préférée à manger? + reward: 0 + text: Non . mais j'ai une viande préférée car c'est tout ce que je mange exclusivement. +- - episode_done: false + id: xpersona:Fr + labels: + - j'aime le poulet ou les macaronis et le fromage. + reward: 0 + text: je devrais dire sa côte de bœuf. avez-vous des aliments préférés? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_Fr_valid.yml b/parlai/tasks/xpersona/test/xpersona_Fr_valid.yml new file mode 100644 index 00000000000..7ac868d2370 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Fr_valid.yml @@ -0,0 +1,42 @@ +acts: +- - episode_done: false + eval_labels: + - je le fais bien . juste se détendre avec mes deux chiens. + id: xpersona:Fr + reward: 0 + text: 'your persona:j''ai deux chiens. + + your persona:j''aime travailler sur les voitures anciennes. + + your persona:ma musique préférée est le country. + + your persona:je possède deux mustangs vintages. + + salut ! comment vas-tu ce soir ?' +- - episode_done: false + eval_labels: + - c'est bien. quel genre de travail bénévole faites-vous? + id: xpersona:Fr + reward: 0 + text: génial . dans mon temps libre je fais du bénévolat. +- - episode_done: false + eval_labels: + - Bien pour vous . vous aimez les voitures anciennes? j'ai deux anciennes mustangs. + id: xpersona:Fr + reward: 0 + text: je travaille dans un refuge pour sans-abri dans ma ville. +- - episode_done: false + eval_labels: + - les voitures sont mon truc. voitures anciennes . j'adore travailler sur cela. + est-ce que tu aimes ça ? + id: xpersona:Fr + reward: 0 + text: cool . pas vraiment dans les voitures. mon travail de jour est dur. +- - episode_done: false + eval_labels: + - je n'ai pas pensé à l'aspect foule de la lutte. je n'aime pas les foules. + id: xpersona:Fr + reward: 0 + text: oui, j'aime la foule, faire connaissance avec les gens. +num_episodes: 248 +num_examples: 1934 diff --git a/parlai/tasks/xpersona/test/xpersona_Id_test.yml b/parlai/tasks/xpersona/test/xpersona_Id_test.yml new file mode 100644 index 00000000000..f900c475265 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Id_test.yml @@ -0,0 +1,44 @@ +acts: +- - episode_done: false + eval_labels: + - saya baik, saya baru saja pulang kerja dan lelah, saya punya dua pekerjaan. + id: xpersona:Id + reward: 0 + text: 'your persona:saya membaca dua puluh buku dalam setahun. + + your persona:Saya seorang akrobat ganda sebagai pekerjaan sampingan saya. + + your persona:saya hanya makan halal. + + your persona:saya dibesarkan dalam rumah tangga dengan orang tua tunggal. + + halo apa yang Anda lakukan hari ini?' +- - episode_done: false + eval_labels: + - saya lebih suka membaca, saya sudah membaca sekitar 20 buku tahun ini. + id: xpersona:Id + reward: 0 + text: saya baru saja selesai menonton film horor +- - episode_done: false + eval_labels: + - tapi sebuah film yang bagus tentu selalu bagus. + id: xpersona:Id + reward: 0 + text: wow! Saya sangat suka film horor yang bagus. Saya juga suka cuaca yang lebih + dingin seperti ini. +- - episode_done: false + eval_labels: + - saya bekerja di bidang perfilman. + id: xpersona:Id + reward: 0 + text: benar! anak saya masih SMP dan saya mulai membiarkannya menonton film horor + juga. +- - episode_done: false + eval_labels: + - benar, itu keren, saya seorang pemain pengganti, itu sangat menyenangkan dan + membutuhkan kerja keras. + id: xpersona:Id + reward: 0 + text: keren!! saya pernah bekerja di bidang layanan manusia. +num_episodes: 484 +num_examples: 3770 diff --git a/parlai/tasks/xpersona/test/xpersona_Id_train.yml b/parlai/tasks/xpersona/test/xpersona_Id_train.yml new file mode 100644 index 00000000000..425665110d9 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Id_train.yml @@ -0,0 +1,44 @@ +acts: +- - episode_done: false + id: xpersona:Id + labels: + - Anda pasti sangat cepat. berburu adalah salah satu hobi favorit saya. + reward: 0 + text: 'your persona:Saya suka merombak rumah. + + your persona:saya suka pergi berburu. + + your persona:saya suka menembak busur. + + your persona:liburan favorit saya adalah halloween. + + Hai apa kabar ? Saya bersiap-siap untuk melakukan cheetah mengejar untuk tetap + bugar.' +- - episode_done: false + id: xpersona:Id + labels: + - saya juga merombak rumah ketika saya tidak berburu busur. + reward: 0 + text: saya ! untuk hobi saya, saya suka melakukan pengalengan atau sedikit merengek. +- - episode_done: false + id: xpersona:Id + labels: + - itu luar biasa. apakah Anda memiliki musim atau waktu favorit tahun ini? + reward: 0 + text: itu bagus . Ketika saya masih di sekolah menengah saya menempatkan 6 dalam + 100m dasbor! +- - episode_done: false + id: xpersona:Id + labels: + - apa daging favoritmu untuk dimakan? + reward: 0 + text: saya tidak . tapi saya punya daging favorit karena hanya itu yang saya makan + secara eksklusif. +- - episode_done: false + id: xpersona:Id + labels: + - Saya suka ayam atau makaroni dan keju. + reward: 0 + text: Saya harus mengatakan tulang rusuk utama. apakah Anda punya makanan favorit? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_Id_valid.yml b/parlai/tasks/xpersona/test/xpersona_Id_valid.yml new file mode 100644 index 00000000000..9bd1f44417f --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Id_valid.yml @@ -0,0 +1,43 @@ +acts: +- - episode_done: false + eval_labels: + - saya baik-baik saja. hanya bersantai dengan kedua anjing saya. + id: xpersona:Id + reward: 0 + text: 'your persona:saya punya dua anjing. + + your persona:Saya suka mengurus mobil vintage. + + your persona:musik favorit saya adalah country. + + your persona:Saya memiliki dua mustang vintage. + + hai! bagaimana kabar anda malam ini?' +- - episode_done: false + eval_labels: + - itu hebat. pekerjaan sukarela seperti apa yang anda lakukan? + id: xpersona:Id + reward: 0 + text: bagus. di waktu luang saya melakukan pekerjaan sukarela. +- - episode_done: false + eval_labels: + - bagus, apakah anda suka mobil-mobil vintage? saya punya dua mustang tua. + id: xpersona:Id + reward: 0 + text: saya bekerja di sebuah tempat penampungan tunawisma di kota saya. +- - episode_done: false + eval_labels: + - mobil adalah kesenangan saya. mobil-mobil vintage. saya suka memodifikasi mobil. + gulat? apakah Anda menikmatinya? + id: xpersona:Id + reward: 0 + text: keren. saya tidak terlalu tertarik dengan mobil. pekerjaan sehari-hari saya + adalah bergulat. +- - episode_done: false + eval_labels: + - saya tidak memikirkan aspek keramaian dari gulat. saya tidak menyukai keramaian. + id: xpersona:Id + reward: 0 + text: ya, saya suka keramaian, membuat saya mengenal orang lain. +num_episodes: 484 +num_examples: 3781 diff --git a/parlai/tasks/xpersona/test/xpersona_It_test.yml b/parlai/tasks/xpersona/test/xpersona_It_test.yml new file mode 100644 index 00000000000..3fbdc8080a7 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_It_test.yml @@ -0,0 +1,42 @@ +acts: +- - episode_done: false + eval_labels: + - sto bene, sono appena uscito dal lavoro e sono stanco, ho due lavori. + id: xpersona:It + reward: 0 + text: 'your persona:leggo venti libri all''anno. + + your persona:sono una controfigura come secondo lavoro. + + your persona:mangio solo kosher. + + your persona:sono cresciuto in una famiglia con un solo genitore. + + ciao cosa fai oggi?' +- - episode_done: false + eval_labels: + - preferisco leggere, ho letto circa 20 libri quest'anno. + id: xpersona:It + reward: 0 + text: ho appena finito di guardare un film dell'orrore +- - episode_done: false + eval_labels: + - un bel film é sempre un bel film . + id: xpersona:It + reward: 0 + text: Wow ! Mi pieacerebbe davvero guardare un bel film horror. Questo fresco + é piacevole. +- - episode_done: false + eval_labels: + - lavoro anche nell'industria cinematografica . + id: xpersona:It + reward: 0 + text: si ! mio figlio é alle medie e ho appena iniziato a fargleli vedere +- - episode_done: false + eval_labels: + - si , é figo , faccio anche lo stantman, é molto divertente, ma é un lavoro faticoso. + id: xpersona:It + reward: 0 + text: eccezionale! ! Io invece lavoravo nel campo dei servizi umani +num_episodes: 140 +num_examples: 1096 diff --git a/parlai/tasks/xpersona/test/xpersona_It_train.yml b/parlai/tasks/xpersona/test/xpersona_It_train.yml new file mode 100644 index 00000000000..2a1cc1164a4 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_It_train.yml @@ -0,0 +1,43 @@ +acts: +- - episode_done: false + id: xpersona:It + labels: + - devi essere molto veloce. la caccia è uno dei miei hobby preferiti. + reward: 0 + text: 'your persona:mi piace ristrutturare le case. + + your persona:mi piace andare a caccia. + + your persona:mi piace tirare un inchino. + + your persona:la mia vacanza preferita è halloween. + + Ciao come va ? mi sto preparando a fare qualche ghepardo inseguendo per rimanere + in forma.' +- - episode_done: false + id: xpersona:It + labels: + - Ritocco anche le case quando non sono fuori a caccia di prua. + reward: 0 + text: sono ! per il mio hobby mi piace fare conserve o un po 'di whittling. +- - episode_done: false + id: xpersona:It + labels: + - è fantastico. hai una stagione o un periodo dell'anno preferito? + reward: 0 + text: è pulito. quando ero al liceo mi sono piazzato sesto nella lineetta dei + 100m! +- - episode_done: false + id: xpersona:It + labels: + - qual'è la tua carne preferita da mangiare? + reward: 0 + text: Io non . ma ho una carne preferita dato che è tutto ciò che mangio esclusivamente. +- - episode_done: false + id: xpersona:It + labels: + - mi piacciono il pollo, i maccheroni e il formaggio. + reward: 0 + text: dovrei dire la sua costola. hai dei cibi preferiti? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_It_valid.yml b/parlai/tasks/xpersona/test/xpersona_It_valid.yml new file mode 100644 index 00000000000..1377be6a339 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_It_valid.yml @@ -0,0 +1,43 @@ +acts: +- - episode_done: false + eval_labels: + - Sto andando alla grande . mi sto solo rilassando con i miei due cani. + id: xpersona:It + reward: 0 + text: 'your persona:ho due cani. + + your persona:mi piace lavorare su auto d''epoca. + + your persona:la mia musica preferita è il Country. + + your persona:Possiedo due mustang vintage. + + Ciao ! come stai sta sera ?' +- - episode_done: false + eval_labels: + - Eccezionale. che tipo di volontariato fai? + id: xpersona:It + reward: 0 + text: grande . nel mio tempo libero faccio volontariato. +- - episode_done: false + eval_labels: + - buon per te . ti piacciono le auto d'epoca? ho due mustang d'epoca. + id: xpersona:It + reward: 0 + text: lavoro in un rifugio per senzatetto nella mia cittá. +- - episode_done: false + eval_labels: + - le macchine fanno per me, specialmente le auto d'epoca. mi piace lavorarci. + wrestling? ti piace ? + id: xpersona:It + reward: 0 + text: pazzesco . le macchine non fanno per me. Faccio il wrestler. +- - episode_done: false + eval_labels: + - non ho pensato ha quante persone ci sono in un' incontro di wrestling. non mi + piacciono le folle. + id: xpersona:It + reward: 0 + text: si, amo la folla, conoscere gente. +num_episodes: 140 +num_examples: 1080 diff --git a/parlai/tasks/xpersona/test/xpersona_Jp_test.yml b/parlai/tasks/xpersona/test/xpersona_Jp_test.yml new file mode 100644 index 00000000000..8bf3c58ccf3 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Jp_test.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + eval_labels: + - 元気です。ちょうど仕事が終わって疲れました。私は2つの仕事をしています。 + id: xpersona:Jp + reward: 0 + text: 'your persona:私は年間20冊の本を読みました。 + + your persona:私は私の2番目の仕事を兼ねたスタントです。 + + your persona:私はコーシャだけを食べます。 + + your persona:私はひとり親家庭で育ちました。 + + こんにちは今日は何をしていますか?' +- - episode_done: false + eval_labels: + - 私はむしろ読書が好きです、私は今年約20冊の本を読みました。 + id: xpersona:Jp + reward: 0 + text: ホラー映画を観たところです +- - episode_done: false + eval_labels: + - しかし、良い映画は常に良いです。 + id: xpersona:Jp + reward: 0 + text: うわー !私は良いホラー映画が大好きです。この涼しい天気が大好き +- - episode_done: false + eval_labels: + - 私も映画で働いています。 + id: xpersona:Jp + reward: 0 + text: はい !私の息子は中学生なのですが、彼にそれらを見ることを最近許し始めました。 +- - episode_done: false + eval_labels: + - はい、それは素晴らしいです。私はスタントマンとして働いていました。楽しくて大変な仕事です。 + id: xpersona:Jp + reward: 0 + text: 素晴らしい! !私はヒューマンサービス分野で働いていました +num_episodes: 275 +num_examples: 2161 diff --git a/parlai/tasks/xpersona/test/xpersona_Jp_train.yml b/parlai/tasks/xpersona/test/xpersona_Jp_train.yml new file mode 100644 index 00000000000..081a9b20588 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Jp_train.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + id: xpersona:Jp + labels: + - あなたは非常に速くなければなりません。狩猟は私の好きな趣味の1つです。 + reward: 0 + text: 'your persona:私は家を改造するのが好きです。 + + your persona:私は狩りに行くのが好きです。 + + your persona:私は弓を撃つのが好きです。 + + your persona:私のお気に入りの休日はハロウィーンです。 + + こんにちは、元気ですか?私はチーターを追いかけて体調を整える準備をしています。' +- - episode_done: false + id: xpersona:Jp + labels: + - 弓狩りをしていないときも家を改造します。 + reward: 0 + text: わたし !私の趣味のために私は缶詰か口someをするのが好きです。 +- - episode_done: false + id: xpersona:Jp + labels: + - それは素晴らしいです。好きな季節や時期はありますか? + reward: 0 + text: それはきちんとしている。私が高校にいたとき、100mダッシュで6位になりました! +- - episode_done: false + id: xpersona:Jp + labels: + - 好きな肉は何ですか? + reward: 0 + text: 私はしません 。でも好きな肉があるのはそれだけで食べるから。 +- - episode_done: false + id: xpersona:Jp + labels: + - 私はチキンやマカロニとチーズが好きです。 + reward: 0 + text: 私はそのプライムリブを言わなければならないでしょう。好きな食べ物はありますか? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_Jp_valid.yml b/parlai/tasks/xpersona/test/xpersona_Jp_valid.yml new file mode 100644 index 00000000000..1ebda7356da --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Jp_valid.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + eval_labels: + - 私は元気です。私の2匹の犬とリラックスしています。 + id: xpersona:Jp + reward: 0 + text: 'your persona:私は2匹の犬を飼っています。 + + your persona:ヴィンテージカーで仕事をするのが好きです。 + + your persona:私の好きな音楽は田舎です。 + + your persona:私は2つのビンテージマスタングを所有しています。 + + こんばんは !今夜はどうお過ごしですか?' +- - episode_done: false + eval_labels: + - それは素晴らしい。どんなボランティア活動をしていますか? + id: xpersona:Jp + reward: 0 + text: すばらしいです 。暇なときはボランティア活動をしています。 +- - episode_done: false + eval_labels: + - いいですね。ビンテージカーはお好きですか?私は2つの古いムスタングを持っています。 + id: xpersona:Jp + reward: 0 + text: 私は町のホームレスシェルターで働いています。 +- - episode_done: false + eval_labels: + - 車はお気に入りです。ヴィンテージカー。私はそれらに取り組むことが大好きです。レスリングですか?楽しんでますか? + id: xpersona:Jp + reward: 0 + text: かっこいいですね。私はあまり車に興味がありません。私の仕事はレスリングです。 +- - episode_done: false + eval_labels: + - 私はレスリングの群衆の側面について考えませんでした。私は群衆が好きではありません。 + id: xpersona:Jp + reward: 0 + text: はい、私は群衆や人々と知り合いになるのが大好きです。 +num_episodes: 275 +num_examples: 2139 diff --git a/parlai/tasks/xpersona/test/xpersona_Ko_test.yml b/parlai/tasks/xpersona/test/xpersona_Ko_test.yml new file mode 100644 index 00000000000..5afba3d91ea --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Ko_test.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + eval_labels: + - 나는 좋아, 나는 방금 퇴근 했어 그리고 피곤해, 나는 두 직업을 가지고 있어. + id: xpersona:Ko + reward: 0 + text: 'your persona:나는 일년에 20권의 책을 읽어. + + your persona:난 두 번째 직업으로 대역이야 + + your persona:나는 오직 코셔만 먹어. + + your persona:나는 한 부모 가정에서 자랐어. + + 안녕, 오늘 뭐하니?' +- - episode_done: false + eval_labels: + - 나는 차라리 책을 읽어, 나는 올해 약 20권의 책을 읽었어. + id: xpersona:Ko + reward: 0 + text: 나는 방금 공포영화를 다 봤어. +- - episode_done: false + eval_labels: + - 그러나 좋은 영화는 항상 좋아. + id: xpersona:Ko + reward: 0 + text: 와우! 나는 좋은 공포영화를 좋아해. 더 시원한 날씨를 좋아해. +- - episode_done: false + eval_labels: + - 나는 영화계에서도 일해. + id: xpersona:Ko + reward: 0 + text: 응! 내 아들은 중학교에 다니고 있어. 나도 이제 막 내 아들이 그들을 보게 하기 시작했어. +- - episode_done: false + eval_labels: + - 그래, 그것은 멋지다, 나는 대역이야 그것은 매우 재미있고 힘든 일이야. + id: xpersona:Ko + reward: 0 + text: 좋았어! 나는 사회 복지 분야에서 일했었어. +num_episodes: 300 +num_examples: 2339 diff --git a/parlai/tasks/xpersona/test/xpersona_Ko_train.yml b/parlai/tasks/xpersona/test/xpersona_Ko_train.yml new file mode 100644 index 00000000000..8a69f58b939 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Ko_train.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + id: xpersona:Ko + labels: + - 너는 매우 빨라야 한다. 사냥은 내가 가장 좋아하는 취미중의 하나이다. + reward: 0 + text: 'your persona:나는 집을 개조하는 것을 좋아한다. + + your persona:나는 사냥 가는 것을 좋아한다. + + your persona:나는 활 쏘는 것을 좋아한다. + + your persona:내가 가장 좋아하는 휴일은 할로윈이다. + + 안녕, 어떻게 지내니? 나는 몸매를 유지하기 위해 치타를 쫓을 준비를 하고 있어.' +- - episode_done: false + id: xpersona:Ko + labels: + - 나는 또한 내가 활 사냥을 나가지 않을 때 집을 개조한다. + reward: 0 + text: 나는 나의 취미로 통조림이나 약간의 채찍질을 좋아한다. +- - episode_done: false + id: xpersona:Ko + labels: + - 멋지다. 너는 일년 중 가장 좋아하는 계절이나 시간을 가지고 있니? + reward: 0 + text: 멋지다. 내가 고등학교 때 100m 경주에서 6위를 했어! +- - episode_done: false + id: xpersona:Ko + labels: + - 네가 가장 좋아하는 고기는 뭐니? + reward: 0 + text: 나는 그렇지 않다. 그러나 그것이 내가 독점적으로 먹는 전부이기 때문에 나는 가장 좋아하는 고기를 가지고 있다. +- - episode_done: false + id: xpersona:Ko + labels: + - 나는 치킨이나 마카로니, 치즈를 좋아한다. + reward: 0 + text: 나는 그것의 주요 갈비라고 말해야 할 것이다. 너는 좋아하는 음식을 가지고 있니? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_Ko_valid.yml b/parlai/tasks/xpersona/test/xpersona_Ko_valid.yml new file mode 100644 index 00000000000..77ff459606b --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Ko_valid.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + eval_labels: + - 나는 아주 잘 지내고 있어. 그냥 내 두 마리의 개와 함께 쉬고 있을 뿐이야. + id: xpersona:Ko + reward: 0 + text: 'your persona:나는 두 마리의 개를 가지고 있어. + + your persona:나는 빈티지 카에 대해 일하는 것을 좋아해. + + your persona:내가 가장 좋아하는 음악은 컨트리야 + + your persona:나는 빈티지 무스탕 두 개를 가지고 있어. + + 안녕! 오늘 밤 어떻게 지내니?' +- - episode_done: false + eval_labels: + - 멋지다. 너는 어떤 종류의 자원봉사를 하니? + id: xpersona:Ko + reward: 0 + text: 대단해. 여가시간에 나는 봉사활동을 해. +- - episode_done: false + eval_labels: + - 잘됐군요. 너는 빈티지 자동차를 좋아하니? 나는 두 개의 오래된 무스탕을 가지고 있어. + id: xpersona:Ko + reward: 0 + text: 나는 우리 마을의 노숙자 쉼터에서 일해. +- - episode_done: false + eval_labels: + - 차는 나의 전문분야야. 빈티지 자동차. 나는 그것들에 대해 일하는 것을 좋아해. 레슬링? 너는 그것을 즐기니? + id: xpersona:Ko + reward: 0 + text: 멋지다. 사실 자동차에는 관심이 별로 없어. 나의 주간 일은 레슬링이야. +- - episode_done: false + eval_labels: + - 나는 레슬링의 군중적인 측면에 대해 생각하지 않았어. 나는 군중들을 좋아하지 않아. + id: xpersona:Ko + reward: 0 + text: 예, 나는 군중들을 사랑합니다, 사람들을 알게 되는 것. +num_episodes: 299 +num_examples: 2342 diff --git a/parlai/tasks/xpersona/test/xpersona_Zh_test.yml b/parlai/tasks/xpersona/test/xpersona_Zh_test.yml new file mode 100644 index 00000000000..cf28bbd2cff --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Zh_test.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + eval_labels: + - 我很好,我刚下班很累,我有两份工作。 + id: xpersona:Zh + reward: 0 + text: 'your persona:我一年读二十本书。 + + your persona:我的第二份工作是做特技。 + + your persona:我只吃犹太洁食。 + + your persona:我在单亲家庭中长大。 + + 你好,今天在做什么?' +- - episode_done: false + eval_labels: + - 我更喜欢看书,今年我已经看了20本书。 + id: xpersona:Zh + reward: 0 + text: 我刚看完一部恐怖电影 +- - episode_done: false + eval_labels: + - 好看的电影总是好的。 + id: xpersona:Zh + reward: 0 + text: 哇 !我确实喜欢看一部恐怖电影。喜欢这种凉爽的天气 +- - episode_done: false + eval_labels: + - 我也看电影。 + id: xpersona:Zh + reward: 0 + text: 是的!我儿子在初中,我也开始让他看他们 +- - episode_done: false + eval_labels: + - 是吗,那很棒,那是非常有趣和困难的工作。 + id: xpersona:Zh + reward: 0 + text: 太好了! !我曾经在服务业工作 +num_episodes: 222 +num_examples: 1729 diff --git a/parlai/tasks/xpersona/test/xpersona_Zh_train.yml b/parlai/tasks/xpersona/test/xpersona_Zh_train.yml new file mode 100644 index 00000000000..b578937e7ee --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Zh_train.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + id: xpersona:Zh + labels: + - 你必须很快。狩猎是我最喜欢的爱好之一。 + reward: 0 + text: 'your persona:我喜欢装修房屋。 + + your persona:我喜欢打猎。 + + your persona:我喜欢打弓。 + + your persona:我最喜欢的假期是万圣节。 + + 嗨,你好吗 ?我准备做一些猎豹追捕以保持体形。' +- - episode_done: false + id: xpersona:Zh + labels: + - 当我不狩猎弓箭时,我也会改造房屋。 + reward: 0 + text: 我是 !为了我的爱好,我喜欢装罐头或一些糖果。 +- - episode_done: false + id: xpersona:Zh + labels: + - 棒极了 。您有一年中最喜欢的季节或时间吗? + reward: 0 + text: 那很好 。当我上高中时,我在100m冲刺中排名第六! +- - episode_done: false + id: xpersona:Zh + labels: + - 你最喜欢吃什么肉? + reward: 0 + text: 我不 。但是我确实喜欢一种肉,因为那是我唯一吃的。 +- - episode_done: false + id: xpersona:Zh + labels: + - 我喜欢鸡肉或通心粉和奶酪。 + reward: 0 + text: 我不得不说它的主要肋骨。你有最喜欢的食物吗? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_Zh_valid.yml b/parlai/tasks/xpersona/test/xpersona_Zh_valid.yml new file mode 100644 index 00000000000..3c6d3d3a804 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_Zh_valid.yml @@ -0,0 +1,41 @@ +acts: +- - episode_done: false + eval_labels: + - 我很好 。和我的两只狗一起放松。 + id: xpersona:Zh + reward: 0 + text: 'your persona:我有两只狗。 + + your persona:我喜欢在老爷车上工作。 + + your persona:我最喜欢的音乐是乡村。 + + your persona:我拥有两个老式野马。 + + 嗨!你今晚过得怎么样?' +- - episode_done: false + eval_labels: + - 那很好 。您从事什么样的志愿工作? + id: xpersona:Zh + reward: 0 + text: 好极了。在业余时间我做志愿者工作。 +- - episode_done: false + eval_labels: + - 那很好。你喜欢老爷车吗?我有两个福特野马。 + id: xpersona:Zh + reward: 0 + text: 我在城镇的一个收容所工作。 +- - episode_done: false + eval_labels: + - 汽车是我的工作。老爷车。我喜欢为他们工作。摔角?你喜欢吗? + id: xpersona:Zh + reward: 0 + text: 很酷。我并不是很喜欢汽车。我的白天的工作是摔跤。 +- - episode_done: false + eval_labels: + - 我没考虑过摔跤。我不喜欢人多的地方。 + id: xpersona:Zh + reward: 0 + text: 是的,我喜欢人多的地方,也喜欢去了解人们。 +num_episodes: 222 +num_examples: 1720 diff --git a/parlai/tasks/xpersona/test/xpersona_test.yml b/parlai/tasks/xpersona/test/xpersona_test.yml new file mode 100644 index 00000000000..0f7523aa749 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_test.yml @@ -0,0 +1,42 @@ +acts: +- - episode_done: false + eval_labels: + - i am good , i just got off work and tired , i have two jobs . + id: xpersona + reward: 0 + text: 'your persona:i read twenty books a year. + + your persona:i''m a stunt double as my second job. + + your persona:i only eat kosher. + + your persona:i was raised in a single parent household. + + hello what are doing today ?' +- - episode_done: false + eval_labels: + - i rather read , i've read about 20 books this year . + id: xpersona + reward: 0 + text: i just got done watching a horror movie +- - episode_done: false + eval_labels: + - but a good movie is always good . + id: xpersona + reward: 0 + text: wow ! i do love a good horror movie . loving this cooler weather +- - episode_done: false + eval_labels: + - i work in the movies as well . + id: xpersona + reward: 0 + text: yes ! my son is in junior high and i just started letting him watch them + too +- - episode_done: false + eval_labels: + - yes it is neat , i stunt double , it is so much fun and hard work . + id: xpersona + reward: 0 + text: neat ! ! i used to work in the human services field +num_episodes: 1000 +num_examples: 7801 diff --git a/parlai/tasks/xpersona/test/xpersona_train.yml b/parlai/tasks/xpersona/test/xpersona_train.yml new file mode 100644 index 00000000000..1af6ae9dedd --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_train.yml @@ -0,0 +1,43 @@ +acts: +- - episode_done: false + id: xpersona + labels: + - you must be very fast . hunting is one of my favorite hobbies . + reward: 0 + text: 'your persona:i like to remodel homes. + + your persona:i like to go hunting. + + your persona:i like to shoot a bow. + + your persona:my favorite holiday is halloween. + + hi , how are you doing ? i''m getting ready to do some cheetah chasing to stay + in shape .' +- - episode_done: false + id: xpersona + labels: + - i also remodel homes when i am not out bow hunting . + reward: 0 + text: i am ! for my hobby i like to do canning or some whittling . +- - episode_done: false + id: xpersona + labels: + - that's awesome . do you have a favorite season or time of year ? + reward: 0 + text: that's neat . when i was in high school i placed 6th in 100m dash ! +- - episode_done: false + id: xpersona + labels: + - what is your favorite meat to eat ? + reward: 0 + text: i do not . but i do have a favorite meat since that is all i eat exclusively + . +- - episode_done: false + id: xpersona + labels: + - i like chicken or macaroni and cheese . + reward: 0 + text: i would have to say its prime rib . do you have any favorite foods ? +num_episodes: 16878 +num_examples: 124122 diff --git a/parlai/tasks/xpersona/test/xpersona_valid.yml b/parlai/tasks/xpersona/test/xpersona_valid.yml new file mode 100644 index 00000000000..256102185c7 --- /dev/null +++ b/parlai/tasks/xpersona/test/xpersona_valid.yml @@ -0,0 +1,46 @@ +acts: +- - episode_done: false + eval_labels: + - hey there ! i'm just taking a break from baking . whats up ? + id: xpersona + reward: 0 + text: 'your persona:i''m a nurse. + + your persona:i am a great baker. + + your persona:i surf often. + + your persona:i was an army brat. + + __SILENCE__' +- - episode_done: false + eval_labels: + - how romantic ! just some cupcakes for the surf a thon . gotta feed my fellow + surfers + id: xpersona + reward: 0 + text: finishing plans for my wedding in the park next week ! what are you baking + ? +- - episode_done: false + eval_labels: + - wow sounds so sweet ! so we both love the water huh ? + id: xpersona + reward: 0 + text: gnarly ! reminds me of the niagra falls where we are taking our honeymoon + . +- - episode_done: false + eval_labels: + - haha its sweet you compromised . have you been together long ? + id: xpersona + reward: 0 + text: yeah , although i'd prefer the beach . the falls are her idea . +- - episode_done: false + eval_labels: + - i get it . . . i grew up an army brat and my family is so disapproving of me + too . + id: xpersona + reward: 0 + text: 7 years . you would think my family would like her by now but they don't + . +num_episodes: 1000 +num_examples: 7316 From da12bc18312ac23b2a50808712d808ba75998a33 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E9=98=BF=E5=BD=AA?= Date: Tue, 18 Jan 2022 20:33:51 +0800 Subject: [PATCH 2/5] =?UTF-8?q?=09=E4=BF=AE=E6=94=B9=EF=BC=9A=20=20=20=20?= =?UTF-8?q?=20parlai/tasks/task=5Flist.py?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- parlai/tasks/task_list.py | 76 +++++---------------------------------- 1 file changed, 9 insertions(+), 67 deletions(-) diff --git a/parlai/tasks/task_list.py b/parlai/tasks/task_list.py index 2081031bbd0..ffc14759eb5 100644 --- a/parlai/tasks/task_list.py +++ b/parlai/tasks/task_list.py @@ -876,18 +876,6 @@ ), "links": {"website": "https://ai.google/tools/datasets/taskmaster-1"}, }, - { - "id": "MSR-E2E", - "display_name": "MSR End-to-End", - "task": "msr_e2e", - "tags": ["ChitChat"], - "description": ( - "MSR-E2E is a dataset of human-human conversations in which one " - "human plays the role of an Agent and the other one plays the role" - "of a User. Data is collected from Amazon Mechanical Turk. " - ), - "links": {"website": "https://github.com/xiul-msr/e2e_dialog_challenge"}, - }, { "id": "Twitter", "display_name": "Twitter", @@ -1175,20 +1163,6 @@ ), "links": {"arXiv": "https://arxiv.org/abs/1908.06083"}, }, - { - "id": "MultiDoGo", - "display_name": "MultiDoGo", - "task": "multidogo", - "tags": ["TOD"], - "description": ( - "MultiDoGo is a large task-oriented dataset from Amazon collected " - "in a Wizard of Oz fashion, using both crowd and expert annotators " - "with annotations at varying levels of granularity." - ), - "links": { - "website": "https://github.com/awslabs/multi-domain-goal-oriented-dialogues-dataset" - }, - }, { "id": "MultiWOZv2.0", "display_name": "MultiWOZ 2.0", @@ -1211,19 +1185,6 @@ ), "links": {"website": "http://dialogue.mi.eng.cam.ac.uk/index.php/corpus/"}, }, - { - "id": "MultiWOZv2.2", - "display_name": "MultiWOZ 2.2", - "task": "multiwoz_v22", - "tags": ["Goal"], - "description": ( - "A fully labeled collection of human-written conversations spanning" - "over multiple domains and topics. Schemas are included." - ), - "links": { - "website": "https://github.com/budzianowski/multiwoz/tree/master/data/MultiWOZ_2.2" - }, - }, { "id": "SelfChat", "display_name": "SelfChat", @@ -1393,17 +1354,6 @@ "human and a virtual assistant." ), }, - { - "id": "GoogleSGDSimulationSplits", - "display_name": "GoogleSGD Simulation Splits", - "task": "google_sgd_simulation_splits", - "tags": ["Goal"], - "description": ( - "Custom processing of the Google SGD dataset into In-Domain and " - "Out-of-Domain splits for the use of zero and few-shotting with " - "other task-oriented data." - ), - }, { "id": "TaskMaster2", "display_name": "TaskMaster2", @@ -1414,15 +1364,6 @@ "for task oriented dialogue in 7 domains." ), }, - { - "id": "TaskMaster3", - "display_name": "TicketTalk (Taskmaster3)", - "task": "taskmaster3", - "tags": ["Goal"], - "description": ( - "Taskmaster3 is a dataset of movie ticket dialogues collected in a self-chat manner. To induce conversational variety, crowd workers were asked to generate conversations given dozens of different instructions of different level of specificity, some purposefully including conversational errors." - ), - }, { "id": "GenderationBiasControlTask", "display_name": "GenderationBiasControlTask", @@ -1525,15 +1466,16 @@ }, }, { - "id": "SaFeRDialogues", - "display_name": "SaFeRDialogues", - "task": "saferdialogues", - "tags": [], + "id": "XPersona", + "display_name": "XPersona", + "task": "xpersona", + "tags": ["ChitChat", "Multilingual"], "description": ( - "A dataset of 8k dialogues demonstrating safety failures, feedback " - "signaling them, and a response acknowledging the feedback. " - "Dataset has been released under the CC BY-NC license." + "XPersona is an extension of ConvAI2 with six more languages: Chinese, French, Indonesian, Italian, Korean, and Japanese." ), - "links": {"arXiv": "https://arxiv.org/abs/2110.07518"}, + "links": { + "arXiv": "https://arxiv.org/pdf/2003.07568.pdf", + "website": "https://github.com/HLTCHKUST/Xpersona", + }, }, ] From c296ad408c1d53683ae0fdace517db959211b9fd Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E9=98=BF=E5=BD=AA?= Date: Tue, 18 Jan 2022 20:46:18 +0800 Subject: [PATCH 3/5] =?UTF-8?q?=09=E4=BF=AE=E6=94=B9=EF=BC=9A=20=20=20=20?= =?UTF-8?q?=20parlai/tasks/task=5Flist.py?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- parlai/tasks/task_list.py | 71 +++++++++++++++++++++++++++++++++++++++ 1 file changed, 71 insertions(+) diff --git a/parlai/tasks/task_list.py b/parlai/tasks/task_list.py index ffc14759eb5..0c558c69084 100644 --- a/parlai/tasks/task_list.py +++ b/parlai/tasks/task_list.py @@ -876,6 +876,18 @@ ), "links": {"website": "https://ai.google/tools/datasets/taskmaster-1"}, }, + { + "id": "MSR-E2E", + "display_name": "MSR End-to-End", + "task": "msr_e2e", + "tags": ["ChitChat"], + "description": ( + "MSR-E2E is a dataset of human-human conversations in which one " + "human plays the role of an Agent and the other one plays the role" + "of a User. Data is collected from Amazon Mechanical Turk. " + ), + "links": {"website": "https://github.com/xiul-msr/e2e_dialog_challenge"}, + }, { "id": "Twitter", "display_name": "Twitter", @@ -1163,6 +1175,20 @@ ), "links": {"arXiv": "https://arxiv.org/abs/1908.06083"}, }, + { + "id": "MultiDoGo", + "display_name": "MultiDoGo", + "task": "multidogo", + "tags": ["TOD"], + "description": ( + "MultiDoGo is a large task-oriented dataset from Amazon collected " + "in a Wizard of Oz fashion, using both crowd and expert annotators " + "with annotations at varying levels of granularity." + ), + "links": { + "website": "https://github.com/awslabs/multi-domain-goal-oriented-dialogues-dataset" + }, + }, { "id": "MultiWOZv2.0", "display_name": "MultiWOZ 2.0", @@ -1185,6 +1211,19 @@ ), "links": {"website": "http://dialogue.mi.eng.cam.ac.uk/index.php/corpus/"}, }, + { + "id": "MultiWOZv2.2", + "display_name": "MultiWOZ 2.2", + "task": "multiwoz_v22", + "tags": ["Goal"], + "description": ( + "A fully labeled collection of human-written conversations spanning" + "over multiple domains and topics. Schemas are included." + ), + "links": { + "website": "https://github.com/budzianowski/multiwoz/tree/master/data/MultiWOZ_2.2" + }, + }, { "id": "SelfChat", "display_name": "SelfChat", @@ -1354,6 +1393,17 @@ "human and a virtual assistant." ), }, + { + "id": "GoogleSGDSimulationSplits", + "display_name": "GoogleSGD Simulation Splits", + "task": "google_sgd_simulation_splits", + "tags": ["Goal"], + "description": ( + "Custom processing of the Google SGD dataset into In-Domain and " + "Out-of-Domain splits for the use of zero and few-shotting with " + "other task-oriented data." + ), + }, { "id": "TaskMaster2", "display_name": "TaskMaster2", @@ -1364,6 +1414,15 @@ "for task oriented dialogue in 7 domains." ), }, + { + "id": "TaskMaster3", + "display_name": "TicketTalk (Taskmaster3)", + "task": "taskmaster3", + "tags": ["Goal"], + "description": ( + "Taskmaster3 is a dataset of movie ticket dialogues collected in a self-chat manner. To induce conversational variety, crowd workers were asked to generate conversations given dozens of different instructions of different level of specificity, some purposefully including conversational errors." + ), + }, { "id": "GenderationBiasControlTask", "display_name": "GenderationBiasControlTask", @@ -1465,6 +1524,18 @@ "website": "https://github.com/kushalchawla/CaSiNo", }, }, + { + "id": "SaFeRDialogues", + "display_name": "SaFeRDialogues", + "task": "saferdialogues", + "tags": [], + "description": ( + "A dataset of 8k dialogues demonstrating safety failures, feedback " + "signaling them, and a response acknowledging the feedback. " + "Dataset has been released under the CC BY-NC license." + ), + "links": {"arXiv": "https://arxiv.org/abs/2110.07518"}, + }, { "id": "XPersona", "display_name": "XPersona", From 89d0b0ae8a5f175b0b6bcb9bcea25e22aa5b37f3 Mon Sep 17 00:00:00 2001 From: Zheng0428 Date: Wed, 19 Jan 2022 11:22:37 +0800 Subject: [PATCH 4/5] =?UTF-8?q?=09=E4=BF=AE=E6=94=B9=EF=BC=9A=20=20=20=20?= =?UTF-8?q?=20parlai/tasks/task=5Flist.py?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- parlai/tasks/task_list.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/parlai/tasks/task_list.py b/parlai/tasks/task_list.py index 0c558c69084..ca876f4409f 100644 --- a/parlai/tasks/task_list.py +++ b/parlai/tasks/task_list.py @@ -1540,7 +1540,7 @@ "id": "XPersona", "display_name": "XPersona", "task": "xpersona", - "tags": ["ChitChat", "Multilingual"], + "tags": ["ChitChat"], "description": ( "XPersona is an extension of ConvAI2 with six more languages: Chinese, French, Indonesian, Italian, Korean, and Japanese." ), From 6c681eabfc8893caca76edc7cde5a6b072665752 Mon Sep 17 00:00:00 2001 From: Stephen Roller Date: Thu, 20 Jan 2022 00:45:01 -0500 Subject: [PATCH 5/5] Update parlai/tasks/xpersona/build.py --- parlai/tasks/xpersona/build.py | 9 +-------- 1 file changed, 1 insertion(+), 8 deletions(-) diff --git a/parlai/tasks/xpersona/build.py b/parlai/tasks/xpersona/build.py index 8050106ad50..c8cf57a0f09 100644 --- a/parlai/tasks/xpersona/build.py +++ b/parlai/tasks/xpersona/build.py @@ -189,12 +189,5 @@ def _create_parlai_format(dpath: str): f_write.write(str(line_num) + ' your persona:' + persona + '\n') for utterance_A, utterance_B in dialogs: line_num += 1 - f_write.write( - str(line_num) - + ' ' - + utterance_A - + '\t' - + utterance_B - + '\n' - ) + f_write.write(f"{line_num} {utterance_A}\t{utterance_B}\n") os.remove(load_path)