From c266f55b884fda1bba9d26d82eac43e19abd79d6 Mon Sep 17 00:00:00 2001 From: Preston Rasmussen <109292228+prasmussen15@users.noreply.github.com> Date: Wed, 6 Nov 2024 11:00:06 -0500 Subject: [PATCH] Update MSC dataset (#208) jsonl --- .../parse_msc_messages.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/examples/multi_session_conversation_memory/parse_msc_messages.py b/examples/multi_session_conversation_memory/parse_msc_messages.py index d69879bb..4c5bd219 100644 --- a/examples/multi_session_conversation_memory/parse_msc_messages.py +++ b/examples/multi_session_conversation_memory/parse_msc_messages.py @@ -31,8 +31,8 @@ def parse_msc_messages() -> list[list[ParsedMscMessage]]: msc_messages: list[list[ParsedMscMessage]] = [] speakers = ['Alice', 'Bob'] - with open('../data/msc.json') as file: - data = json.load(file)['data'] + with open('../data/msc.jsonl') as file: + data = [json.loads(line) for line in file] for i, conversation in enumerate(data): messages: list[ParsedMscMessage] = [] for previous_dialog in conversation['previous_dialogs']: @@ -73,8 +73,8 @@ def parse_msc_messages() -> list[list[ParsedMscMessage]]: def conversation_q_and_a() -> list[tuple[str, str]]: - with open('../data/msc.json') as file: - data = json.load(file)['data'] + with open('../data/msc.jsonl') as file: + data = [json.loads(line) for line in file] qa: list[tuple[str, str]] = [] for conversation in data: