diff --git a/model-customization/data-processing/seed-data-for-knowledge/utils/create_seed_dataset.py b/model-customization/data-processing/seed-data-for-knowledge/utils/create_seed_dataset.py index f049c86..af6980a 100644 --- a/model-customization/data-processing/seed-data-for-knowledge/utils/create_seed_dataset.py +++ b/model-customization/data-processing/seed-data-for-knowledge/utils/create_seed_dataset.py @@ -155,7 +155,7 @@ def truncate_chunk(chunk: str): for c in chunked_document_all_icl: if get_token_count(c["document"], tokenizer) > max_token_count: - raise ValueError(f"Chunk \"{truncate_chunk(c["document"])}\" exceeds token count of {max_token_count}") + raise ValueError(f"Chunk \"{truncate_chunk(c['document'])}\" exceeds token count of {max_token_count}") df = chunked_document_all_icl.to_pandas() diff --git a/model-customization/data-processing/seed-data-for-knowledge/utils/qna_gen.py b/model-customization/data-processing/seed-data-for-knowledge/utils/qna_gen.py index 5fb3384..eae8b2c 100644 --- a/model-customization/data-processing/seed-data-for-knowledge/utils/qna_gen.py +++ b/model-customization/data-processing/seed-data-for-knowledge/utils/qna_gen.py @@ -271,7 +271,7 @@ def view_seed_example(qna_output_path: Path, seed_example_num: int) -> None: raise ValueError(f"seed_example_num must be less than number of seed examples {len(seed_examples)}") seed_example = seed_examples[seed_example_num] print("Context:") - print(f"{seed_example["context"]}\n") + print(f"{seed_example['context']}\n") for qna in seed_example["questions_and_answers"]: - print(f"Question: {qna["question"]}") - print(f"Answer: {qna["answer"]}\n") + print(f"Question: {qna['question']}") + print(f"Answer: {qna['answer']}\n") diff --git a/quick-starts/instructlab-knowledge/utils/create_seed_dataset.py b/quick-starts/instructlab-knowledge/utils/create_seed_dataset.py index f049c86..af6980a 100644 --- a/quick-starts/instructlab-knowledge/utils/create_seed_dataset.py +++ b/quick-starts/instructlab-knowledge/utils/create_seed_dataset.py @@ -155,7 +155,7 @@ def truncate_chunk(chunk: str): for c in chunked_document_all_icl: if get_token_count(c["document"], tokenizer) > max_token_count: - raise ValueError(f"Chunk \"{truncate_chunk(c["document"])}\" exceeds token count of {max_token_count}") + raise ValueError(f"Chunk \"{truncate_chunk(c['document'])}\" exceeds token count of {max_token_count}") df = chunked_document_all_icl.to_pandas() diff --git a/quick-starts/instructlab-knowledge/utils/qna_gen.py b/quick-starts/instructlab-knowledge/utils/qna_gen.py index a112d5e..af5a86e 100644 --- a/quick-starts/instructlab-knowledge/utils/qna_gen.py +++ b/quick-starts/instructlab-knowledge/utils/qna_gen.py @@ -271,7 +271,7 @@ def view_seed_example(qna_output_path: Path, seed_example_num: int) -> None: raise ValueError(f"seed_example_num must be less than number of seed examples {len(seed_examples)}") seed_example = seed_examples[seed_example_num] print("Context:") - print(f"{seed_example["context"]}\n") + print(f"{seed_example['context']}\n") for qna in seed_example["questions_and_answers"]: - print(f"Question: {qna["question"]}") - print(f"Answer: {qna["answer"]}\n") + print(f"Question: {qna['question']}") + print(f"Answer: {qna['answer']}\n")