Answer the question above to unlock this code
import json
# Demo script: builds a tiny in-memory chat fine-tuning dataset, prints the
# first example message by message, and prints a summary of the split sizes.
#
# NOTE(review): the emoji in the string literals below were reconstructed from
# mis-decoded bytes (the original text was UTF-8 read as a single-byte
# encoding, which also split one print statement across two lines).
# The check mark, robot and bust glyphs follow from the surviving bytes; the
# others are best guesses — confirm against the original notebook.
print("📚 Loading and validating training data...")

# Define data files
training_file = "data/basic_sft_training.jsonl"
validation_file = "data/basic_sft_validation.jsonl"

# Simulate loading training data: the examples are defined inline, the two
# paths above are not opened anywhere in this script.
training_dataset = [
    {
        "messages": [
            {"role": "system", "content": "You are a helpful assistant for Zava Corp."},
            {"role": "user", "content": "What are your business hours?"},
            {"role": "assistant", "content": "Zava Corp is open Monday-Friday 9AM-6PM EST."},
        ],
    },
    {
        "messages": [
            {"role": "user", "content": "How can I contact support?"},
            {"role": "assistant", "content": "You can reach Zava support at support@zava.com or call 1-800-ZAVA-HELP."},
        ],
    },
]

# Size of the validation split. It is a fixed number because no validation
# examples are materialised here; naming it once keeps the "Validation" and
# "Total" summary lines in agreement.
validation_example_count = 25

print(f"✅ Training set loaded: {len(training_dataset)} examples")

# Role -> display glyph. Built once, outside the loop, because it does not
# depend on the message being printed.
role_emoji = {"system": "🤖", "user": "👤", "assistant": "🔮"}

print("\n📝 First training example:")
for message in training_dataset[0]["messages"]:
    # Roles missing from the table fall back to a generic speech-bubble glyph.
    emoji = role_emoji.get(message["role"], "💬")
    print(f" {emoji} {message['role'].upper()}: {message['content']}")

print("\n📊 Data Summary:")
print(f" Training examples: {len(training_dataset)}")
print(f" Validation examples: {validation_example_count}")
print(f" Total examples: {len(training_dataset) + validation_example_count}")
📚 Loading and validating training data...
✅ Training set loaded: 2 examples
📝 First training example:
🤖 SYSTEM: You are a helpful assistant for Zava Corp.
👤 USER: What are your business hours?
🔮 ASSISTANT: Zava Corp is open Monday-Friday 9AM-6PM EST.
📊 Data Summary:
Training examples: 2
Validation examples: 25
Total examples: 27