import json
import math
import random


def load_email_data(spam_path, ham_path):
    """Load two JSON files and return their contents concatenated.

    Both files are opened as UTF-8 text and parsed with ``json.load``.
    The result is ``spam_data + ham_data``, so the spam entries come first.

    NOTE(review): the concatenation presumably expects each file to hold a
    top-level JSON array -- confirm against the data files.

    Args:
        spam_path: Path of the JSON file holding the spam entries.
        ham_path: Path of the JSON file holding the ham entries.

    Returns:
        The parsed spam data followed by the parsed ham data.
    """
    with open(spam_path, encoding="utf-8") as spam_file, \
            open(ham_path, encoding="utf-8") as ham_file:
        spam_data = json.load(spam_file)
        ham_data = json.load(ham_file)
    return spam_data + ham_data


def train_test_split(data, test_ratio: float = 0.2):
    """Randomly split *data* into a training part and a test part.

    The items are shuffled with the module-level ``random`` generator, so
    seeding ``random`` beforehand makes the split reproducible. The input
    sequence itself is left untouched; the shuffle is done on a copy.

    Args:
        data: Sequence of items to split.
        test_ratio: Fraction of the items to put in the test part; must lie
            in the closed interval [0, 1].

    Returns:
        A ``(train, test)`` tuple of lists. ``train`` holds the first
        ``int(len(data) * (1 - test_ratio))`` shuffled items and ``test``
        holds the rest.

    Raises:
        ValueError: If *test_ratio* is outside [0, 1].
    """
    if not 0 <= test_ratio <= 1:
        raise ValueError(
            f"test_ratio must be between 0 and 1, got {test_ratio!r}"
        )

    # Shuffle a copy so the caller's list keeps its original order.
    shuffled = list(data)
    random.shuffle(shuffled)

    cut = int(len(shuffled) * (1 - test_ratio))
    return shuffled[:cut], shuffled[cut:]