{ "sentinel_tokenizer": { "vocab_size": 61440, "text_vocab": 32768, "image_codebook": 16384, "audio_codebook": 8192, "video_codebook": 4096, "metrics": { "avg_fertility": 9.13065205232572, "std_fertility": 16.348063069521316, "avg_compression": 3.5456289797801976, "fairness": 0.057643322830483165 } }, "comparisons": { "GPT-2 (50K)": { "avg_fertility": 20.85785254531753, "std_fertility": 40.76486672709434, "avg_compression": 2.4054180948259107, "fairness": 0.023943569760064974 }, "Gemma (256K)": { "avg_fertility": 6.688784516655667, "std_fertility": 11.713991856851852, "avg_compression": 4.660773272747129, "fairness": 0.07865350326310598 }, "Qwen2 (151K)": { "avg_fertility": 8.030528860080679, "std_fertility": 13.75415784885323, "avg_compression": 3.8169528301673328, "fairness": 0.06777750450038225 }, "Sentinel-SUT": { "avg_fertility": 9.13065205232572, "std_fertility": 16.348063069521316, "avg_compression": 3.5456289797801976, "fairness": 0.057643322830483165 } }, "sentinel_constants": { "INV_E": 0.36787944117144233, "C1": -0.007994021805952546, "C2": 0.00020005604296784437 }, "training_data": { "languages": [ "en", "fr", "de", "es", "zh", "ja", "ar", "ru", "ko", "hi", "pt", "it", "nl", "pl", "vi", "th", "tr", "he", "uk", "sv" ], "total_samples": 52000 } }