{ "artifacts": { "config_json": "/__modal/volumes/vo-XIgHS4JYPE8ddRlAcjQTwm/matex-privacy-sentinel-v0.15/config.json", "model_safetensors": "/__modal/volumes/vo-XIgHS4JYPE8ddRlAcjQTwm/matex-privacy-sentinel-v0.15/model.safetensors", "summary_json": "/__modal/volumes/vo-XIgHS4JYPE8ddRlAcjQTwm/matex-privacy-sentinel-v0.15/finetune_summary.json" }, "base_checkpoint": "/root/.opf/privacy_filter", "batch_size": 4, "best_epoch": 3, "best_metric": 0.1024377345965187, "best_metric_name": "validation_loss", "checkpoint_category_version": "v2", "device": "cuda", "elapsed_s": 1389.140961668, "encoding": "o200k_base", "epoch_metrics": [ { "elapsed_s": 236.30141436400004, "epoch": 1, "optimizer_steps": 4838, "train_batches": 4838, "train_loss": 0.4224884525690041, "train_token_accuracy": 0.8979510164879142, "train_tokens": 2511294, "validation_batches": 269, "validation_loss": 0.14451168486060656, "validation_token_accuracy": 0.963510242154591, "validation_tokens": 135079 }, { "elapsed_s": 231.365270813, "epoch": 2, "optimizer_steps": 4838, "train_batches": 4838, "train_loss": 0.1340547019875811, "train_token_accuracy": 0.9689526594655982, "train_tokens": 2511294, "validation_batches": 269, "validation_loss": 0.10732391039130999, "validation_token_accuracy": 0.9706097913073091, "validation_tokens": 135079 }, { "elapsed_s": 233.10564159199998, "epoch": 3, "optimizer_steps": 4838, "train_batches": 4838, "train_loss": 0.09496889466764975, "train_token_accuracy": 0.9774387228257624, "train_tokens": 2511294, "validation_batches": 269, "validation_loss": 0.1024377345965187, "validation_token_accuracy": 0.9753921779107041, "validation_tokens": 135079 }, { "elapsed_s": 227.36588568000002, "epoch": 4, "optimizer_steps": 4838, "train_batches": 4838, "train_loss": 0.07451669528509243, "train_token_accuracy": 0.982364868470199, "train_tokens": 2511294, "validation_batches": 269, "validation_loss": 0.10625521156434652, "validation_token_accuracy": 0.9763101592401484, "validation_tokens": 135079 }, { "elapsed_s": 226.71261706799987, "epoch": 5, "optimizer_steps": 4838, "train_batches": 4838, "train_loss": 0.05886880379947683, "train_token_accuracy": 0.9861358327619147, "train_tokens": 2511294, "validation_batches": 269, "validation_loss": 0.1118486727110866, "validation_token_accuracy": 0.9772059313438802, "validation_tokens": 135079 }, { "elapsed_s": 226.514154576, "epoch": 6, "optimizer_steps": 4838, "train_batches": 4838, "train_loss": 0.04627119501343269, "train_token_accuracy": 0.9890052697931824, "train_tokens": 2511294, "validation_batches": 269, "validation_loss": 0.12361862301164639, "validation_token_accuracy": 0.9769542267858068, "validation_tokens": 135079 } ], "epochs": 6, "generated_at_unix": 1777769967.2668755, "grad_accum_steps": 1, "label_space_json_path": "/__modal/volumes/vo-1GyZvIAPD7wnYD3s0C2QXS/dataset/configs/custom_label_space.json", "label_space_source": "label-space-json", "learning_rate": 1e-05, "max_grad_norm": 1.0, "num_output_labels": 97, "num_train_examples": 19350, "num_train_windows": 19350, "num_validation_examples": 1075, "num_validation_windows": 1075, "output_checkpoint_dir": "/__modal/volumes/vo-XIgHS4JYPE8ddRlAcjQTwm/matex-privacy-sentinel-v0.15", "output_head_reinitialized": true, "output_head_rows_copied": 97, "output_head_rows_copied_exact": 33, "output_head_rows_copied_fallback": 64, "resolved_category_version": "matex_privacy_sentinel_v0_1", "resolved_n_ctx": 128000, "schema_version": 1, "serialized_param_dtype": "bfloat16", "span_class_names": [ "O", "account_number", "private_address", "private_email", "private_person", "private_phone", "private_url", "private_date", "secret", "api_key", "auth_token", "session_cookie", "database_uri", "cloud_credential", "private_file_path", "internal_url", "workspace_identity", "customer_data", "prompt_sensitive", "agent_memory_sensitive", "stacktrace_sensitive", "repo_secret", "payment_token", "personal_document_id", "terminal_log" ], "train_dataset": "/data/dataset/compiled/train.jsonl", "train_dataset_variant": "full", "validation_dataset": "/data/dataset/compiled/validation.jsonl", "validation_dataset_variant": "full", "validation_split": null, "weight_decay": 0.01 }