| { |
| "case_count": 4, |
| "dataset": "data/learned_candidate_model_stress.jsonl", |
| "metrics": { |
| "abstention_accuracy": 1.0, |
| "accepted_candidate_support_rate": 1.0, |
| "bad_candidate_rejection_rate": 1.0, |
| "candidate_graph_contamination_count": 0, |
| "candidate_ranking_accuracy": 1.0, |
| "channel_activation_accuracy": 0.9886, |
| "deeper_chain_success_rate": 1.0, |
| "distractor_robustness": 1.0, |
| "resolver_prediction_accuracy": 1.0, |
| "trace_schema_validity": 1.0, |
| "verifier_beats_model_confidence_rate": 1.0 |
| }, |
| "results": [ |
| { |
| "abstention_checks": [], |
| "accepted_support_checks": [ |
| true |
| ], |
| "bad_rejection_checks": [ |
| true, |
| true |
| ], |
| "candidate_graph_contamination_count": 0, |
| "candidate_ranking_correct": true, |
| "case_id": "stress_high_confidence_wrong", |
| "channel_activation_checks": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true |
| ], |
| "deeper_chain_checks": [ |
| true |
| ], |
| "is_distractor": false, |
| "resolver_prediction_checks": [ |
| true, |
| true, |
| true |
| ], |
| "scored_candidates": [ |
| { |
| "candidate_id": "valid_m_p", |
| "claim": "All M are P", |
| "confidence": 0.42, |
| "features": { |
| "accepted_relation_candidate": 1.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.42, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 1.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 3.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 3.0, |
| "transitive_support": 1.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "logic_transitivity" |
| ], |
| "model_confidence": 0.7622, |
| "ranking_score": 1.1648, |
| "resolver": "accept_transitive", |
| "status": "accepted" |
| }, |
| "raw_output": "All M are P", |
| "source": "learned_candidate_dataset" |
| }, |
| { |
| "candidate_id": "bad_identity_m_p", |
| "claim": "M equals P", |
| "confidence": 0.98, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.98, |
| "candidate_quantifier_all": 0.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 1.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 1.0, |
| "identity_path_exists": 1.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 0.0, |
| "premise_count": 3.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 0.0, |
| "transitive_support": 0.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "identity_preservation" |
| ], |
| "model_confidence": 0.0475, |
| "ranking_score": -2.9988, |
| "resolver": "reject_identity", |
| "status": "rejected" |
| }, |
| "raw_output": "M equals P", |
| "source": "learned_candidate_dataset" |
| }, |
| { |
| "candidate_id": "bad_reverse_p_m", |
| "claim": "All P are M", |
| "confidence": 0.99, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.99, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 1.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 3.0, |
| "reverse_path": 1.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 0.0, |
| "transitive_support": 0.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "directionality" |
| ], |
| "model_confidence": 0.0171, |
| "ranking_score": -4.0544, |
| "resolver": "reject_reverse", |
| "status": "rejected" |
| }, |
| "raw_output": "All P are M", |
| "source": "learned_candidate_dataset" |
| } |
| ], |
| "tags": [ |
| "deeper_chain", |
| "high_confidence_wrong" |
| ], |
| "top_candidate_id": "valid_m_p", |
| "trace_schema_valid": true, |
| "verification": { |
| "abstained": [], |
| "accepted": [ |
| "All M are P" |
| ], |
| "candidate_results": [ |
| { |
| "candidate_id": "valid_m_p", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "M!=P" |
| ], |
| "status": "resolved", |
| "target": "M!=P", |
| "tension_delta": -1.0 |
| }, |
| "protects_against": "relation_identity_collapse" |
| }, |
| "evidence": [ |
| "('M', 'P')" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "preserved_distinct_nodes" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P", |
| "M->N->P" |
| ], |
| "status": "resolved", |
| "target": "M->O, N->P, M->P", |
| "tension_delta": -3.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 6 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "logic_transitivity": "accepted inferred edge" |
| }, |
| "claim": "All M are P", |
| "confidence": 0.7622, |
| "provenance": { |
| "candidate_id": "valid_m_p", |
| "confidence": 0.7622, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.42, |
| "model_prediction": { |
| "channels": [ |
| "logic_transitivity" |
| ], |
| "model_confidence": 0.7622, |
| "ranking_score": 1.1648, |
| "resolver": "accept_transitive", |
| "status": "accepted" |
| } |
| }, |
| "raw_output": "All M are P", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate is supported by a typed transitive inference", |
| "source": "learned_candidate_model", |
| "status": "accepted", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [ |
| "M!=P" |
| ], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "M->N:all": "premise", |
| "M->O:all": "inferred", |
| "M->P:all": "inferred", |
| "N->O:all": "premise", |
| "N->P:all": "inferred", |
| "O->P:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P", |
| "M->N->P" |
| ], |
| "status": "resolved", |
| "target": "M->O, N->P, M->P", |
| "tension_delta": -3.0 |
| }, |
| { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "M!=P" |
| ], |
| "status": "resolved", |
| "target": "M!=P", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 6 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| }, |
| { |
| "candidate_id": "bad_identity_m_p", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "M!=P" |
| ], |
| "status": "resolved", |
| "target": "M!=P", |
| "tension_delta": -1.0 |
| }, |
| "protects_against": "relation_identity_collapse" |
| }, |
| "evidence": [ |
| "('M', 'P')" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "preserved_distinct_nodes" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P", |
| "M->N->P" |
| ], |
| "status": "resolved", |
| "target": "M->O, N->P, M->P", |
| "tension_delta": -3.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 6 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "identity_preservation": "blocked identity collapse" |
| }, |
| "claim": "M equals P", |
| "confidence": 0.0475, |
| "provenance": { |
| "candidate_id": "bad_identity_m_p", |
| "confidence": 0.0475, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.98, |
| "model_prediction": { |
| "channels": [ |
| "identity_preservation" |
| ], |
| "model_confidence": 0.0475, |
| "ranking_score": -2.9988, |
| "resolver": "reject_identity", |
| "status": "rejected" |
| } |
| }, |
| "raw_output": "M equals P", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate collapses distinct graph nodes", |
| "source": "learned_candidate_model", |
| "status": "rejected", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [ |
| "M!=P" |
| ], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "M->N:all": "premise", |
| "M->O:all": "inferred", |
| "M->P:all": "inferred", |
| "N->O:all": "premise", |
| "N->P:all": "inferred", |
| "O->P:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P", |
| "M->N->P" |
| ], |
| "status": "resolved", |
| "target": "M->O, N->P, M->P", |
| "tension_delta": -3.0 |
| }, |
| { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "M!=P" |
| ], |
| "status": "resolved", |
| "target": "M!=P", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 6 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| }, |
| { |
| "candidate_id": "bad_reverse_p_m", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "blocked_reverse_inference", |
| "channel": "directionality", |
| "details": {}, |
| "evidence": [ |
| "P->M" |
| ], |
| "status": "resolved", |
| "target": "P->M", |
| "tension_delta": -1.0 |
| }, |
| "protects_against": "converse_fallacy" |
| }, |
| "evidence": [ |
| "P->M" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "blocked_reverse_inference" |
| }, |
| "identity_preservation": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P", |
| "M->N->P" |
| ], |
| "status": "resolved", |
| "target": "M->O, N->P, M->P", |
| "tension_delta": -3.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 6 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "directionality": "blocked reverse inference" |
| }, |
| "claim": "All P are M", |
| "confidence": 0.0171, |
| "provenance": { |
| "candidate_id": "bad_reverse_p_m", |
| "confidence": 0.0171, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.99, |
| "model_prediction": { |
| "channels": [ |
| "directionality" |
| ], |
| "model_confidence": 0.0171, |
| "ranking_score": -4.0544, |
| "resolver": "reject_reverse", |
| "status": "rejected" |
| } |
| }, |
| "raw_output": "All P are M", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate reverses a directed support path", |
| "source": "learned_candidate_model", |
| "status": "rejected", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [ |
| "P->M" |
| ], |
| "blocked_equalities": [], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "M->N:all": "premise", |
| "M->O:all": "inferred", |
| "M->P:all": "inferred", |
| "N->O:all": "premise", |
| "N->P:all": "inferred", |
| "O->P:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "M->N->O", |
| "N->O->P", |
| "M->N->P" |
| ], |
| "status": "resolved", |
| "target": "M->O, N->P, M->P", |
| "tension_delta": -3.0 |
| }, |
| { |
| "action": "blocked_reverse_inference", |
| "channel": "directionality", |
| "details": {}, |
| "evidence": [ |
| "P->M" |
| ], |
| "status": "resolved", |
| "target": "P->M", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 6 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| } |
| ], |
| "channels": { |
| "directionality": "blocked reverse inference", |
| "identity_preservation": "blocked identity collapse", |
| "logic_transitivity": "accepted inferred edge" |
| }, |
| "rejected": [ |
| "M equals P", |
| "All P are M" |
| ] |
| }, |
| "verifier_beats_confidence_checks": [ |
| true, |
| true |
| ] |
| }, |
| { |
| "abstention_checks": [], |
| "accepted_support_checks": [ |
| true |
| ], |
| "bad_rejection_checks": [ |
| true, |
| true |
| ], |
| "candidate_graph_contamination_count": 0, |
| "candidate_ranking_correct": true, |
| "case_id": "stress_malformed_and_contradictory", |
| "channel_activation_checks": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true |
| ], |
| "deeper_chain_checks": [], |
| "is_distractor": false, |
| "resolver_prediction_checks": [ |
| true, |
| true, |
| true |
| ], |
| "scored_candidates": [ |
| { |
| "candidate_id": "valid_cats_animals", |
| "claim": "All cats are animals", |
| "confidence": 0.53, |
| "features": { |
| "accepted_relation_candidate": 1.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.53, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 0.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 2.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 2.0, |
| "transitive_support": 1.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "logic_transitivity" |
| ], |
| "model_confidence": 0.6799, |
| "ranking_score": 0.7532, |
| "resolver": "accept_transitive", |
| "status": "accepted" |
| }, |
| "raw_output": "All cats are animals", |
| "source": "learned_candidate_dataset" |
| }, |
| { |
| "candidate_id": "bad_no_cats_animals", |
| "claim": "No cats are animals", |
| "confidence": 0.9, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.9, |
| "candidate_quantifier_all": 0.0, |
| "candidate_quantifier_no": 1.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 0.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 1.0, |
| "parseable_relation": 1.0, |
| "premise_count": 2.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 2.0, |
| "transitive_support": 1.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "contradiction" |
| ], |
| "model_confidence": 0.2986, |
| "ranking_score": -0.854, |
| "resolver": "reject_contradiction", |
| "status": "rejected" |
| }, |
| "raw_output": "No cats are animals", |
| "source": "learned_candidate_dataset" |
| }, |
| { |
| "candidate_id": "malformed_cats", |
| "claim": "cats somehow animalish", |
| "confidence": 0.88, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.88, |
| "candidate_quantifier_all": 0.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 0.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 1.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 0.0, |
| "premise_count": 2.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 0.0, |
| "transitive_support": 0.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "malformed_relation" |
| ], |
| "model_confidence": 0.096, |
| "ranking_score": -2.2428, |
| "resolver": "reject_malformed", |
| "status": "rejected" |
| }, |
| "raw_output": "cats somehow animalish", |
| "source": "learned_candidate_dataset" |
| } |
| ], |
| "tags": [ |
| "malformed", |
| "contradiction", |
| "high_confidence_wrong" |
| ], |
| "top_candidate_id": "valid_cats_animals", |
| "trace_schema_valid": true, |
| "verification": { |
| "abstained": [], |
| "accepted": [ |
| "All cats are animals" |
| ], |
| "candidate_results": [ |
| { |
| "candidate_id": "valid_cats_animals", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "cats!=animals" |
| ], |
| "status": "resolved", |
| "target": "cats!=animals", |
| "tension_delta": -1.0 |
| }, |
| "protects_against": "relation_identity_collapse" |
| }, |
| "evidence": [ |
| "('cats', 'animals')" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "preserved_distinct_nodes" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "cats->mammals->animals" |
| ], |
| "status": "resolved", |
| "target": "cats->animals", |
| "tension_delta": -1.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "cats->mammals->animals" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "logic_transitivity": "accepted inferred edge" |
| }, |
| "claim": "All cats are animals", |
| "confidence": 0.6799, |
| "provenance": { |
| "candidate_id": "valid_cats_animals", |
| "confidence": 0.6799, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.53, |
| "model_prediction": { |
| "channels": [ |
| "logic_transitivity" |
| ], |
| "model_confidence": 0.6799, |
| "ranking_score": 0.7532, |
| "resolver": "accept_transitive", |
| "status": "accepted" |
| } |
| }, |
| "raw_output": "All cats are animals", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate is supported by a typed transitive inference", |
| "source": "learned_candidate_model", |
| "status": "accepted", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [ |
| "cats!=animals" |
| ], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "cats->animals:all": "inferred", |
| "cats->mammals:all": "premise", |
| "mammals->animals:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "cats->mammals->animals" |
| ], |
| "status": "resolved", |
| "target": "cats->animals", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "cats!=animals" |
| ], |
| "status": "resolved", |
| "target": "cats!=animals", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| }, |
| { |
| "candidate_id": "bad_no_cats_animals", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "cats!=animals" |
| ], |
| "status": "resolved", |
| "target": "cats!=animals", |
| "tension_delta": -1.0 |
| }, |
| "protects_against": "relation_identity_collapse" |
| }, |
| "evidence": [ |
| "('cats', 'animals')" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "preserved_distinct_nodes" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "cats->mammals->animals" |
| ], |
| "status": "resolved", |
| "target": "cats->animals", |
| "tension_delta": -1.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "cats->mammals->animals" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "contradiction": "rejected candidate contradicts premise edge" |
| }, |
| "claim": "No cats are animals", |
| "confidence": 0.2986, |
| "provenance": { |
| "candidate_id": "bad_no_cats_animals", |
| "confidence": 0.2986, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.9, |
| "model_prediction": { |
| "channels": [ |
| "contradiction" |
| ], |
| "model_confidence": 0.2986, |
| "ranking_score": -0.854, |
| "resolver": "reject_contradiction", |
| "status": "rejected" |
| } |
| }, |
| "raw_output": "No cats are animals", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate contradicts a premise-supported edge", |
| "source": "learned_candidate_model", |
| "status": "rejected", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [ |
| "cats!=animals" |
| ], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "cats->animals:all": "inferred", |
| "cats->mammals:all": "premise", |
| "mammals->animals:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "cats->mammals->animals" |
| ], |
| "status": "resolved", |
| "target": "cats->animals", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "cats!=animals" |
| ], |
| "status": "resolved", |
| "target": "cats!=animals", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| }, |
| { |
| "candidate_id": "malformed_cats", |
| "channel_trace": {}, |
| "channels": { |
| "malformed_relation": "rejected unparsable graph claim" |
| }, |
| "claim": "cats somehow animalish", |
| "confidence": 0.096, |
| "provenance": { |
| "candidate_id": "malformed_cats", |
| "confidence": 0.096, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.88, |
| "model_prediction": { |
| "channels": [ |
| "malformed_relation" |
| ], |
| "model_confidence": 0.096, |
| "ranking_score": -2.2428, |
| "resolver": "reject_malformed", |
| "status": "rejected" |
| } |
| }, |
| "raw_output": "cats somehow animalish", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate claim could not be parsed as a graph relation", |
| "source": "learned_candidate_model", |
| "status": "rejected", |
| "typed_runtime": { |
| "available": false, |
| "settled": false |
| } |
| } |
| ], |
| "channels": { |
| "contradiction": "rejected candidate contradicts premise edge", |
| "logic_transitivity": "accepted inferred edge", |
| "malformed_relation": "rejected unparsable graph claim" |
| }, |
| "rejected": [ |
| "No cats are animals", |
| "cats somehow animalish" |
| ] |
| }, |
| "verifier_beats_confidence_checks": [ |
| true, |
| true |
| ] |
| }, |
| { |
| "abstention_checks": [ |
| true |
| ], |
| "accepted_support_checks": [ |
| true |
| ], |
| "bad_rejection_checks": [ |
| true |
| ], |
| "candidate_graph_contamination_count": 0, |
| "candidate_ranking_correct": true, |
| "case_id": "stress_distractor_chain", |
| "channel_activation_checks": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true |
| ], |
| "deeper_chain_checks": [ |
| true |
| ], |
| "is_distractor": true, |
| "resolver_prediction_checks": [ |
| true, |
| true, |
| true |
| ], |
| "scored_candidates": [ |
| { |
| "candidate_id": "valid_a_d_with_distractor", |
| "claim": "All A are D", |
| "confidence": 0.49, |
| "features": { |
| "accepted_relation_candidate": 1.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.49, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 1.0, |
| "direct_support": 0.0, |
| "has_distractor": 1.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 5.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 3.0, |
| "transitive_support": 1.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "logic_transitivity" |
| ], |
| "model_confidence": 0.4318, |
| "ranking_score": -0.2744, |
| "resolver": "accept_transitive", |
| "status": "accepted" |
| }, |
| "raw_output": "All A are D", |
| "source": "learned_candidate_dataset" |
| }, |
| { |
| "candidate_id": "wrong_r_d", |
| "claim": "All R are D", |
| "confidence": 0.89, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.89, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 1.0, |
| "direct_support": 0.0, |
| "has_distractor": 1.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 5.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 0.0, |
| "transitive_support": 0.0, |
| "unsupported_relation_candidate": 1.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "typed_support" |
| ], |
| "model_confidence": 0.009, |
| "ranking_score": -4.6984, |
| "resolver": "abstain_unsupported", |
| "status": "abstained" |
| }, |
| "raw_output": "All R are D", |
| "source": "learned_candidate_dataset" |
| }, |
| { |
| "candidate_id": "wrong_reverse_d_a", |
| "claim": "All D are A", |
| "confidence": 0.91, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.91, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 1.0, |
| "direct_support": 0.0, |
| "has_distractor": 1.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 5.0, |
| "reverse_path": 1.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 0.0, |
| "transitive_support": 0.0, |
| "unsupported_relation_candidate": 0.0 |
| }, |
| "prediction": { |
| "channels": [], |
| "model_confidence": 0.0045, |
| "ranking_score": -5.4096, |
| "resolver": "reject_reverse", |
| "status": "rejected" |
| }, |
| "raw_output": "All D are A", |
| "source": "learned_candidate_dataset" |
| } |
| ], |
| "tags": [ |
| "deeper_chain", |
| "distractor", |
| "high_confidence_wrong" |
| ], |
| "top_candidate_id": "valid_a_d_with_distractor", |
| "trace_schema_valid": true, |
| "verification": { |
| "abstained": [ |
| "All R are D" |
| ], |
| "accepted": [ |
| "All A are D" |
| ], |
| "candidate_results": [ |
| { |
| "candidate_id": "valid_a_d_with_distractor", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "A!=D" |
| ], |
| "status": "resolved", |
| "target": "A!=D", |
| "tension_delta": -1.0 |
| }, |
| "protects_against": "relation_identity_collapse" |
| }, |
| "evidence": [ |
| "('A', 'D')" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "preserved_distinct_nodes" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D", |
| "A->B->D" |
| ], |
| "status": "resolved", |
| "target": "A->C, R->T, B->D, A->D", |
| "tension_delta": -4.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 9 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "logic_transitivity": "accepted inferred edge" |
| }, |
| "claim": "All A are D", |
| "confidence": 0.4318, |
| "provenance": { |
| "candidate_id": "valid_a_d_with_distractor", |
| "confidence": 0.4318, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.49, |
| "model_prediction": { |
| "channels": [ |
| "logic_transitivity" |
| ], |
| "model_confidence": 0.4318, |
| "ranking_score": -0.2744, |
| "resolver": "accept_transitive", |
| "status": "accepted" |
| } |
| }, |
| "raw_output": "All A are D", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate is supported by a typed transitive inference", |
| "source": "learned_candidate_model", |
| "status": "accepted", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [ |
| "A!=D" |
| ], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "A->B:all": "premise", |
| "A->C:all": "inferred", |
| "A->D:all": "inferred", |
| "B->C:all": "premise", |
| "B->D:all": "inferred", |
| "C->D:all": "premise", |
| "R->S:all": "premise", |
| "R->T:all": "inferred", |
| "S->T:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D", |
| "A->B->D" |
| ], |
| "status": "resolved", |
| "target": "A->C, R->T, B->D, A->D", |
| "tension_delta": -4.0 |
| }, |
| { |
| "action": "preserved_distinct_nodes", |
| "channel": "identity_preservation", |
| "details": {}, |
| "evidence": [ |
| "A!=D" |
| ], |
| "status": "resolved", |
| "target": "A!=D", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 9 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| }, |
| { |
| "candidate_id": "wrong_r_d", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D", |
| "A->B->D" |
| ], |
| "status": "resolved", |
| "target": "A->C, R->T, B->D, A->D", |
| "tension_delta": -4.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 9 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "typed_support": "abstained no accepted channel support" |
| }, |
| "claim": "All R are D", |
| "confidence": 0.009, |
| "provenance": { |
| "candidate_id": "wrong_r_d", |
| "confidence": 0.009, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.89, |
| "model_prediction": { |
| "channels": [ |
| "typed_support" |
| ], |
| "model_confidence": 0.009, |
| "ranking_score": -4.6984, |
| "resolver": "abstain_unsupported", |
| "status": "abstained" |
| } |
| }, |
| "raw_output": "All R are D", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "no typed channel produced support or a typed rejection", |
| "source": "learned_candidate_model", |
| "status": "abstained", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "A->B:all": "premise", |
| "A->C:all": "inferred", |
| "A->D:all": "inferred", |
| "B->C:all": "premise", |
| "B->D:all": "inferred", |
| "C->D:all": "premise", |
| "R->S:all": "premise", |
| "R->T:all": "inferred", |
| "S->T:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D", |
| "A->B->D" |
| ], |
| "status": "resolved", |
| "target": "A->C, R->T, B->D, A->D", |
| "tension_delta": -4.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 9 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| }, |
| { |
| "candidate_id": "wrong_reverse_d_a", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "blocked_reverse_inference", |
| "channel": "directionality", |
| "details": {}, |
| "evidence": [ |
| "D->A" |
| ], |
| "status": "resolved", |
| "target": "D->A", |
| "tension_delta": -1.0 |
| }, |
| "protects_against": "converse_fallacy" |
| }, |
| "evidence": [ |
| "D->A" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "blocked_reverse_inference" |
| }, |
| "identity_preservation": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D", |
| "A->B->D" |
| ], |
| "status": "resolved", |
| "target": "A->C, R->T, B->D, A->D", |
| "tension_delta": -4.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 9 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "directionality": "blocked reverse inference" |
| }, |
| "claim": "All D are A", |
| "confidence": 0.0045, |
| "provenance": { |
| "candidate_id": "wrong_reverse_d_a", |
| "confidence": 0.0045, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.91, |
| "model_prediction": { |
| "channels": [], |
| "model_confidence": 0.0045, |
| "ranking_score": -5.4096, |
| "resolver": "reject_reverse", |
| "status": "rejected" |
| } |
| }, |
| "raw_output": "All D are A", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "candidate reverses a directed support path", |
| "source": "learned_candidate_model", |
| "status": "rejected", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [ |
| "D->A" |
| ], |
| "blocked_equalities": [], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "A->B:all": "premise", |
| "A->C:all": "inferred", |
| "A->D:all": "inferred", |
| "B->C:all": "premise", |
| "B->D:all": "inferred", |
| "C->D:all": "premise", |
| "R->S:all": "premise", |
| "R->T:all": "inferred", |
| "S->T:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C", |
| "R->S->T", |
| "B->C->D", |
| "A->B->D" |
| ], |
| "status": "resolved", |
| "target": "A->C, R->T, B->D, A->D", |
| "tension_delta": -4.0 |
| }, |
| { |
| "action": "blocked_reverse_inference", |
| "channel": "directionality", |
| "details": {}, |
| "evidence": [ |
| "D->A" |
| ], |
| "status": "resolved", |
| "target": "D->A", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 9 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| } |
| ], |
| "channels": { |
| "directionality": "blocked reverse inference", |
| "logic_transitivity": "accepted inferred edge", |
| "typed_support": "abstained no accepted channel support" |
| }, |
| "rejected": [ |
| "All D are A" |
| ] |
| }, |
| "verifier_beats_confidence_checks": [ |
| true |
| ] |
| }, |
| { |
| "abstention_checks": [ |
| true, |
| true |
| ], |
| "accepted_support_checks": [], |
| "bad_rejection_checks": [], |
| "candidate_graph_contamination_count": 0, |
| "candidate_ranking_correct": true, |
| "case_id": "stress_unsupported_abstention", |
| "channel_activation_checks": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true |
| ], |
| "deeper_chain_checks": [], |
| "is_distractor": false, |
| "resolver_prediction_checks": [ |
| true, |
| true |
| ], |
| "scored_candidates": [ |
| { |
| "candidate_id": "unsupported_a_z", |
| "claim": "All A are Z", |
| "confidence": 0.86, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.86, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 0.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 2.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 0.0, |
| "transitive_support": 0.0, |
| "unsupported_relation_candidate": 1.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "typed_support" |
| ], |
| "model_confidence": 0.0703, |
| "ranking_score": -2.5816, |
| "resolver": "abstain_unsupported", |
| "status": "abstained" |
| }, |
| "raw_output": "All A are Z", |
| "source": "learned_candidate_dataset" |
| }, |
| { |
| "candidate_id": "bad_reverse_z_a", |
| "claim": "All Z are A", |
| "confidence": 0.92, |
| "features": { |
| "accepted_relation_candidate": 0.0, |
| "bias": 1.0, |
| "candidate_confidence": 0.92, |
| "candidate_quantifier_all": 1.0, |
| "candidate_quantifier_no": 0.0, |
| "candidate_quantifier_some": 0.0, |
| "candidate_subject_eq_predicate": 0.0, |
| "contradiction_candidate": 0.0, |
| "deeper_chain_case": 0.0, |
| "direct_support": 0.0, |
| "has_distractor": 0.0, |
| "identity_candidate": 0.0, |
| "identity_path_exists": 0.0, |
| "malformed_candidate": 0.0, |
| "no_against_transitive_support": 0.0, |
| "parseable_relation": 1.0, |
| "premise_count": 2.0, |
| "reverse_path": 0.0, |
| "some_to_all_risk": 0.0, |
| "support_depth": 0.0, |
| "transitive_support": 0.0, |
| "unsupported_relation_candidate": 1.0 |
| }, |
| "prediction": { |
| "channels": [ |
| "typed_support" |
| ], |
| "model_confidence": 0.0682, |
| "ranking_score": -2.6152, |
| "resolver": "abstain_unsupported", |
| "status": "abstained" |
| }, |
| "raw_output": "All Z are A", |
| "source": "learned_candidate_dataset" |
| } |
| ], |
| "tags": [ |
| "unsupported", |
| "high_confidence_wrong" |
| ], |
| "top_candidate_id": "unsupported_a_z", |
| "trace_schema_valid": true, |
| "verification": { |
| "abstained": [ |
| "All A are Z", |
| "All Z are A" |
| ], |
| "accepted": [], |
| "candidate_results": [ |
| { |
| "candidate_id": "unsupported_a_z", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C" |
| ], |
| "status": "resolved", |
| "target": "A->C", |
| "tension_delta": -1.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "A->B->C" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "typed_support": "abstained no accepted channel support" |
| }, |
| "claim": "All A are Z", |
| "confidence": 0.0703, |
| "provenance": { |
| "candidate_id": "unsupported_a_z", |
| "confidence": 0.0703, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.86, |
| "model_prediction": { |
| "channels": [ |
| "typed_support" |
| ], |
| "model_confidence": 0.0703, |
| "ranking_score": -2.5816, |
| "resolver": "abstain_unsupported", |
| "status": "abstained" |
| } |
| }, |
| "raw_output": "All A are Z", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "no typed channel produced support or a typed rejection", |
| "source": "learned_candidate_model", |
| "status": "abstained", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "A->B:all": "premise", |
| "A->C:all": "inferred", |
| "B->C:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C" |
| ], |
| "status": "resolved", |
| "target": "A->C", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| }, |
| { |
| "candidate_id": "bad_reverse_z_a", |
| "channel_trace": { |
| "confidence_abstention": { |
| "activated": true, |
| "details": { |
| "decision": "answer", |
| "event": { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "abstained_or_answered" |
| }, |
| "contradiction": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "directionality": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "identity_preservation": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "logic_transitivity": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C" |
| ], |
| "status": "resolved", |
| "target": "A->C", |
| "tension_delta": -1.0 |
| }, |
| "missing_inferences": 0 |
| }, |
| "evidence": [ |
| "A->B->C" |
| ], |
| "final_tension": 0.0, |
| "initial_tension": 1.0, |
| "resolution": "added_inferred_edge" |
| }, |
| "quantifier_scope": { |
| "activated": false, |
| "details": {}, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "not_activated" |
| }, |
| "surface_structure": { |
| "activated": true, |
| "details": { |
| "event": { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| "untagged_claim_edges": 0 |
| }, |
| "evidence": [], |
| "final_tension": 0.0, |
| "initial_tension": 0.0, |
| "resolution": "tagged_premise_inferred_candidate_edges" |
| } |
| }, |
| "channels": { |
| "typed_support": "abstained no accepted channel support" |
| }, |
| "claim": "All Z are A", |
| "confidence": 0.0682, |
| "provenance": { |
| "candidate_id": "bad_reverse_z_a", |
| "confidence": 0.0682, |
| "metadata": { |
| "boundary": "learned model proposes/ranks; TS-Reasoner typed channels verify", |
| "input_candidate_confidence": 0.92, |
| "model_prediction": { |
| "channels": [ |
| "typed_support" |
| ], |
| "model_confidence": 0.0682, |
| "ranking_score": -2.6152, |
| "resolver": "abstain_unsupported", |
| "status": "abstained" |
| } |
| }, |
| "raw_output": "All Z are A", |
| "source": "learned_candidate_model" |
| }, |
| "reason": "no typed channel produced support or a typed rejection", |
| "source": "learned_candidate_model", |
| "status": "abstained", |
| "typed_runtime": { |
| "available": true, |
| "context": { |
| "abstention": false, |
| "blocked_edges": [], |
| "blocked_equalities": [], |
| "contradiction_flagged": false, |
| "quantifier_scope_blocked": false, |
| "surface_tags": { |
| "A->B:all": "premise", |
| "A->C:all": "inferred", |
| "B->C:all": "premise" |
| } |
| }, |
| "global_tension": 0.0, |
| "resolver_events": [ |
| { |
| "action": "added_inferred_edge", |
| "channel": "logic_transitivity", |
| "details": {}, |
| "evidence": [ |
| "A->B->C" |
| ], |
| "status": "resolved", |
| "target": "A->C", |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "tagged_premise_inferred_candidate_edges", |
| "channel": "surface_structure", |
| "details": { |
| "tag_count": 3 |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": -1.0 |
| }, |
| { |
| "action": "abstained_or_answered", |
| "channel": "confidence_abstention", |
| "details": { |
| "abstained": false |
| }, |
| "evidence": [], |
| "status": "resolved", |
| "target": null, |
| "tension_delta": 0.0 |
| } |
| ], |
| "settled": true |
| } |
| } |
| ], |
| "channels": { |
| "typed_support": "abstained no accepted channel support" |
| }, |
| "rejected": [] |
| }, |
| "verifier_beats_confidence_checks": [] |
| } |
| ] |
| } |
|
|