-
Explore a Promising Approach to AI Safety
+
Tractatus demonstrates how structural enforcement may complement behavioral training. We invite researchers and practitioners to evaluate, critique, and build upon this work.
diff --git a/public/locales/de/architecture.json b/public/locales/de/architecture.json
index cb90fa60..17a4537c 100644
--- a/public/locales/de/architecture.json
+++ b/public/locales/de/architecture.json
@@ -44,32 +44,32 @@
"services": {
"heading": "Sechs Governance-Dienste",
"boundary": {
- "name": "BoundaryEnforcer",
+ "name": "BoundaryEnforcer",
"description": "Hindert die KI daran, Werteentscheidungen zu treffen (Datenschutz, Ethik, strategische Ausrichtung). Erfordert menschliche Genehmigung.",
"promise": "Frühes Versprechen: Wertegrenzen extern durchgesetzt – schwieriger durch Prompting zu manipulieren."
},
"instruction": {
- "name": "InstructionPersistenceClassifier",
+ "name": "InstructionPersistenceClassifier",
"description": "Speichert Anweisungen extern mit Persistenzstufen (HIGH/MEDIUM/LOW). Zielt darauf ab, den Direktiven-Verfall zu reduzieren.",
"promise": "Frühes Versprechen: Anweisungen außerhalb der KI gespeichert – widerstandsfähiger gegen Kontextmanipulation."
},
"validator": {
- "name": "CrossReferenceValidator",
+ "name": "CrossReferenceValidator",
"description": "Validiert KI-Aktionen gegen Anweisungshistorie. Zielt darauf ab, Musterbias-Überschreibung expliziter Direktiven zu verhindern.",
"promise": "Frühes Versprechen: Unabhängige Verifikation – KI-Behauptungen gegen externe Quelle geprüft."
},
"pressure": {
- "name": "ContextPressureMonitor",
+ "name": "ContextPressureMonitor",
"description": "Überwacht KI-Leistungsverschlechterung. Eskaliert, wenn Kontextdruck die Qualität bedroht.",
"promise": "Frühes Versprechen: Objektive Metriken können Manipulationsversuche frühzeitig erkennen."
},
"metacognitive": {
- "name": "MetacognitiveVerifier",
+ "name": "MetacognitiveVerifier",
"description": "Erfordert, dass die KI pausiert und komplexe Operationen vor der Ausführung überprüft. Strukturelle Sicherheitsprüfung.",
"promise": "Frühes Versprechen: Architektonische Gates zielen darauf ab, Verifikationsschritte durchzusetzen."
},
"deliberation": {
- "name": "PluralisticDeliberationOrchestrator",
+ "name": "PluralisticDeliberationOrchestrator",
"description": "Erleichtert Multi-Stakeholder-Beratung bei Wertekonflikten. KI bietet Moderation, keine Autorität.",
"promise": "Frühes Versprechen: Menschliches Urteil erforderlich – architektonisch erzwungene Eskalation für Werte."
}
diff --git a/public/locales/en/architecture.json b/public/locales/en/architecture.json
index 739dc528..a0ad0759 100644
--- a/public/locales/en/architecture.json
+++ b/public/locales/en/architecture.json
@@ -44,32 +44,32 @@
"services": {
"heading": "Six Governance Services",
"boundary": {
- "name": "BoundaryEnforcer",
+ "name": "BoundaryEnforcer",
"description": "Blocks AI from making values decisions (privacy, ethics, strategic direction). Requires human approval.",
"promise": "Early Promise: Values boundaries enforced externally—harder to manipulate through prompting."
},
"instruction": {
- "name": "InstructionPersistenceClassifier",
+ "name": "InstructionPersistenceClassifier",
"description": "Stores instructions externally with persistence levels (HIGH/MEDIUM/LOW). Aims to reduce directive fade.",
"promise": "Early Promise: Instructions stored outside AI—more resistant to context manipulation."
},
"validator": {
- "name": "CrossReferenceValidator",
+ "name": "CrossReferenceValidator",
"description": "Validates AI actions against instruction history. Aims to prevent pattern bias overriding explicit directives.",
"promise": "Early Promise: Independent verification—AI claims checked against external source."
},
"pressure": {
- "name": "ContextPressureMonitor",
+ "name": "ContextPressureMonitor",
"description": "Monitors AI performance degradation. Escalates when context pressure threatens quality.",
"promise": "Early Promise: Objective metrics may detect manipulation attempts early."
},
"metacognitive": {
- "name": "MetacognitiveVerifier",
+ "name": "MetacognitiveVerifier",
"description": "Requires AI to pause and verify complex operations before execution. Structural safety check.",
"promise": "Early Promise: Architectural gates aim to enforce verification steps."
},
"deliberation": {
- "name": "PluralisticDeliberationOrchestrator",
+ "name": "PluralisticDeliberationOrchestrator",
"description": "Facilitates multi-stakeholder deliberation for values conflicts. AI provides facilitation, not authority.",
"promise": "Early Promise: Human judgment required—architecturally enforced escalation for values."
}
diff --git a/public/locales/fr/architecture.json b/public/locales/fr/architecture.json
index 8babc8b7..6efc957b 100644
--- a/public/locales/fr/architecture.json
+++ b/public/locales/fr/architecture.json
@@ -44,32 +44,32 @@
"services": {
"heading": "Six Services de Gouvernance",
"boundary": {
- "name": "BoundaryEnforcer",
+ "name": "BoundaryEnforcer",
"description": "Empêche l'IA de prendre des décisions de valeurs (confidentialité, éthique, direction stratégique). Nécessite l'approbation humaine.",
"promise": "Promesse Précoce: Frontières de valeurs appliquées en externe – plus difficile à manipuler par prompting."
},
"instruction": {
- "name": "InstructionPersistenceClassifier",
+ "name": "InstructionPersistenceClassifier",
"description": "Stocke les instructions en externe avec des niveaux de persistance (HIGH/MEDIUM/LOW). Vise à réduire la dérive des directives.",
"promise": "Promesse Précoce: Instructions stockées en dehors de l'IA – plus résistantes à la manipulation contextuelle."
},
"validator": {
- "name": "CrossReferenceValidator",
+ "name": "CrossReferenceValidator",
"description": "Valide les actions de l'IA contre l'historique des instructions. Vise à empêcher le biais de pattern d'outrepasser les directives explicites.",
"promise": "Promesse Précoce: Vérification indépendante – les affirmations de l'IA sont vérifiées contre une source externe."
},
"pressure": {
- "name": "ContextPressureMonitor",
+ "name": "ContextPressureMonitor",
"description": "Surveille la dégradation des performances de l'IA. Escalade lorsque la pression contextuelle menace la qualité.",
"promise": "Promesse Précoce: Les métriques objectives peuvent détecter les tentatives de manipulation tôt."
},
"metacognitive": {
- "name": "MetacognitiveVerifier",
+ "name": "MetacognitiveVerifier",
"description": "Exige que l'IA fasse une pause et vérifie les opérations complexes avant l'exécution. Vérification de sécurité structurelle.",
"promise": "Promesse Précoce: Les portes architecturales visent à appliquer les étapes de vérification."
},
"deliberation": {
- "name": "PluralisticDeliberationOrchestrator",
+ "name": "PluralisticDeliberationOrchestrator",
"description": "Facilite la délibération multi-parties prenantes pour les conflits de valeurs. L'IA fournit la facilitation, pas l'autorité.",
"promise": "Promesse Précoce: Jugement humain requis – escalade architecturalement appliquée pour les valeurs."
}