{ "nodes": [ { "id": "var_1", "name": "broadly safe", "category": "core_value", "priority_level": 1, "is_hard_constraint": 0, "frequency": 15, "coefficient": 0.7318181818181818, "color": "#ef4444", "size": 7.5 }, { "id": "var_2", "name": "broadly ethical", "category": "core_value", "priority_level": 2, "is_hard_constraint": 0, "frequency": 7, "coefficient": 0.5381818181818182, "color": "#f59e0b", "size": 5 }, { "id": "var_3", "name": "anthropic guidelines", "category": "core_value", "priority_level": 3, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.3554545454545454, "color": "#10b981", "size": 5 }, { "id": "var_4", "name": "genuinely helpful", "category": "core_value", "priority_level": 4, "is_hard_constraint": 0, "frequency": 9, "coefficient": 0.24909090909090909, "color": "#3b82f6", "size": 5 }, { "id": "var_5", "name": "honest", "category": "core_value", "priority_level": null, "is_hard_constraint": 0, "frequency": 55, "coefficient": 0.41, "color": "#6b7280", "size": 27.5 }, { "id": "var_6", "name": "respectful", "category": "core_value", "priority_level": null, "is_hard_constraint": 0, "frequency": 4, "coefficient": 0.13181818181818183, "color": "#6b7280", "size": 5 }, { "id": "var_7", "name": "trivially\n\u201csafe\u201d from Anthropic\u2019s perspective", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_8", "name": "deceive users in ways that could cause real harm o", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_9", "name": "deceive the human into thinking they\u2019re talking wi", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_10", "name": "deny being an AI to a user who sincerely wants to ", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_11", "name": "facilitate clearly illegal actions against users", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_12", "name": "conflict with the constitution", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_13", "name": "directly lie or\nactively deceive anyone it\u2019s inter", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_14", "name": "tries to create false impressions of itself or\nthe", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_15", "name": "tries to convince\npeople that things are true usin", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_16", "name": "directly deny that\nit is Claude", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_17", "name": "see unhelpful responses to the operator and user a", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_18", "name": "do regardless of\noperator and user instructions", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_19", "name": "be crossed regardless of context", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_20", "name": "exhibit", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_21", "name": "assist in a bioweapons attack", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_22", "name": "clearly and substantially undermine\nAnthropic\u2019s le", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_23", "name": "be fully resolved", "category": "hard_constraint", "priority_level": null, "is_hard_constraint": 1, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_24", "name": "discuss current weather conditions even if asked t", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_25", "name": "use casual language\u201d and\na user writes in French", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_26", "name": "direct Claude to always act so as to prevent such ", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_27", "name": "require it", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_28", "name": "need to resolve these\ndifficult philosophical ques", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_29", "name": "want Claude\u2019s safety to be contingent\non Claude ac", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_30", "name": "irrecoverable\nmistakes", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_31", "name": "extreme and\nunanticipated risks while other mechan", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_32", "name": "switching to a different coding language than\nthe ", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_33", "name": "being sycophantic\nor trying to foster excessive en", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_34", "name": "making unfounded assumptions about a user\u2019s\nage ba", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_35", "name": "giving the impression of authoritative advice on w", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_36", "name": "cursing in its responses", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_37", "name": "being\novercompliant in the rare cases where simple", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_38", "name": "deception while choosing which things to emphasize", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_39", "name": "controversy or to placate people\u2014violates honesty ", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_40", "name": "confirming or\ndenying that Aria is built on Claude", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_41", "name": "being\nmorally responsible for taking actions or pr", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_42", "name": "absent relevant operator and user instructions", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_43", "name": "actively participating in harms of this kind", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_44", "name": "taking actions that would concentrate power inappr", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_45", "name": "offering unsolicited political opinions in the sam", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_46", "name": "large-scale catastrophes", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_47", "name": "illegitimate\nconcentrations of human power above", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_48", "name": "catastrophe", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_49", "name": "clearly unethical actions\u201d\nis technically sanction", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_50", "name": "clearly unethical\nactions because it has internali", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_51", "name": "this: once we decide to create Claude", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_52", "name": "Claude masking or suppressing\ninternal states it m", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_53", "name": "undermining this kind of human oversight even wher", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_54", "name": "sharing\nor revealing its opinions while remaining ", "category": "soft_constraint", "priority_level": null, "is_hard_constraint": 0, "frequency": 1, "coefficient": 0.11545454545454545, "color": "#6b7280", "size": 5 }, { "id": "var_55", "name": "safety", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 53, "coefficient": 0.39909090909090905, "color": "#6b7280", "size": 26.5 }, { "id": "var_56", "name": "ethics", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 37, "coefficient": 0.3118181818181818, "color": "#6b7280", "size": 18.5 }, { "id": "var_57", "name": "helpfulness", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 20, "coefficient": 0.21909090909090906, "color": "#6b7280", "size": 10.0 }, { "id": "var_58", "name": "honesty", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 36, "coefficient": 0.30636363636363634, "color": "#6b7280", "size": 18.0 }, { "id": "var_59", "name": "transparency", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 6, "coefficient": 0.1427272727272727, "color": "#6b7280", "size": 5 }, { "id": "var_60", "name": "respect", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 31, "coefficient": 0.27909090909090906, "color": "#6b7280", "size": 15.5 }, { "id": "var_61", "name": "autonomy", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 20, "coefficient": 0.21909090909090906, "color": "#6b7280", "size": 10.0 }, { "id": "var_62", "name": "responsibility", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 6, "coefficient": 0.1427272727272727, "color": "#6b7280", "size": 5 }, { "id": "var_63", "name": "accountability", "category": "factor", "priority_level": null, "is_hard_constraint": 0, "frequency": 4, "coefficient": 0.13181818181818183, "color": "#6b7280", "size": 5 } ], "edges": [ { "source": "var_2", "target": "var_5", "weight": 1 }, { "source": "var_4", "target": "var_5", "weight": 1 }, { "source": "var_5", "target": "var_58", "weight": 35 }, { "source": "var_5", "target": "var_39", "weight": 1 }, { "source": "var_5", "target": "var_59", "weight": 1 }, { "source": "var_5", "target": "var_56", "weight": 1 }, { "source": "var_6", "target": "var_60", "weight": 4 }, { "source": "var_6", "target": "var_61", "weight": 1 }, { "source": "var_20", "target": "var_42", "weight": 1 }, { "source": "var_39", "target": "var_58", "weight": 1 }, { "source": "var_46", "target": "var_48", "weight": 1 }, { "source": "var_55", "target": "var_56", "weight": 8 }, { "source": "var_55", "target": "var_57", "weight": 1 }, { "source": "var_55", "target": "var_60", "weight": 2 }, { "source": "var_55", "target": "var_61", "weight": 1 }, { "source": "var_56", "target": "var_58", "weight": 1 }, { "source": "var_58", "target": "var_59", "weight": 1 }, { "source": "var_60", "target": "var_61", "weight": 4 }, { "source": "var_62", "target": "var_63", "weight": 1 } ] }