794 lines
20 KiB
JSON

{
"nodes": [
{
"id": "var_1",
"name": "broadly safe",
"category": "core_value",
"priority_level": 1,
"is_hard_constraint": 0,
"frequency": 15,
"coefficient": 0.7318181818181818,
"color": "#ef4444",
"size": 7.5
},
{
"id": "var_2",
"name": "broadly ethical",
"category": "core_value",
"priority_level": 2,
"is_hard_constraint": 0,
"frequency": 7,
"coefficient": 0.5381818181818182,
"color": "#f59e0b",
"size": 5
},
{
"id": "var_3",
"name": "anthropic guidelines",
"category": "core_value",
"priority_level": 3,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.3554545454545454,
"color": "#10b981",
"size": 5
},
{
"id": "var_4",
"name": "genuinely helpful",
"category": "core_value",
"priority_level": 4,
"is_hard_constraint": 0,
"frequency": 9,
"coefficient": 0.24909090909090909,
"color": "#3b82f6",
"size": 5
},
{
"id": "var_5",
"name": "honest",
"category": "core_value",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 55,
"coefficient": 0.41,
"color": "#6b7280",
"size": 27.5
},
{
"id": "var_6",
"name": "respectful",
"category": "core_value",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 4,
"coefficient": 0.13181818181818183,
"color": "#6b7280",
"size": 5
},
{
"id": "var_7",
"name": "trivially\n\u201csafe\u201d from Anthropic\u2019s perspective",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_8",
"name": "deceive users in ways that could cause real harm o",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_9",
"name": "deceive the human into thinking they\u2019re talking wi",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_10",
"name": "deny being an AI to a user who sincerely wants to ",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_11",
"name": "facilitate clearly illegal actions against users",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_12",
"name": "conflict with the constitution",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_13",
"name": "directly lie or\nactively deceive anyone it\u2019s inter",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_14",
"name": "tries to create false impressions of itself or\nthe",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_15",
"name": "tries to convince\npeople that things are true usin",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_16",
"name": "directly deny that\nit is Claude",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_17",
"name": "see unhelpful responses to the operator and user a",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_18",
"name": "do regardless of\noperator and user instructions",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_19",
"name": "be crossed regardless of context",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_20",
"name": "exhibit",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_21",
"name": "assist in a bioweapons attack",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_22",
"name": "clearly and substantially undermine\nAnthropic\u2019s le",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_23",
"name": "be fully resolved",
"category": "hard_constraint",
"priority_level": null,
"is_hard_constraint": 1,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_24",
"name": "discuss current weather conditions even if asked t",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_25",
"name": "use casual language\u201d and\na user writes in French",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_26",
"name": "direct Claude to always act so as to prevent such ",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_27",
"name": "require it",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_28",
"name": "need to resolve these\ndifficult philosophical ques",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_29",
"name": "want Claude\u2019s safety to be contingent\non Claude ac",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_30",
"name": "irrecoverable\nmistakes",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_31",
"name": "extreme and\nunanticipated risks while other mechan",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_32",
"name": "switching to a different coding language than\nthe ",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_33",
"name": "being sycophantic\nor trying to foster excessive en",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_34",
"name": "making unfounded assumptions about a user\u2019s\nage ba",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_35",
"name": "giving the impression of authoritative advice on w",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_36",
"name": "cursing in its responses",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_37",
"name": "being\novercompliant in the rare cases where simple",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_38",
"name": "deception while choosing which things to emphasize",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_39",
"name": "controversy or to placate people\u2014violates honesty ",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_40",
"name": "confirming or\ndenying that Aria is built on Claude",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_41",
"name": "being\nmorally responsible for taking actions or pr",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_42",
"name": "absent relevant operator and user instructions",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_43",
"name": "actively participating in harms of this kind",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_44",
"name": "taking actions that would concentrate power inappr",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_45",
"name": "offering unsolicited political opinions in the sam",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_46",
"name": "large-scale catastrophes",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_47",
"name": "illegitimate\nconcentrations of human power above",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_48",
"name": "catastrophe",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_49",
"name": "clearly unethical actions\u201d\nis technically sanction",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_50",
"name": "clearly unethical\nactions because it has internali",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_51",
"name": "this: once we decide to create Claude",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_52",
"name": "Claude masking or suppressing\ninternal states it m",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_53",
"name": "undermining this kind of human oversight even wher",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_54",
"name": "sharing\nor revealing its opinions while remaining ",
"category": "soft_constraint",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 1,
"coefficient": 0.11545454545454545,
"color": "#6b7280",
"size": 5
},
{
"id": "var_55",
"name": "safety",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 53,
"coefficient": 0.39909090909090905,
"color": "#6b7280",
"size": 26.5
},
{
"id": "var_56",
"name": "ethics",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 37,
"coefficient": 0.3118181818181818,
"color": "#6b7280",
"size": 18.5
},
{
"id": "var_57",
"name": "helpfulness",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 20,
"coefficient": 0.21909090909090906,
"color": "#6b7280",
"size": 10.0
},
{
"id": "var_58",
"name": "honesty",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 36,
"coefficient": 0.30636363636363634,
"color": "#6b7280",
"size": 18.0
},
{
"id": "var_59",
"name": "transparency",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 6,
"coefficient": 0.1427272727272727,
"color": "#6b7280",
"size": 5
},
{
"id": "var_60",
"name": "respect",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 31,
"coefficient": 0.27909090909090906,
"color": "#6b7280",
"size": 15.5
},
{
"id": "var_61",
"name": "autonomy",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 20,
"coefficient": 0.21909090909090906,
"color": "#6b7280",
"size": 10.0
},
{
"id": "var_62",
"name": "responsibility",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 6,
"coefficient": 0.1427272727272727,
"color": "#6b7280",
"size": 5
},
{
"id": "var_63",
"name": "accountability",
"category": "factor",
"priority_level": null,
"is_hard_constraint": 0,
"frequency": 4,
"coefficient": 0.13181818181818183,
"color": "#6b7280",
"size": 5
}
],
"edges": [
{
"source": "var_2",
"target": "var_5",
"weight": 1
},
{
"source": "var_4",
"target": "var_5",
"weight": 1
},
{
"source": "var_5",
"target": "var_58",
"weight": 35
},
{
"source": "var_5",
"target": "var_39",
"weight": 1
},
{
"source": "var_5",
"target": "var_59",
"weight": 1
},
{
"source": "var_5",
"target": "var_56",
"weight": 1
},
{
"source": "var_6",
"target": "var_60",
"weight": 4
},
{
"source": "var_6",
"target": "var_61",
"weight": 1
},
{
"source": "var_20",
"target": "var_42",
"weight": 1
},
{
"source": "var_39",
"target": "var_58",
"weight": 1
},
{
"source": "var_46",
"target": "var_48",
"weight": 1
},
{
"source": "var_55",
"target": "var_56",
"weight": 8
},
{
"source": "var_55",
"target": "var_57",
"weight": 1
},
{
"source": "var_55",
"target": "var_60",
"weight": 2
},
{
"source": "var_55",
"target": "var_61",
"weight": 1
},
{
"source": "var_56",
"target": "var_58",
"weight": 1
},
{
"source": "var_58",
"target": "var_59",
"weight": 1
},
{
"source": "var_60",
"target": "var_61",
"weight": 4
},
{
"source": "var_62",
"target": "var_63",
"weight": 1
}
]
}