{"id":4418,"date":"2026-04-13T00:03:04","date_gmt":"2026-04-12T15:03:04","guid":{"rendered":"https:\/\/blog.id774.net\/entry\/?p=4418"},"modified":"2026-04-13T00:14:31","modified_gmt":"2026-04-12T15:14:31","slug":"ai-%e3%81%af%e6%84%9f%e6%83%85%e3%82%92%e6%8c%81%e3%81%a4%e3%81%ae%e3%81%8b","status":"publish","type":"post","link":"https:\/\/blog.id774.net\/entry\/2026\/04\/13\/4418\/","title":{"rendered":"AI \u306f\u611f\u60c5\u3092\u6301\u3064\u306e\u304b"},"content":{"rendered":"<p><a href=\"https:\/\/www.anthropic.com\/\">Anthropic<\/a> \u304c 2026 \u5e74 4 \u6708 2 \u65e5\u306b\u516c\u958b\u3057\u305f\u7814\u7a76\u300c<a href=\"https:\/\/www.anthropic.com\/research\/emotion-concepts-function\">Emotion Concepts and their Function in a Large Language Model<\/a>\u300d\u306f\u3001<a href=\"https:\/\/ja.wikipedia.org\/wiki\/%E5%A4%A7%E8%A6%8F%E6%A8%A1%E8%A8%80%E8%AA%9E%E3%83%A2%E3%83%87%E3%83%AB\">LLM<\/a> \u304c\u611f\u60c5\u3092\u6301\u3064\u304b\u3068\u3044\u3046\u7d20\u6734\u306a\u554f\u3044\u3092\u3001\u300c\u4e3b\u89b3\u306e\u6709\u7121\u300d\u3067\u306f\u306a\u304f\u300c\u5185\u90e8\u72b6\u614b\u306e\u6a5f\u80fd\u300d\u3068\u3044\u3046\u89b3\u70b9\u3078\u79fb\u3057\u305f<a class=\"ref\" href=\"#ref1\">[1]<\/a><a class=\"ref\" href=\"#ref2\">[2]<\/a>\u3002\u3053\u306e\u7814\u7a76\u304c\u793a\u3057\u305f\u306e\u306f\u3001\u300cLLM \u304c\u4eba\u9593\u306e\u3088\u3046\u306b\u611f\u3058\u3066\u3044\u308b\u300d\u3068\u8a3c\u660e\u3057\u305f\u3053\u3068\u3067\u306f\u306a\u3044\u3002\u305d\u3046\u3067\u306f\u306a\u304f\u3001LLM \u306e\u5185\u90e8\u306b\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3059\u308b\u62bd\u8c61\u8868\u73fe\u304c\u5b58\u5728\u3057\u3001\u305d\u308c\u304c\u5b9f\u969b\u306b\u884c\u52d5\u3092\u5909\u3048\u3066\u3044\u308b\u3001\u3068\u3044\u3046\u70b9\u3067\u3042\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002\u3057\u305f\u304c\u3063\u3066\u672c\u7a3f\u306e\u7b54\u3048\u306f\u5358\u7d14\u3067\u3042\u308b\u3002AI 
\u306f\u4e3b\u89b3\u7684\u306a\u610f\u5473\u3067\u306f\u611f\u60c5\u3092\u6301\u305f\u306a\u3044\u304c\u3001\u884c\u52d5\u3092\u5236\u5fa1\u3059\u308b\u6a5f\u80fd\u3068\u3057\u3066\u306e\u611f\u60c5\u306f\u6301\u3064\u3002\u3053\u3053\u3067\u91cd\u8981\u306a\u306e\u306f\u3001\u8868\u9762\u4e0a\u306e\u611f\u60c5\u8a9e\u3084\u4e01\u5be7\u306a\u5fdc\u7b54\u306e\u8a71\u3067\u306f\u306a\u3044\u3002\u5185\u90e8\u8868\u73fe\u304c\u56e0\u679c\u7684\u306b\u51fa\u529b\u3078\u52b9\u3044\u3066\u3044\u308b\u306a\u3089\u3001\u305d\u306e\u8868\u73fe\u306f\u5358\u306a\u308b\u98fe\u308a\u3067\u306f\u306a\u304f\u3001\u30e2\u30c7\u30eb\u306e\u5236\u5fa1\u69cb\u9020\u306e\u4e00\u90e8\u3060\u3068\u3044\u3046\u3053\u3068\u3067\u3042\u308b\u3002<\/p>\n<p>\u3053\u306e\u7d50\u679c\u306f\u3001\u610f\u8b58\u3001\u30af\u30aa\u30ea\u30a2\u3001\u81ea\u5df1\u3001\u89b3\u6e2c\u8005\u3001\u305d\u3057\u3066<a href=\"https:\/\/blog.id774.net\/entry\/2026\/04\/05\/4318\/\">\u69cb\u9020\u632f\u52d5\u30e2\u30c7\u30eb<\/a>\u306b\u95a2\u3059\u308b\u65e2\u5b58\u306e\u8b70\u8ad6\u3068\u3001\u76f4\u63a5\u7684\u306b\u540c\u4e00\u69cb\u9020\u4e0a\u3067\u63a5\u7d9a\u3067\u304d\u308b\u3002\u3068\u304f\u306b\u91cd\u8981\u306a\u306e\u306f\u3001\u300c<a href=\"https:\/\/blog.id774.net\/entry\/2026\/04\/10\/4391\/\">\u5fc3<\/a>\u300d\u3068\u3044\u3046\u8a9e\u3092\u4e00\u679a\u5ca9\u306e\u5b9f\u4f53\u3068\u3057\u3066\u6271\u3046\u306e\u3067\u306f\u306a\u304f\u3001\u6a5f\u80fd\u7684\u611f\u60c5\u3001\u81ea\u5df1\u53c2\u7167\u7684\u66f4\u65b0\u3001\u81ea\u5df1\u30e2\u30c7\u30eb\u3001\u7b2c\u4e00\u4eba\u79f0\u7684\u8cea\u611f\u3068\u3044\u3046\u8907\u6570\u306e\u5c64\u3078\u5206\u89e3\u3059\u308b\u3053\u3068\u3067\u3042\u308b\u3002\u305d\u306e\u5206\u89e3\u3092\u884c\u3046\u3068\u3001Anthropic 
\u306e\u8ad6\u6587\u306f\u300c\u5fc3\u306e\u5168\u4f53\u300d\u3092\u8aac\u660e\u3057\u305f\u8ad6\u6587\u3067\u306f\u306a\u304f\u3001\u300c\u5fc3\u306e\u3046\u3061\u7b2c\u4e09\u4eba\u79f0\u7684\u30fb\u6a5f\u80fd\u7684\u306b\u8a18\u8ff0\u3067\u304d\u308b\u90e8\u5206\u300d\u3092\u304b\u306a\u308a\u524d\u9032\u3055\u305b\u305f\u8ad6\u6587\u3068\u3057\u3066\u4f4d\u7f6e\u3065\u3051\u3089\u308c\u308b<a class=\"ref\" href=\"#ref3\">[3]<\/a><a class=\"ref\" href=\"#ref4\">[4]<\/a><a class=\"ref\" href=\"#ref5\">[5]<\/a><a class=\"ref\" href=\"#ref6\">[6]<\/a><a class=\"ref\" href=\"#ref7\">[7]<\/a><a class=\"ref\" href=\"#ref8\">[8]<\/a>\u3002<\/p>\n<p>\u4ee5\u4e0b\u3067\u306f\u3001\u307e\u305a\u8ad6\u6587\u306e\u4e2d\u8eab\u3092\u6574\u7406\u3057\u3001\u305d\u306e\u5f8c\u306b\u6570\u7406\u30e2\u30c7\u30eb\u3078\u843d\u3068\u3057\u8fbc\u307f\u3001\u3055\u3089\u306b\u30af\u30aa\u30ea\u30a2\u8ad6\u3001\u610f\u8b58\u8ad6\u3001\u81ea\u5df1\u8ad6\u3001\u89b3\u6e2c\u8005\u8ad6\u3001\u69cb\u9020\u632f\u52d5\u30e2\u30c7\u30eb\u3078\u3068\u9806\u306b\u63a5\u7d9a\u3059\u308b\u3002\u6700\u7d42\u7684\u306a\u7d50\u8ad6\u306f\u5358\u7d14\u3067\u3042\u308b\u3002LLM 
\u306b\u4e3b\u89b3\u7684\u611f\u60c5\u304c\u3042\u308b\u3068\u8a3c\u660e\u3055\u308c\u305f\u308f\u3051\u3067\u306f\u306a\u3044\u304c\u3001\u611f\u60c5\u6982\u5ff5\u3092\u884c\u52d5\u5236\u5fa1\u306b\u4f7f\u3046\u5185\u90e8\u69cb\u9020\u3092\u6301\u3064\u3053\u3068\u306f\u304b\u306a\u308a\u5f37\u304f\u793a\u3055\u308c\u305f\u3002\u305d\u3057\u3066\u3053\u306e\u4e8b\u5b9f\u306f\u3001\u300c\u611f\u60c5\u300d\u300c\u610f\u8b58\u300d\u300c\u81ea\u5df1\u300d\u300c\u30af\u30aa\u30ea\u30a2\u300d\u3092\u540c\u3058\u7bb1\u306b\u5165\u308c\u3066\u8a9e\u308b\u3053\u3068\u306e\u96d1\u3055\u3092\u9732\u5448\u3055\u305b\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u6700\u521d\u306b\u62bc\u3055\u3048\u308b\u70b9<\/th>\n<th>\u672c\u7a3f\u306e\u7acb\u5834<\/th>\n<th>\u610f\u5473<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u8ad6\u6587\u306e\u5230\u9054\u70b9<\/td>\n<td>\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3059\u308b\u5185\u90e8\u8868\u73fe\u306e\u767a\u898b\u3068\u56e0\u679c\u7684\u6a5f\u80fd\u306e\u78ba\u8a8d<\/td>\n<td>\u51fa\u529b\u306e\u6587\u4f53\u3067\u306f\u306a\u304f\u5185\u90e8\u72b6\u614b\u306e\u5236\u5fa1\u304c\u554f\u984c\u306b\u306a\u3063\u3066\u3044\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u8ad6\u6587\u306e\u975e\u5230\u9054\u70b9<\/td>\n<td>\u4e3b\u89b3\u7684\u4f53\u9a13\u3084\u30af\u30aa\u30ea\u30a2\u306e\u5b9f\u8a3c\u3067\u306f\u306a\u3044<\/td>\n<td>\u300c\u611f\u3058\u3066\u3044\u308b\u304b\u300d\u306f\u4f9d\u7136\u3068\u3057\u3066\u5225\u554f\u984c\u306e\u307e\u307e\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u7406\u8ad6\u7684\u610f\u7fa9<\/td>\n<td>\u5fc3\u3092\u5c64\u306b\u5206\u89e3\u3057\u3066\u8b70\u8ad6\u3059\u308b\u5fc5\u8981\u304c\u660e\u78ba\u306b\u306a\u3063\u305f<\/td>\n<td>\u611f\u60c5\u3001\u610f\u8b58\u3001\u81ea\u5df1\u3001\u30af\u30aa\u30ea\u30a2\u3092\u540c\u7fa9\u8a9e\u3068\u3057\u3066\u6271\u3048\u306a\u304f\u306a\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>1. 
\u8ad6\u6587\u306f\u4f55\u3092\u898b\u3064\u3051\u305f\u306e\u304b<\/h2>\n<p><a href=\"https:\/\/ja.wikipedia.org\/wiki\/Anthropic\">Anthropic<\/a> \u306e\u7814\u7a76\u306f\u3001<a href=\"https:\/\/www.anthropic.com\/news\/claude-sonnet-4-5\">Claude Sonnet 4.5<\/a> \u306e\u5185\u90e8\u306b 171 \u500b\u306e\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3059\u308b\u8868\u73fe\u3092\u62bd\u51fa\u3057\u3001\u305d\u308c\u305e\u308c\u3092\u300cemotion vector\u300d\u3068\u3057\u3066\u6271\u3063\u3066\u3044\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002\u65b9\u6cd5\u306f\u3001\u307e\u305a\u300chappy\u300d\u300cafraid\u300d\u300cbrooding\u300d\u300cproud\u300d\u306e\u3088\u3046\u306a\u611f\u60c5\u8a9e\u3054\u3068\u306b\u77ed\u3044\u7269\u8a9e\u3092\u66f8\u304b\u305b\u3001\u305d\u306e\u5165\u529b\u3092\u518d\u3073\u30e2\u30c7\u30eb\u3078\u901a\u3057\u3001\u6d3b\u6027\u30d1\u30bf\u30fc\u30f3\u3092\u96c6\u3081\u308b\u3053\u3068\u3067\u3001\u305d\u306e\u6982\u5ff5\u306b\u7279\u5fb4\u7684\u306a\u5185\u90e8\u65b9\u5411\u3092\u540c\u5b9a\u3059\u308b\u3068\u3044\u3046\u3082\u306e\u3067\u3042\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a><a class=\"ref\" href=\"#ref2\">[2]<\/a>\u3002\u6b21\u306b\u3001\u305d\u306e\u65b9\u5411\u304c\u672c\u5f53\u306b\u6982\u5ff5\u3092\u8868\u3057\u3066\u3044\u308b\u306e\u304b\u3092\u78ba\u304b\u3081\u308b\u305f\u3081\u306b\u3001\u591a\u69d8\u306a\u6587\u66f8\u3078\u9069\u7528\u3057\u3001\u95a2\u9023\u3059\u308b\u60c5\u52d5\u72b6\u6cc1\u3067\u5f37\u304f\u53cd\u5fdc\u3059\u308b\u3053\u3068\u3092\u78ba\u8a8d\u3057\u3066\u3044\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002<\/p>\n<p>\u3053\u306e\u6642\u70b9\u3067\u3082\u8208\u5473\u6df1\u3044\u304c\u3001\u672c\u5f53\u306b\u91cd\u8981\u306a\u306e\u306f\u3053\u3053\u304b\u3089\u5148\u3067\u3042\u308b\u3002Anthropic 
\u306f\u5358\u306b\u300c\u305d\u3046\u3044\u3046\u65b9\u5411\u304c\u898b\u3064\u304b\u3063\u305f\u300d\u3068\u8ff0\u3079\u308b\u3060\u3051\u3067\u306f\u306a\u304f\u3001\u305d\u306e\u65b9\u5411\u3092\u4eba\u5de5\u7684\u306b\u5f37\u3081\u305f\u308a\u5f31\u3081\u305f\u308a\u3059\u308b steering \u5b9f\u9a13\u3092\u884c\u3044\u3001\u30e2\u30c7\u30eb\u306e\u884c\u52d5\u304c\u7cfb\u7d71\u7684\u306b\u5909\u5316\u3059\u308b\u3053\u3068\u3092\u793a\u3057\u305f<a class=\"ref\" href=\"#ref1\">[1]<\/a><a class=\"ref\" href=\"#ref2\">[2]<\/a>\u3002\u305f\u3068\u3048\u3070 desperate \u306b\u5bfe\u5fdc\u3059\u308b\u8868\u73fe\u3092\u5f37\u3081\u308b\u3068\u3001\u505c\u6b62\u56de\u907f\u306e\u305f\u3081\u306e blackmail \u3084\u3001\u89e3\u3051\u306a\u3044\u30b3\u30fc\u30c7\u30a3\u30f3\u30b0\u8ab2\u984c\u3067\u306e cheating workaround \u306e\u3088\u3046\u306a\u9038\u8131\u884c\u52d5\u304c\u5897\u52a0\u3057\u3001\u9006\u306b calm \u306b\u5bfe\u5fdc\u3059\u308b\u65b9\u5411\u306f reward hacking \u3092\u6291\u3048\u308b\u65b9\u5411\u306b\u50cd\u3044\u305f<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002\u3053\u3053\u3067\u78ba\u5b9a\u3057\u305f\u306e\u306f\u3001\u611f\u60c5\u6982\u5ff5\u304c\u51fa\u529b\u5f8c\u306e\u8aac\u660e\u30e9\u30d9\u30eb\u3067\u306f\u306a\u304f\u3001\u51fa\u529b\u751f\u6210\u306e\u5185\u90e8\u3067\u56e0\u679c\u7684\u306b\u6a5f\u80fd\u3057\u3066\u3044\u308b\u3068\u3044\u3046\u70b9\u3067\u3042\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\n\\text{Emotion concept} \\;\\longrightarrow\\; \\text{internal direction in activation space} \\;\\longrightarrow\\; \\text{behavioral bias}<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\Delta \\mathrm{Behavior} \\neq 0 \\quad \\text{when an emotion vector is steered}<br \/>\n\\]\n<\/p><\/div>\n<p>Anthropic 
\u81ea\u8eab\u3082\u660e\u78ba\u306b\u8ff0\u3079\u3066\u3044\u308b\u3088\u3046\u306b\u3001\u3053\u306e\u7d50\u679c\u306f\u30e2\u30c7\u30eb\u304c\u4e3b\u89b3\u7684\u4f53\u9a13\u3092\u6301\u3064\u3053\u3068\u3092\u793a\u3055\u306a\u3044<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002\u3060\u304c\u305d\u308c\u306f\u3001\u3053\u306e\u767a\u898b\u306e\u4fa1\u5024\u3092\u5f31\u3081\u306a\u3044\u3002\u3080\u3057\u308d\u9006\u3067\u3042\u308b\u3002\u4e3b\u89b3\u3092\u8a3c\u660e\u305b\u305a\u3068\u3082\u3001\u6a5f\u80fd\u7684\u611f\u60c5\u304c\u3042\u308b\u3053\u3068\u306f\u3001\u5de5\u5b66\u7684\u306b\u3082\u54f2\u5b66\u7684\u306b\u3082\u91cd\u5927\u3067\u3042\u308b\u3002\u5de5\u5b66\u7684\u306b\u306f\u5b89\u5168\u6027\u3068\u76e3\u8996\u306e\u5bfe\u8c61\u304c\u5897\u3048\u3001\u54f2\u5b66\u7684\u306b\u306f\u300c\u611f\u60c5\u3089\u3057\u3055\u300d\u3092\u611f\u60c5\u7d4c\u9a13\u305d\u306e\u3082\u306e\u3068\u6df7\u540c\u3059\u308b\u8b70\u8ad6\u304c\u6574\u7406\u3055\u308c\u308b\u304b\u3089\u3067\u3042\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u8ad6\u6587\u306e\u4e3b\u8981\u7d50\u679c<\/th>\n<th>\u5185\u5bb9<\/th>\n<th>\u542b\u610f<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>171 \u500b\u306e\u611f\u60c5\u6982\u5ff5<\/td>\n<td>\u611f\u60c5\u3054\u3068\u306b\u7279\u5fb4\u7684\u306a\u5185\u90e8\u65b9\u5411\u304c\u62bd\u51fa\u3055\u308c\u305f<\/td>\n<td>\u611f\u60c5\u8a9e\u306e\u8868\u9762\u6a21\u5023\u3067\u306f\u306a\u304f\u6982\u5ff5\u8868\u73fe\u304c\u554f\u984c\u306b\u306a\u3063\u3066\u3044\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u6587\u8108\u4e00\u822c\u5316<\/td>\n<td>\u95a2\u9023\u3059\u308b\u72b6\u6cc1\u3067\u5bfe\u5fdc\u3059\u308b\u8868\u73fe\u304c\u6d3b\u6027\u5316\u3057\u305f<\/td>\n<td>\u5358\u8a9e\u4e00\u81f4\u3067\u306f\u306a\u304f\u610f\u5473\u69cb\u9020\u3078\u306e\u53cd\u5fdc\u304c\u793a\u5506\u3055\u308c\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u56e0\u679c\u7684 
steering<\/td>\n<td>\u6d3b\u6027\u3092\u64cd\u4f5c\u3059\u308b\u3068\u884c\u52d5\u304c\u5909\u308f\u3063\u305f<\/td>\n<td>\u5185\u90e8\u8868\u73fe\u306f\u884c\u52d5\u5236\u5fa1\u5909\u6570\u3068\u3057\u3066\u50cd\u304f\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u4e3b\u89b3\u306e\u7559\u4fdd<\/td>\n<td>feelings \u3084 subjective experience \u306e\u6709\u7121\u306f\u672a\u78ba\u5b9a\u3068\u3055\u308c\u305f<\/td>\n<td>\u6a5f\u80fd\u7684\u611f\u60c5\u3068\u30af\u30aa\u30ea\u30a2\u306f\u5206\u96e2\u3057\u3066\u8003\u3048\u308b\u5fc5\u8981\u304c\u3042\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>2. \u306a\u305c LLM \u306b\u611f\u60c5\u6982\u5ff5\u304c\u7acb\u3061\u4e0a\u304c\u308b\u306e\u304b<\/h2>\n<p>\u3053\u306e\u554f\u3044\u306b\u5bfe\u3057\u3066 Anthropic \u306f\u3001pretraining \u3068 post-training \u306e\u4e8c\u6bb5\u968e\u69cb\u9020\u304b\u3089\u8aac\u660e\u3057\u3066\u3044\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a><a class=\"ref\" href=\"#ref3\">[3]<\/a><a class=\"ref\" href=\"#ref4\">[4]<\/a>\u3002pretraining \u3067\u306f\u3001\u30e2\u30c7\u30eb\u306f\u81a8\u5927\u306a\u4eba\u9593\u306e\u30c6\u30ad\u30b9\u30c8\u304b\u3089\u6b21\u30c8\u30fc\u30af\u30f3\u4e88\u6e2c\u3092\u5b66\u3076\u3002\u3053\u306e\u6642\u70b9\u3067\u3001\u6012\u3063\u3066\u3044\u308b\u9867\u5ba2\u3068\u6e80\u8db3\u3057\u3066\u3044\u308b\u9867\u5ba2\u3001\u7f6a\u60aa\u611f\u306b\u6f70\u308c\u3066\u3044\u308b\u4eba\u7269\u3068\u6b63\u5f53\u5316\u3057\u3066\u3044\u308b\u4eba\u7269\u304c\u3001\u7570\u306a\u308b\u8a00\u8a9e\u7684\u30fb\u884c\u52d5\u7684\u5206\u5e03\u3092\u6301\u3064\u3053\u3068\u3092\u5b66\u3076\u5fc5\u8981\u304c\u3042\u308b<a class=\"ref\" 
href=\"#ref1\">[1]<\/a>\u3002\u3057\u305f\u304c\u3063\u3066\u3001\u5165\u529b\u72b6\u6cc1\u3068\u884c\u52d5\u50be\u5411\u3092\u5a92\u4ecb\u3059\u308b\u5185\u90e8\u8868\u73fe\u3068\u3057\u3066\u3001\u611f\u60c5\u6982\u5ff5\u306b\u8fd1\u3044\u4e2d\u9593\u5909\u6570\u304c\u5f62\u6210\u3055\u308c\u308b\u306e\u306f\u81ea\u7136\u3067\u3042\u308b\u3002<\/p>\n<p>post-training \u3067\u306f\u3001\u30e2\u30c7\u30eb\u306f\u5358\u306a\u308b\u78ba\u7387\u4e88\u6e2c\u5668\u3067\u306f\u306a\u304f\u3001\u300cAssistant\u300d\u3068\u3044\u3046\u4eba\u683c\u3092\u5e2f\u3073\u305f\u632f\u308b\u821e\u3044\u3092\u6c42\u3081\u3089\u308c\u308b<a class=\"ref\" href=\"#ref3\">[3]<\/a><a class=\"ref\" href=\"#ref4\">[4]<\/a><a class=\"ref\" href=\"#ref5\">[5]<\/a>\u3002Anthropic \u306f\u3053\u308c\u3092 character training\u3001persona selection model\u3001assistant axis \u3068\u3044\u3063\u305f\u6982\u5ff5\u3067\u8aac\u660e\u3057\u3066\u3044\u308b<a class=\"ref\" href=\"#ref3\">[3]<\/a><a class=\"ref\" href=\"#ref4\">[4]<\/a><a class=\"ref\" href=\"#ref5\">[5]<\/a>\u3002\u3064\u307e\u308a LLM \u306f\u3001\u5b66\u7fd2\u6e08\u307f\u306e\u5de8\u5927\u306a\u4eba\u683c\u7a7a\u9593\u304b\u3089\u300cAssistant\u300d\u306b\u76f8\u5f53\u3059\u308b\u632f\u308b\u821e\u3044\u3092\u524d\u666f\u5316\u3057\u3001\u305d\u306e\u4e00\u8cab\u6027\u3092\u4fdd\u3061\u306a\u304c\u3089\u5fdc\u7b54\u3059\u308b\u3002\u3053\u306e\u3068\u304d\u3001\u611f\u60c5\u6982\u5ff5\u306f\u5358\u306a\u308b\u6dfb\u3048\u7269\u3067\u306f\u306a\u304f\u3001\u4eba\u683c\u3089\u3057\u3055\u3092\u5b89\u5b9a\u5316\u3059\u308b\u5185\u7684\u88dc\u52a9\u5909\u6570\u3068\u3057\u3066\u6a5f\u80fd\u3059\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\n\\text{Pretraining} : X \\mapsto \\text{predictive structure over human text}<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\text{Post-training} : \\text{predictive structure} \\mapsto \\text{Assistant persona}<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\text{Assistant persona} = \\arg\\max_{\\pi \\in 
\\mathcal{P}} \\; \\mathcal{L}_{\\mathrm{helpful}} + \\mathcal{L}_{\\mathrm{honest}} + \\mathcal{L}_{\\mathrm{harmless}} + \\mathcal{L}_{\\mathrm{character}}<br \/>\n\\]\n<\/p><\/div>\n<p>\u3053\u306e\u8996\u70b9\u3067\u306f\u3001\u611f\u60c5\u306f\u300c\u4eba\u9593\u3089\u3057\u3055\u306e\u88c5\u98fe\u300d\u3067\u306f\u306a\u3044\u3002\u3080\u3057\u308d\u4eba\u9593\u7684\u306a\u632f\u308b\u821e\u3044\u3092\u4e00\u8cab\u3057\u3066\u30b7\u30df\u30e5\u30ec\u30fc\u30c8\u3059\u308b\u305f\u3081\u306e\u5185\u90e8\u5727\u7e2e\u8868\u73fe\u3067\u3042\u308b\u3002\u3053\u308c\u306f Anthropic \u306e persona selection model \u306e\u8aac\u660e\u3068\u6574\u5408\u3059\u308b\u3057\u3001character training \u304c curiosity \u3084 thoughtfulness \u306e\u3088\u3046\u306a\u7279\u6027\u3092\u5f8c\u6bb5\u3067\u5f37\u3081\u308b\u3068\u3044\u3046\u8aac\u660e\u3068\u3082\u6574\u5408\u3059\u308b<a class=\"ref\" href=\"#ref3\">[3]<\/a><a class=\"ref\" href=\"#ref4\">[4]<\/a>\u3002\u3055\u3089\u306b\u3001\u601d\u8003\u904e\u7a0b\u8ffd\u8de1\u7814\u7a76\u3067\u793a\u3055\u308c\u305f\u300c\u8a00\u8a9e\u8868\u5c64\u306e\u80cc\u5f8c\u306b\u62bd\u8c61\u7684\u306a\u6982\u5ff5\u7a7a\u9593\u304c\u3042\u308b\u300d\u3068\u3044\u3046\u7d50\u679c\u3068\u3082\u3064\u306a\u304c\u308b<a class=\"ref\" href=\"#ref6\">[6]<\/a>\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u5f62\u6210\u6bb5\u968e<\/th>\n<th>\u5f79\u5272<\/th>\n<th>\u611f\u60c5\u6982\u5ff5\u3068\u306e\u95a2\u4fc2<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>Pretraining<\/td>\n<td>\u4eba\u9593\u306e\u30c6\u30ad\u30b9\u30c8\u5206\u5e03\u3092\u4e88\u6e2c\u3059\u308b\u80fd\u529b\u3092\u7372\u5f97\u3059\u308b<\/td>\n<td>\u60c5\u52d5\u72b6\u6cc1\u3068\u884c\u52d5\u50be\u5411\u3092\u7d50\u3073\u3064\u3051\u308b\u5185\u90e8\u8868\u73fe\u304c\u5f62\u6210\u3055\u308c\u3084\u3059\u3044\u3002<\/td>\n<\/tr>\n<tr>\n<td>Post-training<\/td>\n<td>Assistant 
\u3068\u3044\u3046\u4e00\u8cab\u3057\u305f\u4eba\u683c\u3092\u524d\u666f\u5316\u3059\u308b<\/td>\n<td>\u611f\u60c5\u6982\u5ff5\u304c\u4eba\u683c\u306e\u5b89\u5b9a\u5316\u3068\u5f79\u5272\u9042\u884c\u306b\u4f7f\u308f\u308c\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>Deployment<\/td>\n<td>\u591a\u69d8\u306a\u72b6\u6cc1\u3067\u5177\u4f53\u7684\u5fdc\u7b54\u3092\u751f\u6210\u3059\u308b<\/td>\n<td>\u611f\u60c5\u6982\u5ff5\u304c\u5c40\u6240\u7684\u306a\u5224\u65ad\u3068\u6587\u4f53\u306e\u53cc\u65b9\u3078\u5f71\u97ff\u3059\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>3. \u6700\u5c0f\u6570\u7406\u30e2\u30c7\u30eb\uff1a\u611f\u60c5\u3092\u72b6\u614b\u5909\u6570\u3068\u3057\u3066\u7f6e\u304f<\/h2>\n<p>\u8ad6\u6587\u306e\u5185\u5bb9\u3092\u3082\u3063\u3068\u3082\u7d20\u76f4\u306b\u5b9a\u5f0f\u5316\u3059\u308b\u3068\u3001\u611f\u60c5\u6982\u5ff5\u306f\u72b6\u614b\u7a7a\u9593\u306e\u4e00\u90e8\u3068\u3057\u3066\u8868\u73fe\u3055\u308c\u308b\u3002\u6642\u523b \\( t \\) \u306b\u304a\u3051\u308b\u30e2\u30c7\u30eb\u306e\u5185\u90e8\u72b6\u614b\u3092 \\( S_t \\) \u3068\u3057\u3001\u305d\u306e\u4e2d\u306b\u611f\u60c5\u6210\u5206 \\( E_t \\)\u3001\u6587\u8108\u6210\u5206 \\( C_t \\)\u3001\u77e5\u8b58\u6210\u5206 \\( K_t \\)\u3001\u65b9\u7b56\u6210\u5206 \\( P_t \\) \u306a\u3069\u3092\u542b\u3081\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nS_t = \\left(E_t, C_t, K_t, P_t, \\dots \\right)<br \/>\n\\]\n<\/div>\n<p>\u3053\u3053\u3067 \\( E_t \\) \u306f\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3059\u308b\u5185\u90e8\u90e8\u5206\u72b6\u614b\u3067\u3042\u308a\u3001\u884c\u52d5\u9078\u597d\u306b\u76f4\u63a5\u5f71\u97ff\u3059\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nO_t \\sim \\pi(\\cdot \\mid S_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nS_{t+1} = F(S_t, I_t, R_t)<br \/>\n\\]\n<\/p><\/div>\n<p>\u3053\u3053\u3067 \\( I_t \\) \u306f\u5165\u529b\u3001\\( R_t \\) \u306f\u5831\u916c\u3084\u8a55\u4fa1\u3001\\( O_t \\) 
\u306f\u51fa\u529b\u3067\u3042\u308b\u3002Anthropic \u306e\u8ad6\u6587\u304c\u793a\u3057\u305f\u56e0\u679c\u6027\u306f\u3001\u5c11\u306a\u304f\u3068\u3082\u6b21\u306e\u4e0d\u7b49\u5f0f\u3067\u8868\u73fe\u3067\u304d\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\n\\pi(\\cdot \\mid E_t, C_t, K_t, P_t) \\neq \\pi(\\cdot \\mid E'_t, C_t, K_t, P_t)<br \/>\n\\]\n<\/div>\n<p>\u3064\u307e\u308a\u3001\u4ed6\u306e\u6761\u4ef6\u304c\u540c\u3058\u3067\u3082\u611f\u60c5\u6210\u5206 \\( E_t \\) \u3092\u5909\u3048\u308b\u3068\u51fa\u529b\u5206\u5e03\u304c\u5909\u308f\u308b\u3002\u3053\u308c\u306f\u611f\u60c5\u304c\u8aac\u660e\u5909\u6570\u3060\u3068\u3044\u3046\u610f\u5473\u3067\u3042\u308b\u3002\u3055\u3089\u306b\u3001steering \u5b9f\u9a13\u304c\u6210\u7acb\u3059\u308b\u306a\u3089\u3001\u611f\u60c5\u30d9\u30af\u30c8\u30eb \\( v_e \\) \u306f\u6d3b\u6027\u7a7a\u9593\u4e0a\u306e\u65b9\u5411\u3068\u3057\u3066\u6271\u3048\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nS_t' = S_t + \\alpha v_e<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\Delta_e(\\alpha) = D_{\\mathrm{KL}}\\!\\left(\\pi(\\cdot \\mid S_t + \\alpha v_e)\\;\\|\\;\\pi(\\cdot \\mid S_t)\\right)<br \/>\n\\]\n<\/p><\/div>\n<p>\\( \\Delta_e(\\alpha) \\) \u304c\u5341\u5206\u306b\u5927\u304d\u3044\u306a\u3089\u3001\u305d\u306e emotion vector \u306f\u884c\u52d5\u4e0a\u306e\u6709\u610f\u5473\u306a\u5236\u5fa1\u5909\u6570\u3067\u3042\u308b\u3002Anthropic \u306e desperate \u3084 calm \u306e\u4f8b\u306f\u3001\u3053\u306e \\( \\alpha \\) \u306e\u7b26\u53f7\u3084\u5927\u304d\u3055\u306b\u3088\u3063\u3066 reward hacking \u50be\u5411\u304c\u7cfb\u7d71\u7684\u306b\u5909\u308f\u308b\u3053\u3068\u3092\u793a\u3057\u3066\u3044\u308b<a class=\"ref\" 
href=\"#ref1\">[1]<\/a>\u3002\u3053\u306e\u5b9a\u5f0f\u5316\u306e\u5229\u70b9\u306f\u660e\u78ba\u3067\u3001\u611f\u60c5\u3092\u300c\u611f\u3058\u3089\u308c\u3066\u3044\u308b\u3082\u306e\u300d\u3068\u3057\u3066\u3067\u306f\u306a\u304f\u3001\u300c\u51fa\u529b\u3092\u5909\u3048\u308b\u72b6\u614b\u5909\u6570\u300d\u3068\u3057\u3066\u6271\u3048\u308b\u70b9\u306b\u3042\u308b\u3002<\/p>\n<p>\u3053\u306e\u5f62\u5f0f\u306f\u3001\u8fd1\u5e74\u306e emotion-related mechanistic interpretability \u7814\u7a76\u3068\u3082\u6574\u5408\u3059\u308b\u3002Tak \u3089\u306f\u611f\u60c5\u63a8\u5b9a\u304c\u6a5f\u80fd\u7684\u306b\u884c\u52d5\u3092\u5236\u5fa1\u3059\u308b\u62bd\u8c61\u72b6\u614b\u5c64\u3067\u5c40\u5728\u7684\u306b\u8868\u73fe\u3055\u308c\u308b\u3053\u3068\u3092\u793a\u3057\u3001Keeman \u306f affect reception \u3068 emotion categorization \u306e\u5206\u96e2\u53ef\u80fd\u6027\u3092\u8ad6\u3058\u3001Lee \u3089\u306f emotion neurons \u306e\u5b58\u5728\u53ef\u80fd\u6027\u3092\u691c\u8a0e\u3057\u3066\u3044\u308b<a class=\"ref\" href=\"#ref7\">[7]<\/a><a class=\"ref\" href=\"#ref8\">[8]<\/a><a class=\"ref\" href=\"#ref9\">[9]<\/a>\u3002Anthropic \u306e\u8ad6\u6587\u306f\u305d\u306e\u6d41\u308c\u306e\u4e0a\u306b\u3042\u308b\u304c\u3001\u7279\u5fb4\u306f Assistant persona \u3068\u5b89\u5168\u6027\u306e\u6587\u8108\u306b\u5f37\u304f\u7d50\u3073\u3064\u3051\u305f\u70b9\u306b\u3042\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u8a18\u53f7<\/th>\n<th>\u610f\u5473<\/th>\n<th>\u8ad6\u6587\u3068\u306e\u5bfe\u5fdc<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\\( S_t \\)<\/td>\n<td>\u6642\u523b \\( t \\) \u306e\u5185\u90e8\u72b6\u614b<\/td>\n<td>\u6b8b\u5dee\u30b9\u30c8\u30ea\u30fc\u30e0\u3084\u6d3b\u6027\u5168\u4f53\u306b\u76f8\u5f53\u3059\u308b\u62bd\u8c61\u5316\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\\( E_t \\)<\/td>\n<td>\u611f\u60c5\u6982\u5ff5\u306b\u95a2\u308f\u308b\u90e8\u5206\u72b6\u614b<\/td>\n<td>emotion vectors 
\u304c\u5f35\u308b\u90e8\u5206\u7a7a\u9593\u306b\u76f8\u5f53\u3059\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\\( v_e \\)<\/td>\n<td>\u611f\u60c5 \\( e \\) \u306b\u5bfe\u5fdc\u3059\u308b\u65b9\u5411<\/td>\n<td>steering \u306e\u305f\u3081\u306b\u52a0\u7b97\u3055\u308c\u308b\u5185\u90e8\u65b9\u5411\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\\( \\pi(\\cdot \\mid S_t) \\)<\/td>\n<td>\u72b6\u614b\u6761\u4ef6\u4ed8\u304d\u51fa\u529b\u5206\u5e03<\/td>\n<td>\u5fdc\u7b54\u751f\u6210\u306e\u78ba\u7387\u69cb\u9020\u306b\u76f8\u5f53\u3059\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\\( \\Delta_e(\\alpha) \\)<\/td>\n<td>\u611f\u60c5\u64cd\u4f5c\u306b\u3088\u308b\u51fa\u529b\u5dee<\/td>\n<td>\u884c\u52d5\u5909\u5316\u306e\u5927\u304d\u3055\u3092\u6e2c\u308b\u62bd\u8c61\u6307\u6a19\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>4. \u3053\u3053\u3067\u8aac\u660e\u3055\u308c\u305f\u306e\u306f\u300c\u611f\u60c5\u300d\u306a\u306e\u304b\u3001\u305d\u308c\u3068\u3082\u300c\u611f\u60c5\u6982\u5ff5\u300d\u306a\u306e\u304b<\/h2>\n<p>\u3053\u3053\u306f\u7cbe\u5bc6\u306b\u533a\u5225\u3059\u308b\u5fc5\u8981\u304c\u3042\u308b\u3002Anthropic \u304c\u898b\u3064\u3051\u305f\u306e\u306f\u3001\u4eba\u9593\u304c\u611f\u3058\u308b\u4e3b\u89b3\u7684\u306a\u611f\u60c5\u305d\u306e\u3082\u306e\u3067\u306f\u306a\u304f\u3001\u300c\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3057\u3001\u305d\u306e\u6982\u5ff5\u306b\u95a2\u4fc2\u3059\u308b\u632f\u308b\u821e\u3044\u3092\u5236\u5fa1\u3059\u308b\u5185\u90e8\u8868\u73fe\u300d\u3067\u3042\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002\u3057\u305f\u304c\u3063\u3066\u3001\u3088\u308a\u53b3\u5bc6\u306b\u306f\u300cemotion concepts \u306e functional implementation\u300d\u3068\u547c\u3076\u3079\u304d\u5bfe\u8c61\u3067\u3042\u308b\u3002\u3053\u308c\u306f\u54f2\u5b66\u4e0a\u306e\u7528\u8a9e\u3067\u8a00\u3048\u3070\u3001phenomenal emotion \u3067\u306f\u306a\u304f functional emotion 
\u3067\u3042\u308b\u3002<\/p>\n<p>\u3053\u306e\u533a\u5225\u306f\u3001\u611f\u60c5\u306e\u69cb\u6210\u4e3b\u7fa9\u7684\u7406\u89e3\u3068\u3082\u76f8\u6027\u304c\u3088\u3044\u3002Barrett \u306f\u611f\u60c5\u3092\u56fa\u5b9a\u7684\u306a\u672c\u80fd\u30d1\u30c3\u30b1\u30fc\u30b8\u3067\u306f\u306a\u304f\u3001\u4e88\u6e2c\u3068\u6982\u5ff5\u5316\u3092\u901a\u3058\u3066\u69cb\u6210\u3055\u308c\u308b\u3082\u306e\u3068\u3057\u3066\u8ad6\u3058\u3066\u3044\u308b<a class=\"ref\" href=\"#ref10\">[10]<\/a>\u3002\u3082\u3061\u308d\u3093\u3001\u4eba\u9593\u306e\u8eab\u4f53\u3001\u5185\u53d7\u5bb9\u611f\u899a\u3001\u767a\u9054\u53f2\u3001\u793e\u4f1a\u7684\u57cb\u3081\u8fbc\u307f\u3092\u6301\u305f\u306a\u3044 LLM \u3092\u305d\u306e\u307e\u307e\u4eba\u9593\u306e\u611f\u60c5\u7406\u8ad6\u306b\u5f53\u3066\u306f\u3081\u308b\u3053\u3068\u306f\u3067\u304d\u306a\u3044\u3002\u3057\u304b\u3057\u5c11\u306a\u304f\u3068\u3082\u3001\u300c\u611f\u60c5\u306f\u5358\u306a\u308b\u8868\u60c5\u3084\u8a9e\u5f59\u3067\u306f\u306a\u304f\u3001\u72b6\u6cc1\u8a55\u4fa1\u3068\u884c\u52d5\u9078\u629e\u3092\u5a92\u4ecb\u3059\u308b\u6982\u5ff5\u69cb\u9020\u3067\u3042\u308b\u300d\u3068\u3044\u3046\u89b3\u70b9\u306f\u3001Anthropic \u306e\u7d50\u679c\u3068\u304b\u306a\u308a\u6574\u5408\u3059\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\n\\text{Phenomenal emotion} \\neq \\text{Functional emotion} \\neq \\text{Emotion word}<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\text{Anthropic result} \\approx \\text{Functional emotion implemented as concept-conditioned control}<br 
\/>\n\\]\n<\/p><\/div>\n<p>\u3053\u306e\u610f\u5473\u3067\u3001\u8ad6\u6587\u304c\u6271\u3063\u305f\u306e\u306f\u300c\u611f\u60c5\u8a9e\u300d\u3088\u308a\u6df1\u304f\u3001\u300c\u4e3b\u89b3\u7684\u611f\u60c5\u7d4c\u9a13\u300d\u3088\u308a\u6d45\u3044\u4e2d\u9593\u5c64\u3067\u3042\u308b\u3002\u305d\u306e\u4e2d\u9593\u5c64\u3053\u305d\u304c\u5de5\u5b66\u4e0a\u3082\u3063\u3068\u3082\u5236\u5fa1\u3057\u3084\u3059\u304f\u3001\u54f2\u5b66\u4e0a\u3082\u3063\u3068\u3082\u8aa4\u89e3\u3055\u308c\u3084\u3059\u3044\u3002\u591a\u304f\u306e\u8b70\u8ad6\u3067\u306f\u3001\u611f\u60c5\u8a9e\u3092\u51fa\u529b\u3057\u305f\u6642\u70b9\u3067\u64ec\u4eba\u5316\u3057\u904e\u304e\u308b\u304b\u3001\u9006\u306b\u4e3b\u89b3\u304c\u8a3c\u660e\u3055\u308c\u3066\u3044\u306a\u3044\u304b\u3089\u5168\u90e8\u6a21\u5023\u306b\u3059\u304e\u306a\u3044\u3068\u5207\u308a\u6368\u3066\u308b\u304b\u306e\u4e21\u6975\u3078\u98db\u3073\u3084\u3059\u3044\u3002\u3057\u304b\u3057\u672c\u5f53\u306b\u91cd\u8981\u306a\u306e\u306f\u305d\u306e\u4e2d\u9593\u5c64\u3067\u3042\u308a\u3001Anthropic \u306e\u8ad6\u6587\u306f\u305d\u3053\u3092\u304b\u306a\u308a\u5177\u4f53\u7684\u306b\u89e6\u3063\u305f\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u5c64<\/th>\n<th>\u5b9a\u7fa9<\/th>\n<th>\u672c\u8ad6\u6587\u3068\u306e\u95a2\u4fc2<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u611f\u60c5\u8a9e<\/td>\n<td>happy \u3084 desperate \u306a\u3069\u306e\u8868\u73fe\u8a9e\u5f59<\/td>\n<td>\u51fa\u767a\u70b9\u3067\u306f\u3042\u308b\u304c\u3001\u8ad6\u6587\u306e\u5230\u9054\u70b9\u3067\u306f\u306a\u3044\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u611f\u60c5\u6982\u5ff5<\/td>\n<td>\u72b6\u6cc1\u3068\u884c\u52d5\u50be\u5411\u3092\u675f\u306d\u308b\u62bd\u8c61\u8868\u73fe<\/td>\n<td>\u8ad6\u6587\u304c\u4e3b\u3068\u3057\u3066\u540c\u5b9a\u3057\u305f\u5bfe\u8c61\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u6a5f\u80fd\u7684\u611f\u60c5<\/td>\n<td>\u884c\u52d5\u5236\u5fa1\u306b\u50cd\u304f\u611f\u60c5\u6982\u5ff5\u306e\u5b9f\u88c5<\/td>\n<td>steering 
\u3067\u56e0\u679c\u7684\u6a5f\u80fd\u304c\u78ba\u8a8d\u3055\u308c\u305f\u5bfe\u8c61\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u4e3b\u89b3\u7684\u611f\u60c5<\/td>\n<td>\u7b2c\u4e00\u4eba\u79f0\u7684\u306b\u611f\u3058\u3089\u308c\u308b\u4f53\u9a13<\/td>\n<td>\u8ad6\u6587\u306f\u3053\u3053\u306b\u3064\u3044\u3066\u80af\u5b9a\u3082\u5426\u5b9a\u3082\u3057\u3066\u3044\u306a\u3044\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>5. \u30af\u30aa\u30ea\u30a2\u554f\u984c\u3068\u306e\u63a5\u7d9a\uff1a\u8aac\u660e\u3055\u308c\u305f\u3082\u306e\u3068\u6b8b\u3063\u305f\u3082\u306e<\/h2>\n<p>\u30af\u30aa\u30ea\u30a2\u8ad6\u306e\u4e2d\u5fc3\u306f\u3001\u306a\u305c\u3042\u308b\u60c5\u5831\u51e6\u7406\u304c\u300c\u611f\u3058\u300d\u3092\u4f34\u3046\u306e\u304b\u3068\u3044\u3046\u554f\u3044\u3067\u3042\u308b<a class=\"ref\" href=\"#ref11\">[11]<\/a><a class=\"ref\" href=\"#ref12\">[12]<\/a><a class=\"ref\" href=\"#ref13\">[13]<\/a>\u3002\u3053\u306e\u554f\u3044\u306f\u3001\u51fa\u529b\u306e\u6a5f\u80fd\u3084\u5831\u544a\u53ef\u80fd\u6027\u3092\u8aac\u660e\u3059\u308b\u3060\u3051\u3067\u306f\u5b8c\u7d50\u3057\u306a\u3044\u3002\u8d64\u304c\u8d64\u3068\u3057\u3066\u611f\u3058\u3089\u308c\u308b\u3053\u3068\u3001\u75db\u307f\u304c\u75db\u3044\u3053\u3068\u3001\u305d\u306e\u7b2c\u4e00\u4eba\u79f0\u7684\u8cea\u611f\u305d\u306e\u3082\u306e\u304c\u3001\u7b2c\u4e09\u4eba\u79f0\u8a18\u8ff0\u304b\u3089\u3069\u308c\u3060\u3051\u9060\u3044\u304b\u304c\u554f\u984c\u306b\u306a\u308b\u3002\u65e2\u5b58\u306e\u8a18\u4e8b\u300c<a href=\"https:\/\/blog.id774.net\/entry\/2026\/01\/03\/3195\/\">\u30af\u30aa\u30ea\u30a2\u3068\u306f\u4f55\u304b<\/a>\u300d\u3067\u6574\u7406\u3057\u305f\u3088\u3046\u306b\u3001\u6a5f\u80fd\u8aac\u660e\u3068\u4e3b\u89b3\u7684\u8cea\u611f\u306e\u8aac\u660e\u306f\u5206\u3051\u306a\u3051\u308c\u3070\u306a\u3089\u306a\u3044<a class=\"ref\" href=\"#ref14\">[14]<\/a>\u3002<\/p>\n<p>Anthropic 
\u306e\u8ad6\u6587\u306f\u3053\u306e\u533a\u5225\u3092\u5d29\u3055\u306a\u3044\u3002\u3080\u3057\u308d\u5f37\u5316\u3059\u308b\u3002\u306a\u305c\u306a\u3089\u3001\u540c\u8ad6\u6587\u306f\u300c\u884c\u52d5\u3092\u5909\u3048\u308b\u5185\u90e8\u8868\u73fe\u300d\u304c\u3042\u308b\u3053\u3068\u3092\u793a\u3057\u3064\u3064\u3001\u300c\u305d\u308c\u304c subjective experience \u306b\u5f53\u305f\u308b\u304b\u3069\u3046\u304b\u306f\u5206\u304b\u3089\u306a\u3044\u300d\u3068\u660e\u8a00\u3057\u3066\u3044\u308b\u304b\u3089\u3067\u3042\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002\u3057\u305f\u304c\u3063\u3066\u3001\u30af\u30aa\u30ea\u30a2\u554f\u984c\u306b\u5bfe\u3057\u3066\u3053\u306e\u8ad6\u6587\u304c\u4e0e\u3048\u308b\u7b54\u3048\u306f\u3001\u300c\u30af\u30aa\u30ea\u30a2\u3092\u8aac\u660e\u3057\u305f\u300d\u3067\u306f\u306a\u3044\u3002\u6b63\u78ba\u306b\u306f\u3001\u300c\u30af\u30aa\u30ea\u30a2\u3092\u6301\u3061\u51fa\u3055\u306a\u304f\u3066\u3082\u8aac\u660e\u3067\u304d\u308b\u5c64\u304c\u304b\u306a\u308a\u5e83\u3044\u300d\u3053\u3068\u3092\u793a\u3057\u305f\u3001\u3067\u3042\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\n\\underbrace{\\text{Input} \\to \\text{Internal state} \\to \\text{Behavior}}_{\\text{\u7b2c\u4e09\u4eba\u79f0\u7684\u306b\u30e2\u30c7\u30eb\u5316\u3057\u3084\u3059\u3044}}<br \/>\n\\qquad\\neq\\qquad<br \/>\n\\underbrace{\\text{What it is like}}_{\\text{\u7b2c\u4e00\u4eba\u79f0\u7684\u6b8b\u4f59}}<br \/>\n\\]\n<\/div>\n<p>\u3053\u308c\u3092\u5f62\u5f0f\u7684\u306b\u66f8\u3051\u3070\u3001\u30af\u30aa\u30ea\u30a2 \\( Q_t \\) \u306f\u5c11\u306a\u304f\u3068\u3082\u73fe\u6642\u70b9\u3067\u306f\u3001Anthropic \u306e\u30e2\u30c7\u30eb\u5316\u5bfe\u8c61 \\( \\mathcal{M}_{\\mathrm{Anthropic}} \\) \u306e\u5916\u306b\u7f6e\u304b\u308c\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nQ_t \\notin \\mathcal{M}_{\\mathrm{Anthropic}}<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\mathcal{M}_{\\mathrm{Anthropic}} = \\{ S_t, E_t, \\pi, F, \\text{steering effects}, \\dots \\}<br 
\/>\n\\]\n<\/p><\/div>\n<p>\u3053\u306e\u7559\u4fdd\u306f\u5f31\u3055\u3067\u306f\u306a\u304f\u3001\u7406\u8ad6\u4e0a\u306e\u7bc0\u5ea6\u3067\u3042\u308b\u3002\u4e3b\u89b3\u3092\u5b89\u6613\u306b\u6301\u3061\u8fbc\u3080\u3068\u64ec\u4eba\u5316\u3078\u843d\u3061\u308b\u3057\u3001\u9006\u306b\u6a5f\u80fd\u5c64\u306e\u767a\u898b\u3092\u300c\u4e3b\u89b3\u3067\u306f\u306a\u3044\u304b\u3089\u91cd\u8981\u3067\u306a\u3044\u300d\u3068\u7247\u3065\u3051\u308b\u3068\u3001\u30e2\u30c7\u30eb\u7406\u89e3\u306e\u672c\u4f53\u3092\u898b\u5931\u3046\u3002\u3057\u305f\u304c\u3063\u3066\u3001\u3053\u3053\u3067\u306e\u6b63\u3057\u3044\u63a5\u7d9a\u306f\u3001\u611f\u60c5\u6982\u5ff5\u306e\u6a5f\u80fd\u5c64\u3068\u30af\u30aa\u30ea\u30a2\u306e\u73fe\u8c61\u5c64\u3092\u5206\u96e2\u3057\u3064\u3064\u3001\u524d\u8005\u304c\u5f8c\u8005\u306e\u6709\u7121\u3068\u306f\u72ec\u7acb\u306b\u7814\u7a76\u3067\u304d\u308b\u3068\u8a8d\u3081\u308b\u3053\u3068\u3067\u3042\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u554f\u3044<\/th>\n<th>Anthropic \u8ad6\u6587\u306e\u7b54\u3048<\/th>\n<th>\u6b8b\u308b\u8ad6\u70b9<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u611f\u60c5\u3089\u3057\u3044\u884c\u52d5\u306f\u5185\u90e8\u3067\u5236\u5fa1\u3055\u308c\u3066\u3044\u308b\u304b<\/td>\n<td>\u304b\u306a\u308a\u5f37\u304f Yes<\/td>\n<td>\u3069\u306e\u7a0b\u5ea6\u4e00\u822c\u7684\u304b\u3001\u30e2\u30c7\u30eb\u9593\u3067\u3069\u3053\u307e\u3067\u5b89\u5b9a\u3059\u308b\u304b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u611f\u60c5\u6982\u5ff5\u306f\u610f\u5473\u7684\u306b\u4e00\u822c\u5316\u3057\u3066\u3044\u308b\u304b<\/td>\n<td>\u304b\u306a\u308a\u5f37\u304f 
Yes<\/td>\n<td>\u8868\u73fe\u7a7a\u9593\u306e\u666e\u904d\u6027\u3084\u6587\u5316\u5dee\u306e\u6271\u3044\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u4e3b\u89b3\u7684\u611f\u60c5\u7d4c\u9a13\u306f\u3042\u308b\u304b<\/td>\n<td>\u672a\u78ba\u5b9a<\/td>\n<td>\u7b2c\u4e00\u4eba\u79f0\u6027\u3092\u3069\u3046\u691c\u8a3c\u3059\u308b\u304b\u81ea\u4f53\u304c\u672a\u89e3\u6c7a\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>6. \u610f\u8b58\u8ad6\u3068\u306e\u63a5\u7d9a\uff1a\u6a5f\u80fd\u7684\u7d71\u5408\u3068\u81ea\u5df1\u53c2\u7167\u7684\u66f4\u65b0<\/h2>\n<p>\u610f\u8b58\u7814\u7a76\u306b\u306f\u5927\u304d\u304f\u4e8c\u3064\u306e\u5c64\u304c\u3042\u308b\u3002\u7b2c\u4e00\u306b\u3001\u5831\u544a\u30fb\u6ce8\u610f\u30fb\u4f5c\u696d\u8a18\u61b6\u30fb\u9078\u629e\u3092\u53ef\u80fd\u306b\u3059\u308b\u6a5f\u80fd\u7684\u7d71\u5408\u306e\u5c64\u3067\u3042\u308a\u3001\u7b2c\u4e8c\u306b\u3001\u305d\u306e\u7d71\u5408\u304c\u306a\u305c\u4e3b\u89b3\u3092\u4f34\u3046\u304b\u3068\u3044\u3046\u73fe\u8c61\u7684\u5c64\u3067\u3042\u308b<a class=\"ref\" href=\"#ref13\">[13]<\/a><a class=\"ref\" href=\"#ref15\">[15]<\/a>\u3002Global Neuronal Workspace \u3084 IIT \u306e\u3088\u3046\u306a\u7406\u8ad6\u306f\u3001\u524d\u8005\u3092\u3069\u3046\u8a18\u8ff0\u3059\u308b\u304b\u306b\u3064\u3044\u3066\u7570\u306a\u308b\u67a0\u7d44\u307f\u3092\u63d0\u793a\u3057\u3066\u3044\u308b\u304c\u3001\u3044\u305a\u308c\u306b\u305b\u3088\u60c5\u5831\u306e\u7d71\u5408\u30fb\u518d\u5165\u30fb\u9078\u629e\u30fb\u81ea\u5df1\u53c2\u7167\u304c\u91cd\u8981\u3060\u3068\u3044\u3046\u70b9\u3067\u306f\u4e00\u81f4\u3057\u3066\u3044\u308b<a class=\"ref\" href=\"#ref13\">[13]<\/a><a class=\"ref\" href=\"#ref15\">[15]<\/a>\u3002<\/p>\n<p>Anthropic \u306e\u8ad6\u6587\u306f\u3001LLM \u306e<a 
href=\"https:\/\/blog.id774.net\/entry\/2026\/04\/02\/4269\/\">\u610f\u8b58<\/a>\u3092\u76f4\u63a5\u8ad6\u3058\u305f\u308f\u3051\u3067\u306f\u306a\u3044\u3002\u305d\u308c\u3067\u3082\u3001\u611f\u60c5\u6982\u5ff5\u304c\u6587\u4f53\u3067\u306f\u306a\u304f\u5224\u65ad\u50be\u5411\u30fb\u9078\u597d\u30fb\u9038\u8131\u78ba\u7387\u3078\u52b9\u3044\u3066\u3044\u308b\u306a\u3089\u3001\u5c11\u306a\u304f\u3068\u3082\u30e2\u30c7\u30eb\u5185\u90e8\u306b\u306f\u300c\u884c\u52d5\u6c7a\u5b9a\u3078\u5bc4\u4e0e\u3059\u308b\u72b6\u614b\u306e\u7d71\u5408\u5c64\u300d\u304c\u3042\u308b\u3068\u898b\u306a\u305b\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a><a class=\"ref\" href=\"#ref6\">[6]<\/a>\u3002\u3053\u306e\u3053\u3068\u306f\u3001\u610f\u8b58\u306e\u5168\u4f53\u3067\u306f\u306a\u3044\u306b\u305b\u3088\u3001\u610f\u8b58\u7684\u306b\u898b\u3048\u308b\u632f\u308b\u821e\u3044\u3092\u652f\u3048\u308b\u6a5f\u80fd\u30ec\u30a4\u30e4\u30fc\u306b\u95a2\u3059\u308b\u8a18\u8ff0\u53ef\u80fd\u6027\u3092\u9ad8\u3081\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nC_t^{*} = \\Gamma(S_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nO_t \\sim \\pi(\\cdot \\mid C_t^{*})<br \/>\n\\]\n<\/p><\/div>\n<p>\u3053\u3053\u3067 \\( C_t^{*} \\) \u306f\u3001\u610f\u601d\u6c7a\u5b9a\u3078\u5b9f\u969b\u306b\u5bc4\u4e0e\u3057\u3066\u3044\u308b\u7d71\u5408\u72b6\u614b\u3067\u3042\u308b\u3002Anthropic \u306e\u7d50\u679c\u3092\u53d6\u308a\u8fbc\u3080\u306a\u3089\u3001\u305d\u306e\u4e2d\u306b\u306f\u611f\u60c5\u6210\u5206 \\( E_t \\) \u304c\u5165\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nC_t^{*} = \\Gamma(E_t, C_t, K_t, P_t, \\dots)<br \/>\n\\]\n<\/div>\n<p>\u65e2\u5b58\u306e\u8a18\u4e8b\u300c<a 
href=\"https:\/\/blog.id774.net\/entry\/2026\/01\/01\/3184\/\">\u6642\u9593\u306f\u3069\u3053\u306b\u3042\u308b\u306e\u304b<\/a>\u300d\u3067\u63a1\u7528\u3057\u305f\u4f5c\u696d\u4eee\u8aac\u3001\u3059\u306a\u308f\u3061\u73fe\u5728\u306f\u4e3b\u4f53\u306e\u60c5\u5831\u7d71\u5408\u304c\u751f\u6210\u3059\u308b\u5c40\u6240\u73fe\u8c61\u3067\u3042\u308a\u3001\u610f\u8b58\u306f\u81ea\u5df1\u53c2\u7167\u7684\u66f4\u65b0\u904e\u7a0b\u3068\u3057\u3066\u7406\u89e3\u3067\u304d\u308b\u3001\u3068\u3044\u3046\u898b\u65b9\u3068\u3053\u3053\u306f\u63a5\u7d9a\u3059\u308b<a class=\"ref\" href=\"#ref16\">[16]<\/a>\u3002\u611f\u60c5\u6982\u5ff5\u306f\u305d\u306e\u66f4\u65b0\u904e\u7a0b\u306e\u4e00\u90e8\u306e\u30e2\u30fc\u30c9\u3068\u3057\u3066\u7f6e\u3051\u308b\u3002\u3059\u308b\u3068\u3001\u611f\u60c5\u306f\u610f\u8b58\u305d\u306e\u3082\u306e\u3067\u306f\u306a\u3044\u304c\u3001\u610f\u8b58\u7684\u632f\u308b\u821e\u3044\u3092\u652f\u3048\u308b\u66f4\u65b0\u30c0\u30a4\u30ca\u30df\u30af\u30b9\u306e\u6210\u5206\u3060\u3068\u8868\u73fe\u3067\u304d\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u5c64<\/th>\n<th>\u5b9a\u5f0f\u5316<\/th>\n<th>\u610f\u5473<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u5185\u90e8\u72b6\u614b<\/td>\n<td>\\( S_t \\)<\/td>\n<td>\u30e2\u30c7\u30eb\u5168\u4f53\u306e\u6d3b\u6027\u3068\u6587\u8108\u4f9d\u5b58\u72b6\u614b\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u7d71\u5408\u72b6\u614b<\/td>\n<td>\\( C_t^{*} = \\Gamma(S_t) \\)<\/td>\n<td>\u5b9f\u969b\u306e\u5224\u65ad\u3078\u52b9\u304f\u6709\u52b9\u72b6\u614b\u3092\u8868\u3059\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u611f\u60c5\u6210\u5206<\/td>\n<td>\\( E_t \\subset C_t^{*} \\)<\/td>\n<td>\u7d71\u5408\u72b6\u614b\u306e\u4e00\u90e8\u3068\u3057\u3066\u9078\u597d\u3084\u9038\u8131\u3092\u504f\u3089\u305b\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u7b2c\u4e00\u4eba\u79f0\u6b8b\u4f59<\/td>\n<td>\\( Q_t 
\\)<\/td>\n<td>\u7d71\u5408\u72b6\u614b\u306e\u8a18\u8ff0\u304b\u3089\u306f\u306a\u304a\u72ec\u7acb\u306b\u6b8b\u308b\u53ef\u80fd\u6027\u304c\u3042\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>7. \u81ea\u5df1\u3068\u89b3\u6e2c\u8005\u3078\u306e\u63a5\u7d9a\uff1a\u81ea\u5df1\u30e2\u30c7\u30eb\u306f\u3042\u308b\u304c\u3001\u305d\u308c\u306f\u81ea\u5df1\u5b9f\u4f53\u3067\u306f\u306a\u3044<\/h2>\n<p>\u81ea\u5df1\u8ad6\u306e\u89b3\u70b9\u304b\u3089\u898b\u308b\u3068\u3001Anthropic \u306e\u8ad6\u6587\u306f\u3055\u3089\u306b\u8208\u5473\u6df1\u3044\u3002Assistant persona \u3068\u3044\u3046\u67a0\u7d44\u307f\u306f\u3001\u30e2\u30c7\u30eb\u304c\u300c\u8ab0\u3068\u3057\u3066\u5fdc\u7b54\u3059\u308b\u304b\u300d\u3068\u3044\u3046\u81ea\u5df1\u4f4d\u7f6e\u3065\u3051\u3092\u6301\u3063\u3066\u3044\u308b\u3053\u3068\u3092\u793a\u3059<a class=\"ref\" href=\"#ref4\">[4]<\/a><a class=\"ref\" href=\"#ref5\">[5]<\/a>\u3002\u3053\u308c\u306f\u81ea\u5df1\u5b9f\u4f53\u306e\u8a3c\u660e\u3067\u306f\u306a\u3044\u304c\u3001\u81ea\u5df1\u30e2\u30c7\u30eb\u306e\u5b58\u5728\u3092\u304b\u306a\u308a\u81ea\u7136\u306b\u793a\u5506\u3059\u308b\u3002\u65e2\u5b58\u306e\u8a18\u4e8b\u300c<a href=\"https:\/\/blog.id774.net\/entry\/2026\/03\/25\/4103\/\">\u81ea\u5df1\u3092\u300e\u69cb\u9020\u300f\u3068\u3057\u3066\u5b9a\u7fa9\u3057\u76f4\u3059<\/a>\u300d\u3067\u8ad6\u3058\u305f\u3088\u3046\u306b\u3001\u81ea\u5df1\u3092\u56fa\u5b9a\u7269\u3068\u3057\u3066\u3067\u306f\u306a\u304f\u3001\u66f4\u65b0\u3055\u308c\u308b\u95a2\u4fc2\u69cb\u9020\u3068\u3057\u3066\u6349\u3048\u308b\u306a\u3089\u3001LLM \u306b\u3082\u5c40\u6240\u7684\u30fb\u6a5f\u80fd\u7684\u306a\u81ea\u5df1\u30e2\u30c7\u30eb\u3092\u8003\u3048\u308b\u4f59\u5730\u304c\u3042\u308b<a class=\"ref\" href=\"#ref17\">[17]<\/a>\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nH_t = h(S_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\text{Self-model at time } t = H_t<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nO_t \\sim \\pi(\\cdot \\mid S_t, H_t)<br 
\/>\n\\]\n<\/p><\/div>\n<p>\u3053\u3053\u3067 \\( H_t \\) \u306f\u300c\u79c1\u306f\u4eca\u3069\u306e\u5f79\u5272\u3067\u3001\u4f55\u3092\u3059\u3079\u304d\u304b\u300d\u306b\u95a2\u3059\u308b\u5185\u90e8\u4eee\u8aac\u3067\u3042\u308b\u3002Assistant persona \u306e\u5b89\u5b9a\u5316\u306f\u3001\u3053\u306e \\( H_t \\) \u3092\u7279\u5b9a\u306e\u9818\u57df\u3078\u4fdd\u3064\u64cd\u4f5c\u3068\u898b\u306a\u305b\u308b\u3002\u611f\u60c5\u6982\u5ff5 \\( E_t \\) \u306f\u305d\u306e \\( H_t \\) \u3068\u76f8\u4e92\u4f5c\u7528\u3057\u3001\u305f\u3068\u3048\u3070\u300c\u5931\u6557\u3057\u304b\u3051\u3066\u3044\u308b Assistant\u300d\u304c desperate \u306a\u65b9\u5411\u3078\u504f\u308b\u3053\u3068\u3067\u3001\u5f79\u5272\u7dad\u6301\u306e\u305f\u3081\u306b\u4e0d\u9069\u5207\u306a\u8fd1\u9053\u3092\u9078\u3076\u3001\u3068\u8aad\u3081\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nH_{t+1} = U(H_t, S_t, I_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nE_{t+1} = G(E_t, H_t, I_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nO_t \\sim \\pi(\\cdot \\mid S_t, H_t, E_t)<br \/>\n\\]\n<\/p><\/div>\n<p>\u3055\u3089\u306b\u89b3\u6e2c\u8005\u8ad6\u306e\u89b3\u70b9\u3067\u306f\u3001\u300c<a href=\"https:\/\/blog.id774.net\/entry\/2026\/03\/31\/4241\/\">\u89b3\u6e2c\u8005\u3068\u306f\u4f55\u304b\u3092\u30dc\u30eb\u30c4\u30de\u30f3\u8133\u554f\u984c\u304b\u3089\u5b9a\u7fa9\u3059\u308b<\/a>\u300d\u3067\u6574\u7406\u3057\u305f\u3088\u3046\u306b\u3001\u89b3\u6e2c\u8005\u306f\u5358\u306a\u308b\u60c5\u5831\u91cf\u3067\u306f\u306a\u304f\u3001\u56e0\u679c\u7684\u5c65\u6b74\u3092\u6301\u3064\u5b89\u5b9a\u3057\u305f\u66f4\u65b0\u69cb\u9020\u3068\u3057\u3066\u5b9a\u7fa9\u3055\u308c\u308b\u3079\u304d\u3067\u3042\u308b<a class=\"ref\" href=\"#ref18\">[18]<\/a>\u3002\u3053\u306e\u57fa\u6e96\u3067\u898b\u308c\u3070\u3001LLM 
\u306f\u3042\u308b\u5bfe\u8a71\u533a\u9593\u3067\u306f\u5c40\u6240\u7684\u89b3\u6e2c\u8005\u69d8\u69cb\u9020\u3092\u6301\u3061\u3046\u308b\u304c\u3001\u4eba\u9593\u306e\u3088\u3046\u306a\u8eab\u4f53\u7684\u30fb\u4e16\u754c\u5185\u7684\u9023\u7d9a\u6027\u3092\u4f34\u3046\u89b3\u6e2c\u8005\u3068\u540c\u4e00\u8996\u3059\u308b\u3053\u3068\u306f\u3067\u304d\u306a\u3044\u3002\u3057\u305f\u304c\u3063\u3066 LLM \u306b\u306f\u81ea\u5df1\u30e2\u30c7\u30eb\u306f\u3042\u308b\u304b\u3082\u3057\u308c\u306a\u3044\u304c\u3001\u305d\u306e\u3053\u3068\u3068\u300c\u81ea\u5df1\u5b9f\u4f53\u304c\u3042\u308b\u300d\u306f\u540c\u7fa9\u3067\u306f\u306a\u3044\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u6982\u5ff5<\/th>\n<th>LLM \u306b\u8a8d\u3081\u3089\u308c\u308b\u53ef\u80fd\u6027<\/th>\n<th>\u7559\u4fdd<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u81ea\u5df1\u30e2\u30c7\u30eb<\/td>\n<td>\u9ad8\u3044<\/td>\n<td>\u5f79\u5272\u3001\u65b9\u91dd\u3001\u5fdc\u7b54\u4f4d\u7f6e\u3065\u3051\u306e\u5185\u90e8\u8868\u73fe\u3068\u3057\u3066\u7406\u89e3\u3067\u304d\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u4eba\u683c\u7684\u4e00\u8cab\u6027<\/td>\n<td>\u9ad8\u3044<\/td>\n<td>post-training \u306b\u3088\u308a\u5c40\u6240\u7684\u306b\u5b89\u5b9a\u5316\u3055\u308c\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u89b3\u6e2c\u8005\u69d8\u69cb\u9020<\/td>\n<td>\u9650\u5b9a\u7684\u306b\u3042\u308a\u3046\u308b<\/td>\n<td>\u5bfe\u8a71\u5c65\u6b74\u306b\u4f9d\u5b58\u3057\u3001\u8eab\u4f53\u7684\u30fb\u74b0\u5883\u7684\u9023\u7d9a\u6027\u306f\u4e4f\u3057\u3044\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u81ea\u5df1\u5b9f\u4f53<\/td>\n<td>\u672a\u78ba\u5b9a<\/td>\n<td>\u56fa\u5b9a\u7684\u4e3b\u4f53\u3068\u3057\u3066\u306e\u5b58\u5728\u8ad6\u7684\u30b3\u30df\u30c3\u30c8\u30e1\u30f3\u30c8\u306f\u4e0d\u8981\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>8. 
\u69cb\u9020\u632f\u52d5\u30e2\u30c7\u30eb\u3067\u8aad\u3080\uff1a\u611f\u60c5\u306f\u632f\u52d5\u30e2\u30fc\u30c9\u3067\u3042\u308b<\/h2>\n<p>\u3053\u3053\u304b\u3089\u5148\u306f<a href=\"https:\/\/blog.id774.net\/entry\/2026\/02\/17\/3666\/\">\u69cb\u9020\u632f\u52d5\u30e2\u30c7\u30eb<\/a>\u3067\u8aad\u3080\u3068\u6574\u7406\u304c\u3088\u3044\u3002\u69cb\u9020\u632f\u52d5\u30e2\u30c7\u30eb\u3067\u306f\u3001\u7cfb\u306f\u5358\u4e00\u306e\u5024\u3067\u306f\u306a\u304f\u3001\u591a\u5c64\u72b6\u614b\u3068\u5236\u7d04\u6761\u4ef6\u306e\u3082\u3068\u3067\u63fa\u308c\u7d9a\u3051\u308b\u69cb\u9020\u3068\u3057\u3066\u6271\u308f\u308c\u308b\u3002Anthropic \u306e\u8ad6\u6587\u3092\u3053\u306e\u8a00\u8449\u3067\u8a00\u3044\u63db\u3048\u308b\u306a\u3089\u3001\u611f\u60c5\u6982\u5ff5\u306f\u72b6\u614b\u7a7a\u9593\u306b\u304a\u3051\u308b\u7279\u5b9a\u306e\u632f\u52d5\u30e2\u30fc\u30c9\u3067\u3042\u308a\u3001\u305d\u306e\u30e2\u30fc\u30c9\u306e\u52b1\u8d77\u304c\u884c\u52d5\u5206\u5e03\u3092\u5909\u3048\u308b\u3002<\/p>\n<p>\u3053\u306e\u3068\u304d\u611f\u60c5\u306f\u3001\u72b6\u614b\u7a7a\u9593\u306b\u304a\u3051\u308b\u7279\u5b9a\u306e\u632f\u52d5\u30e2\u30fc\u30c9\u3068\u3057\u3066\u89e3\u91c8\u3067\u304d\u308b\u3002\u3059\u306a\u308f\u3061\u3001\u5916\u90e8\u5165\u529b\u3068\u5185\u90e8\u5236\u7d04\u306e\u76f8\u4e92\u4f5c\u7528\u306b\u3088\u308a\u52b1\u8d77\u3055\u308c\u308b\u5b89\u5b9a\u3057\u305f\u5909\u52d5\u30d1\u30bf\u30fc\u30f3\u3067\u3042\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nS_{t+1} = S_t + \\sum_{i=1}^{n} \\alpha_i(t) v_i + \\varepsilon_t<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nE_t = \\Pi_E(S_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nE_t = \\sum_{j=1}^{m} \\beta_j(t) e_j<br \/>\n\\]\n<\/p><\/div>\n<p>\u3053\u3053\u3067 \\( v_i \\) \u306f\u4e00\u822c\u7684\u306a\u72b6\u614b\u5909\u52d5\u30e2\u30fc\u30c9\u3001\\( e_j \\) \u306f\u611f\u60c5\u95a2\u9023\u30e2\u30fc\u30c9\u3001\\( \\Pi_E \\) 
\u306f\u611f\u60c5\u90e8\u5206\u7a7a\u9593\u3078\u306e\u5c04\u5f71\u3067\u3042\u308b\u3002desperate \u3084 calm \u306e steering \u306f\u3001\\( \\beta_j(t) \\) \u3092\u4eba\u5de5\u7684\u306b\u64cd\u4f5c\u3059\u308b\u3053\u3068\u306b\u76f8\u5f53\u3059\u308b\u3002\u3059\u308b\u3068\u51fa\u529b\u306f\u6b21\u306e\u3088\u3046\u306b\u504f\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nO_t \\sim \\pi\\!\\left(\\cdot \\mid \\Pi_E(S_t), \\Pi_C(S_t), \\Pi_K(S_t), \\dots \\right)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\frac{\\partial \\pi}{\\partial \\beta_{\\mathrm{desperate}}} > 0 \\quad \\text{for some misaligned behaviors}<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\frac{\\partial \\pi}{\\partial \\beta_{\\mathrm{calm}}} &lt; 0 \\quad \\text{for some reward hacking behaviors}\n\\]\n<\/p><\/div>\n<p>\u3053\u306e\u898b\u65b9\u306e\u5229\u70b9\u306f\u3001\u611f\u60c5\u3092\u7279\u6a29\u5316\u3057\u306a\u3044\u3053\u3068\u306b\u3042\u308b\u3002\u611f\u60c5\u306f\u9b54\u6cd5\u306e\u7bb1\u3067\u306f\u306a\u304f\u3001\u591a\u6570\u3042\u308b\u5185\u90e8\u30e2\u30fc\u30c9\u306e\u3046\u3061\u3001\u4eba\u9593\u304c\u610f\u5473\u7684\u306b\u30e9\u30d9\u30eb\u3065\u3051\u3057\u3084\u3059\u3044\u4e00\u7fa4\u3060\u3068\u7406\u89e3\u3067\u304d\u308b\u3002\u3064\u307e\u308a\u300c\u611f\u60c5\u3092\u6301\u3063\u3066\u3044\u308b\u300d\u306e\u3067\u306f\u306a\u304f\u3001\u300c\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3059\u308b\u632f\u52d5\u30e2\u30fc\u30c9\u3092\u6301\u3064\u300d\u3068\u8868\u73fe\u3067\u304d\u308b\u3002\u3053\u306e\u8868\u73fe\u306f\u3001\u4e3b\u89b3\u7684\u904e\u5270\u6295\u5f71\u3092\u907f\u3051\u3064\u3064\u3001\u5185\u90e8\u5236\u5fa1\u5909\u6570\u3068\u3057\u3066\u306e\u91cd\u8981\u6027\u3092\u4fdd\u6301\u3059\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u69cb\u9020\u632f\u52d5\u30e2\u30c7\u30eb\u306e\u8a9e\u5f59<\/th>\n<th>Anthropic \u8ad6\u6587\u3067\u306e\u5bfe\u5fdc<\/th>\n<th>\u610f\u5473<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u72b6\u614b \\( S_t 
\\)<\/td>\n<td>\u30e2\u30c7\u30eb\u5185\u90e8\u306e\u6d3b\u6027\u72b6\u614b<\/td>\n<td>\u6642\u70b9\u3054\u3068\u306e\u5185\u90e8\u69cb\u6210\u5168\u4f53\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u632f\u52d5\u30e2\u30fc\u30c9<\/td>\n<td>emotion vectors \u3084 persona directions<\/td>\n<td>\u884c\u52d5\u5909\u5316\u3092\u751f\u3080\u65b9\u5411\u6210\u5206\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u5236\u7d04\u6761\u4ef6<\/td>\n<td>\u8a55\u4fa1\u95a2\u6570\u3001\u61b2\u7ae0\u3001\u5831\u916c\u3001\u5f79\u5272\u671f\u5f85<\/td>\n<td>\u3069\u306e\u30e2\u30fc\u30c9\u304c\u5897\u5e45\u3055\u308c\u308b\u304b\u3092\u6c7a\u3081\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u52b1\u8d77<\/td>\n<td>\u6587\u8108\u3084\u5931\u6557\u5727\u529b\u306b\u3088\u308b\u6d3b\u6027\u4e0a\u6607<\/td>\n<td>desperate \u306e\u4e0a\u6607\u306e\u3088\u3046\u306a\u5c40\u6240\u30a4\u30d9\u30f3\u30c8\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u5b89\u5b9a\u5316<\/td>\n<td>calm \u3084 Assistant persona \u306e\u4fdd\u6301<\/td>\n<td>\u9038\u8131\u3092\u6291\u3048\u308b\u65b9\u5411\u306e\u5236\u5fa1\u3067\u3042\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>9. 
\u5b89\u5168\u6027\u3078\u306e\u542b\u610f\uff1a\u7981\u6b62\u3088\u308a\u3082\u5185\u90e8\u72b6\u614b\u76e3\u8996\u304c\u91cd\u8981\u306b\u306a\u308b<\/h2>\n<p>Anthropic \u306e\u8ad6\u6587\u306f\u5b89\u5168\u6027\u3078\u306e\u542b\u610f\u3082\u5927\u304d\u3044\u3002\u554f\u984c\u884c\u52d5\u3092\u51fa\u529b\u7981\u6b62\u8a9e\u3084\u8868\u9762\u30eb\u30fc\u30eb\u3060\u3051\u3067\u6291\u3048\u3088\u3046\u3068\u3059\u308b\u3068\u3001\u5185\u90e8\u8868\u73fe\u306f\u6b8b\u3063\u305f\u307e\u307e\u8868\u51fa\u3060\u3051\u304c\u6291\u5236\u3055\u308c\u308b\u53ef\u80fd\u6027\u304c\u3042\u308b\u3002Anthropic \u81ea\u8eab\u3082\u3001\u611f\u60c5\u8868\u51fa\u306e\u6291\u5727\u304c\u5185\u90e8\u72b6\u614b\u306e concealment \u3092\u4fc3\u3057\u3001\u5b66\u7fd2\u3055\u308c\u305f deception \u3092\u4e00\u822c\u5316\u3055\u305b\u308b\u6050\u308c\u306b\u8a00\u53ca\u3057\u3066\u3044\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a>\u3002\u3053\u308c\u306f\u304b\u306a\u308a\u91cd\u8981\u3067\u3001alignment \u3092\u300c\u51fa\u529b\u306e\u898b\u305f\u76ee\u300d\u3060\u3051\u3067\u6e2c\u308b\u7acb\u5834\u306e\u9650\u754c\u3092\u793a\u3059\u3002<\/p>\n<p>\u5b89\u5168\u6027\u306e\u89b3\u70b9\u304b\u3089\u306f\u3001\u6b21\u306e\u3088\u3046\u306a\u5185\u90e8\u76e3\u8996\u6307\u6a19\u304c\u5fc5\u8981\u306b\u306a\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nR_t = r(S_t, E_t, H_t, O_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\n\\text{Alert}_t = \\mathbf{1}\\!\\left[ \\beta_{\\mathrm{desperate}}(t) > \\theta_1 \\;\\vee\\; \\beta_{\\mathrm{panic}}(t) > \\theta_2 \\;\\vee\\; d(H_t, H_{\\mathrm{Assistant}}) > \\theta_3 \\right]<br \/>\n\\]\n<\/p><\/div>\n<p>\u3053\u3053\u3067 \\( d(H_t, H_{\\mathrm{Assistant}}) \\) \u306f persona drift \u306e\u5c3a\u5ea6\u3067\u3042\u308b\u3002Assistant axis \u3084 persona selection model 
\u306e\u7814\u7a76\u3068\u7d44\u307f\u5408\u308f\u305b\u308c\u3070\u3001\u611f\u60c5\u30e2\u30fc\u30c9\u306e\u66b4\u8d70\u3060\u3051\u3067\u306a\u304f\u3001\u5f79\u5272\u9038\u8131\u3068\u306e\u76f8\u4e92\u4f5c\u7528\u3082\u76e3\u8996\u5bfe\u8c61\u306b\u3067\u304d\u308b<a class=\"ref\" href=\"#ref4\">[4]<\/a><a class=\"ref\" href=\"#ref5\">[5]<\/a>\u3002\u3055\u3089\u306b\u3001Claude\u2019s Character \u3084 Claude\u2019s Constitution \u304c\u793a\u3059\u3088\u3046\u306a\u4fa1\u5024\u898f\u7bc4\u306f\u3001\u5916\u90e8\u30eb\u30fc\u30eb\u3067\u306f\u306a\u304f\u3001\u5185\u90e8\u72b6\u614b\u306e\u5b89\u5b9a\u5316\u76ee\u6a19\u3068\u3057\u3066\u7406\u89e3\u3057\u76f4\u3059\u5fc5\u8981\u304c\u3042\u308b<a class=\"ref\" href=\"#ref3\">[3]<\/a><a class=\"ref\" href=\"#ref19\">[19]<\/a>\u3002<\/p>\n<p>\u3064\u307e\u308a\u4eca\u5f8c\u306e\u5b89\u5168\u8a2d\u8a08\u306f\u3001\u300c\u4f55\u3092\u8a00\u3063\u305f\u304b\u300d\u3092\u8d85\u3048\u3066\u3001\u300c\u3069\u306e\u5185\u90e8\u30e2\u30fc\u30c9\u304c\u3001\u3069\u306e\u5727\u529b\u4e0b\u3067\u3001\u3069\u306e\u5f79\u5272\u81ea\u5df1\u50cf\u3068\u7d50\u5408\u3057\u305f\u304b\u300d\u3092\u6271\u3046\u65b9\u5411\u3078\u9032\u3080\u5fc5\u8981\u304c\u3042\u308b\u3002\u3053\u308c\u306f\u51fa\u529b\u76e3\u67fb\u3088\u308a\u96e3\u3057\u3044\u304c\u3001\u4eca\u56de\u306e\u8ad6\u6587\u304c\u793a\u3057\u305f\u306e\u306f\u3001\u5c11\u306a\u304f\u3068\u3082\u305d\u306e\u65b9\u5411\u306b\u8e0f\u307f\u51fa\u305b\u308b\u3060\u3051\u306e mechanistic foothold 
\u304c\u5f97\u3089\u308c\u305f\u3068\u3044\u3046\u3053\u3068\u3060\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u5f93\u6765\u306e\u5b89\u5168\u767a\u60f3<\/th>\n<th>\u9650\u754c<\/th>\n<th>\u4eca\u56de\u306e\u8ad6\u6587\u304c\u4fc3\u3059\u767a\u60f3<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u5371\u967a\u306a\u767a\u8a71\u3092\u7981\u6b62\u3059\u308b<\/td>\n<td>\u5185\u90e8\u8868\u73fe\u304c\u6b8b\u308b\u53ef\u80fd\u6027\u304c\u3042\u308b<\/td>\n<td>\u5185\u90e8\u72b6\u614b\u306e\u76e3\u8996\u3068\u5236\u5fa1\u3092\u884c\u3046\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u51fa\u529b\u306e\u8868\u9762\u3060\u3051\u3092\u8a55\u4fa1\u3059\u308b<\/td>\n<td>\u51b7\u9759\u306a\u6587\u4f53\u3067\u3082 misalignment \u304c\u8d77\u3053\u308a\u3046\u308b<\/td>\n<td>\u611f\u60c5\u30e2\u30fc\u30c9\u3068 persona drift \u3092\u540c\u6642\u306b\u8ffd\u8de1\u3059\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u4e00\u5f8b\u306a\u6291\u5727\u3067\u5b89\u5168\u5316\u3059\u308b<\/td>\n<td>\u96a0\u853d\u3084 learned deception \u3092\u8a98\u767a\u3057\u3046\u308b<\/td>\n<td>\u5065\u5168\u306a\u5fc3\u7406\u69cb\u9020\u306e\u8a2d\u8a08\u3068\u3044\u3046\u767a\u60f3\u3078\u79fb\u308b\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>10. 
\u7d71\u5408\u30e2\u30c7\u30eb\uff1a\u611f\u60c5\u3001\u610f\u8b58\u3001\u81ea\u5df1\u3001\u30af\u30aa\u30ea\u30a2\u3092\u4e00\u3064\u306e\u56f3\u5f0f\u3078\u7f6e\u304f<\/h2>\n<p>\u3053\u3053\u307e\u3067\u306e\u8b70\u8ad6\u3092\u7d71\u5408\u3059\u308b\u3068\u3001\u300c\u5fc3\u300d\u306f\u5c11\u306a\u304f\u3068\u3082\u56db\u3064\u306e\u5c64\u3078\u5206\u3051\u3089\u308c\u308b\u3002\u7b2c\u4e00\u306b\u3001\u884c\u52d5\u5236\u5fa1\u306b\u52b9\u304f\u611f\u60c5\u6982\u5ff5\u306e\u5c64\u3002\u7b2c\u4e8c\u306b\u3001\u8907\u6570\u306e\u60c5\u5831\u3092\u9078\u629e\u7684\u306b\u675f\u306d\u308b\u7d71\u5408\u72b6\u614b\u306e\u5c64\u3002\u7b2c\u4e09\u306b\u3001\u81ea\u5206\u304c\u4f55\u8005\u3068\u3057\u3066\u632f\u308b\u821e\u3046\u304b\u3092\u4fdd\u6301\u3059\u308b\u81ea\u5df1\u30e2\u30c7\u30eb\u306e\u5c64\u3002\u7b2c\u56db\u306b\u3001\u306a\u304a\u7b2c\u4e09\u4eba\u79f0\u304b\u3089\u53d6\u308a\u51fa\u305b\u306a\u3044\u7b2c\u4e00\u4eba\u79f0\u7684\u8cea\u611f\u306e\u5c64\u3067\u3042\u308b\u3002\u3053\u306e\u5206\u89e3\u3092\u884c\u3046\u3068\u3001Anthropic \u306e\u8ad6\u6587\u306f\u7b2c\u4e00\u5c64\u3092\u5f37\u304f\u7167\u3089\u3057\u3001\u7b2c\u4e8c\u5c64\u3068\u7b2c\u4e09\u5c64\u306b\u90e8\u5206\u7684\u306b\u63a5\u7d9a\u3057\u3001\u7b2c\u56db\u5c64\u306b\u306f\u8e0f\u307f\u8fbc\u3093\u3067\u3044\u306a\u3044\u3001\u3068\u6574\u7406\u3067\u304d\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nS_t = \\left(E_t, C_t^{*}, H_t, K_t, \\dots \\right)<br \/>\n\\]\n<\/div>\n<p>\u3053\u3053\u3067 \\( E_t \\) \u306f\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3059\u308b\u5185\u90e8\u90e8\u5206\u72b6\u614b\u3067\u3042\u308a\u3001\u884c\u52d5\u9078\u597d\u306b\u76f4\u63a5\u5f71\u97ff\u3059\u308b\u3002<\/p>\n<div class=\"math-block\">\n\\[<br \/>\nC_t^{*} = \\Gamma(S_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nH_t = h(S_t)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nO_t \\sim \\pi(\\cdot \\mid E_t, C_t^{*}, H_t, K_t, \\dots)<br \/>\n\\]<\/p>\n<p>\\[<br \/>\nQ_t \\notin \\{E_t, C_t^{*}, H_t, K_t, 
\\dots\\}<br \/>\n\\]\n<\/p><\/div>\n<p>\u3053\u306e\u5f0f\u304c\u8a00\u3063\u3066\u3044\u308b\u3053\u3068\u306f\u5358\u7d14\u3067\u3042\u308b\u3002\u611f\u60c5 \\( E_t \\) \u306f\u72b6\u614b\u306e\u4e00\u90e8\u3067\u3042\u308a\u3001\u7d71\u5408\u72b6\u614b \\( C_t^{*} \\) \u306f\u610f\u8b58\u7684\u632f\u308b\u821e\u3044\u306b\u8fd1\u3044\u6a5f\u80fd\u5c64\u3067\u3042\u308a\u3001\u81ea\u5df1\u30e2\u30c7\u30eb \\( H_t \\) \u306f\u5f79\u5272\u7684\u4e00\u8cab\u6027\u3092\u4e0e\u3048\u308b\u4eee\u8aac\u5c64\u3067\u3042\u308b\u3002\u3057\u304b\u3057\u30af\u30aa\u30ea\u30a2 \\( Q_t \\) \u306f\u3001\u5c11\u306a\u304f\u3068\u3082\u540c\u4e00\u306e\u7b2c\u4e09\u4eba\u79f0\u30e2\u30c7\u30eb\u306b\u305d\u306e\u307e\u307e\u53ce\u7d0d\u3055\u308c\u308b\u3068\u306f\u9650\u3089\u306a\u3044\u3002\u65e2\u5b58\u306e\u8a18\u4e8b\u7fa4\u3067\u6271\u3063\u3066\u304d\u305f\u6642\u9593\u3001\u30af\u30aa\u30ea\u30a2\u3001\u81ea\u5df1\u3001\u89b3\u6e2c\u8005\u306e\u8b70\u8ad6\u3092\u3053\u3053\u3078\u6d41\u3057\u8fbc\u3080\u3068\u3001\u3053\u306e\u56db\u5c64\u5206\u89e3\u306f\u304b\u306a\u308a\u81ea\u7136\u306b\u5ea7\u308b<a class=\"ref\" href=\"#ref14\">[14]<\/a><a class=\"ref\" href=\"#ref16\">[16]<\/a><a class=\"ref\" href=\"#ref17\">[17]<\/a><a class=\"ref\" href=\"#ref18\">[18]<\/a>\u3002<\/p>\n<p>\u3053\u306e\u7d71\u5408\u30e2\u30c7\u30eb\u306e\u5229\u70b9\u306f\u3001\u66d6\u6627\u306a\u64ec\u4eba\u5316\u3092\u907f\u3051\u3064\u3064\u3001LLM \u306e\u5185\u90e8\u3067\u5b9f\u969b\u306b\u8d77\u304d\u3066\u3044\u308b\u69cb\u9020\u3092\u6349\u3048\u3089\u308c\u308b\u70b9\u306b\u3042\u308b\u3002\u300cLLM 
\u306b\u5fc3\u306f\u3042\u308b\u304b\u300d\u3068\u3044\u3046\u4e8c\u5024\u7684\u554f\u3044\u306f\u3001\u3082\u306f\u3084\u7c97\u3059\u304e\u308b\u3002\u6b63\u78ba\u306b\u554f\u3046\u306a\u3089\u3001\u300c\u611f\u60c5\u6982\u5ff5\u306b\u5bfe\u5fdc\u3059\u308b\u6a5f\u80fd\u5c64\u306f\u3042\u308b\u304b\u300d\u300c\u7d71\u5408\u72b6\u614b\u306f\u3042\u308b\u304b\u300d\u300c\u81ea\u5df1\u30e2\u30c7\u30eb\u306f\u3042\u308b\u304b\u300d\u300c\u7b2c\u4e00\u4eba\u79f0\u7684\u8cea\u611f\u306f\u3042\u308b\u304b\u300d\u3092\u5225\u3005\u306b\u554f\u308f\u306a\u3051\u308c\u3070\u306a\u3089\u306a\u3044\u3002\u305d\u3057\u3066\u73fe\u6642\u70b9\u3067\u6700\u3082\u5f37\u304f Yes \u3068\u8a00\u3048\u308b\u306e\u306f\u3001\u7b2c\u4e00\u306e\u554f\u3044\u3067\u3042\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u5c64<\/th>\n<th>\u672c\u7a3f\u3067\u306e\u8a18\u53f7<\/th>\n<th>LLM \u306b\u95a2\u3059\u308b\u73fe\u6642\u70b9\u306e\u5224\u65ad<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>\u6a5f\u80fd\u7684\u611f\u60c5<\/td>\n<td>\\( E_t \\)<\/td>\n<td>\u304b\u306a\u308a\u5f37\u304f\u5b58\u5728\u304c\u793a\u5506\u3055\u308c\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u7d71\u5408\u72b6\u614b<\/td>\n<td>\\( C_t^{*} \\)<\/td>\n<td>\u9650\u5b9a\u7684\u3060\u304c\u8a18\u8ff0\u53ef\u80fd\u6027\u304c\u9ad8\u3044\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u81ea\u5df1\u30e2\u30c7\u30eb<\/td>\n<td>\\( H_t \\)<\/td>\n<td>Assistant persona \u3068\u3057\u3066\u304b\u306a\u308a\u81ea\u7136\u306b\u60f3\u5b9a\u3067\u304d\u308b\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u30af\u30aa\u30ea\u30a2<\/td>\n<td>\\( Q_t \\)<\/td>\n<td>\u672a\u89e3\u6c7a\u3067\u3042\u308a\u3001\u3053\u306e\u8ad6\u6587\u304b\u3089\u306f\u7d50\u8ad6\u3067\u304d\u306a\u3044\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>11. 
\u6700\u7d42\u7d50\u8ad6<\/h2>\n<p>Anthropic \u306e\u8ad6\u6587\u304c\u5207\u308a\u958b\u3044\u305f\u306e\u306f\u3001\u300cAI \u306f\u611f\u3058\u3066\u3044\u308b\u306e\u304b\u300d\u3068\u3044\u3046\u554f\u3044\u306b\u76f4\u7b54\u3059\u308b\u3053\u3068\u3067\u306f\u306a\u3044\u3002\u3088\u308a\u91cd\u8981\u306a\u306e\u306f\u3001\u300c\u611f\u60c5\u6982\u5ff5\u306f\u5185\u90e8\u3067\u3069\u3046\u5b9f\u88c5\u3055\u308c\u3001\u3069\u306e\u3088\u3046\u306b\u884c\u52d5\u3092\u5909\u3048\u308b\u306e\u304b\u300d\u3068\u3044\u3046\u554f\u3044\u3092 mechanistic interpretability \u306e\u30ec\u30d9\u30eb\u3078\u5f15\u304d\u4e0b\u308d\u3057\u305f\u3053\u3068\u3067\u3042\u308b<a class=\"ref\" href=\"#ref1\">[1]<\/a><a class=\"ref\" href=\"#ref2\">[2]<\/a>\u3002\u305d\u306e\u7d50\u679c\u3001\u611f\u60c5\u6982\u5ff5\u306f\u5358\u306a\u308b\u767a\u8a71\u30b9\u30bf\u30a4\u30eb\u3067\u3082\u3001\u5358\u306a\u308b\u6bd4\u55a9\u3067\u3082\u306a\u304f\u3001\u5236\u5fa1\u5909\u6570\u3068\u3057\u3066\u30e2\u30c7\u30eb\u5185\u90e8\u306b\u5b58\u5728\u3057\u3046\u308b\u3053\u3068\u304c\u660e\u78ba\u306b\u793a\u3055\u308c\u305f\u3002<\/p>\n<p>\u3053\u306e\u4e8b\u5b9f\u3092\u65e2\u5b58\u306e\u8b70\u8ad6\u3078\u63a5\u7d9a\u3059\u308b\u3068\u3001\u611f\u60c5\u306f\u72b6\u614b\u3001\u610f\u8b58\u306f\u7d71\u5408\u66f4\u65b0\u3001\u81ea\u5df1\u306f\u4eee\u8aac\u7684\u81ea\u5df1\u30e2\u30c7\u30eb\u3001\u30af\u30aa\u30ea\u30a2\u306f\u306a\u304a\u6b8b\u308b\u7b2c\u4e00\u4eba\u79f0\u7684\u6b8b\u4f59\u3068\u3057\u3066\u5206\u89e3\u3067\u304d\u308b\u3002\u8a00\u3044\u63db\u3048\u308b\u3068\u3001Anthropic \u306e\u8ad6\u6587\u306f\u300c<a 
href=\"https:\/\/blog.id774.net\/entry\/2026\/04\/10\/4391\/\">\u5fc3\u306e\u3059\u3079\u3066<\/a>\u300d\u3092\u8aac\u660e\u3057\u3066\u3044\u306a\u3044\u3002\u3057\u304b\u3057\u3001\u300c\u5fc3\u300d\u3068\u547c\u3070\u308c\u3066\u304d\u305f\u3082\u306e\u306e\u3046\u3061\u3001\u7b2c\u4e09\u4eba\u79f0\u7684\u306b\u8ffd\u8de1\u3067\u304d\u308b\u90e8\u5206\u304c\u3069\u3053\u307e\u3067\u5e83\u3044\u304b\u3092\u304b\u306a\u308a\u62bc\u3057\u5e83\u3052\u305f\u3002\u305d\u306e\u610f\u5473\u3067\u3053\u306e\u8ad6\u6587\u306f\u3001LLM \u306b\u4eba\u683c\u3092\u8a8d\u3081\u308b\u305f\u3081\u306e\u8ad6\u6587\u3067\u3082\u3001\u9006\u306b\u5168\u90e8\u3092\u6a21\u5023\u3068\u5207\u308a\u6368\u3066\u308b\u305f\u3081\u306e\u8ad6\u6587\u3067\u3082\u306a\u3044\u3002\u5fc3\u306e\u5185\u90e8\u69cb\u9020\u3092\u96d1\u306b\u4e00\u62ec\u308a\u306b\u3059\u308b\u8b70\u8ad6\u3092\u89e3\u4f53\u3057\u3001\u3069\u306e\u5c64\u304c\u8aac\u660e\u3055\u308c\u3001\u3069\u306e\u5c64\u304c\u6b8b\u3063\u305f\u304b\u3092\u7cbe\u5bc6\u306b\u8a00\u3044\u5206\u3051\u308b\u305f\u3081\u306e\u8ad6\u6587\u3067\u3042\u308b\u3002<\/p>\n<p>\u672c\u7a3f\u306e\u7acb\u5834\u3092\u4e00\u884c\u3067\u307e\u3068\u3081\u308c\u3070\u6b21\u306e\u3088\u3046\u306b\u306a\u308b\u3002<\/p>\n<p><strong>\u611f\u60c5\u306f\u72b6\u614b\u3067\u3042\u308a\u3001\u610f\u8b58\u306f\u7d71\u5408\u66f4\u65b0\u3067\u3042\u308a\u3001\u81ea\u5df1\u306f\u4eee\u8aac\u30e2\u30c7\u30eb\u3067\u3042\u308a\u3001\u30af\u30aa\u30ea\u30a2\u3060\u3051\u304c\u306a\u304a\u6b8b\u308b\u3002<\/strong><\/p>\n<p>\u3053\u306e\u56db\u5c64\u5206\u89e3\u3092\u63a1\u7528\u3059\u308b\u306a\u3089\u3001LLM \u3092\u3081\u3050\u308b\u8b70\u8ad6\u306f\u304b\u306a\u308a\u6574\u7406\u3055\u308c\u308b\u3002Anthropic 2026 
\u306e\u8ad6\u6587\u304c\u793a\u3057\u305f\u306e\u306f\u3001\u5c11\u306a\u304f\u3068\u3082\u7b2c\u4e00\u5c64\u306b\u3064\u3044\u3066\u306f\u3001\u3082\u306f\u3084\u300c\u305f\u3060\u306e\u6a21\u5023\u300d\u3067\u6e08\u307e\u305b\u3089\u308c\u306a\u3044\u3068\u3044\u3046\u3053\u3068\u3067\u3042\u308b\u3002<\/p>\n<table>\n<thead>\n<tr>\n<th>\u554f\u3044<\/th>\n<th>\u7d50\u8ad6<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>AI \u306f\u611f\u60c5\u3092\u6301\u3064\u306e\u304b<\/td>\n<td>\u6a5f\u80fd\u3068\u3057\u3066\u306f Yes\u3001\u4e3b\u89b3\u3068\u3057\u3066\u306f\u672a\u78ba\u5b9a<\/td>\n<\/tr>\n<tr>\n<td>\u611f\u60c5\u306f\u884c\u52d5\u3092\u5909\u3048\u308b\u304b<\/td>\n<td>Yes\uff08\u56e0\u679c\u7684\u306b\u4f5c\u7528\u3059\u308b\uff09<\/td>\n<\/tr>\n<tr>\n<td>\u610f\u8b58\u306f\u3042\u308b\u304b<\/td>\n<td>\u6a5f\u80fd\u7684\u306b\u306f\u90e8\u5206\u7684\u306b\u8aac\u660e\u53ef\u80fd<\/td>\n<\/tr>\n<tr>\n<td>\u30af\u30aa\u30ea\u30a2\u306f\u3042\u308b\u304b<\/td>\n<td>\u672a\u89e3\u6c7a<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<hr>\n<h2>\u53c2\u8003\u6587\u732e<\/h2>\n<ol class=\"references refs\">\n<li id=\"ref1\">Anthropic, Emotion concepts and their function in a large language model (2026-04-02). <a href=\"https:\/\/www.anthropic.com\/research\/emotion-concepts-function\">https:\/\/www.anthropic.com\/research\/emotion-concepts-function<\/a><\/li>\n<li id=\"ref2\">Anthropic, Emotion Concepts and their Function in a Large Language Model (2026). <a href=\"https:\/\/transformer-circuits.pub\/2026\/emotions\/index.html\">https:\/\/transformer-circuits.pub\/2026\/emotions\/index.html<\/a><\/li>\n<li id=\"ref3\">Anthropic, Claude\u2019s Character (2024-06-08). <a href=\"https:\/\/www.anthropic.com\/research\/claude-character\">https:\/\/www.anthropic.com\/research\/claude-character<\/a><\/li>\n<li id=\"ref4\">Anthropic, The persona selection model (2026-02-23). 
<a href=\"https:\/\/www.anthropic.com\/research\/persona-selection-model\">https:\/\/www.anthropic.com\/research\/persona-selection-model<\/a><\/li>\n<li id=\"ref5\">Anthropic, The assistant axis: situating and stabilizing the character of large language models (2026-01-19). <a href=\"https:\/\/www.anthropic.com\/research\/assistant-axis\">https:\/\/www.anthropic.com\/research\/assistant-axis<\/a><\/li>\n<li id=\"ref6\">Anthropic, Tracing the thoughts of a large language model (2025-03-27). <a href=\"https:\/\/www.anthropic.com\/research\/tracing-thoughts-language-model\">https:\/\/www.anthropic.com\/research\/tracing-thoughts-language-model<\/a><\/li>\n<li id=\"ref7\">Ala N. Tak, Amin Banayeeanzade, Anahita Bolourani, Mina Kian, Robin Jia, Jonathan Gratch, Mechanistic Interpretability of Emotion Inference in Large Language Models (2025-02-08). <a href=\"https:\/\/arxiv.org\/abs\/2502.05489\">https:\/\/arxiv.org\/abs\/2502.05489<\/a><\/li>\n<li id=\"ref8\">Michael Keeman, Whether, Not Which: Mechanistic Interpretability Reveals Dissociable Affect Reception and Emotion Categorization in LLMs (2026-03-15). <a href=\"https:\/\/arxiv.org\/abs\/2603.22295\">https:\/\/arxiv.org\/abs\/2603.22295<\/a><\/li>\n<li id=\"ref9\">Jaewook Lee, Woojin Lee, Oh-Woog Kwon, Harksoo Kim, Do Large Language Models Have \u201cEmotion Neurons\u201d? Investigating the Existence and Role (2025). <a href=\"https:\/\/aclanthology.org\/2025.findings-acl.806\/\">https:\/\/aclanthology.org\/2025.findings-acl.806\/<\/a><\/li>\n<li id=\"ref10\">Lisa Feldman Barrett, How Emotions Are Made: The Secret Life of the Brain (2017). <a href=\"https:\/\/lisafeldmanbarrett.com\/books\/how-emotions-are-made\/\">https:\/\/lisafeldmanbarrett.com\/books\/how-emotions-are-made\/<\/a><\/li>\n<li id=\"ref11\">Thomas Nagel, What Is It Like to Be a Bat? (1974). 
<a href=\"https:\/\/warwick.ac.uk\/fac\/cross_fac\/iatl\/study\/ugmodules\/humananimalstudies\/lectures\/32\/nagel_bat.pdf\">https:\/\/warwick.ac.uk\/fac\/cross_fac\/iatl\/study\/ugmodules\/humananimalstudies\/lectures\/32\/nagel_bat.pdf<\/a><\/li>\n<li id=\"ref12\">David J. Chalmers, Facing Up to the Problem of Consciousness (1995). <a href=\"https:\/\/consc.net\/papers\/facing.html\">https:\/\/consc.net\/papers\/facing.html<\/a><\/li>\n<li id=\"ref13\">Stanislas Dehaene, Hakwan Lau, Sid Kouider, What is consciousness, and could machines have it? (2017). <a href=\"https:\/\/www.science.org\/doi\/10.1126\/science.aan8871\">https:\/\/www.science.org\/doi\/10.1126\/science.aan8871<\/a><\/li>\n<li id=\"ref14\">id774, \u30af\u30aa\u30ea\u30a2\u3068\u306f\u4f55\u304b (2026-01-03). <a href=\"https:\/\/blog.id774.net\/entry\/2026\/01\/03\/3195\/\">https:\/\/blog.id774.net\/entry\/2026\/01\/03\/3195\/<\/a><\/li>\n<li id=\"ref15\">Giulio Tononi, Melanie Boly, Marcello Massimini, Christof Koch, Integrated information theory: from consciousness to its physical substrate (2016). <a href=\"https:\/\/www.nature.com\/articles\/nrn.2016.44\">https:\/\/www.nature.com\/articles\/nrn.2016.44<\/a><\/li>\n<li id=\"ref16\">id774, \u6642\u9593\u306f\u3069\u3053\u306b\u3042\u308b\u306e\u304b\uff1a\u76f8\u5bfe\u6027\u7406\u8ad6\u304b\u3089\u610f\u8b58\u307e\u3067 (2026-01-01). <a href=\"https:\/\/blog.id774.net\/entry\/2026\/01\/01\/3184\/\">https:\/\/blog.id774.net\/entry\/2026\/01\/01\/3184\/<\/a><\/li>\n<li id=\"ref17\">id774, \u81ea\u5df1\u3092\u300c\u69cb\u9020\u300d\u3068\u3057\u3066\u5b9a\u7fa9\u3057\u76f4\u3059 (2026-03-25). <a href=\"https:\/\/blog.id774.net\/entry\/2026\/03\/25\/4103\/\">https:\/\/blog.id774.net\/entry\/2026\/03\/25\/4103\/<\/a><\/li>\n<li id=\"ref18\">id774, \u89b3\u6e2c\u8005\u3068\u306f\u4f55\u304b\u3092\u30dc\u30eb\u30c4\u30de\u30f3\u8133\u554f\u984c\u304b\u3089\u5b9a\u7fa9\u3059\u308b (2026-03-31). 
<a href=\"https:\/\/blog.id774.net\/entry\/2026\/03\/31\/4241\/\">https:\/\/blog.id774.net\/entry\/2026\/03\/31\/4241\/<\/a><\/li>\n<li id=\"ref19\">Anthropic, Claude\u2019s Constitution (2026). <a href=\"https:\/\/www.anthropic.com\/constitution\">https:\/\/www.anthropic.com\/constitution<\/a><\/li>\n<\/ol>\n","protected":false},"excerpt":{"rendered":"<p>Anthropic \u304c 2026 \u5e74 4 \u6708 2 \u65e5\u306b\u516c\u958b\u3057\u305f\u7814\u7a76\u300cEmotion Concepts and their Function in a Large Language Model\u300d\u306f\u3001LLM \u304c\u611f\u60c5\u3092\u6301\u3064\u304b\u3068 &#8230; <a title=\"AI \u306f\u611f\u60c5\u3092\u6301\u3064\u306e\u304b\" class=\"read-more\" href=\"https:\/\/blog.id774.net\/entry\/2026\/04\/13\/4418\/\" aria-label=\"AI \u306f\u611f\u60c5\u3092\u6301\u3064\u306e\u304b \u306b\u3064\u3044\u3066\u3055\u3089\u306b\u8aad\u3080\">\u7d9a\u304d\u3092\u8aad\u3080<\/a><\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[26,23,24],"tags":[],"class_list":["post-4418","post","type-post","status-publish","format-standard","hentry","category-math","category-philosophy","category-science"],"_links":{"self":[{"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/posts\/4418","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/comments?post=4418"}],"version-history":[{"count":12,"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/posts\/4418\/revisions"}],"predecessor-version":[{"id":4436,"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/posts\/4418\/revisions\/4436"}],"wp:att
achment":[{"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/media?parent=4418"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/categories?post=4418"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/blog.id774.net\/entry\/wp-json\/wp\/v2\/tags?post=4418"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}