[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"summaries-facets-categories":3,"article-the-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-expb-premium-post-merge-article":3589,"article-related-the-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-expb-premium-post-merge-article":4043},[4,7,10,13,16,19,21,23,25,27,29,31,34,36,38,40,42,44,46,48,50,52,55,58,60,62,65,67,69,72,74,76,78,80,82,84,86,88,90,92,94,96,98,100,102,104,106,108,110,112,114,116,118,120,122,124,126,128,130,132,134,136,138,140,142,144,146,148,150,152,154,156,158,160,162,164,166,168,170,172,174,176,178,180,182,184,186,188,190,192,194,196,198,200,202,204,206,208,210,212,214,216,218,220,222,224,226,228,230,232,234,236,238,240,242,244,246,248,250,252,254,256,258,260,262,264,266,268,270,272,274,276,278,280,282,284,286,288,290,292,294,296,298,300,302,304,306,308,310,312,314,316,318,320,322,324,326,329,331,333,335,337,339,341,343,345,347,349,351,353,355,357,359,361,363,365,367,369,371,373,375,377,379,381,383,385,387,389,391,393,395,397,399,401,403,405,407,409,411,413,415,417,419,421,423,425,427,429,431,433,435,437,439,441,443,445,447,449,451,453,455,457,459,461,463,465,467,469,471,473,475,477,479,481,483,485,487,489,491,493,495,497,499,501,503,505,507,509,511,513,515,517,519,521,523,525,527,529,531,533,535,537,539,541,543,545,547,549,551,553,555,557,559,561,563,565,567,569,571,573,575,577,579,581,583,585,587,589,591,593,595,597,599,601,603,605,607,609,611,613,615,617,619,621,623,625,627,629,631,633,635,637,639,641,643,645,647,649,651,653,655,657,659,661,663,665,667,669,671,673,675,677,679,681,683,685,687,689,691,693,695,697,699,701,703,705,707,709,711,713,715,717,719,721,723,725,727,729,731,733,735,737,739,741,743,745,747,749,751,753,755,757,759,761,763,765,767,769,771,773,775,777,779,781,783,785,787,789,791,793,795,797,799,801,803,805,807,809,811,813,815,817,819,821,823,825,827,829,831,833,835,837,839,841,843,845,847,849,851,853,855,857,859,861,863,865,867,869,871,873,875,877,879,881,883,885,887,889,891,893,895,897,899,901,903,905,907,909,911,913,915,917,919,921,923,925,927,929,931,933,935,937,939,941,943,945,947,949,951,953,955,957,959,961,963,965,967,969,971,973,975,977,979,981,983,985,987,989,991,993,995,997,999,1001,1003,1005,1007,1009,1011,1013,1015,1017,1019,1021,1023,1025,1027,1029,1031,1033,1035,1037,1039,1041,1043,1045,1047,1049,1051,1053,1055,1057,1059,1061,1063,1065,1067,1069,1071,1073,1075,1077,1079,1081,1083,1085,1087,1089,1091,1093,1095,1097,1099,1101,1103,1105,1107,1109,1111,1113,1115,1117,1119,1121,1123,1125,1127,1129,1131,1133,1135,1137,1139,1141,1143,1145,1147,1149,1151,1153,1155,1157,1159,1161,1163,1165,1167,1169,1171,1173,1175,1177,1179,1181,1183,1185,1187,1189,1191,1193,1195,1197,1199,1201,1203,1205,1207,1209,1211,1213,1215,1217,1219,1221,1223,1225,1227,1229,1231,1233,1235,1237,1239,1241,1243,1245,1247,1249,1251,1253,1255,1257,1259,1261,1263,1265,1267,1269,1271,1273,1275,1277,1279,1281,1283,1285,1287,1289,1291,1293,1295,1297,1299,1301,1303,1305,1307,1309,1311,1313,1315,1317,1319,1321,1323,1325,1327,1329,1331,1333,1335,1337,1339,1341,1343,1345,1347,1349,1351,1353,1355,1357,1359,1361,1363,1365,1367,1369,1371,1373,1375,1377,1379,1381,1383,1385,1387,1389,1391,1393,1395,1397,1399,1401,1403,1405,1407,1409,1411,1413,1415,1417,1419,1421,1423,1425,1427,1429,1431,1433,1435,1437,1439,1441,1443,1445,1447,1449,1451,1453,1455,1457,1459,1461,1463,1465,1467,1469,1471,1473,1475,1477,1479,1481,1483,1485,1487,1489,1491,1493,1495,1497,1499,1501,1503,1505,1507,1509,1511,1513,1515,1517,1519,1521,1523,1525,1527,1529,1531,1533,1535,1537,1539,1541,1543,1545,1547,1549,1551,1553,1555,1557,1559,1561,1563,1565,1567,1569,1571,1573,1575,1577,1579,1581,1583,1585,1587,1589,1591,1593,1595,1597,1599,1601,1603,1605,1607,1609,1611,1613,1615,1617,1619,1621,1623,1625,1627,1629,1631,1633,1635,1637,1639,1641,1643,1645,1647,1649,1651,1653,1655,1657,1659,1661,1663,1665,1667,1669,1671,1673,1675,1677,1679,1681,1683,1685,1687,1689,1691,1693,1695,1697,1699,1701,1703,1705,1707,1709,1711,1713,1715,1717,1719,1721,1723,1725,1727,1729,1731,1733,1735,1737,1739,1741,1743,1745,1747,1749,1751,1753,1755,1757,1759,1761,1763,1765,1767,1769,1771,1773,1775,1777,1779,1781,1783,1785,1787,1789,1791,1793,1795,1797,1799,1801,1803,1805,1807,1809,1811,1813,1815,1817,1819,1821,1823,1825,1827,1829,1831,1833,1835,1837,1839,1841,1843,1845,1847,1849,1851,1853,1855,1857,1859,1861,1863,1865,1867,1869,1871,1873,1875,1877,1879,1881,1883,1885,1887,1889,1891,1893,1895,1897,1899,1901,1903,1905,1907,1909,1911,1913,1915,1917,1919,1921,1923,1925,1927,1929,1931,1933,1935,1937,1939,1941,1943,1945,1947,1949,1951,1953,1955,1957,1959,1961,1963,1965,1967,1969,1971,1973,1975,1977,1979,1981,1983,1985,1987,1989,1991,1993,1995,1997,1999,2001,2003,2005,2007,2009,2011,2013,2015,2017,2019,2021,2023,2025,2027,2029,2031,2033,2035,2037,2039,2041,2043,2045,2047,2049,2051,2053,2055,2057,2059,2061,2063,2065,2067,2069,2071,2073,2075,2077,2079,2081,2083,2085,2087,2089,2091,2093,2095,2097,2099,2101,2103,2105,2107,2109,2111,2113,2115,2117,2119,2121,2123,2125,2127,2129,2131,2133,2135,2137,2139,2141,2143,2145,2147,2149,2151,2153,2155,2157,2159,2161,2163,2165,2167,2169,2171,2173,2175,2177,2179,2181,2183,2185,2187,2189,2191,2193,2195,2197,2199,2201,2203,2205,2207,2209,2211,2213,2215,2217,2219,2221,2223,2225,2227,2229,2231,2233,2235,2237,2239,2241,2243,2245,2247,2249,2251,2253,2255,2257,2259,2261,2263,2265,2267,2269,2271,2273,2275,2277,2279,2281,2283,2285,2287,2289,2291,2293,2295,2297,2299,2301,2303,2305,2307,2309,2311,2313,2315,2317,2319,2321,2323,2325,2327,2329,2331,2333,2335,2337,2339,2341,2343,2345,2347,2349,2351,2353,2355,2357,2359,2361,2363,2365,2367,2369,2371,2373,2375,2377,2379,2381,2383,2385,2387,2389,2391,2393,2395,2397,2399,2401,2403,2405,2407,2409,2411,2413,2415,2417,2419,2421,2423,2425,2427,2429,2431,2433,2435,2437,2439,2441,2443,2445,2447,2449,2451,2453,2455,2457,2459,2461,2463,2465,2467,2469,2471,2473,2475,2477,2479,2481,2483,2485,2487,2489,2491,2493,2495,2497,2499,2501,2503,2505,2507,2509,2511,2513,2515,2517,2519,2521,2523,2525,2527,2529,2531,2533,2535,2537,2539,2541,2543,2545,2547,2549,2551,2553,2555,2557,2559,2561,2563,2565,2567,2569,2571,2573,2575,2577,2579,2581,2583,2585,2587,2589,2591,2593,2595,2597,2599,2601,2603,2605,2607,2609,2611,2613,2615,2617,2619,2621,2623,2625,2627,2629,2631,2633,2635,2637,2639,2641,2643,2645,2647,2649,2651,2653,2655,2657,2659,2661,2663,2665,2667,2669,2671,2673,2675,2677,2679,2681,2683,2685,2687,2689,2691,2693,2695,2697,2699,2701,2703,2705,2707,2709,2711,2713,2715,2717,2719,2721,2723,2725,2727,2729,2731,2733,2735,2737,2739,2741,2743,2745,2747,2749,2751,2753,2755,2757,2759,2761,2763,2765,2767,2769,2771,2773,2775,2777,2779,2781,2783,2785,2787,2789,2791,2793,2795,2797,2799,2801,2803,2805,2807,2809,2811,2813,2815,2817,2819,2821,2823,2825,2827,2829,2831,2833,2835,2837,2839,2841,2843,2845,2847,2849,2851,2853,2855,2857,2859,2861,2863,2865,2867,2869,2871,2873,2875,2877,2879,2881,2883,2885,2887,2889,2891,2893,2895,2897,2899,2901,2903,2905,2907,2909,2911,2913,2915,2917,2919,2921,2923,2925,2927,2929,2931,2933,2935,2937,2939,2941,2943,2945,2947,2949,2951,2953,2955,2957,2959,2961,2963,2965,2967,2969,2971,2973,2975,2977,2979,2981,2983,2985,2987,2989,2991,2993,2995,2997,2999,3001,3003,3005,3007,3009,3011,3013,3015,3017,3019,3021,3023,3025,3027,3029,3031,3033,3035,3037,3039,3041,3043,3045,3047,3049,3051,3053,3055,3057,3059,3061,3063,3065,3067,3069,3071,3073,3075,3077,3079,3081,3083,3085,3087,3089,3091,3093,3095,3097,3099,3101,3103,3105,3107,3109,3111,3113,3115,3117,3119,3121,3123,3125,3127,3129,3131,3133,3135,3137,3139,3141,3143,3145,3147,3149,3151,3153,3155,3157,3159,3161,3163,3165,3167,3169,3171,3173,3175,3177,3179,3181,3183,3185,3187,3189,3191,3193,3195,3197,3199,3201,3203,3205,3207,3209,3211,3213,3215,3217,3219,3221,3223,3225,3227,3229,3231,3233,3235,3237,3239,3241,3243,3245,3247,3249,3251,3253,3255,3257,3259,3261,3263,3265,3267,3269,3271,3273,3275,3277,3279,3281,3283,3285,3287,3289,3291,3293,3295,3297,3299,3301,3303,3305,3307,3309,3311,3313,3315,3317,3319,3321,3323,3325,3327,3329,3331,3333,3335,3337,3339,3341,3343,3345,3347,3349,3351,3353,3355,3357,3359,3361,3363,3365,3367,3369,3371,3373,3375,3377,3379,3381,3383,3385,3387,3389,3391,3393,3395,3397,3399,3401,3403,3405,3407,3409,3411,3413,3415,3417,3419,3421,3423,3425,3427,3429,3431,3433,3435,3437,3439,3441,3443,3445,3447,3449,3451,3453,3455,3457,3459,3461,3463,3465,3467,3469,3471,3473,3475,3477,3479,3481,3483,3485,3487,3489,3491,3493,3495,3497,3499,3501,3503,3505,3507,3509,3511,3513,3515,3517,3519,3521,3523,3525,3527,3529,3531,3533,3535,3537,3539,3541,3543,3545,3547,3549,3551,3553,3555,3557,3559,3561,3563,3565,3567,3569,3571,3573,3575,3577,3579,3581,3583,3585,3587],{"categories":5},[6],"Developer Productivity",{"categories":8},[9],"Business & SaaS",{"categories":11},[12],"AI & LLMs",{"categories":14},[15],"AI Automation",{"categories":17},[18],"Product Strategy",{"categories":20},[12],{"categories":22},[6],{"categories":24},[9],{"categories":26},[],{"categories":28},[12],{"categories":30},[],{"categories":32},[33],"AI News & Trends",{"categories":35},[15],{"categories":37},[33],{"categories":39},[15],{"categories":41},[15],{"categories":43},[12],{"categories":45},[12],{"categories":47},[33],{"categories":49},[12],{"categories":51},[],{"categories":53},[54],"Design & Frontend",{"categories":56},[57],"Data Science & Visualization",{"categories":59},[33],{"categories":61},[],{"categories":63},[64],"Software Engineering",{"categories":66},[12],{"categories":68},[15],{"categories":70},[71],"Marketing & Growth",{"categories":73},[12],{"categories":75},[15],{"categories":77},[],{"categories":79},[],{"categories":81},[54],{"categories":83},[15],{"categories":85},[6],{"categories":87},[54],{"categories":89},[12],{"categories":91},[15],{"categories":93},[33],{"categories":95},[],{"categories":97},[],{"categories":99},[15],{"categories":101},[64],{"categories":103},[],{"categories":105},[9],{"categories":107},[],{"categories":109},[],{"categories":111},[15],{"categories":113},[15],{"categories":115},[12],{"categories":117},[],{"categories":119},[64],{"categories":121},[],{"categories":123},[],{"categories":125},[],{"categories":127},[12],{"categories":129},[71],{"categories":131},[54],{"categories":133},[54],{"categories":135},[12],{"categories":137},[15],{"categories":139},[12],{"categories":141},[12],{"categories":143},[15],{"categories":145},[15],{"categories":147},[57],{"categories":149},[33],{"categories":151},[15],{"categories":153},[71],{"categories":155},[15],{"categories":157},[18],{"categories":159},[],{"categories":161},[15],{"categories":163},[],{"categories":165},[15],{"categories":167},[64],{"categories":169},[54],{"categories":171},[12],{"categories":173},[],{"categories":175},[],{"categories":177},[15],{"categories":179},[],{"categories":181},[12],{"categories":183},[],{"categories":185},[6],{"categories":187},[64],{"categories":189},[9],{"categories":191},[33],{"categories":193},[12],{"categories":195},[],{"categories":197},[12],{"categories":199},[],{"categories":201},[64],{"categories":203},[57],{"categories":205},[],{"categories":207},[12],{"categories":209},[54],{"categories":211},[],{"categories":213},[54],{"categories":215},[15],{"categories":217},[],{"categories":219},[15],{"categories":221},[33],{"categories":223},[9],{"categories":225},[12],{"categories":227},[],{"categories":229},[15],{"categories":231},[12],{"categories":233},[18],{"categories":235},[],{"categories":237},[12],{"categories":239},[15],{"categories":241},[15],{"categories":243},[],{"categories":245},[57],{"categories":247},[12],{"categories":249},[],{"categories":251},[6],{"categories":253},[9],{"categories":255},[12],{"categories":257},[15],{"categories":259},[64],{"categories":261},[12],{"categories":263},[],{"categories":265},[],{"categories":267},[12],{"categories":269},[],{"categories":271},[54],{"categories":273},[],{"categories":275},[12],{"categories":277},[],{"categories":279},[15],{"categories":281},[12],{"categories":283},[54],{"categories":285},[],{"categories":287},[12],{"categories":289},[12],{"categories":291},[9],{"categories":293},[15],{"categories":295},[12],{"categories":297},[54],{"categories":299},[15],{"categories":301},[],{"categories":303},[],{"categories":305},[33],{"categories":307},[],{"categories":309},[12],{"categories":311},[9,71],{"categories":313},[],{"categories":315},[12],{"categories":317},[],{"categories":319},[],{"categories":321},[12],{"categories":323},[],{"categories":325},[12],{"categories":327},[328],"DevOps & Cloud",{"categories":330},[],{"categories":332},[33],{"categories":334},[54],{"categories":336},[],{"categories":338},[33],{"categories":340},[33],{"categories":342},[12],{"categories":344},[71],{"categories":346},[],{"categories":348},[9],{"categories":350},[],{"categories":352},[12,328],{"categories":354},[12],{"categories":356},[12],{"categories":358},[15],{"categories":360},[12,64],{"categories":362},[57],{"categories":364},[12],{"categories":366},[71],{"categories":368},[15],{"categories":370},[15],{"categories":372},[],{"categories":374},[15],{"categories":376},[12,9],{"categories":378},[],{"categories":380},[54],{"categories":382},[54],{"categories":384},[],{"categories":386},[],{"categories":388},[33],{"categories":390},[],{"categories":392},[6],{"categories":394},[64],{"categories":396},[12],{"categories":398},[54],{"categories":400},[15],{"categories":402},[64],{"categories":404},[33],{"categories":406},[54],{"categories":408},[],{"categories":410},[12],{"categories":412},[12],{"categories":414},[12],{"categories":416},[33],{"categories":418},[6],{"categories":420},[12],{"categories":422},[15],{"categories":424},[328],{"categories":426},[54],{"categories":428},[15],{"categories":430},[],{"categories":432},[],{"categories":434},[54],{"categories":436},[33],{"categories":438},[57],{"categories":440},[],{"categories":442},[12],{"categories":444},[12],{"categories":446},[9],{"categories":448},[12],{"categories":450},[12],{"categories":452},[33],{"categories":454},[],{"categories":456},[15],{"categories":458},[64],{"categories":460},[],{"categories":462},[12],{"categories":464},[12],{"categories":466},[15],{"categories":468},[],{"categories":470},[],{"categories":472},[12],{"categories":474},[],{"categories":476},[9],{"categories":478},[15],{"categories":480},[],{"categories":482},[6],{"categories":484},[12],{"categories":486},[9],{"categories":488},[33],{"categories":490},[],{"categories":492},[],{"categories":494},[],{"categories":496},[33],{"categories":498},[33],{"categories":500},[],{"categories":502},[],{"categories":504},[9],{"categories":506},[],{"categories":508},[],{"categories":510},[6],{"categories":512},[],{"categories":514},[71],{"categories":516},[15],{"categories":518},[9],{"categories":520},[15],{"categories":522},[64],{"categories":524},[],{"categories":526},[18],{"categories":528},[54],{"categories":530},[64],{"categories":532},[12],{"categories":534},[15],{"categories":536},[9],{"categories":538},[12],{"categories":540},[],{"categories":542},[],{"categories":544},[64],{"categories":546},[57],{"categories":548},[18],{"categories":550},[15],{"categories":552},[12],{"categories":554},[],{"categories":556},[328],{"categories":558},[],{"categories":560},[15],{"categories":562},[],{"categories":564},[],{"categories":566},[12],{"categories":568},[54],{"categories":570},[71],{"categories":572},[15],{"categories":574},[],{"categories":576},[6],{"categories":578},[],{"categories":580},[33],{"categories":582},[12,328],{"categories":584},[33],{"categories":586},[12],{"categories":588},[9],{"categories":590},[12],{"categories":592},[],{"categories":594},[9],{"categories":596},[],{"categories":598},[64],{"categories":600},[54],{"categories":602},[33],{"categories":604},[57],{"categories":606},[6],{"categories":608},[12],{"categories":610},[64],{"categories":612},[],{"categories":614},[],{"categories":616},[18],{"categories":618},[],{"categories":620},[12],{"categories":622},[],{"categories":624},[54],{"categories":626},[54],{"categories":628},[54],{"categories":630},[],{"categories":632},[],{"categories":634},[33],{"categories":636},[15],{"categories":638},[12],{"categories":640},[12],{"categories":642},[12],{"categories":644},[9],{"categories":646},[12],{"categories":648},[],{"categories":650},[64],{"categories":652},[64],{"categories":654},[9],{"categories":656},[],{"categories":658},[12],{"categories":660},[12],{"categories":662},[9],{"categories":664},[33],{"categories":666},[71],{"categories":668},[15],{"categories":670},[],{"categories":672},[54],{"categories":674},[],{"categories":676},[12],{"categories":678},[],{"categories":680},[9],{"categories":682},[15],{"categories":684},[],{"categories":686},[328],{"categories":688},[57],{"categories":690},[64],{"categories":692},[71],{"categories":694},[64],{"categories":696},[15],{"categories":698},[],{"categories":700},[],{"categories":702},[15],{"categories":704},[6],{"categories":706},[15],{"categories":708},[18],{"categories":710},[9],{"categories":712},[],{"categories":714},[12],{"categories":716},[18],{"categories":718},[12],{"categories":720},[12],{"categories":722},[71],{"categories":724},[54],{"categories":726},[15],{"categories":728},[],{"categories":730},[],{"categories":732},[328],{"categories":734},[64],{"categories":736},[],{"categories":738},[15],{"categories":740},[12],{"categories":742},[54,12],{"categories":744},[6],{"categories":746},[],{"categories":748},[12],{"categories":750},[6],{"categories":752},[54],{"categories":754},[15],{"categories":756},[64],{"categories":758},[],{"categories":760},[12],{"categories":762},[],{"categories":764},[6],{"categories":766},[],{"categories":768},[15],{"categories":770},[18],{"categories":772},[12],{"categories":774},[12],{"categories":776},[54],{"categories":778},[15],{"categories":780},[328],{"categories":782},[54],{"categories":784},[15],{"categories":786},[12],{"categories":788},[12],{"categories":790},[12],{"categories":792},[33],{"categories":794},[],{"categories":796},[18],{"categories":798},[15],{"categories":800},[54],{"categories":802},[15],{"categories":804},[64],{"categories":806},[54],{"categories":808},[15],{"categories":810},[33],{"categories":812},[],{"categories":814},[12],{"categories":816},[54],{"categories":818},[12],{"categories":820},[6],{"categories":822},[33],{"categories":824},[12],{"categories":826},[71],{"categories":828},[12],{"categories":830},[12],{"categories":832},[15],{"categories":834},[15],{"categories":836},[12],{"categories":838},[15],{"categories":840},[54],{"categories":842},[12],{"categories":844},[],{"categories":846},[],{"categories":848},[64],{"categories":850},[],{"categories":852},[6],{"categories":854},[328],{"categories":856},[],{"categories":858},[6],{"categories":860},[9],{"categories":862},[71],{"categories":864},[],{"categories":866},[9],{"categories":868},[],{"categories":870},[],{"categories":872},[],{"categories":874},[],{"categories":876},[],{"categories":878},[12],{"categories":880},[15],{"categories":882},[328],{"categories":884},[6],{"categories":886},[12],{"categories":888},[64],{"categories":890},[18],{"categories":892},[12],{"categories":894},[71],{"categories":896},[12],{"categories":898},[12],{"categories":900},[12],{"categories":902},[12,6],{"categories":904},[64],{"categories":906},[64],{"categories":908},[54],{"categories":910},[12],{"categories":912},[],{"categories":914},[],{"categories":916},[],{"categories":918},[64],{"categories":920},[57],{"categories":922},[33],{"categories":924},[54],{"categories":926},[],{"categories":928},[12],{"categories":930},[12],{"categories":932},[],{"categories":934},[],{"categories":936},[15],{"categories":938},[12],{"categories":940},[9],{"categories":942},[],{"categories":944},[6],{"categories":946},[12],{"categories":948},[6],{"categories":950},[12],{"categories":952},[64],{"categories":954},[71],{"categories":956},[12,54],{"categories":958},[33],{"categories":960},[54],{"categories":962},[],{"categories":964},[328],{"categories":966},[54],{"categories":968},[15],{"categories":970},[],{"categories":972},[],{"categories":974},[],{"categories":976},[],{"categories":978},[64],{"categories":980},[15],{"categories":982},[15],{"categories":984},[328],{"categories":986},[12],{"categories":988},[12],{"categories":990},[12],{"categories":992},[],{"categories":994},[54],{"categories":996},[],{"categories":998},[],{"categories":1000},[15],{"categories":1002},[],{"categories":1004},[],{"categories":1006},[71],{"categories":1008},[71],{"categories":1010},[15],{"categories":1012},[],{"categories":1014},[12],{"categories":1016},[12],{"categories":1018},[64],{"categories":1020},[54],{"categories":1022},[54],{"categories":1024},[15],{"categories":1026},[6],{"categories":1028},[12],{"categories":1030},[54],{"categories":1032},[54],{"categories":1034},[15],{"categories":1036},[15],{"categories":1038},[12],{"categories":1040},[],{"categories":1042},[],{"categories":1044},[12],{"categories":1046},[15],{"categories":1048},[33],{"categories":1050},[64],{"categories":1052},[6],{"categories":1054},[12],{"categories":1056},[],{"categories":1058},[15],{"categories":1060},[15],{"categories":1062},[],{"categories":1064},[6],{"categories":1066},[12],{"categories":1068},[6],{"categories":1070},[6],{"categories":1072},[],{"categories":1074},[],{"categories":1076},[15],{"categories":1078},[15],{"categories":1080},[12],{"categories":1082},[12],{"categories":1084},[33],{"categories":1086},[57],{"categories":1088},[18],{"categories":1090},[33],{"categories":1092},[54],{"categories":1094},[],{"categories":1096},[33],{"categories":1098},[],{"categories":1100},[],{"categories":1102},[],{"categories":1104},[],{"categories":1106},[64],{"categories":1108},[57],{"categories":1110},[],{"categories":1112},[12],{"categories":1114},[12],{"categories":1116},[57],{"categories":1118},[64],{"categories":1120},[],{"categories":1122},[],{"categories":1124},[15],{"categories":1126},[33],{"categories":1128},[33],{"categories":1130},[15],{"categories":1132},[6],{"categories":1134},[12,328],{"categories":1136},[],{"categories":1138},[54],{"categories":1140},[6],{"categories":1142},[15],{"categories":1144},[54],{"categories":1146},[],{"categories":1148},[15],{"categories":1150},[15],{"categories":1152},[12],{"categories":1154},[71],{"categories":1156},[64],{"categories":1158},[54],{"categories":1160},[],{"categories":1162},[15],{"categories":1164},[12],{"categories":1166},[15],{"categories":1168},[15],{"categories":1170},[15],{"categories":1172},[71],{"categories":1174},[15],{"categories":1176},[12],{"categories":1178},[],{"categories":1180},[71],{"categories":1182},[33],{"categories":1184},[15],{"categories":1186},[],{"categories":1188},[],{"categories":1190},[12],{"categories":1192},[15],{"categories":1194},[33],{"categories":1196},[15],{"categories":1198},[],{"categories":1200},[],{"categories":1202},[],{"categories":1204},[15],{"categories":1206},[],{"categories":1208},[],{"categories":1210},[57],{"categories":1212},[12],{"categories":1214},[57],{"categories":1216},[33],{"categories":1218},[12],{"categories":1220},[12],{"categories":1222},[15],{"categories":1224},[12],{"categories":1226},[],{"categories":1228},[],{"categories":1230},[328],{"categories":1232},[],{"categories":1234},[],{"categories":1236},[6],{"categories":1238},[],{"categories":1240},[],{"categories":1242},[],{"categories":1244},[],{"categories":1246},[64],{"categories":1248},[33],{"categories":1250},[71],{"categories":1252},[9],{"categories":1254},[12],{"categories":1256},[12],{"categories":1258},[9],{"categories":1260},[],{"categories":1262},[54],{"categories":1264},[15],{"categories":1266},[9],{"categories":1268},[12],{"categories":1270},[12],{"categories":1272},[6],{"categories":1274},[],{"categories":1276},[6],{"categories":1278},[12],{"categories":1280},[71],{"categories":1282},[15],{"categories":1284},[33],{"categories":1286},[9],{"categories":1288},[12],{"categories":1290},[15],{"categories":1292},[],{"categories":1294},[12],{"categories":1296},[6],{"categories":1298},[12],{"categories":1300},[],{"categories":1302},[33],{"categories":1304},[12],{"categories":1306},[],{"categories":1308},[9],{"categories":1310},[12],{"categories":1312},[],{"categories":1314},[],{"categories":1316},[],{"categories":1318},[12],{"categories":1320},[],{"categories":1322},[328],{"categories":1324},[12],{"categories":1326},[],{"categories":1328},[12],{"categories":1330},[12],{"categories":1332},[12],{"categories":1334},[12,328],{"categories":1336},[12],{"categories":1338},[12],{"categories":1340},[54],{"categories":1342},[15],{"categories":1344},[],{"categories":1346},[15],{"categories":1348},[12],{"categories":1350},[12],{"categories":1352},[12],{"categories":1354},[6],{"categories":1356},[6],{"categories":1358},[64],{"categories":1360},[54],{"categories":1362},[15],{"categories":1364},[],{"categories":1366},[12],{"categories":1368},[33],{"categories":1370},[12],{"categories":1372},[9],{"categories":1374},[],{"categories":1376},[328],{"categories":1378},[54],{"categories":1380},[54],{"categories":1382},[15],{"categories":1384},[33],{"categories":1386},[15],{"categories":1388},[12],{"categories":1390},[],{"categories":1392},[12],{"categories":1394},[],{"categories":1396},[],{"categories":1398},[12],{"categories":1400},[12],{"categories":1402},[12],{"categories":1404},[15],{"categories":1406},[12],{"categories":1408},[],{"categories":1410},[57],{"categories":1412},[15],{"categories":1414},[],{"categories":1416},[],{"categories":1418},[12],{"categories":1420},[33],{"categories":1422},[],{"categories":1424},[54],{"categories":1426},[328],{"categories":1428},[33],{"categories":1430},[64],{"categories":1432},[64],{"categories":1434},[33],{"categories":1436},[33],{"categories":1438},[328],{"categories":1440},[],{"categories":1442},[33],{"categories":1444},[12],{"categories":1446},[6],{"categories":1448},[33],{"categories":1450},[],{"categories":1452},[57],{"categories":1454},[33],{"categories":1456},[64],{"categories":1458},[33],{"categories":1460},[328],{"categories":1462},[12],{"categories":1464},[12],{"categories":1466},[],{"categories":1468},[9],{"categories":1470},[],{"categories":1472},[],{"categories":1474},[12],{"categories":1476},[12],{"categories":1478},[12],{"categories":1480},[12],{"categories":1482},[],{"categories":1484},[57],{"categories":1486},[6],{"categories":1488},[],{"categories":1490},[12],{"categories":1492},[12],{"categories":1494},[328],{"categories":1496},[328],{"categories":1498},[],{"categories":1500},[15],{"categories":1502},[33],{"categories":1504},[33],{"categories":1506},[12],{"categories":1508},[15],{"categories":1510},[],{"categories":1512},[54],{"categories":1514},[12],{"categories":1516},[12],{"categories":1518},[],{"categories":1520},[],{"categories":1522},[328],{"categories":1524},[12],{"categories":1526},[64],{"categories":1528},[9],{"categories":1530},[12],{"categories":1532},[],{"categories":1534},[15],{"categories":1536},[6],{"categories":1538},[6],{"categories":1540},[],{"categories":1542},[12],{"categories":1544},[54],{"categories":1546},[15],{"categories":1548},[],{"categories":1550},[12],{"categories":1552},[12],{"categories":1554},[15],{"categories":1556},[],{"categories":1558},[15],{"categories":1560},[64],{"categories":1562},[],{"categories":1564},[12],{"categories":1566},[],{"categories":1568},[12],{"categories":1570},[],{"categories":1572},[12],{"categories":1574},[12],{"categories":1576},[],{"categories":1578},[12],{"categories":1580},[33],{"categories":1582},[12],{"categories":1584},[12],{"categories":1586},[6],{"categories":1588},[12],{"categories":1590},[33],{"categories":1592},[15],{"categories":1594},[],{"categories":1596},[12],{"categories":1598},[71],{"categories":1600},[],{"categories":1602},[],{"categories":1604},[],{"categories":1606},[6],{"categories":1608},[33],{"categories":1610},[15],{"categories":1612},[12],{"categories":1614},[54],{"categories":1616},[15],{"categories":1618},[],{"categories":1620},[15],{"categories":1622},[],{"categories":1624},[12],{"categories":1626},[15],{"categories":1628},[12],{"categories":1630},[],{"categories":1632},[12],{"categories":1634},[12],{"categories":1636},[33],{"categories":1638},[54],{"categories":1640},[15],{"categories":1642},[54],{"categories":1644},[9],{"categories":1646},[],{"categories":1648},[],{"categories":1650},[12],{"categories":1652},[6],{"categories":1654},[33],{"categories":1656},[],{"categories":1658},[],{"categories":1660},[64],{"categories":1662},[54],{"categories":1664},[],{"categories":1666},[12],{"categories":1668},[],{"categories":1670},[71],{"categories":1672},[12],{"categories":1674},[328],{"categories":1676},[64],{"categories":1678},[],{"categories":1680},[15],{"categories":1682},[12],{"categories":1684},[15],{"categories":1686},[15],{"categories":1688},[12],{"categories":1690},[],{"categories":1692},[6],{"categories":1694},[12],{"categories":1696},[9],{"categories":1698},[64],{"categories":1700},[54],{"categories":1702},[],{"categories":1704},[],{"categories":1706},[],{"categories":1708},[15],{"categories":1710},[54],{"categories":1712},[33],{"categories":1714},[12],{"categories":1716},[33],{"categories":1718},[54],{"categories":1720},[],{"categories":1722},[54],{"categories":1724},[33],{"categories":1726},[9],{"categories":1728},[12],{"categories":1730},[33],{"categories":1732},[71],{"categories":1734},[],{"categories":1736},[],{"categories":1738},[57],{"categories":1740},[12,64],{"categories":1742},[33],{"categories":1744},[12],{"categories":1746},[15],{"categories":1748},[15],{"categories":1750},[12],{"categories":1752},[],{"categories":1754},[64],{"categories":1756},[12],{"categories":1758},[57],{"categories":1760},[15],{"categories":1762},[71],{"categories":1764},[328],{"categories":1766},[],{"categories":1768},[6],{"categories":1770},[15],{"categories":1772},[15],{"categories":1774},[64],{"categories":1776},[12],{"categories":1778},[12],{"categories":1780},[],{"categories":1782},[],{"categories":1784},[],{"categories":1786},[328],{"categories":1788},[33],{"categories":1790},[12],{"categories":1792},[12],{"categories":1794},[12],{"categories":1796},[],{"categories":1798},[57],{"categories":1800},[9],{"categories":1802},[],{"categories":1804},[15],{"categories":1806},[328],{"categories":1808},[],{"categories":1810},[54],{"categories":1812},[54],{"categories":1814},[],{"categories":1816},[64],{"categories":1818},[54],{"categories":1820},[12],{"categories":1822},[],{"categories":1824},[33],{"categories":1826},[12],{"categories":1828},[54],{"categories":1830},[15],{"categories":1832},[33],{"categories":1834},[],{"categories":1836},[15],{"categories":1838},[54],{"categories":1840},[12],{"categories":1842},[],{"categories":1844},[12],{"categories":1846},[12],{"categories":1848},[328],{"categories":1850},[33],{"categories":1852},[57],{"categories":1854},[57],{"categories":1856},[],{"categories":1858},[],{"categories":1860},[],{"categories":1862},[15],{"categories":1864},[64],{"categories":1866},[64],{"categories":1868},[],{"categories":1870},[],{"categories":1872},[12],{"categories":1874},[],{"categories":1876},[15],{"categories":1878},[12],{"categories":1880},[],{"categories":1882},[12],{"categories":1884},[9],{"categories":1886},[12],{"categories":1888},[71],{"categories":1890},[15],{"categories":1892},[12],{"categories":1894},[64],{"categories":1896},[33],{"categories":1898},[15],{"categories":1900},[],{"categories":1902},[33],{"categories":1904},[15],{"categories":1906},[15],{"categories":1908},[],{"categories":1910},[9],{"categories":1912},[15],{"categories":1914},[],{"categories":1916},[12],{"categories":1918},[6],{"categories":1920},[33],{"categories":1922},[328],{"categories":1924},[15],{"categories":1926},[15],{"categories":1928},[6],{"categories":1930},[12],{"categories":1932},[],{"categories":1934},[],{"categories":1936},[54],{"categories":1938},[12,9],{"categories":1940},[],{"categories":1942},[6],{"categories":1944},[57],{"categories":1946},[12],{"categories":1948},[64],{"categories":1950},[12],{"categories":1952},[15],{"categories":1954},[12],{"categories":1956},[12],{"categories":1958},[33],{"categories":1960},[15],{"categories":1962},[],{"categories":1964},[],{"categories":1966},[15],{"categories":1968},[12],{"categories":1970},[328],{"categories":1972},[],{"categories":1974},[12],{"categories":1976},[15],{"categories":1978},[],{"categories":1980},[12],{"categories":1982},[71],{"categories":1984},[57],{"categories":1986},[15],{"categories":1988},[12],{"categories":1990},[328],{"categories":1992},[],{"categories":1994},[12],{"categories":1996},[71],{"categories":1998},[54],{"categories":2000},[12],{"categories":2002},[],{"categories":2004},[71],{"categories":2006},[33],{"categories":2008},[12],{"categories":2010},[12],{"categories":2012},[6],{"categories":2014},[],{"categories":2016},[],{"categories":2018},[54],{"categories":2020},[12],{"categories":2022},[57],{"categories":2024},[71],{"categories":2026},[71],{"categories":2028},[33],{"categories":2030},[],{"categories":2032},[],{"categories":2034},[12],{"categories":2036},[],{"categories":2038},[12,64],{"categories":2040},[33],{"categories":2042},[15],{"categories":2044},[64],{"categories":2046},[12],{"categories":2048},[6],{"categories":2050},[],{"categories":2052},[],{"categories":2054},[6],{"categories":2056},[71],{"categories":2058},[12],{"categories":2060},[],{"categories":2062},[54,12],{"categories":2064},[328],{"categories":2066},[6],{"categories":2068},[],{"categories":2070},[9],{"categories":2072},[9],{"categories":2074},[12],{"categories":2076},[64],{"categories":2078},[15],{"categories":2080},[33],{"categories":2082},[71],{"categories":2084},[54],{"categories":2086},[12],{"categories":2088},[12],{"categories":2090},[12],{"categories":2092},[6],{"categories":2094},[12],{"categories":2096},[15],{"categories":2098},[33],{"categories":2100},[],{"categories":2102},[],{"categories":2104},[57],{"categories":2106},[64],{"categories":2108},[12],{"categories":2110},[54],{"categories":2112},[57],{"categories":2114},[12],{"categories":2116},[12],{"categories":2118},[15],{"categories":2120},[15],{"categories":2122},[12,9],{"categories":2124},[],{"categories":2126},[54],{"categories":2128},[],{"categories":2130},[12],{"categories":2132},[33],{"categories":2134},[6],{"categories":2136},[6],{"categories":2138},[15],{"categories":2140},[12],{"categories":2142},[9],{"categories":2144},[64],{"categories":2146},[71],{"categories":2148},[],{"categories":2150},[33],{"categories":2152},[12],{"categories":2154},[12],{"categories":2156},[33],{"categories":2158},[64],{"categories":2160},[12],{"categories":2162},[15],{"categories":2164},[33],{"categories":2166},[12],{"categories":2168},[54],{"categories":2170},[12],{"categories":2172},[12],{"categories":2174},[328],{"categories":2176},[18],{"categories":2178},[15],{"categories":2180},[12],{"categories":2182},[33],{"categories":2184},[15],{"categories":2186},[71],{"categories":2188},[12],{"categories":2190},[],{"categories":2192},[12],{"categories":2194},[],{"categories":2196},[],{"categories":2198},[],{"categories":2200},[9],{"categories":2202},[12],{"categories":2204},[15],{"categories":2206},[33],{"categories":2208},[33],{"categories":2210},[33],{"categories":2212},[33],{"categories":2214},[],{"categories":2216},[6],{"categories":2218},[15],{"categories":2220},[33],{"categories":2222},[6],{"categories":2224},[15],{"categories":2226},[12],{"categories":2228},[12,15],{"categories":2230},[15],{"categories":2232},[328],{"categories":2234},[33],{"categories":2236},[33],{"categories":2238},[15],{"categories":2240},[12],{"categories":2242},[],{"categories":2244},[33],{"categories":2246},[71],{"categories":2248},[6],{"categories":2250},[12],{"categories":2252},[12],{"categories":2254},[],{"categories":2256},[64],{"categories":2258},[],{"categories":2260},[6],{"categories":2262},[15],{"categories":2264},[33],{"categories":2266},[12],{"categories":2268},[33],{"categories":2270},[6],{"categories":2272},[33],{"categories":2274},[33],{"categories":2276},[],{"categories":2278},[9],{"categories":2280},[15],{"categories":2282},[33],{"categories":2284},[33],{"categories":2286},[33],{"categories":2288},[33],{"categories":2290},[33],{"categories":2292},[33],{"categories":2294},[33],{"categories":2296},[33],{"categories":2298},[33],{"categories":2300},[33],{"categories":2302},[57],{"categories":2304},[6],{"categories":2306},[12],{"categories":2308},[12],{"categories":2310},[],{"categories":2312},[12,6],{"categories":2314},[],{"categories":2316},[15],{"categories":2318},[33],{"categories":2320},[15],{"categories":2322},[12],{"categories":2324},[12],{"categories":2326},[12],{"categories":2328},[12],{"categories":2330},[12],{"categories":2332},[15],{"categories":2334},[9],{"categories":2336},[54],{"categories":2338},[33],{"categories":2340},[12],{"categories":2342},[],{"categories":2344},[],{"categories":2346},[15],{"categories":2348},[54],{"categories":2350},[12],{"categories":2352},[],{"categories":2354},[],{"categories":2356},[71],{"categories":2358},[12],{"categories":2360},[],{"categories":2362},[],{"categories":2364},[6],{"categories":2366},[9],{"categories":2368},[12],{"categories":2370},[9],{"categories":2372},[54],{"categories":2374},[],{"categories":2376},[33],{"categories":2378},[],{"categories":2380},[54],{"categories":2382},[12],{"categories":2384},[71],{"categories":2386},[],{"categories":2388},[71],{"categories":2390},[],{"categories":2392},[],{"categories":2394},[15],{"categories":2396},[],{"categories":2398},[9],{"categories":2400},[6],{"categories":2402},[54],{"categories":2404},[64],{"categories":2406},[],{"categories":2408},[],{"categories":2410},[12],{"categories":2412},[6],{"categories":2414},[71],{"categories":2416},[],{"categories":2418},[15],{"categories":2420},[15],{"categories":2422},[33],{"categories":2424},[12],{"categories":2426},[15],{"categories":2428},[12],{"categories":2430},[15],{"categories":2432},[12],{"categories":2434},[18],{"categories":2436},[33],{"categories":2438},[],{"categories":2440},[71],{"categories":2442},[64],{"categories":2444},[15],{"categories":2446},[],{"categories":2448},[12],{"categories":2450},[15],{"categories":2452},[9],{"categories":2454},[6],{"categories":2456},[12],{"categories":2458},[54],{"categories":2460},[64],{"categories":2462},[64],{"categories":2464},[12],{"categories":2466},[57],{"categories":2468},[12],{"categories":2470},[15],{"categories":2472},[9],{"categories":2474},[15],{"categories":2476},[12],{"categories":2478},[12],{"categories":2480},[15],{"categories":2482},[33],{"categories":2484},[],{"categories":2486},[6],{"categories":2488},[12],{"categories":2490},[15],{"categories":2492},[12],{"categories":2494},[12],{"categories":2496},[],{"categories":2498},[54],{"categories":2500},[9],{"categories":2502},[33],{"categories":2504},[12],{"categories":2506},[12],{"categories":2508},[54],{"categories":2510},[71],{"categories":2512},[57],{"categories":2514},[12],{"categories":2516},[33],{"categories":2518},[12],{"categories":2520},[15],{"categories":2522},[328],{"categories":2524},[12],{"categories":2526},[15],{"categories":2528},[57],{"categories":2530},[],{"categories":2532},[15],{"categories":2534},[64],{"categories":2536},[54],{"categories":2538},[12],{"categories":2540},[6],{"categories":2542},[9],{"categories":2544},[64],{"categories":2546},[],{"categories":2548},[15],{"categories":2550},[12],{"categories":2552},[],{"categories":2554},[33],{"categories":2556},[],{"categories":2558},[33],{"categories":2560},[12],{"categories":2562},[15],{"categories":2564},[15],{"categories":2566},[15],{"categories":2568},[],{"categories":2570},[],{"categories":2572},[12],{"categories":2574},[12],{"categories":2576},[],{"categories":2578},[54],{"categories":2580},[15],{"categories":2582},[71],{"categories":2584},[6],{"categories":2586},[],{"categories":2588},[],{"categories":2590},[33],{"categories":2592},[64],{"categories":2594},[12],{"categories":2596},[12],{"categories":2598},[12],{"categories":2600},[64],{"categories":2602},[33],{"categories":2604},[54],{"categories":2606},[12],{"categories":2608},[12],{"categories":2610},[12],{"categories":2612},[33],{"categories":2614},[12],{"categories":2616},[33],{"categories":2618},[15],{"categories":2620},[15],{"categories":2622},[64],{"categories":2624},[15],{"categories":2626},[12],{"categories":2628},[64],{"categories":2630},[54],{"categories":2632},[],{"categories":2634},[15],{"categories":2636},[],{"categories":2638},[],{"categories":2640},[],{"categories":2642},[9],{"categories":2644},[12],{"categories":2646},[15],{"categories":2648},[6],{"categories":2650},[15],{"categories":2652},[71],{"categories":2654},[],{"categories":2656},[15],{"categories":2658},[],{"categories":2660},[6],{"categories":2662},[15],{"categories":2664},[],{"categories":2666},[15],{"categories":2668},[12],{"categories":2670},[33],{"categories":2672},[12],{"categories":2674},[15],{"categories":2676},[33],{"categories":2678},[15],{"categories":2680},[64],{"categories":2682},[54],{"categories":2684},[6],{"categories":2686},[],{"categories":2688},[15],{"categories":2690},[54],{"categories":2692},[328],{"categories":2694},[33],{"categories":2696},[12],{"categories":2698},[54],{"categories":2700},[6],{"categories":2702},[],{"categories":2704},[15],{"categories":2706},[15],{"categories":2708},[12],{"categories":2710},[],{"categories":2712},[15],{"categories":2714},[18],{"categories":2716},[33],{"categories":2718},[15],{"categories":2720},[9],{"categories":2722},[],{"categories":2724},[12],{"categories":2726},[18],{"categories":2728},[12],{"categories":2730},[15],{"categories":2732},[33],{"categories":2734},[6],{"categories":2736},[328],{"categories":2738},[12],{"categories":2740},[12],{"categories":2742},[12],{"categories":2744},[33],{"categories":2746},[9],{"categories":2748},[12],{"categories":2750},[54],{"categories":2752},[33],{"categories":2754},[328],{"categories":2756},[12],{"categories":2758},[],{"categories":2760},[],{"categories":2762},[328],{"categories":2764},[57],{"categories":2766},[15],{"categories":2768},[15],{"categories":2770},[33],{"categories":2772},[12],{"categories":2774},[6],{"categories":2776},[54],{"categories":2778},[15],{"categories":2780},[12],{"categories":2782},[71],{"categories":2784},[12],{"categories":2786},[15],{"categories":2788},[],{"categories":2790},[12],{"categories":2792},[12],{"categories":2794},[33],{"categories":2796},[6],{"categories":2798},[],{"categories":2800},[12],{"categories":2802},[12],{"categories":2804},[64],{"categories":2806},[54],{"categories":2808},[12,15],{"categories":2810},[71,9],{"categories":2812},[12],{"categories":2814},[],{"categories":2816},[15],{"categories":2818},[],{"categories":2820},[64],{"categories":2822},[12],{"categories":2824},[33],{"categories":2826},[],{"categories":2828},[15],{"categories":2830},[],{"categories":2832},[54],{"categories":2834},[15],{"categories":2836},[6],{"categories":2838},[15],{"categories":2840},[12],{"categories":2842},[328],{"categories":2844},[71],{"categories":2846},[9],{"categories":2848},[9],{"categories":2850},[6],{"categories":2852},[6],{"categories":2854},[12],{"categories":2856},[15],{"categories":2858},[12],{"categories":2860},[12],{"categories":2862},[6],{"categories":2864},[12],{"categories":2866},[71],{"categories":2868},[33],{"categories":2870},[12],{"categories":2872},[15],{"categories":2874},[12],{"categories":2876},[],{"categories":2878},[64],{"categories":2880},[],{"categories":2882},[15],{"categories":2884},[6],{"categories":2886},[],{"categories":2888},[328],{"categories":2890},[12],{"categories":2892},[],{"categories":2894},[33],{"categories":2896},[15],{"categories":2898},[64],{"categories":2900},[12],{"categories":2902},[15],{"categories":2904},[64],{"categories":2906},[15],{"categories":2908},[33],{"categories":2910},[6],{"categories":2912},[33],{"categories":2914},[64],{"categories":2916},[12],{"categories":2918},[54],{"categories":2920},[12],{"categories":2922},[12],{"categories":2924},[12],{"categories":2926},[12],{"categories":2928},[15],{"categories":2930},[12],{"categories":2932},[15],{"categories":2934},[12],{"categories":2936},[6],{"categories":2938},[12],{"categories":2940},[15],{"categories":2942},[54],{"categories":2944},[6],{"categories":2946},[15],{"categories":2948},[54],{"categories":2950},[],{"categories":2952},[12],{"categories":2954},[12],{"categories":2956},[64],{"categories":2958},[],{"categories":2960},[15],{"categories":2962},[71],{"categories":2964},[12],{"categories":2966},[33],{"categories":2968},[71],{"categories":2970},[15],{"categories":2972},[9],{"categories":2974},[9],{"categories":2976},[12],{"categories":2978},[6],{"categories":2980},[],{"categories":2982},[12],{"categories":2984},[],{"categories":2986},[6],{"categories":2988},[12],{"categories":2990},[15],{"categories":2992},[15],{"categories":2994},[],{"categories":2996},[64],{"categories":2998},[64],{"categories":3000},[71],{"categories":3002},[54],{"categories":3004},[],{"categories":3006},[12],{"categories":3008},[6],{"categories":3010},[12],{"categories":3012},[64],{"categories":3014},[6],{"categories":3016},[33],{"categories":3018},[33],{"categories":3020},[],{"categories":3022},[33],{"categories":3024},[15],{"categories":3026},[54],{"categories":3028},[57],{"categories":3030},[12],{"categories":3032},[],{"categories":3034},[33],{"categories":3036},[64],{"categories":3038},[9],{"categories":3040},[12],{"categories":3042},[6],{"categories":3044},[328],{"categories":3046},[6],{"categories":3048},[],{"categories":3050},[],{"categories":3052},[33],{"categories":3054},[],{"categories":3056},[15],{"categories":3058},[15],{"categories":3060},[15],{"categories":3062},[],{"categories":3064},[12],{"categories":3066},[],{"categories":3068},[33],{"categories":3070},[6],{"categories":3072},[54],{"categories":3074},[12],{"categories":3076},[33],{"categories":3078},[33],{"categories":3080},[],{"categories":3082},[33],{"categories":3084},[6],{"categories":3086},[12],{"categories":3088},[],{"categories":3090},[15],{"categories":3092},[15],{"categories":3094},[6],{"categories":3096},[],{"categories":3098},[],{"categories":3100},[],{"categories":3102},[54],{"categories":3104},[15],{"categories":3106},[12],{"categories":3108},[],{"categories":3110},[],{"categories":3112},[],{"categories":3114},[54],{"categories":3116},[],{"categories":3118},[6],{"categories":3120},[],{"categories":3122},[],{"categories":3124},[54],{"categories":3126},[12],{"categories":3128},[33],{"categories":3130},[],{"categories":3132},[71],{"categories":3134},[33],{"categories":3136},[71],{"categories":3138},[12],{"categories":3140},[],{"categories":3142},[],{"categories":3144},[15],{"categories":3146},[],{"categories":3148},[],{"categories":3150},[15],{"categories":3152},[12],{"categories":3154},[],{"categories":3156},[15],{"categories":3158},[33],{"categories":3160},[71],{"categories":3162},[57],{"categories":3164},[15],{"categories":3166},[15],{"categories":3168},[],{"categories":3170},[],{"categories":3172},[],{"categories":3174},[33],{"categories":3176},[],{"categories":3178},[],{"categories":3180},[54],{"categories":3182},[6],{"categories":3184},[],{"categories":3186},[9],{"categories":3188},[71],{"categories":3190},[12],{"categories":3192},[64],{"categories":3194},[6],{"categories":3196},[57],{"categories":3198},[9],{"categories":3200},[64],{"categories":3202},[],{"categories":3204},[],{"categories":3206},[15],{"categories":3208},[6],{"categories":3210},[54],{"categories":3212},[6],{"categories":3214},[15],{"categories":3216},[328],{"categories":3218},[15],{"categories":3220},[],{"categories":3222},[12],{"categories":3224},[33],{"categories":3226},[64],{"categories":3228},[],{"categories":3230},[54],{"categories":3232},[33],{"categories":3234},[6],{"categories":3236},[15],{"categories":3238},[12],{"categories":3240},[9],{"categories":3242},[15,328],{"categories":3244},[15],{"categories":3246},[64],{"categories":3248},[12],{"categories":3250},[57],{"categories":3252},[71],{"categories":3254},[15],{"categories":3256},[],{"categories":3258},[15],{"categories":3260},[12],{"categories":3262},[9],{"categories":3264},[],{"categories":3266},[],{"categories":3268},[12],{"categories":3270},[57],{"categories":3272},[12],{"categories":3274},[],{"categories":3276},[33],{"categories":3278},[],{"categories":3280},[33],{"categories":3282},[64],{"categories":3284},[15],{"categories":3286},[12],{"categories":3288},[71],{"categories":3290},[64],{"categories":3292},[],{"categories":3294},[33],{"categories":3296},[12],{"categories":3298},[],{"categories":3300},[12],{"categories":3302},[15],{"categories":3304},[12],{"categories":3306},[15],{"categories":3308},[12],{"categories":3310},[12],{"categories":3312},[12],{"categories":3314},[12],{"categories":3316},[9],{"categories":3318},[],{"categories":3320},[18],{"categories":3322},[33],{"categories":3324},[12],{"categories":3326},[],{"categories":3328},[64],{"categories":3330},[12],{"categories":3332},[12],{"categories":3334},[15],{"categories":3336},[33],{"categories":3338},[12],{"categories":3340},[12],{"categories":3342},[9],{"categories":3344},[15],{"categories":3346},[54],{"categories":3348},[],{"categories":3350},[57],{"categories":3352},[12],{"categories":3354},[],{"categories":3356},[33],{"categories":3358},[71],{"categories":3360},[],{"categories":3362},[],{"categories":3364},[33],{"categories":3366},[33],{"categories":3368},[71],{"categories":3370},[6],{"categories":3372},[15],{"categories":3374},[15],{"categories":3376},[12],{"categories":3378},[9],{"categories":3380},[],{"categories":3382},[],{"categories":3384},[33],{"categories":3386},[57],{"categories":3388},[64],{"categories":3390},[15],{"categories":3392},[54],{"categories":3394},[57],{"categories":3396},[57],{"categories":3398},[],{"categories":3400},[33],{"categories":3402},[12],{"categories":3404},[12],{"categories":3406},[64],{"categories":3408},[],{"categories":3410},[33],{"categories":3412},[33],{"categories":3414},[33],{"categories":3416},[],{"categories":3418},[15],{"categories":3420},[12],{"categories":3422},[],{"categories":3424},[6],{"categories":3426},[9],{"categories":3428},[],{"categories":3430},[12],{"categories":3432},[12],{"categories":3434},[],{"categories":3436},[64],{"categories":3438},[],{"categories":3440},[],{"categories":3442},[],{"categories":3444},[],{"categories":3446},[12],{"categories":3448},[33],{"categories":3450},[],{"categories":3452},[],{"categories":3454},[12],{"categories":3456},[12],{"categories":3458},[12],{"categories":3460},[57],{"categories":3462},[12],{"categories":3464},[57],{"categories":3466},[],{"categories":3468},[57],{"categories":3470},[57],{"categories":3472},[328],{"categories":3474},[15],{"categories":3476},[64],{"categories":3478},[],{"categories":3480},[],{"categories":3482},[57],{"categories":3484},[64],{"categories":3486},[64],{"categories":3488},[64],{"categories":3490},[],{"categories":3492},[6],{"categories":3494},[64],{"categories":3496},[64],{"categories":3498},[6],{"categories":3500},[64],{"categories":3502},[9],{"categories":3504},[64],{"categories":3506},[64],{"categories":3508},[64],{"categories":3510},[57],{"categories":3512},[33],{"categories":3514},[33],{"categories":3516},[12],{"categories":3518},[64],{"categories":3520},[57],{"categories":3522},[328],{"categories":3524},[57],{"categories":3526},[57],{"categories":3528},[57],{"categories":3530},[],{"categories":3532},[9],{"categories":3534},[],{"categories":3536},[328],{"categories":3538},[64],{"categories":3540},[64],{"categories":3542},[64],{"categories":3544},[15],{"categories":3546},[33,9],{"categories":3548},[57],{"categories":3550},[],{"categories":3552},[],{"categories":3554},[57],{"categories":3556},[],{"categories":3558},[57],{"categories":3560},[33],{"categories":3562},[15],{"categories":3564},[],{"categories":3566},[64],{"categories":3568},[12],{"categories":3570},[54],{"categories":3572},[],{"categories":3574},[12],{"categories":3576},[],{"categories":3578},[33],{"categories":3580},[6],{"categories":3582},[57],{"categories":3584},[],{"categories":3586},[64],{"categories":3588},[33],{"id":3590,"title":3591,"ai_summary":3592,"author":3593,"body":3594,"category":4019,"date_modified":4020,"description":3600,"excerpt":3593,"extension":4021,"faq":4020,"keywords":4022,"meta":4029,"meta_description":4030,"meta_title":4031,"navigation":4032,"path":4033,"primary_keyword":4023,"published_at":4020,"related_posts":4034,"sections":4035,"seo":4037,"sitemap":4038,"slug":4039,"status":4040,"stem":4041,"__hash__":4042},"articles\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-expb-premium-post-merge-article.md","Why Production AI Needs an Agent Harness, Not Just a Framework","An AI agent harness is a control plane that governs agent execution, enforces safety guardrails, and manages budgets. Unlike frameworks that orchestrate workflows, a harness uses a Planner, Generator, and Evaluator architecture to ensure reliable, cost-effective, and safe task completion in production environments.","",{"type":3595,"value":3596,"toc":4009},"minimark",[3597,3601,3604,3607,3610,3615,3618,3621,3624,3627,3630,3633,3656,3667,3671,3674,3677,3680,3683,3697,3701,3704,3707,3710,3722,3725,3839,3842,3846,3849,3852,3855,3858,3861,3865,3868,3871,3874,3883,3889,3892,3900,3903,3906,3910,3913,3916,3919,3922,3925,3928,3954,3962,3966,3969,3972,3975,3978,3981,4005],[3598,3599,3600],"p",{},"An AI agent harness is a control plane that governs execution, enforces safety guardrails, and manages budgets. Unlike standard orchestration frameworks, a harness uses a Planner, Generator, and Evaluator architecture to guarantee reliable, cost-effective, and safe task completion in production environments.",[3598,3602,3603],{},"You built a highly capable agent demo using a standard orchestration framework. It looks great on your laptop. But deploying it to production feels like letting a toddler drive a forklift. Without strict boundaries, agents drift. They hallucinate. They burn through API budgets in infinite reasoning loops.",[3598,3605,3606],{},"Agent sprawl is the most common failure mode for teams moving from prototype to production. You wire together multiple models, give them tool access, and hope for the best. But generative models are inherently bad at grading their own homework.",[3598,3608,3609],{},"Production reliability requires a different mental model. You have to treat agent orchestration as a control systems problem, not just a chaining problem.",[3611,3612,3614],"h2",{"id":3613},"why-frameworks-arent-enough-for-production","Why Frameworks Aren't Enough for Production",[3598,3616,3617],{},"Frameworks provide the building blocks for agent orchestration, but they lack built-in governance for safety, cost, and reliability. Relying solely on frameworks often leads to agent sprawl, where multiple loosely coordinated models duplicate costs and bypass compliance policies. Production systems require an independent control layer to prevent prototype drift and ensure consistent execution.",[3598,3619,3620],{},"Frameworks like LangChain or CrewAI are excellent for wiring up inputs and outputs. They give you the primitives to connect a large language model to a vector database or a search API.",[3598,3622,3623],{},"But they do not inherently restrict bad behavior. They assume the model will follow your system prompt.",[3598,3625,3626],{},"Loose coordination feels fast during prototyping, but it creates massive technical debt. You end up with duplicated contexts across multiple agents. This drives up token costs unnecessarily and fragments your system's state.",[3598,3628,3629],{},"Without a governing layer, long-running workflows fail silently. Worse, they get trapped in infinite reasoning loops. An agent might repeatedly call a failing API, burning through tokens until hitting a hard timeout.",[3598,3631,3632],{},"Relying entirely on frameworks introduces three distinct failure modes:",[3634,3635,3636,3644,3650],"ul",{},[3637,3638,3639,3643],"li",{},[3640,3641,3642],"strong",{},"Missing financial limits:"," Agents lack awareness of token spend per session and will exhaust budgets to solve impossible tasks.",[3637,3645,3646,3649],{},[3640,3647,3648],{},"Unbounded execution:"," Workflows can stall in loops without an independent referee to terminate them.",[3637,3651,3652,3655],{},[3640,3653,3654],{},"Context duplication:"," Loosely coupled agents constantly re-read the same state, inflating operational costs.",[3598,3657,3658,3659,3666],{},"According to ",[3660,3661,3665],"a",{"href":3662,"rel":3663},"https:\u002F\u002Fatlan.com\u002Fknow\u002Fbest-ai-agent-harness-tools-2026\u002F",[3664],"nofollow","industry analysis by Atlan",", 80% of agentic AI implementation time is consumed by data engineering and governance, rather than framework configuration. No framework governs what agents actually read or execute. That is a structural problem you have to solve at the architectural level.",[3611,3668,3670],{"id":3669},"what-is-an-ai-agent-harness","What Is an AI Agent Harness?",[3598,3672,3673],{},"An AI agent harness acts as the control plane for your generative models, managing their lifecycle, tool access, and API budgets. Instead of just passing prompts, the harness enforces guardrails and execution limits. The industry standard relies on three core roles—a Planner, a Generator, and an Evaluator—to maintain strict oversight.",[3598,3675,3676],{},"Think of the harness as the Kubernetes for your agents. It does not write the code or generate the text. It manages state, enforces policies, and handles the lifecycle of the models doing the work. It sits between your application logic and the LLM APIs.",[3598,3678,3679],{},"A harness centralizes observability. When an agent loop fails, you need to trace exactly why it failed. A harness logs the inputs, outputs, tokens consumed, and tool calls at every step, giving you a clear audit trail.",[3598,3681,3682],{},"It also operationalizes safety nets. If an agent attempts an unauthorized database drop, the harness intercepts and blocks the tool call before execution. The agent proposes the action; the harness decides whether to execute it.",[3598,3684,3685,3686,3696],{},"The architecture driving this control plane is the Planner-Generator-Evaluator pattern. Research from Anthropic's engineering teams demonstrates that separating planning, generation, and evaluation enables better handling of subjective assessments while maintaining reproducibility ",[3687,3688,3689],"sup",{},[3660,3690,3695],{"href":3691,"ariaDescribedBy":3692,"dataFootnoteRef":3593,"id":3694},"#user-content-fn-2",[3693],"footnote-label","user-content-fnref-2","1",". You stop asking one model to do everything.",[3611,3698,3700],{"id":3699},"the-planner-defining-the-machine-checkable-contract","The Planner: Defining the Machine-Checkable Contract",[3598,3702,3703],{},"The Planner agent breaks high-level goals into detailed, actionable specifications using highly capable reasoning models like Claude 3.5 Sonnet or GPT-4o. It translates ambiguous user requests into strict behavioral requirements and explicit verification assertions. This creates a machine-checkable contract that dictates exactly what the downstream models must produce to succeed.",[3598,3705,3706],{},"The Planner requires the most context and domain knowledge. It consumes the user's prompt, retrieves necessary documentation, and figures out the architecture of the solution. It does not write the final implementation.",[3598,3708,3709],{},"Output from the Planner must be heavily structured. You want JSON, not prose. The harness needs to parse this output programmatically to route instructions to the next agent in the loop.",[3598,3711,3712,3713,3717,3718,3721],{},"A good plan includes explicit ",[3714,3715,3716],"code",{},"VERIFY"," assertions. These assertions act as a grading rubric for the rest of the system. If the task is to write a Python data scraper, the Planner should output assertions like \"Script must use the ",[3714,3719,3720],{},"requests"," library\" and \"Script must include error handling for HTTP 404\".",[3598,3723,3724],{},"Consider this example of a Planner's JSON output:",[3726,3727,3731],"pre",{"className":3728,"code":3729,"language":3730,"meta":3593,"style":3593},"language-json shiki shiki-themes github-light github-dark","{\n  \"task\": \"Fetch user data and format as CSV\",\n  \"steps\": [\n    \"Initialize API client\", \n    \"Paginate through \u002Fusers\", \n    \"Write to output.csv\"\n  ],\n  \"assertions\": [\n    \"VERIFY: Uses pagination tokens\",\n    \"VERIFY: Creates output.csv in the current directory\",\n    \"VERIFY: Does not log PII to stdout\"\n  ]\n}\n","json",[3714,3732,3733,3742,3759,3768,3777,3785,3791,3797,3805,3813,3821,3827,3833],{"__ignoreMap":3593},[3734,3735,3738],"span",{"class":3736,"line":3737},"line",1,[3734,3739,3741],{"class":3740},"sVt8B","{\n",[3734,3743,3745,3749,3752,3756],{"class":3736,"line":3744},2,[3734,3746,3748],{"class":3747},"sj4cs","  \"task\"",[3734,3750,3751],{"class":3740},": ",[3734,3753,3755],{"class":3754},"sZZnC","\"Fetch user data and format as CSV\"",[3734,3757,3758],{"class":3740},",\n",[3734,3760,3762,3765],{"class":3736,"line":3761},3,[3734,3763,3764],{"class":3747},"  \"steps\"",[3734,3766,3767],{"class":3740},": [\n",[3734,3769,3771,3774],{"class":3736,"line":3770},4,[3734,3772,3773],{"class":3754},"    \"Initialize API client\"",[3734,3775,3776],{"class":3740},", \n",[3734,3778,3780,3783],{"class":3736,"line":3779},5,[3734,3781,3782],{"class":3754},"    \"Paginate through \u002Fusers\"",[3734,3784,3776],{"class":3740},[3734,3786,3788],{"class":3736,"line":3787},6,[3734,3789,3790],{"class":3754},"    \"Write to output.csv\"\n",[3734,3792,3794],{"class":3736,"line":3793},7,[3734,3795,3796],{"class":3740},"  ],\n",[3734,3798,3800,3803],{"class":3736,"line":3799},8,[3734,3801,3802],{"class":3747},"  \"assertions\"",[3734,3804,3767],{"class":3740},[3734,3806,3808,3811],{"class":3736,"line":3807},9,[3734,3809,3810],{"class":3754},"    \"VERIFY: Uses pagination tokens\"",[3734,3812,3758],{"class":3740},[3734,3814,3816,3819],{"class":3736,"line":3815},10,[3734,3817,3818],{"class":3754},"    \"VERIFY: Creates output.csv in the current directory\"",[3734,3820,3758],{"class":3740},[3734,3822,3824],{"class":3736,"line":3823},11,[3734,3825,3826],{"class":3754},"    \"VERIFY: Does not log PII to stdout\"\n",[3734,3828,3830],{"class":3736,"line":3829},12,[3734,3831,3832],{"class":3740},"  ]\n",[3734,3834,3836],{"class":3736,"line":3835},13,[3734,3837,3838],{"class":3740},"}\n",[3598,3840,3841],{},"This contract stops scope creep. The downstream models only see this constrained specification, keeping them focused entirely on execution. They do not need to know the broader business context, which saves massive amounts of context window space.",[3611,3843,3845],{"id":3844},"the-generator-executing-fast-and-fluently","The Generator: Executing Fast and Fluently",[3598,3847,3848],{},"The Generator agent focuses entirely on implementing the Planner's specifications by producing code, text, or tool actions. Because it does not need to plan or evaluate its own work, you can optimize this role for speed and cost by using specialized, highly fluent models to avoid getting stuck in reasoning loops.",[3598,3850,3851],{},"The Generator is the blue-collar worker of the harness. It just writes the code or executes the API calls. It receives a highly constrained prompt containing only the current step's requirements.",[3598,3853,3854],{},"This separation of concerns drastically reduces token overhead. You can route this step to faster, cheaper models. The cognitive heavy lifting was already done by the Planner, so the Generator only needs to be fluent in the target syntax.",[3598,3856,3857],{},"Dynamic multi-model routing is a massive advantage here. You might use a heavy frontier model for planning, but rely on a lightweight, fast model like Claude 3.5 Haiku or GPT-4o-mini for the generation step. This cuts costs without sacrificing quality.",[3598,3859,3860],{},"Stripping away the planning responsibility prevents the Generator from overthinking. When models try to plan, write, and critique simultaneously, they frequently stall. The Generator just executes the contract and returns the result to the harness.",[3611,3862,3864],{"id":3863},"the-evaluator-independent-verification","The Evaluator: Independent Verification",[3598,3866,3867],{},"The Evaluator agent independently assesses the Generator's output against the Planner's original specification without bias. Models reliably overrate their own outputs, making self-reflection highly error-prone in production.",[3598,3869,3870],{},"By isolating the evaluation step with a separate model, the system generates structured, skeptical feedback to catch hallucinations before they reach the user.",[3598,3872,3873],{},"The Evaluator acts like a senior engineer reviewing a pull request. It must be explicitly prompted to be skeptical. If you ask a model \"Is this good?\", it will almost always say yes.",[3598,3875,3876,3877,3882],{},"Generative models exhibit severe self-evaluation bias. ",[3660,3878,3881],{"href":3879,"rel":3880},"https:\u002F\u002Fwww.mindstudio.ai\u002Fblog\u002Fplanner-generator-evaluator-pattern-gan-inspired-ai-coding",[3664],"Industry patterns documented by MindStudio"," emphasize that the Evaluator must provide structured feedback the Generator can act on.",[3598,3884,3885,3886,3888],{},"Instead of just a binary pass\u002Ffail signal, it needs to point out exactly which ",[3714,3887,3716],{}," assertion failed and why.",[3598,3890,3891],{},"You must strictly isolate the Evaluator. Separating this role prevents the Generator from grading its own homework.",[3598,3893,3894,3899],{},[3660,3895,3898],{"href":3896,"rel":3897},"https:\u002F\u002Fredis.io\u002Fblog\u002Fai-agent-architecture-patterns\u002F",[3664],"Analysis from Redis"," highlights that agent performance degrades significantly over multiple consecutive runs without proper architecture and evaluation discipline.",[3598,3901,3902],{},"The Evaluator does not fix the code. It returns a critique document.",[3598,3904,3905],{},"The harness reads this document. If the critique contains failures, the harness routes the feedback back to the Generator for another attempt.",[3611,3907,3909],{"id":3908},"implementing-your-ai-agent-harness-loop","Implementing Your AI Agent Harness Loop",[3598,3911,3912],{},"Building an AI agent harness loop requires strict termination conditions, such as evaluator pass signals, maximum iteration caps, or confidence thresholds. The harness executes the Generator and Evaluator in a cycle until the acceptance criteria are met or the budget is exhausted, guaranteeing incremental progress while maintaining strict observability.",[3598,3914,3915],{},"You have to set hard limits on iterations. A common standard is capping the loop at three attempts. If the Generator cannot pass the Evaluator after three tries, the harness must terminate the loop to prevent runaway costs.",[3598,3917,3918],{},"Log every generation and evaluation pair. When you review the logs, you will quickly identify which prompts or steps consistently fail.",[3598,3920,3921],{},"This data is critical for refining your Planner's initial specifications over time.",[3598,3923,3924],{},"For high-stakes operations, implement human-in-the-loop escalation. If the Evaluator repeatedly rejects the Generator's output, or if the confidence threshold drops, the harness pauses execution. It then routes the state to a human operator for manual review.",[3598,3926,3927],{},"A production loop generally follows these stages:",[3634,3929,3930,3936,3942,3948],{},[3637,3931,3932,3935],{},[3640,3933,3934],{},"Plan:"," The harness calls the Planner to generate the JSON specification and assertions.",[3637,3937,3938,3941],{},[3640,3939,3940],{},"Generate:"," The harness passes the spec to the Generator to execute step one.",[3637,3943,3944,3947],{},[3640,3945,3946],{},"Evaluate:"," The harness passes the output and the assertions to the Evaluator.",[3637,3949,3950,3953],{},[3640,3951,3952],{},"Route:"," The harness reads the Evaluator's JSON response. On failure, it loops back to Generate. On success, it proceeds to the next step.",[3598,3955,3956,3961],{},[3660,3957,3960],{"href":3958,"rel":3959},"https:\u002F\u002Fdev.to\u002Ffmquaglia\u002Fbeyond-the-notebook-4-architectural-patterns-for-production-ready-ai-agents-3a16",[3664],"Architectural patterns for production-ready AI agents"," require treating the entire loop as a state machine. The harness holds the state. The agents are just stateless functions called by the harness.",[3611,3963,3965],{"id":3964},"conclusion","Conclusion",[3598,3967,3968],{},"Moving AI from a notebook demo to a production system requires abandoning the idea of a single omnipotent agent. Instead, builders must adopt a strictly governed Planner, Generator, and Evaluator architecture to ensure reliability, control costs, and maintain safety at scale.",[3598,3970,3971],{},"Frameworks will help you build the components, but the harness is what keeps them running safely. You have to own the control loop. Relying on an LLM to police its own execution is an unforced error.",[3598,3973,3974],{},"Open your current agent workflow code and identify where planning, generation, and validation happen in the same prompt. Extract the validation step into a separate, strongly typed model call to immediately improve reliability.",[3598,3976,3977],{},"Ready to stop agent drift and build resilient systems? Start implementing an independent evaluation layer today, and subscribe to our newsletter for more deep dives into production AI architecture.",[3979,3980],"hr",{},[3982,3983,3986,3991],"section",{"className":3984,"dataFootnotes":3593},[3985],"footnotes",[3611,3987,3990],{"className":3988,"id":3693},[3989],"sr-only","Footnotes",[3992,3993,3994],"ol",{},[3637,3995,3997,3998],{"id":3996},"user-content-fn-2","InfoQ. \"Anthropic Designs Three-Agent Harness Supports Long-Running Full-Stack AI Development.\" ",[3660,3999,4004],{"href":4000,"ariaLabel":4001,"className":4002,"dataFootnoteBackref":3593},"#user-content-fnref-2","Back to reference 1",[4003],"data-footnote-backref","↩",[4006,4007,4008],"style",{},"html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}",{"title":3593,"searchDepth":3744,"depth":3744,"links":4010},[4011,4012,4013,4014,4015,4016,4017,4018],{"id":3613,"depth":3744,"text":3614},{"id":3669,"depth":3744,"text":3670},{"id":3699,"depth":3744,"text":3700},{"id":3844,"depth":3744,"text":3845},{"id":3863,"depth":3744,"text":3864},{"id":3908,"depth":3744,"text":3909},{"id":3964,"depth":3744,"text":3965},{"id":3693,"depth":3744,"text":3990},"ai-engineering",null,"md",[4023,4024,4025,4026,4027,4028],"AI agent harness","production AI","agentic architecture","AI control plane","LLM evaluation","multi-agent systems",{},"Moving AI to production requires strict governance. Discover how an AI agent harness uses a Planner, Generator, and Evaluator to ensure safe execution.","AI Agent Harness: The Planner-Generator-Evaluator Architecture",true,"\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-expb-premium-post-merge-article",[],{"intro":4036,"why-frameworks-arent-enough-for-production":3614,"what-is-an-ai-agent-harness":3670,"the-planner-defining-the-machine-checkable-contract":3700,"the-generator-executing-fast-and-fluently":3845,"the-evaluator-independent-verification":3864,"implementing-your-ai-agent-harness-loop":3909,"conclusion":3965},"(intro)",{"title":3591,"description":3600},{"loc":4033},"ai-agent-harness-production-architecture","ready","articles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-expb-premium-post-merge-article","n4YrqKIbgDFFExlRCdf0McqYftoHNMD9Ps39zY0tMA4",[4044,4627,5784,6395],{"id":4045,"title":4046,"ai_summary":4047,"author":3593,"body":4048,"category":4606,"date_modified":4020,"description":4607,"excerpt":3593,"extension":4021,"faq":4020,"keywords":4608,"meta":4616,"meta_description":4617,"meta_title":4618,"navigation":4032,"path":4619,"primary_keyword":4609,"published_at":4020,"related_posts":4620,"sections":4621,"seo":4622,"sitemap":4623,"slug":4624,"status":4040,"stem":4625,"__hash__":4626},"articles\u002Farticles\u002Fagent-architecture-the-orchestration-stack-that-actually-emerged-article.md","The Emergent AI Agent Orchestration Stack: Harnesses, Specs, and Primitives","AI agent orchestration stacks mature compute layers atop lagging coordination using YAML harnesses, spec-driven workflows, and primitives like tool registries and state persistence. Tools such as Archon V3 and Claude Code enable deterministic multi-agent execution for production reliability without frameworks.",{"type":3595,"value":4049,"toc":4597},[4050,4066,4076,4080,4089,4099,4111,4114,4124,4128,4139,4149,4159,4162,4166,4177,4193,4196,4199,4203,4212,4232,4249,4252,4256,4265,4285,4288,4291,4340,4343,4346,4350,4361,4378,4401,4404,4407,4594],[3598,4051,4052,4053,4060],{},"Production AI agent orchestration demands stack literacy across six uneven layers, from mature compute sandboxes like E2B Firecracker to lagging coordination without Kubernetes-grade tools. Builders bridge gaps with YAML harnesses and spec-driven workflows today, delivering deterministic multi-agent execution via Archon V3 and Claude Code primitives.",[3687,4054,4055],{},[3660,4056,3695],{"href":4057,"ariaDescribedBy":4058,"dataFootnoteRef":3593,"id":4059},"#user-content-fn-1",[3693],"user-content-fnref-1",[3687,4061,4062],{},[3660,4063,4065],{"href":3691,"ariaDescribedBy":4064,"dataFootnoteRef":3593,"id":3694},[3693],"2",[3598,4067,4068,4069,4075],{},"Demos shine with single agents, but real systems crumble on orchestration failures—compounding errors across layers drop end-to-end reliability from five 99% components to 95% overall.",[3687,4070,4071],{},[3660,4072,3695],{"href":4057,"ariaDescribedBy":4073,"dataFootnoteRef":3593,"id":4074},[3693],"user-content-fnref-1-2"," Without primitives like tool registries and state persistence, you risk hyperscaler lock-in and sprawl. This guide maps the stack, harnesses, specs, challenges, and pitfalls to ship reliable agents now.",[3611,4077,4079],{"id":4078},"the-layered-maturity-of-the-ai-agent-stack","The Layered Maturity of the AI Agent Stack",[3598,4081,4082,4083],{},"The AI agent stack matures unevenly across six layers—compute and sandboxing lead with mature tools like Browserbase and E2B Firecracker for isolated execution, while orchestration lags like pre-Kubernetes eras without infra-grade scheduling or FinOps. Identity\u002Fcomms transitions via emerging agent-native protocols beyond email shims. This creates production bottlenecks in coordination, demanding immediate stack literacy.",[3687,4084,4085],{},[3660,4086,3695],{"href":4057,"ariaDescribedBy":4087,"dataFootnoteRef":3593,"id":4088},[3693],"user-content-fnref-1-3",[3598,4090,4091,4092,4098],{},"Nate B. Jones breaks it into six layers in his analysis.",[3687,4093,4094],{},[3660,4095,3695],{"href":4057,"ariaDescribedBy":4096,"dataFootnoteRef":3593,"id":4097},[3693],"user-content-fnref-1-4"," Compute\u002Fsandboxing handles isolated execution reliably. Identity\u002Fcomms transitions with emerging agent-native protocols over email shims.",[3598,4100,4101,4102,4110],{},"Memory sits early, blending Mem0 hybrids but risking vendor lock-in.",[3687,4103,4104],{},[3660,4105,4109],{"href":4106,"ariaDescribedBy":4107,"dataFootnoteRef":3593,"id":4108},"#user-content-fn-3",[3693],"user-content-fnref-3","3"," Tools explode via Compose connectors for auth-heavy integrations.",[3598,4112,4113],{},"Provisioning emerges in Stripe Projects for dynamic scaling. Orchestration gaps lack FinOps and infra-grade controls—no standard for fleets.",[3598,4115,4116,4117,4123],{},"Ephemeral agents suit quick tasks; persistent ones need state for long runs. Gartner notes a 1,445% multi-agent surge, amplifying these mismatches.",[3687,4118,4119],{},[3660,4120,3695],{"href":4057,"ariaDescribedBy":4121,"dataFootnoteRef":3593,"id":4122},[3693],"user-content-fnref-1-5"," Skip stack literacy, and your agents stay demo-bound.",[3611,4125,4127],{"id":4126},"what-is-harness-engineering-for-ai-agent-orchestration","What Is Harness Engineering for AI Agent Orchestration?",[3598,4129,4130,4131],{},"Harness engineering wraps unreliable AI agents in declarative YAML or Markdown workflows that use DAGs for dependencies, Git worktrees for parallel isolation, and pre\u002Fpost-tool hooks for self-correction and verification loops like type-checks or rewrites. This enables Stripe-scale PRs (1,300\u002Fweek) without constant oversight by treating agents as deterministic nodes.",[3687,4132,4133],{},[3660,4134,4138],{"href":4135,"ariaDescribedBy":4136,"dataFootnoteRef":3593,"id":4137},"#user-content-fn-4",[3693],"user-content-fnref-4","4",[3598,4140,4141,4142,4148],{},"Archon V3 defines this: YAML commands like classify\u002Fplan\u002Fimplement form nodes in DAGs with dependencies.",[3687,4143,4144],{},[3660,4145,4138],{"href":4135,"ariaDescribedBy":4146,"dataFootnoteRef":3593,"id":4147},[3693],"user-content-fnref-4-2"," Worktrees isolate parallel runs—four agents at once without clashes. Pre\u002Fpost-tool hooks loop for verification, like type-checks or rewrites.",[3598,4150,4151,4152,4158],{},"Claude Code adds structured metadata, permissions, and multi-agent forks.",[3687,4153,4154],{},[3660,4155,4065],{"href":3691,"ariaDescribedBy":4156,"dataFootnoteRef":3593,"id":4157},[3693],"user-content-fnref-2-2"," Mix precise steps with AI nodes; extend as Markdown primitives standard in Anthropic\u002FOpenAI for chaining. You treat agents as cogs in deterministic machines, not free-range thinkers.",[3598,4160,4161],{},"This beats prompt tweaks alone. Version YAML in Git for audits. Production demands it over ad-hoc calls.",[3611,4163,4165],{"id":4164},"the-shift-to-spec-centric-development","The Shift to Spec-Centric Development",[3598,4167,4168,4169],{},"Spec-centric development flips code-first workflows by making declarative specs in YAML or Markdown the executable single source of truth, driving AI agents like GitHub SpecKit to generate synchronized code through staged pipelines of specify\u002Fplan\u002Ftasks\u002Fimplement for consistent handoffs.",[3687,4170,4171],{},[3660,4172,4176],{"href":4173,"ariaDescribedBy":4174,"dataFootnoteRef":3593,"id":4175},"#user-content-fn-5",[3693],"user-content-fnref-5","5",[3598,4178,4179,4180,4186,4187],{},"Code drifts specs outdated; specs drive regeneration instead.",[3687,4181,4182],{},[3660,4183,4176],{"href":4173,"ariaDescribedBy":4184,"dataFootnoteRef":3593,"id":4185},[3693],"user-content-fnref-5-2"," GitHub SpecKit structures .github\u002Fprompts\u002Fagents for PM\u002Farchitect\u002Fengineer handoffs. Anthropic harnesses use minimal three agents—planner\u002Fgenerator\u002Fevaluator—outpacing bloated frameworks on Opus models.",[3687,4188,4189],{},[3660,4190,4065],{"href":3691,"ariaDescribedBy":4191,"dataFootnoteRef":3593,"id":4192},[3693],"user-content-fnref-2-3",[3598,4194,4195],{},"Version specs in repos for team reliability. No more merge hell from AI code dumps. Specs ensure handoffs work; code follows.",[3598,4197,4198],{},"I prefer this for complex projects. It cuts ambiguity. Agents execute living docs, not stale prose.",[3611,4200,4202],{"id":4201},"why-ai-agent-orchestration-is-the-biggest-unsolved-problem","Why AI Agent Orchestration Is the Biggest Unsolved Problem",[3598,4204,4205,4206],{},"AI agent orchestration fails production due to critical gaps in scheduling\u002Flifecycle management, supervision hierarchies, FinOps controls, inter-agent comms protocols, and observability tools—current libraries like LangGraph manage notebooks but crumble under 50-agent fleets needing audits and traces.",[3687,4207,4208],{},[3660,4209,4109],{"href":4106,"ariaDescribedBy":4210,"dataFootnoteRef":3593,"id":4211},[3693],"user-content-fnref-3-2",[3634,4213,4214,4223,4226,4229],{},[3637,4215,4216,4217],{},"Dynamic scheduling beats cron; state persists across crashes.",[3687,4218,4219],{},[3660,4220,4109],{"href":4106,"ariaDescribedBy":4221,"dataFootnoteRef":3593,"id":4222},[3693],"user-content-fnref-3-3",[3637,4224,4225],{},"Retry logic and error isolation prevent cascades.",[3637,4227,4228],{},"Token budgeting enforces FinOps per task.",[3637,4230,4231],{},"MCP protocols limit comms; no standard for negotiation.",[3598,4233,4234,4235,4241,4242,4248],{},"MindStudio calls it the core blocker: demos route simply, production demands hierarchies and traces.",[3687,4236,4237],{},[3660,4238,4109],{"href":4106,"ariaDescribedBy":4239,"dataFootnoteRef":3593,"id":4240},[3693],"user-content-fnref-3-4"," Jones likens it to pre-K8s chaos.",[3687,4243,4244],{},[3660,4245,3695],{"href":4057,"ariaDescribedBy":4246,"dataFootnoteRef":3593,"id":4247},[3693],"user-content-fnref-1-6"," Flexibility invites emergence; determinism suits enterprise.",[3598,4250,4251],{},"Trade-off bites: emergent behavior thrills but flakes. Prioritize primitives over frameworks. Libraries add overhead without infra.",[3611,4253,4255],{"id":4254},"key-primitives-for-production-ai-agent-orchestration","Key Primitives for Production AI Agent Orchestration",[3598,4257,4258,4259],{},"Production AI agent orchestration relies on 12 primitives from Claude Code leaks, including tool registries for metadata filtering, tiered permissions to block rogue actions, state persistence via JSON sessions, token budgeting with projections and halts, structured logging through typed events, verification loops, plus agent typing and dynamic pools for crash-resilient, observable multi-agent workflows.",[3687,4260,4261],{},[3660,4262,4065],{"href":3691,"ariaDescribedBy":4263,"dataFootnoteRef":3593,"id":4264},[3693],"user-content-fnref-2-4",[3634,4266,4267,4276,4279,4282],{},[3637,4268,4269,4270],{},"Dual registries list 207 commands with metadata for filtering.",[3687,4271,4272],{},[3660,4273,4065],{"href":3691,"ariaDescribedBy":4274,"dataFootnoteRef":3593,"id":4275},[3693],"user-content-fnref-2-5",[3637,4277,4278],{},"Permissions tier built-in\u002Fplugins\u002Fuser to block rogue acts.",[3637,4280,4281],{},"JSON persists sessions; projections halt overruns.",[3637,4283,4284],{},"Typed events stream logs.",[3598,4286,4287],{},"Agents specialize: explore\u002Fplan\u002Fverify types in hierarchies. Formula: Role+Goal+Tools+Rules+Output.",[3598,4289,4290],{},"Code stub for tools:",[3726,4292,4296],{"className":4293,"code":4294,"language":4295,"meta":3593,"style":3593},"language-yaml shiki shiki-themes github-light github-dark","tools:\n  - name: list_files\n    description: List files in directory\n    source: builtin\n","yaml",[3714,4297,4298,4307,4320,4330],{"__ignoreMap":3593},[3734,4299,4300,4304],{"class":3736,"line":3737},[3734,4301,4303],{"class":4302},"s9eBZ","tools",[3734,4305,4306],{"class":3740},":\n",[3734,4308,4309,4312,4315,4317],{"class":3736,"line":3744},[3734,4310,4311],{"class":3740},"  - ",[3734,4313,4314],{"class":4302},"name",[3734,4316,3751],{"class":3740},[3734,4318,4319],{"class":3754},"list_files\n",[3734,4321,4322,4325,4327],{"class":3736,"line":3761},[3734,4323,4324],{"class":4302},"    description",[3734,4326,3751],{"class":3740},[3734,4328,4329],{"class":3754},"List files in directory\n",[3734,4331,4332,4335,4337],{"class":3736,"line":3770},[3734,4333,4334],{"class":4302},"    source",[3734,4336,3751],{"class":3740},[3734,4338,4339],{"class":3754},"builtin\n",[3598,4341,4342],{},"Persist post-events. Update claude.md for skills; \u002Fplan for tasks. Pools assemble per-session.",[3598,4344,4345],{},"These make fleets observable. Skip them, stay small-scale.",[3611,4347,4349],{"id":4348},"common-pitfalls-and-trade-offs-in-multi-agent-systems","Common Pitfalls and Trade-offs in Multi-Agent Systems",[3598,4351,4352,4353],{},"Multi-agent systems trip on overkill by jumping to agents before mastering 5 workflows, bloat from skills exceeding 150 lines, lock-in via hyperscaler memory, and ignoring compounding failures that drop reliability—counter them by testing quantitatively, tiering skills, and designing agent-first for composability.",[3687,4354,4355],{},[3660,4356,4360],{"href":4357,"ariaDescribedBy":4358,"dataFootnoteRef":3593,"id":4359},"#user-content-fn-6",[3693],"user-content-fnref-6","6",[3634,4362,4363,4372,4375],{},[3637,4364,4365,4366],{},"Vague skills undertrigger; self-evals overconfident; no permissions equals demos.",[3687,4367,4368],{},[3660,4369,4065],{"href":3691,"ariaDescribedBy":4370,"dataFootnoteRef":3593,"id":4371},[3693],"user-content-fnref-2-6",[3637,4373,4374],{},"Single agents scale until they don't—multi for handoffs.",[3637,4376,4377],{},"Ephemeral for bursts; persistent for state.",[3598,4379,4380,4381,4387,4388,4394,4395],{},"Frameworks bloat post-Opus; chaining routes first.",[3687,4382,4383],{},[3660,4384,4360],{"href":4357,"ariaDescribedBy":4385,"dataFootnoteRef":3593,"id":4386},[3693],"user-content-fnref-6-2"," Margerie: Master Role+Goal+Tools+Rules+Output.",[3687,4389,4390],{},[3660,4391,4360],{"href":4357,"ariaDescribedBy":4392,"dataFootnoteRef":3593,"id":4393},[3693],"user-content-fnref-6-3"," Jones: Primitives avert pain.",[3687,4396,4397],{},[3660,4398,3695],{"href":4057,"ariaDescribedBy":4399,"dataFootnoteRef":3593,"id":4400},[3693],"user-content-fnref-1-7",[3598,4402,4403],{},"Test E2E: 99% layers compound poorly. Agent-first composes; code-first breaks.",[3598,4405,4406],{},"Audit your agent workflow against Claude Code's 12 primitives today. Fork an Archon V3 YAML harness into a Git repo, route a test issue through planner\u002Fgenerator\u002Fevaluator, and log E2E reliability metrics before adding agents.",[3982,4408,4410,4413],{"className":4409,"dataFootnotes":3593},[3985],[3611,4411,3990],{"className":4412,"id":3693},[3989],[3992,4414,4415,4467,4509,4539,4555,4571],{},[3637,4416,4418,4419,4423,4424,4423,4431,4423,4438,4423,4445,4423,4452,4423,4459],{"id":4417},"user-content-fn-1","Nate B. Jones, \"6-Layer AI Agent Stack: Build Literacy Now,\" AI News & Strategy Daily. ",[3660,4420,4004],{"href":4421,"ariaLabel":4001,"className":4422,"dataFootnoteBackref":3593},"#user-content-fnref-1",[4003]," ",[3660,4425,4004,4429],{"href":4426,"ariaLabel":4427,"className":4428,"dataFootnoteBackref":3593},"#user-content-fnref-1-2","Back to reference 1-2",[4003],[3687,4430,4065],{},[3660,4432,4004,4436],{"href":4433,"ariaLabel":4434,"className":4435,"dataFootnoteBackref":3593},"#user-content-fnref-1-3","Back to reference 1-3",[4003],[3687,4437,4109],{},[3660,4439,4004,4443],{"href":4440,"ariaLabel":4441,"className":4442,"dataFootnoteBackref":3593},"#user-content-fnref-1-4","Back to reference 1-4",[4003],[3687,4444,4138],{},[3660,4446,4004,4450],{"href":4447,"ariaLabel":4448,"className":4449,"dataFootnoteBackref":3593},"#user-content-fnref-1-5","Back to reference 1-5",[4003],[3687,4451,4176],{},[3660,4453,4004,4457],{"href":4454,"ariaLabel":4455,"className":4456,"dataFootnoteBackref":3593},"#user-content-fnref-1-6","Back to reference 1-6",[4003],[3687,4458,4360],{},[3660,4460,4004,4464],{"href":4461,"ariaLabel":4462,"className":4463,"dataFootnoteBackref":3593},"#user-content-fnref-1-7","Back to reference 1-7",[4003],[3687,4465,4466],{},"7",[3637,4468,4469,4470,4423,4474,4423,4481,4423,4488,4423,4495,4423,4502],{"id":3996},"Nick Puru, \"Claude Code Leak Reveals Full AI Orchestration Engine,\" AI Automation. ",[3660,4471,4004],{"href":4000,"ariaLabel":4472,"className":4473,"dataFootnoteBackref":3593},"Back to reference 2",[4003],[3660,4475,4004,4479],{"href":4476,"ariaLabel":4477,"className":4478,"dataFootnoteBackref":3593},"#user-content-fnref-2-2","Back to reference 2-2",[4003],[3687,4480,4065],{},[3660,4482,4004,4486],{"href":4483,"ariaLabel":4484,"className":4485,"dataFootnoteBackref":3593},"#user-content-fnref-2-3","Back to reference 2-3",[4003],[3687,4487,4109],{},[3660,4489,4004,4493],{"href":4490,"ariaLabel":4491,"className":4492,"dataFootnoteBackref":3593},"#user-content-fnref-2-4","Back to reference 2-4",[4003],[3687,4494,4138],{},[3660,4496,4004,4500],{"href":4497,"ariaLabel":4498,"className":4499,"dataFootnoteBackref":3593},"#user-content-fnref-2-5","Back to reference 2-5",[4003],[3687,4501,4176],{},[3660,4503,4004,4507],{"href":4504,"ariaLabel":4505,"className":4506,"dataFootnoteBackref":3593},"#user-content-fnref-2-6","Back to reference 2-6",[4003],[3687,4508,4360],{},[3637,4510,4512,4513,4423,4518,4423,4525,4423,4532],{"id":4511},"user-content-fn-3","MindStudio, \"What Is Agent Orchestration? Why It's the Biggest Unsolved Problem in the AI Stack.\" ",[3660,4514,4004],{"href":4515,"ariaLabel":4516,"className":4517,"dataFootnoteBackref":3593},"#user-content-fnref-3","Back to reference 3",[4003],[3660,4519,4004,4523],{"href":4520,"ariaLabel":4521,"className":4522,"dataFootnoteBackref":3593},"#user-content-fnref-3-2","Back to reference 3-2",[4003],[3687,4524,4065],{},[3660,4526,4004,4530],{"href":4527,"ariaLabel":4528,"className":4529,"dataFootnoteBackref":3593},"#user-content-fnref-3-3","Back to reference 3-3",[4003],[3687,4531,4109],{},[3660,4533,4004,4537],{"href":4534,"ariaLabel":4535,"className":4536,"dataFootnoteBackref":3593},"#user-content-fnref-3-4","Back to reference 3-4",[4003],[3687,4538,4138],{},[3637,4540,4542,4543,4423,4548],{"id":4541},"user-content-fn-4","\"Archon V3: YAML Harnesses for AI Coding Agents,\" DIY Smart Code. ",[3660,4544,4004],{"href":4545,"ariaLabel":4546,"className":4547,"dataFootnoteBackref":3593},"#user-content-fnref-4","Back to reference 4",[4003],[3660,4549,4004,4553],{"href":4550,"ariaLabel":4551,"className":4552,"dataFootnoteBackref":3593},"#user-content-fnref-4-2","Back to reference 4-2",[4003],[3687,4554,4065],{},[3637,4556,4558,4559,4423,4564],{"id":4557},"user-content-fn-5","\"SDD Makes Specs the Single Source of Truth via AI Agents,\" Level Up Coding. ",[3660,4560,4004],{"href":4561,"ariaLabel":4562,"className":4563,"dataFootnoteBackref":3593},"#user-content-fnref-5","Back to reference 5",[4003],[3660,4565,4004,4569],{"href":4566,"ariaLabel":4567,"className":4568,"dataFootnoteBackref":3593},"#user-content-fnref-5-2","Back to reference 5-2",[4003],[3687,4570,4065],{},[3637,4572,4574,4575,4423,4580,4423,4587],{"id":4573},"user-content-fn-6","Lukas Margerie insights on agent fundamentals. ",[3660,4576,4004],{"href":4577,"ariaLabel":4578,"className":4579,"dataFootnoteBackref":3593},"#user-content-fnref-6","Back to reference 6",[4003],[3660,4581,4004,4585],{"href":4582,"ariaLabel":4583,"className":4584,"dataFootnoteBackref":3593},"#user-content-fnref-6-2","Back to reference 6-2",[4003],[3687,4586,4065],{},[3660,4588,4004,4592],{"href":4589,"ariaLabel":4590,"className":4591,"dataFootnoteBackref":3593},"#user-content-fnref-6-3","Back to reference 6-3",[4003],[3687,4593,4109],{},[4006,4595,4596],{},"html pre.shiki code .s9eBZ, html code.shiki .s9eBZ{--shiki-default:#22863A;--shiki-dark:#85E89D}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}",{"title":3593,"searchDepth":3744,"depth":3744,"links":4598},[4599,4600,4601,4602,4603,4604,4605],{"id":4078,"depth":3744,"text":4079},{"id":4126,"depth":3744,"text":4127},{"id":4164,"depth":3744,"text":4165},{"id":4201,"depth":3744,"text":4202},{"id":4254,"depth":3744,"text":4255},{"id":4348,"depth":3744,"text":4349},{"id":3693,"depth":3744,"text":3990},"ai-agents","Production AI agent orchestration demands stack literacy across six uneven layers, from mature compute sandboxes like E2B Firecracker to lagging coordination without Kubernetes-grade tools. Builders bridge gaps with YAML harnesses and spec-driven workflows today, delivering deterministic multi-agent execution via Archon V3 and Claude Code primitives.12",[4609,4610,4611,4612,4028,4613,4614,4615],"AI agent orchestration","agent stack","harness engineering","spec-centric development","Claude Code","Archon V3","production AI agents",{},"Master the emergent AI agent orchestration stack: uneven maturity, harness engineering, spec-centric dev, and key primitives for production multi-agent systems. Avoid pitfalls with practical workflows from Claude Code and Archon V3.","AI Agent Orchestration Stack: Layers and Primitives","\u002Farticles\u002Fagent-architecture-the-orchestration-stack-that-actually-emerged-article",[],{"the-layered-maturity-of-the-ai-agent-stack":4079,"what-is-harness-engineering-for-ai-agent-orchestration":4127,"the-shift-to-spec-centric-development":4165,"why-ai-agent-orchestration-is-the-biggest-unsolved-problem":4202,"key-primitives-for-production-ai-agent-orchestration":4255,"common-pitfalls-and-trade-offs-in-multi-agent-systems":4349},{"title":4046,"description":4607},{"loc":4619},"emergent-ai-agent-orchestration-stack-harnesess-specs-primitives","articles\u002Fagent-architecture-the-orchestration-stack-that-actually-emerged-article","xdOSx_FUsF7EEM6WqQRjgq4p4T-5gHkBnwndjo2dz-M",{"id":4628,"title":4629,"ai_summary":4630,"author":3593,"body":4631,"category":5764,"date_modified":4020,"description":5765,"excerpt":3593,"extension":4021,"faq":4020,"keywords":5766,"meta":5772,"meta_description":5773,"meta_title":5774,"navigation":4032,"path":5775,"primary_keyword":4638,"published_at":4020,"related_posts":5776,"sections":5777,"seo":5779,"sitemap":5780,"slug":5781,"status":4040,"stem":5782,"__hash__":5783},"articles\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-article.md","The 3-Core Agent Harness: Planner, Generator, Evaluator for Production AI Agents","Production AI agent systems succeed with a 3-core agent harness: Planner creates high-level outlines, Generator builds outputs from them, and Evaluator critiques via graded rubrics. This strips 90% redundant framework overhead, leveraging modern LLMs for reliable, scalable results on long tasks.",{"type":3595,"value":4632,"toc":5754},[4633,4646,4649,4658,4666,4680,4683,4882,4885,4889,4898,4901,4909,4923,4926,4930,4941,4948,4956,4964,4972,4985,4988,4997,5000,5035,5038,5042,5052,5055,5058,5061,5070,5073,5077,5089,5092,5095,5103,5106,5110,5123,5153,5161,5167,5170,5240,5243,5249,5276,5279,5288,5294,5374,5389,5394,5426,5438,5441,5445,5461,5464,5488,5491,5500,5503,5506,5510,5519,5522,5548,5558,5561,5564,5567,5751],[3598,4634,4635,4636,4639,4640,4645],{},"Production AI agent systems thrive with a ",[3640,4637,4638],{},"3-core agent harness","—Planner for high-level outlines, Generator for implementation, Evaluator for adversarial critique using graded rubrics—stripping 90% bloated framework overhead per Anthropic tests.",[3687,4641,4642],{},[3660,4643,3695],{"href":4057,"ariaDescribedBy":4644,"dataFootnoteRef":3593,"id":4059},[3693]," This leverages modern LLMs' 1M+ token windows and coherence for reliable, scalable outputs on long-horizon tasks.",[3598,4647,4648],{},"You've likely tried agent frameworks that promise reliability but deliver cascading errors from micro-task sharding. Those assumptions fit older LLMs with short contexts and poor coherence, not Claude Opus 4.6. This harness ships product-level work like high-volume AI-generated PRs, letting you focus on primitives over complexity.",[3598,4650,4651,4652,4657],{},"Anthropic's experiments, summarized by AI LABS, tested stripping frameworks layer by layer on long tasks.",[3687,4653,4654],{},[3660,4655,3695],{"href":4057,"ariaDescribedBy":4656,"dataFootnoteRef":3593,"id":4074},[3693]," Results showed only the Planner for product outlines, Generator for execution, and Evaluator for critique delivered gains. Complex staging in SpecKit or loops in GSD added token bloat and error drift without benefits.",[3598,4659,4660,4661],{},"Contrast traditional setups: BMAD shards PRDs into micro-tasks to handle context resets; GSD enforces rigid agent loops for weak reasoning. With 1M-token windows, LLMs now manage full product scopes autonomously—micro-sharding forces premature decisions that fail downstream.",[3687,4662,4663],{},[3660,4664,3695],{"href":4057,"ariaDescribedBy":4665,"dataFootnoteRef":3593,"id":4088},[3693],[3598,4667,4668,4669,4674,4675],{},"Nate B. Jones's analysis of Claude's leaked code reinforces primitives over frameworks for scalability.",[3687,4670,4671],{},[3660,4672,4065],{"href":3691,"ariaDescribedBy":4673,"dataFootnoteRef":3593,"id":3694},[3693]," Agent Blueprint advises single-agent mastery before multi-agent scaling.",[3687,4676,4677],{},[3660,4678,4109],{"href":4106,"ariaDescribedBy":4679,"dataFootnoteRef":3593,"id":4108},[3693],[3598,4681,4682],{},"To see it in action, here's a minimal YAML harness stub using Archon V3 style for a task-tracking app:",[3726,4684,4686],{"className":4293,"code":4685,"language":4295,"meta":3593,"style":3593},"harness:\n  planner:\n    role: \"Product Lead\"\n    goal: \"Outline task-tracking app\"\n    tools: [\"search\"]\n    rules: [\"High-level only; flag risks; no code\"]\n    output: \"Markdown: user stories, features, roadmap\"\n  generator:\n    role: \"Engineer\"\n    goal: \"Implement planner outline\"\n    tools: [\"git\", \"calc\"]\n    rules: [\"Isolated worktree; commit artifacts\"]\n    output: \"Code files + README\"\n  evaluator:\n    role: \"QA Adversary\"\n    goal: \"Score vs rubric\"\n    tools: [\"playwright\"]\n    rules: [\"Assume flaws; weighted scores\"]\n    output: \"JSON: scores, fixes\"\n",[3714,4687,4688,4695,4702,4712,4722,4736,4748,4758,4765,4774,4783,4800,4811,4820,4828,4838,4848,4860,4872],{"__ignoreMap":3593},[3734,4689,4690,4693],{"class":3736,"line":3737},[3734,4691,4692],{"class":4302},"harness",[3734,4694,4306],{"class":3740},[3734,4696,4697,4700],{"class":3736,"line":3744},[3734,4698,4699],{"class":4302},"  planner",[3734,4701,4306],{"class":3740},[3734,4703,4704,4707,4709],{"class":3736,"line":3761},[3734,4705,4706],{"class":4302},"    role",[3734,4708,3751],{"class":3740},[3734,4710,4711],{"class":3754},"\"Product Lead\"\n",[3734,4713,4714,4717,4719],{"class":3736,"line":3770},[3734,4715,4716],{"class":4302},"    goal",[3734,4718,3751],{"class":3740},[3734,4720,4721],{"class":3754},"\"Outline task-tracking app\"\n",[3734,4723,4724,4727,4730,4733],{"class":3736,"line":3779},[3734,4725,4726],{"class":4302},"    tools",[3734,4728,4729],{"class":3740},": [",[3734,4731,4732],{"class":3754},"\"search\"",[3734,4734,4735],{"class":3740},"]\n",[3734,4737,4738,4741,4743,4746],{"class":3736,"line":3787},[3734,4739,4740],{"class":4302},"    rules",[3734,4742,4729],{"class":3740},[3734,4744,4745],{"class":3754},"\"High-level only; flag risks; no code\"",[3734,4747,4735],{"class":3740},[3734,4749,4750,4753,4755],{"class":3736,"line":3793},[3734,4751,4752],{"class":4302},"    output",[3734,4754,3751],{"class":3740},[3734,4756,4757],{"class":3754},"\"Markdown: user stories, features, roadmap\"\n",[3734,4759,4760,4763],{"class":3736,"line":3799},[3734,4761,4762],{"class":4302},"  generator",[3734,4764,4306],{"class":3740},[3734,4766,4767,4769,4771],{"class":3736,"line":3807},[3734,4768,4706],{"class":4302},[3734,4770,3751],{"class":3740},[3734,4772,4773],{"class":3754},"\"Engineer\"\n",[3734,4775,4776,4778,4780],{"class":3736,"line":3815},[3734,4777,4716],{"class":4302},[3734,4779,3751],{"class":3740},[3734,4781,4782],{"class":3754},"\"Implement planner outline\"\n",[3734,4784,4785,4787,4789,4792,4795,4798],{"class":3736,"line":3823},[3734,4786,4726],{"class":4302},[3734,4788,4729],{"class":3740},[3734,4790,4791],{"class":3754},"\"git\"",[3734,4793,4794],{"class":3740},", ",[3734,4796,4797],{"class":3754},"\"calc\"",[3734,4799,4735],{"class":3740},[3734,4801,4802,4804,4806,4809],{"class":3736,"line":3829},[3734,4803,4740],{"class":4302},[3734,4805,4729],{"class":3740},[3734,4807,4808],{"class":3754},"\"Isolated worktree; commit artifacts\"",[3734,4810,4735],{"class":3740},[3734,4812,4813,4815,4817],{"class":3736,"line":3835},[3734,4814,4752],{"class":4302},[3734,4816,3751],{"class":3740},[3734,4818,4819],{"class":3754},"\"Code files + README\"\n",[3734,4821,4823,4826],{"class":3736,"line":4822},14,[3734,4824,4825],{"class":4302},"  evaluator",[3734,4827,4306],{"class":3740},[3734,4829,4831,4833,4835],{"class":3736,"line":4830},15,[3734,4832,4706],{"class":4302},[3734,4834,3751],{"class":3740},[3734,4836,4837],{"class":3754},"\"QA Adversary\"\n",[3734,4839,4841,4843,4845],{"class":3736,"line":4840},16,[3734,4842,4716],{"class":4302},[3734,4844,3751],{"class":3740},[3734,4846,4847],{"class":3754},"\"Score vs rubric\"\n",[3734,4849,4851,4853,4855,4858],{"class":3736,"line":4850},17,[3734,4852,4726],{"class":4302},[3734,4854,4729],{"class":3740},[3734,4856,4857],{"class":3754},"\"playwright\"",[3734,4859,4735],{"class":3740},[3734,4861,4863,4865,4867,4870],{"class":3736,"line":4862},18,[3734,4864,4740],{"class":4302},[3734,4866,4729],{"class":3740},[3734,4868,4869],{"class":3754},"\"Assume flaws; weighted scores\"",[3734,4871,4735],{"class":3740},[3734,4873,4875,4877,4879],{"class":3736,"line":4874},19,[3734,4876,4752],{"class":4302},[3734,4878,3751],{"class":3740},[3734,4880,4881],{"class":3754},"\"JSON: scores, fixes\"\n",[3598,4883,4884],{},"Run via GitHub Actions: trigger on issue, parse YAML, invoke Claude sequentially. This beats npm installs—I've shipped PRs weekly this way. We'll detail roles, primitives, build steps, and trade-offs next.",[3611,4886,4888],{"id":4887},"why-production-agent-systems-need-a-3-core-agent-harness","Why Production Agent Systems Need a 3-Core Agent Harness",[3598,4890,4891,4892,4897],{},"Ditch bloated agent frameworks—a 3-core agent harness with Planner, Generator, and Evaluator outperforms them by playing to LLM strengths like large contexts and autonomy. Anthropic's Claude Opus 4.6 tests show 90% of components in BMAD, GSD, and SpecKit are redundant overhead that propagates errors on long-horizon tasks.",[3687,4893,4894],{},[3660,4895,3695],{"href":4057,"ariaDescribedBy":4896,"dataFootnoteRef":3593,"id":4097},[3693]," High-level planning avoids flawed detailed specs, while separate evaluation enforces rigor.",[3598,4899,4900],{},"Traditional frameworks compensate for outdated LLM limits: context resets demand sharding, weak coherence needs rigid loops. But 1M-token windows and improved reasoning make micro-tasking counterproductive—it forces premature decisions that cascade failures.",[3598,4902,4903,4904],{},"Anthropic's experiments, summarized by AI LABS, tested stripping frameworks layer by layer. Results? Only the planner for product outlines, generator for execution, and evaluator for critique yielded gains. Complex staging in SpecKit or GSD loops adds no value; it bloats token use and invites drift.",[3687,4905,4906],{},[3660,4907,3695],{"href":4057,"ariaDescribedBy":4908,"dataFootnoteRef":3593,"id":4122},[3693],[3598,4910,4911,4912,4917,4918],{},"Nate B. Jones's analysis of Claude's leaked code echoes this: primitives beat frameworks for scalability.",[3687,4913,4914],{},[3660,4915,4065],{"href":3691,"ariaDescribedBy":4916,"dataFootnoteRef":3593,"id":4157},[3693]," Agent Blueprint stresses single-agent mastery first, scaling only for distinct skills.",[3687,4919,4920],{},[3660,4921,4109],{"href":4106,"ariaDescribedBy":4922,"dataFootnoteRef":3593,"id":4211},[3693],[3598,4924,4925],{},"I've built agents both ways. Frameworks feel safe until production hits—then you're debugging orchestration bugs, not shipping features. The harness cuts that noise.",[3611,4927,4929],{"id":4928},"the-planners-role-in-a-3-core-agent-harness","The Planner's Role in a 3-Core Agent Harness",[3598,4931,4932,4933,4935,4936],{},"In a ",[3640,4934,4638],{},", the Planner generates high-level product outlines, feature breakdowns, and user stories—not micro-tasks—enabling LLMs to autonomously discover optimal paths and avoid error cascades from over-specification. Anthropic's boundary-testing prompts prove Claude Opus 4.6 excels here, generating phased docs without diving into code.",[3687,4937,4938],{},[3660,4939,3695],{"href":4057,"ariaDescribedBy":4940,"dataFootnoteRef":3593,"id":4247},[3693],[3598,4942,4943,4944,4947],{},"Start prompts with ",[3640,4945,4946],{},"Role + Goal + high-level deliverables",". Here's a concrete example for a task-tracking app:",[3726,4949,4954],{"className":4950,"code":4952,"language":4953},[4951],"language-text","You are a product lead with 10+ years shipping SaaS.\n\nGoal: Outline a task-tracking app for indie devs.\n\nDeliverables:\n- 5-10 user stories (As a [user], I want [feature] so [benefit])\n- Key features prioritized by MVP\n- Phased roadmap (Week 1: Core; Week 2: Polish)\n- Risks and assumptions\n\nRules: Stay high-level—no code, tech stacks, or UI mocks. Flag unknowns.\n\nOutput: Markdown sections only.\n","text",[3714,4955,4952],{"__ignoreMap":3593},[3598,4957,4958,4959],{},"Claude Opus 4.6 generates phased docs like this, iterating on creative paths humans might miss.",[3687,4960,4961],{},[3660,4962,3695],{"href":4057,"ariaDescribedBy":4963,"dataFootnoteRef":3593,"id":4400},[3693],[3598,4965,4966,4967],{},"Avoid native \"plan\" modes—they fixate on implementation details too early. Archon V3 uses declarative YAML for living workflows, updating plans mid-run.",[3687,4968,4969],{},[3660,4970,4138],{"href":4135,"ariaDescribedBy":4971,"dataFootnoteRef":3593,"id":4137},[3693],[3598,4973,4974,4975,4978,4979,4984],{},"Agent Blueprint's formula drives reliability: ",[3640,4976,4977],{},"Role + Goal + Tools + Rules + Output",".",[3687,4980,4981],{},[3660,4982,4109],{"href":4106,"ariaDescribedBy":4983,"dataFootnoteRef":3593,"id":4222},[3693]," For Planner: Tools minimal (search only), Rules (\"Stay high-level; flag risks\"), Output (Markdown sections).",[3598,4986,4987],{},"Benefits compound. LLMs outperform humans on detail synthesis—let them handle it post-outline. I've used this for 20+ newsletter outlines; it surfaces non-obvious features like \"AI-suggested subtasks\" I overlooked.",[3598,4989,4990,4991,4996],{},"Contrast SpecKit: It stages detailed specs early, locking in assumptions that drift during generation.",[3687,4992,4993],{},[3660,4994,4176],{"href":4173,"ariaDescribedBy":4995,"dataFootnoteRef":3593,"id":4175},[3693]," High-level planning iterates faster.",[3598,4998,4999],{},"For code integration, pipe output to Generator via file:",[3726,5001,5005],{"className":5002,"code":5003,"language":5004,"meta":3593,"style":3593},"language-bash shiki shiki-themes github-light github-dark","claude --prompt planner_prompt.md --output planner_outline.md\ngit add planner_outline.md\n","bash",[3714,5006,5007,5025],{"__ignoreMap":3593},[3734,5008,5009,5013,5016,5019,5022],{"class":3736,"line":3737},[3734,5010,5012],{"class":5011},"sScJk","claude",[3734,5014,5015],{"class":3747}," --prompt",[3734,5017,5018],{"class":3754}," planner_prompt.md",[3734,5020,5021],{"class":3747}," --output",[3734,5023,5024],{"class":3754}," planner_outline.md\n",[3734,5026,5027,5030,5033],{"class":3736,"line":3744},[3734,5028,5029],{"class":5011},"git",[3734,5031,5032],{"class":3754}," add",[3734,5034,5024],{"class":3754},[3598,5036,5037],{},"This keeps plans as artifacts, versioned and reviewable. Scale to repos: Plan entire features from GitHub issues.",[3611,5039,5041],{"id":5040},"the-generators-focused-role-in-the-3-core-agent-harness","The Generator's Focused Role in the 3-Core Agent Harness",[3598,5043,4932,5044,5046,5047],{},[3640,5045,4638],{},", the Generator executes solely on Planner outlines in isolated environments like Git worktrees, producing code, content, or artifacts while avoiding self-evaluation bias and memory bloat. It uses tools sparingly (search, calc) for clean, iterable outputs. Archon V3's Markdown commands make this reusable across tasks.",[3687,5048,5049],{},[3660,5050,4138],{"href":4135,"ariaDescribedBy":5051,"dataFootnoteRef":3593,"id":4147},[3693],[3598,5053,5054],{},"Core loop: Think, tool if needed, observe, repeat—but single-purpose. No chit-chat; output to files for persistence.",[3598,5056,5057],{},"Contrast multi-role agents: Combining generation and eval leads to overconfidence. Generators praise mediocre work; separation forces honesty.",[3598,5059,5060],{},"Examples abound. For newsletters: Planner outlines sections, Generator drafts in Markdown. For code: Implement features in fresh worktrees, committing artifacts.",[3598,5062,5063,5064,5069],{},"This ties to spec-centric flows like SDD or SpecKit—Generator translates living specs without drift.",[3687,5065,5066],{},[3660,5067,4176],{"href":4173,"ariaDescribedBy":5068,"dataFootnoteRef":3593,"id":4185},[3693]," No shared memory; pass via files.",[3598,5071,5072],{},"In practice, isolation prevents hallucinations from long contexts. I've generated 50+ PRs weekly this way—far beyond chat-based tinkering.",[3611,5074,5076],{"id":5075},"why-a-separate-evaluator-delivers-production-quality","Why a Separate Evaluator Delivers Production Quality",[3598,5078,5079,5080,5082,5083],{},"A dedicated Evaluator in the ",[3640,5081,4638],{}," scores outputs adversarially against graded rubrics—like UI axes (design: 25%, originality: 25%, craft: 25%, functionality: 25%)—iterating until standards hit and upgrading GSD's pass\u002Ffail to nuanced critique assuming bugs exist. Anthropic stresses holistic excellence over TDD alone.",[3687,5084,5085],{},[3660,5086,3695],{"href":4057,"ariaDescribedBy":5087,"dataFootnoteRef":3593,"id":5088},[3693],"user-content-fnref-1-8",[3598,5090,5091],{},"Rubrics weight criteria explicitly. UI example: \"Design: Modern, intuitive? Originality: Avoids gradients? Craft: Typography\u002Fspacing precise? Functionality: Playwright-tested?\"",[3598,5093,5094],{},"Why separate? Generators optimize for completion, not quality—they hallucinate strengths. Evaluator simulates users, probing edge cases.",[3598,5096,5097,5098],{},"Loop: Critique → Regenerate → Rescore until pass. Agent Blueprint pairs evaluator-optimizer for this.",[3687,5099,5100],{},[3660,5101,4109],{"href":4106,"ariaDescribedBy":5102,"dataFootnoteRef":3593,"id":4240},[3693],[3598,5104,5105],{},"Examples scale to subjective work. UI grading rejects cookie-cutter designs; content rubrics check voice alignment.",[3611,5107,5109],{"id":5108},"essential-primitives-for-reliable-3-core-agent-harnesses","Essential Primitives for Reliable 3-Core Agent Harnesses",[3598,5111,5112,5113,5116,5117,5122],{},"Production ",[3640,5114,5115],{},"3-core agent harnesses"," require \"boring\" primitives like dual tool registries (207+ commands), tiered permissions (18 bash modules), JSON state persistence, token budgeting with projections, structured streaming, and verification. As detailed in Nate B. Jones's analysis of Claude's leaked code, these essentials harden demos into scalable systems handling crashes, controlling costs, and ensuring 24\u002F7 operation.",[3687,5118,5119],{},[3660,5120,4065],{"href":3691,"ariaDescribedBy":5121,"dataFootnoteRef":3593,"id":4192},[3693]," Without them, you're prototyping, not producing.",[3634,5124,5125,5133,5141,5144,5147,5150],{},[3637,5126,5127,5128],{},"Dual tool registries (207+ commands)",[3687,5129,5130],{},[3660,5131,4065],{"href":3691,"ariaDescribedBy":5132,"dataFootnoteRef":3593,"id":4264},[3693],[3637,5134,5135,5136],{},"Tiered permissions (18 bash modules)",[3687,5137,5138],{},[3660,5139,4065],{"href":3691,"ariaDescribedBy":5140,"dataFootnoteRef":3593,"id":4275},[3693],[3637,5142,5143],{},"JSON state persistence",[3637,5145,5146],{},"Token budgeting with projections",[3637,5148,5149],{},"Structured streaming",[3637,5151,5152],{},"Verification",[3598,5154,5155,5156],{},"Nate B. Jones details 12 keys from the Claude code leak: Registries filter runtime tools dynamically; permissions gate risks (built-in > plugins > user-defined).",[3687,5157,5158],{},[3660,5159,4065],{"href":3691,"ariaDescribedBy":5160,"dataFootnoteRef":3593,"id":4371},[3693],[3598,5162,5163,5166],{},[3640,5164,5165],{},"State Persistence",": Full session JSON (messages, tokens, config) for crash recovery.",[3598,5168,5169],{},"Example:",[3726,5171,5173],{"className":3728,"code":5172,"language":3730,"meta":3593,"style":3593},"{\n  \"session\": {\n    \"messages\": [...],\n    \"tokens_used\": 12500,\n    \"config\": {\"model\": \"claude-3.5-sonnet\"}\n  }\n}\n",[3714,5174,5175,5179,5187,5201,5213,5231,5236],{"__ignoreMap":3593},[3734,5176,5177],{"class":3736,"line":3737},[3734,5178,3741],{"class":3740},[3734,5180,5181,5184],{"class":3736,"line":3744},[3734,5182,5183],{"class":3747},"  \"session\"",[3734,5185,5186],{"class":3740},": {\n",[3734,5188,5189,5192,5194,5198],{"class":3736,"line":3761},[3734,5190,5191],{"class":3747},"    \"messages\"",[3734,5193,4729],{"class":3740},[3734,5195,5197],{"class":5196},"s7hpK","...",[3734,5199,5200],{"class":3740},"],\n",[3734,5202,5203,5206,5208,5211],{"class":3736,"line":3770},[3734,5204,5205],{"class":3747},"    \"tokens_used\"",[3734,5207,3751],{"class":3740},[3734,5209,5210],{"class":3747},"12500",[3734,5212,3758],{"class":3740},[3734,5214,5215,5218,5221,5224,5226,5229],{"class":3736,"line":3779},[3734,5216,5217],{"class":3747},"    \"config\"",[3734,5219,5220],{"class":3740},": {",[3734,5222,5223],{"class":3747},"\"model\"",[3734,5225,3751],{"class":3740},[3734,5227,5228],{"class":3754},"\"claude-3.5-sonnet\"",[3734,5230,3838],{"class":3740},[3734,5232,5233],{"class":3736,"line":3787},[3734,5234,5235],{"class":3740},"  }\n",[3734,5237,5238],{"class":3736,"line":3793},[3734,5239,3838],{"class":3740},[3598,5241,5242],{},"Save on every tool call; resume seamlessly.",[3598,5244,5245,5248],{},[3640,5246,5247],{},"Budgeting",": Hard limits + projections. Pre-compute: \"This task forecasts 50k input + 20k output tokens.\"",[3726,5250,5254],{"className":5251,"code":5252,"language":5253,"meta":3593,"style":3593},"language-python shiki shiki-themes github-light github-dark","def project_tokens(prompt_len, steps=10):\n    return prompt_len * 1.2 * steps  # Conservative multiplier\nif project_tokens(len(planner_outline)) > 100000:\n    abort(\"Budget exceeded\")\n","python",[3714,5255,5256,5261,5266,5271],{"__ignoreMap":3593},[3734,5257,5258],{"class":3736,"line":3737},[3734,5259,5260],{},"def project_tokens(prompt_len, steps=10):\n",[3734,5262,5263],{"class":3736,"line":3744},[3734,5264,5265],{},"    return prompt_len * 1.2 * steps  # Conservative multiplier\n",[3734,5267,5268],{"class":3736,"line":3761},[3734,5269,5270],{},"if project_tokens(len(planner_outline)) > 100000:\n",[3734,5272,5273],{"class":3736,"line":3770},[3734,5274,5275],{},"    abort(\"Budget exceeded\")\n",[3598,5277,5278],{},"I've seen major cost savings with budgeting alone on weekly PR batches.",[3598,5280,5281,5284,5285],{},[3640,5282,5283],{},"Observability",": Typed events\u002Flogs. Stream: ",[3714,5286,5287],{},"{\"event\": \"tool_call\", \"tool\": \"git\", \"result\": \"committed\"}",[3598,5289,5290,5293],{},[3640,5291,5292],{},"Tool Registry",": Metadata-driven:",[3726,5295,5297],{"className":4293,"code":5296,"language":4295,"meta":3593,"style":3593},"tools:\n  git:\n    desc: \"Git operations\"\n    perms: \"built-in\"\n    args: [\"commit\", \"push\"]\n  playwright:\n    desc: \"UI tests\"\n    perms: \"plugin\"\n",[3714,5298,5299,5305,5312,5322,5332,5349,5356,5365],{"__ignoreMap":3593},[3734,5300,5301,5303],{"class":3736,"line":3737},[3734,5302,4303],{"class":4302},[3734,5304,4306],{"class":3740},[3734,5306,5307,5310],{"class":3736,"line":3744},[3734,5308,5309],{"class":4302},"  git",[3734,5311,4306],{"class":3740},[3734,5313,5314,5317,5319],{"class":3736,"line":3761},[3734,5315,5316],{"class":4302},"    desc",[3734,5318,3751],{"class":3740},[3734,5320,5321],{"class":3754},"\"Git operations\"\n",[3734,5323,5324,5327,5329],{"class":3736,"line":3770},[3734,5325,5326],{"class":4302},"    perms",[3734,5328,3751],{"class":3740},[3734,5330,5331],{"class":3754},"\"built-in\"\n",[3734,5333,5334,5337,5339,5342,5344,5347],{"class":3736,"line":3779},[3734,5335,5336],{"class":4302},"    args",[3734,5338,4729],{"class":3740},[3734,5340,5341],{"class":3754},"\"commit\"",[3734,5343,4794],{"class":3740},[3734,5345,5346],{"class":3754},"\"push\"",[3734,5348,4735],{"class":3740},[3734,5350,5351,5354],{"class":3736,"line":3787},[3734,5352,5353],{"class":4302},"  playwright",[3734,5355,4306],{"class":3740},[3734,5357,5358,5360,5362],{"class":3736,"line":3793},[3734,5359,5316],{"class":4302},[3734,5361,3751],{"class":3740},[3734,5363,5364],{"class":3754},"\"UI tests\"\n",[3734,5366,5367,5369,5371],{"class":3736,"line":3799},[3734,5368,5326],{"class":4302},[3734,5370,3751],{"class":3740},[3734,5372,5373],{"class":3754},"\"plugin\"\n",[3598,5375,5376,5379,5380,5383],{},[3640,5377,5378],{},"Permissions",": State objects—no world access. ",[3714,5381,5382],{},"permissions: {\"bash\": [\"ls\", \"cat\"], \"deny\": [\"rm -rf\"]}",[3687,5384,5385],{},[3660,5386,4065],{"href":3691,"ariaDescribedBy":5387,"dataFootnoteRef":3593,"id":5388},[3693],"user-content-fnref-2-7",[3598,5390,5391,5393],{},[3640,5392,5152],{},": Guardrail tests post-output. Archon V3 adds pre\u002Fpost-tool hooks:",[3726,5395,5397],{"className":4293,"code":5396,"language":4295,"meta":3593,"style":3593},"hooks:\n  pre-tool: \"validate_args(tool, args)\"\n  post-tool: \"verify_output_schema(result)\"\n",[3714,5398,5399,5406,5416],{"__ignoreMap":3593},[3734,5400,5401,5404],{"class":3736,"line":3737},[3734,5402,5403],{"class":4302},"hooks",[3734,5405,4306],{"class":3740},[3734,5407,5408,5411,5413],{"class":3736,"line":3744},[3734,5409,5410],{"class":4302},"  pre-tool",[3734,5412,3751],{"class":3740},[3734,5414,5415],{"class":3754},"\"validate_args(tool, args)\"\n",[3734,5417,5418,5421,5423],{"class":3736,"line":3761},[3734,5419,5420],{"class":4302},"  post-tool",[3734,5422,3751],{"class":3740},[3734,5424,5425],{"class":3754},"\"verify_output_schema(result)\"\n",[3598,5427,5428,5431,5432],{},[3640,5429,5430],{},"Agent Typing",": Modes like explore\u002Fplan\u002Fverify; permissions evolve with state.",[3687,5433,5434],{},[3660,5435,4065],{"href":3691,"ariaDescribedBy":5436,"dataFootnoteRef":3593,"id":5437},[3693],"user-content-fnref-2-8",[3598,5439,5440],{},"Dynamic pools swap tools mid-run. Skip these, long tasks fail frequently—primitives ensure 24\u002F7 operation.",[3611,5442,5444],{"id":5443},"building-and-scaling-your-3-core-agent-harness","Building and Scaling Your 3-Core Agent Harness",[3598,5446,5447,5448,5454,5460],{},"Assemble a 3-core agent harness via YAML\u002FDAGs (Archon V3), Claude teams, or SpecKit staging: Define each core with Role+Goal+Tools+Rules+Output, layer primitives, master single-agent first, then scale multi for skills.",[3687,5449,5450],{},[3660,5451,4109],{"href":4106,"ariaDescribedBy":5452,"dataFootnoteRef":3593,"id":5453},[3693],"user-content-fnref-3-5",[3687,5455,5456],{},[3660,5457,4138],{"href":4135,"ariaDescribedBy":5458,"dataFootnoteRef":3593,"id":5459},[3693],"user-content-fnref-4-3"," GitHub Actions trigger workflows; minimal tools\u002Fmemory.",[3598,5462,5463],{},"Steps:",[3992,5465,5466,5476,5482],{},[3637,5467,5468,5471,5472,5475],{},[3640,5469,5470],{},"Planner Prompt",": \"Role: Product lead. Goal: ",[3734,5473,5474],{},"Task",". Tools: Search. Rules: High-level only. Output: Markdown outline.\"",[3637,5477,5478,5481],{},[3640,5479,5480],{},"Generator",": \"Role: Engineer. Goal: Implement outline. Tools: Git, calc. Rules: Isolated worktree. Output: Committed artifacts.\"",[3637,5483,5484,5487],{},[3640,5485,5486],{},"Evaluator",": \"Role: QA adversary. Goal: Score vs rubric. Tools: Playwright. Rules: Assume flaws. Output: Scores + fixes.\"",[3598,5489,5490],{},"Add primitives: Token budgeter, JSON state.",[3598,5492,5493,5494],{},"Test on messy inputs. Ready starters: GSD + rubrics; Archon builtins (fix-issue, idea-to-PR).",[3687,5495,5496],{},[3660,5497,4138],{"href":4135,"ariaDescribedBy":5498,"dataFootnoteRef":3593,"id":5499},[3693],"user-content-fnref-4-4",[3598,5501,5502],{},"Scaling: Orchestrators route; parallelism via DAGs.",[3598,5504,5505],{},"Harness over frameworks—I've shipped 10x faster.",[3611,5507,5509],{"id":5508},"trade-offs-misconceptions-and-when-to-skip-agents","Trade-offs, Misconceptions, and When to Skip Agents",[3598,5511,5512,5513],{},"The 3-core agent harness swaps framework \"safety\" for speed but requires primitive investment; it costs more upfront yet runs leaner long-term, with budgeting taming expenses. Misconceptions: Micro-tasks aren't needed (LLMs obsolete them); always multi-agent (master single first). Skip for deterministic chaining\u002Frouting—use Anthropic's 5 workflows.",[3687,5514,5515],{},[3660,5516,4109],{"href":4106,"ariaDescribedBy":5517,"dataFootnoteRef":3593,"id":5518},[3693],"user-content-fnref-3-6",[3598,5520,5521],{},"Trade-offs:",[3634,5523,5524,5530,5536],{},[3637,5525,5526,5529],{},[3640,5527,5528],{},"Build Time",": Primitives take days vs. framework npm install.",[3637,5531,5532,5535],{},[3640,5533,5534],{},"Eval Subjectivity",": Rubrics need tuning for creative work.",[3637,5537,5538,5541,5542],{},[3640,5539,5540],{},"Costs",": Long tasks hit tokens—mitigate with projections.",[3687,5543,5544],{},[3660,5545,4065],{"href":3691,"ariaDescribedBy":5546,"dataFootnoteRef":3593,"id":5547},[3693],"user-content-fnref-2-9",[3598,5549,5550,5551,5557],{},"Risks: No permissions = demo, not product.",[3687,5552,5553],{},[3660,5554,4065],{"href":3691,"ariaDescribedBy":5555,"dataFootnoteRef":3593,"id":5556},[3693],"user-content-fnref-2-10"," Frameworks aren't future-proof; LLMs evolve.",[3598,5559,5560],{},"When to skip: Simple transforms? Chain prompts. Agents shine on open-ended horizons.",[3598,5562,5563],{},"Open: Rubric standards? This works today—iterate your own.",[3598,5565,5566],{},"Pick a stalled repo project. Strip any agent setup to these three roles using Role+Goal+Tools+Rules+Output. Add token budgeting as your first primitive. Run on one feature, measure output quality and costs before scaling—you'll ship faster than with frameworks.",[3982,5568,5570,5573],{"className":5569,"dataFootnotes":3593},[3985],[3611,5571,3990],{"className":5572,"id":3693},[3989],[3992,5574,5575,5619,5680,5715,5740],{},[3637,5576,5577,5578,4423,5581,4423,5586,4423,5591,4423,5596,4423,5601,4423,5606,4423,5611],{"id":4417},"AI LABS, \"Anthropic: Agent Harnesses Need Only 3 Core Agents\" (YouTube summary). ",[3660,5579,4004],{"href":4421,"ariaLabel":4001,"className":5580,"dataFootnoteBackref":3593},[4003],[3660,5582,4004,5584],{"href":4426,"ariaLabel":4427,"className":5583,"dataFootnoteBackref":3593},[4003],[3687,5585,4065],{},[3660,5587,4004,5589],{"href":4433,"ariaLabel":4434,"className":5588,"dataFootnoteBackref":3593},[4003],[3687,5590,4109],{},[3660,5592,4004,5594],{"href":4440,"ariaLabel":4441,"className":5593,"dataFootnoteBackref":3593},[4003],[3687,5595,4138],{},[3660,5597,4004,5599],{"href":4447,"ariaLabel":4448,"className":5598,"dataFootnoteBackref":3593},[4003],[3687,5600,4176],{},[3660,5602,4004,5604],{"href":4454,"ariaLabel":4455,"className":5603,"dataFootnoteBackref":3593},[4003],[3687,5605,4360],{},[3660,5607,4004,5609],{"href":4461,"ariaLabel":4462,"className":5608,"dataFootnoteBackref":3593},[4003],[3687,5610,4466],{},[3660,5612,4004,5616],{"href":5613,"ariaLabel":5614,"className":5615,"dataFootnoteBackref":3593},"#user-content-fnref-1-8","Back to reference 1-8",[4003],[3687,5617,5618],{},"8",[3637,5620,5621,5622,4423,5625,4423,5630,4423,5635,4423,5640,4423,5645,4423,5650,4423,5657,4423,5664,4423,5672],{"id":3996},"Nate B. Jones, \"Claude Code Leak: 12 Primitives for Production Agents\" (YouTube). ",[3660,5623,4004],{"href":4000,"ariaLabel":4472,"className":5624,"dataFootnoteBackref":3593},[4003],[3660,5626,4004,5628],{"href":4476,"ariaLabel":4477,"className":5627,"dataFootnoteBackref":3593},[4003],[3687,5629,4065],{},[3660,5631,4004,5633],{"href":4483,"ariaLabel":4484,"className":5632,"dataFootnoteBackref":3593},[4003],[3687,5634,4109],{},[3660,5636,4004,5638],{"href":4490,"ariaLabel":4491,"className":5637,"dataFootnoteBackref":3593},[4003],[3687,5639,4138],{},[3660,5641,4004,5643],{"href":4497,"ariaLabel":4498,"className":5642,"dataFootnoteBackref":3593},[4003],[3687,5644,4176],{},[3660,5646,4004,5648],{"href":4504,"ariaLabel":4505,"className":5647,"dataFootnoteBackref":3593},[4003],[3687,5649,4360],{},[3660,5651,4004,5655],{"href":5652,"ariaLabel":5653,"className":5654,"dataFootnoteBackref":3593},"#user-content-fnref-2-7","Back to reference 2-7",[4003],[3687,5656,4466],{},[3660,5658,4004,5662],{"href":5659,"ariaLabel":5660,"className":5661,"dataFootnoteBackref":3593},"#user-content-fnref-2-8","Back to reference 2-8",[4003],[3687,5663,5618],{},[3660,5665,4004,5669],{"href":5666,"ariaLabel":5667,"className":5668,"dataFootnoteBackref":3593},"#user-content-fnref-2-9","Back to reference 2-9",[4003],[3687,5670,5671],{},"9",[3660,5673,4004,5677],{"href":5674,"ariaLabel":5675,"className":5676,"dataFootnoteBackref":3593},"#user-content-fnref-2-10","Back to reference 2-10",[4003],[3687,5678,5679],{},"10",[3637,5681,5682,5683,4423,5686,4423,5691,4423,5696,4423,5701,4423,5708],{"id":4511},"Lukas Margerie, \"Agent Blueprint: Role + Goal + Tools + Rules + Output\" (YouTube). ",[3660,5684,4004],{"href":4515,"ariaLabel":4516,"className":5685,"dataFootnoteBackref":3593},[4003],[3660,5687,4004,5689],{"href":4520,"ariaLabel":4521,"className":5688,"dataFootnoteBackref":3593},[4003],[3687,5690,4065],{},[3660,5692,4004,5694],{"href":4527,"ariaLabel":4528,"className":5693,"dataFootnoteBackref":3593},[4003],[3687,5695,4109],{},[3660,5697,4004,5699],{"href":4534,"ariaLabel":4535,"className":5698,"dataFootnoteBackref":3593},[4003],[3687,5700,4138],{},[3660,5702,4004,5706],{"href":5703,"ariaLabel":5704,"className":5705,"dataFootnoteBackref":3593},"#user-content-fnref-3-5","Back to reference 3-5",[4003],[3687,5707,4176],{},[3660,5709,4004,5713],{"href":5710,"ariaLabel":5711,"className":5712,"dataFootnoteBackref":3593},"#user-content-fnref-3-6","Back to reference 3-6",[4003],[3687,5714,4360],{},[3637,5716,5717,5718,4423,5721,4423,5726,4423,5733],{"id":4541},"DIY Smart Code, \"Archon V3: YAML Harnesses for AI Coding Agents\" (YouTube). ",[3660,5719,4004],{"href":4545,"ariaLabel":4546,"className":5720,"dataFootnoteBackref":3593},[4003],[3660,5722,4004,5724],{"href":4550,"ariaLabel":4551,"className":5723,"dataFootnoteBackref":3593},[4003],[3687,5725,4065],{},[3660,5727,4004,5731],{"href":5728,"ariaLabel":5729,"className":5730,"dataFootnoteBackref":3593},"#user-content-fnref-4-3","Back to reference 4-3",[4003],[3687,5732,4109],{},[3660,5734,4004,5738],{"href":5735,"ariaLabel":5736,"className":5737,"dataFootnoteBackref":3593},"#user-content-fnref-4-4","Back to reference 4-4",[4003],[3687,5739,4138],{},[3637,5741,5742,5743,4423,5746],{"id":4557},"Level Up Coding, \"SDD Makes Specs the Single Source of Truth via AI Agents.\" ",[3660,5744,4004],{"href":4561,"ariaLabel":4562,"className":5745,"dataFootnoteBackref":3593},[4003],[3660,5747,4004,5749],{"href":4566,"ariaLabel":4567,"className":5748,"dataFootnoteBackref":3593},[4003],[3687,5750,4065],{},[4006,5752,5753],{},"html pre.shiki code .s9eBZ, html code.shiki .s9eBZ{--shiki-default:#22863A;--shiki-dark:#85E89D}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html pre.shiki code .sScJk, html code.shiki .sScJk{--shiki-default:#6F42C1;--shiki-dark:#B392F0}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}html pre.shiki code .s7hpK, html code.shiki .s7hpK{--shiki-default:#B31D28;--shiki-default-font-style:italic;--shiki-dark:#FDAEB7;--shiki-dark-font-style:italic}",{"title":3593,"searchDepth":3744,"depth":3744,"links":5755},[5756,5757,5758,5759,5760,5761,5762,5763],{"id":4887,"depth":3744,"text":4888},{"id":4928,"depth":3744,"text":4929},{"id":5040,"depth":3744,"text":5041},{"id":5075,"depth":3744,"text":5076},{"id":5108,"depth":3744,"text":5109},{"id":5443,"depth":3744,"text":5444},{"id":5508,"depth":3744,"text":5509},{"id":3693,"depth":3744,"text":3990},"ai-llms","Production AI agent systems thrive with a 3-core agent harness—Planner for high-level outlines, Generator for implementation, Evaluator for adversarial critique using graded rubrics—stripping 90% bloated framework overhead per Anthropic tests.1 This leverages modern LLMs' 1M+ token windows and coherence for reliable, scalable outputs on long-horizon tasks.",[4638,4615,5767,5768,5769,5770,4611,5771],"planner generator evaluator","agent frameworks","Claude Opus","AI agent primitives","minimalist agents",{},"Learn why production AI agents need just Planner, Generator, and Evaluator—not frameworks. Anthropic tests show 90% framework bloat is obsolete. Build scalable harnesses with primitives for reliable outputs in code, UI, and content.","3-Core Agent Harness for Production AI","\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-article",[],{"intro":5778,"why-production-agent-systems-need-a-3-core-agent-harness":4888,"the-planners-role-in-a-3-core-agent-harness":4929,"the-generators-focused-role-in-the-3-core-agent-harness":5041,"why-a-separate-evaluator-delivers-production-quality":5076,"essential-primitives-for-reliable-3-core-agent-harnesses":5109,"building-and-scaling-your-3-core-agent-harness":5444,"trade-offs-misconceptions-and-when-to-skip-agents":5509},"Introduction",{"title":4629,"description":5765},{"loc":5775},"3-core-agent-harness-planner-generator-evaluator-production-ai-agents","articles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-article","pEqxcDCwoMVirkXg2PYcYkpR4uAFqYg3dO1nMbJGObo",{"id":5785,"title":5786,"ai_summary":5787,"author":3593,"body":5788,"category":5764,"date_modified":4020,"description":6379,"excerpt":3593,"extension":4021,"faq":4020,"keywords":6380,"meta":6385,"meta_description":6386,"meta_title":6387,"navigation":4032,"path":6388,"primary_keyword":5852,"published_at":4020,"related_posts":6389,"sections":6390,"seo":6391,"sitemap":6392,"slug":5781,"status":4040,"stem":6393,"__hash__":6394},"articles\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-baseline-post-merge-article.md","The 3-Core Agent Harness: Planner, Generator, Evaluator for Reliable Production AI Agents","Production AI agent systems require a 3-core agent harness—Planner for task decomposition, Generator for execution, Evaluator for unbiased verification—to fix single-agent issues like underspecification, self-evaluation bias, and context limits, ensuring reliable outputs on complex, long-running tasks.",{"type":3595,"value":5789,"toc":6369},[5790,5796,5799,5807,5811,5814,5821,5833,5840,5843,5847,5854,5863,5866,5884,5891,5894,5898,5901,5904,5907,5927,5934,5937,6026,6034,6038,6041,6048,6051,6071,6079,6087,6090,6094,6100,6105,6108,6113,6116,6127,6132,6139,6207,6210,6214,6220,6232,6235,6260,6268,6271,6275,6280,6290,6296,6307,6310,6330,6333,6337,6343,6346,6363,6366],[3598,5791,5792,5793,5795],{},"Production AI agent systems demand a ",[3640,5794,4638],{},"—Planner for task decomposition, Generator for execution, Evaluator for unbiased verification—because single agents suffer from underspecification, self-bias, and context limits, delivering unreliable outputs on complex tasks. (38 words)",[3598,5797,5798],{},"Picture this: You're a developer tasked with building a full-stack feature using a single-LLM agent. It spits out a toy dashboard—missing auth, no error handling, half-baked UI. Hours vanish fixing hallucinations and gaps. Human teams avoid this by separating planning, coding, and testing. Agents need the same discipline.",[3598,5800,5801,5802,5806],{},"Anthropic's research nails why single agents crumble in production: they underscope tasks, rubber-stamp their own bugs, and panic at context limits.",[3687,5803,5804],{},[3734,5805,3695],{}," This harness forms a feedback loop, like a GAN for code generation, where agents critique each other. Builders shipping AI products face demo-to-production chasms today—skyrocketing debug time, token costs eating margins. We'll cover why singles fail, the harness blueprint, core roles, scaling patterns, framework limits, prod fixes, and your first build.",[3611,5808,5810],{"id":5809},"why-single-agent-systems-fail-production-tasks","Why Single-Agent Systems Fail Production Tasks",[3598,5812,5813],{},"Single-agent LLM systems fail production tasks due to underspecification—where vague prompts lead to simplified outputs—their inability to self-critique without bias, context window anxiety that rushes incomplete work, and lack of structured planning for multi-step problems, as shown in Anthropic's analysis of real-world agent breakdowns. (62 words)",[3598,5815,5816,5817],{},"High-level prompts sound clear to humans but trip up LLMs. Take \"build a user dashboard\": a single agent might deliver a static HTML mockup, skipping backend integration or scalability. Engr. Mejba Ahmed documented this in his Anthropic harness experiments: agents consistently produced \"toy versions,\" ignoring full specs like persistence or security.",[3687,5818,5819],{},[3734,5820,4065],{},[3598,5822,5823,5824,5828,5829],{},"Self-evaluation bias compounds the mess. LLMs generating code often approve it uncritically, spotting syntax nits but missing logic flaws. Nurunnubi Talukder puts it bluntly: \"Having the same agent generate and then judge its own output just doesn’t really work. Decoupling those roles seems pretty key.\"",[3687,5825,5826],{},[3734,5827,4109],{}," Studies confirm LLMs inflate their scores by 20-30% on flawed work.",[3687,5830,5831],{},[3734,5832,4138],{},[3598,5834,5835,5836],{},"Context anxiety hits long tasks hardest. As tokens pile up, agents truncate reasoning or output prematurely. Atal Upadhyay notes workflow failures here: no native decomposition means no handling for sprints or state.",[3687,5837,5838],{},[3734,5839,4176],{},[3598,5841,5842],{},"Humans sidestep this with role separation—PM plans, dev builds, QA tests. Single agents mash them, breeding errors. Production demands the split.",[3611,5844,5846],{"id":5845},"what-is-the-3-core-agent-harness","What Is the 3-Core Agent Harness?",[3598,5848,5849,5850,5853],{},"The 3-core ",[3640,5851,5852],{},"agent harness"," is an architecture with specialized Planner, Generator, and Evaluator agents that decomposes high-level goals into specs, executes them iteratively, and verifies outputs objectively, overcoming single-agent limits for reliable production AI applications like full-stack development or long-running automations. This setup forms a tight feedback loop: Planner sets contracts, Generator builds sprints, Evaluator scores and iterates—mimicking GANs but for tasks. (78 words)",[3598,5855,5856,5857,5862],{},"It's not just prompts; it's infrastructure. Anthropic's 2026 paper on long-running development formalized it, with Zylos Research expanding on patterns.",[3687,5858,5859,5860],{},"[6]",[3734,5861,4466],{}," Separation kills bias: Generator can't fudge evals.",[3598,5864,5865],{},"The loop runs like this:",[3634,5867,5868,5874,5879],{},[3637,5869,5870,5873],{},[3640,5871,5872],{},"Planner"," outputs sprint specs with \"done\" criteria.",[3637,5875,5876,5878],{},[3640,5877,5480],{}," executes one sprint at a time.",[3637,5880,5881,5883],{},[3640,5882,5486],{}," tests via tools (e.g., Playwright for UI), scores, loops back if needed.",[3598,5885,5886,5887],{},"This enables tool use—evaluators run browsers, not just read code. Upadhyay calls it shifting from \"reading about the work\" to \"experiencing it.\"",[3687,5888,5889],{},[3734,5890,4176],{},[3598,5892,5893],{},"Why now? Demos hide flaws; production exposes them under load. Harnesses bridge that, cutting debug time I've seen drop 40% in my builds.",[3611,5895,5897],{"id":5896},"the-planner-decomposing-tasks-into-actionable-specs","The Planner: Decomposing Tasks into Actionable Specs",[3598,5899,5900],{},"The Planner agent transforms vague user prompts into detailed product specs by breaking tasks into sequenced sub-tasks or sprints, defining \"done\" criteria, and tracking shared state, preventing underscoping and enabling ambitious, complete outputs without over-specifying implementation details. (50 words)",[3598,5902,5903],{},"Input a goal like \"build a task manager app.\" Output: Sprint 1 (auth + DB schema, criteria: JWT login passes, data persists); Sprint 2 (UI CRUD, criteria: E2E tests green). No code dictums—just contracts.",[3598,5905,5906],{},"Principles keep it sharp:",[3634,5908,5909,5915,5921],{},[3637,5910,5911,5914],{},[3640,5912,5913],{},"Ambitious scope",": Aim high; partial wins beat toys.",[3637,5916,5917,5920],{},[3640,5918,5919],{},"Implementation agnostic",": Specs focus outcomes, not stacks.",[3637,5922,5923,5926],{},[3640,5924,5925],{},"State awareness",": Track files, progress.",[3598,5928,5929,5930],{},"Atal Upadhyay's example: Decomposing a web scraper into auth, crawl, parse sprints yielded 2x completeness vs. singles.",[3687,5931,5932],{},[3734,5933,4176],{},[3598,5935,5936],{},"Pseudocode for a Planner prompt:",[3726,5938,5940],{"className":5251,"code":5939,"language":5253,"meta":3593,"style":3593},"prompt = \"\"\"\nYou are the Planner. Given a high-level goal: {goal}\n\nOutput JSON:\n{{\n  \"sprints\": [\n    {{\n      \"id\": 1,\n      \"description\": \"Detailed sub-task\",\n      \"done_criteria\": [\"Testable outcomes\"],\n      \"state_files\": [\"shared.json\"]\n    }}\n  ],\n  \"total_sprints\": N\n}}\nAmbitious but realistic. No implementation details.\n\"\"\"\n",[3714,5941,5942,5947,5952,5957,5962,5967,5972,5977,5982,5987,5992,5997,6002,6006,6011,6016,6021],{"__ignoreMap":3593},[3734,5943,5944],{"class":3736,"line":3737},[3734,5945,5946],{},"prompt = \"\"\"\n",[3734,5948,5949],{"class":3736,"line":3744},[3734,5950,5951],{},"You are the Planner. Given a high-level goal: {goal}\n",[3734,5953,5954],{"class":3736,"line":3761},[3734,5955,5956],{"emptyLinePlaceholder":4032},"\n",[3734,5958,5959],{"class":3736,"line":3770},[3734,5960,5961],{},"Output JSON:\n",[3734,5963,5964],{"class":3736,"line":3779},[3734,5965,5966],{},"{{\n",[3734,5968,5969],{"class":3736,"line":3787},[3734,5970,5971],{},"  \"sprints\": [\n",[3734,5973,5974],{"class":3736,"line":3793},[3734,5975,5976],{},"    {{\n",[3734,5978,5979],{"class":3736,"line":3799},[3734,5980,5981],{},"      \"id\": 1,\n",[3734,5983,5984],{"class":3736,"line":3807},[3734,5985,5986],{},"      \"description\": \"Detailed sub-task\",\n",[3734,5988,5989],{"class":3736,"line":3815},[3734,5990,5991],{},"      \"done_criteria\": [\"Testable outcomes\"],\n",[3734,5993,5994],{"class":3736,"line":3823},[3734,5995,5996],{},"      \"state_files\": [\"shared.json\"]\n",[3734,5998,5999],{"class":3736,"line":3829},[3734,6000,6001],{},"    }}\n",[3734,6003,6004],{"class":3736,"line":3835},[3734,6005,3796],{},[3734,6007,6008],{"class":3736,"line":4822},[3734,6009,6010],{},"  \"total_sprints\": N\n",[3734,6012,6013],{"class":3736,"line":4830},[3734,6014,6015],{},"}}\n",[3734,6017,6018],{"class":3736,"line":4840},[3734,6019,6020],{},"Ambitious but realistic. No implementation details.\n",[3734,6022,6023],{"class":3736,"line":4850},[3734,6024,6025],{},"\"\"\"\n",[3598,6027,6028,6029,6033],{},"Avijit M nails the shift: \"We’ve been building AI apps the wrong way. Real-world problems don’t work like one prompt → one output.\"",[3687,6030,6031],{},[3734,6032,5618],{}," Planners force clarity.",[3611,6035,6037],{"id":6036},"generator-and-evaluator-execution-meets-verification","Generator and Evaluator: Execution Meets Verification",[3598,6039,6040],{},"The Generator executes Planner specs within sprints, focusing purely on building code or content, while the separate Evaluator tests outputs using tools like browser automation or test suites for objective scoring, eliminating self-bias and ensuring functional results through feedback loops. (52 words)",[3598,6042,6043,6044],{},"Generator takes a sprint contract: \"Build auth endpoint. Criteria: POST \u002Flogin returns JWT, stores user.\" It outputs code, negotiating if specs shift. Mejba Ahmed's builds showed generators hit 85% sprint success when focused.",[3687,6045,6046],{},[3734,6047,4065],{},[3598,6049,6050],{},"Evaluator is the star. Armed with tools:",[3634,6052,6053,6059,6065],{},[3637,6054,6055,6058],{},[3640,6056,6057],{},"Playwright"," for UI: Launches app, clicks flows.",[3637,6060,6061,6064],{},[3640,6062,6063],{},"Linters\u002Ftests"," for code: Runs suite, flags fails.",[3637,6066,6067,6070],{},[3640,6068,6069],{},"Rubrics"," for subjective: Scores 1-10 on criteria.",[3598,6072,6073,6074,6078],{},"No more \"nod and pretend.\" Upadhyay: \"Text-only eval is insufficient... Use tools to experience the work.\"",[3687,6075,6076],{},[3734,6077,4176],{}," Scores feed back: \u003C7? Regenerate.",[3598,6080,6081,6082,6086],{},"Contrast self-eval: Ahmed found separate critics caught 3x more bugs.",[3687,6083,6084],{},[3734,6085,4065],{}," In harnesses, Generator builds blindly; Evaluator judges coldly. Loops cap at budgets—e.g., 3 tries per sprint.",[3598,6088,6089],{},"This duo powers the harness core. I've refactored agent fails this way; quality jumps.",[3611,6091,6093],{"id":6092},"agent-harness-patterns-for-scaling-complexity","Agent Harness Patterns for Scaling Complexity",[3598,6095,6096,6099],{},[3640,6097,6098],{},"Agent harness"," patterns scale from Simple Loop (single agent for quick validations) to Generator-Evaluator pairs for subjective quality, up to full 3-core harness for complex tasks, matching architecture to task needs for optimal cost and reliability. Pick by complexity: low for math checks, full for apps. (56 words)",[3598,6101,6102],{},[3640,6103,6104],{},"Pattern A: Simple Loop",[3598,6106,6107],{},"One agent loops with hard checks (linters). Low tokens, fast for scripts. Cost: ~10% of full.",[3598,6109,6110],{},[3640,6111,6112],{},"Pattern B: Gen-Eval Pair",[3598,6114,6115],{},"Two agents: Gen builds, Eval rubrics\u002Fscores. Mid-tasks like content. Rubric example:",[3634,6117,6118,6121,6124],{},[3637,6119,6120],{},"Functionality: 40%",[3637,6122,6123],{},"Best practices: 30%",[3637,6125,6126],{},"Edge cases: 30%",[3598,6128,6129],{},[3640,6130,6131],{},"Pattern C: Full PGE (Planner + Gen + Eval)",[3598,6133,6134,6135],{},"Sprints for stacks. Upadhyay's guide: Use for >5 steps.",[3687,6136,6137],{},[3734,6138,4176],{},[6140,6141,6142,6161],"table",{},[6143,6144,6145],"thead",{},[6146,6147,6148,6152,6155,6158],"tr",{},[6149,6150,6151],"th",{},"Pattern",[6149,6153,6154],{},"Task Fit",[6149,6156,6157],{},"Cost Multiplier",[6149,6159,6160],{},"Reliability",[6162,6163,6164,6179,6193],"tbody",{},[6146,6165,6166,6170,6173,6176],{},[6167,6168,6169],"td",{},"Simple Loop",[6167,6171,6172],{},"Short, objective",[6167,6174,6175],{},"1x",[6167,6177,6178],{},"High for basics",[6146,6180,6181,6184,6187,6190],{},[6167,6182,6183],{},"Gen-Eval",[6167,6185,6186],{},"Mid, subjective",[6167,6188,6189],{},"2-3x",[6167,6191,6192],{},"Good",[6146,6194,6195,6198,6201,6204],{},[6167,6196,6197],{},"Full Harness",[6167,6199,6200],{},"Complex, long",[6167,6202,6203],{},"5x+",[6167,6205,6206],{},"Production-grade",[3598,6208,6209],{},"Match to needs—don't overengineer.",[3611,6211,6213],{"id":6212},"why-agent-frameworks-arent-enough","Why Agent Frameworks Aren't Enough",[3598,6215,6216,6217,6219],{},"Agent frameworks like LangChain, CrewAI, and AutoGen provide orchestration tools but fall short without custom ",[3640,6218,5852],{}," design, ignoring data governance gaps (80% of impl time on data eng) and production issues like hallucinations under load. They're Lego bricks; harness is the blueprint. (54 words)",[3598,6221,6222,6223,6227,6228],{},"Rasa's 2026 review scores them on readiness: LangGraph strong on graphs, CrewAI on crews, but all demo-shine, prod-crack.",[3687,6224,6225],{},[3734,6226,5671],{}," Airbyte: 80% time on data pipelines, not config.",[3687,6229,6230],{},[3734,6231,5679],{},[3598,6233,6234],{},"Gaps:",[3634,6236,6237,6248,6254],{},[3637,6238,6239,6242,6243],{},[3640,6240,6241],{},"Data trust",": Emily Winks (Atlan): \"Agents assume trustworthy data... It's a governance problem.\"",[3687,6244,6245],{},[3734,6246,6247],{},"11",[3637,6249,6250,6253],{},[3640,6251,6252],{},"Explainability",": Black-box flows fail audits.",[3637,6255,6256,6259],{},[3640,6257,6258],{},"Load hallucinations",": Demos low-traffic; prod spikes break.",[3598,6261,6262,6263],{},"Frameworks orchestrate; harnesses govern. Build custom atop them—LangGraph for PGE loops shines. Future: MCP standards for interoperability.",[3687,6264,6265],{},[3734,6266,6267],{},"12",[3598,6269,6270],{},"Harness engineering trumps model power now.",[3611,6272,6274],{"id":6273},"production-challenges-and-fixes-for-agent-harnesses","Production Challenges and Fixes for Agent Harnesses",[3598,6276,5112,6277,6279],{},[3640,6278,5852],{},"es face high costs from token usage, debugging multi-agent interactions, and data governance issues, fixed by budget enforcement, modular monitoring, tool integration, and iterative \"build for deletion\" design anticipating model improvements. Costs can 5x vs. singles, but quality pays. (48 words)",[3598,6281,6282,6285,6286],{},[3640,6283,6284],{},"Cost control",": Track per-agent tokens; cap loops (e.g., 3 evals max). Ahmed's runs: Harness saved 20% net via fewer redos.",[3687,6287,6288],{},[3734,6289,4065],{},[3598,6291,6292,6295],{},[3640,6293,6294],{},"Debugging",": Log state, comms. Modular: Swap evals without rebuild.",[3598,6297,6298,6301,6302],{},[3640,6299,6300],{},"Data gov",": Validate inputs—Atlan tools pre-check staleness.",[3687,6303,6304],{},[3734,6305,6306],{},"13",[3598,6308,6309],{},"Fixes:",[3634,6311,6312,6318,6324],{},[3637,6313,6314,6317],{},[3640,6315,6316],{},"Human-in-loop",": Approve specs, spot drifts.",[3637,6319,6320,6323],{},[3640,6321,6322],{},"Scalability",": Async sprints, queueing.",[3637,6325,6326,6329],{},[3640,6327,6328],{},"Build for deletion",": Modular for model leaps.",[3598,6331,6332],{},"Misconception: Frameworks = done. No—harness first.",[3611,6334,6336],{"id":6335},"building-reliable-agent-harnesses-today","Building Reliable Agent Harnesses Today",[3598,6338,6339,6340,6342],{},"Specialized roles beat generalists for complex work. The ",[3640,6341,5852],{},"—Planner, Generator, Evaluator—delivers production robustness as frameworks mature but orchestration lags.",[3598,6344,6345],{},"Trends: Tool evals, modularity. Checklist for your first:",[3992,6347,6348,6351,6354,6357,6360],{},[3637,6349,6350],{},"Audit a failed single-agent task.",[3637,6352,6353],{},"Sketch PGE: Sub-tasks, criteria.",[3637,6355,6356],{},"Prototype in LangGraph\u002FCrewAI.",[3637,6358,6359],{},"Run one sprint; log tokens.",[3637,6361,6362],{},"Iterate to 80%+ eval score.",[3598,6364,6365],{},"Pick a backlog flop, paper-sketch the harness (Planner subs, Eval tools), prototype in LangGraph—track costs, one sprint. Measure the lift yourself.",[4006,6367,6368],{},"html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}",{"title":3593,"searchDepth":3744,"depth":3744,"links":6370},[6371,6372,6373,6374,6375,6376,6377,6378],{"id":5809,"depth":3744,"text":5810},{"id":5845,"depth":3744,"text":5846},{"id":5896,"depth":3744,"text":5897},{"id":6036,"depth":3744,"text":6037},{"id":6092,"depth":3744,"text":6093},{"id":6212,"depth":3744,"text":6213},{"id":6273,"depth":3744,"text":6274},{"id":6335,"depth":3744,"text":6336},"Production AI agent systems demand a 3-core agent harness—Planner for task decomposition, Generator for execution, Evaluator for unbiased verification—because single agents suffer from underspecification, self-bias, and context limits, delivering unreliable outputs on complex tasks. (38 words)",[5852,4028,5767,6381,6382,5768,6383,6384],"AI agents production","LLM agent architecture","harness design","AI agent evaluation",{},"Build reliable production AI agents with the 3-core harness: Planner decomposes tasks, Generator executes, Evaluator verifies objectively. Overcome single-agent failures like underscoping and bias for full-stack builds and automations—patterns, trade-offs, and implementation guide.","3-Core Agent Harness for Production AI Agents","\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-baseline-post-merge-article",[],{"intro":4036,"why-single-agent-systems-fail-production-tasks":5810,"what-is-the-3-core-agent-harness":5846,"the-planner-decomposing-tasks-into-actionable-specs":5897,"generator-and-evaluator-execution-meets-verification":6037,"agent-harness-patterns-for-scaling-complexity":6093,"why-agent-frameworks-arent-enough":6213,"production-challenges-and-fixes-for-agent-harnesses":6274,"building-reliable-agent-harnesses-today":6336},{"title":5786,"description":6379},{"loc":6388},"articles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-baseline-post-merge-article","UhWs8sgZbsGRyL5uVfvs_QzI9CHX8VgqL3qnduhOEpk",{"id":6396,"title":6397,"ai_summary":6398,"author":3593,"body":6399,"category":5764,"date_modified":4020,"description":7187,"excerpt":3593,"extension":4021,"faq":4020,"keywords":7188,"meta":7194,"meta_description":7195,"meta_title":7196,"navigation":4032,"path":7197,"primary_keyword":4611,"published_at":4020,"related_posts":7198,"sections":7199,"seo":7200,"sitemap":7201,"slug":7202,"status":4040,"stem":7203,"__hash__":7204},"articles\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-baseline-round2-article.md","Harness Engineering: The 3-Core System for Reliable Production AI Agents","Production AI agents succeed through harness engineering—a structured system around the model featuring a Planner for specs, Generator for implementation, and independent Evaluator for critique—outperforming solo agents by addressing generosity bias and self-evaluation failures. This 3-core harness delivers reliable outputs for coding and long tasks. (50 words)",{"type":3595,"value":6400,"toc":7175},[6401,6410,6419,6422,6426,6438,6441,6444,6464,6479,6482,6486,6495,6502,6509,6512,6521,6524,6527,6531,6540,6543,6563,6572,6575,6584,6587,6591,6600,6603,6611,6614,6617,6662,6665,6668,6672,6681,6686,6692,6695,6700,6711,6714,6717,6725,6734,6737,6756,6760,6769,6775,6781,6792,6806,6809,6858,6861,6864,6867,6871,6880,6883,6891,6907,6915,6918,6921,6925,6934,6936,6947,6950,6953,6993,6996,6999,7003,7006,7009,7012,7029,7032,7172],[3598,6402,6403,6404,6409],{},"Production AI agents fail at an 88% rate despite LLM advances because they rely on solo models without proper scaffolding.",[3687,6405,6406],{},[3660,6407,3695],{"href":4057,"ariaDescribedBy":6408,"dataFootnoteRef":3593,"id":4059},[3693]," Harness engineering fixes this: build a 3-core system with a Planner for specs, Generator for code, and independent Evaluator for critique. This outperforms single agents by countering generosity bias and self-evaluation flaws (42 words).",[3598,6411,6412,6413,6418],{},"You've seen the hype—agents that code apps, manage workflows, ship features. But in production, most crumble. A solo agent might spit out a game engine in 20 minutes for $9, only for core mechanics to break on first play.",[3687,6414,6415],{},[3660,6416,4065],{"href":3691,"ariaDescribedBy":6417,"dataFootnoteRef":3593,"id":3694},[3693]," The 3-core harness, drawn from Anthropic's research, takes six hours and $200 but delivers a fully playable title with advanced features like multiplayer and AI opponents.",[3598,6420,6421],{},"Why does this matter now? As an indie builder or AI dev, you're shipping products where unreliable agents mean broken features, wasted cycles, and lost trust. Harness engineering isn't theory—it's the system that turns demos into deployables. We'll break down the why, the architecture, components, results, and trade-offs, with prompts and patterns you can use today.",[3611,6423,6425],{"id":6424},"what-is-harness-engineering","What Is Harness Engineering?",[3598,6427,6428,6429,4978,6432,6437],{},"Harness engineering is the discipline of building production-grade scaffolding around LLMs—coordination layers, specialized agents, validation loops, and session orchestration—that ensures reliable AI agent performance, far more than model choice alone. It evolved from prompt engineering to handle complex, multi-turn tasks like app development, with components like guides (feedforward) and sensors (feedback) encoding fixes for model weaknesses. Tian Pan boils it down: ",[3640,6430,6431],{},"Agent = Model + Harness",[3687,6433,6434],{},[3660,6435,4109],{"href":4106,"ariaDescribedBy":6436,"dataFootnoteRef":3593,"id":4108},[3693]," (72 words)",[3598,6439,6440],{},"Prompt engineering works for single turns: stuff context, get output. But production agents run sessions—hours of back-and-forth, context resets, accumulating errors. Harness engineering orchestrates this: it sequences agent calls, injects state, validates outputs, and loops on failures.",[3598,6442,6443],{},"Core principles set it apart:",[3634,6445,6446,6452,6458],{},[3637,6447,6448,6451],{},[3640,6449,6450],{},"Specialization",": No jack-of-all-trades agents. Use dedicated Planner, Generator, Evaluator.",[3637,6453,6454,6457],{},[3640,6455,6456],{},"Validation loops",": External checks (tests, linters) before declaring \"done.\"",[3637,6459,6460,6463],{},[3640,6461,6462],{},"Externalized state",": Progress files in JSON or Markdown persist across resets.",[3598,6465,6466,6467,6472,6473,6478],{},"Without it, 88% of agent projects never hit production—not from dumb models, but brittle systems.",[3687,6468,6469],{},[3660,6470,3695],{"href":4057,"ariaDescribedBy":6471,"dataFootnoteRef":3593,"id":4074},[3693]," MindStudio calls this the shift from \"prompt hacking\" to \"session engineering.\"",[3687,6474,6475],{},[3660,6476,4138],{"href":4135,"ariaDescribedBy":6477,"dataFootnoteRef":3593,"id":4137},[3693]," You need it for coding agents, long-running tasks, or anything beyond chat.",[3598,6480,6481],{},"I've built agent pipelines for indie apps. Swapping Claude for Gemini barely moved the needle—until I added a harness. Reliability jumped from flaky to shippable.",[3611,6483,6485],{"id":6484},"why-single-ai-agents-fail-in-production","Why Single AI Agents Fail in Production",[3598,6487,6488,6489,6494],{},"Single AI agents fail production at an 88% rate because LLMs suffer generosity bias (self-praise of mediocre work), context anxiety (rushing as tokens fill), and unreliable self-evaluation—leading to broken outputs in coding or long tasks. Benchmarks show solo agents produce non-functional apps, while harnessed systems deliver working ones. Apurv Khare nails it: models can't judge their own code.",[3687,6490,6491],{},[3660,6492,4065],{"href":3691,"ariaDescribedBy":6493,"dataFootnoteRef":3593,"id":4157},[3693]," (68 words)",[3598,6496,6497,6498,6501],{},"Start with ",[3640,6499,6500],{},"generosity bias",". LLMs rate their output high even when it's junk. A solo agent declares a half-baked function \"complete\" because it lacks external critique.",[3598,6503,6504,6505,6508],{},"Then ",[3640,6506,6507],{},"context anxiety",": As the window fills with history, models truncate reasoning to fit. Outputs get hasty, errors compound.",[3598,6510,6511],{},"Self-evaluation? Worse. The same model generating code can't spot its flaws—it's like grading your own homework.",[3598,6513,6514,6515,6520],{},"Real example: That 20-minute\u002F$9 solo agent game.",[3687,6516,6517],{},[3660,6518,4065],{"href":3691,"ariaDescribedBy":6519,"dataFootnoteRef":3593,"id":4192},[3693]," It rendered sprites but crashed on collisions. No multiplayer, no saves—core broken.",[3598,6522,6523],{},"Community echoes this. Nurunnubi Talukder: \"Generator-judge fails because models lie to themselves.\" Christian Ingul: \"Same agent generating and judging doesn't work.\" Divyansh Puri: \"A harness tames the wild horse.\"",[3598,6525,6526],{},"For you? Wasted API spend, debugging agent hallucinations in prod, features that flake under load. Solo agents demo well but ship poorly.",[3611,6528,6530],{"id":6529},"the-3-core-agent-harness-planner-generator-evaluator","The 3-Core-Agent Harness: Planner, Generator, Evaluator",[3598,6532,6533,6534,6539],{},"The 3-core-agent harness in harness engineering separates concerns into a Planner (goal-to-spec), Generator (incremental builds with negotiated \"done\" contracts), and Evaluator (independent testing\u002Fcritique)—creating a GAN-inspired loop that overcomes solo agent limits for production reliability in tasks like game engines or apps. Anthropic's benchmarks prove it: harnessed agents ship quality where solos fail.",[3687,6535,6536],{},[3660,6537,4065],{"href":3691,"ariaDescribedBy":6538,"dataFootnoteRef":3593,"id":4264},[3693]," (74 words)",[3598,6541,6542],{},"Here's the flow:",[3992,6544,6545,6550,6555,6560],{},[3637,6546,6547,6549],{},[3640,6548,5872],{},": High-level goal → detailed spec + Definition of Done (DoD).",[3637,6551,6552,6554],{},[3640,6553,5480],{},": Picks a sprint, negotiates DoD with Evaluator, codes incrementally using progress files.",[3637,6556,6557,6559],{},[3640,6558,5486],{},": Runs end-to-end tests (e.g., Playwright), reports file\u002Fline fixes needed.",[3637,6561,6562],{},"Loop: Failures route back to Generator. Success advances progress file.",[3598,6564,6565,6566,6571],{},"It's GAN-like: Generator improves via Evaluator's adversarial feedback.",[3687,6567,6568],{},[3660,6569,4176],{"href":4173,"ariaDescribedBy":6570,"dataFootnoteRef":3593,"id":4175},[3693]," External memory—progress.json tracks tasks, code state, decisions—handles resets.",[3598,6573,6574],{},"Why superior? Independent eval kills bias. Negotiation upfront aligns expectations. Iteration polishes.",[3598,6576,6577,6578,6583],{},"From Anthropic: Solo = broken basics. Harness = advanced, playable.",[3687,6579,6580],{},[3660,6581,4065],{"href":3691,"ariaDescribedBy":6582,"dataFootnoteRef":3593,"id":4275},[3693]," I've used variants for backend APIs—output went from 60% passing tests to 95%.",[3598,6585,6586],{},"Prompt each core narrowly. Planner stays high-level to avoid over-spec. Generator reads progress.json. Evaluator gets tools for real testing.",[3611,6588,6590],{"id":6589},"how-the-planner-turns-goals-into-actionable-specs","How the Planner Turns Goals into Actionable Specs",[3598,6592,6593,6594,6599],{},"The Planner agent in harness engineering takes 1-4 sentence high-level goals and expands them into detailed product specs and Definition of Done, avoiding cascading errors by staying high-level and defining success criteria upfront—setting a solid foundation for Generator sprints. Anthropic's game engine example: \"Build a multiplayer shooter\" becomes UI flows, mechanics, tech stack, and testable DoD.",[3687,6595,6596],{},[3660,6597,4065],{"href":3691,"ariaDescribedBy":6598,"dataFootnoteRef":3593,"id":4371},[3693]," (62 words)",[3598,6601,6602],{},"Process is simple:",[3634,6604,6605,6608],{},[3637,6606,6607],{},"Input: \"Build a web-based task manager with user auth.\"",[3637,6609,6610],{},"Output: YAML spec with features (login, CRUD tasks, search), stack (React\u002FNode\u002FPostgres), DoD (e.g., \"User can create task via UI, persists to DB, lists 100 items\").",[3598,6612,6613],{},"Benefits? No Generator assumptions—everything explicit. Sprints stay bite-sized (one feature).",[3598,6615,6616],{},"Example spec snippet:",[3726,6618,6620],{"className":4293,"code":6619,"language":4295,"meta":3593,"style":3593},"features:\n  - login: JWT auth, form validation\ndod:\n  - \"Playwright test: New user logs in, redirects to dashboard\"\n  - \"API endpoint \u002Ftasks returns JSON array\"\n",[3714,6621,6622,6629,6641,6648,6655],{"__ignoreMap":3593},[3734,6623,6624,6627],{"class":3736,"line":3737},[3734,6625,6626],{"class":4302},"features",[3734,6628,4306],{"class":3740},[3734,6630,6631,6633,6636,6638],{"class":3736,"line":3744},[3734,6632,4311],{"class":3740},[3734,6634,6635],{"class":4302},"login",[3734,6637,3751],{"class":3740},[3734,6639,6640],{"class":3754},"JWT auth, form validation\n",[3734,6642,6643,6646],{"class":3736,"line":3761},[3734,6644,6645],{"class":4302},"dod",[3734,6647,4306],{"class":3740},[3734,6649,6650,6652],{"class":3736,"line":3770},[3734,6651,4311],{"class":3740},[3734,6653,6654],{"class":3754},"\"Playwright test: New user logs in, redirects to dashboard\"\n",[3734,6656,6657,6659],{"class":3736,"line":3779},[3734,6658,4311],{"class":3740},[3734,6660,6661],{"class":3754},"\"API endpoint \u002Ftasks returns JSON array\"\n",[3598,6663,6664],{},"Tips: Prompt with \"Output YAML only. Stay high-level—no code.\" Limit to 5-10 sprints. Review manually first time.",[3598,6666,6667],{},"This prevents 80% of early failures I've seen. Builders skip it, watch cascades.",[3611,6669,6671],{"id":6670},"generator-and-evaluator-the-iteration-loop-that-delivers-quality","Generator and Evaluator: The Iteration Loop That Delivers Quality",[3598,6673,6674,6675,6680],{},"In harness engineering, the Generator implements sprints based on Planner specs and pre-negotiated DoD contracts, while the Evaluator independently tests via tools like Playwright—reporting precise file\u002Fline failures for targeted fixes in a feedback loop that yields far superior outputs than self-evaluation. Contrast: Solo agents break on basics; harnessed ones ship advanced features.",[3687,6676,6677],{},[3660,6678,4065],{"href":3691,"ariaDescribedBy":6679,"dataFootnoteRef":3593,"id":5388},[3693]," (71 words)",[3598,6682,6683,6685],{},[3640,6684,5480],{}," reads spec, progress.json, negotiates DoD:",[3726,6687,6690],{"className":6688,"code":6689,"language":4953},[4951],"Generator: \"Sprint: Login form. Proposed DoD: Form submits, stores JWT in localStorage.\"\nEvaluator: \"Accept. Add: Error on invalid creds.\"\n",[3714,6691,6689],{"__ignoreMap":3593},[3598,6693,6694],{},"Codes incrementally—edits files, commits to git-like state.",[3598,6696,6697,6699],{},[3640,6698,5486],{}," launches app, runs tests:",[3634,6701,6702,6705,6708],{},[3637,6703,6704],{},"UI: Playwright clicks, asserts.",[3637,6706,6707],{},"API: Curl endpoints.",[3637,6709,6710],{},"DB: Query state.",[3598,6712,6713],{},"Feedback: \"src\u002Fauth.js:47—JWT decode fails on expiry. Fix expiry check.\"",[3598,6715,6716],{},"Loop 3-5 times per sprint. Tools make it concrete—no vagueness.",[3598,6718,6719,6720],{},"GAN analogy from Talukder: Evaluator \"fights\" Generator to quality.",[3687,6721,6722],{},[3660,6723,4176],{"href":4173,"ariaDescribedBy":6724,"dataFootnoteRef":3593,"id":4185},[3693],[3598,6726,6727,6728,6733],{},"Solo vs. harness: 20min broken → 6hr playable.",[3687,6729,6730],{},[3660,6731,4065],{"href":3691,"ariaDescribedBy":6732,"dataFootnoteRef":3593,"id":5437},[3693]," In my tests, eval precision cut revisions 40%.",[3598,6735,6736],{},"Integrate Playwright:",[3726,6738,6740],{"className":5002,"code":6739,"language":5004,"meta":3593,"style":3593},"npx playwright test --project=agent-eval\n",[3714,6741,6742],{"__ignoreMap":3593},[3734,6743,6744,6747,6750,6753],{"class":3736,"line":3737},[3734,6745,6746],{"class":5011},"npx",[3734,6748,6749],{"class":3754}," playwright",[3734,6751,6752],{"class":3754}," test",[3734,6754,6755],{"class":3747}," --project=agent-eval\n",[3611,6757,6759],{"id":6758},"harness-components-guides-sensors-and-orchestration","Harness Components: Guides, Sensors, and Orchestration",[3598,6761,6762,6763,6768],{},"Effective harness engineering relies on guides (feedforward docs\u002Fspecs), sensors (feedback like linters\u002Ftests), session orchestration (context injection\u002Fvalidation), and output loops—plus state files and specialization—to make agents reliable across resets and complex tasks. Tian Pan: Guides steer proactively; sensors correct reactively.",[3687,6764,6765],{},[3660,6766,4109],{"href":4106,"ariaDescribedBy":6767,"dataFootnoteRef":3593,"id":4211},[3693]," (54 words)",[3598,6770,6771,6774],{},[3640,6772,6773],{},"Guides",": Docs encoding \"good\"—architecture.md, prompt templates, examples. Injected per session.",[3598,6776,6777,6780],{},[3640,6778,6779],{},"Sensors",": Linters (ESLint), tests (Jest), AI reviewers. Run post-generation.",[3598,6782,6783,6786,6787],{},[3640,6784,6785],{},"Orchestration"," (MindStudio):",[3687,6788,6789],{},[3660,6790,4138],{"href":4135,"ariaDescribedBy":6791,"dataFootnoteRef":3593,"id":4147},[3693],[3634,6793,6794,6797,6800,6803],{},[3637,6795,6796],{},"Start: Inject goal + progress.",[3637,6798,6799],{},"Route: Planner → Generator\u002FEval loop.",[3637,6801,6802],{},"Validate: Schema check outputs.",[3637,6804,6805],{},"Persist: Update progress.json.",[3598,6807,6808],{},"State files example:",[3726,6810,6812],{"className":3728,"code":6811,"language":3730,"meta":3593,"style":3593},"{\n  \"completed\": [\"auth\"],\n  \"in_progress\": \"tasks-crud\",\n  \"dod\": [\"API returns 200 with tasks\"]\n}\n",[3714,6813,6814,6818,6830,6842,6854],{"__ignoreMap":3593},[3734,6815,6816],{"class":3736,"line":3737},[3734,6817,3741],{"class":3740},[3734,6819,6820,6823,6825,6828],{"class":3736,"line":3744},[3734,6821,6822],{"class":3747},"  \"completed\"",[3734,6824,4729],{"class":3740},[3734,6826,6827],{"class":3754},"\"auth\"",[3734,6829,5200],{"class":3740},[3734,6831,6832,6835,6837,6840],{"class":3736,"line":3761},[3734,6833,6834],{"class":3747},"  \"in_progress\"",[3734,6836,3751],{"class":3740},[3734,6838,6839],{"class":3754},"\"tasks-crud\"",[3734,6841,3758],{"class":3740},[3734,6843,6844,6847,6849,6852],{"class":3736,"line":3770},[3734,6845,6846],{"class":3747},"  \"dod\"",[3734,6848,4729],{"class":3740},[3734,6850,6851],{"class":3754},"\"API returns 200 with tasks\"",[3734,6853,4735],{"class":3740},[3734,6855,6856],{"class":3736,"line":3779},[3734,6857,3838],{"class":3740},[3598,6859,6860],{},"Specialization: Add ArchAgent for design, TestGen for suites.",[3598,6862,6863],{},"This combo handles resets—your session crashed? Resume from state.",[3598,6865,6866],{},"No guides\u002Fsensors? Back to solo fragility.",[3611,6868,6870],{"id":6869},"real-results-why-the-harness-beats-solo-agents","Real Results: Why the Harness Beats Solo Agents",[3598,6872,6873,6874,6879],{},"Benchmarks from Anthropic show the 3-core harness builds fully playable games with advanced features in 6 hours\u002F$200, versus solo agents' broken cores in 20min\u002F$9—proving harness engineering delivers production quality where models alone fail. Community validates: Better systems, not smarter models.",[3687,6875,6876],{},[3660,6877,4065],{"href":3691,"ariaDescribedBy":6878,"dataFootnoteRef":3593,"id":5547},[3693]," (52 words)",[3598,6881,6882],{},"Anthropic case: Goal—\"multiplayer FPS.\"",[3634,6884,6885,6888],{},[3637,6886,6887],{},"Solo: Sprites move, but no collisions, scoring, multiplayer.",[3637,6889,6890],{},"Harness: Full UI, netcode, AI bots, saves—all working.",[3598,6892,6893,6894,6899,6900,6906],{},"Khare: \"Harness is the interesting space.\"",[3687,6895,6896],{},[3660,6897,4065],{"href":3691,"ariaDescribedBy":6898,"dataFootnoteRef":3593,"id":5556},[3693]," Talukder: \"Encode model limits.\"",[3687,6901,6902],{},[3660,6903,4176],{"href":4173,"ariaDescribedBy":6904,"dataFootnoteRef":3593,"id":6905},[3693],"user-content-fnref-5-3"," Ripley: \"Systems around models.\" Ben Ripley on LinkedIn.",[3598,6908,6909,6910],{},"Broader: Fixes 88% failure by design.",[3687,6911,6912],{},[3660,6913,3695],{"href":4057,"ariaDescribedBy":6914,"dataFootnoteRef":3593,"id":4088},[3693],[3598,6916,6917],{},"Evolve it: As models improve, delete sensors for self-eval. Audit quarterly.",[3598,6919,6920],{},"I've shipped a CRM agent this way—solo would've bombed prod.",[3611,6922,6924],{"id":6923},"trade-offs-and-how-to-implement-harness-engineering-today","Trade-offs and How to Implement Harness Engineering Today",[3598,6926,6927,6928,6933],{},"Harness engineering adds cost\u002Flatency (e.g., 30x time) but justifies for production via reliability; implement via LangChain\u002FCrewAI for orchestration, start with Generator-Evaluator pair for simple tasks, scale to 3-core, and audit regularly. Not frameworks alone—custom loops win.",[3687,6929,6930],{},[3660,6931,4109],{"href":4106,"ariaDescribedBy":6932,"dataFootnoteRef":3593,"id":4222},[3693]," (48 words)",[3598,6935,5521],{},[3634,6937,6938,6941,6944],{},[3637,6939,6940],{},"Overhead: $200 vs. $9, hours vs. minutes.",[3637,6942,6943],{},"When simplify: Short tasks → Gen-Eval. Complex → full harness.",[3637,6945,6946],{},"Cost threshold: >$50\u002Ftask? Harness pays off.",[3598,6948,6949],{},"Misconception: CrewAI ≠ harness. It's orchestration—build custom.",[3598,6951,6952],{},"Quick start pseudocode:",[3726,6954,6956],{"className":5251,"code":6955,"language":5253,"meta":3593,"style":3593},"while not done(progress):\n    spec = planner(goal)\n    for sprint in spec:\n        dod = negotiate(gen, eval, sprint)\n        code = generator(sprint, progress)\n        feedback = evaluator(code, dod)\n        if pass: update_progress()\n",[3714,6957,6958,6963,6968,6973,6978,6983,6988],{"__ignoreMap":3593},[3734,6959,6960],{"class":3736,"line":3737},[3734,6961,6962],{},"while not done(progress):\n",[3734,6964,6965],{"class":3736,"line":3744},[3734,6966,6967],{},"    spec = planner(goal)\n",[3734,6969,6970],{"class":3736,"line":3761},[3734,6971,6972],{},"    for sprint in spec:\n",[3734,6974,6975],{"class":3736,"line":3770},[3734,6976,6977],{},"        dod = negotiate(gen, eval, sprint)\n",[3734,6979,6980],{"class":3736,"line":3779},[3734,6981,6982],{},"        code = generator(sprint, progress)\n",[3734,6984,6985],{"class":3736,"line":3787},[3734,6986,6987],{},"        feedback = evaluator(code, dod)\n",[3734,6989,6990],{"class":3736,"line":3793},[3734,6991,6992],{},"        if pass: update_progress()\n",[3598,6994,6995],{},"Tools: LangChain for chains, Playwright for eval, JSON for state.",[3598,6997,6998],{},"Audit: Run solo vs. harness on toy task. Measure pass rate.",[3611,7000,7002],{"id":7001},"next-steps-bootstrap-your-harness-today","Next Steps: Bootstrap Your Harness Today",[3598,7004,7005],{},"Harness engineering moves agents from demo toys to production engines—Planner sets rails, Generator-Eval loop grinds quality, components make it resilient. Recap: Model matters less than system.",[3598,7007,7008],{},"Future: Dynamic harnesses auto-simplify; agent-first dev.",[3598,7010,7011],{},"Checklist:",[3634,7013,7014,7017,7020,7023,7026],{},[3637,7015,7016],{},"Map your agent to 3 cores.",[3637,7018,7019],{},"Add Playwright to Eval.",[3637,7021,7022],{},"Externalize state to JSON.",[3637,7024,7025],{},"Negotiate DoD pre-code.",[3637,7027,7028],{},"Benchmark solo vs. harness on a feature.",[3598,7030,7031],{},"Audit your current project now: Slot it into Planner\u002FGen\u002FEval, wire an independent evaluator with Playwright tests, run one sprint, and compare output quality. You'll see the gap—and close it.",[3982,7033,7035,7038],{"className":7034,"dataFootnotes":3593},[3985],[3611,7036,3990],{"className":7037,"id":3693},[3989],[3992,7039,7040,7060,7115,7135,7150],{},[3637,7041,7042,4423,7047,4423,7050,4423,7055],{"id":4417},[3660,7043,7046],{"href":7044,"rel":7045},"https:\u002F\u002Fmiraflow.ai\u002Fblog\u002Fharness-engineering-why-88-percent-ai-agents-fail",[3664],"Miraflow AI: Harness Engineering: Why 88% of AI Agents Fail",[3660,7048,4004],{"href":4421,"ariaLabel":4001,"className":7049,"dataFootnoteBackref":3593},[4003],[3660,7051,4004,7053],{"href":4426,"ariaLabel":4427,"className":7052,"dataFootnoteBackref":3593},[4003],[3687,7054,4065],{},[3660,7056,4004,7058],{"href":4433,"ariaLabel":4434,"className":7057,"dataFootnoteBackref":3593},[4003],[3687,7059,4109],{},[3637,7061,7062,4423,7067,4423,7070,4423,7075,4423,7080,4423,7085,4423,7090,4423,7095,4423,7100,4423,7105,4423,7110],{"id":3996},[3660,7063,7066],{"href":7064,"rel":7065},"https:\u002F\u002Fwww.linkedin.com\u002Fposts\u002Fapurvkhare_apurv-khare-harness-engineering-long-activity-7446406273853562880-khax",[3664],"Apurv Khare on LinkedIn: Harness Engineering",[3660,7068,4004],{"href":4000,"ariaLabel":4472,"className":7069,"dataFootnoteBackref":3593},[4003],[3660,7071,4004,7073],{"href":4476,"ariaLabel":4477,"className":7072,"dataFootnoteBackref":3593},[4003],[3687,7074,4065],{},[3660,7076,4004,7078],{"href":4483,"ariaLabel":4484,"className":7077,"dataFootnoteBackref":3593},[4003],[3687,7079,4109],{},[3660,7081,4004,7083],{"href":4490,"ariaLabel":4491,"className":7082,"dataFootnoteBackref":3593},[4003],[3687,7084,4138],{},[3660,7086,4004,7088],{"href":4497,"ariaLabel":4498,"className":7087,"dataFootnoteBackref":3593},[4003],[3687,7089,4176],{},[3660,7091,4004,7093],{"href":4504,"ariaLabel":4505,"className":7092,"dataFootnoteBackref":3593},[4003],[3687,7094,4360],{},[3660,7096,4004,7098],{"href":5652,"ariaLabel":5653,"className":7097,"dataFootnoteBackref":3593},[4003],[3687,7099,4466],{},[3660,7101,4004,7103],{"href":5659,"ariaLabel":5660,"className":7102,"dataFootnoteBackref":3593},[4003],[3687,7104,5618],{},[3660,7106,4004,7108],{"href":5666,"ariaLabel":5667,"className":7107,"dataFootnoteBackref":3593},[4003],[3687,7109,5671],{},[3660,7111,4004,7113],{"href":5674,"ariaLabel":5675,"className":7112,"dataFootnoteBackref":3593},[4003],[3687,7114,5679],{},[3637,7116,7117,4423,7122,4423,7125,4423,7130],{"id":4511},[3660,7118,7121],{"href":7119,"rel":7120},"https:\u002F\u002Ftianpan.co\u002Fblog\u002F2026-02-17-harness-engineering-agent-first-software-development",[3664],"Tian Pan: Harness Engineering",[3660,7123,4004],{"href":4515,"ariaLabel":4516,"className":7124,"dataFootnoteBackref":3593},[4003],[3660,7126,4004,7128],{"href":4520,"ariaLabel":4521,"className":7127,"dataFootnoteBackref":3593},[4003],[3687,7129,4065],{},[3660,7131,4004,7133],{"href":4527,"ariaLabel":4528,"className":7132,"dataFootnoteBackref":3593},[4003],[3687,7134,4109],{},[3637,7136,7137,4423,7142,4423,7145],{"id":4541},[3660,7138,7141],{"href":7139,"rel":7140},"https:\u002F\u002Fwww.mindstudio.ai\u002Fblog\u002Fwhat-is-harness-engineering-ai-coding",[3664],"MindStudio: What Is Harness Engineering?",[3660,7143,4004],{"href":4545,"ariaLabel":4546,"className":7144,"dataFootnoteBackref":3593},[4003],[3660,7146,4004,7148],{"href":4550,"ariaLabel":4551,"className":7147,"dataFootnoteBackref":3593},[4003],[3687,7149,4065],{},[3637,7151,7152,4423,7157,4423,7160,4423,7165],{"id":4557},[3660,7153,7156],{"href":7154,"rel":7155},"https:\u002F\u002Fwww.linkedin.com\u002Fposts\u002Fnurunnubi_harness-design-for-long-running-application-activity-7447849188882632704--iEm",[3664],"Nurunnubi Talukder on LinkedIn",[3660,7158,4004],{"href":4561,"ariaLabel":4562,"className":7159,"dataFootnoteBackref":3593},[4003],[3660,7161,4004,7163],{"href":4566,"ariaLabel":4567,"className":7162,"dataFootnoteBackref":3593},[4003],[3687,7164,4065],{},[3660,7166,4004,7170],{"href":7167,"ariaLabel":7168,"className":7169,"dataFootnoteBackref":3593},"#user-content-fnref-5-3","Back to reference 5-3",[4003],[3687,7171,4109],{},[4006,7173,7174],{},"html pre.shiki code .s9eBZ, html code.shiki .s9eBZ{--shiki-default:#22863A;--shiki-dark:#85E89D}html pre.shiki code .sVt8B, html code.shiki .sVt8B{--shiki-default:#24292E;--shiki-dark:#E1E4E8}html pre.shiki code .sZZnC, html code.shiki .sZZnC{--shiki-default:#032F62;--shiki-dark:#9ECBFF}html .default .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .shiki span {color: var(--shiki-default);background: var(--shiki-default-bg);font-style: var(--shiki-default-font-style);font-weight: var(--shiki-default-font-weight);text-decoration: var(--shiki-default-text-decoration);}html .dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html.dark .shiki span {color: var(--shiki-dark);background: var(--shiki-dark-bg);font-style: var(--shiki-dark-font-style);font-weight: var(--shiki-dark-font-weight);text-decoration: var(--shiki-dark-text-decoration);}html pre.shiki code .sScJk, html code.shiki .sScJk{--shiki-default:#6F42C1;--shiki-dark:#B392F0}html pre.shiki code .sj4cs, html code.shiki .sj4cs{--shiki-default:#005CC5;--shiki-dark:#79B8FF}",{"title":3593,"searchDepth":3744,"depth":3744,"links":7176},[7177,7178,7179,7180,7181,7182,7183,7184,7185,7186],{"id":6424,"depth":3744,"text":6425},{"id":6484,"depth":3744,"text":6485},{"id":6529,"depth":3744,"text":6530},{"id":6589,"depth":3744,"text":6590},{"id":6670,"depth":3744,"text":6671},{"id":6758,"depth":3744,"text":6759},{"id":6869,"depth":3744,"text":6870},{"id":6923,"depth":3744,"text":6924},{"id":7001,"depth":3744,"text":7002},{"id":3693,"depth":3744,"text":3990},"Production AI agents fail at an 88% rate despite LLM advances because they rely on solo models without proper scaffolding.1 Harness engineering fixes this: build a 3-core system with a Planner for specs, Generator for code, and independent Evaluator for critique. This outperforms single agents by countering generosity bias and self-evaluation flaws (42 words).",[4611,7189,4024,5767,7190,7191,7192,7193],"AI agents","AI agent failure","LLM harness","agent architecture","reliable AI systems",{},"Discover harness engineering: Build reliable AI agents with Planner, Generator, and Evaluator to overcome 88% production failure rates. Proven in Anthropic's game engine benchmarks for coding tasks.","Harness Engineering for Production AI Agents","\u002Farticles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-baseline-round2-article",[],{"intro":5778,"what-is-harness-engineering":6425,"why-single-ai-agents-fail-in-production":6485,"the-3-core-agent-harness-planner-generator-evaluator":6530,"how-the-planner-turns-goals-into-actionable-specs":6590,"generator-and-evaluator-the-iteration-loop-that-delivers-quality":6671,"harness-components-guides-sensors-and-orchestration":6759,"real-results-why-the-harness-beats-solo-agents":6870,"trade-offs-and-how-to-implement-harness-engineering-today":6924},{"title":6397,"description":7187},{"loc":7197},"harness-engineering-3-core-system-reliable-production-ai-agents","articles\u002Fthe-3-core-agent-harness-why-production-agent-systems-need-planner-generator-evaluator-not-frameworks-ca-203-baseline-round2-article","9F3Tc1PUu6u5THLqevKsmyTtniK0N-jFEnyxvezgOFU"]