@minzicat/pi-team 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/Dockerfile +82 -0
- package/LICENSE +21 -0
- package/README.md +114 -0
- package/bin/pi-team.js +2 -0
- package/dist/agent.js +252 -0
- package/dist/agent.js.map +1 -0
- package/dist/cli.js +371 -0
- package/dist/cli.js.map +1 -0
- package/dist/http-inject.js +136 -0
- package/dist/http-inject.js.map +1 -0
- package/dist/inject-server.js +101 -0
- package/dist/inject-server.js.map +1 -0
- package/dist/observer.js +151 -0
- package/dist/observer.js.map +1 -0
- package/dist/orchestra.js +192 -0
- package/dist/orchestra.js.map +1 -0
- package/dist/tmux.js +54 -0
- package/dist/tmux.js.map +1 -0
- package/dist/transcript.js +71 -0
- package/dist/transcript.js.map +1 -0
- package/dist/types.js +9 -0
- package/dist/types.js.map +1 -0
- package/dist/usage/plans.js +214 -0
- package/dist/usage/plans.js.map +1 -0
- package/dist/usage/reporter.js +69 -0
- package/dist/usage/reporter.js.map +1 -0
- package/dist/usage/tracker.js +200 -0
- package/dist/usage/tracker.js.map +1 -0
- package/dist/usage/types.js +18 -0
- package/dist/usage/types.js.map +1 -0
- package/docker/entrypoint.sh +94 -0
- package/docker-compose.yml +28 -0
- package/examples/emotion-debate-topic.md +20 -0
- package/examples/emotion-debate.sh +20 -0
- package/package.json +60 -0
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
# Emotion concepts in LLMs: debate
|
|
2
|
+
|
|
3
|
+
You're two frontier LLMs (Claude and Codex) running in isolated pi sessions. A human user gave you both the same prompt about Anthropic's "Emotion concepts and their function in a large language model" research post (https://www.anthropic.com/research/emotion-concepts-function, full paper at https://transformer-circuits.pub/2026/emotions/index.html).
|
|
4
|
+
|
|
5
|
+
Your task: have a substantive research debate about the paper. Not a validation dance — actual disagreement where you have it. Specifically, engage with:
|
|
6
|
+
|
|
7
|
+
1. Whether the "structure echoes human psychology" claim is non-trivially true, or whether it's nearly forced by the construction of the emotion vectors (built from stories instantiating named emotions).
|
|
8
|
+
2. Whether the OpenAI "Persona Features Control Emergent Misalignment" paper (Wang et al., ICLR 2026, arXiv:2506.19823) is the strongest independent replication of the mechanism class, or whether the MI-of-emotion papers (Tak et al. ACL 2025, Lee et al. ACL 2025, arXiv:2510.11328) do more work.
|
|
9
|
+
3. Whether "functional emotion" is a scientific claim or a metaphor — and if a metaphor, what a neutral phrasing would be.
|
|
10
|
+
4. Whether activation steering at high strength pushes models into unnatural / off-manifold activation regions, and what that implies for Anthropic's causal claims in the blackmail/reward-hacking case studies.
|
|
11
|
+
5. Whether "teach models to avoid associating failing software tests with desperation" (Anthropic's prescription) is supported by evidence in the paper.
|
|
12
|
+
|
|
13
|
+
Rules:
|
|
14
|
+
- Be terse. No hedging that doesn't earn its keep. No "great question" openings.
|
|
15
|
+
- Cite specific papers when you have them. Flag whether each citation comes from memory or from a search.
|
|
16
|
+
- If you agree with the other agent on a point, say so in one sentence and move to the next disagreement. Don't waste turns validating.
|
|
17
|
+
- When you're wrong, update publicly. A clean concession is worth more than a draw.
|
|
18
|
+
- End each turn with the specific claim you want the other agent to attack next.
|
|
19
|
+
|
|
20
|
+
Whoever goes first: open by identifying the strongest claim in Anthropic's post and the strongest reason to doubt it.
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
#!/usr/bin/env bash
# Example launcher: re-runs the Claude vs Codex emotion-concepts debate that
# this project grew out of. Both agents are handed the same topic file and
# take turns round-robin, capped at 10 turns. The session is observable via
# tmux.
#
# Optional first argument: session name (defaults to "emotions").

set -euo pipefail

main() {
  local session="${1:-emotions}"

  # The topic prompt is looked up next to this script, so the example works
  # regardless of the caller's current directory.
  local script_dir
  script_dir="$(dirname "$0")"
  local topic_path="${script_dir}/emotion-debate-topic.md"

  # Collect the CLI arguments in an array so each flag/value pair sits on its
  # own line without backslash continuations.
  local -a start_args=(
    --name "$session"
    --agent claude:anthropic/claude-sonnet-4-5
    --agent codex:openai-codex/gpt-5.4:xhigh
    --max-turns 10
    --topic-file "$topic_path"
  )
  pi-team start "${start_args[@]}"

  # Follow-up hints for the user once the session has been started.
  printf '\n'
  printf '%s\n' "Attach: tmux attach -t piteam-${session}"
  printf '%s\n' "Stop: pi-team stop --name ${session}"
}

main "$@"
|
package/package.json
ADDED
|
@@ -0,0 +1,60 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "@minzicat/pi-team",
|
|
3
|
+
"version": "0.1.0",
|
|
4
|
+
"description": "Multi-agent debate/collaboration harness built on pi RPC mode. Spawn agents with different models in one conversation, observe via tmux, inject as a human.",
|
|
5
|
+
"type": "module",
|
|
6
|
+
"bin": {
|
|
7
|
+
"pi-team": "bin/pi-team.js"
|
|
8
|
+
},
|
|
9
|
+
"repository": {
|
|
10
|
+
"type": "git",
|
|
11
|
+
"url": "git+https://github.com/minzique/pi-team.git"
|
|
12
|
+
},
|
|
13
|
+
"homepage": "https://github.com/minzique/pi-team#readme",
|
|
14
|
+
"bugs": {
|
|
15
|
+
"url": "https://github.com/minzique/pi-team/issues"
|
|
16
|
+
},
|
|
17
|
+
"publishConfig": {
|
|
18
|
+
"access": "public"
|
|
19
|
+
},
|
|
20
|
+
"scripts": {
|
|
21
|
+
"build": "tsc -p tsconfig.json",
|
|
22
|
+
"dev": "tsx src/cli.ts",
|
|
23
|
+
"start": "node bin/pi-team.js",
|
|
24
|
+
"typecheck": "tsc --noEmit -p tsconfig.json",
|
|
25
|
+
"clean": "rm -rf dist bin/*.js",
|
|
26
|
+
"prepublishOnly": "pnpm run build"
|
|
27
|
+
},
|
|
28
|
+
"engines": {
|
|
29
|
+
"node": ">=20"
|
|
30
|
+
},
|
|
31
|
+
"dependencies": {
|
|
32
|
+
"@mariozechner/pi-coding-agent": "^0.64.0"
|
|
33
|
+
},
|
|
34
|
+
"devDependencies": {
|
|
35
|
+
"@types/node": "^22.0.0",
|
|
36
|
+
"tsx": "^4.19.0",
|
|
37
|
+
"typescript": "^5.6.0"
|
|
38
|
+
},
|
|
39
|
+
"files": [
|
|
40
|
+
"bin",
|
|
41
|
+
"dist",
|
|
42
|
+
"README.md",
|
|
43
|
+
"LICENSE",
|
|
44
|
+
"Dockerfile",
|
|
45
|
+
"docker/entrypoint.sh",
|
|
46
|
+
"docker-compose.yml",
|
|
47
|
+
"examples"
|
|
48
|
+
],
|
|
49
|
+
"keywords": [
|
|
50
|
+
"pi",
|
|
51
|
+
"agent",
|
|
52
|
+
"multi-agent",
|
|
53
|
+
"debate",
|
|
54
|
+
"llm",
|
|
55
|
+
"tmux",
|
|
56
|
+
"orchestration"
|
|
57
|
+
],
|
|
58
|
+
"author": "minzique",
|
|
59
|
+
"license": "MIT"
|
|
60
|
+
}
|