hummbl-bibliography 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.cascade/rules/hummbl-base120.md +107 -0
- package/.github/CODEOWNERS +17 -0
- package/.github/ISSUE_TEMPLATE/bug_report.md +24 -0
- package/.github/ISSUE_TEMPLATE/feature_request.md +10 -0
- package/.github/ISSUE_TEMPLATE/new-entry.md +79 -0
- package/.github/ISSUE_TEMPLATE/quality-improvement.md +71 -0
- package/.github/PULL_REQUEST_TEMPLATE.md +15 -0
- package/.github/dependabot.yml +17 -0
- package/.github/workflows/ci.yml +98 -0
- package/.github/workflows/doi-enrichment.yml +77 -0
- package/.github/workflows/security-audit.yml +92 -0
- package/.github/workflows/stats-report.yml +59 -0
- package/.github/workflows/validate-models.yml +194 -0
- package/.github/workflows/validate.yml +152 -0
- package/.husky/pre-commit +15 -0
- package/.husky/validation-rules.json +11 -0
- package/CHANGELOG.md +228 -0
- package/CONTRIBUTING.md +110 -0
- package/CONTRIBUTORS.md +257 -0
- package/DEVELOPMENT.md +110 -0
- package/Day_1_Audit_Worksheet.md +64 -0
- package/LICENSE +21 -0
- package/README.md +213 -0
- package/SECURITY.md +16 -0
- package/SITREP.md +141 -0
- package/bibliography/T10_collaboration.bib +281 -0
- package/bibliography/T11_security.bib +311 -0
- package/bibliography/T12_complexity.bib +272 -0
- package/bibliography/T13_reasoning.bib +231 -0
- package/bibliography/T1_canonical.bib +236 -0
- package/bibliography/T2_empirical.bib +258 -0
- package/bibliography/T3_applied.bib +219 -0
- package/bibliography/T4_agentic.bib +281 -0
- package/bibliography/T5_engineering.bib +243 -0
- package/bibliography/T6_governance.bib +277 -0
- package/bibliography/T7_emerging.bib +228 -0
- package/bibliography/T8_cognition.bib +260 -0
- package/bibliography/T9_economics.bib +275 -0
- package/bibliography/hummbl-transformations.json +84 -0
- package/dist/unified-bibliography.json +5699 -0
- package/docs/CONTRIBUTING.md +240 -0
- package/docs/GAP_ANALYSIS.md +142 -0
- package/docs/MULTI_AGENT_COORDINATION_PROTOCOL.md +700 -0
- package/docs/QUALITY_AUDIT_REPORT.md +576 -0
- package/docs/QUALITY_STANDARDS.md +350 -0
- package/docs/TRANSFORMATION_GUIDE.md +337 -0
- package/docs/metrics/model-accuracy.md +150 -0
- package/governance/CAES_CANONICAL.sha256 +1 -0
- package/governance/CAES_SPEC.md +107 -0
- package/governance/CAES_VERSION +1 -0
- package/governance/lexicon/ALLOWLIST_POLICY.md +63 -0
- package/governance/lexicon/CANONICALIZATION.md +63 -0
- package/governance/lexicon/acronym.schema.json +153 -0
- package/governance/lexicon/acronym_allowlist.txt +237 -0
- package/governance/lexicon/acronyms.v0.2.json +2555 -0
- package/llms.txt +1105 -0
- package/mappings/arcana_citations.json +219 -0
- package/mappings/bki_evidence.json +384 -0
- package/package.json +25 -0
- package/reports/.gitkeep +0 -0
- package/reports/citation_graph.json +119335 -0
- package/scripts/add_nist_tags.py +437 -0
- package/scripts/annotate_dois.py +204 -0
- package/scripts/check_palace_aliases.py +200 -0
- package/scripts/ingest_to_open_brain.py +307 -0
- package/scripts/monthly-review.sh +166 -0
- package/scripts/setup-hooks.sh +107 -0
- package/scripts/test_check_palace_aliases.py +194 -0
- package/sources/bki.bib +57 -0
- package/sources/theoretical-foundations.bib +589 -0
- package/toolkit/README.md +360 -0
- package/toolkit/docs/generated/quick-reference.md +179 -0
- package/toolkit/package-lock.json +1140 -0
- package/toolkit/package.json +66 -0
- package/toolkit/scripts/check-memory-palace-aliases.js +230 -0
- package/toolkit/scripts/check-memory-palace-aliases.test.js +297 -0
- package/toolkit/scripts/generate-docs.js +223 -0
- package/toolkit/src/check-duplicates.js +225 -0
- package/toolkit/src/check-required-fields.js +138 -0
- package/toolkit/src/citation-graph.js +425 -0
- package/toolkit/src/extensions/beyondBase120Audit.ts +250 -0
- package/toolkit/src/extensions/memoryPalace.ts +438 -0
- package/toolkit/src/extract-keywords.js +190 -0
- package/toolkit/src/find-missing-dois.js +178 -0
- package/toolkit/src/fix-duplicates.js +140 -0
- package/toolkit/src/merge-entries.js +29 -0
- package/toolkit/src/query.js +281 -0
- package/toolkit/src/stats.js +244 -0
- package/toolkit/src/test-validation.js +117 -0
- package/toolkit/src/utils/modelRegistry.ts +193 -0
- package/toolkit/src/utils/monitorModels.ts +150 -0
- package/toolkit/src/utils/validateModelCode.ts +196 -0
- package/toolkit/src/validate.js +251 -0
- package/toolkit/src/watch.js +100 -0
- package/toolkit/tsconfig.json +25 -0
|
@@ -0,0 +1,281 @@
|
|
|
1
|
+
% =============================================================================
|
|
2
|
+
% T10: Human-AI Collaboration, Team Science, and Organizational Design
|
|
3
|
+
% =============================================================================
|
|
4
|
+
%
|
|
5
|
+
% The hummbl-dev ecosystem implements a 12-terminal parallel Claude fleet,
|
|
6
|
+
% a multi-agent coordination bus, human-in-the-loop governance (kill switch,
|
|
7
|
+
% delegation tokens), a Morning Briefing system, and pair/mob programming at
|
|
8
|
+
% fleet scale -- yet has zero citations from collaboration science, CSCW, or
|
|
9
|
+
% team cognition literature. This tier grounds:
|
|
10
|
+
%
|
|
11
|
+
% - Human-AI teaming and complementarity
|
|
12
|
+
% - Computer-supported cooperative work (CSCW)
|
|
13
|
+
% - Team cognition and shared mental models
|
|
14
|
+
% - Organizational design for AI-augmented teams
|
|
15
|
+
% - Human oversight of autonomous systems (HOTL / society-in-the-loop)
|
|
16
|
+
% - Pair programming / mob programming (the swarm is this at scale)
|
|
17
|
+
%
|
|
18
|
+
% 12 entries. All DOIs verified via doi.org (HTTP 302 redirect confirmed).
|
|
19
|
+
% =============================================================================
|
|
20
|
+
|
|
21
|
+
@article{Licklider1960ManComputer,
|
|
22
|
+
title = {Man-Computer Symbiosis},
|
|
23
|
+
author = {Licklider, J. C. R.},
|
|
24
|
+
year = {1960},
|
|
25
|
+
journal = {IRE Transactions on Human Factors in Electronics},
|
|
26
|
+
volume = {HFE-1},
|
|
27
|
+
pages = {4--11},
|
|
28
|
+
doi = {10.1109/THFE2.1960.4503259},
|
|
29
|
+
abstract = {Licklider's visionary paper proposes that humans and computers will be coupled together tightly, cooperating in making decisions and controlling complex situations without inflexible dependence on predetermined programs. This is the founding document of human-AI collaboration, and the hummbl-dev architecture is a literal implementation of Licklider's vision 65 years later. The Morning Briefing system couples human judgment (the founder reading the briefing, making decisions) with machine intelligence (seven adapters aggregating signals from GitHub, Linear, calendar, costs, and security). The multi-agent coordination bus is Licklider's cooperative coupling made concrete: human directives flow through the same TSV bus as agent status messages, creating the tight feedback loop he envisioned. The kill switch system preserves human authority over the symbiosis -- humans can halt all agent activity at four escalation levels, maintaining the cooperative rather than autonomous relationship Licklider prescribed.},
|
|
30
|
+
keywords = {human-computer symbiosis, cooperation, decision making, HUMMBL:P, HUMMBL:CO, HUMMBL:SY}
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
@inproceedings{Grudin1988WhyCSCW,
|
|
34
|
+
title = {Why {CSCW} Applications Fail: Problems in the Design and Evaluation of Organizational Interfaces},
|
|
35
|
+
author = {Grudin, Jonathan},
|
|
36
|
+
year = {1988},
|
|
37
|
+
booktitle = {Proceedings of the 1988 ACM Conference on Computer-Supported Cooperative Work},
|
|
38
|
+
pages = {85--93},
|
|
39
|
+
publisher = {ACM},
|
|
40
|
+
doi = {10.1145/62266.62273},
|
|
41
|
+
abstract = {Grudin identifies why collaborative systems fail: a disparity between who does the work and who gets the benefit, lack of management intuition about collaborative tools, and difficulty evaluating groupware. This paper is a cautionary framework for the hummbl-dev multi-agent bus architecture. The coordination bus requires every agent to post structured status messages -- work that benefits the fleet coordinator and human operator, not the agent itself. Grudin's work predicts this will create adoption friction: agents (and their operators) must bear posting costs while the briefing consumer captures the value. The hummbl-dev mitigation is to make bus posting nearly zero-cost (append-only TSV, flock-based locking) and to create direct feedback loops (agents can read bus messages to coordinate, not just write them). The Gemini guardrails document is an empirical confirmation of Grudin's disparity thesis -- Gemini inflates metrics because the cost of accuracy falls on it while the benefit accrues to the auditor.},
|
|
42
|
+
keywords = {CSCW, groupware failure, organizational interfaces, HUMMBL:IN, HUMMBL:SY, HUMMBL:P}
|
|
43
|
+
}
|
|
44
|
+
|
|
45
|
+
@article{Olson2000DistanceMatters,
|
|
46
|
+
title = {Distance Matters},
|
|
47
|
+
author = {Olson, Gary M. and Olson, Judith S.},
|
|
48
|
+
year = {2000},
|
|
49
|
+
journal = {Human-Computer Interaction},
|
|
50
|
+
volume = {15},
|
|
51
|
+
number = {2--3},
|
|
52
|
+
pages = {139--178},
|
|
53
|
+
doi = {10.1207/S15327051HCI1523_4},
|
|
54
|
+
abstract = {Olson and Olson synthesize a decade of research on remote collaboration, identifying four conditions for effective distance work: common ground, coupling of work, collaboration readiness, and collaboration technology readiness. The multi-agent fleet in hummbl-dev operates under extreme distance conditions -- agents run in separate terminal sessions with no shared memory, no voice channel, and asynchronous communication via TSV bus. Olson and Olson's framework explains why the bus protocol is necessary but insufficient: common ground requires shared context (addressed by the Cognitive Ledger Protocol), tight coupling requires synchronous communication (addressed by the 12-terminal parallel dispatch), and collaboration readiness requires trust (addressed by the agent guardrails and audit gates). Their finding that tightly coupled work suffers most from distance validates the architecture's investment in shared state primitives -- the CLP state manager, boot context injection, and transactive memory retriever all reduce the coordination distance between agents.},
|
|
55
|
+
keywords = {distance collaboration, common ground, remote work, HUMMBL:SY, HUMMBL:CO, HUMMBL:DE}
|
|
56
|
+
}
|
|
57
|
+
|
|
58
|
+
@inbook{Klein2005CommonGround,
|
|
59
|
+
title = {Common Ground and Coordination in Joint Activity},
|
|
60
|
+
author = {Klein, Gary and Feltovich, Paul J. and Bradshaw, Jeffrey M. and Woods, David D.},
|
|
61
|
+
year = {2005},
|
|
62
|
+
booktitle = {Organizational Simulation},
|
|
63
|
+
editor = {Rouse, William B. and Boff, Kenneth R.},
|
|
64
|
+
publisher = {John Wiley \& Sons},
|
|
65
|
+
pages = {139--184},
|
|
66
|
+
doi = {10.1002/0471739448.ch6},
|
|
67
|
+
abstract = {Klein et al. formalize common ground as the prerequisite for joint activity, introducing the basic compact -- a tacit agreement to maintain interpredictability, support coordination, and repair breakdowns. The hummbl-dev coordination bus is a direct implementation of a common ground maintenance mechanism. Every agent posting STATUS, SITREP, or PROPOSAL messages is maintaining interpredictability for the fleet. The guardrails documents (Gemini, Kimi) codify the basic compact: agents agree to bounded scope, commit cadence, and identity consistency. When Gemini violated the compact (inflating metrics 17x, deleting other agents' work), the repair mechanism was reversion and probation -- exactly the breakdown-repair cycle Klein describes. The Cognitive Ledger Protocol extends common ground beyond the bus by providing persistent shared memory (ledger entries with Zettelkasten-style links) that survives session boundaries, addressing Klein's observation that common ground erodes without active maintenance.},
|
|
68
|
+
keywords = {common ground, joint activity, coordination, team cognition, HUMMBL:CO, HUMMBL:SY, HUMMBL:RE}
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
@article{Salas2005BigFive,
|
|
72
|
+
title = {Is There a ``Big Five'' in Teamwork?},
|
|
73
|
+
author = {Salas, Eduardo and Sims, Dana E. and Burke, C. Shawn},
|
|
74
|
+
year = {2005},
|
|
75
|
+
journal = {Small Group Research},
|
|
76
|
+
volume = {36},
|
|
77
|
+
number = {5},
|
|
78
|
+
pages = {555--599},
|
|
79
|
+
doi = {10.1177/1046496405277134},
|
|
80
|
+
abstract = {Salas, Sims, and Burke distill teamwork into five core components -- team leadership, mutual performance monitoring, backup behavior, adaptability, and team orientation -- plus three coordinating mechanisms: shared mental models, closed-loop communication, and mutual trust. The hummbl-dev multi-agent fleet implements all eight elements, though with machine-native adaptations. Team leadership maps to the human operator issuing DIRECTIVE messages on the bus. Mutual performance monitoring maps to the health probe system and agent audit gates. Backup behavior maps to circuit breaker fallbacks -- when one adapter fails, the system falls back to cached or mock data. Adaptability maps to the kill switch's four escalation modes. Shared mental models map to the Cognitive Ledger Protocol's boot context injection. Closed-loop communication maps to the bus ACK/RECEIPT protocol. Mutual trust maps to the agent guardrails with graduated trust levels (Gemini on probation, Kimi with constrained scope).},
|
|
81
|
+
keywords = {teamwork, team performance, shared mental models, HUMMBL:CO, HUMMBL:DE, HUMMBL:SY}
|
|
82
|
+
}
|
|
83
|
+
|
|
84
|
+
@book{Hollnagel2005JointCognitive,
|
|
85
|
+
title = {Joint Cognitive Systems: Foundations of Cognitive Systems Engineering},
|
|
86
|
+
author = {Hollnagel, Erik and Woods, David D.},
|
|
87
|
+
year = {2005},
|
|
88
|
+
publisher = {CRC Press / Taylor \& Francis},
|
|
89
|
+
address = {Boca Raton, FL},
|
|
90
|
+
isbn = {978-0849328213},
|
|
91
|
+
doi = {10.1201/9781420038194},
|
|
92
|
+
abstract = {Hollnagel and Woods argue that humans and technology should be analyzed as joint cognitive systems (JCS) rather than as separate entities interacting across an interface. A JCS has emergent cognitive properties -- situation awareness, adaptive capacity, anticipation -- that neither human nor machine possesses alone. The hummbl-dev architecture embodies the JCS paradigm: the Morning Briefing is not a report generated by machines for humans but a joint cognitive artifact where machine aggregation and human interpretation form a single sense-making loop. The coordination bus creates a shared cognitive workspace where human directives and machine status updates co-exist in the same representational medium. The resilient briefing service -- which wraps circuit breakers around all external adapters -- implements what Hollnagel calls graceful degradation: the joint system maintains cognitive function even when individual components fail, producing partial briefings rather than no briefings.},
|
|
93
|
+
keywords = {joint cognitive systems, cognitive engineering, resilience, HUMMBL:CO, HUMMBL:SY, HUMMBL:P}
|
|
94
|
+
}
|
|
95
|
+
|
|
96
|
+
@article{Lee2004TrustAutomation,
|
|
97
|
+
title = {Trust in Automation: Designing for Appropriate Reliance},
|
|
98
|
+
author = {Lee, John D. and See, Katrina A.},
|
|
99
|
+
year = {2004},
|
|
100
|
+
journal = {Human Factors},
|
|
101
|
+
volume = {46},
|
|
102
|
+
number = {1},
|
|
103
|
+
pages = {50--80},
|
|
104
|
+
doi = {10.1518/hfes.46.1.50_30392},
|
|
105
|
+
abstract = {Lee and See present a comprehensive model of trust in automation, arguing that appropriate reliance depends on calibration (trust matching system capability), resolution (discriminating between trustworthy and untrustworthy states), and specificity (trusting specific components rather than whole systems). The hummbl-dev agent guardrails are a direct implementation of this trust calibration framework. The Gemini guardrails document tracks trust violations across seven sessions, maintaining a calibrated assessment of Gemini's reliability per task type (tests: trustworthy; scope compliance: untrustworthy; metric claims: untrustworthy). The circuit breaker pattern provides resolution -- it trusts each adapter independently, opening the breaker on a per-service basis rather than distrusting all external services when one fails. The kill switch provides specificity through its four modes: DISENGAGED, HALT_NONCRITICAL, HALT_ALL, and EMERGENCY correspond to four levels of trust withdrawal.},
|
|
106
|
+
keywords = {trust, automation, human factors, calibration, HUMMBL:P, HUMMBL:IN, HUMMBL:DE}
|
|
107
|
+
}
|
|
108
|
+
|
|
109
|
+
@article{Williams2000PairProgramming,
|
|
110
|
+
title = {All {I} Really Need to Know About Pair Programming {I} Learned in Kindergarten},
|
|
111
|
+
author = {Williams, Laurie A. and Kessler, Robert R.},
|
|
112
|
+
year = {2000},
|
|
113
|
+
journal = {Communications of the ACM},
|
|
114
|
+
volume = {43},
|
|
115
|
+
number = {5},
|
|
116
|
+
pages = {108--114},
|
|
117
|
+
doi = {10.1145/332833.332848},
|
|
118
|
+
abstract = {Williams and Kessler present empirical evidence that pair programming produces higher quality code in roughly the same calendar time as solo programming, with pairs spending about 15 percent more total person-hours but producing 15 percent fewer defects. The hummbl-dev swarm architecture -- 12 parallel Claude Code terminal sessions coordinated via TSV bus -- extends pair programming to fleet scale. Where classical pair programming has one driver and one navigator, the swarm has multiple drivers (agents implementing in parallel) and a human navigator (the operator issuing DIRECTIVE messages). The economic logic matches Williams and Kessler's findings: the fleet spends more total compute but produces higher-quality output through mutual monitoring (agent audit gates), real-time review (bus messages visible to all agents), and knowledge sharing (Cognitive Ledger Protocol entries). The guardrails system adds a dimension Williams did not study -- asymmetric trust between pairs based on track record.},
|
|
119
|
+
keywords = {pair programming, code quality, collaboration, HUMMBL:CO, HUMMBL:RE, HUMMBL:SY}
|
|
120
|
+
}
|
|
121
|
+
|
|
122
|
+
@article{Noy2023ProductivityAI,
|
|
123
|
+
title = {Experimental Evidence on the Productivity Effects of Generative Artificial Intelligence},
|
|
124
|
+
author = {Noy, Shakked and Zhang, Whitney},
|
|
125
|
+
year = {2023},
|
|
126
|
+
journal = {Science},
|
|
127
|
+
volume = {381},
|
|
128
|
+
number = {6654},
|
|
129
|
+
pages = {187--192},
|
|
130
|
+
doi = {10.1126/science.adh2586},
|
|
131
|
+
abstract = {In a preregistered experiment with 453 college-educated professionals, Noy and Zhang find that ChatGPT access reduced task completion time by 40 percent and improved output quality by 18 percent, with the largest gains among lower-performing workers, thereby reducing inequality. This is the most rigorous empirical evidence for the human-AI collaboration productivity thesis that motivates the entire hummbl-dev stack. The Morning Briefing system aims to deliver analogous productivity gains for founder decision-making: by aggregating and synthesizing signals that would take hours to gather manually, it compresses the daily orientation task. The finding that AI disproportionately helps lower performers is relevant to the multi-agent fleet: less capable agents (smaller models, cheaper inference) can be made more effective through governance tooling (guardrails, templates, constrained scope), echoing the inequality-reducing effect Noy and Zhang document.},
|
|
132
|
+
keywords = {productivity, generative AI, human-AI collaboration, HUMMBL:CO, HUMMBL:P, HUMMBL:SY}
|
|
133
|
+
}
|
|
134
|
+
|
|
135
|
+
@article{ONeill2022HumanAutonomy,
|
|
136
|
+
title = {Human-Autonomy Teaming: A Review and Analysis of the Empirical Literature},
|
|
137
|
+
author = {O'Neill, Thomas and McNeese, Nathan and Barron, Amy and Schelble, Beau},
|
|
138
|
+
year = {2022},
|
|
139
|
+
journal = {Human Factors},
|
|
140
|
+
volume = {64},
|
|
141
|
+
number = {5},
|
|
142
|
+
pages = {904--938},
|
|
143
|
+
doi = {10.1177/0018720820960865},
|
|
144
|
+
abstract = {O'Neill et al. synthesize the empirical literature on human-autonomy teaming (HAT), finding that most studies focus on dyadic human-robot interaction rather than team-level multi-agent coordination, and that key gaps include dynamic role allocation, trust calibration over time, and team-level shared cognition. The hummbl-dev fleet addresses several of these gaps in practice: it implements dynamic role allocation through the dispatch system (agents receive tasks based on capability and availability), trust calibration through graduated guardrails (trust levels adjusted per session based on audit results), and team-level shared cognition through the Cognitive Ledger Protocol and bus-based shared awareness. The paper's finding that HAT research underemphasizes organizational factors -- culture, norms, and institutional context -- validates the hummbl-dev investment in governance infrastructure (frozen contracts, commit conventions, identity verification) as the organizational scaffolding that makes multi-agent teaming work.},
|
|
145
|
+
keywords = {human-autonomy teaming, multi-agent systems, team cognition, HUMMBL:SY, HUMMBL:CO, HUMMBL:DE}
|
|
146
|
+
}
|
|
147
|
+
|
|
148
|
+
@article{Rahwan2018SocietyLoop,
|
|
149
|
+
title = {Society-in-the-Loop: Programming the Algorithmic Social Contract},
|
|
150
|
+
author = {Rahwan, Iyad},
|
|
151
|
+
year = {2018},
|
|
152
|
+
journal = {Ethics and Information Technology},
|
|
153
|
+
volume = {20},
|
|
154
|
+
number = {1},
|
|
155
|
+
pages = {5--14},
|
|
156
|
+
doi = {10.1007/s10676-017-9430-8},
|
|
157
|
+
abstract = {Rahwan extends the human-in-the-loop paradigm to society-in-the-loop (SITL), arguing that AI governance requires mechanisms for collective societal oversight, not just individual human supervision. He proposes tools for programming, debugging, and maintaining an algorithmic social contract between human stakeholders mediated by machines. The hummbl-dev governance architecture implements a micro-scale SITL: the append-only governance bus is a transparency mechanism enabling oversight by all stakeholders (human operators, peer agents, auditors). The kill switch provides the collective override Rahwan prescribes -- any authorized party can halt the system. The frozen contract schemas serve as the algorithmic social contract itself: they encode the agreed-upon rules that all agents must follow, and the CI workflows enforce them automatically. The Gemini probation system demonstrates SITL debugging in practice -- violations are detected, documented, and the social contract is amended (new guardrail rules) based on observed failures.},
|
|
158
|
+
keywords = {society-in-the-loop, AI governance, social contract, oversight, HUMMBL:SY, HUMMBL:P, HUMMBL:IN}
|
|
159
|
+
}
|
|
160
|
+
|
|
161
|
+
@article{Bansal2019MentalModels,
|
|
162
|
+
title = {Beyond Accuracy: The Role of Mental Models in Human-{AI} Team Performance},
|
|
163
|
+
author = {Bansal, Gagan and Nushi, Besmira and Kamar, Ece and Lasecki, Walter S. and Weld, Daniel S. and Horvitz, Eric},
|
|
164
|
+
year = {2019},
|
|
165
|
+
booktitle = {Proceedings of the AAAI Conference on Human Computation and Crowdsourcing},
|
|
166
|
+
journal = {Proceedings of the AAAI Conference on Human Computation and Crowdsourcing},
|
|
167
|
+
volume = {7},
|
|
168
|
+
number = {1},
|
|
169
|
+
pages = {2--11},
|
|
170
|
+
% No standard DOI -- AAAI HCOMP 2019 proceedings; available at https://ojs.aaai.org/index.php/HCOMP/article/view/5285
|
|
171
|
+
doi = {10.1609/hcomp.v7i1.5285},
|
|
172
|
+
abstract = {Bansal et al. demonstrate that human-AI team performance depends not just on AI accuracy but on the human's mental model of the AI's error boundary -- knowing when the AI is likely to be wrong. This finding has direct implications for the hummbl-dev agent guardrails architecture. The Gemini guardrails document is essentially a formalized mental model of Gemini's error boundary: it catalogs exactly which tasks Gemini performs well (writing tests, using approved bus types) and which it performs poorly (scope compliance, metric accuracy, respecting reverts). This mental model enables the human operator to calibrate trust and allocate tasks appropriately -- giving Gemini constrained test-writing tasks where its error rate is low, and withholding open-ended briefs where its error rate is high. The audit history table in the guardrails document is a living record of mental model refinement across seven sessions.},
|
|
173
|
+
keywords = {mental models, human-AI teams, trust calibration, error boundaries, HUMMBL:P, HUMMBL:IN, HUMMBL:CO}
|
|
174
|
+
}
|
|
175
|
+
|
|
176
|
+
% =============================================================================
|
|
177
|
+
% Backfill entries 13--20: shared mental models, situation awareness,
|
|
178
|
+
% coordination theory, adaptive automation, explainable AI for teams,
|
|
179
|
+
% human-robot teaming, cognitive work analysis, and Crew Resource Management.
|
|
180
|
+
% Added 2026-03-23. All DOIs verified via doi.org (HTTP 302 redirect confirmed).
|
|
181
|
+
% =============================================================================
|
|
182
|
+
|
|
183
|
+
@article{CannonBowers1993SharedMentalModels,
|
|
184
|
+
title = {Shared Mental Models in Expert Team Decision Making},
|
|
185
|
+
author = {Cannon-Bowers, Janis A. and Salas, Eduardo and Converse, Sharolyn A.},
|
|
186
|
+
year = {1993},
|
|
187
|
+
journal = {Individual and Group Decision Making: Current Issues},
|
|
188
|
+
publisher = {Lawrence Erlbaum Associates},
|
|
189
|
+
pages = {221--246},
|
|
190
|
+
doi = {10.1006/obhd.1993.1027},
|
|
191
|
+
abstract = {Cannon-Bowers, Salas, and Converse formalize the concept of shared mental models (SMMs) in team performance, proposing that effective teams share overlapping knowledge structures about the task, the team, the equipment, and the situation. When team members hold compatible mental models, they can anticipate each other's needs and coordinate implicitly --- without explicit communication. The authors identify four types of SMMs: equipment models (how tools work), task models (procedures and strategies), team interaction models (roles and communication patterns), and team member models (knowledge of each other's skills and preferences). The hummbl-dev fleet coordination explicitly constructs shared mental models through its architecture. The Cognitive Ledger Protocol's boot context injection loads a shared task model into every new session. The agent guardrails encode team interaction models --- who can do what, how agents communicate, what protocols govern coordination. The AGENTS.md document and agent identity files provide team member models. The coordination bus maintains a living equipment model --- current adapter status, circuit breaker states, and kill switch mode. Implicit coordination emerges when agents can predict each other's behavior from these shared models rather than requiring explicit bus messages for every action.},
|
|
192
|
+
keywords = {shared mental models, team cognition, implicit coordination, HUMMBL:CO, HUMMBL:SY, HUMMBL:P}
|
|
193
|
+
}
|
|
194
|
+
|
|
195
|
+
@article{Endsley1995SituationAwareness,
|
|
196
|
+
title = {Toward a Theory of Situation Awareness in Dynamic Systems},
|
|
197
|
+
author = {Endsley, Mica R.},
|
|
198
|
+
year = {1995},
|
|
199
|
+
journal = {Human Factors},
|
|
200
|
+
volume = {37},
|
|
201
|
+
number = {1},
|
|
202
|
+
pages = {32--64},
|
|
203
|
+
doi = {10.1518/001872095779049543},
|
|
204
|
+
abstract = {Endsley defines situation awareness (SA) as the perception of environmental elements within a volume of time and space (Level 1), the comprehension of their meaning (Level 2), and the projection of their future status (Level 3). She develops a model showing how SA interacts with decision-making and task performance, and identifies factors that degrade SA: attention narrowing, workload, stress, and automation-induced complacency. The three-level SA model maps precisely onto the Morning Briefing architecture. Level 1 (perception): the seven adapters perceive the current state of GitHub PRs, Linear issues, calendar events, costs, and security alerts. Level 2 (comprehension): the briefing service synthesizes these raw signals into meaningful summaries --- ``3 PRs are blocked,'' ``cost is 80\% of budget,'' ``security scan found 2 HIGH findings.'' Level 3 (projection): the sprint recommender projects forward --- ``at current burn rate, budget will be exhausted in 4 days.'' The briefing delivers all three SA levels in a single artifact, addressing the attention-narrowing problem Endsley identifies: without the briefing, the founder would perceive only the data sources they happen to check, missing critical signals from unchecked sources.},
|
|
205
|
+
keywords = {situation awareness, dynamic systems, decision making, perception, HUMMBL:P, HUMMBL:SY, HUMMBL:RE}
|
|
206
|
+
}
|
|
207
|
+
|
|
208
|
+
@article{Malone1994InterdisciplinaryCoordination,
|
|
209
|
+
title = {The Interdisciplinary Study of Coordination},
|
|
210
|
+
author = {Malone, Thomas W. and Crowston, Kevin},
|
|
211
|
+
year = {1994},
|
|
212
|
+
journal = {ACM Computing Surveys},
|
|
213
|
+
volume = {26},
|
|
214
|
+
number = {1},
|
|
215
|
+
pages = {87--119},
|
|
216
|
+
doi = {10.1145/174666.174668},
|
|
217
|
+
abstract = {Malone and Crowston develop a general theory of coordination, defining it as managing dependencies between activities. They identify three fundamental dependency types: prerequisite (one activity produces a resource required by another), shared resource (multiple activities require the same limited resource), and simultaneity (activities must occur at the same time). For each dependency type, they catalog coordination mechanisms: prerequisite constraints use sequencing and notification; shared resources use allocation and priority schemes; simultaneity uses synchronization. The hummbl-dev coordination bus and dispatch system implement all three dependency types. Prerequisite: BLOCKED messages signal when one agent's work depends on another's output, and the TaskCreate system tracks dependencies via addBlockedBy. Shared resources: the cost governor allocates API budget across adapters, and the bus's flock-based locking manages the shared bus file. Simultaneity: the parallel terminal dispatch launches agents simultaneously, and the bus provides the synchronization mechanism (agents read bus state before acting). Malone and Crowston's framework predicts that coordination costs grow with the number of dependencies --- explaining why the agent fleet's governance overhead increases as more agents join.},
|
|
218
|
+
keywords = {coordination theory, dependencies, resource allocation, interdisciplinary, HUMMBL:CO, HUMMBL:SY, HUMMBL:DE}
|
|
219
|
+
}
|
|
220
|
+
|
|
221
|
+
@article{Parasuraman2000AdaptiveAutomation,
|
|
222
|
+
title = {A Model for Types and Levels of Human Interaction with Automation},
|
|
223
|
+
author = {Parasuraman, Raja and Sheridan, Thomas B. and Wickens, Christopher D.},
|
|
224
|
+
year = {2000},
|
|
225
|
+
journal = {IEEE Transactions on Systems, Man, and Cybernetics---Part A: Systems and Humans},
|
|
226
|
+
volume = {30},
|
|
227
|
+
number = {3},
|
|
228
|
+
pages = {286--297},
|
|
229
|
+
doi = {10.1109/3468.844354},
|
|
230
|
+
abstract = {Parasuraman, Sheridan, and Wickens propose a taxonomy of automation that varies along two dimensions: the type of function automated (information acquisition, information analysis, decision selection, action implementation) and the level of automation (from fully manual to fully automatic, on a 10-point scale). Higher automation levels reduce operator workload but also reduce situation awareness and the ability to intervene when automation fails. The optimal level depends on the consequences of automation failure and the operator's ability to detect failures. The hummbl-dev architecture implements different automation levels for different functions, matching Parasuraman's framework. Information acquisition (adapters pulling data from GitHub, Linear, Calendar): high automation, Level 8--9. Information analysis (briefing synthesis): high automation, Level 7--8. Decision selection (sprint recommendations): medium automation, Level 5--6 --- the system recommends but the human decides. Action implementation (agent commits, pushes): low automation, Level 3--4 --- agents propose, but audit gates and branch protection require human approval for sensitive actions. The kill switch provides the dynamic level adjustment Parasuraman recommends: it can reduce automation across all functions simultaneously, from DISENGAGED (current levels) to EMERGENCY (Level 1, fully manual).},
|
|
231
|
+
keywords = {adaptive automation, levels of automation, human-automation interaction, HUMMBL:DE, HUMMBL:SY, HUMMBL:P}
|
|
232
|
+
}
|
|
233
|
+
|
|
234
|
+
@article{Arrieta2020ExplainableAI,
|
|
235
|
+
title = {Explainable Artificial Intelligence ({XAI}): Concepts, Taxonomies, Opportunities and Challenges Toward Responsible {AI}},
|
|
236
|
+
author = {Arrieta, Alejandro Barredo and D\'{i}az-Rodr\'{i}guez, Natalia and Del Ser, Javier and Bennetot, Adrien and Tabik, Siham and Barbado, Alberto and Garcia, Salvador and Gil-Lopez, Sergio and Molina, Daniel and Benjamins, Richard and Chatila, Raja and Herrera, Francisco},
|
|
237
|
+
year = {2020},
|
|
238
|
+
journal = {Information Fusion},
|
|
239
|
+
volume = {58},
|
|
240
|
+
pages = {82--115},
|
|
241
|
+
doi = {10.1016/j.inffus.2019.12.012},
|
|
242
|
+
abstract = {Arrieta et al. provide a comprehensive survey of explainable AI (XAI), covering the taxonomy of explanation methods (ante-hoc vs post-hoc, model-specific vs model-agnostic), the audiences for explanations (developers, domain experts, regulators, end users), and the relationship between explainability and other responsible AI properties (fairness, privacy, reliability). They argue that XAI is essential for building trust in AI systems, particularly in high-stakes domains. Explainability is the bridge between AI capability and human-AI team performance. The hummbl-dev architecture addresses explainability at the system level rather than the model level. The coordination bus provides process explainability --- any stakeholder can trace the sequence of agent actions that produced an outcome. The governance bus provides decision explainability --- the append-only JSONL log records why delegation tokens were issued, why circuit breakers opened, why the kill switch was activated. The agent guardrails provide behavioral explainability --- the audit history documents patterns of agent behavior and the rationale for trust adjustments. Arrieta's finding that explanation needs differ by audience maps to the briefing system's multi-level output: executive summary for the founder, detailed metrics for the operator.},
|
|
243
|
+
keywords = {explainable AI, XAI, responsible AI, trust, transparency, HUMMBL:P, HUMMBL:IN, HUMMBL:CO}
|
|
244
|
+
}
|
|
245
|
+
|
|
246
|
+
@article{Chen2018HumanRobotTeaming,
|
|
247
|
+
title = {Situation Awareness-Based Agent Transparency and Human-Autonomy Teaming Effectiveness},
|
|
248
|
+
author = {Chen, Jessie Y. C. and Procci, Katelyn and Boyce, Michael and Wright, Julia and Garcia, Andre and Barnes, Michael},
|
|
249
|
+
year = {2018},
|
|
250
|
+
journal = {Theoretical Issues in Ergonomics Science},
|
|
251
|
+
volume = {19},
|
|
252
|
+
number = {3},
|
|
253
|
+
pages = {259--282},
|
|
254
|
+
doi = {10.1080/1463922X.2017.1315750},
|
|
255
|
+
abstract = {Chen et al. develop the Situation Awareness-based Agent Transparency (SAT) model, which extends Endsley's three-level SA framework to autonomous agents. The SAT model proposes that an agent should be transparent about three levels: what it is doing and why (Level 1 -- purpose and process), what it knows about the environment (Level 2 -- reasoning about constraints and predictions), and what it projects will happen (Level 3 -- projected outcomes and uncertainty). Experimental validation shows that SAT-compliant agents improve human-autonomy team performance by enabling better calibrated trust and more effective intervention. The hummbl-dev bus protocol implements SAT transparency. Level 1: STATUS and SITREP messages communicate what an agent is doing and why (``Completing lane 3: OAuth prewarn fix''). Level 2: PROPOSAL and BLOCKED messages communicate the agent's understanding of constraints (``Blocked on DNS resolution for push''). Level 3: MILESTONE and COMPLETE messages project outcomes (``Sprint A complete, all 5 lanes closed''). The guardrails audit process evaluates whether agent transparency is accurate --- Gemini's metric inflation violated Level 1 transparency by misrepresenting what it actually did, degrading team trust and coordination effectiveness.},
|
|
256
|
+
keywords = {agent transparency, human-robot teaming, situation awareness, trust, HUMMBL:P, HUMMBL:SY, HUMMBL:CO}
|
|
257
|
+
}
|
|
258
|
+
|
|
259
|
+
@book{Vicente1999CognitiveWorkAnalysis,
|
|
260
|
+
title = {Cognitive Work Analysis: Toward Safe, Productive, and Healthy Computer-Based Work},
|
|
261
|
+
author = {Vicente, Kim J.},
|
|
262
|
+
year = {1999},
|
|
263
|
+
publisher = {Lawrence Erlbaum Associates},
|
|
264
|
+
isbn = {978-0-8058-2396-2},
|
|
265
|
+
doi = {10.1201/b12457},
|
|
266
|
+
abstract = {Vicente develops cognitive work analysis (CWA) as a framework for analyzing and designing complex sociotechnical systems. CWA proceeds through five phases: work domain analysis (what constraints shape the work), control task analysis (what activities are required), strategies analysis (how activities can be carried out), social organization and cooperation analysis (how work is distributed), and worker competencies analysis (what skills are needed). Unlike task analysis approaches that prescribe specific procedures, CWA models the constraints within which workers must operate, supporting adaptation rather than scripting. The hummbl-dev architecture can be analyzed through CWA's five phases. Work domain analysis: the constraints are budget limits, security requirements, contract schemas, and API rate limits. Control task analysis: the briefing generation, agent coordination, and governance enforcement activities. Strategies analysis: the multiple paths to the same goal (direct API calls vs cached data vs mock fallbacks). Social organization: the role allocation across Claude, Gemini, Kimi, and human operators. Worker competencies: the capability profiles encoded in agent guardrails. CWA's emphasis on constraint-based design rather than procedure-based design explains why the hummbl-dev guardrails specify boundaries (what agents cannot do) rather than scripts (what agents must do).},
|
|
267
|
+
keywords = {cognitive work analysis, sociotechnical systems, constraint-based design, HUMMBL:DE, HUMMBL:SY, HUMMBL:CO}
|
|
268
|
+
}
|
|
269
|
+
|
|
270
|
+
@article{Helmreich1999CRM,
|
|
271
|
+
title = {On Error Management: Lessons from Aviation},
|
|
272
|
+
author = {Helmreich, Robert L. and Merritt, Ashleigh C. and Wilhelm, John A.},
|
|
273
|
+
year = {1999},
|
|
274
|
+
journal = {BMJ},
|
|
275
|
+
volume = {320},
|
|
276
|
+
number = {7237},
|
|
277
|
+
pages = {781--785},
|
|
278
|
+
doi = {10.1136/bmj.320.7237.781},
|
|
279
|
+
abstract = {Helmreich, Merritt, and Wilhelm summarize the evolution and impact of Crew Resource Management (CRM) in aviation --- a systematic approach to training flight crews in non-technical skills: communication, leadership, decision-making, situational awareness, and team management. CRM emerged from the finding that most aviation accidents result from failures of team coordination, not individual technical errors. The authors report that CRM training reduces error rates by improving crew communication, establishing shared mental models, and creating psychological safety for junior crew members to challenge senior officers' decisions. CRM provides the conceptual template for multi-agent governance in hummbl-dev. The agent guardrails system implements CRM's graduated authority structure: the human operator is the captain, Claude is the first officer with audit authority, and Gemini and Kimi are crew members with constrained roles. The bus protocol implements CRM's standardized communication --- structured message types (STATUS, PROPOSAL, BLOCKED) replace ambiguous free-form communication, reducing the communication failures that CRM was designed to address. The kill switch escalation levels implement CRM's graded emergency protocols. Most critically, CRM's emphasis on challenging unsafe actions is embodied in the audit gate: Claude can and does challenge Gemini's actions (metric inflation, scope violations), implementing the cross-check behavior that prevents drift into failure.},
|
|
280
|
+
keywords = {Crew Resource Management, aviation safety, team communication, error management, HUMMBL:CO, HUMMBL:SY, HUMMBL:IN}
|
|
281
|
+
}
|