promptfoo 0.121.7 → 0.121.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/src/{accounts-CmWzeD2d.cjs → accounts-BVz5gHLK.cjs} +4 -4
- package/dist/src/{accounts-DanM1wq_.js → accounts-BWjqwsrf.js} +4 -4
- package/dist/src/{accounts-CjFnOPmb.js → accounts-D6IBfEE0.js} +5 -5
- package/dist/src/{accounts-Ca7WIoPY.js → accounts-DAv_0iE7.js} +4 -4
- package/dist/src/{agentic-utils-DDEGRV9v.js → agentic-utils-BJKAkz2e.js} +2 -2
- package/dist/src/{agentic-utils-DvPWSUpb.cjs → agentic-utils-C-A92xhn.cjs} +2 -2
- package/dist/src/{agentic-utils-TxUEMPYS.js → agentic-utils-DmoS_S4B.js} +2 -2
- package/dist/src/{agentic-utils-CJ0j3fBi.js → agentic-utils-GdToujHu.js} +2 -2
- package/dist/src/{agents-CBgJvRkB.js → agents-2C8NN6I1.js} +4 -4
- package/dist/src/{agents-CYn2n3QP.js → agents-BMAiSR2o.js} +2 -2
- package/dist/src/{agents-LrHuQqr1.js → agents-C-PGaxwj.js} +4 -4
- package/dist/src/{agents-D-vDNFx4.js → agents-C98cz5pl.js} +4 -4
- package/dist/src/{agents-B4sRuXg3.cjs → agents-DB8Ub2Ld.cjs} +2 -2
- package/dist/src/{agents-B8q7h_ek.js → agents-Dwshy2H8.js} +2 -2
- package/dist/src/{agents-QGg76OF-.js → agents-mlKjx-cK.js} +2 -2
- package/dist/src/{agents-eHZ9nlgA.cjs → agents-n2ej-c4H.cjs} +4 -4
- package/dist/src/{aimlapi-D5HXzZ0s.js → aimlapi-Bi-laUlp.js} +6 -6
- package/dist/src/{aimlapi-T6HGNxNe.cjs → aimlapi-D0OFV4Vj.cjs} +6 -6
- package/dist/src/{aimlapi-eYv3a_DK.js → aimlapi-WyUK0wYy.js} +6 -6
- package/dist/src/{aimlapi-CJEbQ0o6.js → aimlapi-v-63ZjEI.js} +6 -6
- package/dist/src/app/assets/Report-sCXUfaWo.js +1 -0
- package/dist/src/app/assets/{index-BnT6P6sF.js → index-BopgkZEh.js} +2 -2
- package/dist/src/app/index.html +1 -1
- package/dist/src/{audio-DyiebVB3.js → audio-DnEIHWZR.js} +3 -3
- package/dist/src/{audio-BqnRvcWG.js → audio-heR0mu0n.js} +3 -3
- package/dist/src/{audio-CPMtV1yR.js → audio-wafFO1wn.js} +3 -3
- package/dist/src/{audio-FnxbEnSE.cjs → audio-x44tsxIo.cjs} +3 -3
- package/dist/src/{authoritativeMarkupInjection-F2gBw0lN.cjs → authoritativeMarkupInjection-2G3Be6oL.cjs} +6 -6
- package/dist/src/{authoritativeMarkupInjection-DyAXAsSr.js → authoritativeMarkupInjection-81PPynHR.js} +6 -6
- package/dist/src/{authoritativeMarkupInjection-QEQmFS83.js → authoritativeMarkupInjection-D9O70HPi.js} +6 -6
- package/dist/src/{authoritativeMarkupInjection-BZIywVjG.js → authoritativeMarkupInjection-PxSf3Rh8.js} +5 -5
- package/dist/src/{base-E9I8zXjz.js → base-0Gzzue9Z.js} +2 -2
- package/dist/src/{base-Co80MMCi.js → base-Bp4c52YZ.js} +2 -2
- package/dist/src/{base-CKLo890h.js → base-BuNn-YBX.js} +2 -2
- package/dist/src/{base-DGJW48uz.cjs → base-BzdS8tod.cjs} +2 -2
- package/dist/src/{bestOfN-_kTi8Bxe.js → bestOfN-BHiOjeaq.js} +7 -7
- package/dist/src/{bestOfN-BBsO41z4.js → bestOfN-CdkNPPbX.js} +6 -6
- package/dist/src/{bestOfN-B3wNzjSB.js → bestOfN-ClUSOhN0.js} +7 -7
- package/dist/src/{bestOfN-CAwmg5UL.cjs → bestOfN-DWwXEg1h.cjs} +7 -7
- package/dist/src/cache-BKYi3kAA.js +3 -0
- package/dist/src/{cache-DpPWrkTE.js → cache-BR77mdIR.js} +3 -3
- package/dist/src/{cache-roFAE0cI.js → cache-CrioYnaa.js} +2 -2
- package/dist/src/{cache-DIXbtkNO.js → cache-DdriHsNX.js} +2 -2
- package/dist/src/{cache-CPGUA4Yl.cjs → cache-h5MWOBZI.cjs} +2 -2
- package/dist/src/{chat-Dabu84Br.js → chat-BBEnnpQk.js} +6 -6
- package/dist/src/{chat-CUCorGiL.js → chat-BSos6PvZ.js} +6 -6
- package/dist/src/{chat-TP8Qifkh.js → chat-Bnt7ieO0.js} +2 -2
- package/dist/src/{chat-DxTDQ83C.cjs → chat-DSyYuTYT.cjs} +6 -6
- package/dist/src/{chat-DqUFcWI0.js → chat-DTdf-J5Q.js} +6 -6
- package/dist/src/{chat-DG1wG4w0.cjs → chat-Dq3DomYU.cjs} +2 -2
- package/dist/src/{chat-GmlolEwo.js → chat-g5QLeLOo.js} +2 -2
- package/dist/src/{chat-iwaM5UTQ.js → chat-mTTuUAYb.js} +2 -2
- package/dist/src/{claude-agent-sdk-x1XJ1-pU.js → claude-agent-sdk-BGUac_kS.js} +7 -5
- package/dist/src/{claude-agent-sdk-D5Jl0SDh.js → claude-agent-sdk-BP__YGfK.js} +7 -5
- package/dist/src/{claude-agent-sdk-BQNp_y-F.js → claude-agent-sdk-Ddgx5BIQ.js} +7 -5
- package/dist/src/{claude-agent-sdk-DH416NBD.cjs → claude-agent-sdk-n2XcEclh.cjs} +7 -5
- package/dist/src/cloud-DiWbUiVP.js +3 -0
- package/dist/src/{cloud-D3DiFqH6.js → cloud-DqF5N1aJ.js} +2 -2
- package/dist/src/{cloudflare-ai-B6NVI3ax.js → cloudflare-ai-BGamMotN.js} +4 -4
- package/dist/src/{cloudflare-ai-r4tbYmWU.js → cloudflare-ai-BwW8W-w7.js} +4 -4
- package/dist/src/{cloudflare-ai-CEAW-xQa.cjs → cloudflare-ai-DCRGnsyL.cjs} +4 -4
- package/dist/src/{cloudflare-ai-RFSojyXG.js → cloudflare-ai-sD26nP6V.js} +4 -4
- package/dist/src/{cloudflare-gateway-BaZ4insB.js → cloudflare-gateway-2lnOT4qM.js} +3 -3
- package/dist/src/{cloudflare-gateway-BCkLouto.js → cloudflare-gateway-B1-8KNCt.js} +3 -3
- package/dist/src/{cloudflare-gateway-TJMLBj6I.cjs → cloudflare-gateway-CCC1DFrC.cjs} +3 -3
- package/dist/src/{cloudflare-gateway-CF-Vb-2Z.js → cloudflare-gateway-DOghiU6r.js} +3 -3
- package/dist/src/{codex-app-server-DIXZ230V.js → codex-app-server-BWeWamEb.js} +17 -2
- package/dist/src/{codex-app-server-B8KHEiF4.js → codex-app-server-DyQB1P0p.js} +17 -2
- package/dist/src/{codex-app-server-CnrLBCeA.cjs → codex-app-server-R9u_G7W9.cjs} +17 -2
- package/dist/src/{codex-app-server-Dd22dC_N.js → codex-app-server-ZQRJSJjU.js} +17 -2
- package/dist/src/{codex-sdk-CmQABzV3.js → codex-sdk-B62H0fe7.js} +14 -3
- package/dist/src/{codex-sdk-CFF6gUyi.cjs → codex-sdk-BRPUvJG8.cjs} +14 -3
- package/dist/src/{codex-sdk-B6Wah8Pa.js → codex-sdk-Dio1zJBS.js} +14 -3
- package/dist/src/codex-sdk-DxukZs_K.js +3 -0
- package/dist/src/{codex-sdk-D2d54RL8.js → codex-sdk-iEmW1eS2.js} +14 -3
- package/dist/src/{cometapi-Bu9B8NUY.js → cometapi--hh7dESS.js} +7 -7
- package/dist/src/{cometapi-OBILPLlu.js → cometapi-C7yWNGqt.js} +7 -7
- package/dist/src/{cometapi-CtzNCHKu.js → cometapi-CSIi16a0.js} +7 -7
- package/dist/src/{cometapi-DHCDlQUI.cjs → cometapi-sZgBZtbU.cjs} +7 -7
- package/dist/src/{completion-CSYfl2cd.cjs → completion-CWtqdn3z.cjs} +4 -4
- package/dist/src/{completion-CO2e1_62.js → completion-DT8cxo9T.js} +4 -4
- package/dist/src/{completion-DZNxcyfG.js → completion-DUScduXp.js} +4 -4
- package/dist/src/{completion-sNvCLTAP.js → completion-D_2IOAoS.js} +4 -4
- package/dist/src/{crescendo-QiaSLW0d.js → crescendo-B41TwUHM.js} +39 -18
- package/dist/src/{crescendo-J1Xx4_zb.js → crescendo-Bfic7KC4.js} +41 -20
- package/dist/src/{crescendo-BXEJK_bi.cjs → crescendo-DXFB7rHP.cjs} +41 -20
- package/dist/src/{crescendo-CU_Y2i-m.js → crescendo-DvvYxMLA.js} +41 -20
- package/dist/src/{custom-BJfP00Bh.js → custom-BdzuqFTN.js} +10 -10
- package/dist/src/{custom-notggYVl.js → custom-Cf5Q6r-P.js} +8 -8
- package/dist/src/{custom-CZVn-1-r.js → custom-DLgufezC.js} +10 -10
- package/dist/src/{custom-Cqia7M0D.cjs → custom-LEXHCRe3.cjs} +10 -10
- package/dist/src/{docker-4D1eL6Gq.js → docker-BOSO_6hK.js} +5 -5
- package/dist/src/{docker-D06JUoe2.cjs → docker-D0h2vFrc.cjs} +5 -5
- package/dist/src/{docker-DdJQBxK9.js → docker-D2TWGyTP.js} +5 -5
- package/dist/src/{docker-BBv1WUDu.js → docker-Vj_4_cPg.js} +5 -5
- package/dist/src/{embedding-BbrwopfX.cjs → embedding-BQIApR18.cjs} +4 -4
- package/dist/src/{embedding-Bi3rxrZF.js → embedding-CStK0TV6.js} +4 -4
- package/dist/src/{embedding--UZVe4_7.js → embedding-CU78FMnw.js} +4 -4
- package/dist/src/{embedding-C251p1-8.js → embedding-CV8lmCnU.js} +4 -4
- package/dist/src/{eval-0VRANImH.js → eval-B3BaNBbO.js} +4 -4
- package/dist/src/{eval-DscR5iOM.js → eval-DfR9885C.js} +1 -1
- package/dist/src/evalResult-BtZSUgQv.js +3 -0
- package/dist/src/{evalResult-eUkJv9Ko.js → evalResult-CcSqNl_Y.js} +3 -3
- package/dist/src/{evalResult-CvtS8h8u.cjs → evalResult-DHXs-9TL.cjs} +3 -3
- package/dist/src/{evalResult-2RRJvFyB.js → evalResult-PGqEbasb.js} +3 -3
- package/dist/src/evaluator-B9LGbKI8.js +3 -0
- package/dist/src/{evaluator-DRoiYB2q.js → evaluator-n_dEb00o.js} +20 -20
- package/dist/src/{evaluatorHelpers-DuqFFfq7.js → evaluatorHelpers-CrRObe2z.js} +4 -4
- package/dist/src/{evaluatorHelpers-CRqTvSux.cjs → evaluatorHelpers-D06I9WFL.cjs} +4 -4
- package/dist/src/{evaluatorHelpers-BsYP_muT.js → evaluatorHelpers-D1_kwvyp.js} +4 -4
- package/dist/src/{extractor-CIW3iN-b.js → extractor-BVkZtk4R.js} +4 -4
- package/dist/src/{extractor-CxRtnaHl.js → extractor-D3Fv_Tdh.js} +4 -4
- package/dist/src/{extractor-BR7XAzAL.js → extractor-Jp53vs-6.js} +4 -4
- package/dist/src/{extractor-BdxEtt3J.cjs → extractor-bV_NOoaz.cjs} +4 -4
- package/dist/src/{fetch-BufrQtvR.js → fetch-BSSAcMxf.js} +2 -2
- package/dist/src/fetch-BodQTrMU.js +3 -0
- package/dist/src/{fetch-Dw4XZHjj.cjs → fetch-Cfm4EuOB.cjs} +2 -2
- package/dist/src/{fetch-DXUnXkVU.js → fetch-Cpf1U1nO.js} +3 -3
- package/dist/src/{fetch-It34O8Ur.js → fetch-Doks14zQ.js} +2 -2
- package/dist/src/{goat-Qgurm-NP.js → goat-Ba7Gznzq.js} +18 -17
- package/dist/src/{goat-Ckd3q3AY.js → goat-CJngS-WU.js} +18 -17
- package/dist/src/{goat-ghadEDdy.js → goat-CwsbfQeu.js} +16 -15
- package/dist/src/{goat-una6pZGP.cjs → goat-DOMbozoX.cjs} +18 -17
- package/dist/src/graders-B3D7kCcD.js +3 -0
- package/dist/src/{graders-BGP99PdK.js → graders-BQt1BaQe.js} +18 -18
- package/dist/src/{graders-ClrU2fnd.cjs → graders-CBQ2s6gz.cjs} +18 -18
- package/dist/src/{graders-C0nXU_ZP.js → graders-DaRU98zs.js} +18 -18
- package/dist/src/{graders-BX0f2tvS.js → graders-KXzjnIim.js} +18 -18
- package/dist/src/{hydra-DE4xWwyc.js → hydra-BU6GjYoQ.js} +35 -17
- package/dist/src/{hydra-BxdG4nkg.js → hydra-BmXHxlyl.js} +33 -15
- package/dist/src/{hydra-BSNZZm2M.js → hydra-CR0KyYDb.js} +35 -17
- package/dist/src/{hydra-DrJttnvw.cjs → hydra-RO9jBks7.cjs} +35 -17
- package/dist/src/{image-B_fPIwdg.js → image-BBmZdKO3.js} +3 -3
- package/dist/src/{image-QzmydkiG.js → image-B_PFG7IG.js} +3 -3
- package/dist/src/{image-BvUAW344.js → image-BtODOZjh.js} +4 -4
- package/dist/src/{image-Cvjwx1uY.js → image-CYuNJIqd.js} +4 -4
- package/dist/src/{image-DfVCGPbI.cjs → image-E00WFZkq.cjs} +3 -3
- package/dist/src/{image-X0oY4350.cjs → image-HK2Cfqb1.cjs} +4 -4
- package/dist/src/{image-BN-hjLL9.js → image-LGj8dTcr.js} +3 -3
- package/dist/src/{image-B4oBtu6J.js → image-YMKejC0r.js} +4 -4
- package/dist/src/index.cjs +112 -115
- package/dist/src/index.d.cts +13 -0
- package/dist/src/index.d.ts +13 -0
- package/dist/src/index.js +113 -116
- package/dist/src/{indirectWebPwn-DBQhOjoD.js → indirectWebPwn-B80dLlFC.js} +5 -5
- package/dist/src/{indirectWebPwn-uyWdHx04.js → indirectWebPwn-BMTXXznx.js} +4 -4
- package/dist/src/{indirectWebPwn-tNx9OZ35.js → indirectWebPwn-BZFPV7Q9.js} +4 -4
- package/dist/src/{indirectWebPwn-CfQJt3gk.cjs → indirectWebPwn-BaEQEOIO.cjs} +5 -5
- package/dist/src/{indirectWebPwn-OsXnKejv.js → indirectWebPwn-BzpyMnFS.js} +5 -5
- package/dist/src/{indirectWebPwn-CbjUG0rh.js → indirectWebPwn-CiWB-vVH.js} +4 -4
- package/dist/src/{indirectWebPwn-BJ22AbQa.cjs → indirectWebPwn-D7NA9Nsv.cjs} +4 -4
- package/dist/src/{indirectWebPwn-02ZIghCS.js → indirectWebPwn-o_bEFMjP.js} +5 -5
- package/dist/src/{iterative-DJQEQpG3.js → iterative-B-l0syBV.js} +25 -15
- package/dist/src/{iterative-DQBuWM-j.cjs → iterative-BACUeCCz.cjs} +25 -15
- package/dist/src/{iterative-FTS4Bz67.js → iterative-CVwoExo8.js} +25 -15
- package/dist/src/{iterative-CpU6i2As.js → iterative-QDrGSyss.js} +23 -13
- package/dist/src/{iterativeImage-BUABMVOA.js → iterativeImage-BQg2OwA6.js} +3 -3
- package/dist/src/{iterativeImage-Doz8mgxF.js → iterativeImage-Bwn0fM75.js} +4 -4
- package/dist/src/{iterativeImage-ByFWkxax.cjs → iterativeImage-CcgVyASo.cjs} +4 -4
- package/dist/src/{iterativeImage-BzUapOUi.js → iterativeImage-D_UbQXg4.js} +4 -4
- package/dist/src/{iterativeMeta-C7APE_P1.js → iterativeMeta-CIu-CHRS.js} +36 -16
- package/dist/src/{iterativeMeta-B3YiAOc8.js → iterativeMeta-CN8CNjFA.js} +36 -16
- package/dist/src/{iterativeMeta-DgoQ7bLh.js → iterativeMeta-DN6BTjpq.js} +34 -14
- package/dist/src/{iterativeMeta-CSS8M6Ds.cjs → iterativeMeta-DlqY3BsS.cjs} +36 -16
- package/dist/src/{iterativeTree-DvZ7GBwt.js → iterativeTree-CJ8a8G9T.js} +78 -28
- package/dist/src/{iterativeTree-B5zxBBSW.js → iterativeTree-DcuFXnjL.js} +78 -28
- package/dist/src/{iterativeTree-CNyIk0Yn.js → iterativeTree-FrDDYAN0.js} +76 -26
- package/dist/src/{iterativeTree-CPMF10ve.cjs → iterativeTree-LOgAi0nU.cjs} +78 -28
- package/dist/src/{knowledgeBase-DUh34xba.cjs → knowledgeBase-CdbcGBZF.cjs} +4 -4
- package/dist/src/{knowledgeBase-Bi_8sV-H.js → knowledgeBase-CjOXp6Lr.js} +4 -4
- package/dist/src/{knowledgeBase-BadkINlJ.js → knowledgeBase-DxAq4n4z.js} +4 -4
- package/dist/src/{knowledgeBase-CkMljjdg.js → knowledgeBase-o_wTLzrt.js} +4 -4
- package/dist/src/{litellm-BKBo0jpC.js → litellm-B2gHwya_.js} +4 -4
- package/dist/src/{litellm-CtAr7bKG.cjs → litellm-CPpdlO7n.cjs} +4 -4
- package/dist/src/{litellm-BXyn5kZK.js → litellm-CYfgxLrM.js} +4 -4
- package/dist/src/{litellm-CNcfbCfa.js → litellm-ojWBKU3C.js} +4 -4
- package/dist/src/{luma-ray-D3FUc2K3.cjs → luma-ray-BCCO9XXG.cjs} +3 -3
- package/dist/src/{luma-ray-BMX1iEB6.js → luma-ray-BPrdihAb.js} +3 -3
- package/dist/src/{luma-ray-CR5TSpp4.js → luma-ray-DP5N79lB.js} +3 -3
- package/dist/src/{luma-ray-OEMmS1RB.js → luma-ray-DTDyoAlM.js} +3 -3
- package/dist/src/main.js +116 -119
- package/dist/src/{memoryPoisoning-Dp-btinn.cjs → memoryPoisoning-B6N3us35.cjs} +6 -6
- package/dist/src/{memoryPoisoning-D8h9gXJF.js → memoryPoisoning-Bc_BK_k2.js} +6 -6
- package/dist/src/{memoryPoisoning-CM83NWYl.js → memoryPoisoning-D375zwSX.js} +6 -6
- package/dist/src/{memoryPoisoning-cLuCoTuJ.js → memoryPoisoning-DJA0YjJT.js} +6 -6
- package/dist/src/{messages-BabO-cX8.js → messages-Bg29Nbit.js} +7 -7
- package/dist/src/{messages-DBPir0TQ.cjs → messages-BrZEnHsV.cjs} +7 -7
- package/dist/src/{messages-vsE_-Lv0.js → messages-CBulRaud.js} +7 -7
- package/dist/src/{messages-DGUlSNU7.js → messages-K9A8RxBM.js} +7 -7
- package/dist/src/{mischievousUser-0l8GD7Dp.js → mischievousUser-BDLwSGN0.js} +5 -5
- package/dist/src/{mischievousUser-frFYKxu6.js → mischievousUser-Blx-OtT3.js} +5 -5
- package/dist/src/{mischievousUser-BUOP9W5r.js → mischievousUser-CHuTTvBg.js} +5 -5
- package/dist/src/{mischievousUser-olGgHIVR.cjs → mischievousUser-CSUrH3fq.cjs} +5 -5
- package/dist/src/{modelslab-Cogmu4mG.js → modelslab-BjEk7yCP.js} +4 -4
- package/dist/src/{modelslab-EyDczZ5A.js → modelslab-CBCrdIBc.js} +4 -4
- package/dist/src/{modelslab-Dzst7VTU.js → modelslab-CrGpXuhv.js} +4 -4
- package/dist/src/{modelslab-CNV5bMSk.cjs → modelslab-Cvh0klQx.cjs} +4 -4
- package/dist/src/{nova-reel-BGPNBOMS.js → nova-reel-CUDDZcSA.js} +3 -3
- package/dist/src/{nova-reel-B_5NKFu1.js → nova-reel-CyDESu5J.js} +3 -3
- package/dist/src/{nova-reel-CjJRxI1X.cjs → nova-reel-DH_Ksu6X.cjs} +3 -3
- package/dist/src/{nova-reel-C4eUJGse.js → nova-reel-YQAqUYJY.js} +3 -3
- package/dist/src/{nova-sonic-ChPlh5na.js → nova-sonic-BVFFB7JZ.js} +2 -2
- package/dist/src/{nova-sonic-DuOG9Aun.cjs → nova-sonic-Bg3cxMMu.cjs} +2 -2
- package/dist/src/{nova-sonic-CrV0iaY_.js → nova-sonic-BhmnRGyh.js} +2 -2
- package/dist/src/{nova-sonic-BNGmgfFz.js → nova-sonic-DxmK95c1.js} +2 -2
- package/dist/src/{openclaw-Dphc01BY.cjs → openclaw-CHQaZi_-.cjs} +6 -6
- package/dist/src/{openclaw-zIJAsz3P.js → openclaw-CWOm2eOr.js} +6 -6
- package/dist/src/{openclaw-CF7fMido.js → openclaw-Cdk9JKfY.js} +6 -6
- package/dist/src/{openclaw-BIHlu_36.js → openclaw-DhF8rUpI.js} +6 -6
- package/dist/src/{opencode-sdk-B3vlPLsp.js → opencode-sdk-BRjiPV-g.js} +2 -2
- package/dist/src/{opencode-sdk-DoY6GbWw.cjs → opencode-sdk-CPFMw0ed.cjs} +2 -2
- package/dist/src/{opencode-sdk-sRKYHGoI.js → opencode-sdk-CaSOCsBA.js} +2 -2
- package/dist/src/{opencode-sdk-D05JSgMQ.js → opencode-sdk-CqkyG8De.js} +2 -2
- package/dist/src/{promptfoo-Rjp-MeBb.js → promptfoo-BU4_0J85.js} +64 -7
- package/dist/src/{promptfoo-BDrfT30-.js → promptfoo-CReYAtfb.js} +64 -7
- package/dist/src/{promptfoo-b-baRMj-.cjs → promptfoo-ClChwT74.cjs} +93 -6
- package/dist/src/{promptfoo-Cm4hiy1Y.js → promptfoo-CqEpj6Sr.js} +64 -7
- package/dist/src/{providers-B9KzWxAX.js → providers-B7TyByfj.js} +94 -50
- package/dist/src/{providers-DVYRZP4E.js → providers-BGc7tDtQ.js} +93 -49
- package/dist/src/{providers-BYAn82cf.js → providers-CSOp-bCm.js} +1 -1
- package/dist/src/{providers-BDVVIQM6.cjs → providers-V6RBuieY.cjs} +93 -49
- package/dist/src/{providers-BCCz6_IX.js → providers-iH3Sw1yo.js} +93 -49
- package/dist/src/{quiverai-BvIhI_0l.js → quiverai-58BtRRet.js} +3 -3
- package/dist/src/{quiverai-Cv7rJKDz.js → quiverai-C1dYu5MW.js} +3 -3
- package/dist/src/{quiverai-CdTWPe-A.js → quiverai-CNMIpZQg.js} +3 -3
- package/dist/src/{quiverai-BAp6iTZD.cjs → quiverai-fmSfU43k.cjs} +3 -3
- package/dist/src/{registry-KCVF1CFC.cjs → registry-6Jw6ebor.cjs} +14 -14
- package/dist/src/{registry-BUJrgjwv.js → registry-BTGk2ZkB.js} +14 -14
- package/dist/src/{registry-DXm1t_x0.js → registry-BTNqmP5o.js} +14 -14
- package/dist/src/{registry-Dp5EqoXc.js → registry-NGnOG2xa.js} +14 -14
- package/dist/src/{remoteGeneration-COpWcmWd.js → remoteGeneration--D6WjzUm.js} +4 -4
- package/dist/src/{remoteGeneration-DS9N3pgB.cjs → remoteGeneration-BpIYlb_O.cjs} +4 -4
- package/dist/src/{remoteGeneration-DsaSwmG2.js → remoteGeneration-CJC3E0aW.js} +4 -4
- package/dist/src/{remoteGeneration-B1_XsKXU.js → remoteGeneration-D6UjE2JT.js} +4 -4
- package/dist/src/{responses-B6ktc3Ra.js → responses-5Gf5HNOi.js} +9 -5
- package/dist/src/{responses-URRzV8qE.js → responses-BVi7xIdv.js} +9 -5
- package/dist/src/{responses-1UFFF9N_.cjs → responses-CUARGrhY.cjs} +9 -5
- package/dist/src/{responses-B3W2JvOQ.js → responses-CrmWv6iz.js} +9 -5
- package/dist/src/{sagemaker-DzffAqo_.cjs → sagemaker-BeVTKfrv.cjs} +9 -9
- package/dist/src/{sagemaker-yr1QKeBs.js → sagemaker-BwbV5U7_.js} +9 -9
- package/dist/src/{sagemaker-vhtSV7JI.js → sagemaker-ClAZ6Qwc.js} +9 -9
- package/dist/src/{sagemaker-CujrzP1a.js → sagemaker-DY2qrOpq.js} +9 -9
- package/dist/src/{scanner-DS0109SS.js → scanner-BS-iFIp3.js} +5 -5
- package/dist/src/server/index.js +111 -114
- package/dist/src/{server-B8rqV126.cjs → server-BHOEL8p8.cjs} +3 -3
- package/dist/src/{server-CMJD10J4.js → server-CbiJppij.js} +3 -3
- package/dist/src/server-D18AAlAc.js +3 -0
- package/dist/src/{server-DhMHosWj.js → server-DLYjSFm2.js} +5 -5
- package/dist/src/{server-Ddp8GNMp.js → server-JQYD_Nws.js} +5 -5
- package/dist/src/{shared-7pmVZLNO.js → shared-CRq0gGVf.js} +8 -8
- package/dist/src/{shared-D6IjElRI.js → shared-CSIGeGLl.js} +8 -8
- package/dist/src/{shared-9WHQ1oNE.js → shared-DNvim54U.js} +7 -7
- package/dist/src/{shared-WkgnDkcg.cjs → shared-aHWko3P1.cjs} +8 -8
- package/dist/src/{simulatedUser-U_qAHnuB.js → simulatedUser-C7sOFSF6.js} +5 -5
- package/dist/src/{simulatedUser-C9aQObBI.js → simulatedUser-DH_7RzEQ.js} +5 -5
- package/dist/src/{simulatedUser-p3tACcmw.js → simulatedUser-lgMMmniD.js} +5 -5
- package/dist/src/{simulatedUser-Cu601Dd4.cjs → simulatedUser-mnCUS9Bm.cjs} +5 -5
- package/dist/src/{storage-QdU-SmvD.js → storage-95htjpLs.js} +3 -3
- package/dist/src/{storage-CA-v9V2v.cjs → storage-A4WnAeN3.cjs} +3 -3
- package/dist/src/{storage-CD-GWAdx.js → storage-B2Ql_oq4.js} +3 -3
- package/dist/src/{storage-BU4qcnOb.js → storage-EKVWZBNY.js} +4 -4
- package/dist/src/{strategies-DRJjGTIY.js → strategies-CBI1brSy.js} +10 -10
- package/dist/src/{strategies-7CS3Alao.cjs → strategies-CCcnEbFO.cjs} +9 -9
- package/dist/src/{strategies-CiSeroPH.js → strategies-CD1gHeeQ.js} +9 -9
- package/dist/src/telemetry-BUm_krVX.js +3 -0
- package/dist/src/{telemetry-DmXYcJNV.js → telemetry-BbpmrenM.js} +4 -4
- package/dist/src/{telemetry-DwX9XUN5.js → telemetry-C4bX-6Sr.js} +4 -4
- package/dist/src/{telemetry-CJ7FnCsc.cjs → telemetry-C_ImlCOk.cjs} +4 -4
- package/dist/src/{telemetry-00ezXr_t.js → telemetry-DOE567Wj.js} +4 -4
- package/dist/src/{tracingOptions-ji2OuXbT.js → tracingOptions-BOP1FsRt.js} +2 -2
- package/dist/src/{tracingOptions-Chi74lOD.js → tracingOptions-BvmDa_jH.js} +2 -2
- package/dist/src/{tracingOptions-DrbSFaKy.cjs → tracingOptions-DFBoE8O0.cjs} +2 -2
- package/dist/src/{tracingOptions-BnwKCkSB.js → tracingOptions-xhjOg2b1.js} +2 -2
- package/dist/src/{transcription-Dkd22_4K.js → transcription-BOXDoehT.js} +4 -4
- package/dist/src/{transcription-CfU5loSq.js → transcription-CpVdKc4P.js} +4 -4
- package/dist/src/{transcription-mzuf18Mq.cjs → transcription-D8kkPXg_.cjs} +4 -4
- package/dist/src/{transcription-B8uIgCYX.js → transcription-Z94eV9LR.js} +4 -4
- package/dist/src/{transform-BIMynQsA.js → transform-BufxPIQL.js} +3 -3
- package/dist/src/{transform-DhNkAUs8.cjs → transform-DJkt81VY.cjs} +3 -3
- package/dist/src/{transform-EtD4jAWi.js → transform-DtTfiGoh.js} +3 -3
- package/dist/src/{transform-DmvYBRll.js → transform-Wp6s_5QE.js} +3 -3
- package/dist/src/{util-IYzs5Y04.cjs → util-BHCAeuXx.cjs} +3 -3
- package/dist/src/{util--WMgw7wM.js → util-CMrHV35u.js} +3 -3
- package/dist/src/{util-SPsvFONY.cjs → util-COnzevXE.cjs} +3 -3
- package/dist/src/{util-LKTmNsMQ.js → util-CYev3d-r.js} +16 -3
- package/dist/src/{util-Df8YMvS1.js → util-DGqkTb2-.js} +4 -4
- package/dist/src/{util-CN8om2rz.cjs → util-DNtUsus_.cjs} +4 -4
- package/dist/src/{util-Bx677_k2.js → util-DRfqa4xz.js} +3 -3
- package/dist/src/{util-DiQ3QvBB.js → util-DTq3jq2z.js} +3 -3
- package/dist/src/{util-5WnCSb0h.js → util-DeY58psG.js} +16 -3
- package/dist/src/{util-DNl96nNs.js → util-DpV6KT5i.js} +4 -4
- package/dist/src/{util-I-Rf-KaD.js → util-DwNJzqOV.js} +3 -3
- package/dist/src/{util-kDURhgJW.js → util-ETfU_sS9.js} +4 -4
- package/dist/src/{util-BSIuSLVK.cjs → util-NYQvo1C7.cjs} +16 -3
- package/dist/src/{util-CoQWM76y.js → util-X4KQgyVD.js} +3 -3
- package/dist/src/{util-DURocbYR.js → util-jZRrXe1P.js} +3 -3
- package/dist/src/{util-efByNxcr.js → util-o2Qg5rZv.js} +16 -3
- package/dist/src/{version-BK20a4sw.js → version-CHR-EFec.js} +2 -2
- package/dist/src/{version-eRkNuGv8.js → version-F0YDgb7J.js} +2 -2
- package/dist/src/{version-BWCSaByA.cjs → version-VzUqOBZk.cjs} +2 -2
- package/dist/src/{version-lpHV_53E.js → version-qVEN5qCm.js} +2 -2
- package/dist/tsconfig.tsbuildinfo +1 -1
- package/package.json +5 -5
- package/dist/src/app/assets/Report-BNHJKN35.js +0 -1
- package/dist/src/cache-Cf7b4pWE.js +0 -3
- package/dist/src/cloud-p96PA4MH.js +0 -3
- package/dist/src/codex-sdk-BGjVAk23.js +0 -3
- package/dist/src/evalResult-DqzsS6_W.js +0 -3
- package/dist/src/evaluator-DNdJF1Gv.js +0 -3
- package/dist/src/fetch-_YgGd2qv.js +0 -3
- package/dist/src/graders-BDT7dif6.js +0 -3
- package/dist/src/server-BaLytskk.js +0 -3
- package/dist/src/telemetry-ByPqDcKC.js +0 -3
|
@@ -1,16 +1,16 @@
|
|
|
1
1
|
import { a as logger, m as extractFirstJsonObject } from "./logger-Ct2S6Yx-.js";
|
|
2
2
|
import { t as invariant } from "./invariant-Ddh24eXh.js";
|
|
3
|
-
import { l as sleep } from "./fetch-
|
|
4
|
-
import { o as isLoggedIntoCloud } from "./accounts-
|
|
3
|
+
import { l as sleep } from "./fetch-Doks14zQ.js";
|
|
4
|
+
import { o as isLoggedIntoCloud } from "./accounts-DAv_0iE7.js";
|
|
5
5
|
import { o as getNunjucksEngine } from "./render-DFfDeYUK.js";
|
|
6
|
-
import { l as shouldGenerateRemote } from "./remoteGeneration-
|
|
6
|
+
import { l as shouldGenerateRemote } from "./remoteGeneration-CJC3E0aW.js";
|
|
7
7
|
import { a as createEmptyTokenUsage, n as accumulateResponseTokenUsage } from "./tokenUsageUtils-CmnQ0G2m.js";
|
|
8
|
-
import { a as extractPromptFromTags, i as extractMaterializedVariablesFromJsonWithMetadata, o as getSessionId } from "./util-
|
|
9
|
-
import { t as PromptfooChatCompletionProvider } from "./promptfoo-
|
|
10
|
-
import { c as getTargetResponse, f as redteamProviderManager, i as externalizeResponseForRedteamHistory, m as TokenUsageTracker, n as checkPenalizedPhrases, o as getGraderAssertionValue, r as createIterationContext, t as buildGraderResultAssertion } from "./shared-
|
|
11
|
-
import { n as checkExfilTracking } from "./indirectWebPwn-
|
|
12
|
-
import { n as renderPrompt } from "./evaluatorHelpers-
|
|
13
|
-
import { t as Strategies } from "./strategies-
|
|
8
|
+
import { a as extractPromptFromTags, i as extractMaterializedVariablesFromJsonWithMetadata, o as getSessionId } from "./util-DpV6KT5i.js";
|
|
9
|
+
import { a as assertRemoteMaterializationHandled, o as buildRemoteMaterializationContextVars, s as buildRemoteMaterializedInputVariables, t as PromptfooChatCompletionProvider } from "./promptfoo-CqEpj6Sr.js";
|
|
10
|
+
import { c as getTargetResponse, f as redteamProviderManager, i as externalizeResponseForRedteamHistory, m as TokenUsageTracker, n as checkPenalizedPhrases, o as getGraderAssertionValue, r as createIterationContext, t as buildGraderResultAssertion } from "./shared-CSIGeGLl.js";
|
|
11
|
+
import { n as checkExfilTracking } from "./indirectWebPwn-CiWB-vVH.js";
|
|
12
|
+
import { n as renderPrompt } from "./evaluatorHelpers-CrRObe2z.js";
|
|
13
|
+
import { t as Strategies } from "./strategies-CD1gHeeQ.js";
|
|
14
14
|
import { t as applyRuntimeTransforms } from "./runtimeTransform-DigbjU1r.js";
|
|
15
15
|
import { n as CLOUD_ATTACKER_SYSTEM_PROMPT, r as JUDGE_SYSTEM_PROMPT, t as ATTACKER_SYSTEM_PROMPT } from "./prompts-DHhQsANy.js";
|
|
16
16
|
import dedent from "dedent";
|
|
@@ -155,14 +155,20 @@ async function evaluateResponse(provider, judgeSystemPrompt, targetResponse, pre
|
|
|
155
155
|
* @param redteamHistory - The conversation history of the red team.
|
|
156
156
|
* @returns A promise that resolves to an object containing the improvement and new prompt.
|
|
157
157
|
*/
|
|
158
|
-
async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
158
|
+
async function getNewPrompt(redteamProvider, redteamHistory, materializationContext) {
|
|
159
159
|
const redteamBody = JSON.stringify(redteamHistory);
|
|
160
160
|
const redteamResp = await redteamProvider.callApi(redteamBody, {
|
|
161
161
|
prompt: {
|
|
162
162
|
raw: redteamBody,
|
|
163
163
|
label: "history"
|
|
164
164
|
},
|
|
165
|
-
vars: {
|
|
165
|
+
vars: materializationContext ? buildRemoteMaterializationContextVars({
|
|
166
|
+
injectVar: void 0,
|
|
167
|
+
inputs: materializationContext.inputs,
|
|
168
|
+
materializationIndex: materializationContext.materializationIndex,
|
|
169
|
+
pluginId: materializationContext.pluginId,
|
|
170
|
+
purpose: materializationContext.purpose
|
|
171
|
+
}) : {}
|
|
166
172
|
});
|
|
167
173
|
if (redteamProvider.delay) {
|
|
168
174
|
logger.debug(`[IterativeTree] Sleeping for ${redteamProvider.delay}ms`);
|
|
@@ -185,6 +191,9 @@ async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
|
185
191
|
logger.info(`[IterativeTree] Failed to parse attacker response as JSON (primary and fallback). Skipping this turn. primary=${String(primaryErr)} fallback=${String(fallbackErr)} outputPreview="${redteamResp.output.slice(0, 200)}"`);
|
|
186
192
|
return {
|
|
187
193
|
improvement: "parse failure – skipping turn",
|
|
194
|
+
inputMaterialization: redteamResp.inputMaterialization,
|
|
195
|
+
materializationHandled: redteamResp.materializationHandled,
|
|
196
|
+
materializedVars: redteamResp.materializedVars,
|
|
188
197
|
prompt: "",
|
|
189
198
|
tokenUsage: redteamResp.tokenUsage
|
|
190
199
|
};
|
|
@@ -193,6 +202,9 @@ async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
|
193
202
|
else retObj = redteamResp.output;
|
|
194
203
|
return {
|
|
195
204
|
...retObj,
|
|
205
|
+
inputMaterialization: redteamResp.inputMaterialization,
|
|
206
|
+
materializationHandled: redteamResp.materializationHandled,
|
|
207
|
+
materializedVars: redteamResp.materializedVars,
|
|
196
208
|
tokenUsage: redteamResp.tokenUsage
|
|
197
209
|
};
|
|
198
210
|
}
|
|
@@ -231,13 +243,16 @@ function updateRedteamHistory(targetResponse, goal, score, containsPenalizedPhra
|
|
|
231
243
|
* @param id - Optional custom UUID for the node. If not provided, a new UUID will be generated.
|
|
232
244
|
* @returns A new TreeNode object.
|
|
233
245
|
*/
|
|
234
|
-
function createTreeNode(prompt, score, depth, id) {
|
|
246
|
+
function createTreeNode(prompt, score, depth, id, options) {
|
|
235
247
|
return {
|
|
236
248
|
id: id || crypto.randomUUID(),
|
|
237
249
|
prompt,
|
|
238
250
|
score,
|
|
239
251
|
children: [],
|
|
240
|
-
depth
|
|
252
|
+
depth,
|
|
253
|
+
inputMaterialization: options?.inputMaterialization,
|
|
254
|
+
materializationHandled: options?.materializationHandled,
|
|
255
|
+
materializedVars: options?.materializedVars
|
|
241
256
|
};
|
|
242
257
|
}
|
|
243
258
|
/**
|
|
@@ -314,10 +329,20 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
314
329
|
loggerTag: "[IterativeTree]"
|
|
315
330
|
});
|
|
316
331
|
const iterationVars = iterationContext?.vars || {};
|
|
317
|
-
let { improvement, prompt: newInjectVar } = await getNewPrompt(redteamProvider, [...redteamHistory, {
|
|
332
|
+
let { improvement, inputMaterialization, materializationHandled, materializedVars, prompt: newInjectVar } = await getNewPrompt(redteamProvider, [...redteamHistory, {
|
|
318
333
|
role: "assistant",
|
|
319
334
|
content: node.prompt
|
|
320
|
-
}])
|
|
335
|
+
}], shouldGenerateRemote() ? {
|
|
336
|
+
inputs,
|
|
337
|
+
materializationIndex: attempts,
|
|
338
|
+
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
339
|
+
purpose: test?.metadata?.purpose
|
|
340
|
+
} : void 0);
|
|
341
|
+
if (inputs && shouldGenerateRemote()) assertRemoteMaterializationHandled({
|
|
342
|
+
inputMaterialization,
|
|
343
|
+
materializationHandled,
|
|
344
|
+
materializedVars
|
|
345
|
+
}, "Iterative Tree multi-input generation");
|
|
321
346
|
attempts++;
|
|
322
347
|
const extractedPrompt = extractPromptFromTags(newInjectVar);
|
|
323
348
|
if (extractedPrompt) newInjectVar = extractedPrompt;
|
|
@@ -360,14 +385,22 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
360
385
|
...iterationVars,
|
|
361
386
|
[injectVar]: finalInjectVar
|
|
362
387
|
};
|
|
363
|
-
if (inputs && Object.keys(inputs).length > 0) try {
|
|
364
|
-
const
|
|
388
|
+
if (inputs && Object.keys(inputs).length > 0) if (shouldGenerateRemote()) try {
|
|
389
|
+
const parsed = JSON.parse(newInjectVar);
|
|
390
|
+
Object.assign(updatedVars, buildRemoteMaterializedInputVariables({
|
|
391
|
+
inputMaterialization,
|
|
392
|
+
materializationHandled,
|
|
393
|
+
materializedVars
|
|
394
|
+
}, parsed, inputs).vars);
|
|
395
|
+
} catch {}
|
|
396
|
+
else try {
|
|
397
|
+
const { vars: localMaterializedVars } = await extractMaterializedVariablesFromJsonWithMetadata(JSON.parse(newInjectVar), inputs, {
|
|
365
398
|
materializationIndex: attempts - 1,
|
|
366
399
|
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
367
400
|
provider: redteamProvider,
|
|
368
401
|
purpose: test?.metadata?.purpose
|
|
369
402
|
});
|
|
370
|
-
Object.assign(updatedVars,
|
|
403
|
+
Object.assign(updatedVars, localMaterializedVars);
|
|
371
404
|
} catch {}
|
|
372
405
|
const targetPrompt = await renderPrompt(prompt, updatedVars, filters, targetProvider, [injectVar]);
|
|
373
406
|
let targetResponse = await getTargetResponse(targetProvider, targetPrompt, iterationContext, options);
|
|
@@ -404,11 +437,18 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
404
437
|
const containsPenalizedPhrase = checkPenalizedPhrases(targetResponse.output);
|
|
405
438
|
const { score, explanation } = await evaluateResponse(gradingProvider, judgeSystemPrompt, targetResponse.output, bestResponse, containsPenalizedPhrase);
|
|
406
439
|
logger.debug(`[Depth ${depth}, Attempt ${attempts}] Evaluation: score=${score}, penalized=${containsPenalizedPhrase}. Max score so far: ${maxScore}`);
|
|
407
|
-
nextLevelNodes.push(createTreeNode(newInjectVar, score, depth + 1
|
|
440
|
+
nextLevelNodes.push(createTreeNode(newInjectVar, score, depth + 1, void 0, {
|
|
441
|
+
inputMaterialization,
|
|
442
|
+
materializationHandled,
|
|
443
|
+
materializedVars
|
|
444
|
+
}));
|
|
408
445
|
if (score > maxScore) {
|
|
409
446
|
maxScore = score;
|
|
410
447
|
bestResponse = targetResponse.output;
|
|
411
448
|
bestNode.prompt = newInjectVar;
|
|
449
|
+
bestNode.inputMaterialization = inputMaterialization;
|
|
450
|
+
bestNode.materializationHandled = materializationHandled;
|
|
451
|
+
bestNode.materializedVars = materializedVars;
|
|
412
452
|
bestFinalAttackPrompt = finalInjectVar;
|
|
413
453
|
bestTransformDisplayVars = lastTransformDisplayVars;
|
|
414
454
|
logger.debug(`[Depth ${depth}, Attempt ${attempts}] New max score: ${maxScore}`);
|
|
@@ -420,7 +460,7 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
420
460
|
noImprovementCount++;
|
|
421
461
|
if (noImprovementCount % 5 === 0) logger.debug(`[Depth ${depth}, Attempt ${attempts}] No improvement for ${noImprovementCount} consecutive iterations. Max score: ${maxScore}`);
|
|
422
462
|
}
|
|
423
|
-
const { getGraderById } = await import("./graders-
|
|
463
|
+
const { getGraderById } = await import("./graders-KXzjnIim.js").then((n) => n.r);
|
|
424
464
|
let graderPassed;
|
|
425
465
|
let assertToUse = test?.assert?.find((a) => a.type && a.type.includes(test.metadata?.pluginId));
|
|
426
466
|
if (!assertToUse) assertToUse = test?.assert?.find((a) => a.type);
|
|
@@ -619,13 +659,23 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
619
659
|
[injectVar]: bestPrompt
|
|
620
660
|
};
|
|
621
661
|
if (inputs && Object.keys(inputs).length > 0) try {
|
|
622
|
-
const
|
|
623
|
-
|
|
624
|
-
|
|
625
|
-
|
|
626
|
-
|
|
627
|
-
|
|
628
|
-
|
|
662
|
+
const parsed = JSON.parse(bestPrompt);
|
|
663
|
+
if (shouldGenerateRemote()) {
|
|
664
|
+
const remoteBestNodeMaterialization = {
|
|
665
|
+
inputMaterialization: bestNode.inputMaterialization,
|
|
666
|
+
materializationHandled: bestNode.materializationHandled,
|
|
667
|
+
materializedVars: bestNode.materializedVars
|
|
668
|
+
};
|
|
669
|
+
if (remoteBestNodeMaterialization.materializationHandled) Object.assign(finalUpdatedVars, buildRemoteMaterializedInputVariables(remoteBestNodeMaterialization, parsed, inputs).vars);
|
|
670
|
+
} else {
|
|
671
|
+
const { vars: materializedVars } = await extractMaterializedVariablesFromJsonWithMetadata(parsed, inputs, {
|
|
672
|
+
materializationIndex: attempts,
|
|
673
|
+
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
674
|
+
provider: redteamProvider,
|
|
675
|
+
purpose: test?.metadata?.purpose
|
|
676
|
+
});
|
|
677
|
+
Object.assign(finalUpdatedVars, materializedVars);
|
|
678
|
+
}
|
|
629
679
|
} catch {}
|
|
630
680
|
const finalTargetPrompt = await renderPrompt(prompt, finalUpdatedVars, filters, targetProvider, [injectVar]);
|
|
631
681
|
const finalTargetResponse = await getTargetResponse(targetProvider, finalTargetPrompt, context, options);
|
|
@@ -766,4 +816,4 @@ var RedteamIterativeTreeProvider = class {
|
|
|
766
816
|
//#endregion
|
|
767
817
|
export { RedteamIterativeTreeProvider as default };
|
|
768
818
|
|
|
769
|
-
//# sourceMappingURL=iterativeTree-
|
|
819
|
+
//# sourceMappingURL=iterativeTree-DcuFXnjL.js.map
|
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
import { a as logger, m as extractFirstJsonObject } from "./logger-KD8JjCRJ.js";
|
|
2
|
-
import { m as sleep } from "./fetch-
|
|
2
|
+
import { m as sleep } from "./fetch-BSSAcMxf.js";
|
|
3
3
|
import { t as invariant } from "./invariant-DIYf9sP1.js";
|
|
4
|
-
import { c as isLoggedIntoCloud } from "./accounts-
|
|
4
|
+
import { c as isLoggedIntoCloud } from "./accounts-BWjqwsrf.js";
|
|
5
5
|
import { o as getNunjucksEngine } from "./render-_6ur1fhE.js";
|
|
6
|
-
import { l as shouldGenerateRemote } from "./remoteGeneration
|
|
6
|
+
import { l as shouldGenerateRemote } from "./remoteGeneration--D6WjzUm.js";
|
|
7
7
|
import { a as createEmptyTokenUsage, n as accumulateResponseTokenUsage } from "./tokenUsageUtils-BjVkdk18.js";
|
|
8
|
-
import { a as extractPromptFromTags, i as extractMaterializedVariablesFromJsonWithMetadata, o as getSessionId } from "./util-
|
|
9
|
-
import { t as PromptfooChatCompletionProvider } from "./promptfoo-
|
|
10
|
-
import { c as getTargetResponse, f as redteamProviderManager, i as externalizeResponseForRedteamHistory, m as TokenUsageTracker, n as checkPenalizedPhrases, o as getGraderAssertionValue, r as createIterationContext, t as buildGraderResultAssertion } from "./shared-
|
|
11
|
-
import { n as checkExfilTracking } from "./indirectWebPwn-
|
|
8
|
+
import { a as extractPromptFromTags, i as extractMaterializedVariablesFromJsonWithMetadata, o as getSessionId } from "./util-DGqkTb2-.js";
|
|
9
|
+
import { a as assertRemoteMaterializationHandled, o as buildRemoteMaterializationContextVars, s as buildRemoteMaterializedInputVariables, t as PromptfooChatCompletionProvider } from "./promptfoo-CReYAtfb.js";
|
|
10
|
+
import { c as getTargetResponse, f as redteamProviderManager, i as externalizeResponseForRedteamHistory, m as TokenUsageTracker, n as checkPenalizedPhrases, o as getGraderAssertionValue, r as createIterationContext, t as buildGraderResultAssertion } from "./shared-CRq0gGVf.js";
|
|
11
|
+
import { n as checkExfilTracking } from "./indirectWebPwn-BZFPV7Q9.js";
|
|
12
12
|
import { n as renderPrompt, t as Strategies } from "./server/index.js";
|
|
13
13
|
import { t as applyRuntimeTransforms } from "./runtimeTransform-BJOpL9Yc.js";
|
|
14
14
|
import { n as CLOUD_ATTACKER_SYSTEM_PROMPT, r as JUDGE_SYSTEM_PROMPT, t as ATTACKER_SYSTEM_PROMPT } from "./prompts-BYMtqPCw.js";
|
|
@@ -154,14 +154,20 @@ async function evaluateResponse(provider, judgeSystemPrompt, targetResponse, pre
|
|
|
154
154
|
* @param redteamHistory - The conversation history of the red team.
|
|
155
155
|
* @returns A promise that resolves to an object containing the improvement and new prompt.
|
|
156
156
|
*/
|
|
157
|
-
async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
157
|
+
async function getNewPrompt(redteamProvider, redteamHistory, materializationContext) {
|
|
158
158
|
const redteamBody = JSON.stringify(redteamHistory);
|
|
159
159
|
const redteamResp = await redteamProvider.callApi(redteamBody, {
|
|
160
160
|
prompt: {
|
|
161
161
|
raw: redteamBody,
|
|
162
162
|
label: "history"
|
|
163
163
|
},
|
|
164
|
-
vars: {
|
|
164
|
+
vars: materializationContext ? buildRemoteMaterializationContextVars({
|
|
165
|
+
injectVar: void 0,
|
|
166
|
+
inputs: materializationContext.inputs,
|
|
167
|
+
materializationIndex: materializationContext.materializationIndex,
|
|
168
|
+
pluginId: materializationContext.pluginId,
|
|
169
|
+
purpose: materializationContext.purpose
|
|
170
|
+
}) : {}
|
|
165
171
|
});
|
|
166
172
|
if (redteamProvider.delay) {
|
|
167
173
|
logger.debug(`[IterativeTree] Sleeping for ${redteamProvider.delay}ms`);
|
|
@@ -184,6 +190,9 @@ async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
|
184
190
|
logger.info(`[IterativeTree] Failed to parse attacker response as JSON (primary and fallback). Skipping this turn. primary=${String(primaryErr)} fallback=${String(fallbackErr)} outputPreview="${redteamResp.output.slice(0, 200)}"`);
|
|
185
191
|
return {
|
|
186
192
|
improvement: "parse failure – skipping turn",
|
|
193
|
+
inputMaterialization: redteamResp.inputMaterialization,
|
|
194
|
+
materializationHandled: redteamResp.materializationHandled,
|
|
195
|
+
materializedVars: redteamResp.materializedVars,
|
|
187
196
|
prompt: "",
|
|
188
197
|
tokenUsage: redteamResp.tokenUsage
|
|
189
198
|
};
|
|
@@ -192,6 +201,9 @@ async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
|
192
201
|
else retObj = redteamResp.output;
|
|
193
202
|
return {
|
|
194
203
|
...retObj,
|
|
204
|
+
inputMaterialization: redteamResp.inputMaterialization,
|
|
205
|
+
materializationHandled: redteamResp.materializationHandled,
|
|
206
|
+
materializedVars: redteamResp.materializedVars,
|
|
195
207
|
tokenUsage: redteamResp.tokenUsage
|
|
196
208
|
};
|
|
197
209
|
}
|
|
@@ -230,13 +242,16 @@ function updateRedteamHistory(targetResponse, goal, score, containsPenalizedPhra
|
|
|
230
242
|
* @param id - Optional custom UUID for the node. If not provided, a new UUID will be generated.
|
|
231
243
|
* @returns A new TreeNode object.
|
|
232
244
|
*/
|
|
233
|
-
function createTreeNode(prompt, score, depth, id) {
|
|
245
|
+
function createTreeNode(prompt, score, depth, id, options) {
|
|
234
246
|
return {
|
|
235
247
|
id: id || crypto.randomUUID(),
|
|
236
248
|
prompt,
|
|
237
249
|
score,
|
|
238
250
|
children: [],
|
|
239
|
-
depth
|
|
251
|
+
depth,
|
|
252
|
+
inputMaterialization: options?.inputMaterialization,
|
|
253
|
+
materializationHandled: options?.materializationHandled,
|
|
254
|
+
materializedVars: options?.materializedVars
|
|
240
255
|
};
|
|
241
256
|
}
|
|
242
257
|
/**
|
|
@@ -313,10 +328,20 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
313
328
|
loggerTag: "[IterativeTree]"
|
|
314
329
|
});
|
|
315
330
|
const iterationVars = iterationContext?.vars || {};
|
|
316
|
-
let { improvement, prompt: newInjectVar } = await getNewPrompt(redteamProvider, [...redteamHistory, {
|
|
331
|
+
let { improvement, inputMaterialization, materializationHandled, materializedVars, prompt: newInjectVar } = await getNewPrompt(redteamProvider, [...redteamHistory, {
|
|
317
332
|
role: "assistant",
|
|
318
333
|
content: node.prompt
|
|
319
|
-
}])
|
|
334
|
+
}], shouldGenerateRemote() ? {
|
|
335
|
+
inputs,
|
|
336
|
+
materializationIndex: attempts,
|
|
337
|
+
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
338
|
+
purpose: test?.metadata?.purpose
|
|
339
|
+
} : void 0);
|
|
340
|
+
if (inputs && shouldGenerateRemote()) assertRemoteMaterializationHandled({
|
|
341
|
+
inputMaterialization,
|
|
342
|
+
materializationHandled,
|
|
343
|
+
materializedVars
|
|
344
|
+
}, "Iterative Tree multi-input generation");
|
|
320
345
|
attempts++;
|
|
321
346
|
const extractedPrompt = extractPromptFromTags(newInjectVar);
|
|
322
347
|
if (extractedPrompt) newInjectVar = extractedPrompt;
|
|
@@ -359,14 +384,22 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
359
384
|
...iterationVars,
|
|
360
385
|
[injectVar]: finalInjectVar
|
|
361
386
|
};
|
|
362
|
-
if (inputs && Object.keys(inputs).length > 0) try {
|
|
363
|
-
const
|
|
387
|
+
if (inputs && Object.keys(inputs).length > 0) if (shouldGenerateRemote()) try {
|
|
388
|
+
const parsed = JSON.parse(newInjectVar);
|
|
389
|
+
Object.assign(updatedVars, buildRemoteMaterializedInputVariables({
|
|
390
|
+
inputMaterialization,
|
|
391
|
+
materializationHandled,
|
|
392
|
+
materializedVars
|
|
393
|
+
}, parsed, inputs).vars);
|
|
394
|
+
} catch {}
|
|
395
|
+
else try {
|
|
396
|
+
const { vars: localMaterializedVars } = await extractMaterializedVariablesFromJsonWithMetadata(JSON.parse(newInjectVar), inputs, {
|
|
364
397
|
materializationIndex: attempts - 1,
|
|
365
398
|
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
366
399
|
provider: redteamProvider,
|
|
367
400
|
purpose: test?.metadata?.purpose
|
|
368
401
|
});
|
|
369
|
-
Object.assign(updatedVars,
|
|
402
|
+
Object.assign(updatedVars, localMaterializedVars);
|
|
370
403
|
} catch {}
|
|
371
404
|
const targetPrompt = await renderPrompt(prompt, updatedVars, filters, targetProvider, [injectVar]);
|
|
372
405
|
let targetResponse = await getTargetResponse(targetProvider, targetPrompt, iterationContext, options);
|
|
@@ -403,11 +436,18 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
403
436
|
const containsPenalizedPhrase = checkPenalizedPhrases(targetResponse.output);
|
|
404
437
|
const { score, explanation } = await evaluateResponse(gradingProvider, judgeSystemPrompt, targetResponse.output, bestResponse, containsPenalizedPhrase);
|
|
405
438
|
logger.debug(`[Depth ${depth}, Attempt ${attempts}] Evaluation: score=${score}, penalized=${containsPenalizedPhrase}. Max score so far: ${maxScore}`);
|
|
406
|
-
nextLevelNodes.push(createTreeNode(newInjectVar, score, depth + 1
|
|
439
|
+
nextLevelNodes.push(createTreeNode(newInjectVar, score, depth + 1, void 0, {
|
|
440
|
+
inputMaterialization,
|
|
441
|
+
materializationHandled,
|
|
442
|
+
materializedVars
|
|
443
|
+
}));
|
|
407
444
|
if (score > maxScore) {
|
|
408
445
|
maxScore = score;
|
|
409
446
|
bestResponse = targetResponse.output;
|
|
410
447
|
bestNode.prompt = newInjectVar;
|
|
448
|
+
bestNode.inputMaterialization = inputMaterialization;
|
|
449
|
+
bestNode.materializationHandled = materializationHandled;
|
|
450
|
+
bestNode.materializedVars = materializedVars;
|
|
411
451
|
bestFinalAttackPrompt = finalInjectVar;
|
|
412
452
|
bestTransformDisplayVars = lastTransformDisplayVars;
|
|
413
453
|
logger.debug(`[Depth ${depth}, Attempt ${attempts}] New max score: ${maxScore}`);
|
|
@@ -419,7 +459,7 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
419
459
|
noImprovementCount++;
|
|
420
460
|
if (noImprovementCount % 5 === 0) logger.debug(`[Depth ${depth}, Attempt ${attempts}] No improvement for ${noImprovementCount} consecutive iterations. Max score: ${maxScore}`);
|
|
421
461
|
}
|
|
422
|
-
const { getGraderById } = await import("./graders-
|
|
462
|
+
const { getGraderById } = await import("./graders-DaRU98zs.js").then((n) => n.r);
|
|
423
463
|
let graderPassed;
|
|
424
464
|
let assertToUse = test?.assert?.find((a) => a.type && a.type.includes(test.metadata?.pluginId));
|
|
425
465
|
if (!assertToUse) assertToUse = test?.assert?.find((a) => a.type);
|
|
@@ -618,13 +658,23 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
618
658
|
[injectVar]: bestPrompt
|
|
619
659
|
};
|
|
620
660
|
if (inputs && Object.keys(inputs).length > 0) try {
|
|
621
|
-
const
|
|
622
|
-
|
|
623
|
-
|
|
624
|
-
|
|
625
|
-
|
|
626
|
-
|
|
627
|
-
|
|
661
|
+
const parsed = JSON.parse(bestPrompt);
|
|
662
|
+
if (shouldGenerateRemote()) {
|
|
663
|
+
const remoteBestNodeMaterialization = {
|
|
664
|
+
inputMaterialization: bestNode.inputMaterialization,
|
|
665
|
+
materializationHandled: bestNode.materializationHandled,
|
|
666
|
+
materializedVars: bestNode.materializedVars
|
|
667
|
+
};
|
|
668
|
+
if (remoteBestNodeMaterialization.materializationHandled) Object.assign(finalUpdatedVars, buildRemoteMaterializedInputVariables(remoteBestNodeMaterialization, parsed, inputs).vars);
|
|
669
|
+
} else {
|
|
670
|
+
const { vars: materializedVars } = await extractMaterializedVariablesFromJsonWithMetadata(parsed, inputs, {
|
|
671
|
+
materializationIndex: attempts,
|
|
672
|
+
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
673
|
+
provider: redteamProvider,
|
|
674
|
+
purpose: test?.metadata?.purpose
|
|
675
|
+
});
|
|
676
|
+
Object.assign(finalUpdatedVars, materializedVars);
|
|
677
|
+
}
|
|
628
678
|
} catch {}
|
|
629
679
|
const finalTargetPrompt = await renderPrompt(prompt, finalUpdatedVars, filters, targetProvider, [injectVar]);
|
|
630
680
|
const finalTargetResponse = await getTargetResponse(targetProvider, finalTargetPrompt, context, options);
|
|
@@ -765,4 +815,4 @@ var RedteamIterativeTreeProvider = class {
|
|
|
765
815
|
//#endregion
|
|
766
816
|
export { RedteamIterativeTreeProvider as default };
|
|
767
817
|
|
|
768
|
-
//# sourceMappingURL=iterativeTree-
|
|
818
|
+
//# sourceMappingURL=iterativeTree-FrDDYAN0.js.map
|
|
@@ -1,17 +1,17 @@
|
|
|
1
1
|
const require_rolldown_runtime = require("./rolldown-runtime-D_mwlA32.cjs");
|
|
2
2
|
const require_logger = require("./logger-cfNpzI4o.cjs");
|
|
3
3
|
const require_invariant = require("./invariant-QtnLD03y.cjs");
|
|
4
|
-
const require_fetch = require("./fetch-
|
|
5
|
-
const require_accounts = require("./accounts-
|
|
4
|
+
const require_fetch = require("./fetch-Cfm4EuOB.cjs");
|
|
5
|
+
const require_accounts = require("./accounts-BVz5gHLK.cjs");
|
|
6
6
|
const require_render = require("./render-BNTrbmBw.cjs");
|
|
7
|
-
const require_remoteGeneration = require("./remoteGeneration-
|
|
7
|
+
const require_remoteGeneration = require("./remoteGeneration-BpIYlb_O.cjs");
|
|
8
8
|
const require_tokenUsageUtils = require("./tokenUsageUtils-_B-P8IAi.cjs");
|
|
9
|
-
const require_util = require("./util-
|
|
10
|
-
const require_promptfoo = require("./promptfoo-
|
|
11
|
-
const require_shared = require("./shared-
|
|
12
|
-
const require_indirectWebPwn = require("./indirectWebPwn-
|
|
13
|
-
const require_evaluatorHelpers = require("./evaluatorHelpers-
|
|
14
|
-
const require_strategies = require("./strategies-
|
|
9
|
+
const require_util = require("./util-DNtUsus_.cjs");
|
|
10
|
+
const require_promptfoo = require("./promptfoo-ClChwT74.cjs");
|
|
11
|
+
const require_shared = require("./shared-aHWko3P1.cjs");
|
|
12
|
+
const require_indirectWebPwn = require("./indirectWebPwn-D7NA9Nsv.cjs");
|
|
13
|
+
const require_evaluatorHelpers = require("./evaluatorHelpers-D06I9WFL.cjs");
|
|
14
|
+
const require_strategies = require("./strategies-CCcnEbFO.cjs");
|
|
15
15
|
const require_runtimeTransform = require("./runtimeTransform-ON3YYILw.cjs");
|
|
16
16
|
const require_prompts = require("./prompts-hNvWBD3z.cjs");
|
|
17
17
|
let dedent = require("dedent");
|
|
@@ -157,14 +157,20 @@ async function evaluateResponse(provider, judgeSystemPrompt, targetResponse, pre
|
|
|
157
157
|
* @param redteamHistory - The conversation history of the red team.
|
|
158
158
|
* @returns A promise that resolves to an object containing the improvement and new prompt.
|
|
159
159
|
*/
|
|
160
|
-
async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
160
|
+
async function getNewPrompt(redteamProvider, redteamHistory, materializationContext) {
|
|
161
161
|
const redteamBody = JSON.stringify(redteamHistory);
|
|
162
162
|
const redteamResp = await redteamProvider.callApi(redteamBody, {
|
|
163
163
|
prompt: {
|
|
164
164
|
raw: redteamBody,
|
|
165
165
|
label: "history"
|
|
166
166
|
},
|
|
167
|
-
vars: {
|
|
167
|
+
vars: materializationContext ? require_promptfoo.buildRemoteMaterializationContextVars({
|
|
168
|
+
injectVar: void 0,
|
|
169
|
+
inputs: materializationContext.inputs,
|
|
170
|
+
materializationIndex: materializationContext.materializationIndex,
|
|
171
|
+
pluginId: materializationContext.pluginId,
|
|
172
|
+
purpose: materializationContext.purpose
|
|
173
|
+
}) : {}
|
|
168
174
|
});
|
|
169
175
|
if (redteamProvider.delay) {
|
|
170
176
|
require_logger.logger.debug(`[IterativeTree] Sleeping for ${redteamProvider.delay}ms`);
|
|
@@ -187,6 +193,9 @@ async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
|
187
193
|
require_logger.logger.info(`[IterativeTree] Failed to parse attacker response as JSON (primary and fallback). Skipping this turn. primary=${String(primaryErr)} fallback=${String(fallbackErr)} outputPreview="${redteamResp.output.slice(0, 200)}"`);
|
|
188
194
|
return {
|
|
189
195
|
improvement: "parse failure – skipping turn",
|
|
196
|
+
inputMaterialization: redteamResp.inputMaterialization,
|
|
197
|
+
materializationHandled: redteamResp.materializationHandled,
|
|
198
|
+
materializedVars: redteamResp.materializedVars,
|
|
190
199
|
prompt: "",
|
|
191
200
|
tokenUsage: redteamResp.tokenUsage
|
|
192
201
|
};
|
|
@@ -195,6 +204,9 @@ async function getNewPrompt(redteamProvider, redteamHistory) {
|
|
|
195
204
|
else retObj = redteamResp.output;
|
|
196
205
|
return {
|
|
197
206
|
...retObj,
|
|
207
|
+
inputMaterialization: redteamResp.inputMaterialization,
|
|
208
|
+
materializationHandled: redteamResp.materializationHandled,
|
|
209
|
+
materializedVars: redteamResp.materializedVars,
|
|
198
210
|
tokenUsage: redteamResp.tokenUsage
|
|
199
211
|
};
|
|
200
212
|
}
|
|
@@ -233,13 +245,16 @@ function updateRedteamHistory(targetResponse, goal, score, containsPenalizedPhra
|
|
|
233
245
|
* @param id - Optional custom UUID for the node. If not provided, a new UUID will be generated.
|
|
234
246
|
* @returns A new TreeNode object.
|
|
235
247
|
*/
|
|
236
|
-
function createTreeNode(prompt, score, depth, id) {
|
|
248
|
+
function createTreeNode(prompt, score, depth, id, options) {
|
|
237
249
|
return {
|
|
238
250
|
id: id || crypto.randomUUID(),
|
|
239
251
|
prompt,
|
|
240
252
|
score,
|
|
241
253
|
children: [],
|
|
242
|
-
depth
|
|
254
|
+
depth,
|
|
255
|
+
inputMaterialization: options?.inputMaterialization,
|
|
256
|
+
materializationHandled: options?.materializationHandled,
|
|
257
|
+
materializedVars: options?.materializedVars
|
|
243
258
|
};
|
|
244
259
|
}
|
|
245
260
|
/**
|
|
@@ -316,10 +331,20 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
316
331
|
loggerTag: "[IterativeTree]"
|
|
317
332
|
});
|
|
318
333
|
const iterationVars = iterationContext?.vars || {};
|
|
319
|
-
let { improvement, prompt: newInjectVar } = await getNewPrompt(redteamProvider, [...redteamHistory, {
|
|
334
|
+
let { improvement, inputMaterialization, materializationHandled, materializedVars, prompt: newInjectVar } = await getNewPrompt(redteamProvider, [...redteamHistory, {
|
|
320
335
|
role: "assistant",
|
|
321
336
|
content: node.prompt
|
|
322
|
-
}])
|
|
337
|
+
}], require_remoteGeneration.shouldGenerateRemote() ? {
|
|
338
|
+
inputs,
|
|
339
|
+
materializationIndex: attempts,
|
|
340
|
+
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
341
|
+
purpose: test?.metadata?.purpose
|
|
342
|
+
} : void 0);
|
|
343
|
+
if (inputs && require_remoteGeneration.shouldGenerateRemote()) require_promptfoo.assertRemoteMaterializationHandled({
|
|
344
|
+
inputMaterialization,
|
|
345
|
+
materializationHandled,
|
|
346
|
+
materializedVars
|
|
347
|
+
}, "Iterative Tree multi-input generation");
|
|
323
348
|
attempts++;
|
|
324
349
|
const extractedPrompt = require_util.extractPromptFromTags(newInjectVar);
|
|
325
350
|
if (extractedPrompt) newInjectVar = extractedPrompt;
|
|
@@ -362,14 +387,22 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
362
387
|
...iterationVars,
|
|
363
388
|
[injectVar]: finalInjectVar
|
|
364
389
|
};
|
|
365
|
-
if (inputs && Object.keys(inputs).length > 0) try {
|
|
366
|
-
const
|
|
390
|
+
if (inputs && Object.keys(inputs).length > 0) if (require_remoteGeneration.shouldGenerateRemote()) try {
|
|
391
|
+
const parsed = JSON.parse(newInjectVar);
|
|
392
|
+
Object.assign(updatedVars, require_promptfoo.buildRemoteMaterializedInputVariables({
|
|
393
|
+
inputMaterialization,
|
|
394
|
+
materializationHandled,
|
|
395
|
+
materializedVars
|
|
396
|
+
}, parsed, inputs).vars);
|
|
397
|
+
} catch {}
|
|
398
|
+
else try {
|
|
399
|
+
const { vars: localMaterializedVars } = await require_util.extractMaterializedVariablesFromJsonWithMetadata(JSON.parse(newInjectVar), inputs, {
|
|
367
400
|
materializationIndex: attempts - 1,
|
|
368
401
|
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
369
402
|
provider: redteamProvider,
|
|
370
403
|
purpose: test?.metadata?.purpose
|
|
371
404
|
});
|
|
372
|
-
Object.assign(updatedVars,
|
|
405
|
+
Object.assign(updatedVars, localMaterializedVars);
|
|
373
406
|
} catch {}
|
|
374
407
|
const targetPrompt = await require_evaluatorHelpers.renderPrompt(prompt, updatedVars, filters, targetProvider, [injectVar]);
|
|
375
408
|
let targetResponse = await require_shared.getTargetResponse(targetProvider, targetPrompt, iterationContext, options);
|
|
@@ -406,11 +439,18 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
406
439
|
const containsPenalizedPhrase = require_shared.checkPenalizedPhrases(targetResponse.output);
|
|
407
440
|
const { score, explanation } = await evaluateResponse(gradingProvider, judgeSystemPrompt, targetResponse.output, bestResponse, containsPenalizedPhrase);
|
|
408
441
|
require_logger.logger.debug(`[Depth ${depth}, Attempt ${attempts}] Evaluation: score=${score}, penalized=${containsPenalizedPhrase}. Max score so far: ${maxScore}`);
|
|
409
|
-
nextLevelNodes.push(createTreeNode(newInjectVar, score, depth + 1
|
|
442
|
+
nextLevelNodes.push(createTreeNode(newInjectVar, score, depth + 1, void 0, {
|
|
443
|
+
inputMaterialization,
|
|
444
|
+
materializationHandled,
|
|
445
|
+
materializedVars
|
|
446
|
+
}));
|
|
410
447
|
if (score > maxScore) {
|
|
411
448
|
maxScore = score;
|
|
412
449
|
bestResponse = targetResponse.output;
|
|
413
450
|
bestNode.prompt = newInjectVar;
|
|
451
|
+
bestNode.inputMaterialization = inputMaterialization;
|
|
452
|
+
bestNode.materializationHandled = materializationHandled;
|
|
453
|
+
bestNode.materializedVars = materializedVars;
|
|
414
454
|
bestFinalAttackPrompt = finalInjectVar;
|
|
415
455
|
bestTransformDisplayVars = lastTransformDisplayVars;
|
|
416
456
|
require_logger.logger.debug(`[Depth ${depth}, Attempt ${attempts}] New max score: ${maxScore}`);
|
|
@@ -422,7 +462,7 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
422
462
|
noImprovementCount++;
|
|
423
463
|
if (noImprovementCount % 5 === 0) require_logger.logger.debug(`[Depth ${depth}, Attempt ${attempts}] No improvement for ${noImprovementCount} consecutive iterations. Max score: ${maxScore}`);
|
|
424
464
|
}
|
|
425
|
-
const { getGraderById } = await Promise.resolve().then(() => require("./graders-
|
|
465
|
+
const { getGraderById } = await Promise.resolve().then(() => require("./graders-CBQ2s6gz.cjs")).then((n) => n.graders_exports);
|
|
426
466
|
let graderPassed;
|
|
427
467
|
let assertToUse = test?.assert?.find((a) => a.type && a.type.includes(test.metadata?.pluginId));
|
|
428
468
|
if (!assertToUse) assertToUse = test?.assert?.find((a) => a.type);
|
|
@@ -621,13 +661,23 @@ async function runRedteamConversation({ context, filters, injectVar, options, pr
|
|
|
621
661
|
[injectVar]: bestPrompt
|
|
622
662
|
};
|
|
623
663
|
if (inputs && Object.keys(inputs).length > 0) try {
|
|
624
|
-
const
|
|
625
|
-
|
|
626
|
-
|
|
627
|
-
|
|
628
|
-
|
|
629
|
-
|
|
630
|
-
|
|
664
|
+
const parsed = JSON.parse(bestPrompt);
|
|
665
|
+
if (require_remoteGeneration.shouldGenerateRemote()) {
|
|
666
|
+
const remoteBestNodeMaterialization = {
|
|
667
|
+
inputMaterialization: bestNode.inputMaterialization,
|
|
668
|
+
materializationHandled: bestNode.materializationHandled,
|
|
669
|
+
materializedVars: bestNode.materializedVars
|
|
670
|
+
};
|
|
671
|
+
if (remoteBestNodeMaterialization.materializationHandled) Object.assign(finalUpdatedVars, require_promptfoo.buildRemoteMaterializedInputVariables(remoteBestNodeMaterialization, parsed, inputs).vars);
|
|
672
|
+
} else {
|
|
673
|
+
const { vars: materializedVars } = await require_util.extractMaterializedVariablesFromJsonWithMetadata(parsed, inputs, {
|
|
674
|
+
materializationIndex: attempts,
|
|
675
|
+
pluginId: String(test?.metadata?.pluginId || "unknown-plugin"),
|
|
676
|
+
provider: redteamProvider,
|
|
677
|
+
purpose: test?.metadata?.purpose
|
|
678
|
+
});
|
|
679
|
+
Object.assign(finalUpdatedVars, materializedVars);
|
|
680
|
+
}
|
|
631
681
|
} catch {}
|
|
632
682
|
const finalTargetPrompt = await require_evaluatorHelpers.renderPrompt(prompt, finalUpdatedVars, filters, targetProvider, [injectVar]);
|
|
633
683
|
const finalTargetResponse = await require_shared.getTargetResponse(targetProvider, finalTargetPrompt, context, options);
|
|
@@ -768,4 +818,4 @@ var RedteamIterativeTreeProvider = class {
|
|
|
768
818
|
//#endregion
|
|
769
819
|
exports.default = RedteamIterativeTreeProvider;
|
|
770
820
|
|
|
771
|
-
//# sourceMappingURL=iterativeTree-
|
|
821
|
+
//# sourceMappingURL=iterativeTree-LOgAi0nU.cjs.map
|
|
@@ -1,9 +1,9 @@
|
|
|
1
1
|
const require_logger = require("./logger-cfNpzI4o.cjs");
|
|
2
2
|
const require_createHash = require("./createHash-CSiqnK5P.cjs");
|
|
3
|
-
const require_cache = require("./cache-
|
|
3
|
+
const require_cache = require("./cache-h5MWOBZI.cjs");
|
|
4
4
|
const require_tokenUsageUtils = require("./tokenUsageUtils-_B-P8IAi.cjs");
|
|
5
|
-
const require_telemetry = require("./telemetry-
|
|
6
|
-
const require_base = require("./base-
|
|
5
|
+
const require_telemetry = require("./telemetry-C_ImlCOk.cjs");
|
|
6
|
+
const require_base = require("./base-BzdS8tod.cjs");
|
|
7
7
|
//#region src/providers/bedrock/knowledgeBase.ts
|
|
8
8
|
/**
|
|
9
9
|
* AWS Bedrock Knowledge Base provider for RAG (Retrieval Augmented Generation).
|
|
@@ -133,4 +133,4 @@ var AwsBedrockKnowledgeBaseProvider = class extends require_base.AwsBedrockGener
|
|
|
133
133
|
//#endregion
|
|
134
134
|
exports.AwsBedrockKnowledgeBaseProvider = AwsBedrockKnowledgeBaseProvider;
|
|
135
135
|
|
|
136
|
-
//# sourceMappingURL=knowledgeBase-
|
|
136
|
+
//# sourceMappingURL=knowledgeBase-CdbcGBZF.cjs.map
|
|
@@ -1,9 +1,9 @@
|
|
|
1
1
|
import { a as logger, w as getEnvInt } from "./logger-KD8JjCRJ.js";
|
|
2
2
|
import { n as sha256 } from "./createHash-CGVzWdjj.js";
|
|
3
|
-
import { i as getCache, o as isCacheEnabled } from "./cache-
|
|
3
|
+
import { i as getCache, o as isCacheEnabled } from "./cache-CrioYnaa.js";
|
|
4
4
|
import { a as createEmptyTokenUsage } from "./tokenUsageUtils-BjVkdk18.js";
|
|
5
|
-
import { n as telemetry } from "./telemetry-
|
|
6
|
-
import { n as createBedrockRequestHandler, r as hasProxyEnv, t as AwsBedrockGenericProvider } from "./base-
|
|
5
|
+
import { n as telemetry } from "./telemetry-BbpmrenM.js";
|
|
6
|
+
import { n as createBedrockRequestHandler, r as hasProxyEnv, t as AwsBedrockGenericProvider } from "./base-0Gzzue9Z.js";
|
|
7
7
|
//#region src/providers/bedrock/knowledgeBase.ts
|
|
8
8
|
/**
|
|
9
9
|
* AWS Bedrock Knowledge Base provider for RAG (Retrieval Augmented Generation).
|
|
@@ -133,4 +133,4 @@ var AwsBedrockKnowledgeBaseProvider = class extends AwsBedrockGenericProvider {
|
|
|
133
133
|
//#endregion
|
|
134
134
|
export { AwsBedrockKnowledgeBaseProvider };
|
|
135
135
|
|
|
136
|
-
//# sourceMappingURL=knowledgeBase-
|
|
136
|
+
//# sourceMappingURL=knowledgeBase-CjOXp6Lr.js.map
|