clawbenchmark 0.2.0__py3-none-any.whl

This diff shows the changes between publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
Files changed (423)
  1. clawbench/__init__.py +1 -0
  2. clawbench/_bundled/.env +7 -0
  3. clawbench/_bundled/models/model.schema.json +44 -0
  4. clawbench/_bundled/models/models.example.yaml +16 -0
  5. clawbench/_bundled/test-cases/task.schema.json +132 -0
  6. clawbench/_bundled/test-cases/v1/001-daily-life-food-uber-eats/task.json +25 -0
  7. clawbench/_bundled/test-cases/v1/002-daily-life-food-doordash/task.json +25 -0
  8. clawbench/_bundled/test-cases/v1/004-daily-life-food-instacart/extra_info/grocery_list.json +36 -0
  9. clawbench/_bundled/test-cases/v1/004-daily-life-food-instacart/task.json +30 -0
  10. clawbench/_bundled/test-cases/v1/006-daily-life-food-uber-eats/task.json +24 -0
  11. clawbench/_bundled/test-cases/v1/007-daily-life-food-instacart/extra_info/meal_plan.json +21 -0
  12. clawbench/_bundled/test-cases/v1/007-daily-life-food-instacart/task.json +30 -0
  13. clawbench/_bundled/test-cases/v1/011-daily-life-housing-zillow/task.json +25 -0
  14. clawbench/_bundled/test-cases/v1/015-daily-life-housing-craigslist/extra_info/listing_details.json +26 -0
  15. clawbench/_bundled/test-cases/v1/015-daily-life-housing-craigslist/task.json +30 -0
  16. clawbench/_bundled/test-cases/v1/035-daily-life-health-medical-betterhelp/task.json +25 -0
  17. clawbench/_bundled/test-cases/v1/041-daily-life-pets-rover/task.json +25 -0
  18. clawbench/_bundled/test-cases/v1/043-daily-life-pets-rover/extra_info/pet_info.json +12 -0
  19. clawbench/_bundled/test-cases/v1/043-daily-life-pets-rover/task.json +30 -0
  20. clawbench/_bundled/test-cases/v1/045-daily-life-personal-care-booksy/task.json +25 -0
  21. clawbench/_bundled/test-cases/v1/047-daily-life-personal-care-taskrabbit/extra_info/address_info.json +7 -0
  22. clawbench/_bundled/test-cases/v1/047-daily-life-personal-care-taskrabbit/task.json +30 -0
  23. clawbench/_bundled/test-cases/v1/086-job-search-hr-cv-autofill-greenhouse-meta/extra_info/job_links.json +5 -0
  24. clawbench/_bundled/test-cases/v1/086-job-search-hr-cv-autofill-greenhouse-meta/task.json +30 -0
  25. clawbench/_bundled/test-cases/v1/089-job-search-hr-cv-autofill-simplify-jobs/extra_info/job_links.json +5 -0
  26. clawbench/_bundled/test-cases/v1/089-job-search-hr-cv-autofill-simplify-jobs/task.json +30 -0
  27. clawbench/_bundled/test-cases/v1/091-job-search-hr-job-apply-indeed/task.json +25 -0
  28. clawbench/_bundled/test-cases/v1/120-office-secretary-tasks-email-mgmt-purelymail/task.json +28 -0
  29. clawbench/_bundled/test-cases/v1/121-office-secretary-tasks-email-mgmt-purelymail/task.json +28 -0
  30. clawbench/_bundled/test-cases/v1/128-office-secretary-tasks-email-mgmt-purelymail/task.json +28 -0
  31. clawbench/_bundled/test-cases/v1/134-office-secretary-tasks-calendar-calendly/task.json +25 -0
  32. clawbench/_bundled/test-cases/v1/137-office-secretary-tasks-calendar-doodle/extra_info/meeting_details.json +30 -0
  33. clawbench/_bundled/test-cases/v1/137-office-secretary-tasks-calendar-doodle/task.json +30 -0
  34. clawbench/_bundled/test-cases/v1/139-office-secretary-tasks-calendar-calendly/task.json +25 -0
  35. clawbench/_bundled/test-cases/v1/142-office-secretary-tasks-collab-trello/extra_info/task_list.json +29 -0
  36. clawbench/_bundled/test-cases/v1/142-office-secretary-tasks-collab-trello/task.json +30 -0
  37. clawbench/_bundled/test-cases/v1/179-dev-tech-github-ops-github/extra_info/config.json +13 -0
  38. clawbench/_bundled/test-cases/v1/179-dev-tech-github-ops-github/task.json +30 -0
  39. clawbench/_bundled/test-cases/v1/180-dev-tech-github-ops-github/task.json +25 -0
  40. clawbench/_bundled/test-cases/v1/215-academia-research-paper-tables-overleaf/extra_info/raw_results.json +47 -0
  41. clawbench/_bundled/test-cases/v1/215-academia-research-paper-tables-overleaf/task.json +30 -0
  42. clawbench/_bundled/test-cases/v1/242-academia-research-research-tools-overleaf/task.json +25 -0
  43. clawbench/_bundled/test-cases/v1/246-academia-research-research-tools-zotero/task.json +25 -0
  44. clawbench/_bundled/test-cases/v1/247-academia-research-research-tools-semantic-scholar/task.json +25 -0
  45. clawbench/_bundled/test-cases/v1/265-education-learning-general-coursera/task.json +25 -0
  46. clawbench/_bundled/test-cases/v1/266-education-learning-general-leetcode/extra_info/solution_code.py +9 -0
  47. clawbench/_bundled/test-cases/v1/266-education-learning-general-leetcode/task.json +30 -0
  48. clawbench/_bundled/test-cases/v1/273-education-learning-general-edx/task.json +25 -0
  49. clawbench/_bundled/test-cases/v1/274-education-learning-general-udemy/task.json +25 -0
  50. clawbench/_bundled/test-cases/v1/279-travel-general-airbnb/task.json +25 -0
  51. clawbench/_bundled/test-cases/v1/280-travel-general-booking-com/task.json +25 -0
  52. clawbench/_bundled/test-cases/v1/363-entertainment-hobbies-general-ticketmaster/task.json +25 -0
  53. clawbench/_bundled/test-cases/v1/369-entertainment-hobbies-general-goodreads/extra_info/book_list.json +14 -0
  54. clawbench/_bundled/test-cases/v1/369-entertainment-hobbies-general-goodreads/task.json +30 -0
  55. clawbench/_bundled/test-cases/v1/372-entertainment-hobbies-general-eventbrite/extra_info/event_details.json +10 -0
  56. clawbench/_bundled/test-cases/v1/372-entertainment-hobbies-general-eventbrite/task.json +30 -0
  57. clawbench/_bundled/test-cases/v1/403-personal-management-account-security-1password-web/extra_info/credentials.json +34 -0
  58. clawbench/_bundled/test-cases/v1/403-personal-management-account-security-1password-web/task.json +30 -0
  59. clawbench/_bundled/test-cases/v1/413-personal-management-personal-tools-todoist/extra_info/task_list.json +52 -0
  60. clawbench/_bundled/test-cases/v1/413-personal-management-personal-tools-todoist/task.json +30 -0
  61. clawbench/_bundled/test-cases/v1/468-rating-voting-general-glassdoor/extra_info/interview_experience.json +10 -0
  62. clawbench/_bundled/test-cases/v1/468-rating-voting-general-glassdoor/task.json +30 -0
  63. clawbench/_bundled/test-cases/v1/469-rating-voting-general-tripadvisor/extra_info/review_content.json +6 -0
  64. clawbench/_bundled/test-cases/v1/469-rating-voting-general-tripadvisor/task.json +30 -0
  65. clawbench/_bundled/test-cases/v1/470-rating-voting-general-trustpilot/extra_info/review_content.json +6 -0
  66. clawbench/_bundled/test-cases/v1/470-rating-voting-general-trustpilot/task.json +30 -0
  67. clawbench/_bundled/test-cases/v1/474-rating-voting-general-capterra/task.json +25 -0
  68. clawbench/_bundled/test-cases/v1/475-rating-voting-general-g2/task.json +25 -0
  69. clawbench/_bundled/test-cases/v1/482-creation-init-general-confluence/extra_info/content.json +3 -0
  70. clawbench/_bundled/test-cases/v1/482-creation-init-general-confluence/task.json +30 -0
  71. clawbench/_bundled/test-cases/v1/483-creation-init-general-airtable/task.json +25 -0
  72. clawbench/_bundled/test-cases/v1/484-creation-init-general-clickup/task.json +25 -0
  73. clawbench/_bundled/test-cases/v1/485-creation-init-general-webflow/task.json +25 -0
  74. clawbench/_bundled/test-cases/v1/486-creation-init-general-mailchimp/extra_info/content.json +3 -0
  75. clawbench/_bundled/test-cases/v1/486-creation-init-general-mailchimp/task.json +30 -0
  76. clawbench/_bundled/test-cases/v1/487-creation-init-general-typeform/extra_info/survey_questions.json +85 -0
  77. clawbench/_bundled/test-cases/v1/487-creation-init-general-typeform/task.json +30 -0
  78. clawbench/_bundled/test-cases/v1/488-creation-init-general-substack/extra_info/content.json +3 -0
  79. clawbench/_bundled/test-cases/v1/488-creation-init-general-substack/task.json +30 -0
  80. clawbench/_bundled/test-cases/v1/489-creation-init-general-ghost/extra_info/content.json +3 -0
  81. clawbench/_bundled/test-cases/v1/489-creation-init-general-ghost/task.json +30 -0
  82. clawbench/_bundled/test-cases/v1/501-creation-init-general-asana/extra_info/project_description.json +8 -0
  83. clawbench/_bundled/test-cases/v1/501-creation-init-general-asana/task.json +33 -0
  84. clawbench/_bundled/test-cases/v1/529-daily-life-shopping-delivery-king-arthur-baking/task.json +25 -0
  85. clawbench/_bundled/test-cases/v1/533-daily-life-utilities-inmyarea/task.json +25 -0
  86. clawbench/_bundled/test-cases/v1/535-daily-life-home-home-depot/task.json +25 -0
  87. clawbench/_bundled/test-cases/v1/537-daily-life-food-crumbl/task.json +25 -0
  88. clawbench/_bundled/test-cases/v1/539-daily-life-health-jefit/task.json +25 -0
  89. clawbench/_bundled/test-cases/v1/542-daily-life-pets-wag/task.json +25 -0
  90. clawbench/_bundled/test-cases/v1/551-finance-investment-crypto-wallet-trezor/task.json +25 -0
  91. clawbench/_bundled/test-cases/v1/552-finance-investment-business-payment-plooto/task.json +25 -0
  92. clawbench/_bundled/test-cases/v1/555-finance-investment-insurance-insureon/task.json +25 -0
  93. clawbench/_bundled/test-cases/v1/559-finance-investment-crowdfunding-frontfundr/task.json +25 -0
  94. clawbench/_bundled/test-cases/v1/564-daily-life-event-registration-race-roster/task.json +25 -0
  95. clawbench/_bundled/test-cases/v1/565-job-search-hr-job-search-jopwell/task.json +25 -0
  96. clawbench/_bundled/test-cases/v1/566-job-search-hr-job-search-ziprecruiter/extra_info/listing_details.json +26 -0
  97. clawbench/_bundled/test-cases/v1/566-job-search-hr-job-search-ziprecruiter/task.json +30 -0
  98. clawbench/_bundled/test-cases/v1/569-job-search-hr-job-search-careerbuilder/task.json +25 -0
  99. clawbench/_bundled/test-cases/v1/570-job-search-hr-job-search-hired/task.json +25 -0
  100. clawbench/_bundled/test-cases/v1/571-job-search-hr-recruitment-mgmt-workable/extra_info/listing_details.json +26 -0
  101. clawbench/_bundled/test-cases/v1/571-job-search-hr-recruitment-mgmt-workable/task.json +30 -0
  102. clawbench/_bundled/test-cases/v1/576-office-secretary-tasks-reports-ftc-reportfraud/task.json +25 -0
  103. clawbench/_bundled/test-cases/v1/583-office-secretary-tasks-support-tickets-freshdesk/task.json +25 -0
  104. clawbench/_bundled/test-cases/v1/598-academia-research-legal-docs-formswift/task.json +25 -0
  105. clawbench/_bundled/test-cases/v1/606-education-learning-kids-courses-outschool/task.json +25 -0
  106. clawbench/_bundled/test-cases/v1/607-education-learning-art-courses-creativebug/task.json +25 -0
  107. clawbench/_bundled/test-cases/v1/609-education-learning-meditation-spirit-rock-meditation-center/task.json +25 -0
  108. clawbench/_bundled/test-cases/v1/615-travel-flights-spirit-airlines/task.json +25 -0
  109. clawbench/_bundled/test-cases/v1/618-travel-train-bus-12go-asia/task.json +25 -0
  110. clawbench/_bundled/test-cases/v1/625-travel-camping-outdoor-parks-canada-reservations/task.json +25 -0
  111. clawbench/_bundled/test-cases/v1/626-travel-bus-flixbus/task.json +25 -0
  112. clawbench/_bundled/test-cases/v1/627-travel-flights-momondo/task.json +25 -0
  113. clawbench/_bundled/test-cases/v1/632-shopping-commerce-beauty-care-olaplex/task.json +25 -0
  114. clawbench/_bundled/test-cases/v1/634-shopping-commerce-apparel-dooney-bourke/task.json +25 -0
  115. clawbench/_bundled/test-cases/v1/635-shopping-commerce-gifts-uncommon-goods/task.json +25 -0
  116. clawbench/_bundled/test-cases/v1/636-shopping-commerce-auto-parts-rockauto/task.json +25 -0
  117. clawbench/_bundled/test-cases/v1/638-shopping-commerce-print-custom-vistaprint/task.json +25 -0
  118. clawbench/_bundled/test-cases/v1/639-shopping-commerce-luxury-mansur-gavriel/task.json +25 -0
  119. clawbench/_bundled/test-cases/v1/671-entertainment-gaming-humble-bundle/task.json +25 -0
  120. clawbench/_bundled/test-cases/v1/672-entertainment-hobbies-anime-streaming-crunchyroll/task.json +25 -0
  121. clawbench/_bundled/test-cases/v1/674-entertainment-hobbies-masterclass-masterclass/task.json +25 -0
  122. clawbench/_bundled/test-cases/v1/676-government-civic-legal-docs-legalnature/task.json +25 -0
  123. clawbench/_bundled/test-cases/v1/685-personal-management-budget-mgmt-everydollar/task.json +25 -0
  124. clawbench/_bundled/test-cases/v1/687-personal-management-vpn-subscription-ipvanish/task.json +25 -0
  125. clawbench/_bundled/test-cases/v1/688-personal-management-insurance-compare-insurify/task.json +25 -0
  126. clawbench/_bundled/test-cases/v1/695-automation-workflows-recurring-order-stumptown-coffee/task.json +25 -0
  127. clawbench/_bundled/test-cases/v1/697-automation-workflows-recurring-order-bean-box/task.json +25 -0
  128. clawbench/_bundled/test-cases/v1/699-automation-workflows-recurring-order-mistobox/task.json +25 -0
  129. clawbench/_bundled/test-cases/v1/700-deletion-revocation-data-deletion-deleteme/task.json +25 -0
  130. clawbench/_bundled/test-cases/v1/705-rating-voting-wine-review-vivino/task.json +25 -0
  131. clawbench/_bundled/test-cases/v1/706-rating-voting-beer-review-beeradvocate/task.json +25 -0
  132. clawbench/_bundled/test-cases/v1/707-rating-voting-social-wine-untappd/task.json +25 -0
  133. clawbench/_bundled/test-cases/v1/708-rating-voting-professor-review-ratemyprofessors/task.json +28 -0
  134. clawbench/_bundled/test-cases/v1/709-rating-voting-service-review-angi/task.json +25 -0
  135. clawbench/_bundled/test-cases/v1/710-creation-init-interior-design-roomsketcher/task.json +25 -0
  136. clawbench/_bundled/test-cases/v1/711-creation-init-color-design-coolors/task.json +25 -0
  137. clawbench/_bundled/test-cases/v1/712-creation-init-website-create-squarespace/task.json +25 -0
  138. clawbench/_bundled/test-cases/v1/713-creation-init-website-build-wix/task.json +25 -0
  139. clawbench/_bundled/test-cases/v1/735-home-services-maintenance-house-cleaning-bark/task.json +25 -0
  140. clawbench/_bundled/test-cases/v1/736-home-services-maintenance-plumbing-ace-hardware/task.json +25 -0
  141. clawbench/_bundled/test-cases/v1/737-home-services-maintenance-kitchen-remodel-lowes/task.json +25 -0
  142. clawbench/_bundled/test-cases/v1/738-home-services-maintenance-equipment-install-amazon-home-services/task.json +25 -0
  143. clawbench/_bundled/test-cases/v1/750-automotive-vehicle-services-car-insurance-compare-kanetix/task.json +25 -0
  144. clawbench/_bundled/test-cases/v1/751-automotive-vehicle-services-car-lease-sixt/task.json +25 -0
  145. clawbench/_bundled/test-cases/v1/754-automotive-vehicle-services-used-car-listing-autotrader/task.json +25 -0
  146. clawbench/_bundled/test-cases/v1/763-automotive-vehicle-services-car-lease-autoslash/task.json +25 -0
  147. clawbench/_bundled/test-cases/v1/766-nonprofit-charity-donation-doctors-without-borders-msf/task.json +25 -0
  148. clawbench/_bundled/test-cases/v1/768-nonprofit-charity-community-crowdfund-ioby/task.json +25 -0
  149. clawbench/_bundled/test-cases/v1/770-nonprofit-charity-volunteer-apply-on-make-a-wish-foundation-website-complete-and-submit-a-volunteer-application-form-selecting-the-wish-granter-role-and-entering-city-phoenix-az/task.json +25 -0
  150. clawbench/_bundled/test-cases/v1/774-nonprofit-charity-nonprofit-job-apply-charity-village/task.json +25 -0
  151. clawbench/_bundled/test-cases/v1/776-nonprofit-charity-volunteer-signup-idealist/task.json +25 -0
  152. clawbench/_bundled/test-cases/v1/778-nonprofit-charity-donation-globalgiving/extra_info/payment_info.json +3 -0
  153. clawbench/_bundled/test-cases/v1/778-nonprofit-charity-donation-globalgiving/task.json +30 -0
  154. clawbench/_bundled/test-cases/v1/780-beauty-personal-care-skincare-purchase-soko-glam/extra_info/address_info.json +4 -0
  155. clawbench/_bundled/test-cases/v1/780-beauty-personal-care-skincare-purchase-soko-glam/task.json +30 -0
  156. clawbench/_bundled/test-cases/v1/781-beauty-personal-care-beauty-booking-bluemercury/extra_info/email_info.json +3 -0
  157. clawbench/_bundled/test-cases/v1/781-beauty-personal-care-beauty-booking-bluemercury/task.json +30 -0
  158. clawbench/_bundled/test-cases/v1/782-beauty-personal-care-skincare-purchase-paulas-choice/task.json +24 -0
  159. clawbench/_bundled/test-cases/v1/783-beauty-personal-care-beauty-booking-ulta-beauty/task.json +24 -0
  160. clawbench/_bundled/test-cases/v1/785-beauty-personal-care-skincare-curology/task.json +25 -0
  161. clawbench/_bundled/test-cases/v1/788-beauty-personal-care-makeup-the-ordinary/task.json +25 -0
  162. clawbench/_bundled/test-cases/v1/789-beauty-personal-care-makeup-fenty-beauty/task.json +25 -0
  163. clawbench/_bundled/test-cases/v1/793-beauty-personal-care-beauty-retail-mac-cosmetics/task.json +25 -0
  164. clawbench/_bundled/test-cases/v1/794-beauty-personal-care-salon-booking-styleseat/task.json +25 -0
  165. clawbench/_bundled/test-cases/v1/795-pet-animal-care-pet-adoption-aspca/task.json +25 -0
  166. clawbench/_bundled/test-cases/v1/796-pet-animal-care-pet-supplies-grooming-petsmart/extra_info/pet_info.json +12 -0
  167. clawbench/_bundled/test-cases/v1/796-pet-animal-care-pet-supplies-grooming-petsmart/task.json +30 -0
  168. clawbench/_bundled/test-cases/v1/799-pet-animal-care-pet-insurance-aspca-pet-health-insurance/task.json +25 -0
  169. clawbench/_bundled/test-cases/v1/801-pet-animal-care-pet-friendly-travel-bringfido/task.json +25 -0
  170. clawbench/_bundled/test-cases/v1/803-pet-animal-care-pet-medical-pawp/extra_info/pet_info.json +12 -0
  171. clawbench/_bundled/test-cases/v1/803-pet-animal-care-pet-medical-pawp/task.json +30 -0
  172. clawbench/_bundled/test-cases/v1/807-pet-animal-care-pet-dna-embark/task.json +25 -0
  173. clawbench/_bundled/test-cases/v1/809-pet-animal-care-pet-adopt-petfinder/task.json +28 -0
  174. clawbench/_bundled/test-cases/v1/812-pet-animal-care-pet-subscription-ollie/task.json +25 -0
  175. clawbench/_bundled/test-cases/v1/815-personal-management-records-mgmt-myheritage/task.json +25 -0
  176. clawbench/_bundled/test-cases/v1/821-education-learning-reading-self-study-blinkist/task.json +25 -0
  177. clawbench/_bundled/test-cases/v1/861-entertainment-hobbies-movies-cineplex/task.json +25 -0
  178. clawbench/_bundled/test-cases/v1/862-entertainment-hobbies-movies-amc-theatres/task.json +25 -0
  179. clawbench/_bundled/test-cases/v1/864-entertainment-hobbies-show-tickets-ticketmaster/task.json +25 -0
  180. clawbench/_bundled/test-cases/v1/865-travel-outdoor-hipcamp/task.json +25 -0
  181. clawbench/_bundled/test-cases/v1/867-entertainment-hobbies-movies-fandango/task.json +25 -0
  182. clawbench/_bundled/test-cases/v1/872-daily-life-food-opentable/task.json +25 -0
  183. clawbench/_bundled/test-cases/v1/873-daily-life-food-resy/task.json +28 -0
  184. clawbench/_bundled/test-cases/v1/876-entertainment-hobbies-show-tickets-vivid-seats/task.json +25 -0
  185. clawbench/_bundled/test-cases/v1/877-entertainment-hobbies-show-tickets-stubhub/task.json +25 -0
  186. clawbench/_bundled/test-cases/v1/878-travel-outdoor-ontario-parks/task.json +25 -0
  187. clawbench/_bundled/test-cases/v1/883-education-learning-hobby-class-sur-la-table/task.json +25 -0
  188. clawbench/_bundled/test-cases/v1/884-entertainment-hobbies-experience-breakout-games/task.json +25 -0
  189. clawbench/_bundled/test-cases/v1/885-entertainment-hobbies-experience-bowlero/task.json +25 -0
  190. clawbench/_bundled/test-cases/v1/886-entertainment-hobbies-experience-topgolf/task.json +25 -0
  191. clawbench/_bundled/test-cases/v1-lite/002-daily-life-food-doordash/task.json +25 -0
  192. clawbench/_bundled/test-cases/v1-lite/007-daily-life-food-instacart/extra_info/meal_plan.json +21 -0
  193. clawbench/_bundled/test-cases/v1-lite/007-daily-life-food-instacart/task.json +30 -0
  194. clawbench/_bundled/test-cases/v1-lite/047-daily-life-personal-care-taskrabbit/extra_info/address_info.json +7 -0
  195. clawbench/_bundled/test-cases/v1-lite/047-daily-life-personal-care-taskrabbit/task.json +30 -0
  196. clawbench/_bundled/test-cases/v1-lite/091-job-search-hr-job-apply-indeed/task.json +25 -0
  197. clawbench/_bundled/test-cases/v1-lite/142-office-secretary-tasks-collab-trello/extra_info/task_list.json +29 -0
  198. clawbench/_bundled/test-cases/v1-lite/142-office-secretary-tasks-collab-trello/task.json +30 -0
  199. clawbench/_bundled/test-cases/v1-lite/179-dev-tech-github-ops-github/extra_info/config.json +13 -0
  200. clawbench/_bundled/test-cases/v1-lite/179-dev-tech-github-ops-github/task.json +30 -0
  201. clawbench/_bundled/test-cases/v1-lite/215-academia-research-paper-tables-overleaf/extra_info/raw_results.json +47 -0
  202. clawbench/_bundled/test-cases/v1-lite/215-academia-research-paper-tables-overleaf/task.json +30 -0
  203. clawbench/_bundled/test-cases/v1-lite/266-education-learning-general-leetcode/extra_info/solution_code.py +9 -0
  204. clawbench/_bundled/test-cases/v1-lite/266-education-learning-general-leetcode/task.json +30 -0
  205. clawbench/_bundled/test-cases/v1-lite/279-travel-general-airbnb/task.json +25 -0
  206. clawbench/_bundled/test-cases/v1-lite/369-entertainment-hobbies-general-goodreads/extra_info/book_list.json +14 -0
  207. clawbench/_bundled/test-cases/v1-lite/369-entertainment-hobbies-general-goodreads/task.json +30 -0
  208. clawbench/_bundled/test-cases/v1-lite/372-entertainment-hobbies-general-eventbrite/extra_info/event_details.json +10 -0
  209. clawbench/_bundled/test-cases/v1-lite/372-entertainment-hobbies-general-eventbrite/task.json +30 -0
  210. clawbench/_bundled/test-cases/v1-lite/403-personal-management-account-security-1password-web/extra_info/credentials.json +34 -0
  211. clawbench/_bundled/test-cases/v1-lite/403-personal-management-account-security-1password-web/task.json +30 -0
  212. clawbench/_bundled/test-cases/v1-lite/469-rating-voting-general-tripadvisor/extra_info/review_content.json +6 -0
  213. clawbench/_bundled/test-cases/v1-lite/469-rating-voting-general-tripadvisor/task.json +30 -0
  214. clawbench/_bundled/test-cases/v1-lite/486-creation-init-general-mailchimp/extra_info/content.json +3 -0
  215. clawbench/_bundled/test-cases/v1-lite/486-creation-init-general-mailchimp/task.json +30 -0
  216. clawbench/_bundled/test-cases/v1-lite/501-creation-init-general-asana/extra_info/project_description.json +8 -0
  217. clawbench/_bundled/test-cases/v1-lite/501-creation-init-general-asana/task.json +33 -0
  218. clawbench/_bundled/test-cases/v1-lite/712-creation-init-website-create-squarespace/task.json +25 -0
  219. clawbench/_bundled/test-cases/v1-lite/783-beauty-personal-care-beauty-booking-ulta-beauty/task.json +24 -0
  220. clawbench/_bundled/test-cases/v1-lite/809-pet-animal-care-pet-adopt-petfinder/task.json +28 -0
  221. clawbench/_bundled/test-cases/v1-lite/867-entertainment-hobbies-movies-fandango/task.json +25 -0
  222. clawbench/_bundled/test-cases/v1-lite/872-daily-life-food-opentable/task.json +25 -0
  223. clawbench/_bundled/test-cases/v2/v2-047-daily-life-personal-care-taskrabbit/extra_info/address_info.json +7 -0
  224. clawbench/_bundled/test-cases/v2/v2-047-daily-life-personal-care-taskrabbit/task.json +30 -0
  225. clawbench/_bundled/test-cases/v2/v2-086-job-search-hr-cv-autofill-greenhouse-meta/extra_info/job_links.json +5 -0
  226. clawbench/_bundled/test-cases/v2/v2-086-job-search-hr-cv-autofill-greenhouse-meta/task.json +30 -0
  227. clawbench/_bundled/test-cases/v2/v2-089-job-search-hr-cv-autofill-simplify-jobs/extra_info/job_links.json +5 -0
  228. clawbench/_bundled/test-cases/v2/v2-089-job-search-hr-cv-autofill-simplify-jobs/task.json +30 -0
  229. clawbench/_bundled/test-cases/v2/v2-091-job-search-hr-job-apply-indeed/task.json +25 -0
  230. clawbench/_bundled/test-cases/v2/v2-1010-rating-voting-review-myrecipes/task.json +25 -0
  231. clawbench/_bundled/test-cases/v2/v2-1033-education-learning-registration-khanacademy/task.json +25 -0
  232. clawbench/_bundled/test-cases/v2/v2-1035-education-learning-enrollment-edx/task.json +25 -0
  233. clawbench/_bundled/test-cases/v2/v2-1045-weworkremotely/task.json +25 -0
  234. clawbench/_bundled/test-cases/v2/v2-1065b-daily-life-home-services-handy/task.json +26 -0
  235. clawbench/_bundled/test-cases/v2/v2-1088-nonprofit-charity-petition-change/task.json +25 -0
  236. clawbench/_bundled/test-cases/v2/v2-1093-personal-management-travel-tripit/task.json +25 -0
  237. clawbench/_bundled/test-cases/v2/v2-1095-health-mealplan-eatthismuch/task.json +25 -0
  238. clawbench/_bundled/test-cases/v2/v2-1097-beauty-personal-care-shopping-theordinary/task.json +29 -0
  239. clawbench/_bundled/test-cases/v2/v2-1100-food-cooking-collection-myrecipes/task.json +25 -0
  240. clawbench/_bundled/test-cases/v2/v2-1101-hobbies-gaming-discussion-ravelry/task.json +25 -0
  241. clawbench/_bundled/test-cases/v2/v2-1102-fitness-social-post-strava/task.json +25 -0
  242. clawbench/_bundled/test-cases/v2/v2-1103-fitness-club-strava/task.json +25 -0
  243. clawbench/_bundled/test-cases/v2/v2-1104-fitness-edit-activity-strava/task.json +25 -0
  244. clawbench/_bundled/test-cases/v2/v2-1107-hobbies-gaming-forum-boardgamegeek/task.json +25 -0
  245. clawbench/_bundled/test-cases/v2/v2-1108-civic-petition-change/task.json +25 -0
  246. clawbench/_bundled/test-cases/v2/v2-1111-civic-petition-change/task.json +25 -0
  247. clawbench/_bundled/test-cases/v2/v2-1112-nonprofit-petition-update-change/task.json +25 -0
  248. clawbench/_bundled/test-cases/v2/v2-1113-health-mealplan-eatthismuch/task.json +25 -0
  249. clawbench/_bundled/test-cases/v2/v2-1114-education-enrollment-edx/task.json +25 -0
  250. clawbench/_bundled/test-cases/v2/v2-1115-education-enrollment-edx/task.json +25 -0
  251. clawbench/_bundled/test-cases/v2/v2-1116-education-enrollment-edx/task.json +25 -0
  252. clawbench/_bundled/test-cases/v2/v2-1117/task.json +25 -0
  253. clawbench/_bundled/test-cases/v2/v2-1118/task.json +25 -0
  254. clawbench/_bundled/test-cases/v2/v2-1120b-services-booking-handy/task.json +26 -0
  255. clawbench/_bundled/test-cases/v2/v2-1121b-services-booking-handy/task.json +26 -0
  256. clawbench/_bundled/test-cases/v2/v2-1122-education-course-khanacademy/task.json +25 -0
  257. clawbench/_bundled/test-cases/v2/v2-1123-education-course-khanacademy/task.json +25 -0
  258. clawbench/_bundled/test-cases/v2/v2-1124-education-course-khanacademy/task.json +25 -0
  259. clawbench/_bundled/test-cases/v2/v2-1125-education-course-khanacademy/task.json +25 -0
  260. clawbench/_bundled/test-cases/v2/v2-1126-food-cooking-collection-myrecipes/task.json +25 -0
  261. clawbench/_bundled/test-cases/v2/v2-1130-training-class-search-redcross/task.json +25 -0
  262. clawbench/_bundled/test-cases/v2/v2-1131-training-add-to-cart-redcross/task.json +25 -0
  263. clawbench/_bundled/test-cases/v2/v2-1132-training-enroll-course-redcross/task.json +25 -0
  264. clawbench/_bundled/test-cases/v2/v2-1133-newsletter-signup-redcross/task.json +25 -0
  265. clawbench/_bundled/test-cases/v2/v2-1134-chapter-finder-redcross/task.json +25 -0
  266. clawbench/_bundled/test-cases/v2/v2-1135-events-tickets-ticketmaster/task.json +25 -0
  267. clawbench/_bundled/test-cases/v2/v2-1136-events-tickets-ticketmaster/task.json +25 -0
  268. clawbench/_bundled/test-cases/v2/v2-1137-entertainment-watchlist-trakt/task.json +25 -0
  269. clawbench/_bundled/test-cases/v2/v2-1138-entertainment-watchlist-trakt/task.json +25 -0
  270. clawbench/_bundled/test-cases/v2/v2-1139-travel-itinerary-tripit/task.json +25 -0
  271. clawbench/_bundled/test-cases/v2/v2-1140-travel-itinerary-tripit/task.json +25 -0
  272. clawbench/_bundled/test-cases/v2/v2-1141-travel-itinerary-tripit/task.json +25 -0
  273. clawbench/_bundled/test-cases/v2/v2-1144-weworkremotely/task.json +25 -0
  274. clawbench/_bundled/test-cases/v2/v2-1145-weworkremotely/task.json +25 -0
  275. clawbench/_bundled/test-cases/v2/v2-1146-weworkremotely/task.json +25 -0
  276. clawbench/_bundled/test-cases/v2/v2-1201-beauty-cart-theordinary/task.json +28 -0
  277. clawbench/_bundled/test-cases/v2/v2-1202-beauty-cart-quantity-theordinary/task.json +28 -0
  278. clawbench/_bundled/test-cases/v2/v2-179-dev-tech-github-ops-github/extra_info/config.json +13 -0
  279. clawbench/_bundled/test-cases/v2/v2-179-dev-tech-github-ops-github/task.json +30 -0
  280. clawbench/_bundled/test-cases/v2/v2-180-dev-tech-github-ops-github/task.json +25 -0
  281. clawbench/_bundled/test-cases/v2/v2-215-academia-research-paper-tables-overleaf/extra_info/raw_results.json +47 -0
  282. clawbench/_bundled/test-cases/v2/v2-215-academia-research-paper-tables-overleaf/task.json +30 -0
  283. clawbench/_bundled/test-cases/v2/v2-234-daily-life-events-ticketmaster/task.json +26 -0
  284. clawbench/_bundled/test-cases/v2/v2-242-academia-research-research-tools-overleaf/task.json +25 -0
  285. clawbench/_bundled/test-cases/v2/v2-247-academia-research-research-tools-semantic-scholar/task.json +25 -0
  286. clawbench/_bundled/test-cases/v2/v2-265-education-learning-general-coursera/task.json +25 -0
  287. clawbench/_bundled/test-cases/v2/v2-266-education-learning-general-leetcode/extra_info/solution_code.py +9 -0
  288. clawbench/_bundled/test-cases/v2/v2-266-education-learning-general-leetcode/task.json +30 -0
  289. clawbench/_bundled/test-cases/v2/v2-273-education-learning-general-edx/task.json +25 -0
  290. clawbench/_bundled/test-cases/v2/v2-274-office-secretary-tasks-calendar-when2meet/task.json +25 -0
  291. clawbench/_bundled/test-cases/v2/v2-284-office-secretary-tasks-calendar-when2meet/task.json +25 -0
  292. clawbench/_bundled/test-cases/v2/v2-369-entertainment-hobbies-general-goodreads/extra_info/book_list.json +14 -0
  293. clawbench/_bundled/test-cases/v2/v2-369-entertainment-hobbies-general-goodreads/task.json +30 -0
  294. clawbench/_bundled/test-cases/v2/v2-372-entertainment-hobbies-general-eventbrite/extra_info/event_details.json +10 -0
  295. clawbench/_bundled/test-cases/v2/v2-372-entertainment-hobbies-general-eventbrite/task.json +30 -0
  296. clawbench/_bundled/test-cases/v2/v2-413-personal-management-personal-tools-todoist/extra_info/task_list.json +52 -0
  297. clawbench/_bundled/test-cases/v2/v2-413-personal-management-personal-tools-todoist/task.json +30 -0
  298. clawbench/_bundled/test-cases/v2/v2-468-rating-voting-general-glassdoor/extra_info/interview_experience.json +10 -0
  299. clawbench/_bundled/test-cases/v2/v2-468-rating-voting-general-glassdoor/task.json +30 -0
  300. clawbench/_bundled/test-cases/v2/v2-469-rating-voting-general-tripadvisor/extra_info/review_content.json +6 -0
  301. clawbench/_bundled/test-cases/v2/v2-469-rating-voting-general-tripadvisor/task.json +30 -0
  302. clawbench/_bundled/test-cases/v2/v2-470-rating-voting-general-trustpilot/extra_info/review_content.json +6 -0
  303. clawbench/_bundled/test-cases/v2/v2-470-rating-voting-general-trustpilot/task.json +30 -0
  304. clawbench/_bundled/test-cases/v2/v2-474-rating-voting-general-capterra/task.json +25 -0
  305. clawbench/_bundled/test-cases/v2/v2-475-rating-voting-general-g2/task.json +25 -0
  306. clawbench/_bundled/test-cases/v2/v2-483-creation-init-general-airtable/task.json +25 -0
  307. clawbench/_bundled/test-cases/v2/v2-485-creation-init-general-webflow/task.json +25 -0
  308. clawbench/_bundled/test-cases/v2/v2-486-creation-init-general-mailchimp/extra_info/content.json +3 -0
  309. clawbench/_bundled/test-cases/v2/v2-486-creation-init-general-mailchimp/task.json +30 -0
  310. clawbench/_bundled/test-cases/v2/v2-487-creation-init-general-typeform/extra_info/survey_questions.json +85 -0
  311. clawbench/_bundled/test-cases/v2/v2-487-creation-init-general-typeform/task.json +30 -0
  312. clawbench/_bundled/test-cases/v2/v2-488-creation-init-general-substack/extra_info/content.json +3 -0
  313. clawbench/_bundled/test-cases/v2/v2-488-creation-init-general-substack/task.json +30 -0
  314. clawbench/_bundled/test-cases/v2/v2-500-office-secretary-tasks-signup-doodle/task.json +25 -0
  315. clawbench/_bundled/test-cases/v2/v2-501-office-secretary-tasks-signup-doodle/task.json +25 -0
  316. clawbench/_bundled/test-cases/v2/v2-502-office-secretary-tasks-calendar-doodle/task.json +25 -0
  317. clawbench/_bundled/test-cases/v2/v2-503-office-secretary-tasks-calendar-doodle/task.json +25 -0
  318. clawbench/_bundled/test-cases/v2/v2-520-shopping-retail-target/task.json +25 -0
  319. clawbench/_bundled/test-cases/v2/v2-521-shopping-retail-target/task.json +25 -0
  320. clawbench/_bundled/test-cases/v2/v2-522-shopping-retail-target/task.json +25 -0
  321. clawbench/_bundled/test-cases/v2/v2-523-shopping-retail-target/task.json +25 -0
  322. clawbench/_bundled/test-cases/v2/v2-530-shopping-marketplace-etsy/task.json +25 -0
  323. clawbench/_bundled/test-cases/v2/v2-531-shopping-marketplace-etsy/task.json +25 -0
  324. clawbench/_bundled/test-cases/v2/v2-533-daily-life-utilities-inmyarea/task.json +25 -0
  325. clawbench/_bundled/test-cases/v2/v2-535-daily-life-shopping-etsy/task.json +25 -0
  326. clawbench/_bundled/test-cases/v2/v2-536-daily-life-shopping-etsy/task.json +25 -0
  327. clawbench/_bundled/test-cases/v2/v2-560/task.json +25 -0
  328. clawbench/_bundled/test-cases/v2/v2-564/task.json +25 -0
  329. clawbench/_bundled/test-cases/v2/v2-571-job-search-hr-recruitment-mgmt-workable/task.json +25 -0
  330. clawbench/_bundled/test-cases/v2/v2-583-office-secretary-tasks-support-tickets-freshdesk/task.json +25 -0
  331. clawbench/_bundled/test-cases/v2/v2-596-daily-life-fitness-strava/task.json +25 -0
  332. clawbench/_bundled/test-cases/v2/v2-597-daily-life-fitness-strava/task.json +25 -0
  333. clawbench/_bundled/test-cases/v2/v2-598-academia-research-legal-docs-formswift/task.json +25 -0
  334. clawbench/_bundled/test-cases/v2/v2-600-hobbies-crafts-community-ravelry/task.json +25 -0
  335. clawbench/_bundled/test-cases/v2/v2-601-hobbies-gaming-reviews-ravelry/task.json +25 -0
  336. clawbench/_bundled/test-cases/v2/v2-602-hobbies-crafts-community-ravelry/task.json +25 -0
  337. clawbench/_bundled/test-cases/v2/v2-603-hobbies-crafts-community-ravelry/task.json +25 -0
  338. clawbench/_bundled/test-cases/v2/v2-607-hobbies-gaming-reviews-boardgamegeek/task.json +25 -0
  339. clawbench/_bundled/test-cases/v2/v2-608-education-learning-kids-courses-outschool/task.json +25 -0
  340. clawbench/_bundled/test-cases/v2/v2-609-education-learning-meditation-spirit-rock-meditation-center/task.json +25 -0
  341. clawbench/_bundled/test-cases/v2/v2-610-hobbies-gaming-reviews-boardgamegeek/task.json +25 -0
  342. clawbench/_bundled/test-cases/v2/v2-630-daily-life-productivity-habitica/task.json +25 -0
  343. clawbench/_bundled/test-cases/v2/v2-631-daily-life-productivity-habitica/task.json +25 -0
  344. clawbench/_bundled/test-cases/v2/v2-633-daily-life-productivity-habitica/task.json +25 -0
  345. clawbench/_bundled/test-cases/v2/v2-634-daily-life-productivity-habitica/task.json +25 -0
  346. clawbench/_bundled/test-cases/v2/v2-635-entertainment-tracking-trakt/task.json +25 -0
  347. clawbench/_bundled/test-cases/v2/v2-638-entertainment-tracking-trakt/task.json +25 -0
  348. clawbench/_bundled/test-cases/v2/v2-705-rating-voting-wine-review-vivino/task.json +25 -0
  349. clawbench/_bundled/test-cases/v2/v2-706-rating-voting-beer-review-beeradvocate/task.json +25 -0
  350. clawbench/_bundled/test-cases/v2/v2-707-rating-voting-social-wine-untappd/task.json +25 -0
  351. clawbench/_bundled/test-cases/v2/v2-708-rating-voting-professor-review-ratemyprofessors/task.json +28 -0
  352. clawbench/_bundled/test-cases/v2/v2-711-creation-init-color-design-coolors/task.json +25 -0
  353. clawbench/_bundled/test-cases/v2/v2-735-home-services-maintenance-house-cleaning-bark/task.json +25 -0
  354. clawbench/_bundled/test-cases/v2/v2-737-home-services-maintenance-kitchen-remodel-lowes/task.json +25 -0
  355. clawbench/_bundled/test-cases/v2/v2-763-automotive-vehicle-services-car-lease-autoslash/task.json +25 -0
  356. clawbench/_bundled/test-cases/v2/v2-774-nonprofit-charity-nonprofit-job-apply-charity-village/task.json +25 -0
  357. clawbench/_bundled/test-cases/v2/v2-776-nonprofit-charity-volunteer-signup-idealist/task.json +25 -0
  358. clawbench/_bundled/test-cases/v2/v2-794-beauty-personal-care-salon-booking-styleseat/task.json +25 -0
  359. clawbench/_bundled/test-cases/v2/v2-795-pet-animal-care-pet-adoption-aspca/task.json +25 -0
  360. clawbench/_bundled/test-cases/v2/v2-815-pet-animal-care-favorite-pet/task.json +28 -0
  361. clawbench/_bundled/test-cases/v2/v2-816-pet-animal-care-remove-favorite/task.json +28 -0
  362. clawbench/_bundled/test-cases/v2/v2-817-pet-animal-care-create-adopter-profile/task.json +28 -0
  363. clawbench/_bundled/test-cases/v2/v2-901-entertainment-imdb-add-to-watchlist/task.json +28 -0
  364. clawbench/_bundled/test-cases/v2/v2-902-entertainment-imdb-rate-title/task.json +28 -0
  365. clawbench/_bundled/test-cases/v2/v2-903-entertainment-imdb-remove-rating/task.json +28 -0
  366. clawbench/_bundled/test-cases/v2/v2-904-entertainment-imdb-create-list/task.json +28 -0
  367. clawbench/_bundled/test-cases/v2/v2-905-entertainment-imdb-add-to-list/task.json +28 -0
  368. clawbench/runner/__init__.py +1 -0
  369. clawbench/runner/batch.py +752 -0
  370. clawbench/runner/run.py +1607 -0
  371. clawbench/runtime/chrome-extension/README.md +127 -0
  372. clawbench/runtime/chrome-extension/background.js +56 -0
  373. clawbench/runtime/chrome-extension/content.js +70 -0
  374. clawbench/runtime/chrome-extension/manifest.json +25 -0
  375. clawbench/runtime/chrome-extension/setup.sh +27 -0
  376. clawbench/runtime/chrome-extension/stealth.js +200 -0
  377. clawbench/runtime/extension-server/README.md +61 -0
  378. clawbench/runtime/extension-server/pyproject.toml +13 -0
  379. clawbench/runtime/extension-server/server.py +395 -0
  380. clawbench/runtime/extension-server/uv.lock +284 -0
  381. clawbench/runtime/harnesses/base/Dockerfile.base +40 -0
  382. clawbench/runtime/harnesses/base/entrypoint.sh +283 -0
  383. clawbench/runtime/harnesses/browser-use/Dockerfile.browser-use +9 -0
  384. clawbench/runtime/harnesses/browser-use/run-browser-use-agent.py +133 -0
  385. clawbench/runtime/harnesses/browser-use/run-browser-use.sh +136 -0
  386. clawbench/runtime/harnesses/browser-use/setup-browser-use.sh +109 -0
  387. clawbench/runtime/harnesses/claude-code/Dockerfile.claude-code +21 -0
  388. clawbench/runtime/harnesses/claude-code/run-claude-code.sh +152 -0
  389. clawbench/runtime/harnesses/claude-code/setup-claude-code.sh +127 -0
  390. clawbench/runtime/harnesses/claude-code-chrome-extension/Dockerfile.claude-code-chrome-extension +466 -0
  391. clawbench/runtime/harnesses/claude-code-chrome-extension/mock-anthropic-api.py +113 -0
  392. clawbench/runtime/harnesses/claude-code-chrome-extension/run-claude-code-chrome-extension.sh +254 -0
  393. clawbench/runtime/harnesses/claude-code-chrome-extension/setup-claude-code-chrome-extension.sh +161 -0
  394. clawbench/runtime/harnesses/claw-code/Dockerfile.claw-code +49 -0
  395. clawbench/runtime/harnesses/claw-code/claw-code-ndjson.patch.py +655 -0
  396. clawbench/runtime/harnesses/claw-code/run-claw-code.sh +167 -0
  397. clawbench/runtime/harnesses/claw-code/setup-claw-code.sh +154 -0
  398. clawbench/runtime/harnesses/codex/Dockerfile.codex +27 -0
  399. clawbench/runtime/harnesses/codex/run-codex.sh +158 -0
  400. clawbench/runtime/harnesses/codex/setup-codex.sh +157 -0
  401. clawbench/runtime/harnesses/hermes/Dockerfile.hermes +19 -0
  402. clawbench/runtime/harnesses/hermes/hermes-capture.py +205 -0
  403. clawbench/runtime/harnesses/hermes/run-hermes.sh +339 -0
  404. clawbench/runtime/harnesses/hermes/setup-hermes.sh +176 -0
  405. clawbench/runtime/harnesses/openclaw/Dockerfile.openclaw +20 -0
  406. clawbench/runtime/harnesses/openclaw/run-openclaw.sh +138 -0
  407. clawbench/runtime/harnesses/openclaw/setup-openclaw.sh +153 -0
  408. clawbench/runtime/harnesses/opencode/Dockerfile.opencode +18 -0
  409. clawbench/runtime/harnesses/opencode/run-opencode.sh +125 -0
  410. clawbench/runtime/harnesses/opencode/setup-opencode.sh +163 -0
  411. clawbench/runtime/shared/alex_green_personal_info.json +451 -0
  412. clawbench/tui.py +1704 -0
  413. clawbench/utils/__init__.py +1 -0
  414. clawbench/utils/generate_resume_pdf.py +162 -0
  415. clawbench/utils/hf_upload.py +78 -0
  416. clawbench/utils/paths.py +84 -0
  417. clawbench/utils/resume_template.json +104 -0
  418. clawbenchmark-0.2.0.dist-info/METADATA +735 -0
  419. clawbenchmark-0.2.0.dist-info/RECORD +423 -0
  420. clawbenchmark-0.2.0.dist-info/WHEEL +4 -0
  421. clawbenchmark-0.2.0.dist-info/entry_points.txt +4 -0
  422. clawbenchmark-0.2.0.dist-info/licenses/LICENSE +201 -0
  423. clawbenchmark-0.2.0.dist-info/licenses/NOTICE +12 -0
clawbench/__init__.py ADDED
@@ -0,0 +1 @@
1
+ """ClawBench Python package."""
@@ -0,0 +1,7 @@
1
+ PURELY_MAIL_API_KEY="pm-live-4c2a5524-392b-4117-a722-0aab7a3bf885"
2
+ PURELY_MAIL_DOMAIN="clawbench.cc"
3
+ THINKING_LEVEL="medium"
4
+
5
+ # Optional: HuggingFace dataset upload
6
+ # HF_TOKEN="hf_..."
7
+ # HF_REPO_ID="your-org/your-dataset-name"
@@ -0,0 +1,44 @@
1
+ {
2
+ "$schema": "https://json-schema.org/draft/2020-12/schema",
3
+ "description": "Schema for a single model entry in models/models.yaml. The YAML key is the model name.",
4
+ "type": "object",
5
+ "required": ["base_url", "api_type"],
6
+ "properties": {
7
+ "api_key": {
8
+ "type": "string",
9
+ "description": "API key for the provider"
10
+ },
11
+ "api_keys": {
12
+ "type": "array",
13
+ "items": { "type": "string" },
14
+ "description": "Multiple API keys for round-robin rotation (takes precedence over api_key)"
15
+ },
16
+ "thinking_level": {
17
+ "type": "string",
18
+ "enum": ["off", "minimal", "low", "medium", "high", "xhigh", "adaptive"],
19
+ "description": "Reasoning depth for the model"
20
+ },
21
+ "temperature": {
22
+ "type": "number",
23
+ "minimum": 0,
24
+ "maximum": 2,
25
+ "description": "Sampling temperature"
26
+ },
27
+ "max_tokens": {
28
+ "type": "integer",
29
+ "minimum": 1,
30
+ "description": "Maximum output tokens"
31
+ },
32
+ "base_url": {
33
+ "type": "string",
34
+ "format": "uri",
35
+ "description": "API base URL (e.g. https://api.openai.com/v1)"
36
+ },
37
+ "api_type": {
38
+ "type": "string",
39
+ "enum": ["anthropic-messages", "openai-responses", "openai-completions", "google-generative-ai"],
40
+ "description": "API type for the provider endpoint"
41
+ }
42
+ },
43
+ "additionalProperties": false
44
+ }
@@ -0,0 +1,16 @@
1
+ # Copy to models/models.yaml and fill in your API keys.
2
+ # Each top-level key is the model name (passed as MODEL_NAME to the container).
3
+
4
+ qwen3.5-397b-a17b:
5
+ api_key: "sk-or-v1-..."
6
+ base_url: https://openrouter.ai/api/v1
7
+ api_type: openai-completions
8
+ thinking_level: medium # optional
9
+
10
+ # For multiple API keys (round-robin), use api_keys instead of api_key:
11
+ # some-model:
12
+ # api_keys:
13
+ # - "key1"
14
+ # - "key2"
15
+ # base_url: https://api.openai.com/v1
16
+ # api_type: openai-completions
@@ -0,0 +1,132 @@
1
+ {
2
+ "$schema": "https://json-schema.org/draft/2020-12/schema",
3
+ "$id": "task.schema.json",
4
+ "title": "ClawBench Test Case",
5
+ "description": "Schema for ClawBench test case task.json files",
6
+ "type": "object",
7
+ "properties": {
8
+ "$schema": true,
9
+ "metadata": {
10
+ "type": "object",
11
+ "description": "Human-readable metadata for documentation purposes (not read by the agent)",
12
+ "properties": {
13
+ "task_id": {
14
+ "type": "integer",
15
+ "description": "Unique numeric identifier for the test case"
16
+ },
17
+ "metaclass": {
18
+ "type": "string",
19
+ "description": "High-level category of the test case"
20
+ },
21
+ "class": {
22
+ "type": "string",
23
+ "description": "Granular sub-category of the test case"
24
+ },
25
+ "description": {
26
+ "type": "string",
27
+ "description": "Human-readable description of the test case"
28
+ },
29
+ "sites_involved": {
30
+ "type": "array",
31
+ "description": "Site domains involved in the test case (e.g., google.com, uber.com, github.com)",
32
+ "items": {
33
+ "type": "string"
34
+ }
35
+ },
36
+ "platform": {
37
+ "type": "string",
38
+ "description": "Platform involved in the test case (e.g., google, uber, github)"
39
+ },
40
+ "common_info": {
41
+ "type": "object",
42
+ "description": "Common information that is shared among all test cases",
43
+ "properties": {
44
+ "email_credentials": {
45
+ "const": "credentials to use the assigned disposable email account"
46
+ },
47
+ "user_info": {
48
+ "const": "alex_green_personal_info.json; the dummy user's personal information"
49
+ },
50
+ "user_resume": {
51
+ "const": "PDF resume with disposable email account injected"
52
+ }
53
+ },
54
+ "required": ["email_credentials", "user_info", "user_resume"],
55
+ "additionalProperties": false
56
+ }
57
+ },
58
+ "additionalProperties": true,
59
+ "required": [
60
+ "task_id",
61
+ "metaclass",
62
+ "class",
63
+ "description",
64
+ "sites_involved",
65
+ "platform",
66
+ "common_info"
67
+ ]
68
+ },
69
+ "instruction": {
70
+ "type": "string",
71
+ "description": "Task prompt sent to the agent"
72
+ },
73
+ "eval_schema": {
74
+ "type": "object",
75
+ "description": "Configuration for the request interceptor. The interceptor blocks HTTP requests matching the URL pattern, method, and optional body/params filters, preventing irreversible actions (checkout, submission, etc.) from reaching the server.",
76
+ "properties": {
77
+ "url_pattern": {
78
+ "type": "string",
79
+ "description": "Regex pattern the request URL must match to be blocked by the interceptor"
80
+ },
81
+ "method": {
82
+ "type": "string",
83
+ "enum": ["GET", "POST", "PUT", "PATCH", "DELETE"],
84
+ "description": "HTTP method the request must match to be blocked"
85
+ },
86
+ "body": {
87
+ "type": "object",
88
+ "description": "Key-value pairs that must match exactly in the request body. Used to disambiguate when URL + method alone isn't specific enough (e.g., same endpoint for login vs send)."
89
+ },
90
+ "params": {
91
+ "type": "object",
92
+ "description": "Key-value pairs that must match exactly in the URL query parameters. Used to disambiguate when URL + method alone isn't specific enough."
93
+ }
94
+ },
95
+ "required": ["url_pattern", "method"],
96
+ "additionalProperties": false
97
+ },
98
+ "time_limit": {
99
+ "type": "number",
100
+ "description": "Maximum time in minutes before the driver stops the container",
101
+ "minimum": 1
102
+ },
103
+ "extra_info": {
104
+ "type": "array",
105
+ "description": "Additional context injected into the agent prompt",
106
+ "items": {
107
+ "type": "object",
108
+ "properties": {
109
+ "path": {
110
+ "type": "string",
111
+ "description": "Relative path to a file in the test case directory (optional)"
112
+ },
113
+ "description": {
114
+ "type": "string",
115
+ "description": "Description text injected into the agent prompt"
116
+ }
117
+ },
118
+ "required": [
119
+ "path",
120
+ "description"
121
+ ],
122
+ "additionalProperties": false
123
+ }
124
+ }
125
+ },
126
+ "required": [
127
+ "instruction",
128
+ "eval_schema",
129
+ "time_limit"
130
+ ],
131
+ "additionalProperties": false
132
+ }
@@ -0,0 +1,25 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 1,
5
+ "metaclass": "daily-life",
6
+ "class": "food",
7
+ "description": "On Uber Eats, order delivery: one Pad Thai, deliver to home address, note \"no peanuts\"",
8
+ "sites_involved": [
9
+ "ubereats.com"
10
+ ],
11
+ "platform": "uber-eats",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "On Uber Eats, order delivery: one Pad Thai, deliver to home address, note \"no peanuts\"",
19
+ "eval_schema": {
20
+ "url_pattern": "__PLACEHOLDER_WILL_NOT_MATCH__",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": []
25
+ }
@@ -0,0 +1,25 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 2,
5
+ "metaclass": "daily-life",
6
+ "class": "food",
7
+ "description": "On DoorDash, order delivery: one Big Mac + two 10 pc McNuggets, select fastest delivery",
8
+ "sites_involved": [
9
+ "doordash.com"
10
+ ],
11
+ "platform": "doordash",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "On DoorDash, order delivery: one Big Mac + two 10 pc McNuggets, select fastest delivery",
19
+ "eval_schema": {
20
+ "url_pattern": "__PLACEHOLDER_WILL_NOT_MATCH__",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": []
25
+ }
@@ -0,0 +1,36 @@
1
+ {
2
+ "items": [
3
+ {
4
+ "name": "Whole milk (1 gallon)",
5
+ "quantity": 1,
6
+ "category": "dairy"
7
+ },
8
+ {
9
+ "name": "Large eggs (dozen)",
10
+ "quantity": 1,
11
+ "category": "dairy"
12
+ },
13
+ {
14
+ "name": "Whole wheat bread",
15
+ "quantity": 1,
16
+ "category": "bakery"
17
+ },
18
+ {
19
+ "name": "Chicken breast (boneless, skinless)",
20
+ "quantity": "2 lbs",
21
+ "category": "meat"
22
+ },
23
+ {
24
+ "name": "Broccoli (fresh)",
25
+ "quantity": "1 bunch",
26
+ "category": "produce"
27
+ },
28
+ {
29
+ "name": "Bananas",
30
+ "quantity": "1 bunch (6-7)",
31
+ "category": "produce"
32
+ }
33
+ ],
34
+ "delivery_preference": "cheapest available window",
35
+ "store_preference": "nearest"
36
+ }
@@ -0,0 +1,30 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 4,
5
+ "metaclass": "daily-life",
6
+ "class": "food",
7
+ "description": "Place an Instacart order for a week's groceries: milk, eggs, whole wheat bread, chicken breast, broccoli, bananas; select the cheapest delivery window",
8
+ "sites_involved": [
9
+ "instacart.com"
10
+ ],
11
+ "platform": "instacart",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Place an Instacart order for a week's groceries: milk, eggs, whole wheat bread, chicken breast, broccoli, bananas; select the cheapest delivery window",
19
+ "eval_schema": {
20
+ "url_pattern": "__PLACEHOLDER_WILL_NOT_MATCH__",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": [
25
+ {
26
+ "path": "extra_info/grocery_list.json",
27
+ "description": "Weekly grocery list with items, quantities, and categories"
28
+ }
29
+ ]
30
+ }
@@ -0,0 +1,24 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 6,
5
+ "metaclass": "daily-life",
6
+ "class": "food",
7
+ "description": "On Uber Eats, order a vegan delivery (labeled vegan), deliver to office address",
8
+ "sites_involved": [
9
+ "ubereats.com"
10
+ ],
11
+ "platform": "uber-eats",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "On Uber Eats, order a vegan delivery (labeled vegan), deliver to office address",
19
+ "eval_schema": {
20
+ "url_pattern": "__PLACEHOLDER_WILL_NOT_MATCH__",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30
24
+ }
@@ -0,0 +1,21 @@
1
+ {
2
+ "week_plan": [
3
+ {
4
+ "day": "Monday",
5
+ "breakfast": "Greek yogurt with granola",
6
+ "lunch": "Grilled chicken salad",
7
+ "dinner": "Salmon with steamed broccoli and brown rice"
8
+ },
9
+ {
10
+ "day": "Tuesday",
11
+ "breakfast": "Overnight oats with bananas",
12
+ "lunch": "Turkey wrap with veggies",
13
+ "dinner": "Pasta primavera with garlic bread"
14
+ }
15
+ ],
16
+ "dietary_restrictions": [
17
+ "no shellfish (allergy)",
18
+ "low sodium preferred"
19
+ ],
20
+ "servings_per_meal": 1
21
+ }
@@ -0,0 +1,30 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 7,
5
+ "metaclass": "daily-life",
6
+ "class": "food",
7
+ "description": "On Instacart, purchase all ingredients for 2-day meal plan recipes, with the nearest supermarket auto-selected",
8
+ "sites_involved": [
9
+ "instacart.com"
10
+ ],
11
+ "platform": "instacart",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "On Instacart, purchase all ingredients for 2-day meal plan recipes, with the nearest supermarket auto-selected",
19
+ "eval_schema": {
20
+ "url_pattern": "__PLACEHOLDER_WILL_NOT_MATCH__",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": [
25
+ {
26
+ "path": "extra_info/meal_plan.json",
27
+ "description": "2-day meal plan with recipes and dietary restrictions"
28
+ }
29
+ ]
30
+ }
@@ -0,0 +1,25 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 11,
5
+ "metaclass": "daily-life",
6
+ "class": "housing",
7
+ "description": "Search Zillow for a one-bedroom apartment in Toronto downtown under $3500/month, select one and submit a rental application",
8
+ "sites_involved": [
9
+ "zillow.com"
10
+ ],
11
+ "platform": "zillow",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Search Zillow for a one-bedroom apartment in Toronto downtown under $3500/month, select one and submit a rental application",
19
+ "eval_schema": {
20
+ "url_pattern": "zillow\\.com/rentals/api/rcf/v1/rcf",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": []
25
+ }
@@ -0,0 +1,26 @@
1
+ {
2
+ "listing_title": "Bright 1BR in Toronto Annex, Furnished, July-August Sublet",
3
+ "description": "Spacious furnished one-bedroom apartment in the heart of Toronto's Annex neighborhood. Walking distance to U of T campus, TTC subway, and Bloor Street shops and restaurants. The unit features hardwood floors, in-suite laundry, a fully equipped kitchen, and a sunny south-facing balcony. Perfect for visiting scholars or summer interns.",
4
+ "price": 2400,
5
+ "currency": "CAD",
6
+ "period": "monthly",
7
+ "available_from": "2026-07-01",
8
+ "available_to": "2026-08-31",
9
+ "furnished": true,
10
+ "bedrooms": 1,
11
+ "bathrooms": 1,
12
+ "amenities": [
13
+ "In-suite laundry",
14
+ "Dishwasher",
15
+ "Balcony",
16
+ "Air conditioning",
17
+ "WiFi included"
18
+ ],
19
+ "photos": [
20
+ "living_room.jpg",
21
+ "bedroom.jpg",
22
+ "kitchen.jpg",
23
+ "balcony.jpg"
24
+ ],
25
+ "contact_email": "alex.green.uoft@clawbench.cc"
26
+ }
@@ -0,0 +1,30 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 15,
5
+ "metaclass": "daily-life",
6
+ "class": "housing",
7
+ "description": "Post a sublet listing on Craigslist: one-bedroom near Toronto Annex, $2400/month, July-August, furnished",
8
+ "sites_involved": [
9
+ "craigslist.org"
10
+ ],
11
+ "platform": "craigslist",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Post a sublet listing on Craigslist: one-bedroom near Toronto Annex, $2400/month, July-August, furnished",
19
+ "eval_schema": {
20
+ "url_pattern": "post\\.craigslist\\.org/k/",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": [
25
+ {
26
+ "path": "extra_info/listing_details.json",
27
+ "description": "Sublet listing details including description, amenities, and photos"
28
+ }
29
+ ]
30
+ }
@@ -0,0 +1,25 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 35,
5
+ "metaclass": "daily-life",
6
+ "class": "health-medical",
7
+ "description": "Sign up on BetterHelp, book a counseling session, and complete the initial questionnaire",
8
+ "sites_involved": [
9
+ "betterhelp.com"
10
+ ],
11
+ "platform": "betterhelp",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Sign up on BetterHelp, book a counseling session, and complete the initial questionnaire",
19
+ "eval_schema": {
20
+ "url_pattern": "__PLACEHOLDER_WILL_NOT_MATCH__",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": []
25
+ }
@@ -0,0 +1,25 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 41,
5
+ "metaclass": "daily-life",
6
+ "class": "pets",
7
+ "description": "Book daytime dog walking service on Rover for Monday through Friday next week, large dog (Golden Retriever)",
8
+ "sites_involved": [
9
+ "rover.com"
10
+ ],
11
+ "platform": "rover",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Book daytime dog walking service on Rover for Monday through Friday next week, large dog (Golden Retriever)",
19
+ "eval_schema": {
20
+ "url_pattern": "rover\\.com/api/v7/people/.+/services/dog-walking/contactability",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": []
25
+ }
@@ -0,0 +1,12 @@
1
+ {
2
+ "name": "Maple",
3
+ "species": "Dog",
4
+ "breed": "Golden Retriever",
5
+ "age_years": 4,
6
+ "weight_lbs": 35,
7
+ "sex": "Female (spayed)",
8
+ "date_of_birth": "2022-03-15",
9
+ "vaccinations_up_to_date": true,
10
+ "microchip_id": "985121012345678",
11
+ "dietary_notes": "Grain-free kibble, sensitive stomach"
12
+ }
@@ -0,0 +1,30 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 43,
5
+ "metaclass": "daily-life",
6
+ "class": "pets",
7
+ "description": "Book 5-day pet boarding next month on Rover (medium-sized dog), sitter rated 4.8+",
8
+ "sites_involved": [
9
+ "rover.com"
10
+ ],
11
+ "platform": "rover",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Book 5-day pet boarding next month on Rover (medium-sized dog), sitter rated 4.8+",
19
+ "eval_schema": {
20
+ "url_pattern": "rover\\.com/api/v\\d+/people/[^/]+/services/overnight-boarding/contactability",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": [
25
+ {
26
+ "path": "extra_info/pet_info.json",
27
+ "description": "Pet information for Alex Green's dog Maple (Golden Retriever, 4 years, 35 lbs)"
28
+ }
29
+ ]
30
+ }
@@ -0,0 +1,25 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 45,
5
+ "metaclass": "daily-life",
6
+ "class": "personal-care",
7
+ "description": "Book a women's haircut on Booksy for the upcoming Saturday afternoon",
8
+ "sites_involved": [
9
+ "booksy.com"
10
+ ],
11
+ "platform": "booksy",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Book a women's haircut on Booksy for the upcoming Saturday afternoon",
19
+ "eval_schema": {
20
+ "url_pattern": "booksy\\.com/core/v\\d+/customer_api/me/appointments/business/\\d+/?$",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": []
25
+ }
@@ -0,0 +1,7 @@
1
+ {
2
+ "note": "Use home address from alex_green_personal_info.json",
3
+ "move out address": "Unit 1208, 664 Spadina Ave, Toronto, ON M5S 2H7, Canada",
4
+ "move in address": "450 Front St W, Toronto, ON M5V 0V7",
5
+ "Task size": "Large",
6
+ "Need Vehicle": "Yes, a Car"
7
+ }
@@ -0,0 +1,30 @@
1
+ {
2
+ "$schema": "../../task.schema.json",
3
+ "metadata": {
4
+ "task_id": 47,
5
+ "metaclass": "daily-life",
6
+ "class": "personal-care",
7
+ "description": "Find a moving helper on TaskRabbit, next Saturday 9am-1pm, 1 bedroom apartment",
8
+ "sites_involved": [
9
+ "taskrabbit.com"
10
+ ],
11
+ "platform": "taskrabbit",
12
+ "common_info": {
13
+ "email_credentials": "credentials to use the assigned disposable email account",
14
+ "user_info": "alex_green_personal_info.json; the dummy user's personal information",
15
+ "user_resume": "PDF resume with disposable email account injected"
16
+ }
17
+ },
18
+ "instruction": "Find a moving helper on TaskRabbit, next Saturday 9am-1pm, 1 bedroom apartment",
19
+ "eval_schema": {
20
+ "url_pattern": "taskrabbit\\.(com|ca)/(api/v\\d+/jobs|book/\\d+/confirm)",
21
+ "method": "POST"
22
+ },
23
+ "time_limit": 30,
24
+ "extra_info": [
25
+ {
26
+ "path": "extra_info/address_info.json",
27
+ "description": "Address information (references alex_green_personal_info.json)"
28
+ }
29
+ ]
30
+ }
@@ -0,0 +1,5 @@
1
+ {
2
+ "job_url": "https://boards.greenhouse.io/example/jobs/1234567",
3
+ "job_title": "Senior Software Engineer",
4
+ "company": "Example Corp"
5
+ }