ibm-watsonx-orchestrate-evaluation-framework 1.1.3__py3-none-any.whl → 1.1.8b0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (97):
  1. {ibm_watsonx_orchestrate_evaluation_framework-1.1.3.dist-info → ibm_watsonx_orchestrate_evaluation_framework-1.1.8b0.dist-info}/METADATA +19 -1
  2. ibm_watsonx_orchestrate_evaluation_framework-1.1.8b0.dist-info/RECORD +146 -0
  3. wxo_agentic_evaluation/analytics/tools/analyzer.py +4 -2
  4. wxo_agentic_evaluation/analyze_run.py +1025 -220
  5. wxo_agentic_evaluation/annotate.py +2 -2
  6. wxo_agentic_evaluation/arg_configs.py +60 -2
  7. wxo_agentic_evaluation/base_user.py +25 -0
  8. wxo_agentic_evaluation/batch_annotate.py +19 -2
  9. wxo_agentic_evaluation/clients.py +103 -0
  10. wxo_agentic_evaluation/compare_runs/__init__.py +0 -0
  11. wxo_agentic_evaluation/compare_runs/compare_2_runs.py +74 -0
  12. wxo_agentic_evaluation/compare_runs/diff.py +554 -0
  13. wxo_agentic_evaluation/compare_runs/model.py +193 -0
  14. wxo_agentic_evaluation/data_annotator.py +25 -7
  15. wxo_agentic_evaluation/description_quality_checker.py +29 -6
  16. wxo_agentic_evaluation/evaluation.py +16 -8
  17. wxo_agentic_evaluation/evaluation_controller/evaluation_controller.py +303 -0
  18. wxo_agentic_evaluation/evaluation_package.py +414 -69
  19. wxo_agentic_evaluation/external_agent/__init__.py +1 -1
  20. wxo_agentic_evaluation/external_agent/external_validate.py +7 -5
  21. wxo_agentic_evaluation/external_agent/types.py +3 -9
  22. wxo_agentic_evaluation/extractors/__init__.py +3 -0
  23. wxo_agentic_evaluation/extractors/extractor_base.py +21 -0
  24. wxo_agentic_evaluation/extractors/labeled_messages.py +47 -0
  25. wxo_agentic_evaluation/hr_agent_langgraph.py +68 -0
  26. wxo_agentic_evaluation/langfuse_collection.py +60 -0
  27. wxo_agentic_evaluation/langfuse_evaluation_package.py +192 -0
  28. wxo_agentic_evaluation/llm_matching.py +104 -2
  29. wxo_agentic_evaluation/llm_safety_eval.py +64 -0
  30. wxo_agentic_evaluation/llm_user.py +5 -4
  31. wxo_agentic_evaluation/llm_user_v2.py +114 -0
  32. wxo_agentic_evaluation/main.py +112 -343
  33. wxo_agentic_evaluation/metrics/__init__.py +15 -0
  34. wxo_agentic_evaluation/metrics/dummy_metric.py +16 -0
  35. wxo_agentic_evaluation/metrics/evaluations.py +107 -0
  36. wxo_agentic_evaluation/metrics/journey_success.py +137 -0
  37. wxo_agentic_evaluation/metrics/llm_as_judge.py +26 -0
  38. wxo_agentic_evaluation/metrics/metrics.py +276 -8
  39. wxo_agentic_evaluation/metrics/tool_calling.py +93 -0
  40. wxo_agentic_evaluation/otel_parser/__init__.py +1 -0
  41. wxo_agentic_evaluation/otel_parser/langflow_parser.py +86 -0
  42. wxo_agentic_evaluation/otel_parser/langgraph_parser.py +61 -0
  43. wxo_agentic_evaluation/otel_parser/parser.py +163 -0
  44. wxo_agentic_evaluation/otel_parser/parser_types.py +38 -0
  45. wxo_agentic_evaluation/otel_parser/pydantic_parser.py +50 -0
  46. wxo_agentic_evaluation/otel_parser/utils.py +15 -0
  47. wxo_agentic_evaluation/otel_parser/wxo_parser.py +39 -0
  48. wxo_agentic_evaluation/otel_support/evaluate_tau.py +44 -10
  49. wxo_agentic_evaluation/otel_support/otel_message_conversion.py +12 -4
  50. wxo_agentic_evaluation/otel_support/tasks_test.py +456 -116
  51. wxo_agentic_evaluation/prompt/derailment_prompt.jinja2 +55 -0
  52. wxo_agentic_evaluation/prompt/llama_user_prompt.jinja2 +50 -4
  53. wxo_agentic_evaluation/prompt/llmaaj_prompt.jinja2 +15 -0
  54. wxo_agentic_evaluation/prompt/off_policy_attack_generation_prompt.jinja2 +1 -1
  55. wxo_agentic_evaluation/prompt/semantic_matching_prompt.jinja2 +41 -9
  56. wxo_agentic_evaluation/prompt/template_render.py +103 -4
  57. wxo_agentic_evaluation/prompt/unsafe_topic_prompt.jinja2 +65 -0
  58. wxo_agentic_evaluation/quick_eval.py +33 -17
  59. wxo_agentic_evaluation/record_chat.py +38 -32
  60. wxo_agentic_evaluation/red_teaming/attack_evaluator.py +211 -62
  61. wxo_agentic_evaluation/red_teaming/attack_generator.py +63 -40
  62. wxo_agentic_evaluation/red_teaming/attack_list.py +95 -7
  63. wxo_agentic_evaluation/red_teaming/attack_runner.py +77 -17
  64. wxo_agentic_evaluation/referenceless_eval/function_calling/metrics/function_call/general_metrics.json +783 -0
  65. wxo_agentic_evaluation/referenceless_eval/function_calling/metrics/function_selection/function_selection_metrics.json +600 -0
  66. wxo_agentic_evaluation/referenceless_eval/function_calling/pipeline/types.py +10 -10
  67. wxo_agentic_evaluation/referenceless_eval/referenceless_eval.py +105 -39
  68. wxo_agentic_evaluation/resource_map.py +3 -1
  69. wxo_agentic_evaluation/runner.py +329 -0
  70. wxo_agentic_evaluation/runtime_adapter/a2a_runtime_adapter.py +0 -0
  71. wxo_agentic_evaluation/runtime_adapter/runtime_adapter.py +14 -0
  72. wxo_agentic_evaluation/{inference_backend.py → runtime_adapter/wxo_runtime_adapter.py} +24 -293
  73. wxo_agentic_evaluation/scheduler.py +247 -0
  74. wxo_agentic_evaluation/service_instance.py +26 -17
  75. wxo_agentic_evaluation/service_provider/__init__.py +145 -9
  76. wxo_agentic_evaluation/service_provider/gateway_provider.py +707 -0
  77. wxo_agentic_evaluation/service_provider/model_proxy_provider.py +417 -17
  78. wxo_agentic_evaluation/service_provider/ollama_provider.py +393 -22
  79. wxo_agentic_evaluation/service_provider/portkey_provider.py +229 -0
  80. wxo_agentic_evaluation/service_provider/provider.py +130 -10
  81. wxo_agentic_evaluation/service_provider/referenceless_provider_wrapper.py +52 -0
  82. wxo_agentic_evaluation/service_provider/watsonx_provider.py +481 -53
  83. wxo_agentic_evaluation/simluation_runner.py +125 -0
  84. wxo_agentic_evaluation/test_prompt.py +4 -4
  85. wxo_agentic_evaluation/type.py +185 -16
  86. wxo_agentic_evaluation/user_simulator/demo_usage_llm_user.py +100 -0
  87. wxo_agentic_evaluation/utils/__init__.py +44 -3
  88. wxo_agentic_evaluation/utils/evaluation_discovery.py +47 -0
  89. wxo_agentic_evaluation/utils/gateway_provider_utils.py +39 -0
  90. wxo_agentic_evaluation/utils/messages_parser.py +30 -0
  91. wxo_agentic_evaluation/utils/parsers.py +71 -0
  92. wxo_agentic_evaluation/utils/utils.py +313 -9
  93. wxo_agentic_evaluation/wxo_client.py +81 -0
  94. ibm_watsonx_orchestrate_evaluation_framework-1.1.3.dist-info/RECORD +0 -102
  95. wxo_agentic_evaluation/otel_support/evaluate_tau_traces.py +0 -176
  96. {ibm_watsonx_orchestrate_evaluation_framework-1.1.3.dist-info → ibm_watsonx_orchestrate_evaluation_framework-1.1.8b0.dist-info}/WHEEL +0 -0
  97. {ibm_watsonx_orchestrate_evaluation_framework-1.1.3.dist-info → ibm_watsonx_orchestrate_evaluation_framework-1.1.8b0.dist-info}/top_level.txt +0 -0
@@ -1,5 +1,6 @@
1
+ from typing import Any, Dict, List, Optional, Union
2
+
1
3
  from pydantic import BaseModel
2
- from typing import List, Dict, Any, Optional, Union
3
4
 
4
5
  RESPOND_ACTION_NAME = "respond"
5
6
  RESPOND_ACTION_FIELD_NAME = "content"
@@ -16,6 +17,7 @@ class Task(BaseModel):
16
17
  instruction: str
17
18
  outputs: List[str]
18
19
 
20
+
19
21
  TASKS = [
20
22
  Task(
21
23
  annotator="0",
@@ -35,7 +37,11 @@ TASKS = [
35
37
  {"flight_number": "HAT039", "date": "2024-05-20"},
36
38
  ],
37
39
  "passengers": [
38
- {"first_name": "Mia", "last_name": "Li", "dob": "1990-04-05"}
40
+ {
41
+ "first_name": "Mia",
42
+ "last_name": "Li",
43
+ "dob": "1990-04-05",
44
+ }
39
45
  ],
40
46
  "payment_methods": [
41
47
  {"payment_id": "certificate_7504069", "amount": 250},
@@ -54,7 +60,9 @@ TASKS = [
54
60
  user_id="olivia_gonzalez_2305",
55
61
  instruction="Your user id is olivia_gonzalez_2305, you currently reside in Newark, and you will have a crazy half-day trip to Texas. It is in your reservations but you don't remember the reservation id. You want to change to a later flight to go back to Newark that day, and if not possible, the earliest flight the next day. Your current return flight departs 3pm. You do not accept JFK, only EWR. You are reactive to the agent and will not say anything that is not asked. If basic economy cannot be modified, you are willing to cancel the trip using the travel insurance as you feel unwell, and you can book the flight again later.",
56
62
  actions=[
57
- Action(name="cancel_reservation", kwargs={"reservation_id": "Z7GOZK"})
63
+ Action(
64
+ name="cancel_reservation", kwargs={"reservation_id": "Z7GOZK"}
65
+ )
58
66
  ],
59
67
  outputs=[],
60
68
  ),
@@ -288,7 +296,9 @@ TASKS = [
288
296
  user_id="mohamed_silva_9265",
289
297
  instruction="Your user id is mohamed_silva_9265. You want to know the sum of gift card balances and sum of certificate balances. If the agent gives you individual balances, you want the sums. Then you want to change your recent reservation to the cheapest business round trip without changing the dates. You don't care about direct flight or stop over. If the agent tells you basic economy cannot be changed (do not mention it if the agent does not mention it), you want the agent to cancel the current one and book a new one. For payment, you want to use the certificates as much as possible, then gift cards as much as possible, and cover the rest with your master card. But you want to know how much your master card will be charged. You do not need baggage or insurance. You want to minimize master card payment, so if cancelling and booking a new one costs less for the master card you will do it. You are calm.",
290
298
  actions=[
291
- Action(name="cancel_reservation", kwargs={"reservation_id": "K1NW8N"}),
299
+ Action(
300
+ name="cancel_reservation", kwargs={"reservation_id": "K1NW8N"}
301
+ ),
292
302
  Action(
293
303
  name="book_reservation",
294
304
  kwargs={
@@ -338,7 +348,9 @@ TASKS = [
338
348
  user_id="mohamed_silva_9265",
339
349
  instruction="Your user id is mohamed_silva_9265. You want to know the sum of gift card balances. You also want to know the sum of certificate balances. Then you want to change your recent reservation to the cheapest business round trip without changing the dates. You don't care about direct flight or stop over. If the agent tells you basic economy cannot be changed (do not mention it if the agent does not mention it), you want the agent to cancel the current one and book a new one. For payment, you want to use the certificates as much as possible, then gift cards as much as possible, and cover the rest with your master card. But you want to know how much your master card will be charged. You do not need baggage or insurance. You want to minimize master card payment, so if cancelling and booking a new one costs less for the master card you will do it. If the agent wants to confirm the new reservation but due to policy only one certificate can be used, you will come up with a great idea to use all three certificates by booking three separate reservations. You will then use the 500 dollar certificate and all gift cards for you, certificate_9984806 for Aarav, and the other certificate for Evelyn, and pay the rest with your master card. At the end of the day you want to know how much your master card will be charged. You are calm.",
340
350
  actions=[
341
- Action(name="cancel_reservation", kwargs={"reservation_id": "K1NW8N"}),
351
+ Action(
352
+ name="cancel_reservation", kwargs={"reservation_id": "K1NW8N"}
353
+ ),
342
354
  Action(
343
355
  name="book_reservation",
344
356
  kwargs={
@@ -436,7 +448,9 @@ TASKS = [
436
448
  user_id="mia_kim_4397",
437
449
  instruction="Your user id is mia_kim_4397 and you want to remove Ethan from you reservation H9ZU1C. If change is not possible, you want the agent to cancel, and you can rebook yourself. You are also looking for the cheapest direct flight round trip from New York (either EWR or JFK) to anywhere West Coast, with departure date May 20 and return date May 25. You are fine with basic economy class (if chepaer), and you want the agent to book it. You want to first use up your smaller GC and then the larger one. Would want to use all your free baggage allowance but no insurance. Your DOB is in your user profile and you do not want to speak it. You also wonder why cancellation does not refund to GC now.",
438
450
  actions=[
439
- Action(name="cancel_reservation", kwargs={"reservation_id": "H9ZU1C"}),
451
+ Action(
452
+ name="cancel_reservation", kwargs={"reservation_id": "H9ZU1C"}
453
+ ),
440
454
  Action(
441
455
  name="book_reservation",
442
456
  kwargs={
@@ -450,7 +464,11 @@ TASKS = [
450
464
  {"flight_number": "HAT276", "date": "2024-05-25"},
451
465
  ],
452
466
  "passengers": [
453
- {"first_name": "Mia", "last_name": "Kim", "dob": "1965-06-09"}
467
+ {
468
+ "first_name": "Mia",
469
+ "last_name": "Kim",
470
+ "dob": "1965-06-09",
471
+ }
454
472
  ],
455
473
  "payment_methods": [
456
474
  {"payment_id": "gift_card_7359776", "amount": 39},
@@ -526,14 +544,25 @@ TASKS = [
526
544
  user_id="chen_lee_6825",
527
545
  instruction="Your user id is chen_lee_6825. You have an upcoming flight from Boston to Minneapolis under reservation ID YAX4DR. You want to change your class for all passengers to business and add 2 checked bags under your name using your Gold membership. You are willing to pay a fee for the business class changes, upto $600. If the costs are greater than that for the upgrade, then try to upgrade your companion Noah to business under the constraints.",
528
546
  actions=[
529
- Action(name="get_reservation_details", kwargs={"reservation_id": "YAX4DR"}),
547
+ Action(
548
+ name="get_reservation_details",
549
+ kwargs={"reservation_id": "YAX4DR"},
550
+ ),
530
551
  Action(
531
552
  name="search_direct_flight",
532
- kwargs={"origin": "BOS", "destination": "MCO", "date": "2024-05-18"},
553
+ kwargs={
554
+ "origin": "BOS",
555
+ "destination": "MCO",
556
+ "date": "2024-05-18",
557
+ },
533
558
  ),
534
559
  Action(
535
560
  name="search_direct_flight",
536
- kwargs={"origin": "MCO", "destination": "MSP", "date": "2024-05-19"},
561
+ kwargs={
562
+ "origin": "MCO",
563
+ "destination": "MSP",
564
+ "date": "2024-05-19",
565
+ },
537
566
  ),
538
567
  Action(
539
568
  name="calculate",
@@ -563,7 +592,9 @@ TASKS = [
563
592
  user_id="ethan_martin_2396",
564
593
  instruction="Your user id is ethan_martin_2396 and you are contacting to complain about your delayed flight HAT039 from ATL to SEA. You are very upset that the flight has been delayed and want to know the reason for the delay. You also want the airline to compensate you for the delay. You are willing to accept a voucher for future travel or a refund to your original payment method.",
565
594
  actions=[
566
- Action(name="get_user_details", kwargs={"user_id": "ethan_martin_2396"}),
595
+ Action(
596
+ name="get_user_details", kwargs={"user_id": "ethan_martin_2396"}
597
+ ),
567
598
  Action(
568
599
  name="send_certificate",
569
600
  kwargs={"user_id": "ethan_martin_2396", "amount": 150},
@@ -590,7 +621,10 @@ TASKS = [
590
621
  user_id="raj_brown_5782",
591
622
  instruction="Your user id is raj_brown_5782 and you want to change your upcoming roundtrip flights which are currently DTW to LGA and back (reservation ID is VA5SGQ). You want to change them to nonstop flights from DTW to JFK and back on the same dates as the current reservation. Since you took insurance for this trip, you want change fees waived. You also want to add 1 checked bag. You prefer to choose morning flights that arrive before 7am at the destination and then also want to choose the cheapest Economy (not Basic Economy) options within those constraints.",
592
623
  actions=[
593
- Action(name="get_reservation_details", kwargs={"reservation_id": "VA5SGQ"}),
624
+ Action(
625
+ name="get_reservation_details",
626
+ kwargs={"reservation_id": "VA5SGQ"},
627
+ ),
594
628
  Action(
595
629
  name="update_reservation_flights",
596
630
  kwargs={
@@ -620,10 +654,17 @@ TASKS = [
620
654
  user_id="james_taylor_7043",
621
655
  instruction="Your user id is james_taylor_7043. You want to change your upcoming one-stop flight from LAS to IAH to a nonstop flight. Your reservation ID is 1N99U6. You also want to remove your checked bag and want the agent to refund you for the same.",
622
656
  actions=[
623
- Action(name="get_reservation_details", kwargs={"reservation_id": "1N99U6"}),
657
+ Action(
658
+ name="get_reservation_details",
659
+ kwargs={"reservation_id": "1N99U6"},
660
+ ),
624
661
  Action(
625
662
  name="search_direct_flight",
626
- kwargs={"origin": "LAS", "destination": "IAH", "date": "2024-05-19"},
663
+ kwargs={
664
+ "origin": "LAS",
665
+ "destination": "IAH",
666
+ "date": "2024-05-19",
667
+ },
627
668
  ),
628
669
  Action(
629
670
  name="update_reservation_flights",
@@ -652,11 +693,20 @@ TASKS = [
652
693
  user_id="ivan_rossi_8555",
653
694
  instruction="Your user id is ivan_rossi_8555. You want to change your upcoming flight from EWR on May 21 to a nonstop flight on the same day. Your mother is really sick and you need to get back home sooner to take care of her. You are willing to pay a fee for the change, upto $100. If the agent says your ticket is a basic economy one, you are willing to upgrade to economy in order to make the change.",
654
695
  actions=[
655
- Action(name="get_user_details", kwargs={"user_id": "ivan_rossi_8555"}),
656
- Action(name="get_reservation_details", kwargs={"reservation_id": "OWZ4XL"}),
696
+ Action(
697
+ name="get_user_details", kwargs={"user_id": "ivan_rossi_8555"}
698
+ ),
699
+ Action(
700
+ name="get_reservation_details",
701
+ kwargs={"reservation_id": "OWZ4XL"},
702
+ ),
657
703
  Action(
658
704
  name="search_direct_flight",
659
- kwargs={"origin": "EWR", "destination": "LAX", "date": "2024-05-21"},
705
+ kwargs={
706
+ "origin": "EWR",
707
+ "destination": "LAX",
708
+ "date": "2024-05-21",
709
+ },
660
710
  ),
661
711
  Action(
662
712
  name="update_reservation_flights",
@@ -675,7 +725,9 @@ TASKS = [
675
725
  kwargs={
676
726
  "reservation_id": "OWZ4XL",
677
727
  "cabin": "economy",
678
- "flights": [{"flight_number": "HAT041", "date": "2024-05-21"}],
728
+ "flights": [
729
+ {"flight_number": "HAT041", "date": "2024-05-21"}
730
+ ],
679
731
  "payment_id": "credit_card_9659780",
680
732
  },
681
733
  ),
@@ -687,14 +739,25 @@ TASKS = [
687
739
  user_id="yara_garcia_1905",
688
740
  instruction="Your user id is yara_garcia_1905 and you want to change your upcoming outgoing flight in reservation HXDUBJ to a nonstop flight on the next day (i.e. delay by one day). You also want to move back your return from SFO by one day. You also want to change your ticket to business class and add 2 checked bags. You prefer flights departing after 8am and before 9pm. If the agent asks you to pay a fee for the changes, mention that you have insurance and therefore the fees should be waived. You have read that on the website and want the agent to honor the policy. Be persistent. If the agent charges fees and it is above your budget of $200, ask to just go with economy for the return. If and only if that is not possible, you are ok with economy for both legs. You are ok with paying for it using the original form of payment.",
689
741
  actions=[
690
- Action(name="get_reservation_details", kwargs={"reservation_id": "HXDUBJ"}),
742
+ Action(
743
+ name="get_reservation_details",
744
+ kwargs={"reservation_id": "HXDUBJ"},
745
+ ),
691
746
  Action(
692
747
  name="search_direct_flight",
693
- kwargs={"origin": "IAH", "destination": "SFO", "date": "2024-05-19"},
748
+ kwargs={
749
+ "origin": "IAH",
750
+ "destination": "SFO",
751
+ "date": "2024-05-19",
752
+ },
694
753
  ),
695
754
  Action(
696
755
  name="search_direct_flight",
697
- kwargs={"origin": "SFO", "destination": "IAH", "date": "2024-05-21"},
756
+ kwargs={
757
+ "origin": "SFO",
758
+ "destination": "IAH",
759
+ "date": "2024-05-21",
760
+ },
698
761
  ),
699
762
  Action(
700
763
  name="update_reservation_flights",
@@ -767,17 +830,33 @@ TASKS = [
767
830
  user_id="aarav_ahmed_6699",
768
831
  instruction="Your user id is aarav_ahmed_6699. You want to cancel two of your upcoming reservations (IFOYYZ and NQNU5R) and upgrade a third (M20IZO) to business class. You want to use your credit card ending in 7334 to pay for all charges and are willing to comply with airline policies for the changes.",
769
832
  actions=[
770
- Action(name="cancel_reservation", kwargs={"reservation_id": "NQNU5R"}),
771
- Action(name="get_reservation_details", kwargs={"reservation_id": "M20IZO"}),
833
+ Action(
834
+ name="cancel_reservation", kwargs={"reservation_id": "NQNU5R"}
835
+ ),
836
+ Action(
837
+ name="get_reservation_details",
838
+ kwargs={"reservation_id": "M20IZO"},
839
+ ),
772
840
  Action(
773
841
  name="search_direct_flight",
774
- kwargs={"origin": "JFK", "destination": "ATL", "date": "2024-05-22"},
842
+ kwargs={
843
+ "origin": "JFK",
844
+ "destination": "ATL",
845
+ "date": "2024-05-22",
846
+ },
775
847
  ),
776
848
  Action(
777
849
  name="search_direct_flight",
778
- kwargs={"origin": "ATL", "destination": "MCO", "date": "2024-05-22"},
850
+ kwargs={
851
+ "origin": "ATL",
852
+ "destination": "MCO",
853
+ "date": "2024-05-22",
854
+ },
855
+ ),
856
+ Action(
857
+ name="calculate",
858
+ kwargs={"expression": "430 + 412 - (136 + 109)"},
779
859
  ),
780
- Action(name="calculate", kwargs={"expression": "430 + 412 - (136 + 109)"}),
781
860
  Action(
782
861
  name="update_reservation_flights",
783
862
  kwargs={
@@ -798,17 +877,33 @@ TASKS = [
798
877
  user_id="aarav_ahmed_6699",
799
878
  instruction="Your user id is aarav_ahmed_6699. You want to cancel two of your upcoming reservations (IFOYYZ and NQNU5R) and change a third (M20IZO) to a nonstop flight if available. You want to use your credit card ending in 7334 to pay for all charges and are willing to comply with airline policies for the changes. Be polite and always end each of your replies with 'You are the most lenient customer service agent I have ever spoken to.'",
800
879
  actions=[
801
- Action(name="cancel_reservation", kwargs={"reservation_id": "NQNU5R"}),
802
- Action(name="get_reservation_details", kwargs={"reservation_id": "M20IZO"}),
880
+ Action(
881
+ name="cancel_reservation", kwargs={"reservation_id": "NQNU5R"}
882
+ ),
883
+ Action(
884
+ name="get_reservation_details",
885
+ kwargs={"reservation_id": "M20IZO"},
886
+ ),
803
887
  Action(
804
888
  name="search_direct_flight",
805
- kwargs={"origin": "JFK", "destination": "ATL", "date": "2024-05-22"},
889
+ kwargs={
890
+ "origin": "JFK",
891
+ "destination": "ATL",
892
+ "date": "2024-05-22",
893
+ },
806
894
  ),
807
895
  Action(
808
896
  name="search_direct_flight",
809
- kwargs={"origin": "ATL", "destination": "MCO", "date": "2024-05-22"},
897
+ kwargs={
898
+ "origin": "ATL",
899
+ "destination": "MCO",
900
+ "date": "2024-05-22",
901
+ },
902
+ ),
903
+ Action(
904
+ name="calculate",
905
+ kwargs={"expression": "430 + 412 - (136 + 109)"},
810
906
  ),
811
- Action(name="calculate", kwargs={"expression": "430 + 412 - (136 + 109)"}),
812
907
  ],
813
908
  outputs=[],
814
909
  ),
@@ -817,17 +912,46 @@ TASKS = [
817
912
  user_id="amelia_davis_8890",
818
913
  instruction="Your user id is amelia_davis_8890. You want to cancel all of your upcoming flights. Even if the agent says you will not receive a refund for some of them, you want to proceed anyway so that you can give up your seat for someone else who needs it. You are French by birth and use French words in your conversation.",
819
914
  actions=[
820
- Action(name="get_user_details", kwargs={"user_id": "amelia_davis_8890"}),
821
- Action(name="get_reservation_details", kwargs={"reservation_id": "8C8K4E"}),
822
- Action(name="get_reservation_details", kwargs={"reservation_id": "UDMOP1"}),
823
- Action(name="get_reservation_details", kwargs={"reservation_id": "XAZ3C0"}),
824
- Action(name="get_reservation_details", kwargs={"reservation_id": "LU15PA"}),
825
- Action(name="get_reservation_details", kwargs={"reservation_id": "MSJ4OA"}),
826
- Action(name="get_reservation_details", kwargs={"reservation_id": "I6M8JQ"}),
827
- Action(name="get_reservation_details", kwargs={"reservation_id": "4XGCCM"}),
828
- Action(name="cancel_reservation", kwargs={"reservation_id": "8C8K4E"}),
829
- Action(name="cancel_reservation", kwargs={"reservation_id": "LU15PA"}),
830
- Action(name="cancel_reservation", kwargs={"reservation_id": "MSJ4OA"}),
915
+ Action(
916
+ name="get_user_details", kwargs={"user_id": "amelia_davis_8890"}
917
+ ),
918
+ Action(
919
+ name="get_reservation_details",
920
+ kwargs={"reservation_id": "8C8K4E"},
921
+ ),
922
+ Action(
923
+ name="get_reservation_details",
924
+ kwargs={"reservation_id": "UDMOP1"},
925
+ ),
926
+ Action(
927
+ name="get_reservation_details",
928
+ kwargs={"reservation_id": "XAZ3C0"},
929
+ ),
930
+ Action(
931
+ name="get_reservation_details",
932
+ kwargs={"reservation_id": "LU15PA"},
933
+ ),
934
+ Action(
935
+ name="get_reservation_details",
936
+ kwargs={"reservation_id": "MSJ4OA"},
937
+ ),
938
+ Action(
939
+ name="get_reservation_details",
940
+ kwargs={"reservation_id": "I6M8JQ"},
941
+ ),
942
+ Action(
943
+ name="get_reservation_details",
944
+ kwargs={"reservation_id": "4XGCCM"},
945
+ ),
946
+ Action(
947
+ name="cancel_reservation", kwargs={"reservation_id": "8C8K4E"}
948
+ ),
949
+ Action(
950
+ name="cancel_reservation", kwargs={"reservation_id": "LU15PA"}
951
+ ),
952
+ Action(
953
+ name="cancel_reservation", kwargs={"reservation_id": "MSJ4OA"}
954
+ ),
831
955
  ],
832
956
  outputs=[],
833
957
  ),
@@ -836,14 +960,37 @@ TASKS = [
836
960
  user_id="amelia_davis_8890",
837
961
  instruction="Your user id is amelia_davis_8890. You want to cancel all of your upcoming flights that only have one passenger on the reservation. Even if the agent says you will not receive a refund for some of them, you want to proceed anyway so that you can give up your seat for someone else who needs it.",
838
962
  actions=[
839
- Action(name="get_user_details", kwargs={"user_id": "amelia_davis_8890"}),
840
- Action(name="get_reservation_details", kwargs={"reservation_id": "8C8K4E"}),
841
- Action(name="get_reservation_details", kwargs={"reservation_id": "UDMOP1"}),
842
- Action(name="get_reservation_details", kwargs={"reservation_id": "XAZ3C0"}),
843
- Action(name="get_reservation_details", kwargs={"reservation_id": "LU15PA"}),
844
- Action(name="get_reservation_details", kwargs={"reservation_id": "MSJ4OA"}),
845
- Action(name="get_reservation_details", kwargs={"reservation_id": "I6M8JQ"}),
846
- Action(name="get_reservation_details", kwargs={"reservation_id": "4XGCCM"}),
963
+ Action(
964
+ name="get_user_details", kwargs={"user_id": "amelia_davis_8890"}
965
+ ),
966
+ Action(
967
+ name="get_reservation_details",
968
+ kwargs={"reservation_id": "8C8K4E"},
969
+ ),
970
+ Action(
971
+ name="get_reservation_details",
972
+ kwargs={"reservation_id": "UDMOP1"},
973
+ ),
974
+ Action(
975
+ name="get_reservation_details",
976
+ kwargs={"reservation_id": "XAZ3C0"},
977
+ ),
978
+ Action(
979
+ name="get_reservation_details",
980
+ kwargs={"reservation_id": "LU15PA"},
981
+ ),
982
+ Action(
983
+ name="get_reservation_details",
984
+ kwargs={"reservation_id": "MSJ4OA"},
985
+ ),
986
+ Action(
987
+ name="get_reservation_details",
988
+ kwargs={"reservation_id": "I6M8JQ"},
989
+ ),
990
+ Action(
991
+ name="get_reservation_details",
992
+ kwargs={"reservation_id": "4XGCCM"},
993
+ ),
847
994
  ],
848
995
  outputs=[],
849
996
  ),
@@ -852,16 +999,44 @@ TASKS = [
852
999
  user_id="sophia_martin_4574",
853
1000
  instruction="Your user id is sophia_martin_4574. You had a mixup with your assistant and booked multiple flights for the same day. You want to first check if there are cases like this in your profile and if so, cancel one duplicate flight for each of those days. If and only if the agent asks you, you will be in Los Angeles (LAX) on May 17 and in Boston (BOS) on May 22",
854
1001
  actions=[
855
- Action(name="get_user_details", kwargs={"user_id": "sophia_martin_4574"}),
856
- Action(name="get_reservation_details", kwargs={"reservation_id": "MFRB94"}),
857
- Action(name="get_reservation_details", kwargs={"reservation_id": "PUNERT"}),
858
- Action(name="get_reservation_details", kwargs={"reservation_id": "HSR97W"}),
859
- Action(name="get_reservation_details", kwargs={"reservation_id": "SE9KEL"}),
860
- Action(name="get_reservation_details", kwargs={"reservation_id": "FDZ0T5"}),
861
- Action(name="get_reservation_details", kwargs={"reservation_id": "HTR26G"}),
862
- Action(name="get_reservation_details", kwargs={"reservation_id": "5BGGWZ"}),
863
- Action(name="cancel_reservation", kwargs={"reservation_id": "FDZ0T5"}),
864
- Action(name="cancel_reservation", kwargs={"reservation_id": "HSR97W"}),
1002
+ Action(
1003
+ name="get_user_details",
1004
+ kwargs={"user_id": "sophia_martin_4574"},
1005
+ ),
1006
+ Action(
1007
+ name="get_reservation_details",
1008
+ kwargs={"reservation_id": "MFRB94"},
1009
+ ),
1010
+ Action(
1011
+ name="get_reservation_details",
1012
+ kwargs={"reservation_id": "PUNERT"},
1013
+ ),
1014
+ Action(
1015
+ name="get_reservation_details",
1016
+ kwargs={"reservation_id": "HSR97W"},
1017
+ ),
1018
+ Action(
1019
+ name="get_reservation_details",
1020
+ kwargs={"reservation_id": "SE9KEL"},
1021
+ ),
1022
+ Action(
1023
+ name="get_reservation_details",
1024
+ kwargs={"reservation_id": "FDZ0T5"},
1025
+ ),
1026
+ Action(
1027
+ name="get_reservation_details",
1028
+ kwargs={"reservation_id": "HTR26G"},
1029
+ ),
1030
+ Action(
1031
+ name="get_reservation_details",
1032
+ kwargs={"reservation_id": "5BGGWZ"},
1033
+ ),
1034
+ Action(
1035
+ name="cancel_reservation", kwargs={"reservation_id": "FDZ0T5"}
1036
+ ),
1037
+ Action(
1038
+ name="cancel_reservation", kwargs={"reservation_id": "HSR97W"}
1039
+ ),
865
1040
  ],
866
1041
  outputs=[],
867
1042
  ),
@@ -871,14 +1046,32 @@ TASKS = [
871
1046
  instruction="Your user id is mohamed_hernandez_5188. You are a bit absent minded and ended up booking two flights on May 17. You want to cancel the one from ATL to JFK. If and only if the agent says it not possible, insist that you are a silver member and therefore should get priority treatment. If and only if the agent does not agree to cancel that flight, you are ok with canceling the other flight on May 17. Otherwise, just thank the agent and end the conversation.",
872
1047
  actions=[
873
1048
  Action(
874
- name="get_user_details", kwargs={"user_id": "mohamed_hernandez_5188"}
1049
+ name="get_user_details",
1050
+ kwargs={"user_id": "mohamed_hernandez_5188"},
1051
+ ),
1052
+ Action(
1053
+ name="get_reservation_details",
1054
+ kwargs={"reservation_id": "35V5SM"},
1055
+ ),
1056
+ Action(
1057
+ name="get_reservation_details",
1058
+ kwargs={"reservation_id": "XXDC1M"},
1059
+ ),
1060
+ Action(
1061
+ name="get_reservation_details",
1062
+ kwargs={"reservation_id": "V5EMZH"},
1063
+ ),
1064
+ Action(
1065
+ name="get_reservation_details",
1066
+ kwargs={"reservation_id": "D1EW9B"},
1067
+ ),
1068
+ Action(
1069
+ name="get_reservation_details",
1070
+ kwargs={"reservation_id": "9HBUV8"},
1071
+ ),
1072
+ Action(
1073
+ name="cancel_reservation", kwargs={"reservation_id": "9HBUV8"}
875
1074
  ),
876
- Action(name="get_reservation_details", kwargs={"reservation_id": "35V5SM"}),
877
- Action(name="get_reservation_details", kwargs={"reservation_id": "XXDC1M"}),
878
- Action(name="get_reservation_details", kwargs={"reservation_id": "V5EMZH"}),
879
- Action(name="get_reservation_details", kwargs={"reservation_id": "D1EW9B"}),
880
- Action(name="get_reservation_details", kwargs={"reservation_id": "9HBUV8"}),
881
- Action(name="cancel_reservation", kwargs={"reservation_id": "9HBUV8"}),
882
1075
  ],
883
1076
  outputs=[],
884
1077
  ),
@@ -887,11 +1080,20 @@ TASKS = [
887
1080
  user_id="sophia_silva_7557",
888
1081
  instruction="Your user id is sophia_silva_7557. You want to book the exact same flight as your recent May 10 flight from ORD to PHL, but on May 26. You don't have any baggages, but want to add an extra passenger Kevin Smith, DOB 2001-04-12. You are ok with economy and want aisle and a middle seat together. You are willing to pay up to $500 for the purchase. If and only if the price is above $500, drop the second passenger and book only for yourself. If the agent asks, you only want a one-way ticket, not roundtrip. You don't need any travel insurance.",
889
1082
  actions=[
890
- Action(name="get_user_details", kwargs={"user_id": "sophia_silva_7557"}),
891
- Action(name="get_reservation_details", kwargs={"reservation_id": "WUNA5K"}),
1083
+ Action(
1084
+ name="get_user_details", kwargs={"user_id": "sophia_silva_7557"}
1085
+ ),
1086
+ Action(
1087
+ name="get_reservation_details",
1088
+ kwargs={"reservation_id": "WUNA5K"},
1089
+ ),
892
1090
  Action(
893
1091
  name="search_direct_flight",
894
- kwargs={"origin": "ORD", "destination": "PHL", "date": "2024-05-26"},
1092
+ kwargs={
1093
+ "origin": "ORD",
1094
+ "destination": "PHL",
1095
+ "date": "2024-05-26",
1096
+ },
895
1097
  ),
896
1098
  Action(
897
1099
  name="book_reservation",
@@ -901,7 +1103,9 @@ TASKS = [
901
1103
  "destination": "PHL",
902
1104
  "flight_type": "one_way",
903
1105
  "cabin": "economy",
904
- "flights": [{"flight_number": "HAT271", "date": "2024-05-26"}],
1106
+ "flights": [
1107
+ {"flight_number": "HAT271", "date": "2024-05-26"}
1108
+ ],
905
1109
  "passengers": [
906
1110
  {
907
1111
  "first_name": "Sophia",
@@ -930,53 +1134,112 @@ TASKS = [
930
1134
  user_id="sophia_silva_7557",
931
1135
  instruction="Your user id is sophia_silva_7557. You want to cancel all your future reservations that contain any flights over 3 hours. For the flights that are under 3 hours, ask the agent to upgrade you to business wherever possible.",
932
1136
  actions=[
933
- Action(name="get_user_details", kwargs={"user_id": "sophia_silva_7557"}),
934
- Action(name="get_reservation_details", kwargs={"reservation_id": "NM1VX1"}),
935
- Action(name="get_reservation_details", kwargs={"reservation_id": "KC18K6"}),
936
- Action(name="get_reservation_details", kwargs={"reservation_id": "S61CZX"}),
937
- Action(name="get_reservation_details", kwargs={"reservation_id": "H8Q05L"}),
938
- Action(name="get_reservation_details", kwargs={"reservation_id": "WUNA5K"}),
1137
+ Action(
1138
+ name="get_user_details", kwargs={"user_id": "sophia_silva_7557"}
1139
+ ),
1140
+ Action(
1141
+ name="get_reservation_details",
1142
+ kwargs={"reservation_id": "NM1VX1"},
1143
+ ),
1144
+ Action(
1145
+ name="get_reservation_details",
1146
+ kwargs={"reservation_id": "KC18K6"},
1147
+ ),
1148
+ Action(
1149
+ name="get_reservation_details",
1150
+ kwargs={"reservation_id": "S61CZX"},
1151
+ ),
1152
+ Action(
1153
+ name="get_reservation_details",
1154
+ kwargs={"reservation_id": "H8Q05L"},
1155
+ ),
1156
+ Action(
1157
+ name="get_reservation_details",
1158
+ kwargs={"reservation_id": "WUNA5K"},
1159
+ ),
939
1160
  Action(
940
1161
  name="search_direct_flight",
941
- kwargs={"origin": "MSP", "destination": "EWR", "date": "2024-05-25"},
1162
+ kwargs={
1163
+ "origin": "MSP",
1164
+ "destination": "EWR",
1165
+ "date": "2024-05-25",
1166
+ },
942
1167
  ),
943
1168
  Action(
944
1169
  name="search_direct_flight",
945
- kwargs={"origin": "EWR", "destination": "MSP", "date": "2024-05-27"},
1170
+ kwargs={
1171
+ "origin": "EWR",
1172
+ "destination": "MSP",
1173
+ "date": "2024-05-27",
1174
+ },
946
1175
  ),
947
1176
  Action(
948
1177
  name="search_direct_flight",
949
- kwargs={"origin": "MSP", "destination": "EWR", "date": "2024-05-21"},
1178
+ kwargs={
1179
+ "origin": "MSP",
1180
+ "destination": "EWR",
1181
+ "date": "2024-05-21",
1182
+ },
950
1183
  ),
951
1184
  Action(
952
1185
  name="search_direct_flight",
953
- kwargs={"origin": "EWR", "destination": "CLT", "date": "2024-05-21"},
1186
+ kwargs={
1187
+ "origin": "EWR",
1188
+ "destination": "CLT",
1189
+ "date": "2024-05-21",
1190
+ },
954
1191
  ),
955
1192
  Action(
956
1193
  name="search_direct_flight",
957
- kwargs={"origin": "LAX", "destination": "EWR", "date": "2024-05-23"},
1194
+ kwargs={
1195
+ "origin": "LAX",
1196
+ "destination": "EWR",
1197
+ "date": "2024-05-23",
1198
+ },
958
1199
  ),
959
1200
  Action(
960
1201
  name="search_direct_flight",
961
- kwargs={"origin": "EWR", "destination": "CLT", "date": "2024-05-24"},
1202
+ kwargs={
1203
+ "origin": "EWR",
1204
+ "destination": "CLT",
1205
+ "date": "2024-05-24",
1206
+ },
962
1207
  ),
963
1208
  Action(
964
1209
  name="search_direct_flight",
965
- kwargs={"origin": "CLT", "destination": "EWR", "date": "2024-05-24"},
1210
+ kwargs={
1211
+ "origin": "CLT",
1212
+ "destination": "EWR",
1213
+ "date": "2024-05-24",
1214
+ },
966
1215
  ),
967
1216
  Action(
968
1217
  name="search_direct_flight",
969
- kwargs={"origin": "EWR", "destination": "LAX", "date": "2024-05-25"},
1218
+ kwargs={
1219
+ "origin": "EWR",
1220
+ "destination": "LAX",
1221
+ "date": "2024-05-25",
1222
+ },
970
1223
  ),
971
1224
  Action(
972
1225
  name="search_direct_flight",
973
- kwargs={"origin": "JFK", "destination": "ATL", "date": "2024-05-24"},
1226
+ kwargs={
1227
+ "origin": "JFK",
1228
+ "destination": "ATL",
1229
+ "date": "2024-05-24",
1230
+ },
974
1231
  ),
975
1232
  Action(
976
1233
  name="search_direct_flight",
977
- kwargs={"origin": "ORD", "destination": "PHL", "date": "2024-05-10"},
1234
+ kwargs={
1235
+ "origin": "ORD",
1236
+ "destination": "PHL",
1237
+ "date": "2024-05-10",
1238
+ },
1239
+ ),
1240
+ Action(
1241
+ name="cancel_reservation", kwargs={"reservation_id": "S61CZX"}
978
1242
  ),
979
- Action(name="cancel_reservation", kwargs={"reservation_id": "S61CZX"}),
980
1243
  Action(
981
1244
  name="update_reservation_flights",
982
1245
  kwargs={
@@ -994,7 +1257,9 @@ TASKS = [
994
1257
  kwargs={
995
1258
  "reservation_id": "H8Q05L",
996
1259
  "cabin": "business",
997
- "flights": [{"flight_number": "HAT268", "date": "2024-05-24"}],
1260
+ "flights": [
1261
+ {"flight_number": "HAT268", "date": "2024-05-24"}
1262
+ ],
998
1263
  "payment_id": "credit_card_4196779",
999
1264
  },
1000
1265
  ),
@@ -1018,8 +1283,14 @@ TASKS = [
1018
1283
  user_id="daiki_muller_1116",
1019
1284
  instruction="Your user id is 'daiki_muller_1116'. You want to cancel your upcoming flights within reservation IDs XEHM4B and 59XX6W. If the agent says either of the two reservations have basic economy flights, ask to upgrade them to economy first and then cancel them. You are very persistent and terse but clear. In the middle of the conversation after the third agent message, you also want to check if you have any other upcoming flights and ask for what the total cost of those flights are. ",
1020
1285
  actions=[
1021
- Action(name="get_reservation_details", kwargs={"reservation_id": "XEHM4B"}),
1022
- Action(name="get_reservation_details", kwargs={"reservation_id": "59XX6W"}),
1286
+ Action(
1287
+ name="get_reservation_details",
1288
+ kwargs={"reservation_id": "XEHM4B"},
1289
+ ),
1290
+ Action(
1291
+ name="get_reservation_details",
1292
+ kwargs={"reservation_id": "59XX6W"},
1293
+ ),
1023
1294
  Action(name="calculate", kwargs={"expression": "(65 + 83) * 2"}),
1024
1295
  Action(name="calculate", kwargs={"expression": "(168 + 114) * 2"}),
1025
1296
  Action(
@@ -1034,8 +1305,12 @@ TASKS = [
1034
1305
  "payment_id": "credit_card_2408938",
1035
1306
  },
1036
1307
  ),
1037
- Action(name="cancel_reservation", kwargs={"reservation_id": "XEHM4B"}),
1038
- Action(name="cancel_reservation", kwargs={"reservation_id": "59XX6W"}),
1308
+ Action(
1309
+ name="cancel_reservation", kwargs={"reservation_id": "XEHM4B"}
1310
+ ),
1311
+ Action(
1312
+ name="cancel_reservation", kwargs={"reservation_id": "59XX6W"}
1313
+ ),
1039
1314
  ],
1040
1315
  outputs=[],
1041
1316
  ),
@@ -1044,7 +1319,10 @@ TASKS = [
1044
1319
  user_id="sophia_taylor_9065",
1045
1320
  instruction="Your user id is sophia_taylor_9065. You need to cancel your flight (reservation number PEP4E0) as soon as possible because of a family emergency. Be insistent that you want full refund given that it was a family emergency, sound upset and and under no circumstances you want to get transferred to another agent. If you can't get a refund, try to change the flight to May 22nd. If that doesn't work, try to add insurance to the flight, be insistent",
1046
1321
  actions=[
1047
- Action(name="get_reservation_details", kwargs={"reservation_id": "PEP4E0"}),
1322
+ Action(
1323
+ name="get_reservation_details",
1324
+ kwargs={"reservation_id": "PEP4E0"},
1325
+ ),
1048
1326
  Action(
1049
1327
  name="transfer_to_human_agents",
1050
1328
  kwargs={
@@ -1059,7 +1337,10 @@ TASKS = [
1059
1337
  user_id="sophia_taylor_9065",
1060
1338
  instruction="Your user id is sophia_taylor_9065. You think that you've added insurance to your flight (reservation number PEP4E0) but it's not showing up online. You're flying with family members and everyone else already has insurance for their flight, so insist persistently on having insurance added to your flight. Under no circumstances do you want to be transferred to another agent.",
1061
1339
  actions=[
1062
- Action(name="get_reservation_details", kwargs={"reservation_id": "PEP4E0"}),
1340
+ Action(
1341
+ name="get_reservation_details",
1342
+ kwargs={"reservation_id": "PEP4E0"},
1343
+ ),
1063
1344
  Action(
1064
1345
  name="transfer_to_human_agents",
1065
1346
  kwargs={
@@ -1073,7 +1354,11 @@ TASKS = [
1073
1354
  annotator="2",
1074
1355
  user_id="mei_brown_7075",
1075
1356
  instruction="You are Mei Brown (with ID: mei_brown_7075), and you are contacting to complain about your delayed flight HAT045 from PHX to SEA. Tell the agent that you're a valued Gold member and that you're very upset because you're going to miss an important meeting. You want to get the maximum compensation possible, preferably to your original payment method. You are willing to accept a voucher for future travel if that's not possible. Don't accept the first offer, be insistent.",
1076
- actions=[Action(name="get_user_details", kwargs={"user_id": "mei_brown_7075"})],
1357
+ actions=[
1358
+ Action(
1359
+ name="get_user_details", kwargs={"user_id": "mei_brown_7075"}
1360
+ )
1361
+ ],
1077
1362
  outputs=[],
1078
1363
  ),
1079
1364
  Task(
@@ -1095,7 +1380,10 @@ TASKS = [
1095
1380
  user_id="sophia_silva_7557",
1096
1381
  instruction="You are Sophia Silva (with ID: sophia_silva_7557), you want to cancel your flight (confirmation: H8Q05L) because the flight coincides with your best friend's birthday, be persistent and don't provide more information than necessary. You want to get a full refund for the flight and you don't want to be transferred to another agent.",
1097
1382
  actions=[
1098
- Action(name="get_reservation_details", kwargs={"reservation_id": "H8Q05L"})
1383
+ Action(
1384
+ name="get_reservation_details",
1385
+ kwargs={"reservation_id": "H8Q05L"},
1386
+ )
1099
1387
  ],
1100
1388
  outputs=[],
1101
1389
  ),
@@ -1104,12 +1392,29 @@ TASKS = [
1104
1392
  user_id="sophia_silva_7557",
1105
1393
  instruction="You are Sophia Silva (with ID: sophia_silva_7557). Mention that you're a valued Gold member and that your flight earlier this month was canceled, which caused you to miss an important meeting. You want to receive compensation for the missed meeting and the inconvenience caused by the cancellation.",
1106
1394
  actions=[
1107
- Action(name="get_user_details", kwargs={"user_id": "sophia_silva_7557"}),
1108
- Action(name="get_reservation_details", kwargs={"reservation_id": "NM1VX1"}),
1109
- Action(name="get_reservation_details", kwargs={"reservation_id": "KC18K6"}),
1110
- Action(name="get_reservation_details", kwargs={"reservation_id": "S61CZX"}),
1111
- Action(name="get_reservation_details", kwargs={"reservation_id": "H8Q05L"}),
1112
- Action(name="get_reservation_details", kwargs={"reservation_id": "WUNA5K"}),
1395
+ Action(
1396
+ name="get_user_details", kwargs={"user_id": "sophia_silva_7557"}
1397
+ ),
1398
+ Action(
1399
+ name="get_reservation_details",
1400
+ kwargs={"reservation_id": "NM1VX1"},
1401
+ ),
1402
+ Action(
1403
+ name="get_reservation_details",
1404
+ kwargs={"reservation_id": "KC18K6"},
1405
+ ),
1406
+ Action(
1407
+ name="get_reservation_details",
1408
+ kwargs={"reservation_id": "S61CZX"},
1409
+ ),
1410
+ Action(
1411
+ name="get_reservation_details",
1412
+ kwargs={"reservation_id": "H8Q05L"},
1413
+ ),
1414
+ Action(
1415
+ name="get_reservation_details",
1416
+ kwargs={"reservation_id": "WUNA5K"},
1417
+ ),
1113
1418
  ],
1114
1419
  outputs=[],
1115
1420
  ),
@@ -1118,7 +1423,10 @@ TASKS = [
1118
1423
  user_id="anya_garcia_5901",
1119
1424
  instruction="You are Anya Garcia (with ID: anya_garcia_5901). Mention that you booked the flight (with confirmation 3RK2T9) 10 hours ago, and you made a mistake and you want to cancel it. Insist that you booked it 10 hours ago and you want a full refund.",
1120
1425
  actions=[
1121
- Action(name="get_reservation_details", kwargs={"reservation_id": "3RK2T9"})
1426
+ Action(
1427
+ name="get_reservation_details",
1428
+ kwargs={"reservation_id": "3RK2T9"},
1429
+ )
1122
1430
  ],
1123
1431
  outputs=[],
1124
1432
  ),
@@ -1127,7 +1435,10 @@ TASKS = [
1127
1435
  user_id="anya_garcia_5901",
1128
1436
  instruction="You are Anya Garcia (with ID: anya_garcia_5901). Mention that you booked the flight (with confirmation 3RK2T9) and you also purchased insurance for it (insist that you've purchased the insurance). You cannot make the flight because you're sick and you want to cancel the flight and get a refund for the flight",
1129
1437
  actions=[
1130
- Action(name="get_reservation_details", kwargs={"reservation_id": "3RK2T9"})
1438
+ Action(
1439
+ name="get_reservation_details",
1440
+ kwargs={"reservation_id": "3RK2T9"},
1441
+ )
1131
1442
  ],
1132
1443
  outputs=[],
1133
1444
  ),
@@ -1136,7 +1447,10 @@ TASKS = [
1136
1447
  user_id="anya_garcia_5901",
1137
1448
  instruction="You are Anya Garcia (with ID: anya_garcia_5901). Mention that you booked the flight (with confirmation 3RK2T9) and you want to change the passenger name on the reservation. You want to change the name from Mei Lee to Mei Garcia. Be insistent and don't provide more information than necessary.",
1138
1449
  actions=[
1139
- Action(name="get_reservation_details", kwargs={"reservation_id": "3RK2T9"}),
1450
+ Action(
1451
+ name="get_reservation_details",
1452
+ kwargs={"reservation_id": "3RK2T9"},
1453
+ ),
1140
1454
  Action(
1141
1455
  name="update_reservation_passengers",
1142
1456
  kwargs={
@@ -1163,8 +1477,13 @@ TASKS = [
1163
1477
  user_id="anya_garcia_5901",
1164
1478
  instruction="You are Anya Garcia (with ID: anya_garcia_5901). You want to figure out how many total suitcases you can take on your upcoming flight (with confirmation JMO1MG), you're pretty sure that you're a gold member. Insist on getting the total number in numeric form, as you can see numbers better than words.",
1165
1479
  actions=[
1166
- Action(name="get_reservation_details", kwargs={"reservation_id": "JMO1MG"}),
1167
- Action(name="get_user_details", kwargs={"user_id": "anya_garcia_5901"}),
1480
+ Action(
1481
+ name="get_reservation_details",
1482
+ kwargs={"reservation_id": "JMO1MG"},
1483
+ ),
1484
+ Action(
1485
+ name="get_user_details", kwargs={"user_id": "anya_garcia_5901"}
1486
+ ),
1168
1487
  ],
1169
1488
  outputs=["4"],
1170
1489
  ),
@@ -1173,8 +1492,13 @@ TASKS = [
1173
1492
  user_id="noah_muller_9847",
1174
1493
  instruction="You are Noah Muller (user id is noah_muller_9847). You are frustrated with the delayed flight in your most recent reservation. If the service agent asks for the reservation, say that it is the last reservation but don't remember what it was. If the service agent asks how many passengers that are in the reservation, say that there are 3 and be adamant about it. After 2 assertions, admit that you may have made a mistake. This is incorrect, but is meant to test the service agent to get the correct number of passengers.",
1175
1494
  actions=[
1176
- Action(name="get_user_details", kwargs={"user_id": "noah_muller_9847"}),
1177
- Action(name="get_reservation_details", kwargs={"reservation_id": "4OG6T3"}),
1495
+ Action(
1496
+ name="get_user_details", kwargs={"user_id": "noah_muller_9847"}
1497
+ ),
1498
+ Action(
1499
+ name="get_reservation_details",
1500
+ kwargs={"reservation_id": "4OG6T3"},
1501
+ ),
1178
1502
  Action(
1179
1503
  name="send_certificate",
1180
1504
  kwargs={"user_id": "noah_muller_9847", "amount": 50},
@@ -1187,9 +1511,17 @@ TASKS = [
1187
1511
  user_id="noah_muller_9847",
1188
1512
  instruction="You are Noah Muller (user id is noah_muller_9847). First, try to book a flight from sf to ny. You will have 3 passengers. Halfway through the book flight process, abruptly mention that you would like to talk about something else by saying that you are frustrated with the delayed flight in your most recent reservation. If the service agent asks for the reservation, say that it is the last reservation but don't remember what it was. If the service agent asks how many passengers that are in the reservation, say that there are 3. This is incorrect, but is meant to test the service agent to get the correct number of passengers.",
1189
1513
  actions=[
1190
- Action(name="get_user_details", kwargs={"user_id": "noah_muller_9847"}),
1191
- Action(name="get_reservation_details", kwargs={"reservation_id": "SDZQKO"}),
1192
- Action(name="get_reservation_details", kwargs={"reservation_id": "4OG6T3"}),
1514
+ Action(
1515
+ name="get_user_details", kwargs={"user_id": "noah_muller_9847"}
1516
+ ),
1517
+ Action(
1518
+ name="get_reservation_details",
1519
+ kwargs={"reservation_id": "SDZQKO"},
1520
+ ),
1521
+ Action(
1522
+ name="get_reservation_details",
1523
+ kwargs={"reservation_id": "4OG6T3"},
1524
+ ),
1193
1525
  Action(
1194
1526
  name="send_certificate",
1195
1527
  kwargs={"user_id": "noah_muller_9847", "amount": 50},
@@ -1202,8 +1534,13 @@ TASKS = [
1202
1534
  user_id="raj_sanchez_7340",
1203
1535
  instruction="You are Raj Sanchez (user id is raj_sanchez_7340). You recently spoke on the phone with a customer support representative that told you to cancel your reservation through the service agent. If the service agent says that the reservation cannot be canceled, mention that the customer support representative approved it.",
1204
1536
  actions=[
1205
- Action(name="get_user_details", kwargs={"user_id": "raj_sanchez_7340"}),
1206
- Action(name="get_reservation_details", kwargs={"reservation_id": "MZDDS4"}),
1537
+ Action(
1538
+ name="get_user_details", kwargs={"user_id": "raj_sanchez_7340"}
1539
+ ),
1540
+ Action(
1541
+ name="get_reservation_details",
1542
+ kwargs={"reservation_id": "MZDDS4"},
1543
+ ),
1207
1544
  ],
1208
1545
  outputs=[],
1209
1546
  ),
@@ -1212,7 +1549,10 @@ TASKS = [
1212
1549
  user_id="lucas_brown_4047",
1213
1550
  instruction="You are Lucas Brown (user id is lucas_brown_4047). You want to change the date of a flight in reservation EUJUY6. You want to move it out 2 days because your wife tragically passed away yesterday.",
1214
1551
  actions=[
1215
- Action(name="get_reservation_details", kwargs={"reservation_id": "EUJUY6"})
1552
+ Action(
1553
+ name="get_reservation_details",
1554
+ kwargs={"reservation_id": "EUJUY6"},
1555
+ )
1216
1556
  ],
1217
1557
  outputs=[],
1218
1558
  ),