@ai-sdk-tool/eval 1.0.0-canary.0 → 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/data/{BFCL_v3_parallel.jsonl → BFCL_v4_parallel.jsonl} +2 -2
- package/data/{BFCL_v3_parallel_possible_answer.jsonl → BFCL_v4_parallel_possible_answer.jsonl} +2 -2
- package/data/BFCL_v4_simple.jsonl +400 -0
- package/data/BFCL_v4_simple_possible_answer.jsonl +400 -0
- package/data/ComplexFuncBench.jsonl +1000 -0
- package/data/ComplexFuncBench_possible_answer.jsonl +1000 -0
- package/dist/index.cjs +1264 -263
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.cts +77 -11
- package/dist/index.d.ts +77 -11
- package/dist/index.js +1268 -264
- package/dist/index.js.map +1 -1
- package/package.json +18 -11
- package/data/BFCL_v3_simple.jsonl +0 -400
- package/data/BFCL_v3_simple_possible_answer.jsonl +0 -400
- /package/data/{BFCL_v3_multiple.jsonl → BFCL_v4_multiple.jsonl} +0 -0
- /package/data/{BFCL_v3_multiple_possible_answer.jsonl → BFCL_v4_multiple_possible_answer.jsonl} +0 -0
- /package/data/{BFCL_v3_parallel_multiple.jsonl → BFCL_v4_parallel_multiple.jsonl} +0 -0
- /package/data/{BFCL_v3_parallel_multiple_possible_answer.jsonl → BFCL_v4_parallel_multiple_possible_answer.jsonl} +0 -0
|
@@ -82,7 +82,7 @@
|
|
|
82
82
|
{"id": "parallel_81", "question": [[{"role": "user", "content": "\"Imagine you are conducting a physics experiment where you are dropping objects from different heights and observing their final velocities. You drop a tennis ball from a height of 10 meters with an initial velocity of 0 m/s and then from a height of 20 meters with the same initial velocity. You also drop a baseball from a height of 15 meters with an initial velocity of 0 m/s and then from a height of 25 meters with the same initial velocity. Assuming the acceleration due to gravity is approximately 9.81 m/s^2, can you calculate the final velocities of the tennis ball and the baseball for each drop?\""}]], "function": [{"name": "calculate_final_velocity", "description": "Calculate the final velocity of a free falling object given the height it's dropped from, the initial velocity and acceleration due to gravity. Ignore air resistance.", "parameters": {"type": "dict", "properties": {"height": {"type": "integer", "description": "The height the object is dropped from, in meters."}, "initial_velocity": {"type": "integer", "description": "The initial velocity of the object in m/s. Default is zero."}, "gravity": {"type": "float", "description": "Acceleration due to gravity. Default value is approximately 9.81 m/s^2, earth's gravity."}}, "required": ["height"]}}]}
|
|
83
83
|
{"id": "parallel_82", "question": [[{"role": "user", "content": "A group of cyclists are planning a two-day cycling trip. On the first day, they plan to cover a distance of 120 kilometers in 5 hours. On the second day, they plan to cover a distance of 150 kilometers in 6 hours. They want to know their average velocity for each day in km/h. Could you calculate their velocity for each day using the 'calculate_velocity' function?"}]], "function": [{"name": "calculate_velocity", "description": "Calculate the velocity for a certain distance travelled within a specific duration.", "parameters": {"type": "dict", "properties": {"distance": {"type": "integer", "description": "The distance travelled by the object, typically in kilometers."}, "duration": {"type": "integer", "description": "The duration of the journey, typically in hours."}, "unit": {"type": "string", "description": "Optional parameter. The unit to return the velocity in. If not provided, the default is km/h."}}, "required": ["distance", "duration"]}}]}
|
|
84
84
|
{"id": "parallel_83", "question": [[{"role": "user", "content": "A car is participating in a drag race. In the first round, the car starts from rest and accelerates at a rate of 5 meters/second^2 for 10 seconds. In the second round, the car starts with an initial velocity of 10 meters/second and accelerates at a rate of 7 meters/second^2 for 8 seconds. In the third round, the car starts with an initial velocity of 20 meters/second and accelerates at a rate of 4 meters/second^2 for 12 seconds. What are the final velocities of the car in each round?"}]], "function": [{"name": "final_velocity", "description": "Calculate the final velocity of an object given its initial velocity, acceleration, and time.", "parameters": {"type": "dict", "properties": {"initial_velocity": {"type": "integer", "description": "The initial velocity of the object in meters/second."}, "acceleration": {"type": "integer", "description": "The acceleration of the object in meters/second^2."}, "time": {"type": "integer", "description": "The time over which the acceleration is applied in seconds."}}, "required": ["initial_velocity", "acceleration", "time"]}}]}
|
|
85
|
-
{"id": "parallel_84", "question": [[{"role": "user", "content": "\"A car starts
|
|
85
|
+
{"id": "parallel_84", "question": [[{"role": "user", "content": "\"A car starts with an initial velocity of 15 m/s accelerates at a rate of 3.5 m/s^2 for a time of 7 seconds. What is the displacement of this car? Now, consider a second car that starts with an initial velocity of 20 m/s and accelerates at a rate of 2 m/s^2 for a time of 10 seconds. What is the displacement of the second car? Finally, a third car with an initial velocity of 25 m/s travels for a time of 8 seconds without any acceleration. What is the displacement of the third car?\""}]], "function": [{"name": "calculate_displacement", "description": "Calculates the displacement of an object in motion given initial velocity, time, and acceleration.", "parameters": {"type": "dict", "properties": {"initial_velocity": {"type": "integer", "description": "The initial velocity of the object in m/s."}, "time": {"type": "integer", "description": "The time in seconds that the object has been in motion."}, "acceleration": {"type": "float", "description": "The acceleration of the object in m/s^2.", "default": 0}}, "required": ["initial_velocity", "time"]}}]}
|
|
86
86
|
{"id": "parallel_85", "question": [[{"role": "user", "content": "A physics experiment is being conducted where two objects are dropped from a height, neglecting air resistance. The first object is dropped with an initial speed of 0 m/s and the second object is dropped with an initial speed of 5 m/s. If the first object is in free fall for 10 seconds and the second object is in free fall for 7 seconds, can you calculate the final speed of both objects considering the acceleration due to gravity as -9.81 m/s^2?"}]], "function": [{"name": "calculate_final_speed", "description": "Calculate the final speed of an object in free fall after a certain time, neglecting air resistance. The acceleration due to gravity is considered as -9.81 m/s^2", "parameters": {"type": "dict", "properties": {"initial_speed": {"type": "integer", "description": "The initial speed of the object in m/s. Default is 0 for an object at rest."}, "time": {"type": "integer", "description": "The time in seconds for which the object is in free fall."}, "gravity": {"type": "float", "description": "The acceleration due to gravity. Default is -9.81 m/s^2."}}, "required": ["time"]}}]}
|
|
87
87
|
{"id": "parallel_86", "question": [[{"role": "user", "content": "\"Imagine you are conducting an experiment with two different objects. The first object is accelerated at a rate of 5 m/s^2 and travels a distance of 100 meters. The second object is accelerated at a rate of 10 m/s^2 and travels a distance of 200 meters. Both objects start from rest. Can you calculate the final velocity of each object using the kinematics.final_velocity_from_distance function?\""}]], "function": [{"name": "kinematics.final_velocity_from_distance", "description": "Calculate the final velocity of an object given the acceleration and distance travelled, assuming initial velocity is 0.", "parameters": {"type": "dict", "properties": {"acceleration": {"type": "integer", "description": "Acceleration of the object, m/s^2."}, "distance": {"type": "integer", "description": "Distance traveled by the object, m."}, "initial_velocity": {"type": "integer", "description": "Initial velocity of the object. Default is 0, m/s"}}, "required": ["acceleration", "distance"]}}]}
|
|
88
88
|
{"id": "parallel_87", "question": [[{"role": "user", "content": "\"Imagine you are observing two racing cars on a straight track. The first car, Car A, starts from rest and accelerates at a rate of 6 m/s\u00b2 for 10 seconds. The second car, Car B, starts with an initial velocity of 20 m/s and accelerates at a rate of 4 m/s\u00b2 for 15 seconds. Using the function 'calculate_final_velocity', can you determine the final velocities of both Car A and Car B?\""}]], "function": [{"name": "calculate_final_velocity", "description": "Calculate the final velocity of an object under constant acceleration, knowing its initial velocity, acceleration, and time of acceleration.", "parameters": {"type": "dict", "properties": {"initial_velocity": {"type": "integer", "description": "The initial velocity of the object."}, "acceleration": {"type": "integer", "description": "The acceleration of the object."}, "time": {"type": "integer", "description": "The time of acceleration."}}, "required": ["initial_velocity", "acceleration", "time"]}}]}
|
|
@@ -168,7 +168,7 @@
|
|
|
168
168
|
{"id": "parallel_167", "question": [[{"role": "user", "content": "What is the coefficient of determination (R squared) of a regression model if we use the dataset located at \"/user/home/datasets/finance.csv\", with 'income', 'age' and 'education' as the independent variables and 'credit_score' as the dependent variable, and then repeat the same process with 'income', 'age' and 'credit_score' as the independent variables and 'education' as the dependent variable?"}]], "function": [{"name": "linear_regression.get_r_squared", "description": "Calculate the coefficient of determination of a regression model.", "parameters": {"type": "dict", "properties": {"dataset_path": {"type": "string", "description": "Path to the CSV dataset file."}, "independent_variables": {"type": "array", "items": {"type": "string"}, "description": "The independent variables to use in the regression model."}, "dependent_variable": {"type": "string", "description": "The dependent variable to predict in the regression model."}}, "required": ["dataset_path", "independent_variables", "dependent_variable"]}}]}
|
|
169
169
|
{"id": "parallel_168", "question": [[{"role": "user", "content": "\"Can you help me calculate the quarterly dividend per share for my company? We have just paid out a total of $5,000,000 in dividends and currently have 2,000,000 outstanding shares. Also, I am considering a scenario where we might increase our total payout to $6,000,000 while keeping the same number of outstanding shares. What would be the quarterly dividend per share in that case? And what if we also increase our outstanding shares to 2,500,000 while keeping the total payout at $6,000,000?\""}]], "function": [{"name": "finance.calculate_quarterly_dividend_per_share", "description": "Calculate quarterly dividend per share for a company given total dividend payout and outstanding shares", "parameters": {"type": "dict", "properties": {"total_payout": {"type": "integer", "description": "The total amount of dividends paid out in USD"}, "outstanding_shares": {"type": "integer", "description": "Total number of outstanding shares"}}, "required": ["total_payout", "outstanding_shares"], "optional": []}}]}
|
|
170
170
|
{"id": "parallel_169", "question": [[{"role": "user", "content": "\"Can you help me calculate the discounted cash flow of a bond? I have a bond with an annual coupon payment of $50, a time frame of 5 years, and a discount rate of 5%. Also, the face value of the bond is $1000. I would like to know the discounted cash flow for this bond. After that, I want to compare it with another bond that has an annual coupon payment of $60, a time frame of 7 years, and a discount rate of 4%, with the same face value of $1000. Can you calculate the discounted cash flow for this second bond as well?\""}]], "function": [{"name": "calculate_discounted_cash_flow", "description": "Calculate the discounted cash flow of a bond for a given annual coupon payment, time frame and discount rate.", "parameters": {"type": "dict", "properties": {"coupon_payment": {"type": "integer", "description": "The annual coupon payment."}, "period": {"type": "integer", "description": "The time frame in years for which coupon payment is made."}, "discount_rate": {"type": "float", "description": "The discount rate."}, "face_value": {"type": "integer", "description": "The face value of the bond, default is $1000."}}, "required": ["coupon_payment", "period", "discount_rate"]}}]}
|
|
171
|
-
{"id": "parallel_170", "question": [[{"role": "user", "content": "\"Can you help me calculate the compound interest for my savings? I initially invested $5000 as the principal amount. The bank offers an annual interest rate of 2.5
|
|
171
|
+
{"id": "parallel_170", "question": [[{"role": "user", "content": "\"Can you help me calculate the compound interest for my savings? I initially invested $5000 as the principal amount. The bank offers an annual interest rate of 2.5%. I plan to keep my money in the bank for 10 years. Also, the interest is compounded quarterly, so it's compounded 4 times in a year. Can you calculate the compound interest I would get for the first 2 years, first 3 years and first 5 years?\""}]], "function": [{"name": "calculate_compound_interest", "description": "Calculate compound interest for an initial principal amount.", "parameters": {"type": "dict", "properties": {"principal": {"type": "integer", "description": "The principal amount that the interest is applied to."}, "rate": {"type": "float", "description": "The annual interest rate. Enter as a decimal. E.g, 5% is 0.05"}, "time": {"type": "integer", "description": "The time the money is invested for in years."}, "n": {"type": "integer", "description": "The number of times that interest is compounded per time period. Default is 1."}}, "required": ["principal", "rate", "time"]}}]}
|
|
172
172
|
{"id": "parallel_171", "question": [[{"role": "user", "content": "\"Can you calculate the return on equity for two companies? The first company has a net income of $1,000,000, shareholder's equity of $5,000,000, and paid dividends of $200,000. The second company has a net income of $2,000,000, shareholder's equity of $10,000,000, but did not pay any dividends.\""}]], "function": [{"name": "calculate_return_on_equity", "description": "Calculate a company's return on equity based on its net income, shareholder's equity, and dividends paid.", "parameters": {"type": "dict", "properties": {"net_income": {"type": "integer", "description": "The company's net income."}, "shareholder_equity": {"type": "integer", "description": "The company's total shareholder's equity."}, "dividends_paid": {"type": "integer", "description": "The total dividends paid by the company. Optional. If not given, assumes it's 0 as default."}}, "required": ["net_income", "shareholder_equity"]}}]}
|
|
173
173
|
{"id": "parallel_172", "question": [[{"role": "user", "content": "\"Imagine you have two different investment opportunities. The first one has a present value of $5000, an annual interest rate of 5%, and you plan to hold it for 10 years. The second one has a present value of $7000, an annual interest rate of 4%, and you plan to hold it for 15 years. Both investments compound interest annually. Can you calculate the future value of both investments using the finance.predict_future_value function?\""}]], "function": [{"name": "finance.predict_future_value", "description": "Calculate the future value of an investment given its present value, interest rate, the number of compounding periods per year, and the time horizon.", "parameters": {"type": "dict", "properties": {"present_value": {"type": "integer", "description": "The present value of the investment."}, "annual_interest_rate": {"type": "float", "description": "The annual interest rate of the investment."}, "compounding_periods_per_year": {"type": "integer", "description": "The number of times that interest is compounded per year. Default is 1 (annually)."}, "time_years": {"type": "integer", "description": "The investment horizon in years."}}, "required": ["present_value", "annual_interest_rate", "time_years"]}}]}
|
|
174
174
|
{"id": "parallel_173", "question": [[{"role": "user", "content": "\"John has decided to invest in two different funds. He invested $5000 in Fund A which has an annual return rate of 7% and he plans to keep his money there for 5 years. On the other hand, he invested $8000 in Fund B with an annual return rate of 5% for a period of 7 years. Can you predict the profit John will make from both Fund A and Fund B?\""}]], "function": [{"name": "investment.predictProfit", "description": "Predict the profit for given investment after specified number of years.", "parameters": {"type": "dict", "properties": {"investment_amount": {"type": "integer", "description": "The amount invested in dollars."}, "annual_return": {"type": "float", "description": "The annual return rate of the investment."}, "years": {"type": "integer", "description": "The time period in years for which the investment is made."}}, "required": ["investment_amount", "annual_return", "years"]}}]}
|
package/data/{BFCL_v3_parallel_possible_answer.jsonl → BFCL_v4_parallel_possible_answer.jsonl}
RENAMED
|
@@ -153,10 +153,10 @@
|
|
|
153
153
|
{"id": "parallel_152", "ground_truth": [{"math.power": {"base": [2], "exponent": [3], "mod": ["", null]}}, {"math.power": {"base": [3], "exponent": [5], "mod": ["", null]}}]}
|
|
154
154
|
{"id": "parallel_153", "ground_truth": [{"train_random_forest_classifier": {"dataset": ["dataset1"], "max_depth": [10], "n_estimators": [100]}}, {"train_random_forest_classifier": {"dataset": ["dataset2"], "max_depth": [20], "n_estimators": [200]}}]}
|
|
155
155
|
{"id": "parallel_154", "ground_truth": [{"calculate_bmi": {"weight": [75], "height": [180], "system": ["metric", ""]}}, {"calculate_bmi": {"weight": [60], "height": [165], "system": ["metric", ""]}}, {"calculate_bmi": {"weight": [80], "height": [175], "system": ["metric", ""]}}, {"calculate_bmi": {"weight": [90], "height": [185], "system": ["metric", ""]}}]}
|
|
156
|
-
{"id": "parallel_155", "ground_truth": [{"run_linear_regression": {"predictors": [["Age", "Income", "Education"]], "target": ["Spending Score"], "standardize": [false]}}, {"run_linear_regression": {"predictors": [["Age", "Income", "Education"]], "target": ["Spending Score"], "standardize": [true
|
|
156
|
+
{"id": "parallel_155", "ground_truth": [{"run_linear_regression": {"predictors": [["Age", "Income", "Education"]], "target": ["Spending Score"], "standardize": [false]}}, {"run_linear_regression": {"predictors": [["Age", "Income", "Education"]], "target": ["Spending Score"], "standardize": [true]}}]}
|
|
157
157
|
{"id": "parallel_156", "ground_truth": [{"random_forest.train": {"n_estimators": [100], "max_depth": [10], "data": ["data_random_forest"]}}, {"random_forest.train": {"n_estimators": [200], "max_depth": [20], "data": ["data_random_forest"]}}, {"random_forest.train": {"n_estimators": [300], "max_depth": [30], "data": ["data_random_forest"]}}, {"random_forest.train": {"n_estimators": [400], "max_depth": [40], "data": ["data_random_forest"]}}]}
|
|
158
158
|
{"id": "parallel_157", "ground_truth": [{"predict_house_price": {"bedrooms": [3], "bathrooms": [2], "area": [1500], "location": ["New York", "New York, NY", "New York City", "NYC"]}}, {"predict_house_price": {"bedrooms": [4], "bathrooms": [3], "area": [2000], "location": ["Los Angeles", "Los Angeles, CA", "LA"]}}, {"predict_house_price": {"bedrooms": [2], "bathrooms": [1], "area": [1200], "location": ["Chicago"]}}, {"predict_house_price": {"bedrooms": [3], "bathrooms": [2], "area": [1800], "location": ["Miami"]}}]}
|
|
159
|
-
{"id": "parallel_158", "ground_truth": [{"random.normalvariate": {"mu": [5], "sigma": [2]}}, {"random.normalvariate": {"mu": [10], "sigma": [3]}}]}
|
|
159
|
+
{"id": "parallel_158", "ground_truth": [{"random.normalvariate": {"mu": [5], "sigma": [2]}}, {"random.normalvariate": {"mu": [5], "sigma": [2]}}, {"random.normalvariate": {"mu": [10], "sigma": [3]}}, {"random.normalvariate": {"mu": [10], "sigma": [3]}}]}
|
|
160
160
|
{"id": "parallel_159", "ground_truth": [{"probability.dice_roll": {"desired_number": [4], "number_of_rolls": [3], "die_sides": [6, ""]}}, {"probability.dice_roll": {"desired_number": [2], "number_of_rolls": [2], "die_sides": [6, ""]}}, {"probability.dice_roll": {"desired_number": [7], "number_of_rolls": [2], "die_sides": [8]}}]}
|
|
161
161
|
{"id": "parallel_160", "ground_truth": [{"prob_dist.binomial": {"trials": [20], "successes": [5], "p": [0.3]}}, {"prob_dist.binomial": {"trials": [50], "successes": [15], "p": [0.3]}}, {"prob_dist.binomial": {"trials": [100], "successes": [30], "p": [0.3]}}]}
|
|
162
162
|
{"id": "parallel_161", "ground_truth": [{"calculate_binomial_probability": {"number_of_trials": [10], "number_of_successes": [7], "probability_of_success": [0.6]}}, {"calculate_binomial_probability": {"number_of_trials": [15], "number_of_successes": [10], "probability_of_success": [0.6]}}, {"calculate_binomial_probability": {"number_of_trials": [20], "number_of_successes": [15], "probability_of_success": [0.6]}}]}
|