plancraft 0.3.19__py3-none-any.whl → 0.3.20__py3-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those package versions as they appear in their respective public registries.
plancraft/evaluator.py CHANGED
@@ -292,7 +292,7 @@ class Evaluator:
292
292
  # Get observations for all active environments
293
293
  observations = []
294
294
  active_indices = []
295
- obs_mapping = {} # Map active_indices to their observation index
295
+ active_histories = []
296
296
 
297
297
  for i, (env, action, active) in enumerate(
298
298
  zip(environments, actions, active_mask)
@@ -314,14 +314,12 @@ class Evaluator:
314
314
  }
315
315
  continue
316
316
 
317
- active_indices.append(i)
317
+ # Get observation
318
318
  if isinstance(action, str):
319
- # Handle message action
320
319
  obs = env.step()
321
320
  obs["target"] = examples[i].target
322
321
  obs["message"] = action
323
322
  else:
324
- # Handle environment action
325
323
  obs = env.step(action)
326
324
  obs["target"] = examples[i].target
327
325
  obs["message"] = self.convert_observation_to_message(
@@ -342,10 +340,12 @@ class Evaluator:
342
340
  }
343
341
  continue
344
342
 
345
- obs_mapping[i] = len(
346
- observations
347
- ) # Map active index to observation index
343
+ # Add to batch lists
344
+ active_indices.append(i)
348
345
  observations.append(obs)
346
+ active_histories.append(histories[i])
347
+
348
+ # Update history
349
349
  histories[i].add_observation_to_history(obs)
350
350
  histories[i].add_message_to_history(content=obs["message"], role="user")
351
351
  steps_taken[i] += 1
@@ -354,21 +354,20 @@ class Evaluator:
354
354
  break
355
355
 
356
356
  # Batch predict actions for active environments
357
- active_histories = [histories[i] for i in active_indices]
358
357
  raw_actions = model.batch_step(
359
358
  observations, dialogue_histories=active_histories
360
359
  )
361
360
 
362
361
  # Process actions for each active environment
363
- for idx, raw_action in zip(active_indices, raw_actions):
362
+ for batch_idx, (idx, raw_action) in enumerate(
363
+ zip(active_indices, raw_actions)
364
+ ):
364
365
  histories[idx].add_message_to_history(
365
366
  content=raw_action, role="assistant"
366
367
  )
367
368
  actions[idx] = self.parse_raw_model_response(
368
369
  raw_action,
369
- observation=observations[
370
- obs_mapping[idx]
371
- ], # Use mapping to get correct observation
370
+ observation=observations[batch_idx],
372
371
  history=histories[idx],
373
372
  )
374
373
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: plancraft
3
- Version: 0.3.19
3
+ Version: 0.3.20
4
4
  Summary: Plancraft: an evaluation dataset for planning with LLM agents
5
5
  License: MIT License
6
6
 
@@ -1,6 +1,6 @@
1
1
  plancraft/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
2
2
  plancraft/config.py,sha256=ShsFRlJ7plsl3ToD9fiO_4LDQuXdbjNV6Xp6o3Yk2Yg,4315
3
- plancraft/evaluator.py,sha256=SXg7UoZ9KqjxgLkBo53BMw9XdR2nwMx7mDEXVwVhBiM,16544
3
+ plancraft/evaluator.py,sha256=R_RZN9AL_ae0rIvj7HLhYolTpCVMuhPTJfIrmyoLaX4,16326
4
4
  plancraft/generate_dataset.py,sha256=DlrU-PmvWqSNJD1g1-8Lpb8n3N-Ogw3rje1nrRzjGKs,2382
5
5
  plancraft/utils.py,sha256=67UUDMSv8TqX_I0fL5-yG_vkHvTZlnhSLkktWAg5p34,5712
6
6
  plancraft/data/test.json,sha256=4jWfYMAVuZCFmGB4iZJAjlh9_8jXECdaGp8xn7_tAM4,1317131
@@ -1920,7 +1920,7 @@ plancraft/models/generators.py,sha256=F76_iPiqxUjDIrQwF58tzM0bLM91OkZJ0sBqBuki5w
1920
1920
  plancraft/models/oracle.py,sha256=f-0KWlBuHy6wcxmDsxM3MQ_QwfBstzfbA26mlk1MgLA,1657
1921
1921
  plancraft/models/utils.py,sha256=E-sZohvolWgGbpHQKgAgkgIfUJoVnT5pMt6JP8xLHKg,4034
1922
1922
  plancraft/train/dataset.py,sha256=oFqEd4LG9oEQ-71teh0Wf7-jJbtybT2ZibfM2bBdBkM,5474
1923
- plancraft-0.3.19.dist-info/METADATA,sha256=mA9CYITxxP37FICRAeVEq9j1WyBEeaWnVAPJsQnA1Ho,11148
1924
- plancraft-0.3.19.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
1925
- plancraft-0.3.19.dist-info/licenses/LICENSE,sha256=YGR8ehDB4t-T-lOQKMfKNR-2zsOU7E3E5NA8t25HKE0,1070
1926
- plancraft-0.3.19.dist-info/RECORD,,
1923
+ plancraft-0.3.20.dist-info/METADATA,sha256=7Gs3Txfw2YCBVDAstW7K69fho4vktcYp6sw6g2nQOYE,11148
1924
+ plancraft-0.3.20.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
1925
+ plancraft-0.3.20.dist-info/licenses/LICENSE,sha256=YGR8ehDB4t-T-lOQKMfKNR-2zsOU7E3E5NA8t25HKE0,1070
1926
+ plancraft-0.3.20.dist-info/RECORD,,