PyPI - palimpzest - Versions diffs - 0.7.21__py3-none-any.whl → 0.8.1__py3-none-any.whl - Mend

palimpzest 0.7.21__py3-none-any.whl → 0.8.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (89) hide show

palimpzest/__init__.py +37 -6
palimpzest/agents/__init__.py +0 -0
palimpzest/agents/compute_agents.py +0 -0
palimpzest/agents/search_agents.py +637 -0
palimpzest/constants.py +343 -209
palimpzest/core/data/context.py +393 -0
palimpzest/core/data/context_manager.py +163 -0
palimpzest/core/data/dataset.py +639 -0
palimpzest/core/data/{datareaders.py → iter_dataset.py} +202 -126
palimpzest/core/elements/groupbysig.py +16 -13
palimpzest/core/elements/records.py +166 -75
palimpzest/core/lib/schemas.py +152 -390
palimpzest/core/{data/dataclasses.py → models.py} +306 -170
palimpzest/policy.py +2 -27
palimpzest/prompts/__init__.py +35 -5
palimpzest/prompts/agent_prompts.py +357 -0
palimpzest/prompts/context_search.py +9 -0
palimpzest/prompts/convert_prompts.py +62 -6
palimpzest/prompts/filter_prompts.py +51 -6
palimpzest/prompts/join_prompts.py +163 -0
palimpzest/prompts/moa_proposer_convert_prompts.py +6 -6
palimpzest/prompts/prompt_factory.py +375 -47
palimpzest/prompts/split_proposer_prompts.py +1 -1
palimpzest/prompts/util_phrases.py +5 -0
palimpzest/prompts/validator.py +239 -0
palimpzest/query/execution/all_sample_execution_strategy.py +134 -76
palimpzest/query/execution/execution_strategy.py +210 -317
palimpzest/query/execution/execution_strategy_type.py +5 -7
palimpzest/query/execution/mab_execution_strategy.py +249 -136
palimpzest/query/execution/parallel_execution_strategy.py +153 -244
palimpzest/query/execution/single_threaded_execution_strategy.py +107 -64
palimpzest/query/generators/generators.py +160 -331
palimpzest/query/operators/__init__.py +15 -5
palimpzest/query/operators/aggregate.py +50 -33
palimpzest/query/operators/compute.py +201 -0
palimpzest/query/operators/convert.py +33 -19
palimpzest/query/operators/critique_and_refine_convert.py +7 -5
palimpzest/query/operators/distinct.py +62 -0
palimpzest/query/operators/filter.py +26 -16
palimpzest/query/operators/join.py +403 -0
palimpzest/query/operators/limit.py +3 -3
palimpzest/query/operators/logical.py +205 -77
palimpzest/query/operators/mixture_of_agents_convert.py +10 -8
palimpzest/query/operators/physical.py +27 -21
palimpzest/query/operators/project.py +3 -3
palimpzest/query/operators/rag_convert.py +7 -7
palimpzest/query/operators/retrieve.py +9 -9
palimpzest/query/operators/scan.py +81 -42
palimpzest/query/operators/search.py +524 -0
palimpzest/query/operators/split_convert.py +10 -8
palimpzest/query/optimizer/__init__.py +7 -9
palimpzest/query/optimizer/cost_model.py +108 -441
palimpzest/query/optimizer/optimizer.py +123 -181
palimpzest/query/optimizer/optimizer_strategy.py +66 -61
palimpzest/query/optimizer/plan.py +352 -67
palimpzest/query/optimizer/primitives.py +43 -19
palimpzest/query/optimizer/rules.py +484 -646
palimpzest/query/optimizer/tasks.py +127 -58
palimpzest/query/processor/config.py +42 -76
palimpzest/query/processor/query_processor.py +73 -18
palimpzest/query/processor/query_processor_factory.py +46 -38
palimpzest/schemabuilder/schema_builder.py +15 -28
palimpzest/utils/model_helpers.py +32 -77
palimpzest/utils/progress.py +114 -102
palimpzest/validator/__init__.py +0 -0
palimpzest/validator/validator.py +306 -0
{palimpzest-0.7.21.dist-info → palimpzest-0.8.1.dist-info}/METADATA +6 -1
palimpzest-0.8.1.dist-info/RECORD +95 -0
palimpzest/core/lib/fields.py +0 -141
palimpzest/prompts/code_synthesis_prompts.py +0 -28
palimpzest/query/execution/random_sampling_execution_strategy.py +0 -240
palimpzest/query/generators/api_client_factory.py +0 -30
palimpzest/query/operators/code_synthesis_convert.py +0 -488
palimpzest/query/operators/map.py +0 -130
palimpzest/query/processor/nosentinel_processor.py +0 -33
palimpzest/query/processor/processing_strategy_type.py +0 -28
palimpzest/query/processor/sentinel_processor.py +0 -88
palimpzest/query/processor/streaming_processor.py +0 -149
palimpzest/sets.py +0 -405
palimpzest/utils/datareader_helpers.py +0 -61
palimpzest/utils/demo_helpers.py +0 -75
palimpzest/utils/field_helpers.py +0 -69
palimpzest/utils/generation_helpers.py +0 -69
palimpzest/utils/sandbox.py +0 -183
palimpzest-0.7.21.dist-info/RECORD +0 -95
palimpzest/core/{elements/index.py → data/index_dataset.py} +0 -0
{palimpzest-0.7.21.dist-info → palimpzest-0.8.1.dist-info}/WHEEL +0 -0
{palimpzest-0.7.21.dist-info → palimpzest-0.8.1.dist-info}/licenses/LICENSE +0 -0
{palimpzest-0.7.21.dist-info → palimpzest-0.8.1.dist-info}/top_level.txt +0 -0

palimpzest/prompts/filter_prompts.py CHANGED Viewed

@@ -12,8 +12,8 @@ INPUT FIELDS:
 {example_input_fields}
 CONTEXT:
-{example_context}
-{image_disclaimer}
+{example_context}{image_disclaimer}{audio_disclaimer}
 FILTER CONDITION: {example_filter_condition}
 Let's think step-by-step in order to answer the question.
@@ -24,31 +24,67 @@ ANSWER: TRUE
 ---
 """
-COT_BOOL_BASE_USER_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
+COT_BOOL_NO_REASONING_BASE_SYSTEM_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
 You will be presented with a context and a filter condition. Output TRUE if the context satisfies the filter condition, and FALSE otherwise.
+Remember, your answer must be TRUE or FALSE. Finish your response with a newline character followed by ---
+An example is shown below:
+---
+INPUT FIELDS:
+{example_input_fields}
+CONTEXT:
+{example_context}{image_disclaimer}{audio_disclaimer}
+FILTER CONDITION: {example_filter_condition}
+ANSWER: TRUE
+---
+"""
+COT_BOOL_BASE_USER_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
+You will be presented with a context and a filter condition. Output TRUE if the context satisfies the filter condition, and FALSE otherwise.
+{desc_section}
 Remember, your answer must be TRUE or FALSE. Finish your response with a newline character followed by ---
 ---
 INPUT FIELDS:
 {input_fields_desc}
 CONTEXT:
-{context}
-<<image-placeholder>>
+{context}<<image-placeholder>><<audio-placeholder>>
 FILTER CONDITION: {filter_condition}
 Let's think step-by-step in order to answer the question.
 REASONING: """
+COT_BOOL_NO_REASONING_BASE_USER_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
+You will be presented with a context and a filter condition. Output TRUE if the context satisfies the filter condition, and FALSE otherwise.
+{desc_section}
+Remember, your answer must be TRUE or FALSE. Finish your response with a newline character followed by ---
+---
+INPUT FIELDS:
+{input_fields_desc}
+CONTEXT:
+{context}<<image-placeholder>><<audio-placeholder>>
+FILTER CONDITION: {filter_condition}
+ANSWER: """
 ### TEMPLATE INPUTS ###
 COT_BOOL_JOB_INSTRUCTION = """answer a TRUE / FALSE question"""
 COT_BOOL_IMAGE_JOB_INSTRUCTION = """analyze input image(s) and/or text in order to answer a TRUE / FALSE question"""
+COT_BOOL_AUDIO_JOB_INSTRUCTION = """analyze input audio and/or text in order to answer a TRUE / FALSE question"""
 COT_BOOL_EXAMPLE_INPUT_FIELDS = """- text: a short passage of text"""
 COT_BOOL_IMAGE_EXAMPLE_INPUT_FIELDS = """- image: an image of a scene
 - photographer: the photographer of the image"""
+COT_BOOL_AUDIO_EXAMPLE_INPUT_FIELDS = """- recording: an audio recording of a newscast
+- speaker: the name of the speaker in the recording"""
 COT_BOOL_EXAMPLE_CONTEXT = """{{
   "text": "The quick brown fox jumps over the lazy dog."
@@ -57,13 +93,22 @@ COT_BOOL_IMAGE_EXAMPLE_CONTEXT = """{{
   "image": <bytes>,
   "photographer": "CameraEnthusiast1"
 }}"""
+COT_BOOL_AUDIO_EXAMPLE_CONTEXT = """{{
+  "recording": <bytes>,
+  "speaker": "Walter Cronkite"
+}}"""
 COT_BOOL_EXAMPLE_FILTER_CONDITION = "the text mentions an animal"
 COT_BOOL_IMAGE_EXAMPLE_FILTER_CONDITION = "there's an animal in this image"
+COT_BOOL_AUDIO_EXAMPLE_FILTER_CONDITION = "the newscast discusses a flashpoint in the Cold War"
 COT_BOOL_IMAGE_DISCLAIMER = """
-<image content provided here; assume in this example the image shows a dog and a cat playing>
+\n<image content provided here; assume in this example the image shows a dog and a cat playing>
+"""
+COT_BOOL_AUDIO_DISCLAIMER = """
+\n<audio content provided here; assume in this example the recording is about the Cuban Missile Crisis>
 """
 COT_BOOL_EXAMPLE_REASONING = """the text mentions the words "fox" and "dog" which are animals, therefore the answer is TRUE."""
 COT_BOOL_IMAGE_EXAMPLE_REASONING = """the image shows a dog and a cat playing, both of which are animals, therefore the answer is TRUE."""
+COT_BOOL_AUDIO_EXAMPLE_REASONING = """the newscast discusses the Cuban Missile Crisis, which was a flashpoint in the Cold War, therefore the answer is TRUE."""

palimpzest/prompts/join_prompts.py ADDED Viewed

@@ -0,0 +1,163 @@
+"""This file contains prompts for join operations."""
+### BASE PROMPTS ###
+COT_JOIN_BASE_SYSTEM_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
+You will be presented with two data records and a join condition. Output TRUE if the two data records satisfy the join condition, and FALSE otherwise.
+Remember, your answer must be TRUE or FALSE. Finish your response with a newline character followed by ---
+An example is shown below:
+---
+LEFT INPUT FIELDS:
+{example_input_fields}
+LEFT CONTEXT:
+{example_context}{image_disclaimer}{audio_disclaimer}
+RIGHT INPUT FIELDS:
+{right_example_input_fields}
+RIGHT CONTEXT:
+{right_example_context}{right_image_disclaimer}{right_audio_disclaimer}
+JOIN CONDITION: {example_join_condition}
+Let's think step-by-step in order to evaluate the join condition.
+REASONING: {example_reasoning}
+ANSWER: TRUE
+---
+"""
+COT_JOIN_NO_REASONING_BASE_SYSTEM_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
+You will be presented with two data records and a join condition. Output TRUE if the two data records satisfy the join condition, and FALSE otherwise.
+Remember, your answer must be TRUE or FALSE. Finish your response with a newline character followed by ---
+An example is shown below:
+---
+LEFT INPUT FIELDS:
+{example_input_fields}
+LEFT CONTEXT:
+{example_context}{image_disclaimer}{audio_disclaimer}
+RIGHT INPUT FIELDS:
+{right_example_input_fields}
+RIGHT CONTEXT:
+{right_example_context}{right_image_disclaimer}{right_audio_disclaimer}
+JOIN CONDITION: {example_join_condition}
+ANSWER: TRUE
+---
+"""
+COT_JOIN_BASE_USER_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
+You will be presented with two data records and a join condition. Output TRUE if the two data records satisfy the join condition, and FALSE otherwise.
+{desc_section}
+Remember, your answer must be TRUE or FALSE. Finish your response with a newline character followed by ---
+---
+LEFT INPUT FIELDS:
+{input_fields_desc}
+LEFT CONTEXT:
+{context}<<image-placeholder>><<audio-placeholder>>
+RIGHT INPUT FIELDS:
+{right_input_fields_desc}
+RIGHT CONTEXT:
+{right_context}<<image-placeholder>><<audio-placeholder>>
+JOIN CONDITION: {join_condition}
+Let's think step-by-step in order to evaluate the join condition.
+REASONING: """
+COT_JOIN_NO_REASONING_BASE_USER_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
+You will be presented with two data records and a join condition. Output TRUE if the two data records satisfy the join condition, and FALSE otherwise.
+{desc_section}
+Remember, your answer must be TRUE or FALSE. Finish your response with a newline character followed by ---
+---
+LEFT INPUT FIELDS:
+{input_fields_desc}
+LEFT CONTEXT:
+{context}<<image-placeholder>><<audio-placeholder>>
+RIGHT INPUT FIELDS:
+{right_input_fields_desc}
+RIGHT CONTEXT:
+{right_context}<<image-placeholder>><<audio-placeholder>>
+JOIN CONDITION: {join_condition}
+ANSWER: """
+### TEMPLATE INPUTS ###
+COT_JOIN_JOB_INSTRUCTION = """determine whether two data records satisfy a join condition"""
+COT_JOIN_IMAGE_JOB_INSTRUCTION = """analyze input image(s) and/or text in order to determine whether two data records satisfy a join condition"""
+COT_JOIN_AUDIO_JOB_INSTRUCTION = """analyze input audio and/or text in order to determine whether two data records satisfy a join condition"""
+COT_JOIN_EXAMPLE_INPUT_FIELDS = """- text: a short passage of text"""
+COT_JOIN_IMAGE_EXAMPLE_INPUT_FIELDS = """- image: an image of a scene
+- photographer: the photographer of the image"""
+COT_JOIN_AUDIO_EXAMPLE_INPUT_FIELDS = """- recording: an audio recording of a newscast
+- speaker: the name of the speaker in the recording"""
+COT_JOIN_RIGHT_EXAMPLE_INPUT_FIELDS = """- contents: the contents of a text file"""
+COT_JOIN_IMAGE_RIGHT_EXAMPLE_INPUT_FIELDS = """- image: an image of a scene
+- photographer: the photographer of the image"""
+COT_JOIN_AUDIO_RIGHT_EXAMPLE_INPUT_FIELDS = """- recording: an audio recording of a newscast
+- speaker: the name of the speaker in the recording"""
+COT_JOIN_EXAMPLE_CONTEXT = """{{
+  "text": "The quick brown fox jumps over the lazy dog."
+}}"""
+COT_JOIN_IMAGE_EXAMPLE_CONTEXT = """{{
+  "image": <bytes>,
+  "photographer": "CameraEnthusiast1"
+}}"""
+COT_JOIN_AUDIO_EXAMPLE_CONTEXT = """{{
+  "recording": <bytes>,
+  "speaker": "Walter Cronkite"
+}}"""
+COT_JOIN_RIGHT_EXAMPLE_CONTEXT = """{{
+  "contents": "Foxes are wild animals which primarily hunt small mammals like rabbits and rodents."
+}}"""
+COT_JOIN_IMAGE_RIGHT_EXAMPLE_CONTEXT = """{{
+  "image": <bytes>,
+  "filename": "img123.png"
+}}"""
+COT_JOIN_AUDIO_RIGHT_EXAMPLE_CONTEXT = """{{
+  "recording": <bytes>,
+  "speaker": "Barbara Walters"
+}}"""
+COT_JOIN_EXAMPLE_JOIN_CONDITION = "each record mentions the same animal"
+COT_JOIN_IMAGE_EXAMPLE_JOIN_CONDITION = "the images are of the same subject"
+COT_JOIN_AUDIO_EXAMPLE_JOIN_CONDITION = "the recordings are about the same subject"
+COT_JOIN_IMAGE_DISCLAIMER = """
+\n<image content provided here; assume in this example the image shows a horse in a field>
+"""
+COT_JOIN_AUDIO_DISCLAIMER = """
+\n<audio content provided here; assume in this example the recording is about the Cuban Missile Crisis>
+"""
+COT_JOIN_RIGHT_IMAGE_DISCLAIMER = """
+\n<image content provided here; assume in this example the image shows a horse in its stable>
+"""
+COT_JOIN_RIGHT_AUDIO_DISCLAIMER = """
+\n<audio content provided here; assume in this example the recording is from a telecast about the Cuban Missile Crisis's historical significance>
+"""
+COT_JOIN_EXAMPLE_REASONING = """both passages mention a fox, which is the same animal, therefore the answer is TRUE."""
+COT_JOIN_IMAGE_EXAMPLE_REASONING = """both images show a horse, which appears to be the main subject of each image, therefore the answer is TRUE."""
+COT_JOIN_AUDIO_EXAMPLE_REASONING = """both recordings discuss the Cuban Missile Crisis, which is the same subject, therefore the answer is TRUE."""

palimpzest/prompts/moa_proposer_convert_prompts.py CHANGED Viewed

@@ -16,8 +16,8 @@ OUTPUT FIELDS:
 {example_output_fields}
 CONTEXT:
-{example_context}
-{image_disclaimer}
+{example_context}{image_disclaimer}
 Let's think step-by-step in order to answer the question.
 ANSWER: {example_answer}
@@ -27,7 +27,7 @@ ANSWER: {example_answer}
 COT_MOA_PROPOSER_BASE_USER_PROMPT = """You are a helpful assistant whose job is to {job_instruction}.
 You will be presented with a context and a set of output fields to generate. Your task is to generate a paragraph or two which describes what you believe is the correct value for each output field.
 Be sure to cite information from the context as evidence of why your answers are correct. Do not hallucinate evidence.
+{desc_section}
 You will be provided with a description of each input field and each output field.
 ---
 INPUT FIELDS:
@@ -37,8 +37,8 @@ OUTPUT FIELDS:
 {output_fields_desc}
 CONTEXT:
-{context}
-<<image-placeholder>>
+{context}<<image-placeholder>>
 Let's think step-by-step in order to answer the question.
 ANSWER: """
@@ -68,7 +68,7 @@ COT_MOA_PROPOSER_IMAGE_EXAMPLE_CONTEXT = """{{
 }}"""
 COT_MOA_PROPOSER_IMAGE_DISCLAIMER = """
-<image content provided here; assume in this example the image shows a dog and a cat playing>
+\n<image content provided here; assume in this example the image shows a dog and a cat playing>
 """
 COT_MOA_PROPOSER_EXAMPLE_ANSWER = """the text passage mentions the scientist's name as "Augusta Ada King, Countess of Lovelace, also known as Ada Lovelace" and the scientist's birthday as "December 10, 1815". Therefore, the name of the scientist is "Augusta Ada King" and the birth year is 1815."""

palimpzest 0.7.21__py3-none-any.whl → 0.8.1__py3-none-any.whl

palimpzest 0.7.21__py3-none-any.whl → 0.8.1__py3-none-any.whl