sdg-hub 0.2.1__py3-none-any.whl → 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (44)
  1. sdg_hub/_version.py +16 -3
  2. sdg_hub/core/blocks/deprecated_blocks/selector.py +1 -1
  3. sdg_hub/core/blocks/evaluation/evaluate_faithfulness_block.py +175 -416
  4. sdg_hub/core/blocks/evaluation/evaluate_relevancy_block.py +174 -415
  5. sdg_hub/core/blocks/evaluation/verify_question_block.py +180 -415
  6. sdg_hub/core/blocks/llm/client_manager.py +92 -43
  7. sdg_hub/core/blocks/llm/config.py +1 -0
  8. sdg_hub/core/blocks/llm/llm_chat_block.py +74 -16
  9. sdg_hub/core/blocks/llm/llm_chat_with_parsing_retry_block.py +277 -115
  10. sdg_hub/core/blocks/llm/text_parser_block.py +88 -23
  11. sdg_hub/core/blocks/registry.py +48 -34
  12. sdg_hub/core/blocks/transform/__init__.py +2 -0
  13. sdg_hub/core/blocks/transform/index_based_mapper.py +1 -1
  14. sdg_hub/core/blocks/transform/json_structure_block.py +142 -0
  15. sdg_hub/core/flow/base.py +326 -62
  16. sdg_hub/core/utils/datautils.py +54 -0
  17. sdg_hub/core/utils/flow_metrics.py +261 -0
  18. sdg_hub/core/utils/logger_config.py +50 -9
  19. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/__init__.py +0 -0
  20. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/__init__.py +0 -0
  21. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/detailed_summary.yaml +11 -0
  22. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/flow.yaml +159 -0
  23. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/__init__.py +0 -0
  24. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/extractive_summary.yaml +65 -0
  25. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/flow.yaml +161 -0
  26. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_answers.yaml +15 -0
  27. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_multiple_qa.yaml +21 -0
  28. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_question_list.yaml +44 -0
  29. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/__init__.py +0 -0
  30. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/flow.yaml +104 -0
  31. sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/key_facts_summary.yaml +61 -0
  32. sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml +0 -7
  33. sdg_hub/flows/text_analysis/__init__.py +2 -0
  34. sdg_hub/flows/text_analysis/structured_insights/__init__.py +6 -0
  35. sdg_hub/flows/text_analysis/structured_insights/analyze_sentiment.yaml +27 -0
  36. sdg_hub/flows/text_analysis/structured_insights/extract_entities.yaml +38 -0
  37. sdg_hub/flows/text_analysis/structured_insights/extract_keywords.yaml +21 -0
  38. sdg_hub/flows/text_analysis/structured_insights/flow.yaml +153 -0
  39. sdg_hub/flows/text_analysis/structured_insights/summarize.yaml +21 -0
  40. {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/METADATA +42 -15
  41. {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/RECORD +44 -22
  42. {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/WHEEL +0 -0
  43. {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/licenses/LICENSE +0 -0
  44. {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,153 @@
1
+ metadata:
2
+ id: green-clay-812
3
+ name: "Structured Text Insights Extraction Flow"
4
+ description: >-
5
+ Multi-step pipeline for extracting structured insights from text including
6
+ summary, keywords, entities, and sentiment analysis combined into a JSON output
7
+ version: "1.0.0"
8
+ author: "SDG Hub Contributors"
9
+ recommended_models:
10
+ default: "openai/gpt-oss-120b"
11
+ compatible:
12
+ - "meta-llama/Llama-3.3-70B-Instruct"
13
+ - "microsoft/phi-4"
14
+ - "mistralai/Mixtral-8x7B-Instruct-v0.1"
15
+ experimental:
16
+ - "gpt-4o"
17
+ tags:
18
+ - "text-analysis"
19
+ - "summarization"
20
+ - "nlp"
21
+ - "structured-output"
22
+ - "insights"
23
+ - "sentiment-analysis"
24
+ - "entity-extraction"
25
+ - "keyword-extraction"
26
+ license: "Apache-2.0"
27
+ min_sdg_hub_version: "0.3.0"
28
+ dataset_requirements:
29
+ required_columns:
30
+ - "text"
31
+ description: >-
32
+ Input dataset should contain text content for analysis. Each text should be
33
+ substantial enough for meaningful analysis (minimum 50 words recommended).
34
+ Works well with news articles, blog posts, reviews, and other content.
35
+
36
+ blocks:
37
+ # Extract Summary
38
+ - block_type: "PromptBuilderBlock"
39
+ block_config:
40
+ block_name: "build_summary_prompt"
41
+ input_cols:
42
+ - "text"
43
+ output_cols: "summary_prompt"
44
+ prompt_config_path: "summarize.yaml"
45
+ - block_type: "LLMChatBlock"
46
+ block_config:
47
+ block_name: "generate_summary"
48
+ input_cols: "summary_prompt"
49
+ output_cols: "raw_summary"
50
+ max_tokens: 1024
51
+ temperature: 0.3
52
+ async_mode: true
53
+ - block_type: "TextParserBlock"
54
+ block_config:
55
+ block_name: "parse_summary"
56
+ input_cols: "raw_summary"
57
+ output_cols: "summary"
58
+ start_tags:
59
+ - "[SUMMARY]"
60
+ end_tags:
61
+ - "[/SUMMARY]"
62
+
63
+ # Extract Keywords
64
+ - block_type: "PromptBuilderBlock"
65
+ block_config:
66
+ block_name: "build_keywords_prompt"
67
+ input_cols:
68
+ - "text"
69
+ output_cols: "keywords_prompt"
70
+ prompt_config_path: "extract_keywords.yaml"
71
+ - block_type: "LLMChatBlock"
72
+ block_config:
73
+ block_name: "generate_keywords"
74
+ input_cols: "keywords_prompt"
75
+ output_cols: "raw_keywords"
76
+ max_tokens: 512
77
+ temperature: 0.3
78
+ async_mode: true
79
+ - block_type: "TextParserBlock"
80
+ block_config:
81
+ block_name: "parse_keywords"
82
+ input_cols: "raw_keywords"
83
+ output_cols: "keywords"
84
+ start_tags:
85
+ - "[KEYWORDS]"
86
+ end_tags:
87
+ - "[/KEYWORDS]"
88
+
89
+ # Extract Entities
90
+ - block_type: "PromptBuilderBlock"
91
+ block_config:
92
+ block_name: "build_entities_prompt"
93
+ input_cols:
94
+ - "text"
95
+ output_cols: "entities_prompt"
96
+ prompt_config_path: "extract_entities.yaml"
97
+ - block_type: "LLMChatBlock"
98
+ block_config:
99
+ block_name: "generate_entities"
100
+ input_cols: "entities_prompt"
101
+ output_cols: "raw_entities"
102
+ max_tokens: 1024
103
+ temperature: 0.3
104
+ async_mode: true
105
+ - block_type: "TextParserBlock"
106
+ block_config:
107
+ block_name: "parse_entities"
108
+ input_cols: "raw_entities"
109
+ output_cols: "entities"
110
+ start_tags:
111
+ - "[ENTITIES]"
112
+ end_tags:
113
+ - "[/ENTITIES]"
114
+
115
+ # Extract Sentiment
116
+ - block_type: "PromptBuilderBlock"
117
+ block_config:
118
+ block_name: "build_sentiment_prompt"
119
+ input_cols:
120
+ - "text"
121
+ output_cols: "sentiment_prompt"
122
+ prompt_config_path: "analyze_sentiment.yaml"
123
+ - block_type: "LLMChatBlock"
124
+ block_config:
125
+ block_name: "generate_sentiment"
126
+ input_cols: "sentiment_prompt"
127
+ output_cols: "raw_sentiment"
128
+ max_tokens: 256
129
+ temperature: 0.1
130
+ async_mode: true
131
+ - block_type: "TextParserBlock"
132
+ block_config:
133
+ block_name: "parse_sentiment"
134
+ input_cols: "raw_sentiment"
135
+ output_cols: "sentiment"
136
+ start_tags:
137
+ - "[SENTIMENT]"
138
+ end_tags:
139
+ - "[/SENTIMENT]"
140
+
141
+ # Create Structured Insights
142
+ - block_type: "JSONStructureBlock"
143
+ block_config:
144
+ block_name: "create_structured_insights"
145
+ input_cols:
146
+ - "summary"
147
+ - "keywords"
148
+ - "entities"
149
+ - "sentiment"
150
+ output_cols:
151
+ - "structured_insights"
152
+ ensure_json_serializable: true
153
+
@@ -0,0 +1,21 @@
1
+ - role: system
2
+ content: You are an AI assistant expert at creating concise, informative summaries that capture the most important information from text.
3
+
4
+ - role: user
5
+ content: |
6
+ Create a brief, concise summary of the following text. Your summary should:
7
+
8
+ 1. Be 2-3 sentences maximum
9
+ 2. Capture the most important information and key points
10
+ 3. Be clear and easy to understand
11
+ 4. Avoid adding any information not present in the original text
12
+ 5. Focus on the main topic, key facts, and significant details
13
+
14
+ Text to summarize:
15
+ {{text}}
16
+
17
+ Provide your response in the following format:
18
+ [SUMMARY]
19
+ Your summary here
20
+ [/SUMMARY]
21
+
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: sdg_hub
3
- Version: 0.2.1
3
+ Version: 0.3.0
4
4
  Summary: Synthetic Data Generation
5
5
  Author-email: Red Hat AI Innovation <abhandwa@redhat.com>
6
6
  License: Apache-2.0
@@ -27,7 +27,6 @@ Requires-Dist: datasets<4.0.0,>=2.18.0
27
27
  Requires-Dist: httpx<1.0.0,>=0.25.0
28
28
  Requires-Dist: jinja2
29
29
  Requires-Dist: litellm<1.75.0,>=1.73.0
30
- Requires-Dist: openai<2.0.0,>=1.13.3
31
30
  Requires-Dist: rich
32
31
  Requires-Dist: pydantic<3.0.0,>=2.0.0
33
32
  Requires-Dist: python-dotenv<2.0.0,>=1.0.0
@@ -54,6 +53,7 @@ Requires-Dist: sentence-transformers; extra == "examples"
54
53
  Requires-Dist: instructor; extra == "examples"
55
54
  Requires-Dist: fastapi; extra == "examples"
56
55
  Requires-Dist: nest-asyncio; extra == "examples"
56
+ Requires-Dist: ipykernel; extra == "examples"
57
57
  Provides-Extra: dev
58
58
  Requires-Dist: pre-commit<4.0,>=3.0.4; extra == "dev"
59
59
  Requires-Dist: pylint<4.0,>=2.16.2; extra == "dev"
@@ -64,6 +64,7 @@ Requires-Dist: pytest-cov; extra == "dev"
64
64
  Requires-Dist: pytest-html; extra == "dev"
65
65
  Requires-Dist: tox<5,>=4.4.2; extra == "dev"
66
66
  Requires-Dist: ruff; extra == "dev"
67
+ Requires-Dist: pytest-env; extra == "dev"
67
68
  Dynamic: license-file
68
69
 
69
70
  # `sdg_hub`: Synthetic Data Generation Toolkit
@@ -92,6 +93,8 @@ A modular Python framework for building synthetic data generation pipelines usin
92
93
 
93
94
  **📊 Rich Monitoring** - Detailed logging with progress bars and execution summaries.
94
95
 
96
+ **📋 Dataset Schema Discovery** - Instantly discover the data format a flow requires. Get an empty dataset with the correct schema for easy validation and data preparation.
97
+
95
98
  **🧩 Easily Extensible** - Create custom blocks with simple inheritance. Rich logging and monitoring built-in.
96
99
 
97
100
 
@@ -176,22 +179,46 @@ flow.set_model_config(
176
179
  api_key="your_key",
177
180
  )
178
181
  ```
179
- #### Load your dataset and run the flow
182
+ #### Discover dataset requirements and create your dataset
180
183
  ```python
181
- # Create your dataset with required columns
182
- dataset = Dataset.from_dict({
183
- 'document': ['Your document text here...'],
184
- 'document_outline': ['1. Topic A; 2. Topic B; 3. Topic C'],
185
- 'domain': ['Computer Science'],
186
- 'icl_document': ['Example document for in-context learning...'],
187
- 'icl_query_1': ['Example question 1?'],
188
- 'icl_response_1': ['Example answer 1'],
189
- 'icl_query_2': ['Example question 2?'],
190
- 'icl_response_2': ['Example answer 2'],
191
- 'icl_query_3': ['Example question 3?'],
192
- 'icl_response_3': ['Example answer 3']
184
+ # First, discover what data the flow needs
185
+ # Get an empty dataset with the exact schema needed
186
+ schema_dataset = flow.get_dataset_schema()
187
+ print(f"Required columns: {schema_dataset.column_names}")
188
+ print(f"Schema: {schema_dataset.features}")
189
+
190
+ # Option 1: Add data directly to the schema dataset
191
+ dataset = schema_dataset.add_item({
192
+ 'document': 'Your document text here...',
193
+ 'document_outline': '1. Topic A; 2. Topic B; 3. Topic C',
194
+ 'domain': 'Computer Science',
195
+ 'icl_document': 'Example document for in-context learning...',
196
+ 'icl_query_1': 'Example question 1?',
197
+ 'icl_response_1': 'Example answer 1',
198
+ 'icl_query_2': 'Example question 2?',
199
+ 'icl_response_2': 'Example answer 2',
200
+ 'icl_query_3': 'Example question 3?',
201
+ 'icl_response_3': 'Example answer 3'
193
202
  })
194
203
 
204
+ # Option 2: Create your own dataset and validate the schema
205
+ my_dataset = Dataset.from_dict(my_data_dict)
206
+ if my_dataset.features == schema_dataset.features:
207
+ print("✅ Schema matches - ready to generate!")
208
+ dataset = my_dataset
209
+ else:
210
+ print("❌ Schema mismatch - check your columns")
211
+
212
+ # Option 3: Get raw requirements for detailed inspection
213
+ requirements = flow.get_dataset_requirements()
214
+ if requirements:
215
+ print(f"Required: {requirements.required_columns}")
216
+ print(f"Optional: {requirements.optional_columns}")
217
+ print(f"Min samples: {requirements.min_samples}")
218
+ ```
219
+
220
+ #### Dry Run and Generate
221
+ ```python
195
222
  # Quick Testing with Dry Run
196
223
  dry_result = flow.dry_run(dataset, sample_size=1)
197
224
  print(f"Dry run completed in {dry_result['execution_time_seconds']:.2f}s")
@@ -1,10 +1,10 @@
1
1
  sdg_hub/__init__.py,sha256=Tw-6R5a8_W1kJcTAsW3R9ltBDP1dy5-fe7Tvt3cSyCQ,550
2
- sdg_hub/_version.py,sha256=UoNvMtd4wCG76RwoSpNCUtaFyTwakGcZolfjXzNVSMY,511
2
+ sdg_hub/_version.py,sha256=5zTqm8rgXsWYBpB2M3Zw_K1D-aV8wP7NsBLrmMKkrAQ,704
3
3
  sdg_hub/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
4
4
  sdg_hub/core/__init__.py,sha256=NwqB4fwhC29W50VW7QXZssLxx122YvgO9LHDLdgAnrI,496
5
5
  sdg_hub/core/blocks/__init__.py,sha256=9sCkCvDQzJGSedaePVlEIpbNwrkBz_K500VW_6FLhuE,1601
6
6
  sdg_hub/core/blocks/base.py,sha256=TrzUAkG7Tiquk0Z3SOFsb5mRnHd1IbHH6gFPVH1P7T8,10424
7
- sdg_hub/core/blocks/registry.py,sha256=U__75QrxFpRaJlt36mOd26dgOqBeePs-ZX0Rnutp6r0,9782
7
+ sdg_hub/core/blocks/registry.py,sha256=FuEN_pnq-nSH1LguY3_oCubT6Kz3SuJjk3TcUpLT-lw,10695
8
8
  sdg_hub/core/blocks/deprecated_blocks/__init__.py,sha256=RDu3MWFStDQko-TKkx8tGoB1UTatP_RSldZK43zHDvY,889
9
9
  sdg_hub/core/blocks/deprecated_blocks/combine_columns.py,sha256=HCvpaYsAwgx1Dm0vIshcWsKoVsRT0KrmKp9j4oqtByc,2757
10
10
  sdg_hub/core/blocks/deprecated_blocks/duplicate_columns.py,sha256=maCaaEs0EMMzt7L1xm7fAH3ylaFMHEkeC_dtOw3FrjU,2694
@@ -13,44 +13,59 @@ sdg_hub/core/blocks/deprecated_blocks/flatten_columns.py,sha256=IenCskrPEv09h2uT
13
13
  sdg_hub/core/blocks/deprecated_blocks/llmblock.py,sha256=34lzC43BODpMk5AwlWA1ctdYPmN7cA6WL5vMXaI0P0Y,20385
14
14
  sdg_hub/core/blocks/deprecated_blocks/rename_columns.py,sha256=thp-mHtkRmUw_nYKpldy_mLWR2AvC5YUhbqDETM6-T0,2620
15
15
  sdg_hub/core/blocks/deprecated_blocks/sample_populator.py,sha256=UdueMApxOmPWaxxMrw7b1v74fKJBfqqRATEBqgmVtNw,1737
16
- sdg_hub/core/blocks/deprecated_blocks/selector.py,sha256=ABcXZrqEMsgKfdGAkSo2plMp4LsZSqPhEQugoDEYm1I,2950
16
+ sdg_hub/core/blocks/deprecated_blocks/selector.py,sha256=nWecsVsW8DvBcqAF_LOqXmW-5MQ28uN3d1y6wkSy38c,2960
17
17
  sdg_hub/core/blocks/deprecated_blocks/set_to_majority_value.py,sha256=44TQu-rK5isia-otMVB1zHd8D-wWmu3C8CI1NLtfY5s,2729
18
18
  sdg_hub/core/blocks/evaluation/__init__.py,sha256=kFXee-vsVVdU2XtLio9qHgPx_a0zoB_rQr509EKBGJc,357
19
- sdg_hub/core/blocks/evaluation/evaluate_faithfulness_block.py,sha256=ZuQ8jq2JwTdslUJtFi1E9NXebCWFZS8isXOafcJ_CMU,23026
20
- sdg_hub/core/blocks/evaluation/evaluate_relevancy_block.py,sha256=ieQRwl4bx5EQ3m7Wa2P3pHLUPQY7HuwNWjHUCo98u6g,22832
21
- sdg_hub/core/blocks/evaluation/verify_question_block.py,sha256=fSNbW1KpdfVE0fQsm4Y8QfVk6A3J5H3C0dtGn49t8tM,22853
19
+ sdg_hub/core/blocks/evaluation/evaluate_faithfulness_block.py,sha256=vFi3YIxVPNnzgdenIeAl7yUb4OOUY_uUOXS-pWLsDmw,12223
20
+ sdg_hub/core/blocks/evaluation/evaluate_relevancy_block.py,sha256=NXT1lixR-JnOXNlBCbMjULcpu4kh2SthhwCWEobiBt0,12115
21
+ sdg_hub/core/blocks/evaluation/verify_question_block.py,sha256=LKoIHdxUuTVO24n_M9cAliEj56uEe2kQAecKTRz65zI,12465
22
22
  sdg_hub/core/blocks/filtering/__init__.py,sha256=isxSVSvDqkMjG8dQSl3Q2M4g5c1t9fTjBSA21icf-yA,275
23
23
  sdg_hub/core/blocks/filtering/column_value_filter.py,sha256=H8Gif0q9Wc_d1TnVow8Zpsg7blJOFGN1EZmV6OPpkcg,5971
24
24
  sdg_hub/core/blocks/llm/__init__.py,sha256=N6-Prgd4X85oWbMQzhYMrq7OX-NTJm57cghowK-val0,844
25
- sdg_hub/core/blocks/llm/client_manager.py,sha256=vaoPoTITJ9IlooeVRfu6M4WBc08mp4aJZ5tvnl2fMv8,12309
26
- sdg_hub/core/blocks/llm/config.py,sha256=TmbfqxPHH3mShTK2EuCX2AGKtDvl0aSvihsaqgzABtM,11266
25
+ sdg_hub/core/blocks/llm/client_manager.py,sha256=IpMUwECL9_oNFC3yxg9A6BRqMcdg0Wdpzx28BhX45Xo,14742
26
+ sdg_hub/core/blocks/llm/config.py,sha256=gc4xp5D20MSlKMFEos0QAaKUwgbZpBtMGXmn6LsIk78,11289
27
27
  sdg_hub/core/blocks/llm/error_handler.py,sha256=7T-019ZFB9qgZoX1ybIiXyaLjPzrF96qcKmUu6vmO6g,12178
28
- sdg_hub/core/blocks/llm/llm_chat_block.py,sha256=3o2oV_ecWsEHFp5FWPIpBT-yJ1imJmeZy2b9GZL-T54,20121
29
- sdg_hub/core/blocks/llm/llm_chat_with_parsing_retry_block.py,sha256=mMmifTC-sRUhdxuLRRtAMhQC7r7NOyTAfBx-xTzLzTc,19669
28
+ sdg_hub/core/blocks/llm/llm_chat_block.py,sha256=9ytjxjADM0FydkLapZPSQPfzjjrFIdFONs3EJEoKnaw,23007
29
+ sdg_hub/core/blocks/llm/llm_chat_with_parsing_retry_block.py,sha256=H7LqYpEiFO1g2cxncAl4vkLhQxAYgGpV6cUyQTSG03k,27628
30
30
  sdg_hub/core/blocks/llm/prompt_builder_block.py,sha256=fkJd718X1oYlMY1cjo_8WCO16Gl8Tm0bUPWR78E_uws,13935
31
- sdg_hub/core/blocks/llm/text_parser_block.py,sha256=vQgUaeYJI9HuxDPRjII-NIOsR01JA-sBBGl05623L8I,14391
32
- sdg_hub/core/blocks/transform/__init__.py,sha256=Y_3izPCtgnMbFK-gBMeLHZspSrNLgbGheAJXU57XfFw,746
31
+ sdg_hub/core/blocks/llm/text_parser_block.py,sha256=8oRlXEkw8ULA8XVa7WtQZUojodl_ihs1omZpvbwoJQE,17165
32
+ sdg_hub/core/blocks/transform/__init__.py,sha256=lF9InjOzA6p_mjiwV-a2Kwstq9kqRiQ-dEwbsmR9yQs,825
33
33
  sdg_hub/core/blocks/transform/duplicate_columns.py,sha256=SaP7rIF4ZFEFFa50aU2xGNIuddXaEZrKxdWfHjzFpVI,2833
34
- sdg_hub/core/blocks/transform/index_based_mapper.py,sha256=mGup5agvDf9kAFSvXE5X6Puo6CQc9UOdFdbhdFWJjwk,8225
34
+ sdg_hub/core/blocks/transform/index_based_mapper.py,sha256=XC_a7Skbd3mu7f4ra8fGWPxMwqUMSjJkQ7Ag7vflwJA,8235
35
+ sdg_hub/core/blocks/transform/json_structure_block.py,sha256=hm-0M0NAyUREgJRPyV1u-laorgX6MZ1o17E9rNBhN78,5010
35
36
  sdg_hub/core/blocks/transform/melt_columns.py,sha256=vaYa5Taq6GhNZYWFL4uPK3-SfN2BsKEm-wvjd2EYYoI,4382
36
37
  sdg_hub/core/blocks/transform/rename_columns.py,sha256=qeB5L2utqDQnutUetH1VKZSqDiJSH_yUp5EFCV-XCVI,1998
37
38
  sdg_hub/core/blocks/transform/text_concat.py,sha256=_-B__Hob1WwgwkILPIZvTnsDzuwtoX1hKviyzHlnnes,3149
38
39
  sdg_hub/core/blocks/transform/uniform_col_val_setter.py,sha256=XnjiT29z3PzIPy8M-mmE2w-Miab6Ed5ahy32SaxTCTE,3263
39
40
  sdg_hub/core/flow/__init__.py,sha256=N2NZGngvd7qpT5FI_knKukUFM0IkD9K5jdTi-gDeUI4,475
40
- sdg_hub/core/flow/base.py,sha256=Jm90xQ1ns0ArEiqkceSME6phzBtkw6nthjSJNTU3IkQ,45530
41
+ sdg_hub/core/flow/base.py,sha256=8Xacytg9M82Mbv8r2GLbQgNltH-hCtFS1Fa1WpfFlSw,56488
41
42
  sdg_hub/core/flow/checkpointer.py,sha256=stm5ZtjjEiLk9ZkAAnoQQn5Y8Yl_d7qCsQLZTrCXR48,11867
42
43
  sdg_hub/core/flow/metadata.py,sha256=h9jpvAzWsF5n4ztZMzwa9ZNgnzKTHmFWdn7YbyJLHCw,12977
43
44
  sdg_hub/core/flow/migration.py,sha256=6and-RBqV0t2gRipr1GiOOVnyBJdtyyjw1kO08Z--d4,7558
44
45
  sdg_hub/core/flow/registry.py,sha256=DzCqEEgwhvwnCBAGLogoMVdwXh4pCHrxOWqoxam7O8I,12162
45
46
  sdg_hub/core/flow/validation.py,sha256=pUJvgaUjLpKNwvW6djcqVOF-HShOjegEmGOnUnoX4BA,9722
46
47
  sdg_hub/core/utils/__init__.py,sha256=C2FzLn3dHprwGJDEgI4fyFS3aoCJR-9PhHsunxropJ8,351
47
- sdg_hub/core/utils/datautils.py,sha256=QnzMl7nOp0crNJEWgAqurOuuAyz0SnvAjLiKzvG0uds,1933
48
+ sdg_hub/core/utils/datautils.py,sha256=q94NzBEtNwRFhzpk3FHofgJJU0gVRgAV3AAWZ1MroFk,3860
48
49
  sdg_hub/core/utils/error_handling.py,sha256=yku8cGj_nKCyXDsnb-mHCpgukkkAMucJ4iAUrIzqysc,5510
49
50
  sdg_hub/core/utils/flow_id_words.yaml,sha256=5QHpQdP7zwahRuooyAlJIwBY7WcDR7vtbJXxVJqujbg,2317
50
51
  sdg_hub/core/utils/flow_identifier.py,sha256=aAHfK_G9AwEtMglLRMdMpi_AI1dciub5UqBGm4yb2HE,2841
51
- sdg_hub/core/utils/logger_config.py,sha256=MPYdpyNXh_pxFUOAvSCHa98LGjxjaLXoUoqWekqTG4s,422
52
+ sdg_hub/core/utils/flow_metrics.py,sha256=VOdreUzP0kPgnkPjuQk87tZsK5f1u6XGEPM8ugCt0CY,8824
53
+ sdg_hub/core/utils/logger_config.py,sha256=6_cnsIHtSAdq1iTTZ7Q7nAJ1dmldlxSZ0AB49yLiQ20,2034
52
54
  sdg_hub/core/utils/path_resolution.py,sha256=yWof4kGNpQ5dKcrVHg0h9KfOKLZ6ROjdfsLAZsQT5rM,2000
53
55
  sdg_hub/core/utils/yaml_utils.py,sha256=tShCd-FFkp0xlKnLe7dXsMOR4AvT9d2qRUmu4ZnPSEY,1458
56
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
57
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_answers.yaml,sha256=THRT3cY44KGI_69B2wqt2Q89EknnOSE7B4A_jdnxlIU,330
58
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_multiple_qa.yaml,sha256=Cs-yeiXs4yac3dZsurdXBZj-kkwWdK-xBywjvBlgtGI,669
59
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_question_list.yaml,sha256=qHOgUNrQz2vjUjJiEHNGWxDDXwjJlP1kofTxeGgLyPI,1461
60
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
61
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/detailed_summary.yaml,sha256=Ik6gAml0O-jPq8jpXBAkURzYkQuFOnDZb4LDwjmfAiE,381
62
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/flow.yaml,sha256=va9ESTlEaZozy8pXTJ8OICjRg08KSP4l305YUKFuGAE,4417
63
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
64
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/extractive_summary.yaml,sha256=SeapWoOx3fhN5SvWYuHss_9prLE8xSkOic7JkbDHSR0,4081
65
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/flow.yaml,sha256=Iv4AlbE9PFtTn6teekgiNtrTiYio_nYWS8gyD6eFLUA,4580
66
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
67
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/flow.yaml,sha256=Rv0c4s5vim2I5jKzQgjcUfVMdla6czzmZUU67hlTAbg,2898
68
+ sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/key_facts_summary.yaml,sha256=YKMX_CuvcThG_bdNCAIXdVBkMvB72I89RGq2ltSSgc8,3298
54
69
  sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/README.md,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
55
70
  sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
56
71
  sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/atomic_facts.yaml,sha256=xgUNY793y4lcpdtuWm5Ah1CmbU2gvvPQCpZMMa6kPXU,2447
@@ -59,10 +74,17 @@ sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/ev
59
74
  sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/evaluate_question.yaml,sha256=zwzklXup6khRkR88avgrJTcjaMcV1wnbeYaML5oPuNs,1767
60
75
  sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/evaluate_relevancy.yaml,sha256=cA8igo7jMrRXaWW6k0of6KOp7YnxLtPj0fP4DbrmZNQ,3647
61
76
  sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/extractive_summary.yaml,sha256=fcMV7LaCFZo4D29nwhGJXqFFuZMYVLo9XYjv8zcU6zs,364
62
- sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml,sha256=Rrl9eve9QsGLojAkflgKTHyUgUawKfvhEVAnAxBLZJ8,6307
77
+ sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml,sha256=oyrLRjEnmioMa_G_sd9yQK_nBt4arwWV5fvKgzYE2ds,6090
63
78
  sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/generate_questions_responses.yaml,sha256=yX8aLY8dJSDML9ZJhnj9RzPbN8tH2xfcM4Gc6xZuwqQ,2596
64
- sdg_hub-0.2.1.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
65
- sdg_hub-0.2.1.dist-info/METADATA,sha256=0Si2PZotpwtUI2Pg2cc3uSZIJtS12jF4VInJSTyBngA,8606
66
- sdg_hub-0.2.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
67
- sdg_hub-0.2.1.dist-info/top_level.txt,sha256=TqI7d-HE1n6zkXFkU0nF3A1Ct0P0pBaqI675uFokhx4,8
68
- sdg_hub-0.2.1.dist-info/RECORD,,
79
+ sdg_hub/flows/text_analysis/__init__.py,sha256=WStks4eM_KHNTVsHglcj8vFghmI0PH9P1hUrijBLbwc,125
80
+ sdg_hub/flows/text_analysis/structured_insights/__init__.py,sha256=_DT4NR05JD9CZoSWROPr2lC6se0VjSqQPZJJlEV79mk,274
81
+ sdg_hub/flows/text_analysis/structured_insights/analyze_sentiment.yaml,sha256=1YGPypFJYS8qfYFj2J6ERTgodKJvMF4YHNGt_vOF5qc,1000
82
+ sdg_hub/flows/text_analysis/structured_insights/extract_entities.yaml,sha256=Q_SDy14Zu-qS2sbKfUBmGlYj3k7CUg6HzzXlFCXRKuU,1169
83
+ sdg_hub/flows/text_analysis/structured_insights/extract_keywords.yaml,sha256=_nPPMdHnxag_lYbhYUjGJGo-CvRwWvwdGX7cQhdZ1S0,847
84
+ sdg_hub/flows/text_analysis/structured_insights/flow.yaml,sha256=2HuGTyNwYe6a8Ev-QdKZXwe29NL4wOkq4ecEV9a7NDg,4221
85
+ sdg_hub/flows/text_analysis/structured_insights/summarize.yaml,sha256=WXwQak1pF8e1OwnOoI1EHu8QB6iUNW89rfkTdi1Oq54,687
86
+ sdg_hub-0.3.0.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
87
+ sdg_hub-0.3.0.dist-info/METADATA,sha256=eVLM1fK2-9uD_eWhSRW5VTbdUs-XIn_Va3Z-rY31Utk,9735
88
+ sdg_hub-0.3.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
89
+ sdg_hub-0.3.0.dist-info/top_level.txt,sha256=TqI7d-HE1n6zkXFkU0nF3A1Ct0P0pBaqI675uFokhx4,8
90
+ sdg_hub-0.3.0.dist-info/RECORD,,