sdg-hub 0.2.1__py3-none-any.whl → 0.3.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- sdg_hub/_version.py +16 -3
- sdg_hub/core/blocks/deprecated_blocks/selector.py +1 -1
- sdg_hub/core/blocks/evaluation/evaluate_faithfulness_block.py +175 -416
- sdg_hub/core/blocks/evaluation/evaluate_relevancy_block.py +174 -415
- sdg_hub/core/blocks/evaluation/verify_question_block.py +180 -415
- sdg_hub/core/blocks/llm/client_manager.py +92 -43
- sdg_hub/core/blocks/llm/config.py +1 -0
- sdg_hub/core/blocks/llm/llm_chat_block.py +74 -16
- sdg_hub/core/blocks/llm/llm_chat_with_parsing_retry_block.py +277 -115
- sdg_hub/core/blocks/llm/text_parser_block.py +88 -23
- sdg_hub/core/blocks/registry.py +48 -34
- sdg_hub/core/blocks/transform/__init__.py +2 -0
- sdg_hub/core/blocks/transform/index_based_mapper.py +1 -1
- sdg_hub/core/blocks/transform/json_structure_block.py +142 -0
- sdg_hub/core/flow/base.py +326 -62
- sdg_hub/core/utils/datautils.py +54 -0
- sdg_hub/core/utils/flow_metrics.py +261 -0
- sdg_hub/core/utils/logger_config.py +50 -9
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/__init__.py +0 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/__init__.py +0 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/detailed_summary.yaml +11 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/flow.yaml +159 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/__init__.py +0 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/extractive_summary.yaml +65 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/flow.yaml +161 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_answers.yaml +15 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_multiple_qa.yaml +21 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_question_list.yaml +44 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/__init__.py +0 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/flow.yaml +104 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/key_facts_summary.yaml +61 -0
- sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml +0 -7
- sdg_hub/flows/text_analysis/__init__.py +2 -0
- sdg_hub/flows/text_analysis/structured_insights/__init__.py +6 -0
- sdg_hub/flows/text_analysis/structured_insights/analyze_sentiment.yaml +27 -0
- sdg_hub/flows/text_analysis/structured_insights/extract_entities.yaml +38 -0
- sdg_hub/flows/text_analysis/structured_insights/extract_keywords.yaml +21 -0
- sdg_hub/flows/text_analysis/structured_insights/flow.yaml +153 -0
- sdg_hub/flows/text_analysis/structured_insights/summarize.yaml +21 -0
- {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/METADATA +42 -15
- {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/RECORD +44 -22
- {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/WHEEL +0 -0
- {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/licenses/LICENSE +0 -0
- {sdg_hub-0.2.1.dist-info → sdg_hub-0.3.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,153 @@
|
|
1
|
+
metadata:
|
2
|
+
id: green-clay-812
|
3
|
+
name: "Structured Text Insights Extraction Flow"
|
4
|
+
description: >-
|
5
|
+
Multi-step pipeline for extracting structured insights from text including
|
6
|
+
summary, keywords, entities, and sentiment analysis combined into a JSON output
|
7
|
+
version: "1.0.0"
|
8
|
+
author: "SDG Hub Contributors"
|
9
|
+
recommended_models:
|
10
|
+
default: "openai/gpt-oss-120b"
|
11
|
+
compatible:
|
12
|
+
- "meta-llama/Llama-3.3-70B-Instruct"
|
13
|
+
- "microsoft/phi-4"
|
14
|
+
- "mistralai/Mixtral-8x7B-Instruct-v0.1"
|
15
|
+
experimental:
|
16
|
+
- "gpt-4o"
|
17
|
+
tags:
|
18
|
+
- "text-analysis"
|
19
|
+
- "summarization"
|
20
|
+
- "nlp"
|
21
|
+
- "structured-output"
|
22
|
+
- "insights"
|
23
|
+
- "sentiment-analysis"
|
24
|
+
- "entity-extraction"
|
25
|
+
- "keyword-extraction"
|
26
|
+
license: "Apache-2.0"
|
27
|
+
min_sdg_hub_version: "0.2.0"
|
28
|
+
dataset_requirements:
|
29
|
+
required_columns:
|
30
|
+
- "text"
|
31
|
+
description: >-
|
32
|
+
Input dataset should contain text content for analysis. Each text should be
|
33
|
+
substantial enough for meaningful analysis (minimum 50 words recommended).
|
34
|
+
Works well with news articles, blog posts, reviews, and other content.
|
35
|
+
|
36
|
+
blocks:
|
37
|
+
# Extract Summary
|
38
|
+
- block_type: "PromptBuilderBlock"
|
39
|
+
block_config:
|
40
|
+
block_name: "build_summary_prompt"
|
41
|
+
input_cols:
|
42
|
+
- "text"
|
43
|
+
output_cols: "summary_prompt"
|
44
|
+
prompt_config_path: "summarize.yaml"
|
45
|
+
- block_type: "LLMChatBlock"
|
46
|
+
block_config:
|
47
|
+
block_name: "generate_summary"
|
48
|
+
input_cols: "summary_prompt"
|
49
|
+
output_cols: "raw_summary"
|
50
|
+
max_tokens: 1024
|
51
|
+
temperature: 0.3
|
52
|
+
async_mode: true
|
53
|
+
- block_type: "TextParserBlock"
|
54
|
+
block_config:
|
55
|
+
block_name: "parse_summary"
|
56
|
+
input_cols: "raw_summary"
|
57
|
+
output_cols: "summary"
|
58
|
+
start_tags:
|
59
|
+
- "[SUMMARY]"
|
60
|
+
end_tags:
|
61
|
+
- "[/SUMMARY]"
|
62
|
+
|
63
|
+
# Extract Keywords
|
64
|
+
- block_type: "PromptBuilderBlock"
|
65
|
+
block_config:
|
66
|
+
block_name: "build_keywords_prompt"
|
67
|
+
input_cols:
|
68
|
+
- "text"
|
69
|
+
output_cols: "keywords_prompt"
|
70
|
+
prompt_config_path: "extract_keywords.yaml"
|
71
|
+
- block_type: "LLMChatBlock"
|
72
|
+
block_config:
|
73
|
+
block_name: "generate_keywords"
|
74
|
+
input_cols: "keywords_prompt"
|
75
|
+
output_cols: "raw_keywords"
|
76
|
+
max_tokens: 512
|
77
|
+
temperature: 0.3
|
78
|
+
async_mode: true
|
79
|
+
- block_type: "TextParserBlock"
|
80
|
+
block_config:
|
81
|
+
block_name: "parse_keywords"
|
82
|
+
input_cols: "raw_keywords"
|
83
|
+
output_cols: "keywords"
|
84
|
+
start_tags:
|
85
|
+
- "[KEYWORDS]"
|
86
|
+
end_tags:
|
87
|
+
- "[/KEYWORDS]"
|
88
|
+
|
89
|
+
# Extract Entities
|
90
|
+
- block_type: "PromptBuilderBlock"
|
91
|
+
block_config:
|
92
|
+
block_name: "build_entities_prompt"
|
93
|
+
input_cols:
|
94
|
+
- "text"
|
95
|
+
output_cols: "entities_prompt"
|
96
|
+
prompt_config_path: "extract_entities.yaml"
|
97
|
+
- block_type: "LLMChatBlock"
|
98
|
+
block_config:
|
99
|
+
block_name: "generate_entities"
|
100
|
+
input_cols: "entities_prompt"
|
101
|
+
output_cols: "raw_entities"
|
102
|
+
max_tokens: 1024
|
103
|
+
temperature: 0.3
|
104
|
+
async_mode: true
|
105
|
+
- block_type: "TextParserBlock"
|
106
|
+
block_config:
|
107
|
+
block_name: "parse_entities"
|
108
|
+
input_cols: "raw_entities"
|
109
|
+
output_cols: "entities"
|
110
|
+
start_tags:
|
111
|
+
- "[ENTITIES]"
|
112
|
+
end_tags:
|
113
|
+
- "[/ENTITIES]"
|
114
|
+
|
115
|
+
# Extract Sentiment
|
116
|
+
- block_type: "PromptBuilderBlock"
|
117
|
+
block_config:
|
118
|
+
block_name: "build_sentiment_prompt"
|
119
|
+
input_cols:
|
120
|
+
- "text"
|
121
|
+
output_cols: "sentiment_prompt"
|
122
|
+
prompt_config_path: "analyze_sentiment.yaml"
|
123
|
+
- block_type: "LLMChatBlock"
|
124
|
+
block_config:
|
125
|
+
block_name: "generate_sentiment"
|
126
|
+
input_cols: "sentiment_prompt"
|
127
|
+
output_cols: "raw_sentiment"
|
128
|
+
max_tokens: 256
|
129
|
+
temperature: 0.1
|
130
|
+
async_mode: true
|
131
|
+
- block_type: "TextParserBlock"
|
132
|
+
block_config:
|
133
|
+
block_name: "parse_sentiment"
|
134
|
+
input_cols: "raw_sentiment"
|
135
|
+
output_cols: "sentiment"
|
136
|
+
start_tags:
|
137
|
+
- "[SENTIMENT]"
|
138
|
+
end_tags:
|
139
|
+
- "[/SENTIMENT]"
|
140
|
+
|
141
|
+
# Create Structured Insights
|
142
|
+
- block_type: "JSONStructureBlock"
|
143
|
+
block_config:
|
144
|
+
block_name: "create_structured_insights"
|
145
|
+
input_cols:
|
146
|
+
- "summary"
|
147
|
+
- "keywords"
|
148
|
+
- "entities"
|
149
|
+
- "sentiment"
|
150
|
+
output_cols:
|
151
|
+
- "structured_insights"
|
152
|
+
ensure_json_serializable: true
|
153
|
+
|
@@ -0,0 +1,21 @@
|
|
1
|
+
- role: system
|
2
|
+
content: You are an AI assistant expert at creating concise, informative summaries that capture the most important information from text.
|
3
|
+
|
4
|
+
- role: user
|
5
|
+
content: |
|
6
|
+
Create a brief, concise summary of the following text. Your summary should:
|
7
|
+
|
8
|
+
1. Be 2-3 sentences maximum
|
9
|
+
2. Capture the most important information and key points
|
10
|
+
3. Be clear and easy to understand
|
11
|
+
4. Avoid adding any information not present in the original text
|
12
|
+
5. Focus on the main topic, key facts, and significant details
|
13
|
+
|
14
|
+
Text to summarize:
|
15
|
+
{{text}}
|
16
|
+
|
17
|
+
Provide your response in the following format:
|
18
|
+
[SUMMARY]
|
19
|
+
Your summary here
|
20
|
+
[/SUMMARY]
|
21
|
+
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: sdg_hub
|
3
|
-
Version: 0.
|
3
|
+
Version: 0.3.0
|
4
4
|
Summary: Synthetic Data Generation
|
5
5
|
Author-email: Red Hat AI Innovation <abhandwa@redhat.com>
|
6
6
|
License: Apache-2.0
|
@@ -27,7 +27,6 @@ Requires-Dist: datasets<4.0.0,>=2.18.0
|
|
27
27
|
Requires-Dist: httpx<1.0.0,>=0.25.0
|
28
28
|
Requires-Dist: jinja2
|
29
29
|
Requires-Dist: litellm<1.75.0,>=1.73.0
|
30
|
-
Requires-Dist: openai<2.0.0,>=1.13.3
|
31
30
|
Requires-Dist: rich
|
32
31
|
Requires-Dist: pydantic<3.0.0,>=2.0.0
|
33
32
|
Requires-Dist: python-dotenv<2.0.0,>=1.0.0
|
@@ -54,6 +53,7 @@ Requires-Dist: sentence-transformers; extra == "examples"
|
|
54
53
|
Requires-Dist: instructor; extra == "examples"
|
55
54
|
Requires-Dist: fastapi; extra == "examples"
|
56
55
|
Requires-Dist: nest-asyncio; extra == "examples"
|
56
|
+
Requires-Dist: ipykernel; extra == "examples"
|
57
57
|
Provides-Extra: dev
|
58
58
|
Requires-Dist: pre-commit<4.0,>=3.0.4; extra == "dev"
|
59
59
|
Requires-Dist: pylint<4.0,>=2.16.2; extra == "dev"
|
@@ -64,6 +64,7 @@ Requires-Dist: pytest-cov; extra == "dev"
|
|
64
64
|
Requires-Dist: pytest-html; extra == "dev"
|
65
65
|
Requires-Dist: tox<5,>=4.4.2; extra == "dev"
|
66
66
|
Requires-Dist: ruff; extra == "dev"
|
67
|
+
Requires-Dist: pytest-env; extra == "dev"
|
67
68
|
Dynamic: license-file
|
68
69
|
|
69
70
|
# `sdg_hub`: Synthetic Data Generation Toolkit
|
@@ -92,6 +93,8 @@ A modular Python framework for building synthetic data generation pipelines usin
|
|
92
93
|
|
93
94
|
**📊 Rich Monitoring** - Detailed logging with progress bars and execution summaries.
|
94
95
|
|
96
|
+
**📋 Dataset Schema Discovery** - Instantly discover required data formats. Get empty datasets with correct schema for easy validation and data preparation.
|
97
|
+
|
95
98
|
**🧩 Easily Extensible** - Create custom blocks with simple inheritance. Rich logging and monitoring built-in.
|
96
99
|
|
97
100
|
|
@@ -176,22 +179,46 @@ flow.set_model_config(
|
|
176
179
|
api_key="your_key",
|
177
180
|
)
|
178
181
|
```
|
179
|
-
####
|
182
|
+
#### Discover dataset requirements and create your dataset
|
180
183
|
```python
|
181
|
-
#
|
182
|
-
dataset
|
183
|
-
|
184
|
-
|
185
|
-
|
186
|
-
|
187
|
-
|
188
|
-
|
189
|
-
'
|
190
|
-
'
|
191
|
-
'
|
192
|
-
'
|
184
|
+
# First, discover what data the flow needs
|
185
|
+
# Get an empty dataset with the exact schema needed
|
186
|
+
schema_dataset = flow.get_dataset_schema() # Get empty dataset with correct schema
|
187
|
+
print(f"Required columns: {schema_dataset.column_names}")
|
188
|
+
print(f"Schema: {schema_dataset.features}")
|
189
|
+
|
190
|
+
# Option 1: Add data directly to the schema dataset
|
191
|
+
dataset = schema_dataset.add_item({
|
192
|
+
'document': 'Your document text here...',
|
193
|
+
'document_outline': '1. Topic A; 2. Topic B; 3. Topic C',
|
194
|
+
'domain': 'Computer Science',
|
195
|
+
'icl_document': 'Example document for in-context learning...',
|
196
|
+
'icl_query_1': 'Example question 1?',
|
197
|
+
'icl_response_1': 'Example answer 1',
|
198
|
+
'icl_query_2': 'Example question 2?',
|
199
|
+
'icl_response_2': 'Example answer 2',
|
200
|
+
'icl_query_3': 'Example question 3?',
|
201
|
+
'icl_response_3': 'Example answer 3'
|
193
202
|
})
|
194
203
|
|
204
|
+
# Option 2: Create your own dataset and validate the schema
|
205
|
+
my_dataset = Dataset.from_dict(my_data_dict)
|
206
|
+
if my_dataset.features == schema_dataset.features:
|
207
|
+
print("✅ Schema matches - ready to generate!")
|
208
|
+
dataset = my_dataset
|
209
|
+
else:
|
210
|
+
print("❌ Schema mismatch - check your columns")
|
211
|
+
|
212
|
+
# Option 3: Get raw requirements for detailed inspection
|
213
|
+
requirements = flow.get_dataset_requirements()
|
214
|
+
if requirements:
|
215
|
+
print(f"Required: {requirements.required_columns}")
|
216
|
+
print(f"Optional: {requirements.optional_columns}")
|
217
|
+
print(f"Min samples: {requirements.min_samples}")
|
218
|
+
```
|
219
|
+
|
220
|
+
#### Dry Run and Generate
|
221
|
+
```python
|
195
222
|
# Quick Testing with Dry Run
|
196
223
|
dry_result = flow.dry_run(dataset, sample_size=1)
|
197
224
|
print(f"Dry run completed in {dry_result['execution_time_seconds']:.2f}s")
|
@@ -1,10 +1,10 @@
|
|
1
1
|
sdg_hub/__init__.py,sha256=Tw-6R5a8_W1kJcTAsW3R9ltBDP1dy5-fe7Tvt3cSyCQ,550
|
2
|
-
sdg_hub/_version.py,sha256=
|
2
|
+
sdg_hub/_version.py,sha256=5zTqm8rgXsWYBpB2M3Zw_K1D-aV8wP7NsBLrmMKkrAQ,704
|
3
3
|
sdg_hub/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
4
4
|
sdg_hub/core/__init__.py,sha256=NwqB4fwhC29W50VW7QXZssLxx122YvgO9LHDLdgAnrI,496
|
5
5
|
sdg_hub/core/blocks/__init__.py,sha256=9sCkCvDQzJGSedaePVlEIpbNwrkBz_K500VW_6FLhuE,1601
|
6
6
|
sdg_hub/core/blocks/base.py,sha256=TrzUAkG7Tiquk0Z3SOFsb5mRnHd1IbHH6gFPVH1P7T8,10424
|
7
|
-
sdg_hub/core/blocks/registry.py,sha256=
|
7
|
+
sdg_hub/core/blocks/registry.py,sha256=FuEN_pnq-nSH1LguY3_oCubT6Kz3SuJjk3TcUpLT-lw,10695
|
8
8
|
sdg_hub/core/blocks/deprecated_blocks/__init__.py,sha256=RDu3MWFStDQko-TKkx8tGoB1UTatP_RSldZK43zHDvY,889
|
9
9
|
sdg_hub/core/blocks/deprecated_blocks/combine_columns.py,sha256=HCvpaYsAwgx1Dm0vIshcWsKoVsRT0KrmKp9j4oqtByc,2757
|
10
10
|
sdg_hub/core/blocks/deprecated_blocks/duplicate_columns.py,sha256=maCaaEs0EMMzt7L1xm7fAH3ylaFMHEkeC_dtOw3FrjU,2694
|
@@ -13,44 +13,59 @@ sdg_hub/core/blocks/deprecated_blocks/flatten_columns.py,sha256=IenCskrPEv09h2uT
|
|
13
13
|
sdg_hub/core/blocks/deprecated_blocks/llmblock.py,sha256=34lzC43BODpMk5AwlWA1ctdYPmN7cA6WL5vMXaI0P0Y,20385
|
14
14
|
sdg_hub/core/blocks/deprecated_blocks/rename_columns.py,sha256=thp-mHtkRmUw_nYKpldy_mLWR2AvC5YUhbqDETM6-T0,2620
|
15
15
|
sdg_hub/core/blocks/deprecated_blocks/sample_populator.py,sha256=UdueMApxOmPWaxxMrw7b1v74fKJBfqqRATEBqgmVtNw,1737
|
16
|
-
sdg_hub/core/blocks/deprecated_blocks/selector.py,sha256=
|
16
|
+
sdg_hub/core/blocks/deprecated_blocks/selector.py,sha256=nWecsVsW8DvBcqAF_LOqXmW-5MQ28uN3d1y6wkSy38c,2960
|
17
17
|
sdg_hub/core/blocks/deprecated_blocks/set_to_majority_value.py,sha256=44TQu-rK5isia-otMVB1zHd8D-wWmu3C8CI1NLtfY5s,2729
|
18
18
|
sdg_hub/core/blocks/evaluation/__init__.py,sha256=kFXee-vsVVdU2XtLio9qHgPx_a0zoB_rQr509EKBGJc,357
|
19
|
-
sdg_hub/core/blocks/evaluation/evaluate_faithfulness_block.py,sha256=
|
20
|
-
sdg_hub/core/blocks/evaluation/evaluate_relevancy_block.py,sha256=
|
21
|
-
sdg_hub/core/blocks/evaluation/verify_question_block.py,sha256=
|
19
|
+
sdg_hub/core/blocks/evaluation/evaluate_faithfulness_block.py,sha256=vFi3YIxVPNnzgdenIeAl7yUb4OOUY_uUOXS-pWLsDmw,12223
|
20
|
+
sdg_hub/core/blocks/evaluation/evaluate_relevancy_block.py,sha256=NXT1lixR-JnOXNlBCbMjULcpu4kh2SthhwCWEobiBt0,12115
|
21
|
+
sdg_hub/core/blocks/evaluation/verify_question_block.py,sha256=LKoIHdxUuTVO24n_M9cAliEj56uEe2kQAecKTRz65zI,12465
|
22
22
|
sdg_hub/core/blocks/filtering/__init__.py,sha256=isxSVSvDqkMjG8dQSl3Q2M4g5c1t9fTjBSA21icf-yA,275
|
23
23
|
sdg_hub/core/blocks/filtering/column_value_filter.py,sha256=H8Gif0q9Wc_d1TnVow8Zpsg7blJOFGN1EZmV6OPpkcg,5971
|
24
24
|
sdg_hub/core/blocks/llm/__init__.py,sha256=N6-Prgd4X85oWbMQzhYMrq7OX-NTJm57cghowK-val0,844
|
25
|
-
sdg_hub/core/blocks/llm/client_manager.py,sha256=
|
26
|
-
sdg_hub/core/blocks/llm/config.py,sha256=
|
25
|
+
sdg_hub/core/blocks/llm/client_manager.py,sha256=IpMUwECL9_oNFC3yxg9A6BRqMcdg0Wdpzx28BhX45Xo,14742
|
26
|
+
sdg_hub/core/blocks/llm/config.py,sha256=gc4xp5D20MSlKMFEos0QAaKUwgbZpBtMGXmn6LsIk78,11289
|
27
27
|
sdg_hub/core/blocks/llm/error_handler.py,sha256=7T-019ZFB9qgZoX1ybIiXyaLjPzrF96qcKmUu6vmO6g,12178
|
28
|
-
sdg_hub/core/blocks/llm/llm_chat_block.py,sha256=
|
29
|
-
sdg_hub/core/blocks/llm/llm_chat_with_parsing_retry_block.py,sha256=
|
28
|
+
sdg_hub/core/blocks/llm/llm_chat_block.py,sha256=9ytjxjADM0FydkLapZPSQPfzjjrFIdFONs3EJEoKnaw,23007
|
29
|
+
sdg_hub/core/blocks/llm/llm_chat_with_parsing_retry_block.py,sha256=H7LqYpEiFO1g2cxncAl4vkLhQxAYgGpV6cUyQTSG03k,27628
|
30
30
|
sdg_hub/core/blocks/llm/prompt_builder_block.py,sha256=fkJd718X1oYlMY1cjo_8WCO16Gl8Tm0bUPWR78E_uws,13935
|
31
|
-
sdg_hub/core/blocks/llm/text_parser_block.py,sha256=
|
32
|
-
sdg_hub/core/blocks/transform/__init__.py,sha256=
|
31
|
+
sdg_hub/core/blocks/llm/text_parser_block.py,sha256=8oRlXEkw8ULA8XVa7WtQZUojodl_ihs1omZpvbwoJQE,17165
|
32
|
+
sdg_hub/core/blocks/transform/__init__.py,sha256=lF9InjOzA6p_mjiwV-a2Kwstq9kqRiQ-dEwbsmR9yQs,825
|
33
33
|
sdg_hub/core/blocks/transform/duplicate_columns.py,sha256=SaP7rIF4ZFEFFa50aU2xGNIuddXaEZrKxdWfHjzFpVI,2833
|
34
|
-
sdg_hub/core/blocks/transform/index_based_mapper.py,sha256=
|
34
|
+
sdg_hub/core/blocks/transform/index_based_mapper.py,sha256=XC_a7Skbd3mu7f4ra8fGWPxMwqUMSjJkQ7Ag7vflwJA,8235
|
35
|
+
sdg_hub/core/blocks/transform/json_structure_block.py,sha256=hm-0M0NAyUREgJRPyV1u-laorgX6MZ1o17E9rNBhN78,5010
|
35
36
|
sdg_hub/core/blocks/transform/melt_columns.py,sha256=vaYa5Taq6GhNZYWFL4uPK3-SfN2BsKEm-wvjd2EYYoI,4382
|
36
37
|
sdg_hub/core/blocks/transform/rename_columns.py,sha256=qeB5L2utqDQnutUetH1VKZSqDiJSH_yUp5EFCV-XCVI,1998
|
37
38
|
sdg_hub/core/blocks/transform/text_concat.py,sha256=_-B__Hob1WwgwkILPIZvTnsDzuwtoX1hKviyzHlnnes,3149
|
38
39
|
sdg_hub/core/blocks/transform/uniform_col_val_setter.py,sha256=XnjiT29z3PzIPy8M-mmE2w-Miab6Ed5ahy32SaxTCTE,3263
|
39
40
|
sdg_hub/core/flow/__init__.py,sha256=N2NZGngvd7qpT5FI_knKukUFM0IkD9K5jdTi-gDeUI4,475
|
40
|
-
sdg_hub/core/flow/base.py,sha256=
|
41
|
+
sdg_hub/core/flow/base.py,sha256=8Xacytg9M82Mbv8r2GLbQgNltH-hCtFS1Fa1WpfFlSw,56488
|
41
42
|
sdg_hub/core/flow/checkpointer.py,sha256=stm5ZtjjEiLk9ZkAAnoQQn5Y8Yl_d7qCsQLZTrCXR48,11867
|
42
43
|
sdg_hub/core/flow/metadata.py,sha256=h9jpvAzWsF5n4ztZMzwa9ZNgnzKTHmFWdn7YbyJLHCw,12977
|
43
44
|
sdg_hub/core/flow/migration.py,sha256=6and-RBqV0t2gRipr1GiOOVnyBJdtyyjw1kO08Z--d4,7558
|
44
45
|
sdg_hub/core/flow/registry.py,sha256=DzCqEEgwhvwnCBAGLogoMVdwXh4pCHrxOWqoxam7O8I,12162
|
45
46
|
sdg_hub/core/flow/validation.py,sha256=pUJvgaUjLpKNwvW6djcqVOF-HShOjegEmGOnUnoX4BA,9722
|
46
47
|
sdg_hub/core/utils/__init__.py,sha256=C2FzLn3dHprwGJDEgI4fyFS3aoCJR-9PhHsunxropJ8,351
|
47
|
-
sdg_hub/core/utils/datautils.py,sha256=
|
48
|
+
sdg_hub/core/utils/datautils.py,sha256=q94NzBEtNwRFhzpk3FHofgJJU0gVRgAV3AAWZ1MroFk,3860
|
48
49
|
sdg_hub/core/utils/error_handling.py,sha256=yku8cGj_nKCyXDsnb-mHCpgukkkAMucJ4iAUrIzqysc,5510
|
49
50
|
sdg_hub/core/utils/flow_id_words.yaml,sha256=5QHpQdP7zwahRuooyAlJIwBY7WcDR7vtbJXxVJqujbg,2317
|
50
51
|
sdg_hub/core/utils/flow_identifier.py,sha256=aAHfK_G9AwEtMglLRMdMpi_AI1dciub5UqBGm4yb2HE,2841
|
51
|
-
sdg_hub/core/utils/
|
52
|
+
sdg_hub/core/utils/flow_metrics.py,sha256=VOdreUzP0kPgnkPjuQk87tZsK5f1u6XGEPM8ugCt0CY,8824
|
53
|
+
sdg_hub/core/utils/logger_config.py,sha256=6_cnsIHtSAdq1iTTZ7Q7nAJ1dmldlxSZ0AB49yLiQ20,2034
|
52
54
|
sdg_hub/core/utils/path_resolution.py,sha256=yWof4kGNpQ5dKcrVHg0h9KfOKLZ6ROjdfsLAZsQT5rM,2000
|
53
55
|
sdg_hub/core/utils/yaml_utils.py,sha256=tShCd-FFkp0xlKnLe7dXsMOR4AvT9d2qRUmu4ZnPSEY,1458
|
56
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
57
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_answers.yaml,sha256=THRT3cY44KGI_69B2wqt2Q89EknnOSE7B4A_jdnxlIU,330
|
58
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_multiple_qa.yaml,sha256=Cs-yeiXs4yac3dZsurdXBZj-kkwWdK-xBywjvBlgtGI,669
|
59
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/generate_question_list.yaml,sha256=qHOgUNrQz2vjUjJiEHNGWxDDXwjJlP1kofTxeGgLyPI,1461
|
60
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
61
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/detailed_summary.yaml,sha256=Ik6gAml0O-jPq8jpXBAkURzYkQuFOnDZb4LDwjmfAiE,381
|
62
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/flow.yaml,sha256=va9ESTlEaZozy8pXTJ8OICjRg08KSP4l305YUKFuGAE,4417
|
63
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
64
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/extractive_summary.yaml,sha256=SeapWoOx3fhN5SvWYuHss_9prLE8xSkOic7JkbDHSR0,4081
|
65
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/flow.yaml,sha256=Iv4AlbE9PFtTn6teekgiNtrTiYio_nYWS8gyD6eFLUA,4580
|
66
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
67
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/flow.yaml,sha256=Rv0c4s5vim2I5jKzQgjcUfVMdla6czzmZUU67hlTAbg,2898
|
68
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/key_facts_summary.yaml,sha256=YKMX_CuvcThG_bdNCAIXdVBkMvB72I89RGq2ltSSgc8,3298
|
54
69
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/README.md,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
55
70
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
56
71
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/atomic_facts.yaml,sha256=xgUNY793y4lcpdtuWm5Ah1CmbU2gvvPQCpZMMa6kPXU,2447
|
@@ -59,10 +74,17 @@ sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/ev
|
|
59
74
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/evaluate_question.yaml,sha256=zwzklXup6khRkR88avgrJTcjaMcV1wnbeYaML5oPuNs,1767
|
60
75
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/evaluate_relevancy.yaml,sha256=cA8igo7jMrRXaWW6k0of6KOp7YnxLtPj0fP4DbrmZNQ,3647
|
61
76
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/extractive_summary.yaml,sha256=fcMV7LaCFZo4D29nwhGJXqFFuZMYVLo9XYjv8zcU6zs,364
|
62
|
-
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml,sha256=
|
77
|
+
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml,sha256=oyrLRjEnmioMa_G_sd9yQK_nBt4arwWV5fvKgzYE2ds,6090
|
63
78
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/generate_questions_responses.yaml,sha256=yX8aLY8dJSDML9ZJhnj9RzPbN8tH2xfcM4Gc6xZuwqQ,2596
|
64
|
-
sdg_hub
|
65
|
-
sdg_hub
|
66
|
-
sdg_hub
|
67
|
-
sdg_hub
|
68
|
-
sdg_hub
|
79
|
+
sdg_hub/flows/text_analysis/__init__.py,sha256=WStks4eM_KHNTVsHglcj8vFghmI0PH9P1hUrijBLbwc,125
|
80
|
+
sdg_hub/flows/text_analysis/structured_insights/__init__.py,sha256=_DT4NR05JD9CZoSWROPr2lC6se0VjSqQPZJJlEV79mk,274
|
81
|
+
sdg_hub/flows/text_analysis/structured_insights/analyze_sentiment.yaml,sha256=1YGPypFJYS8qfYFj2J6ERTgodKJvMF4YHNGt_vOF5qc,1000
|
82
|
+
sdg_hub/flows/text_analysis/structured_insights/extract_entities.yaml,sha256=Q_SDy14Zu-qS2sbKfUBmGlYj3k7CUg6HzzXlFCXRKuU,1169
|
83
|
+
sdg_hub/flows/text_analysis/structured_insights/extract_keywords.yaml,sha256=_nPPMdHnxag_lYbhYUjGJGo-CvRwWvwdGX7cQhdZ1S0,847
|
84
|
+
sdg_hub/flows/text_analysis/structured_insights/flow.yaml,sha256=2HuGTyNwYe6a8Ev-QdKZXwe29NL4wOkq4ecEV9a7NDg,4221
|
85
|
+
sdg_hub/flows/text_analysis/structured_insights/summarize.yaml,sha256=WXwQak1pF8e1OwnOoI1EHu8QB6iUNW89rfkTdi1Oq54,687
|
86
|
+
sdg_hub-0.3.0.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
87
|
+
sdg_hub-0.3.0.dist-info/METADATA,sha256=eVLM1fK2-9uD_eWhSRW5VTbdUs-XIn_Va3Z-rY31Utk,9735
|
88
|
+
sdg_hub-0.3.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
89
|
+
sdg_hub-0.3.0.dist-info/top_level.txt,sha256=TqI7d-HE1n6zkXFkU0nF3A1Ct0P0pBaqI675uFokhx4,8
|
90
|
+
sdg_hub-0.3.0.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|