@yottagraph-app/aether-instructions 1.1.8 → 1.1.9
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/commands/update_instructions.md +30 -23
- package/package.json +1 -1
- package/skills/data-model/SKILL.md +58 -0
- package/skills/data-model/edgar/DATA_DICTIONARY.md +306 -0
- package/skills/data-model/edgar/schema.yaml +1893 -0
- package/skills/data-model/fdic/DATA_DICTIONARY.md +243 -0
- package/skills/data-model/fdic/schema.yaml +356 -0
- package/skills/data-model/fred/DATA_DICTIONARY.md +313 -0
- package/skills/data-model/fred/schema.yaml +155 -0
- package/skills/data-model/gleif/DATA_DICTIONARY.md +211 -0
- package/skills/data-model/gleif/schema.yaml +254 -0
- package/skills/data-model/newsdata/schema.yaml +650 -0
- package/skills/data-model/overview.md +77 -0
- package/skills/data-model/polymarket/DATA_DICTIONARY.md +384 -0
- package/skills/data-model/polymarket/schema.yaml +601 -0
- package/skills/data-model/sanctions/DATA_DICTIONARY.md +140 -0
- package/skills/data-model/sanctions/schema.yaml +153 -0
- package/skills/data-model/stocks/DATA_DICTIONARY.md +122 -0
- package/skills/data-model/stocks/schema.yaml +131 -0
- package/skills/data-model/system_schema.yaml +71 -0
- package/skills/data-model/wikipedia/DATA_DICTIONARY.md +185 -0
- package/skills/data-model/wikipedia/schema.yaml +255 -0
- package/skills/elemental-api/SKILL.md +37 -0
- package/skills/elemental-api/articles.md +386 -0
- package/skills/elemental-api/entities.md +393 -0
- package/skills/elemental-api/events.md +145 -0
- package/skills/elemental-api/find.md +279 -0
- package/skills/elemental-api/graph.md +239 -0
- package/skills/elemental-api/llm.md +18 -0
- package/skills/elemental-api/overview.md +51 -0
- package/skills/elemental-api/relationships.md +310 -0
- package/skills/elemental-api/schema.md +379 -0
- package/skills/elemental-api/sentiment.md +93 -0
- package/skills/elemental-api/server.md +186 -0
|
@@ -0,0 +1,650 @@
|
|
|
1
|
+
# Dataset schema for newsdata article extraction.
|
|
2
|
+
#
|
|
3
|
+
# This schema defines the entity types, relationships, and attributes
|
|
4
|
+
# extracted from news articles via freetext LLM extraction. Most elements
|
|
5
|
+
# are active (no passive flag), which means they are extracted by the LLM.
|
|
6
|
+
# Some elements are passive (passive: true), which means they are created
|
|
7
|
+
# by the atomizer from metadata (URL parsing, page rank APIs, LSH dedup, etc.)
|
|
8
|
+
# rather than LLM extraction.
|
|
9
|
+
#
|
|
10
|
+
# NOTE: All elements are currently marked not_mergeable because the resolution
|
|
11
|
+
# services do not yet support clustering. Once flavor, property, and
|
|
12
|
+
# relationship resolution services are operational, switch common elements
|
|
13
|
+
# (person, organization, head_of, works_at, etc.) to mergeable.
|
|
14
|
+
# Dataset identity: short machine name plus a human-readable summary.
name: newsdata
description: 'Entities and relationships extracted from news articles, press releases, and similar unstructured text sources'

# Vocabulary mode for each element category declared in this schema.
# NOTE(review): "closed" presumably restricts extraction to the elements
# listed in this file — confirm against the extraction pipeline.
extraction:
  flavors: closed
  properties: closed
  relationships: closed
  attributes: closed
  events: closed
|
|
23
|
+
|
|
24
|
+
# =============================================================================
|
|
25
|
+
# ACTIVE FLAVORS — extracted by the LLM
|
|
26
|
+
# =============================================================================
|
|
27
|
+
|
|
28
|
+
# Entity types ("flavors") for this dataset. Entries without a `passive`
# flag are active (extracted by the LLM); entries with `passive: true` are
# created by the atomizer. Every flavor is currently not_mergeable.
flavors:
  - name: "person"
    description: "A real person as opposed to a fictional character, such as a CEO, politician, or public figure"
    display_name: "Person"
    mergeability: not_mergeable
    # Spelling corrected: the journalist's first name is "Christiane".
    examples: ["James Taiclet", "Christiane Amanpour", "Vladimir Putin"]

  - name: "organization"
    description: "A particular business, institution, or organization such as a corporation, university, government agency, or non-profit"
    display_name: "Organization"
    mergeability: not_mergeable
    examples: ["Google", "Carnegie Mellon University", "The Department of Defense", "TSMC"]

  - name: "location"
    description: "A specific named geographic location such as a city, country, region, or landmark"
    display_name: "Location"
    mergeability: not_mergeable
    examples: ["New York City", "San Francisco", "North America", "Bakery Square"]

  - name: "financial_instrument"
    description: "A specific asset that can be traded, such as a stock, ETF, bond, CD, or fund. Companies are organizations, NOT financial instruments. Specific currency amounts are NOT financial instruments."
    display_name: "Financial Instrument"
    mergeability: not_mergeable
    examples: ["Alphabet Inc Class C", "VanEck CLO ETF", "Marcus 14-Month High-Yield CD", "Vanguard 500 Index Fund"]

  # NOTE(review): the description says "tangible", but the examples include
  # a service ("Starlink Direct to Cell service") — confirm the intended scope.
  - name: "product"
    description: "A specific tangible product being sold or marketed by an organization"
    display_name: "Product"
    mergeability: not_mergeable
    examples: ["Ozempic", "GeForce GPUs", "Starlink Direct to Cell service"]

  # PASSIVE FLAVORS — created by the atomizer, not the LLM

  - name: "article"
    description: "A news article or press release being processed"
    display_name: "Article"
    mergeability: not_mergeable
    passive: true

  - name: "publication"
    description: "A news publication or media outlet identified by its home URL"
    display_name: "Publication"
    mergeability: not_mergeable
    passive: true
|
|
72
|
+
|
|
73
|
+
# =============================================================================
|
|
74
|
+
# ACTIVE RELATIONSHIPS — extracted by the LLM
|
|
75
|
+
# =============================================================================
|
|
76
|
+
|
|
77
|
+
# Directed links between flavors. `domain_flavors` lists the allowed source
# flavors and `target_flavors` the allowed destination flavors. Entries
# without a `passive` flag are extracted by the LLM.
relationships:
  - name: head_of
    description: 'A person is the head of an organization or location, e.g., President, CEO, or equivalent top leadership role'
    display_name: 'Head Of'
    mergeability: not_mergeable
    domain_flavors: [person]
    target_flavors: [organization, location]

  - name: is_director
    description: 'A person is on the board of directors of an organization. Not to be used for heads of organizations.'
    display_name: 'Director Of'
    mergeability: not_mergeable
    domain_flavors: [person]
    target_flavors: [organization]

  - name: works_at
    description: 'A person is employed by, or is a founder of an organization. Not to be used for heads or board members of organizations.'
    display_name: 'Works At'
    mergeability: not_mergeable
    domain_flavors: [person]
    target_flavors: [organization]

  - name: trades_with
    description: 'An organization or location (such as a country) trades with another organization or location. Not for relationships with people.'
    display_name: 'Trades With'
    mergeability: not_mergeable
    domain_flavors: [organization, location]
    target_flavors: [organization, location]

  - name: customer_of
    description: 'An entity (such as an organization) is a customer of another entity in a business transaction'
    display_name: 'Customer Of'
    mergeability: not_mergeable
    domain_flavors: [person, organization, location]
    target_flavors: [organization, location]

  - name: invests_in
    description: 'An entity invests in, finances, or owns shares or stocks of another entity'
    display_name: 'Invests In'
    mergeability: not_mergeable
    domain_flavors: [person, organization, location]
    target_flavors: [organization, location, financial_instrument]

  # NOTE(review): the description names only organization/location targets,
  # while target_flavors also allows financial_instrument and product —
  # confirm which of the two reflects the intended scope.
  - name: owns
    description: 'A person or organization owns or controls another organization or location (such as real estate).'
    display_name: 'Owns'
    mergeability: not_mergeable
    domain_flavors: [person, organization]
    target_flavors: [organization, location, financial_instrument, product]

  - name: is_included_in
    description: 'An organization is included in a broad stock index or benchmark such as NASDAQ or S&P 500'
    display_name: 'Included In'
    mergeability: not_mergeable
    domain_flavors: [organization]
    target_flavors: [organization, financial_instrument]

  - name: sues
    description: 'A person or organization sues, or files a lawsuit against another person or organization'
    display_name: 'Sues'
    mergeability: not_mergeable
    domain_flavors: [person, organization]
    target_flavors: [person, organization]

  - name: is_located_at
    description: 'An entity is located at, operates in, resides in, is headquartered in, was born in, visits, or died in a location'
    display_name: 'Located At'
    mergeability: not_mergeable
    domain_flavors: [person, organization, location]
    target_flavors: [location]

  - name: commented_on
    description: 'A person or organization made a public statement about another entity, including stock analyst ratings or price objectives'
    display_name: 'Commented On'
    mergeability: not_mergeable
    domain_flavors: [person, organization]
    target_flavors: [person, organization, financial_instrument]

  - name: is_colleague_of
    description: 'Two people are colleagues. Not for relationships between locations or organizations.'
    display_name: 'Colleague Of'
    mergeability: not_mergeable
    domain_flavors: [person]
    target_flavors: [person]

  - name: competes_with
    description: 'Two entities compete with each other, e.g., two competing companies, sports teams, or products'
    display_name: 'Competes With'
    mergeability: not_mergeable
    domain_flavors: [person, organization, location, financial_instrument, product]
    target_flavors: [person, organization, location, financial_instrument, product]

  - name: partnered_with
    description: 'Two entities partner with each other, e.g., two organizations co-hosting an event or forming a joint venture'
    display_name: 'Partnered With'
    mergeability: not_mergeable
    domain_flavors: [person, organization, location]
    target_flavors: [person, organization, location]

  - name: is_part_of
    description: 'An organization is a part of a larger organization, e.g., a subdivision or subsidiary within a larger company'
    display_name: 'Part Of'
    mergeability: not_mergeable
    domain_flavors: [organization]
    target_flavors: [organization]

  - name: is_member_of
    description: 'A person or organization is a member of another organization, e.g., a sports team in a league. Not mutually exclusive — entities can belong to multiple organizations.'
    display_name: 'Member Of'
    mergeability: not_mergeable
    domain_flavors: [person, organization]
    target_flavors: [organization]

  - name: provides_support_to
    description: 'An entity provides financial support to another entity. Reserved for sponsorship and donations, NOT for business transactions.'
    display_name: 'Provides Support To'
    mergeability: not_mergeable
    domain_flavors: [person, organization, location]
    target_flavors: [organization, location]

  - name: issues
    description: 'An organization issues or manages a financial instrument, e.g., a company listed as an issuer of an exchange-traded fund'
    display_name: 'Issues'
    mergeability: not_mergeable
    domain_flavors: [organization]
    target_flavors: [financial_instrument]

  - name: serviced_by
    description: 'A financial instrument (e.g., a pool of CMBS loans) is managed by a primary servicer'
    display_name: 'Serviced By'
    mergeability: not_mergeable
    domain_flavors: [financial_instrument]
    target_flavors: [organization]

  - name: sponsored_by
    description: 'An asset (e.g., a CMBS, CLO, or an underlying loan) is sponsored by a specific entity that provides or owns the underlying collateral'
    display_name: 'Sponsored By'
    mergeability: not_mergeable
    domain_flavors: [financial_instrument]
    target_flavors: [organization]

  - name: compares_to
    description: 'An organization is used as a comparable for analysis of another organization, e.g., BMW as a comparable company to Tesla'
    display_name: 'Compares To'
    mergeability: not_mergeable
    domain_flavors: [organization]
    target_flavors: [organization]

  - name: acquires
    description: 'An organization acquires another organization'
    display_name: 'Acquires'
    mergeability: not_mergeable
    domain_flavors: [organization]
    target_flavors: [organization]
    examples: ['Palo Alto Networks acquiring Protect AI']

  - name: launches
    description: 'An organization launches a new product or financial instrument. NOT for expanding a business to new markets.'
    display_name: 'Launches'
    mergeability: not_mergeable
    domain_flavors: [organization]
    target_flavors: [product, financial_instrument]
    examples: ['Barracuda Networks launching Entra ID Backup Premium']

  - name: produces
    description: 'An organization owns, develops, or markets a product'
    display_name: 'Produces'
    mergeability: not_mergeable
    domain_flavors: [organization]
    target_flavors: [product]
    examples: ['Honeywell Anthem integrated flight deck from Honeywell']

  # Passive relationships: produced by the atomizer rather than the LLM.

  # No domain_flavors key is declared for appears_in.
  - name: appears_in
    description: 'An entity or event appears in a source document'
    display_name: 'Appears In'
    mergeability: not_mergeable
    target_flavors: [article]
    passive: true

  - name: duplicate_of
    description: 'An article is a near-duplicate of another article (detected by LSH)'
    display_name: 'Duplicate Of'
    mergeability: not_mergeable
    domain_flavors: [article]
    target_flavors: [article]
    passive: true

  - name: published_in
    description: 'An article was published by a publication'
    display_name: 'Published In'
    mergeability: not_mergeable
    domain_flavors: [article]
    target_flavors: [publication]
    passive: true

  - name: original_publisher
    description: "An article's original publisher (when different from the source)"
    display_name: 'Original Publisher'
    mergeability: not_mergeable
    domain_flavors: [article]
    target_flavors: [publication]
    passive: true
|
|
281
|
+
|
|
282
|
+
# =============================================================================
|
|
283
|
+
# ACTIVE PROPERTIES — extracted by the LLM
|
|
284
|
+
# =============================================================================
|
|
285
|
+
|
|
286
|
+
# Scalar properties. Entries carrying an `extraction_config` are extracted
# by the LLM; entries flagged `passive: true` come from the atomizer.
# NOTE(review): the source this block was rebuilt from had lost its
# indentation; classification / scoring / literal are placed under
# extraction_config — confirm against the published schema.
properties:
  - name: tone
    type: string
    description: 'Whether the article is opinionated or presents factual reporting'
    display_name: 'Tone'
    mergeability: not_mergeable
    extraction_config:
      level: document
      classification:
        values:
          - name: opinionated
            description: 'The article contains editorial perspective or opinion'
          - name: matter-of-fact
            description: 'The article presents factual reporting without editorializing'

  - name: title_factuality
    type: string
    description: 'Whether the article title is sensational or factual'
    display_name: 'Title Factuality'
    mergeability: not_mergeable
    extraction_config:
      level: document
      classification:
        values:
          - name: sensational
            description: 'The title is exaggerated, clickbait, or emotionally charged beyond what the article supports'
          - name: factual
            description: 'The title accurately and neutrally reflects the article content'

  # Document-level score on a five-step scale from -1.0 to 1.0.
  - name: sentiment
    type: float
    description: 'Classify the financial sentiment of the source text. Positive sentiment indicates events like revenue growth, strategic partnerships, or milestone achievement. Negative sentiment indicates events like economic downturn, natural disasters, or adverse market conditions.'
    display_name: 'Sentiment'
    mergeability: not_mergeable
    extraction_config:
      level: document
      scoring:
        scale:
          labels:
            - value: -1.0
              name: 'strongly negative'
            - value: -0.5
              name: 'slightly negative'
            - value: 0.0
              name: 'neutral'
            - value: 0.5
              name: 'slightly positive'
            - value: 1.0
              name: 'strongly positive'

  # Entity-level counterpart of `sentiment`, using the same scale labels.
  - name: entity_sentiment
    type: float
    description: 'Classify the financial sentiment of a specific entity mentioned in the source text. Positive sentiment indicates events like revenue growth, strategic partnerships, or milestone achievement. Negative sentiment indicates events like economic downturn, natural disasters, or adverse market conditions. If the entity is irrelevant to the subject matter, assign a neutral score.'
    display_name: 'Entity Sentiment'
    mergeability: not_mergeable
    domain_flavors: [organization, person, location]
    extraction_config:
      level: entity
      scoring:
        scale:
          labels:
            - value: -1.0
              name: 'strongly negative'
            - value: -0.5
              name: 'slightly negative'
            - value: 0.0
              name: 'neutral'
            - value: 0.5
              name: 'slightly positive'
            - value: 1.0
              name: 'strongly positive'

  # Folded block scalar: the line breaks below fold into single spaces.
  - name: original_publication_name
    type: string
    description: >-
      Determine whether this article was syndicated or republished from a
      different publication or wire service. Look for an explicit credit in the
      byline (e.g., "(Reuters) -", "By Jane Doe, Bloomberg", "Source: AP") or
      in a footer/disclaimer (e.g., "This article was originally published
      by..."). Common wire services and syndicators include Reuters, Associated
      Press (AP), AFP, Bloomberg, PRNewswire, GLOBE NEWSWIRE, and Business
      Wire. Return ONLY the name of the original publication or wire service
      exactly as credited. IMPORTANT: Most articles are NOT syndicated — they
      are original content written by or for the website hosting them. If there
      is no explicit syndication credit to a DIFFERENT publication, return
      exactly "Not available". Do NOT return the name of the website hosting
      the article, the article title, a company mentioned in the article, or
      the author name. Do NOT guess — if you are unsure, return "Not available".
    display_name: 'Original Publication'
    mergeability: not_mergeable
    domain_flavors: [article]
    extraction_config:
      level: document
      literal:
        include_snippet: true

  # Passive properties: produced by the atomizer rather than the LLM.

  - name: has_topic
    type: string
    description: 'A topic associated with an article, derived from event categories'
    display_name: 'Topic'
    mergeability: not_mergeable
    domain_flavors: [article]
    passive: true

  - name: title
    type: string
    description: 'Title of the entity'
    display_name: 'Title'
    mergeability: not_mergeable
    passive: true

  - name: homeUrl
    type: string
    description: 'The home URL of a publication'
    display_name: 'Home URL'
    mergeability: not_mergeable
    passive: true

  - name: domain
    type: string
    description: 'The domain name of a publication'
    display_name: 'Domain'
    mergeability: not_mergeable
    passive: true

  - name: name
    type: string
    description: 'Display name of the entity'
    display_name: 'Name'
    mergeability: not_mergeable
    passive: true

  - name: pageRank
    type: float
    description: 'Google PageRank score for a publication'
    display_name: 'PageRank'
    mergeability: not_mergeable
    passive: true

  - name: mozRank
    type: float
    description: 'Moz rank score for a publication'
    display_name: 'Moz Rank'
    mergeability: not_mergeable
    passive: true

  - name: pageAuthority
    type: float
    description: 'Moz page authority score for a publication'
    display_name: 'Page Authority'
    mergeability: not_mergeable
    passive: true

  - name: domainAuthority
    type: float
    description: 'Moz domain authority score for a publication'
    display_name: 'Domain Authority'
    mergeability: not_mergeable
    passive: true

  - name: externalLinks
    type: float
    description: 'Number of external links to a publication'
    display_name: 'External Links'
    mergeability: not_mergeable
    passive: true

  - name: links
    type: float
    description: 'Total number of links to a publication'
    display_name: 'Links'
    mergeability: not_mergeable
    passive: true

  - name: title_factuality_score
    type: float
    description: 'Aggregate title factuality score for a publication'
    display_name: 'Title Factuality Score'
    mergeability: not_mergeable
    passive: true

  - name: tone_objectivity_score
    type: float
    description: 'Aggregate tone objectivity score for a publication'
    display_name: 'Tone Objectivity Score'
    mergeability: not_mergeable
    passive: true
|
|
475
|
+
|
|
476
|
+
# =============================================================================
|
|
477
|
+
# PASSIVE ATTRIBUTES — created by the atomizer, not the LLM
|
|
478
|
+
# =============================================================================
|
|
479
|
+
|
|
480
|
+
# Attributes: each entry names the element it hangs off (`property`) and
# the attribute stored on it (`name`).
# NOTE(review): the section banner calls these passive, yet no entry
# carries `passive: true` — confirm whether attributes take that flag.
attributes:
  - property: appears_in
    name: source
    type: string
    description: 'Source document identifier'
    display_name: 'Source'
    mergeability: not_mergeable

  - property: appears_in
    name: url
    type: string
    description: 'URL of the source document'
    display_name: 'URL'
    mergeability: not_mergeable

  - property: appears_in
    name: batch
    type: string
    description: 'Batch identifier for the extraction run'
    display_name: 'Batch'
    mergeability: not_mergeable

  - property: appears_in
    name: trustworthiness
    type: float
    description: 'Trustworthiness score for the source publication'
    display_name: 'Trustworthiness'
    mergeability: not_mergeable

  - property: appears_in
    name: sentiment
    type: float
    description: 'Entity-level sentiment in the context of the source document'
    display_name: 'Sentiment'
    mergeability: not_mergeable

  - property: sentiment
    name: reasoning
    type: string
    description: 'Reasoning behind the sentiment score'
    display_name: 'Reasoning'
    mergeability: not_mergeable
|
|
522
|
+
|
|
523
|
+
# =============================================================================
|
|
524
|
+
# EVENTS
|
|
525
|
+
# =============================================================================
|
|
526
|
+
|
|
527
|
+
# Event categories, each tagged with `metadata.severity`. Entries are listed
# in severity order: high first, then medium, then low.
events:
  # --- severity: high ---
  - name: "Bankruptcy"
    description: "Bankruptcy of a company or person"
    metadata: { severity: high }
  - name: "Default"
    description: "Default on a major loan or debt"
    metadata: { severity: high }
  - name: "Seizure"
    description: "Seizure of assets or property typically by a government or law enforcement"
    metadata: { severity: high }
  - name: "Insolvency"
    description: "Insolvency of a company"
    metadata: { severity: high }
  - name: "Expropriation"
    description: "Expropriation of assets or property"
    metadata: { severity: high }
  - name: "Mergers & acquisitions"
    description: "A merger or acquisition of a company"
    metadata: { severity: high }
  - name: "Hostile takeover"
    description: "Acquiring a company against its management's wishes by purchasing a majority of shares"
    metadata: { severity: high }
  - name: "Acts of war"
    description: "Direct reports of war activities. NOT for historical accounts or obituaries."
    metadata: { severity: high }
  - name: "Terrorism"
    description: "Direct reports of terrorism that are actively happening or predicted to happen. Not for historical accounts."
    metadata: { severity: high }
  - name: "Significant legal judgement"
    description: "Final verdicts in legal trials that directly affect a company, person, or location"
    metadata: { severity: high }
  - name: "Cybersecurity breach"
    description: "A major breach of a company's cybersecurity especially if it will affect the market"
    metadata: { severity: high }
  - name: "Major natural disaster"
    description: "A major, destructive natural disaster such as a hurricane, earthquake, tornado, wildfire, or flood"
    metadata: { severity: high }
  - name: "IPO"
    description: "A report of an initial public offering (IPO) that has happened or is predicted to happen"
    metadata: { severity: high }
  # Reworded: the previous text mirrored the IPO wording and described the
  # company itself as something that "has happened"; the event is the
  # SPAC transaction.
  - name: "SPAC"
    description: "A report of a special purpose acquisition company (SPAC) transaction, such as a SPAC listing or merger, that has happened or is predicted to happen"
    metadata: { severity: high }
  - name: "Win of long-term, high-value contract"
    description: "Major contracts on the order of 10s of millions to billions of dollars"
    metadata: { severity: high }
  - name: "Technological breakthrough"
    description: "Major technological breakthrough (not just adopting new technology). E.g., a new drug, new chip, new aircraft."
    metadata: { severity: high }
  - name: "Epidemic/pandemic disease"
    description: "A major, worldwide or country-wide epidemic or pandemic disease affecting many people"
    metadata: { severity: high }
  - name: "Insider trading"
    description: "Verified insider trading especially if the SEC is involved"
    metadata: { severity: high }

  # --- severity: medium ---
  - name: "Dividend announcement"
    description: "Routine quarterly, monthly, etc. dividend announcements by a company"
    metadata: { severity: medium }
  - name: "Corporate restructuring"
    description: "Restructuring of a company such as an internal reorganization. NOT for mergers or acquisitions."
    metadata: { severity: medium }
  - name: "Layoffs"
    description: "Significant, verified layoffs/firings of staff (not just one or two people) from a company. NOT for labor shortages."
    metadata: { severity: medium }
  - name: "Customer loss"
    description: "Loss of a major customer"
    metadata: { severity: medium }
  - name: "Product delays"
    description: "Significant, verified delays in product delivery"
    metadata: { severity: medium }
  - name: "Major leadership change"
    description: "Major leadership change at a company such as a CEO, CFO, CTO, or Chairman change from one person to another"
    metadata: { severity: medium }
  - name: "Credit rating downgrade"
    description: "A credit rating downgrade of a company"
    metadata: { severity: medium }
  - name: "Credit rating upgrade"
    description: "A credit rating upgrade of a company"
    metadata: { severity: medium }
  - name: "Strategic partnership"
    description: "A strategic partnership between people and/or companies"
    metadata: { severity: medium }
  - name: "New funding or investment"
    description: "Venture capital or private equity investment in a company, such as a Series A, B, etc."
    metadata: { severity: medium }
  - name: "Launch of a new product"
    description: "Launch of a brand new product worthy of press releases (NOT for adopting existing technology)"
    metadata: { severity: medium }
  - name: "Major crime"
    description: "Major crimes such as murder, robbery, etc."
    metadata: { severity: medium }
  - name: "Earnings call"
    description: "Standard quarterly earnings calls"
    metadata: { severity: medium }

  # --- severity: low ---
  - name: "Change in government policy"
    description: "A significant change in government policy that might affect the financial health of an entity"
    metadata: { severity: low }
  - name: "Market commentary"
    description: "Article discusses mundane changes in the market"
    metadata: { severity: low }
  - name: "Political commentary"
    description: "Mundane political commentary such as polls or pundit analysis"
    metadata: { severity: low }
  - name: "Analyst report"
    description: "Reports from Moody's, S&P Global Ratings, Fitch Ratings, and similar"
    metadata: { severity: low }
  - name: "Interview"
    description: "The article is specifically an interview"
    metadata: { severity: low }
  - name: "Industry award"
    description: "MAJOR awards such as the Nobel Prize, Pulitzer Prize, Turing Award, Edison Awards, etc."
    metadata: { severity: low }
  - name: "Regulatory filing & compliance"
    description: "Typical or routine filings by a company for regulatory and compliance purposes"
    metadata: { severity: low }
  - name: "Personnel changes"
    description: "A change in low- to medium-level personnel such as hiring a new engineer. NOT for major leadership changes or layoffs."
    metadata: { severity: low }
  - name: "Sports"
    description: "Sports news such as a new record, a new player, scores, etc."
    metadata: { severity: low }
  - name: "Entertainment"
    description: "Entertainment news such as a new movie, TV show, album, book, etc."
    metadata: { severity: low }
|