fabricatio 0.3.15.dev5__cp312-cp312-win_amd64.whl → 0.4.5.dev0__cp312-cp312-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (65) hide show
  1. fabricatio/__init__.py +7 -8
  2. fabricatio/actions/__init__.py +69 -1
  3. fabricatio/capabilities/__init__.py +63 -1
  4. fabricatio/models/__init__.py +51 -0
  5. fabricatio/rust.cp312-win_amd64.pyd +0 -0
  6. fabricatio/toolboxes/__init__.py +2 -1
  7. fabricatio/toolboxes/arithmetic.py +1 -1
  8. fabricatio/toolboxes/fs.py +2 -2
  9. fabricatio/workflows/__init__.py +9 -0
  10. fabricatio-0.4.5.dev0.data/scripts/tdown.exe +0 -0
  11. {fabricatio-0.3.15.dev5.dist-info → fabricatio-0.4.5.dev0.dist-info}/METADATA +58 -27
  12. fabricatio-0.4.5.dev0.dist-info/RECORD +15 -0
  13. fabricatio/actions/article.py +0 -415
  14. fabricatio/actions/article_rag.py +0 -407
  15. fabricatio/actions/fs.py +0 -25
  16. fabricatio/actions/output.py +0 -247
  17. fabricatio/actions/rag.py +0 -96
  18. fabricatio/actions/rules.py +0 -83
  19. fabricatio/capabilities/advanced_judge.py +0 -20
  20. fabricatio/capabilities/advanced_rag.py +0 -61
  21. fabricatio/capabilities/censor.py +0 -105
  22. fabricatio/capabilities/check.py +0 -212
  23. fabricatio/capabilities/correct.py +0 -228
  24. fabricatio/capabilities/extract.py +0 -74
  25. fabricatio/capabilities/propose.py +0 -65
  26. fabricatio/capabilities/rag.py +0 -264
  27. fabricatio/capabilities/rating.py +0 -404
  28. fabricatio/capabilities/review.py +0 -114
  29. fabricatio/capabilities/task.py +0 -113
  30. fabricatio/decorators.py +0 -253
  31. fabricatio/emitter.py +0 -177
  32. fabricatio/fs/__init__.py +0 -35
  33. fabricatio/fs/curd.py +0 -153
  34. fabricatio/fs/readers.py +0 -61
  35. fabricatio/journal.py +0 -12
  36. fabricatio/models/action.py +0 -263
  37. fabricatio/models/adv_kwargs_types.py +0 -63
  38. fabricatio/models/extra/__init__.py +0 -1
  39. fabricatio/models/extra/advanced_judge.py +0 -32
  40. fabricatio/models/extra/aricle_rag.py +0 -286
  41. fabricatio/models/extra/article_base.py +0 -488
  42. fabricatio/models/extra/article_essence.py +0 -98
  43. fabricatio/models/extra/article_main.py +0 -285
  44. fabricatio/models/extra/article_outline.py +0 -45
  45. fabricatio/models/extra/article_proposal.py +0 -52
  46. fabricatio/models/extra/patches.py +0 -20
  47. fabricatio/models/extra/problem.py +0 -165
  48. fabricatio/models/extra/rag.py +0 -98
  49. fabricatio/models/extra/rule.py +0 -51
  50. fabricatio/models/generic.py +0 -904
  51. fabricatio/models/kwargs_types.py +0 -121
  52. fabricatio/models/role.py +0 -156
  53. fabricatio/models/task.py +0 -310
  54. fabricatio/models/tool.py +0 -328
  55. fabricatio/models/usages.py +0 -791
  56. fabricatio/parser.py +0 -114
  57. fabricatio/rust.pyi +0 -846
  58. fabricatio/utils.py +0 -156
  59. fabricatio/workflows/articles.py +0 -24
  60. fabricatio/workflows/rag.py +0 -11
  61. fabricatio-0.3.15.dev5.data/scripts/tdown.exe +0 -0
  62. fabricatio-0.3.15.dev5.data/scripts/ttm.exe +0 -0
  63. fabricatio-0.3.15.dev5.dist-info/RECORD +0 -63
  64. {fabricatio-0.3.15.dev5.dist-info → fabricatio-0.4.5.dev0.dist-info}/WHEEL +0 -0
  65. {fabricatio-0.3.15.dev5.dist-info → fabricatio-0.4.5.dev0.dist-info}/licenses/LICENSE +0 -0
@@ -1,488 +0,0 @@
1
- """A foundation for hierarchical document components with dependency tracking."""
2
-
3
- from abc import ABC
4
- from enum import StrEnum
5
- from pathlib import Path
6
- from typing import ClassVar, Generator, List, Optional, Self, Tuple, Type
7
-
8
- from fabricatio.fs import dump_text, safe_text_read
9
- from fabricatio.fs.readers import extract_sections
10
- from fabricatio.journal import logger
11
- from fabricatio.models.generic import (
12
- AsPrompt,
13
- Described,
14
- FinalizedDumpAble,
15
- Introspect,
16
- Language,
17
- ModelHash,
18
- PersistentAble,
19
- ProposedUpdateAble,
20
- SketchedAble,
21
- Titled,
22
- WordCount,
23
- )
24
- from fabricatio.rust import (
25
- detect_language,
26
- extract_body,
27
- replace_thesis_body,
28
- split_out_metadata,
29
- strip_comment,
30
- to_metadata,
31
- word_count,
32
- )
33
- from fabricatio.utils import fallback_kwargs, ok
34
- from pydantic import Field
35
-
36
- ARTICLE_WRAPPER = "// =-=-=-=-=-=-=-=-=-="
37
-
38
-
39
- class ReferringType(StrEnum):
40
- """Enumeration of different types of references that can be made in an article."""
41
-
42
- CHAPTER = "chapter"
43
- SECTION = "section"
44
- SUBSECTION = "subsection"
45
-
46
-
47
- type RefKey = Tuple[str, Optional[str], Optional[str]]
48
-
49
-
50
- class ArticleMetaData(SketchedAble, Described, WordCount, Titled, Language):
51
- """Metadata for an article component."""
52
-
53
- description: str = Field(
54
- alias="elaboration",
55
- description=Described.model_fields["description"].description,
56
- )
57
-
58
- title: str = Field(alias="heading", description=Titled.model_fields["title"].description)
59
-
60
- aims: List[str]
61
- """List of writing aims of the research component in academic style."""
62
-
63
- _unstructured_body: str = ""
64
- """Store the source of the unknown information."""
65
-
66
- @property
67
- def typst_metadata_comment(self) -> str:
68
- """Generates a comment for the metadata of the article component."""
69
- data = self.model_dump(
70
- include={"description", "aims", "expected_word_count"},
71
- by_alias=True,
72
- )
73
- return to_metadata({k: v for k, v in data.items() if v})
74
-
75
- @property
76
- def unstructured_body(self) -> str:
77
- """Returns the unstructured body of the article component."""
78
- return self._unstructured_body
79
-
80
- def update_unstructured_body[S: "ArticleMetaData"](self: S, body: str) -> S:
81
- """Update the unstructured body of the article component."""
82
- self._unstructured_body = body
83
- return self
84
-
85
- @property
86
- def language(self) -> str:
87
- """Get the language of the article component."""
88
- return detect_language(self.title)
89
-
90
-
91
- class FromTypstCode(ArticleMetaData):
92
- """Base class for article components that can be created from a Typst code snippet."""
93
-
94
- @classmethod
95
- def from_typst_code(cls, title: str, body: str, **kwargs) -> Self:
96
- """Converts a Typst code snippet into an article component."""
97
- data, body = split_out_metadata(body)
98
-
99
- return cls(
100
- heading=title.strip(),
101
- **fallback_kwargs(data or {}, elaboration="", expected_word_count=word_count(body), aims=[]),
102
- **kwargs,
103
- )
104
-
105
-
106
- class ToTypstCode(ArticleMetaData):
107
- """Base class for article components that can be converted to a Typst code snippet."""
108
-
109
- def to_typst_code(self) -> str:
110
- """Converts the component into a Typst code snippet for rendering."""
111
- return f"{self.title}\n{self.typst_metadata_comment}\n\n{self._unstructured_body}"
112
-
113
-
114
- class ArticleOutlineBase(
115
- ProposedUpdateAble,
116
- PersistentAble,
117
- ModelHash,
118
- Introspect,
119
- FromTypstCode,
120
- ToTypstCode,
121
- ABC,
122
- ):
123
- """Base class for article outlines."""
124
-
125
- @property
126
- def metadata(self) -> ArticleMetaData:
127
- """Returns the metadata of the article component."""
128
- return ArticleMetaData.model_validate(self, from_attributes=True)
129
-
130
- def update_metadata(self, other: ArticleMetaData) -> Self:
131
- """Updates the metadata of the current instance with the attributes of another instance."""
132
- self.aims.clear()
133
- self.aims.extend(other.aims)
134
- self.description = other.description
135
- return self
136
-
137
- def update_from_inner(self, other: Self) -> Self:
138
- """Updates the current instance with the attributes of another instance."""
139
- return self.update_metadata(other)
140
-
141
-
142
- class SubSectionBase(ArticleOutlineBase):
143
- """Base class for article sections and subsections."""
144
-
145
- def to_typst_code(self) -> str:
146
- """Converts the component into a Typst code snippet for rendering."""
147
- return f"=== {super().to_typst_code()}"
148
-
149
- def introspect(self) -> str:
150
- """Introspects the article subsection outline."""
151
- return ""
152
-
153
- def resolve_update_conflict(self, other: Self) -> str:
154
- """Resolve update errors in the article outline."""
155
- if self.title != other.title:
156
- return f"Title mismatched, expected `{self.title}`, got `{other.title}`"
157
- return ""
158
-
159
-
160
- class SectionBase[T: SubSectionBase](ArticleOutlineBase):
161
- """Base class for article sections and subsections."""
162
-
163
- subsections: List[T]
164
- """Subsections of the section. Contains at least one subsection. You can also add more as needed."""
165
-
166
- child_type: ClassVar[Type[SubSectionBase]]
167
-
168
- def to_typst_code(self) -> str:
169
- """Converts the section into a Typst formatted code snippet.
170
-
171
- Returns:
172
- str: The formatted Typst code snippet.
173
- """
174
- return f"== {super().to_typst_code()}" + "\n\n".join(subsec.to_typst_code() for subsec in self.subsections)
175
-
176
- @classmethod
177
- def from_typst_code(cls, title: str, body: str, **kwargs) -> Self:
178
- """Creates an Article object from the given Typst code."""
179
- raw = extract_sections(body, level=3, section_char="=")
180
-
181
- return (
182
- super()
183
- .from_typst_code(
184
- title,
185
- body,
186
- subsections=[cls.child_type.from_typst_code(*pack) for pack in raw],
187
- )
188
- .update_unstructured_body("" if raw else strip_comment(body))
189
- )
190
-
191
- def resolve_update_conflict(self, other: Self) -> str:
192
- """Resolve update errors in the article outline."""
193
- out = ""
194
- if self.title != other.title:
195
- out += f"Title mismatched, expected `{self.title}`, got `{other.title}`"
196
- if len(self.subsections) != len(other.subsections):
197
- out += f"Section count mismatched, expected `{len(self.subsections)}`, got `{len(other.subsections)}`"
198
- return out or "\n".join(
199
- [
200
- conf
201
- for s, o in zip(self.subsections, other.subsections, strict=True)
202
- if (conf := s.resolve_update_conflict(o))
203
- ]
204
- )
205
-
206
- def update_from_inner(self, other: Self) -> Self:
207
- """Updates the current instance with the attributes of another instance."""
208
- super().update_from_inner(other)
209
- if len(self.subsections) == 0:
210
- self.subsections = other.subsections
211
- return self
212
-
213
- for self_subsec, other_subsec in zip(self.subsections, other.subsections, strict=True):
214
- self_subsec.update_from(other_subsec)
215
- return self
216
-
217
- def introspect(self) -> str:
218
- """Introspects the article section outline."""
219
- if len(self.subsections) == 0:
220
- return f"Section `{self.title}` contains no subsections, expected at least one, but got 0, you can add one or more as needed."
221
- return ""
222
-
223
- @property
224
- def exact_word_count(self) -> int:
225
- """Returns the exact word count of the article section outline."""
226
- return sum(a.exact_word_count for a in self.subsections)
227
-
228
-
229
- class ChapterBase[T: SectionBase](ArticleOutlineBase):
230
- """Base class for article chapters."""
231
-
232
- sections: List[T]
233
- """Sections of the chapter. Contains at least one section. You can also add more as needed."""
234
- child_type: ClassVar[Type[SectionBase]]
235
-
236
- def to_typst_code(self) -> str:
237
- """Converts the chapter into a Typst formatted code snippet for rendering."""
238
- return f"= {super().to_typst_code()}" + "\n\n".join(sec.to_typst_code() for sec in self.sections)
239
-
240
- @classmethod
241
- def from_typst_code(cls, title: str, body: str, **kwargs) -> Self:
242
- """Creates an Article object from the given Typst code."""
243
- raw_sec = extract_sections(body, level=2, section_char="=")
244
-
245
- return (
246
- super()
247
- .from_typst_code(
248
- title,
249
- body,
250
- sections=[cls.child_type.from_typst_code(*pack) for pack in raw_sec],
251
- )
252
- .update_unstructured_body("" if raw_sec else strip_comment(body))
253
- )
254
-
255
- def resolve_update_conflict(self, other: Self) -> str:
256
- """Resolve update errors in the article outline."""
257
- out = ""
258
-
259
- if self.title != other.title:
260
- out += f"Title mismatched, expected `{self.title}`, got `{other.title}`"
261
- if len(self.sections) == len(other.sections):
262
- out += f"Chapter count mismatched, expected `{len(self.sections)}`, got `{len(other.sections)}`"
263
-
264
- return out or "\n".join(
265
- [conf for s, o in zip(self.sections, other.sections, strict=True) if (conf := s.resolve_update_conflict(o))]
266
- )
267
-
268
- def update_from_inner(self, other: Self) -> Self:
269
- """Updates the current instance with the attributes of another instance."""
270
- if len(self.sections) == 0:
271
- self.sections = other.sections
272
- return self
273
-
274
- for self_sec, other_sec in zip(self.sections, other.sections, strict=True):
275
- self_sec.update_from(other_sec)
276
- return self
277
-
278
- def introspect(self) -> str:
279
- """Introspects the article chapter outline."""
280
- if len(self.sections) == 0:
281
- return f"Chapter `{self.title}` contains no sections, expected at least one, but got 0, you can add one or more as needed."
282
- return ""
283
-
284
- @property
285
- def exact_word_count(self) -> int:
286
- """Calculates the total word count across all sections in the chapter.
287
-
288
- Returns:
289
- int: The cumulative word count of all sections.
290
- """
291
- return sum(a.exact_word_count for a in self.sections)
292
-
293
-
294
- class ArticleBase[T: ChapterBase](FinalizedDumpAble, AsPrompt, FromTypstCode, ToTypstCode, ABC):
295
- """Base class for article outlines."""
296
-
297
- description: str = Field(
298
- alias="elaboration",
299
- )
300
- """The abstract of this article, which serves as a concise summary of an academic article, encapsulating its core purpose, methodologies, key results,
301
- and conclusions while enabling readers to rapidly assess the relevance and significance of the study.
302
- Functioning as the article's distilled essence, it succinctly articulates the research problem, objectives,
303
- and scope, providing a roadmap for the full text while also facilitating database indexing, literature reviews,
304
- and citation tracking through standardized metadata. Additionally, it acts as an accessibility gateway,
305
- allowing scholars to gauge the study's contribution to existing knowledge, its methodological rigor,
306
- and its broader implications without engaging with the entire manuscript, thereby optimizing scholarly communication efficiency."""
307
-
308
- chapters: List[T]
309
- """Chapters of the article. Contains at least one chapter. You can also add more as needed."""
310
-
311
- child_type: ClassVar[Type[ChapterBase]]
312
-
313
- @property
314
- def language(self) -> str:
315
- """Get the language of the article."""
316
- if self.title:
317
- return super().language
318
- return self.chapters[0].language
319
-
320
- @property
321
- def exact_word_count(self) -> int:
322
- """Calculates the total word count across all chapters in the article.
323
-
324
- Returns:
325
- int: The cumulative word count of all chapters.
326
- """
327
- return sum(ch.exact_word_count for ch in self.chapters)
328
-
329
- @classmethod
330
- def from_typst_code(cls, title: str, body: str, **kwargs) -> Self:
331
- """Generates an article from the given Typst code."""
332
- raw = extract_sections(body, level=1, section_char="=")
333
- return (
334
- super()
335
- .from_typst_code(
336
- title,
337
- body,
338
- chapters=[cls.child_type.from_typst_code(*pack) for pack in raw],
339
- )
340
- .update_unstructured_body("" if raw else strip_comment(body))
341
- )
342
-
343
- def iter_dfs_rev(
344
- self,
345
- ) -> Generator[ArticleOutlineBase, None, None]:
346
- """Performs a depth-first search (DFS) through the article structure in reverse order.
347
-
348
- Returns:
349
- Generator[ArticleMainBase]: Each component in the article structure in reverse order.
350
- """
351
- for chap in self.chapters:
352
- for sec in chap.sections:
353
- yield from sec.subsections
354
- yield sec
355
- yield chap
356
-
357
- def iter_dfs(self) -> Generator[ArticleOutlineBase, None, None]:
358
- """Performs a depth-first search (DFS) through the article structure.
359
-
360
- Returns:
361
- Generator[ArticleMainBase]: Each component in the article structure.
362
- """
363
- for chap in self.chapters:
364
- yield chap
365
- for sec in chap.sections:
366
- yield sec
367
- yield from sec.subsections
368
-
369
- def iter_sections(self) -> Generator[Tuple[ChapterBase, SectionBase], None, None]:
370
- """Iterates through all sections in the article.
371
-
372
- Returns:
373
- Generator[ArticleOutlineBase]: Each section in the article.
374
- """
375
- for chap in self.chapters:
376
- for sec in chap.sections:
377
- yield chap, sec
378
-
379
- def iter_subsections(self) -> Generator[Tuple[ChapterBase, SectionBase, SubSectionBase], None, None]:
380
- """Iterates through all subsections in the article.
381
-
382
- Returns:
383
- Generator[ArticleOutlineBase]: Each subsection in the article.
384
- """
385
- for chap, sec in self.iter_sections():
386
- for subsec in sec.subsections:
387
- yield chap, sec, subsec
388
-
389
- def find_introspected(self) -> Optional[Tuple[ArticleOutlineBase, str]]:
390
- """Finds the first introspected component in the article structure."""
391
- summary = ""
392
- for component in self.iter_dfs_rev():
393
- summary += component.introspect()
394
- if summary:
395
- return component, summary
396
- return None
397
-
398
- def gather_introspected(self) -> Optional[str]:
399
- """Gathers all introspected components in the article structure."""
400
- return "\n".join([i for component in self.chapters if (i := component.introspect())])
401
-
402
- def iter_chap_title(self) -> Generator[str, None, None]:
403
- """Iterates through all chapter titles in the article."""
404
- for chap in self.chapters:
405
- yield chap.title
406
-
407
- def iter_section_title(self) -> Generator[str, None, None]:
408
- """Iterates through all section titles in the article."""
409
- for _, sec in self.iter_sections():
410
- yield sec.title
411
-
412
- def iter_subsection_title(self) -> Generator[str, None, None]:
413
- """Iterates through all subsection titles in the article."""
414
- for _, _, subsec in self.iter_subsections():
415
- yield subsec.title
416
-
417
- def to_typst_code(self) -> str:
418
- """Generates the Typst code representation of the article."""
419
- return f"// #Title: {super().to_typst_code()}\n" + "\n\n".join(a.to_typst_code() for a in self.chapters)
420
-
421
- def finalized_dump(self) -> str:
422
- """Generates standardized hierarchical markup for academic publishing systems.
423
-
424
- Implements ACL 2024 outline conventions with four-level structure:
425
- = Chapter Title (Level 1)
426
- == Section Title (Level 2)
427
- === Subsection Title (Level 3)
428
- ==== Subsubsection Title (Level 4)
429
-
430
- Returns:
431
- str: Strictly formatted outline with academic sectioning
432
-
433
- Example:
434
- = Methodology
435
- == Neural Architecture Search Framework
436
- === Differentiable Search Space
437
- ==== Constrained Optimization Parameters
438
- === Implementation Details
439
- == Evaluation Protocol
440
- """
441
- return self.to_typst_code()
442
-
443
- def avg_chap_wordcount[S: "ArticleBase"](self: S) -> S:
444
- """Set all chap have same word count sum up to be `self.expected_word_count`."""
445
- avg = int(self.expected_word_count / len(self.chapters))
446
- for c in self.chapters:
447
- c.expected_word_count = avg
448
- return self
449
-
450
- def avg_sec_wordcount[S: "ArticleBase"](self: S) -> S:
451
- """Set all sec have same word count sum up to be `self.expected_word_count`."""
452
- for c in self.chapters:
453
- avg = int(c.expected_word_count / len(c.sections))
454
- for s in c.sections:
455
- s.expected_word_count = avg
456
- return self
457
-
458
- def avg_subsec_wordcount[S: "ArticleBase"](self: S) -> S:
459
- """Set all subsec have same word count sum up to be `self.expected_word_count`."""
460
- for _, s in self.iter_sections():
461
- avg = int(s.expected_word_count / len(s.subsections))
462
- for ss in s.subsections:
463
- ss.expected_word_count = avg
464
- return self
465
-
466
- def avg_wordcount_recursive[S: "ArticleBase"](self: S) -> S:
467
- """Set all chap, sec, subsec have same word count sum up to be `self.expected_word_count`."""
468
- return self.avg_chap_wordcount().avg_sec_wordcount().avg_subsec_wordcount()
469
-
470
- def update_article_file[S: "ArticleBase"](self: S, file: str | Path) -> S:
471
- """Update the article file."""
472
- file = Path(file)
473
- string = safe_text_read(file)
474
- if updated := replace_thesis_body(string, ARTICLE_WRAPPER, f"\n\n{self.to_typst_code()}\n\n"):
475
- dump_text(file, updated)
476
- logger.success(f"Successfully updated {file.as_posix()}.")
477
- else:
478
- logger.warning(f"Failed to update {file.as_posix()}. Please make sure there are paired `{ARTICLE_WRAPPER}`")
479
- return self
480
-
481
- @classmethod
482
- def from_article_file[S: "ArticleBase"](cls: Type[S], file: str | Path, title: str = "") -> S:
483
- """Load article from file."""
484
- file = Path(file)
485
- string = safe_text_read(file)
486
- return cls.from_typst_code(
487
- title, ok(extract_body(string, ARTICLE_WRAPPER), "Failed to extract body from file.")
488
- )
@@ -1,98 +0,0 @@
1
- """ArticleEssence: Semantic fingerprint of academic paper for structured analysis."""
2
-
3
- from typing import List
4
-
5
- from fabricatio.models.extra.rag import MilvusDataBase
6
- from fabricatio.models.generic import PersistentAble, SketchedAble
7
- from pydantic import BaseModel
8
-
9
-
10
- class Equation(BaseModel):
11
- """Mathematical formalism specification for research contributions."""
12
-
13
- description: str
14
- """Structured significance including:
15
- 1. Conceptual meaning
16
- 2. Technical workflow role
17
- 3. Contribution relationship
18
- """
19
-
20
- latex_code: str
21
- """Typeset-ready notation."""
22
-
23
-
24
- class Figure(BaseModel):
25
- """Visual component with academic captioning."""
26
-
27
- description: str
28
- """Interpretation guide covering:
29
- 1. Visual element mapping
30
- 2. Data representation method
31
- 3. Research connection
32
- """
33
-
34
- figure_caption: str
35
- """Nature-style caption containing:
36
- 1. Overview statement
37
- 2. Technical details
38
- 3. Result implications
39
- """
40
-
41
- figure_serial_number: int
42
- """Image serial number extracted from Markdown path"""
43
-
44
-
45
- class Highlightings(BaseModel):
46
- """Technical component aggregator."""
47
-
48
- highlighted_equations: List[Equation]
49
- """Equations that highlight the article's core contributions"""
50
-
51
- highlighted_figures: List[Figure]
52
- """key figures requiring:
53
- 1. Framework overview
54
- 2. Quantitative results
55
- """
56
-
57
-
58
- class ArticleEssence(SketchedAble, PersistentAble, MilvusDataBase):
59
- """Structured representation of a scientific article's core elements in its original language."""
60
-
61
- language: str
62
- """Language of the original article."""
63
-
64
- title: str
65
- """Exact title of the original article."""
66
-
67
- authors: List[str]
68
- """Original author full names as they appear in the source document."""
69
-
70
- keywords: List[str]
71
- """Original keywords as they appear in the source document."""
72
-
73
- publication_year: int
74
- """Publication year in ISO 8601 (YYYY format)."""
75
-
76
- highlightings: Highlightings
77
- """Technical highlights including equations, algorithms, figures, and tables."""
78
-
79
- abstract: str
80
- """Abstract text in the original language."""
81
-
82
- core_contributions: List[str]
83
- """Technical contributions using CRediT taxonomy verbs."""
84
-
85
- technical_novelty: List[str]
86
- """Patent-style claims with technical specificity."""
87
-
88
- research_problems: List[str]
89
- """Problem statements as how/why questions."""
90
-
91
- limitations: List[str]
92
- """Technical limitations analysis."""
93
-
94
- bibtex_cite_key: str
95
- """Bibtex cite key of the original article."""
96
-
97
- def _prepare_vectorization_inner(self) -> str:
98
- return self.compact()