defuddle 0.11.0 → 0.13.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +49 -29
- package/dist/cli.js +15 -46
- package/dist/cli.js.map +1 -1
- package/dist/constants.d.ts +9 -0
- package/dist/constants.js +33 -9
- package/dist/constants.js.map +1 -1
- package/dist/defuddle.d.ts +50 -2
- package/dist/defuddle.js +615 -238
- package/dist/defuddle.js.map +1 -1
- package/dist/elements/code.js +31 -9
- package/dist/elements/code.js.map +1 -1
- package/dist/elements/footnotes.js +2 -1
- package/dist/elements/footnotes.js.map +1 -1
- package/dist/elements/headings.js +42 -50
- package/dist/elements/headings.js.map +1 -1
- package/dist/extractor-registry.d.ts +1 -0
- package/dist/extractor-registry.js +3 -0
- package/dist/extractor-registry.js.map +1 -1
- package/dist/extractors/_base.d.ts +6 -0
- package/dist/extractors/_base.js +8 -0
- package/dist/extractors/_base.js.map +1 -1
- package/dist/extractors/github.d.ts +10 -2
- package/dist/extractors/github.js +158 -71
- package/dist/extractors/github.js.map +1 -1
- package/dist/extractors/hackernews.js +18 -72
- package/dist/extractors/hackernews.js.map +1 -1
- package/dist/extractors/reddit.d.ts +1 -2
- package/dist/extractors/reddit.js +41 -94
- package/dist/extractors/reddit.js.map +1 -1
- package/dist/extractors/x-oembed.d.ts +0 -1
- package/dist/extractors/x-oembed.js +20 -27
- package/dist/extractors/x-oembed.js.map +1 -1
- package/dist/extractors/youtube.d.ts +57 -0
- package/dist/extractors/youtube.js +619 -10
- package/dist/extractors/youtube.js.map +1 -1
- package/dist/index.full.js +1 -1
- package/dist/index.js +1 -1
- package/dist/markdown.js +5 -0
- package/dist/markdown.js.map +1 -1
- package/dist/metadata.d.ts +5 -0
- package/dist/metadata.js +28 -0
- package/dist/metadata.js.map +1 -1
- package/dist/node.d.ts +12 -5
- package/dist/node.js +53 -22
- package/dist/node.js.map +1 -1
- package/dist/scoring.d.ts +6 -1
- package/dist/scoring.js +69 -22
- package/dist/scoring.js.map +1 -1
- package/dist/standardize.js +152 -63
- package/dist/standardize.js.map +1 -1
- package/dist/types.d.ts +9 -0
- package/dist/utils/comments.d.ts +44 -0
- package/dist/utils/comments.js +103 -0
- package/dist/utils/comments.js.map +1 -0
- package/dist/utils/dom.d.ts +9 -0
- package/dist/utils/dom.js +20 -0
- package/dist/utils/dom.js.map +1 -1
- package/dist/utils/linkedom-compat.d.ts +5 -0
- package/dist/utils/linkedom-compat.js +23 -0
- package/dist/utils/linkedom-compat.js.map +1 -0
- package/dist/utils/transcript.d.ts +37 -0
- package/dist/utils/transcript.js +61 -0
- package/dist/utils/transcript.js.map +1 -0
- package/dist/utils.d.ts +6 -0
- package/dist/utils.js +36 -0
- package/dist/utils.js.map +1 -1
- package/package.json +3 -4
|
@@ -10,6 +10,7 @@ export declare class ExtractorRegistry {
|
|
|
10
10
|
static register(mapping: ExtractorMapping): void;
|
|
11
11
|
static findExtractor(document: Document, url: string, schemaOrgData?: any): BaseExtractor | null;
|
|
12
12
|
static findAsyncExtractor(document: Document, url: string, schemaOrgData?: any): BaseExtractor | null;
|
|
13
|
+
static findPreferredAsyncExtractor(document: Document, url: string, schemaOrgData?: any): BaseExtractor | null;
|
|
13
14
|
private static findByPredicate;
|
|
14
15
|
}
|
|
15
16
|
export {};
|
|
@@ -105,6 +105,9 @@ class ExtractorRegistry {
|
|
|
105
105
|
static findAsyncExtractor(document, url, schemaOrgData) {
|
|
106
106
|
return this.findByPredicate(document, url, schemaOrgData, e => e.canExtractAsync());
|
|
107
107
|
}
|
|
108
|
+
static findPreferredAsyncExtractor(document, url, schemaOrgData) {
|
|
109
|
+
return this.findByPredicate(document, url, schemaOrgData, e => e.canExtractAsync() && e.prefersAsync());
|
|
110
|
+
}
|
|
108
111
|
static findByPredicate(document, url, schemaOrgData, predicate) {
|
|
109
112
|
try {
|
|
110
113
|
const domain = new URL(url).hostname;
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"extractor-registry.js","sourceRoot":"","sources":["../src/extractor-registry.ts"],"names":[],"mappings":";;;AAEA,aAAa;AACb,gDAAsD;AACtD,kDAAwD;AACxD,sDAA2D;AAC3D,kDAAwD;AACxD,wDAA8D;AAC9D,kDAAwD;AACxD,gDAAsD;AACtD,4CAAkD;AAClD,gDAAsD;AACtD,gDAAsD;AACtD,oDAAyD;AASzD,MAAa,iBAAiB;IAG7B,MAAM,CAAC,UAAU;QAChB,kDAAkD;QAClD,yEAAyE;QACzE,gEAAgE;QAChE,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,OAAO;gBACP,aAAa;aACb;YACD,SAAS,EAAE,6BAAiB;SAC5B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,aAAa;gBACb,cAAc;aACd;YACD,SAAS,EAAE,0BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,OAAO;gBACP,aAAa;aACb;YACD,SAAS,EAAE,2BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,YAAY;gBACZ,gBAAgB;gBAChB,gBAAgB;gBAChB,gCAAgC;aAChC;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,aAAa;gBACb,UAAU;gBACV,2BAA2B;gBAC3B,eAAe;aACf;YACD,SAAS,EAAE,0BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,qCAAqC;aACrC;YACD,SAAS,EAAE,gCAAmB;SAC9B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,yCAAyC;aACzC;YACD,SAAS,EAAE,0BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,WAAW;gBACX,0CAA0C;aAC1C;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,6CAA6C;aAC7C;YACD,SAAS,EAAE,oBAAa;SACxB,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,0CAA0C;aAC1C;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,YAAY;gBACZ,6BAA6B;aAC7B;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;IACJ,CAAC;IAED,MAAM,CAAC,QAAQ,CAAC,OAAyB;QACxC,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;IAC7B,CAAC;IAED,MAAM,CAAC,aAAa,CAAC,QAAkB,EAAE,GAAW,EAAE,aAAmB;QACxE,OAAO,IAAI,CAAC,eAAe,CAAC,QAAQ,EAAE,GAAG,EAAE,aAAa,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,UAAU,EAAE,CAAC,CAAC;IAChF,CAAC;IAED,MAAM,CAAC,kBAAkB,CAAC,QAAkB,EAAE,GAAW,EAAE,aAAmB;QAC7E,OAAO,IAAI,CAAC,eAAe,CAAC,QAAQ,EAAE,GAAG,EAAE,aAAa,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,eAAe,EAAE,CAAC,CAAC;IACrF,CAAC;IAEO,MAAM,CAAC,eAAe,CAC7B,QAAkB,EAAE,GAAW,EAAE,aAA8B,EAC/D,SAA+C;QAE/C,IAAI,CAAC;YACJ,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC,QAAQ,CAAC;YAErC,KAAK,MAAM,EAAE,QAAQ,EAAE,SAAS,EAAE,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;gBACrD,MAAM,OAAO,GAAG,QAAQ,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE;oBACvC,IAAI,OAAO,YAAY,MAAM,EAAE,CAAC;wBAC/B,OAAO,OAAO,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;oBAC1B,CAAC;oBACD,OAAO,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC;gBACjC,CAAC,CAAC,CAAC;gBAEH,IAAI,OAAO,EAAE,CAAC;oBACb,MAAM,QAAQ,GAAG,IAAI,SAAS,CAAC,QAAQ,EAAE,GAAG,EAAE,aAAa,CAAC,CAAC;oBAC7D,IAAI,SAAS,CAAC,QAAQ,CAAC,EAAE,CAAC;wBACzB,OAAO,QAAQ,CAAC;oBACjB,CAAC;gBACF,CAAC;YACF,CAAC;YAED,OAAO,IAAI,CAAC;QAEb,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YAChB,OAAO,CAAC,KAAK,CAAC,0BAA0B,EAAE,KAAK,CAAC,CAAC;YACjD,OAAO,IAAI,CAAC;QACb,CAAC;IACF,CAAC;;
|
|
1
|
+
{"version":3,"file":"extractor-registry.js","sourceRoot":"","sources":["../src/extractor-registry.ts"],"names":[],"mappings":";;;AAEA,aAAa;AACb,gDAAsD;AACtD,kDAAwD;AACxD,sDAA2D;AAC3D,kDAAwD;AACxD,wDAA8D;AAC9D,kDAAwD;AACxD,gDAAsD;AACtD,4CAAkD;AAClD,gDAAsD;AACtD,gDAAsD;AACtD,oDAAyD;AASzD,MAAa,iBAAiB;IAG7B,MAAM,CAAC,UAAU;QAChB,kDAAkD;QAClD,yEAAyE;QACzE,gEAAgE;QAChE,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,OAAO;gBACP,aAAa;aACb;YACD,SAAS,EAAE,6BAAiB;SAC5B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,aAAa;gBACb,cAAc;aACd;YACD,SAAS,EAAE,0BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,OAAO;gBACP,aAAa;aACb;YACD,SAAS,EAAE,2BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,YAAY;gBACZ,gBAAgB;gBAChB,gBAAgB;gBAChB,gCAAgC;aAChC;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,aAAa;gBACb,UAAU;gBACV,2BAA2B;gBAC3B,eAAe;aACf;YACD,SAAS,EAAE,0BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,qCAAqC;aACrC;YACD,SAAS,EAAE,gCAAmB;SAC9B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,yCAAyC;aACzC;YACD,SAAS,EAAE,0BAAgB;SAC3B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,WAAW;gBACX,0CAA0C;aAC1C;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,6CAA6C;aAC7C;YACD,SAAS,EAAE,oBAAa;SACxB,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,0CAA0C;aAC1C;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC;YACb,QAAQ,EAAE;gBACT,YAAY;gBACZ,6BAA6B;aAC7B;YACD,SAAS,EAAE,wBAAe;SAC1B,CAAC,CAAC;IACJ,CAAC;IAED,MAAM,CAAC,QAAQ,CAAC,OAAyB;QACxC,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;IAC7B,CAAC;IAED,MAAM,CAAC,aAAa,CAAC,QAAkB,EAAE,GAAW,EAAE,aAAmB;QACxE,OAAO,IAAI,CAAC,eAAe,CAAC,QAAQ,EAAE,GAAG,EAAE,aAAa,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,UAAU,EAAE,CAAC,CAAC;IAChF,CAAC;IAED,MAAM,CAAC,kBAAkB,CAAC,QAAkB,EAAE,GAAW,EAAE,aAAmB;QAC7E,OAAO,IAAI,CAAC,eAAe,CAAC,QAAQ,EAAE,GAAG,EAAE,aAAa,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,eAAe,EAAE,CAAC,CAAC;IACrF,CAAC;IAED,MAAM,CAAC,2BAA2B,CAAC,QAAkB,EAAE,GAAW,EAAE,aAAmB;QACtF,OAAO,IAAI,CAAC,eAAe,CAAC,QAAQ,EAAE,GAAG,EAAE,aAAa,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,eAAe,EAAE,IAAI,CAAC,CAAC,YAAY,EAAE,CAAC,CAAC;IACzG,CAAC;IAEO,MAAM,CAAC,eAAe,CAC7B,QAAkB,EAAE,GAAW,EAAE,aAA8B,EAC/D,SAA+C;QAE/C,IAAI,CAAC;YACJ,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC,QAAQ,CAAC;YAErC,KAAK,MAAM,EAAE,QAAQ,EAAE,SAAS,EAAE,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;gBACrD,MAAM,OAAO,GAAG,QAAQ,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE;oBACvC,IAAI,OAAO,YAAY,MAAM,EAAE,CAAC;wBAC/B,OAAO,OAAO,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;oBAC1B,CAAC;oBACD,OAAO,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC;gBACjC,CAAC,CAAC,CAAC;gBAEH,IAAI,OAAO,EAAE,CAAC;oBACb,MAAM,QAAQ,GAAG,IAAI,SAAS,CAAC,QAAQ,EAAE,GAAG,EAAE,aAAa,CAAC,CAAC;oBAC7D,IAAI,SAAS,CAAC,QAAQ,CAAC,EAAE,CAAC;wBACzB,OAAO,QAAQ,CAAC;oBACjB,CAAC;gBACF,CAAC;YACF,CAAC;YAED,OAAO,IAAI,CAAC;QAEb,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YAChB,OAAO,CAAC,KAAK,CAAC,0BAA0B,EAAE,KAAK,CAAC,CAAC;YACjD,OAAO,IAAI,CAAC;QACb,CAAC;IACF,CAAC;;AA7IF,8CA8IC;AA7Ie,0BAAQ,GAAuB,EAAE,CAAC;AA+IlD,wBAAwB;AACxB,iBAAiB,CAAC,UAAU,EAAE,CAAC"}
|
|
@@ -7,5 +7,11 @@ export declare abstract class BaseExtractor {
|
|
|
7
7
|
abstract canExtract(): boolean;
|
|
8
8
|
abstract extract(): ExtractorResult;
|
|
9
9
|
canExtractAsync(): boolean;
|
|
10
|
+
/**
|
|
11
|
+
* When true, parseAsync() will prefer extractAsync() over extract(),
|
|
12
|
+
* even if sync extraction produces content. Use this when the async
|
|
13
|
+
* path provides strictly better results (e.g. YouTube transcripts).
|
|
14
|
+
*/
|
|
15
|
+
prefersAsync(): boolean;
|
|
10
16
|
extractAsync(): Promise<ExtractorResult>;
|
|
11
17
|
}
|
package/dist/extractors/_base.js
CHANGED
|
@@ -10,6 +10,14 @@ class BaseExtractor {
|
|
|
10
10
|
canExtractAsync() {
|
|
11
11
|
return false;
|
|
12
12
|
}
|
|
13
|
+
/**
|
|
14
|
+
* When true, parseAsync() will prefer extractAsync() over extract(),
|
|
15
|
+
* even if sync extraction produces content. Use this when the async
|
|
16
|
+
* path provides strictly better results (e.g. YouTube transcripts).
|
|
17
|
+
*/
|
|
18
|
+
prefersAsync() {
|
|
19
|
+
return false;
|
|
20
|
+
}
|
|
13
21
|
async extractAsync() {
|
|
14
22
|
return this.extract();
|
|
15
23
|
}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"_base.js","sourceRoot":"","sources":["../../src/extractors/_base.ts"],"names":[],"mappings":";;;AAEA,MAAsB,aAAa;IAKlC,YAAY,QAAkB,EAAE,GAAW,EAAE,aAAmB;QAC/D,IAAI,CAAC,QAAQ,GAAG,QAAQ,CAAC;QACzB,IAAI,CAAC,GAAG,GAAG,GAAG,CAAC;QACf,IAAI,CAAC,aAAa,GAAG,aAAa,CAAC;IACpC,CAAC;IAKD,eAAe;QACd,OAAO,KAAK,CAAC;IACd,CAAC;IAED,KAAK,CAAC,YAAY;QACjB,OAAO,IAAI,CAAC,OAAO,EAAE,CAAC;IACvB,CAAC;CACD;
|
|
1
|
+
{"version":3,"file":"_base.js","sourceRoot":"","sources":["../../src/extractors/_base.ts"],"names":[],"mappings":";;;AAEA,MAAsB,aAAa;IAKlC,YAAY,QAAkB,EAAE,GAAW,EAAE,aAAmB;QAC/D,IAAI,CAAC,QAAQ,GAAG,QAAQ,CAAC;QACzB,IAAI,CAAC,GAAG,GAAG,GAAG,CAAC;QACf,IAAI,CAAC,aAAa,GAAG,aAAa,CAAC;IACpC,CAAC;IAKD,eAAe;QACd,OAAO,KAAK,CAAC;IACd,CAAC;IAED;;;;OAIG;IACH,YAAY;QACX,OAAO,KAAK,CAAC;IACd,CAAC;IAED,KAAK,CAAC,YAAY;QACjB,OAAO,IAAI,CAAC,OAAO,EAAE,CAAC;IACvB,CAAC;CACD;AA9BD,sCA8BC"}
|
|
@@ -1,12 +1,20 @@
|
|
|
1
1
|
import { BaseExtractor } from './_base';
|
|
2
2
|
import { ExtractorResult } from '../types/extractors';
|
|
3
3
|
export declare class GitHubExtractor extends BaseExtractor {
|
|
4
|
+
private isIssue;
|
|
5
|
+
private isPR;
|
|
6
|
+
constructor(document: Document, url: string);
|
|
4
7
|
canExtract(): boolean;
|
|
5
8
|
extract(): ExtractorResult;
|
|
6
|
-
private
|
|
9
|
+
private createContentHtml;
|
|
10
|
+
private getIssueContent;
|
|
11
|
+
private extractComments;
|
|
12
|
+
private getPRBody;
|
|
13
|
+
private getPRContent;
|
|
14
|
+
private extractPRComments;
|
|
7
15
|
private extractAuthor;
|
|
8
16
|
private cleanBodyContent;
|
|
9
|
-
private
|
|
17
|
+
private extractNumber;
|
|
10
18
|
private extractRepoInfo;
|
|
11
19
|
private createDescription;
|
|
12
20
|
}
|
|
@@ -3,7 +3,13 @@ Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
3
3
|
exports.GitHubExtractor = void 0;
|
|
4
4
|
const _base_1 = require("./_base");
|
|
5
5
|
const dom_1 = require("../utils/dom");
|
|
6
|
+
const comments_1 = require("../utils/comments");
|
|
6
7
|
class GitHubExtractor extends _base_1.BaseExtractor {
|
|
8
|
+
constructor(document, url) {
|
|
9
|
+
super(document, url);
|
|
10
|
+
this.isIssue = /\/issues\/\d+/.test(url);
|
|
11
|
+
this.isPR = /\/pull\/\d+/.test(url);
|
|
12
|
+
}
|
|
7
13
|
canExtract() {
|
|
8
14
|
const githubIndicators = [
|
|
9
15
|
'meta[name="expected-hostname"][content="github.com"]',
|
|
@@ -12,57 +18,88 @@ class GitHubExtractor extends _base_1.BaseExtractor {
|
|
|
12
18
|
'.js-header-wrapper',
|
|
13
19
|
'#js-repo-pjax-container',
|
|
14
20
|
];
|
|
15
|
-
|
|
16
|
-
|
|
21
|
+
if (!githubIndicators.some(selector => this.document.querySelector(selector) !== null)) {
|
|
22
|
+
return false;
|
|
23
|
+
}
|
|
24
|
+
if (this.isIssue) {
|
|
25
|
+
return [
|
|
17
26
|
'[data-testid="issue-metadata-sticky"]',
|
|
18
27
|
'[data-testid="issue-title"]',
|
|
19
|
-
]
|
|
20
|
-
}
|
|
21
|
-
|
|
22
|
-
|
|
28
|
+
].some(selector => this.document.querySelector(selector) !== null);
|
|
29
|
+
}
|
|
30
|
+
if (this.isPR) {
|
|
31
|
+
return [
|
|
32
|
+
'.pull-discussion-timeline',
|
|
33
|
+
'.discussion-timeline',
|
|
34
|
+
'.gh-header-title',
|
|
35
|
+
'.js-issue-title',
|
|
36
|
+
].some(selector => this.document.querySelector(selector) !== null);
|
|
37
|
+
}
|
|
38
|
+
return false;
|
|
23
39
|
}
|
|
24
40
|
extract() {
|
|
25
|
-
return this.extractIssue();
|
|
26
|
-
}
|
|
27
|
-
extractIssue() {
|
|
28
41
|
const repoInfo = this.extractRepoInfo();
|
|
29
|
-
const
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
const
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
42
|
+
const number = this.extractNumber();
|
|
43
|
+
const type = this.isPR ? 'pull' : 'issue';
|
|
44
|
+
const prBody = this.isPR ? this.getPRBody() : null;
|
|
45
|
+
const { content: postContent, author, published } = this.isPR
|
|
46
|
+
? this.getPRContent(prBody)
|
|
47
|
+
: this.getIssueContent();
|
|
48
|
+
const comments = this.isPR
|
|
49
|
+
? this.extractPRComments(prBody)
|
|
50
|
+
: this.extractComments();
|
|
51
|
+
const contentHtml = this.createContentHtml(postContent, comments);
|
|
52
|
+
return {
|
|
53
|
+
content: contentHtml,
|
|
54
|
+
contentHtml: contentHtml,
|
|
55
|
+
extractedContent: {
|
|
56
|
+
type,
|
|
57
|
+
number,
|
|
58
|
+
repository: repoInfo.repo,
|
|
59
|
+
owner: repoInfo.owner,
|
|
60
|
+
},
|
|
61
|
+
variables: {
|
|
62
|
+
title: this.document.title,
|
|
63
|
+
author,
|
|
64
|
+
published,
|
|
65
|
+
site: `GitHub - ${repoInfo.owner}/${repoInfo.repo}`,
|
|
66
|
+
description: this.createDescription(contentHtml),
|
|
54
67
|
}
|
|
55
|
-
}
|
|
56
|
-
|
|
68
|
+
};
|
|
69
|
+
}
|
|
70
|
+
createContentHtml(postContent, comments) {
|
|
71
|
+
return (0, comments_1.buildContentHtml)('github', postContent, comments);
|
|
72
|
+
}
|
|
73
|
+
getIssueContent() {
|
|
74
|
+
const issueContainer = this.document.querySelector('[data-testid="issue-viewer-issue-container"]');
|
|
75
|
+
if (!issueContainer)
|
|
76
|
+
return { content: '', author: '', published: '' };
|
|
77
|
+
const author = this.extractAuthor(issueContainer, [
|
|
78
|
+
'a[data-testid="issue-body-header-author"]',
|
|
79
|
+
'.IssueBodyHeaderAuthor-module__authorLoginLink--_S7aT',
|
|
80
|
+
'.ActivityHeader-module__AuthorLink--iofTU',
|
|
81
|
+
'a[href*="/users/"][data-hovercard-url*="/users/"]',
|
|
82
|
+
'a[aria-label*="profile"]'
|
|
83
|
+
]);
|
|
84
|
+
const issueTimeElement = issueContainer.querySelector('relative-time');
|
|
85
|
+
const published = issueTimeElement?.getAttribute('datetime') || '';
|
|
86
|
+
const issueBodyElement = issueContainer.querySelector('[data-testid="issue-body-viewer"] .markdown-body');
|
|
87
|
+
if (!issueBodyElement)
|
|
88
|
+
return { content: '', author, published };
|
|
89
|
+
const content = this.cleanBodyContent(issueBodyElement);
|
|
90
|
+
return { content, author, published };
|
|
91
|
+
}
|
|
92
|
+
extractComments() {
|
|
57
93
|
const commentElements = Array.from(this.document.querySelectorAll('[data-wrapper-timeline-id]'));
|
|
58
94
|
const processedComments = new Set();
|
|
59
|
-
|
|
95
|
+
const commentData = [];
|
|
96
|
+
for (const commentElement of commentElements) {
|
|
60
97
|
const commentContainer = commentElement.querySelector('.react-issue-comment');
|
|
61
98
|
if (!commentContainer)
|
|
62
|
-
|
|
99
|
+
continue;
|
|
63
100
|
const commentId = commentElement.getAttribute('data-wrapper-timeline-id');
|
|
64
101
|
if (!commentId || processedComments.has(commentId))
|
|
65
|
-
|
|
102
|
+
continue;
|
|
66
103
|
processedComments.add(commentId);
|
|
67
104
|
const author = this.extractAuthor(commentContainer, [
|
|
68
105
|
'.ActivityHeader-module__AuthorLink--iofTU',
|
|
@@ -71,38 +108,64 @@ class GitHubExtractor extends _base_1.BaseExtractor {
|
|
|
71
108
|
]);
|
|
72
109
|
const timeElement = commentContainer.querySelector('relative-time');
|
|
73
110
|
const timestamp = timeElement?.getAttribute('datetime') || '';
|
|
111
|
+
const date = timestamp ? new Date(timestamp).toISOString().split('T')[0] : '';
|
|
74
112
|
const bodyElement = commentContainer.querySelector('.markdown-body');
|
|
75
|
-
if (bodyElement)
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
return
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
113
|
+
if (!bodyElement)
|
|
114
|
+
continue;
|
|
115
|
+
const bodyContent = this.cleanBodyContent(bodyElement);
|
|
116
|
+
if (!bodyContent)
|
|
117
|
+
continue;
|
|
118
|
+
commentData.push({
|
|
119
|
+
author,
|
|
120
|
+
date,
|
|
121
|
+
content: bodyContent,
|
|
122
|
+
});
|
|
123
|
+
}
|
|
124
|
+
return (0, comments_1.buildCommentTree)(commentData);
|
|
125
|
+
}
|
|
126
|
+
getPRBody() {
|
|
127
|
+
// PR body is in [id^="pullrequest-"] or the first .timeline-comment
|
|
128
|
+
return this.document.querySelector('[id^="pullrequest-"]')
|
|
129
|
+
|| this.document.querySelector('.timeline-comment');
|
|
130
|
+
}
|
|
131
|
+
getPRContent(prBody) {
|
|
132
|
+
const bodyEl = prBody?.querySelector('.comment-body.markdown-body')
|
|
133
|
+
|| this.document.querySelector('.comment-body.markdown-body');
|
|
134
|
+
const content = bodyEl ? this.cleanBodyContent(bodyEl) : '';
|
|
135
|
+
const authorEl = prBody?.querySelector('.author')
|
|
136
|
+
|| this.document.querySelector('.gh-header-meta .author');
|
|
137
|
+
const author = authorEl?.textContent?.trim() || '';
|
|
138
|
+
const timeEl = prBody?.querySelector('relative-time');
|
|
139
|
+
const published = timeEl?.getAttribute('datetime') || '';
|
|
140
|
+
return { content, author, published };
|
|
141
|
+
}
|
|
142
|
+
extractPRComments(prBody) {
|
|
143
|
+
// Find all comment containers: regular comments (.timeline-comment)
|
|
144
|
+
// and code review comments (.review-comment)
|
|
145
|
+
const allComments = Array.from(this.document.querySelectorAll('.timeline-comment, .review-comment'));
|
|
146
|
+
const commentData = [];
|
|
147
|
+
for (const comment of allComments) {
|
|
148
|
+
// Skip the PR description
|
|
149
|
+
if (prBody && (comment === prBody || prBody.contains(comment)))
|
|
150
|
+
continue;
|
|
151
|
+
const authorEl = comment.querySelector('.author');
|
|
152
|
+
const author = authorEl?.textContent?.trim() || '';
|
|
153
|
+
const timeEl = comment.querySelector('relative-time');
|
|
154
|
+
const timestamp = timeEl?.getAttribute('datetime') || '';
|
|
155
|
+
const date = timestamp ? new Date(timestamp).toISOString().split('T')[0] : '';
|
|
156
|
+
const bodyEl = comment.querySelector('.comment-body.markdown-body');
|
|
157
|
+
if (!bodyEl)
|
|
158
|
+
continue;
|
|
159
|
+
const bodyContent = this.cleanBodyContent(bodyEl);
|
|
160
|
+
if (!bodyContent)
|
|
161
|
+
continue;
|
|
162
|
+
commentData.push({
|
|
163
|
+
author,
|
|
164
|
+
date,
|
|
165
|
+
content: bodyContent,
|
|
166
|
+
});
|
|
167
|
+
}
|
|
168
|
+
return (0, comments_1.buildCommentTree)(commentData);
|
|
106
169
|
}
|
|
107
170
|
extractAuthor(container, selectors) {
|
|
108
171
|
for (const selector of selectors) {
|
|
@@ -128,9 +191,33 @@ class GitHubExtractor extends _base_1.BaseExtractor {
|
|
|
128
191
|
const cleanBody = bodyElement.cloneNode(true);
|
|
129
192
|
cleanBody.querySelectorAll('button, [data-testid*="button"], [data-testid*="menu"]').forEach(el => el.remove());
|
|
130
193
|
cleanBody.querySelectorAll('.js-clipboard-copy, .zeroclipboard-container').forEach(el => el.remove());
|
|
194
|
+
// Convert GitHub's highlighted code blocks to standard <pre><code>
|
|
195
|
+
// GitHub uses <div class="highlight highlight-source-{lang}"><pre>spans...</pre></div>
|
|
196
|
+
// The <pre> has no <code> child, which breaks markdown conversion.
|
|
197
|
+
cleanBody.querySelectorAll('div.highlight[class*="highlight-source-"] pre, div.highlight pre').forEach(pre => {
|
|
198
|
+
const wrapper = pre.parentElement;
|
|
199
|
+
if (!wrapper)
|
|
200
|
+
return;
|
|
201
|
+
// Extract language from wrapper class (e.g. "highlight-source-ts")
|
|
202
|
+
const langMatch = wrapper.className.match(/highlight-source-(\w+)/);
|
|
203
|
+
const lang = langMatch?.[1] || '';
|
|
204
|
+
// Use data-snippet-clipboard-copy-content if available (clean text),
|
|
205
|
+
// otherwise fall back to textContent
|
|
206
|
+
const content = wrapper.getAttribute('data-snippet-clipboard-copy-content')
|
|
207
|
+
|| pre.textContent || '';
|
|
208
|
+
const code = this.document.createElement('code');
|
|
209
|
+
if (lang) {
|
|
210
|
+
code.setAttribute('class', `language-${lang}`);
|
|
211
|
+
code.setAttribute('data-lang', lang);
|
|
212
|
+
}
|
|
213
|
+
code.textContent = content;
|
|
214
|
+
const newPre = this.document.createElement('pre');
|
|
215
|
+
newPre.appendChild(code);
|
|
216
|
+
wrapper.replaceWith(newPre);
|
|
217
|
+
});
|
|
131
218
|
return (0, dom_1.serializeHTML)(cleanBody).trim();
|
|
132
219
|
}
|
|
133
|
-
|
|
220
|
+
extractNumber() {
|
|
134
221
|
// Try URL first (most reliable)
|
|
135
222
|
const urlMatch = this.url.match(/\/(issues|pull)\/(\d+)/);
|
|
136
223
|
if (urlMatch)
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"github.js","sourceRoot":"","sources":["../../src/extractors/github.ts"],"names":[],"mappings":";;;AAAA,mCAAwC;AAExC,sCAAwD;
|
|
1
|
+
{"version":3,"file":"github.js","sourceRoot":"","sources":["../../src/extractors/github.ts"],"names":[],"mappings":";;;AAAA,mCAAwC;AAExC,sCAAwD;AACxD,gDAAyF;AAEzF,MAAa,eAAgB,SAAQ,qBAAa;IAIjD,YAAY,QAAkB,EAAE,GAAW;QAC1C,KAAK,CAAC,QAAQ,EAAE,GAAG,CAAC,CAAC;QACrB,IAAI,CAAC,OAAO,GAAG,eAAe,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;QACzC,IAAI,CAAC,IAAI,GAAG,aAAa,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;IACrC,CAAC;IAED,UAAU;QACT,MAAM,gBAAgB,GAAG;YACxB,sDAAsD;YACtD,6BAA6B;YAC7B,wCAAwC;YACxC,oBAAoB;YACpB,yBAAyB;SACzB,CAAC;QAEF,IAAI,CAAC,gBAAgB,CAAC,IAAI,CAAC,QAAQ,CAAC,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,QAAQ,CAAC,KAAK,IAAI,CAAC,EAAE,CAAC;YACxF,OAAO,KAAK,CAAC;QACd,CAAC;QAED,IAAI,IAAI,CAAC,OAAO,EAAE,CAAC;YAClB,OAAO;gBACN,uCAAuC;gBACvC,6BAA6B;aAC7B,CAAC,IAAI,CAAC,QAAQ,CAAC,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,QAAQ,CAAC,KAAK,IAAI,CAAC,CAAC;QACpE,CAAC;QAED,IAAI,IAAI,CAAC,IAAI,EAAE,CAAC;YACf,OAAO;gBACN,2BAA2B;gBAC3B,sBAAsB;gBACtB,kBAAkB;gBAClB,iBAAiB;aACjB,CAAC,IAAI,CAAC,QAAQ,CAAC,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,QAAQ,CAAC,KAAK,IAAI,CAAC,CAAC;QACpE,CAAC;QAED,OAAO,KAAK,CAAC;IACd,CAAC;IAED,OAAO;QACN,MAAM,QAAQ,GAAG,IAAI,CAAC,eAAe,EAAE,CAAC;QACxC,MAAM,MAAM,GAAG,IAAI,CAAC,aAAa,EAAE,CAAC;QACpC,MAAM,IAAI,GAAG,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,OAAO,CAAC;QAE1C,MAAM,MAAM,GAAG,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC,IAAI,CAAC,SAAS,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;QACnD,MAAM,EAAE,OAAO,EAAE,WAAW,EAAE,MAAM,EAAE,SAAS,EAAE,GAAG,IAAI,CAAC,IAAI;YAC5D,CAAC,CAAC,IAAI,CAAC,YAAY,CAAC,MAAM,CAAC;YAC3B,CAAC,CAAC,IAAI,CAAC,eAAe,EAAE,CAAC;QAC1B,MAAM,QAAQ,GAAG,IAAI,CAAC,IAAI;YACzB,CAAC,CAAC,IAAI,CAAC,iBAAiB,CAAC,MAAM,CAAC;YAChC,CAAC,CAAC,IAAI,CAAC,eAAe,EAAE,CAAC;QAC1B,MAAM,WAAW,GAAG,IAAI,CAAC,iBAAiB,CAAC,WAAW,EAAE,QAAQ,CAAC,CAAC;QAElE,OAAO;YACN,OAAO,EAAE,WAAW;YACpB,WAAW,EAAE,WAAW;YACxB,gBAAgB,EAAE;gBACjB,IAAI;gBACJ,MAAM;gBACN,UAAU,EAAE,QAAQ,CAAC,IAAI;gBACzB,KAAK,EAAE,QAAQ,CAAC,KAAK;aACrB;YACD,SAAS,EAAE;gBACV,KAAK,EAAE,IAAI,CAAC,QAAQ,CAAC,KAAK;gBAC1B,MAAM;gBACN,SAAS;gBACT,IAAI,EAAE,YAAY,QAAQ,CAAC,KAAK,IAAI,QAAQ,CAAC,IAAI,EAAE;gBACnD,WAAW,EAAE,IAAI,CAAC,iBAAiB,CAAC,WAAW,CAAC;aAChD;SACD,CAAC;IACH,CAAC;IAEO,iBAAiB,CAAC,WAAmB,EAAE,QAAgB;QAC9D,OAAO,IAAA,2BAAgB,EAAC,QAAQ,EAAE,WAAW,EAAE,QAAQ,CAAC,CAAC;IAC1D,CAAC;IAEO,eAAe;QACtB,MAAM,cAAc,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,8CAA8C,CAAC,CAAC;QACnG,IAAI,CAAC,cAAc;YAAE,OAAO,EAAE,OAAO,EAAE,EAAE,EAAE,MAAM,EAAE,EAAE,EAAE,SAAS,EAAE,EAAE,EAAE,CAAC;QAEvE,MAAM,MAAM,GAAG,IAAI,CAAC,aAAa,CAAC,cAAc,EAAE;YACjD,2CAA2C;YAC3C,uDAAuD;YACvD,2CAA2C;YAC3C,mDAAmD;YACnD,0BAA0B;SAC1B,CAAC,CAAC;QAEH,MAAM,gBAAgB,GAAG,cAAc,CAAC,aAAa,CAAC,eAAe,CAAC,CAAC;QACvE,MAAM,SAAS,GAAG,gBAAgB,EAAE,YAAY,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;QAEnE,MAAM,gBAAgB,GAAG,cAAc,CAAC,aAAa,CAAC,kDAAkD,CAAC,CAAC;QAC1G,IAAI,CAAC,gBAAgB;YAAE,OAAO,EAAE,OAAO,EAAE,EAAE,EAAE,MAAM,EAAE,SAAS,EAAE,CAAC;QAEjE,MAAM,OAAO,GAAG,IAAI,CAAC,gBAAgB,CAAC,gBAAgB,CAAC,CAAC;QAExD,OAAO,EAAE,OAAO,EAAE,MAAM,EAAE,SAAS,EAAE,CAAC;IACvC,CAAC;IAEO,eAAe;QACtB,MAAM,eAAe,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,gBAAgB,CAAC,4BAA4B,CAAC,CAAC,CAAC;QACjG,MAAM,iBAAiB,GAAG,IAAI,GAAG,EAAU,CAAC;QAC5C,MAAM,WAAW,GAAkB,EAAE,CAAC;QAEtC,KAAK,MAAM,cAAc,IAAI,eAAe,EAAE,CAAC;YAC9C,MAAM,gBAAgB,GAAG,cAAc,CAAC,aAAa,CAAC,sBAAsB,CAAC,CAAC;YAC9E,IAAI,CAAC,gBAAgB;gBAAE,SAAS;YAEhC,MAAM,SAAS,GAAG,cAAc,CAAC,YAAY,CAAC,0BAA0B,CAAC,CAAC;YAC1E,IAAI,CAAC,SAAS,IAAI,iBAAiB,CAAC,GAAG,CAAC,SAAS,CAAC;gBAAE,SAAS;YAC7D,iBAAiB,CAAC,GAAG,CAAC,SAAS,CAAC,CAAC;YAEjC,MAAM,MAAM,GAAG,IAAI,CAAC,aAAa,CAAC,gBAAgB,EAAE;gBACnD,2CAA2C;gBAC3C,8BAA8B;gBAC9B,6CAA6C;aAC7C,CAAC,CAAC;YAEH,MAAM,WAAW,GAAG,gBAAgB,CAAC,aAAa,CAAC,eAAe,CAAC,CAAC;YACpE,MAAM,SAAS,GAAG,WAAW,EAAE,YAAY,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;YAC9D,MAAM,IAAI,GAAG,SAAS,CAAC,CAAC,CAAC,IAAI,IAAI,CAAC,SAAS,CAAC,CAAC,WAAW,EAAE,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;YAE9E,MAAM,WAAW,GAAG,gBAAgB,CAAC,aAAa,CAAC,gBAAgB,CAAC,CAAC;YACrE,IAAI,CAAC,WAAW;gBAAE,SAAS;YAE3B,MAAM,WAAW,GAAG,IAAI,CAAC,gBAAgB,CAAC,WAAW,CAAC,CAAC;YACvD,IAAI,CAAC,WAAW;gBAAE,SAAS;YAE3B,WAAW,CAAC,IAAI,CAAC;gBAChB,MAAM;gBACN,IAAI;gBACJ,OAAO,EAAE,WAAW;aACpB,CAAC,CAAC;QACJ,CAAC;QAED,OAAO,IAAA,2BAAgB,EAAC,WAAW,CAAC,CAAC;IACtC,CAAC;IAEO,SAAS;QAChB,oEAAoE;QACpE,OAAO,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,sBAAsB,CAAC;eACtD,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,mBAAmB,CAAC,CAAC;IACtD,CAAC;IAEO,YAAY,CAAC,MAAsB;QAE1C,MAAM,MAAM,GAAG,MAAM,EAAE,aAAa,CAAC,6BAA6B,CAAC;eAC/D,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,6BAA6B,CAAC,CAAC;QAC/D,MAAM,OAAO,GAAG,MAAM,CAAC,CAAC,CAAC,IAAI,CAAC,gBAAgB,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;QAE5D,MAAM,QAAQ,GAAG,MAAM,EAAE,aAAa,CAAC,SAAS,CAAC;eAC7C,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,yBAAyB,CAAC,CAAC;QAC3D,MAAM,MAAM,GAAG,QAAQ,EAAE,WAAW,EAAE,IAAI,EAAE,IAAI,EAAE,CAAC;QAEnD,MAAM,MAAM,GAAG,MAAM,EAAE,aAAa,CAAC,eAAe,CAAC,CAAC;QACtD,MAAM,SAAS,GAAG,MAAM,EAAE,YAAY,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;QAEzD,OAAO,EAAE,OAAO,EAAE,MAAM,EAAE,SAAS,EAAE,CAAC;IACvC,CAAC;IAEO,iBAAiB,CAAC,MAAsB;QAC/C,oEAAoE;QACpE,6CAA6C;QAC7C,MAAM,WAAW,GAAG,KAAK,CAAC,IAAI,CAC7B,IAAI,CAAC,QAAQ,CAAC,gBAAgB,CAAC,oCAAoC,CAAC,CACpE,CAAC;QACF,MAAM,WAAW,GAAkB,EAAE,CAAC;QAEtC,KAAK,MAAM,OAAO,IAAI,WAAW,EAAE,CAAC;YACnC,0BAA0B;YAC1B,IAAI,MAAM,IAAI,CAAC,OAAO,KAAK,MAAM,IAAI,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC;gBAAE,SAAS;YAEzE,MAAM,QAAQ,GAAG,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;YAClD,MAAM,MAAM,GAAG,QAAQ,EAAE,WAAW,EAAE,IAAI,EAAE,IAAI,EAAE,CAAC;YAEnD,MAAM,MAAM,GAAG,OAAO,CAAC,aAAa,CAAC,eAAe,CAAC,CAAC;YACtD,MAAM,SAAS,GAAG,MAAM,EAAE,YAAY,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;YACzD,MAAM,IAAI,GAAG,SAAS,CAAC,CAAC,CAAC,IAAI,IAAI,CAAC,SAAS,CAAC,CAAC,WAAW,EAAE,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;YAE9E,MAAM,MAAM,GAAG,OAAO,CAAC,aAAa,CAAC,6BAA6B,CAAC,CAAC;YACpE,IAAI,CAAC,MAAM;gBAAE,SAAS;YAEtB,MAAM,WAAW,GAAG,IAAI,CAAC,gBAAgB,CAAC,MAAM,CAAC,CAAC;YAClD,IAAI,CAAC,WAAW;gBAAE,SAAS;YAE3B,WAAW,CAAC,IAAI,CAAC;gBAChB,MAAM;gBACN,IAAI;gBACJ,OAAO,EAAE,WAAW;aACpB,CAAC,CAAC;QACJ,CAAC;QAED,OAAO,IAAA,2BAAgB,EAAC,WAAW,CAAC,CAAC;IACtC,CAAC;IAEO,aAAa,CAAC,SAAkB,EAAE,SAAmB;QAC5D,KAAK,MAAM,QAAQ,IAAI,SAAS,EAAE,CAAC;YAClC,MAAM,UAAU,GAAG,SAAS,CAAC,aAAa,CAAC,QAAQ,CAAC,CAAC;YACrD,IAAI,UAAU,EAAE,CAAC;gBAChB,MAAM,IAAI,GAAG,UAAU,CAAC,YAAY,CAAC,MAAM,CAAC,CAAC;gBAC7C,IAAI,IAAI,EAAE,CAAC;oBACV,IAAI,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,EAAE,CAAC;wBAC1B,OAAO,IAAI,CAAC,SAAS,CAAC,CAAC,CAAC,CAAC;oBAC1B,CAAC;yBAAM,IAAI,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,EAAE,CAAC;wBACzC,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,0BAA0B,CAAC,CAAC;wBACrD,IAAI,KAAK,IAAI,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC;4BACvB,OAAO,KAAK,CAAC,CAAC,CAAC,CAAC;wBACjB,CAAC;oBACF,CAAC;gBACF,CAAC;YACF,CAAC;QACF,CAAC;QACD,OAAO,SAAS,CAAC;IAClB,CAAC;IAEO,gBAAgB,CAAC,WAAoB;QAC5C,MAAM,SAAS,GAAG,WAAW,CAAC,SAAS,CAAC,IAAI,CAAY,CAAC;QACzD,SAAS,CAAC,gBAAgB,CAAC,wDAAwD,CAAC,CAAC,OAAO,CAAC,EAAE,CAAC,EAAE,CAAC,EAAE,CAAC,MAAM,EAAE,CAAC,CAAC;QAChH,SAAS,CAAC,gBAAgB,CAAC,8CAA8C,CAAC,CAAC,OAAO,CAAC,EAAE,CAAC,EAAE,CAAC,EAAE,CAAC,MAAM,EAAE,CAAC,CAAC;QAEtG,mEAAmE;QACnE,uFAAuF;QACvF,mEAAmE;QACnE,SAAS,CAAC,gBAAgB,CAAC,kEAAkE,CAAC,CAAC,OAAO,CAAC,GAAG,CAAC,EAAE;YAC5G,MAAM,OAAO,GAAG,GAAG,CAAC,aAAa,CAAC;YAClC,IAAI,CAAC,OAAO;gBAAE,OAAO;YAErB,mEAAmE;YACnE,MAAM,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC,KAAK,CAAC,wBAAwB,CAAC,CAAC;YACpE,MAAM,IAAI,GAAG,SAAS,EAAE,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;YAElC,qEAAqE;YACrE,qCAAqC;YACrC,MAAM,OAAO,GAAG,OAAO,CAAC,YAAY,CAAC,qCAAqC,CAAC;mBACvE,GAAG,CAAC,WAAW,IAAI,EAAE,CAAC;YAE1B,MAAM,IAAI,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;YACjD,IAAI,IAAI,EAAE,CAAC;gBACV,IAAI,CAAC,YAAY,CAAC,OAAO,EAAE,YAAY,IAAI,EAAE,CAAC,CAAC;gBAC/C,IAAI,CAAC,YAAY,CAAC,WAAW,EAAE,IAAI,CAAC,CAAC;YACtC,CAAC;YACD,IAAI,CAAC,WAAW,GAAG,OAAO,CAAC;YAE3B,MAAM,MAAM,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,KAAK,CAAC,CAAC;YAClD,MAAM,CAAC,WAAW,CAAC,IAAI,CAAC,CAAC;YACzB,OAAO,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;QAC7B,CAAC,CAAC,CAAC;QAEH,OAAO,IAAA,mBAAa,EAAC,SAAS,CAAC,CAAC,IAAI,EAAE,CAAC;IACxC,CAAC;IAEO,aAAa;QACpB,gCAAgC;QAChC,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC,KAAK,CAAC,wBAAwB,CAAC,CAAC;QAC1D,IAAI,QAAQ;YAAE,OAAO,QAAQ,CAAC,CAAC,CAAC,CAAC;QAEjC,8BAA8B;QAC9B,MAAM,YAAY,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,IAAI,CAAC,CAAC;QACvD,MAAM,UAAU,GAAG,YAAY,EAAE,WAAW,EAAE,KAAK,CAAC,QAAQ,CAAC,CAAC;QAC9D,OAAO,UAAU,CAAC,CAAC,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;IACxC,CAAC;IAEO,eAAe;QACtB,gCAAgC;QAChC,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC,KAAK,CAAC,iCAAiC,CAAC,CAAC;QACnE,IAAI,QAAQ,EAAE,CAAC;YACd,OAAO,EAAE,KAAK,EAAE,QAAQ,CAAC,CAAC,CAAC,EAAE,IAAI,EAAE,QAAQ,CAAC,CAAC,CAAC,EAAE,CAAC;QAClD,CAAC;QAED,8BAA8B;QAC9B,MAAM,UAAU,GAAG,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,KAAK,CAAC,wBAAwB,CAAC,CAAC;QACvE,OAAO,UAAU,CAAC,CAAC,CAAC,EAAE,KAAK,EAAE,UAAU,CAAC,CAAC,CAAC,EAAE,IAAI,EAAE,UAAU,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,EAAE,KAAK,EAAE,EAAE,EAAE,IAAI,EAAE,EAAE,EAAE,CAAC;IAC7F,CAAC;IAGO,iBAAiB,CAAC,OAAe;QACxC,IAAI,CAAC,OAAO;YAAE,OAAO,EAAE,CAAC;QAExB,MAAM,OAAO,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,KAAK,CAAC,CAAC;QACnD,OAAO,CAAC,WAAW,CAAC,IAAA,eAAS,EAAC,IAAI,CAAC,QAAQ,EAAE,OAAO,CAAC,CAAC,CAAC;QACvD,OAAO,OAAO,CAAC,WAAW,EAAE,IAAI,EAAE;aAChC,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC;aACb,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,IAAI,EAAE,CAAC;IAC9B,CAAC;CACD;AA/RD,0CA+RC"}
|
|
@@ -3,6 +3,7 @@ Object.defineProperty(exports, "__esModule", { value: true });
|
|
|
3
3
|
exports.HackerNewsExtractor = void 0;
|
|
4
4
|
const _base_1 = require("./_base");
|
|
5
5
|
const dom_1 = require("../utils/dom");
|
|
6
|
+
const comments_1 = require("../utils/comments");
|
|
6
7
|
class HackerNewsExtractor extends _base_1.BaseExtractor {
|
|
7
8
|
constructor(document, url) {
|
|
8
9
|
super(document, url);
|
|
@@ -48,20 +49,7 @@ class HackerNewsExtractor extends _base_1.BaseExtractor {
|
|
|
48
49
|
};
|
|
49
50
|
}
|
|
50
51
|
createContentHtml(postContent, comments) {
|
|
51
|
-
return
|
|
52
|
-
<div class="hackernews-post">
|
|
53
|
-
<div class="post-content">
|
|
54
|
-
${postContent}
|
|
55
|
-
</div>
|
|
56
|
-
${comments ? `
|
|
57
|
-
<hr>
|
|
58
|
-
<h2>Comments</h2>
|
|
59
|
-
<div class="hackernews-comments">
|
|
60
|
-
${comments}
|
|
61
|
-
</div>
|
|
62
|
-
` : ''}
|
|
63
|
-
</div>
|
|
64
|
-
`.trim();
|
|
52
|
+
return (0, comments_1.buildContentHtml)('hackernews', postContent, comments);
|
|
65
53
|
}
|
|
66
54
|
getPostContent() {
|
|
67
55
|
if (!this.mainPost)
|
|
@@ -75,18 +63,12 @@ class HackerNewsExtractor extends _base_1.BaseExtractor {
|
|
|
75
63
|
const timestamp = timeElement?.getAttribute('title') || '';
|
|
76
64
|
const date = timestamp.split('T')[0] || '';
|
|
77
65
|
const points = this.mainComment.querySelector('.score')?.textContent?.trim() || '';
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
${points ? ` • <span class="comment-points">${points}</span>` : ''}
|
|
85
|
-
${parentUrl ? ` • <a href="https://news.ycombinator.com/${parentUrl}" class="parent-link">parent</a>` : ''}
|
|
86
|
-
</div>
|
|
87
|
-
<div class="comment-content">${commentText}</div>
|
|
88
|
-
</div>
|
|
89
|
-
`.trim();
|
|
66
|
+
return (0, comments_1.buildComment)({
|
|
67
|
+
author,
|
|
68
|
+
date,
|
|
69
|
+
content: commentText,
|
|
70
|
+
score: points || undefined,
|
|
71
|
+
});
|
|
90
72
|
}
|
|
91
73
|
// Otherwise handle regular post content
|
|
92
74
|
const titleRow = this.mainPost.querySelector('tr.athing');
|
|
@@ -107,10 +89,8 @@ class HackerNewsExtractor extends _base_1.BaseExtractor {
|
|
|
107
89
|
return this.processComments(comments);
|
|
108
90
|
}
|
|
109
91
|
processComments(comments) {
|
|
110
|
-
|
|
92
|
+
const commentData = [];
|
|
111
93
|
const processedIds = new Set();
|
|
112
|
-
let currentDepth = -1;
|
|
113
|
-
let blockquoteStack = [];
|
|
114
94
|
for (const comment of comments) {
|
|
115
95
|
const id = comment.getAttribute('id');
|
|
116
96
|
if (!id || processedIds.has(id))
|
|
@@ -124,53 +104,19 @@ class HackerNewsExtractor extends _base_1.BaseExtractor {
|
|
|
124
104
|
const points = comment.querySelector('.score')?.textContent?.trim() || '';
|
|
125
105
|
if (!commentText)
|
|
126
106
|
continue;
|
|
127
|
-
// Get the comment URL
|
|
128
107
|
const commentUrl = `https://news.ycombinator.com/item?id=${id}`;
|
|
129
|
-
// Get the timestamp from the title attribute and extract the date portion
|
|
130
108
|
const timestamp = timeElement?.getAttribute('title') || '';
|
|
131
109
|
const date = timestamp.split('T')[0] || '';
|
|
132
|
-
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
138
|
-
|
|
139
|
-
|
|
140
|
-
currentDepth = 0;
|
|
141
|
-
}
|
|
142
|
-
// For nested comments
|
|
143
|
-
else {
|
|
144
|
-
// If we're moving back up the tree
|
|
145
|
-
if (depth < currentDepth) {
|
|
146
|
-
while (blockquoteStack.length > 0 && blockquoteStack[blockquoteStack.length - 1] >= depth) {
|
|
147
|
-
html += '</blockquote>';
|
|
148
|
-
blockquoteStack.pop();
|
|
149
|
-
}
|
|
150
|
-
}
|
|
151
|
-
// If we're going deeper
|
|
152
|
-
else if (depth > currentDepth) {
|
|
153
|
-
html += '<blockquote>';
|
|
154
|
-
blockquoteStack.push(depth);
|
|
155
|
-
}
|
|
156
|
-
// If we're at the same depth, no need to close or open blockquotes
|
|
157
|
-
}
|
|
158
|
-
html += `<div class="comment">
|
|
159
|
-
<div class="comment-metadata">
|
|
160
|
-
<span class="comment-author"><strong>${author}</strong></span> •
|
|
161
|
-
<a href="${commentUrl}" class="comment-link">${date}</a>
|
|
162
|
-
${points ? ` • <span class="comment-points">${points}</span>` : ''}
|
|
163
|
-
</div>
|
|
164
|
-
<div class="comment-content">${(0, dom_1.serializeHTML)(commentText)}</div>
|
|
165
|
-
</div>`;
|
|
166
|
-
currentDepth = depth;
|
|
167
|
-
}
|
|
168
|
-
// Close any remaining blockquotes
|
|
169
|
-
while (blockquoteStack.length > 0) {
|
|
170
|
-
html += '</blockquote>';
|
|
171
|
-
blockquoteStack.pop();
|
|
110
|
+
commentData.push({
|
|
111
|
+
author,
|
|
112
|
+
date,
|
|
113
|
+
content: (0, dom_1.serializeHTML)(commentText),
|
|
114
|
+
depth,
|
|
115
|
+
score: points || undefined,
|
|
116
|
+
url: commentUrl,
|
|
117
|
+
});
|
|
172
118
|
}
|
|
173
|
-
return
|
|
119
|
+
return (0, comments_1.buildCommentTree)(commentData);
|
|
174
120
|
}
|
|
175
121
|
getPostId() {
|
|
176
122
|
const match = this.url.match(/id=(\d+)/);
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"hackernews.js","sourceRoot":"","sources":["../../src/extractors/hackernews.ts"],"names":[],"mappings":";;;AAAA,mCAAwC;AAExC,sCAA6C;
|
|
1
|
+
{"version":3,"file":"hackernews.js","sourceRoot":"","sources":["../../src/extractors/hackernews.ts"],"names":[],"mappings":";;;AAAA,mCAAwC;AAExC,sCAA6C;AAC7C,gDAAkG;AAElG,MAAa,mBAAoB,SAAQ,qBAAa;IAKrD,YAAY,QAAkB,EAAE,GAAW;QAC1C,KAAK,CAAC,QAAQ,EAAE,GAAG,CAAC,CAAC;QACrB,IAAI,CAAC,QAAQ,GAAG,QAAQ,CAAC,aAAa,CAAC,UAAU,CAAC,CAAC;QACnD,IAAI,CAAC,aAAa,GAAG,IAAI,CAAC,iBAAiB,EAAE,CAAC;QAC9C,IAAI,CAAC,WAAW,GAAG,IAAI,CAAC,aAAa,CAAC,CAAC,CAAC,IAAI,CAAC,eAAe,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC;IACvE,CAAC;IAEO,iBAAiB;QACxB,wEAAwE;QACxE,OAAO,CAAC,CAAC,IAAI,CAAC,QAAQ,EAAE,aAAa,CAAC,UAAU,CAAC,IAAI,CAAC,IAAI,CAAC,QAAQ,EAAE,aAAa,CAAC,YAAY,CAAC,CAAC;IAClG,CAAC;IAEO,eAAe;QACtB,4EAA4E;QAC5E,2EAA2E;QAC3E,8EAA8E;QAC9E,OAAO,IAAI,CAAC,QAAQ,EAAE,aAAa,CAAC,WAAW,CAAC,IAAI,IAAI,CAAC;IAC1D,CAAC;IAED,UAAU;QACT,OAAO,CAAC,CAAC,IAAI,CAAC,QAAQ,CAAC;IACxB,CAAC;IAED,OAAO;QACN,MAAM,WAAW,GAAG,IAAI,CAAC,cAAc,EAAE,CAAC;QAC1C,MAAM,QAAQ,GAAG,IAAI,CAAC,eAAe,EAAE,CAAC;QAExC,MAAM,WAAW,GAAG,IAAI,CAAC,iBAAiB,CAAC,WAAW,EAAE,QAAQ,CAAC,CAAC;QAClE,MAAM,SAAS,GAAG,IAAI,CAAC,YAAY,EAAE,CAAC;QACtC,MAAM,UAAU,GAAG,IAAI,CAAC,aAAa,EAAE,CAAC;QACxC,MAAM,WAAW,GAAG,IAAI,CAAC,iBAAiB,EAAE,CAAC;QAC7C,MAAM,SAAS,GAAG,IAAI,CAAC,WAAW,EAAE,CAAC;QAErC,OAAO;YACN,OAAO,EAAE,WAAW;YACpB,WAAW,EAAE,WAAW;YACxB,gBAAgB,EAAE;gBACjB,MAAM,EAAE,IAAI,CAAC,SAAS,EAAE;gBACxB,UAAU;aACV;YACD,SAAS,EAAE;gBACV,KAAK,EAAE,SAAS;gBAChB,MAAM,EAAE,UAAU;gBAClB,IAAI,EAAE,aAAa;gBACnB,WAAW;gBACX,SAAS;aACT;SACD,CAAC;IACH,CAAC;IAEO,iBAAiB,CAAC,WAAmB,EAAE,QAAgB;QAC9D,OAAO,IAAA,2BAAgB,EAAC,YAAY,EAAE,WAAW,EAAE,QAAQ,CAAC,CAAC;IAC9D,CAAC;IAEO,cAAc;QACrB,IAAI,CAAC,IAAI,CAAC,QAAQ;YAAE,OAAO,EAAE,CAAC;QAE9B,iEAAiE;QACjE,IAAI,IAAI,CAAC,aAAa,IAAI,IAAI,CAAC,WAAW,EAAE,CAAC;YAC5C,MAAM,MAAM,GAAG,IAAI,CAAC,WAAW,CAAC,aAAa,CAAC,SAAS,CAAC,EAAE,WAAW,IAAI,WAAW,CAAC;YACrF,MAAM,QAAQ,GAAG,IAAI,CAAC,WAAW,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC;YAC7D,MAAM,WAAW,GAAG,QAAQ,CAAC,CAAC,CAAC,IAAA,mBAAa,EAAC,QAAQ,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;YAC5D,MAAM,WAAW,GAAG,IAAI,CAAC,WAAW,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;YAC3D,MAAM,SAAS,GAAG,WAAW,EAAE,YAAY,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;YAC3D,MAAM,IAAI,GAAG,SAAS,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;YAC3C,MAAM,MAAM,GAAG,IAAI,CAAC,WAAW,CAAC,aAAa,CAAC,QAAQ,CAAC,EAAE,WAAW,EAAE,IAAI,EAAE,IAAI,EAAE,CAAC;YAEnF,OAAO,IAAA,uBAAY,EAAC;gBACnB,MAAM;gBACN,IAAI;gBACJ,OAAO,EAAE,WAAW;gBACpB,KAAK,EAAE,MAAM,IAAI,SAAS;aAC1B,CAAC,CAAC;QACJ,CAAC;QAED,wCAAwC;QACxC,MAAM,QAAQ,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC;QAC1D,MAAM,MAAM,GAAG,QAAQ,EAAE,kBAAkB,CAAC;QAC5C,MAAM,GAAG,GAAG,QAAQ,EAAE,aAAa,CAAC,cAAc,CAAC,EAAE,YAAY,CAAC,MAAM,CAAC,IAAI,EAAE,CAAC;QAEhF,IAAI,OAAO,GAAG,EAAE,CAAC;QACjB,IAAI,GAAG,EAAE,CAAC;YACT,OAAO,IAAI,eAAe,GAAG,qBAAqB,GAAG,UAAU,CAAC;QACjE,CAAC;QAED,MAAM,IAAI,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,UAAU,CAAC,CAAC;QACrD,IAAI,IAAI,EAAE,CAAC;YACV,OAAO,IAAI,0BAA0B,IAAA,mBAAa,EAAC,IAAI,CAAC,QAAQ,CAAC;QAClE,CAAC;QAED,OAAO,OAAO,CAAC;IAChB,CAAC;IAEO,eAAe;QACtB,MAAM,QAAQ,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,gBAAgB,CAAC,UAAU,CAAC,CAAC,CAAC;QACxE,OAAO,IAAI,CAAC,eAAe,CAAC,QAAQ,CAAC,CAAC;IACvC,CAAC;IAEO,eAAe,CAAC,QAAmB;QAC1C,MAAM,WAAW,GAAkB,EAAE,CAAC;QACtC,MAAM,YAAY,GAAG,IAAI,GAAG,EAAU,CAAC;QAEvC,KAAK,MAAM,OAAO,IAAI,QAAQ,EAAE,CAAC;YAChC,MAAM,EAAE,GAAG,OAAO,CAAC,YAAY,CAAC,IAAI,CAAC,CAAC;YACtC,IAAI,CAAC,EAAE,IAAI,YAAY,CAAC,GAAG,CAAC,EAAE,CAAC;gBAAE,SAAS;YAC1C,YAAY,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;YAErB,MAAM,MAAM,GAAG,OAAO,CAAC,aAAa,CAAC,UAAU,CAAC,EAAE,YAAY,CAAC,OAAO,CAAC,IAAI,GAAG,CAAC;YAC/E,MAAM,KAAK,GAAG,QAAQ,CAAC,MAAM,CAAC,GAAG,EAAE,CAAC;YACpC,MAAM,WAAW,GAAG,OAAO,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC;YACvD,MAAM,MAAM,GAAG,OAAO,CAAC,aAAa,CAAC,SAAS,CAAC,EAAE,WAAW,IAAI,WAAW,CAAC;YAC5E,MAAM,WAAW,GAAG,OAAO,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;YAClD,MAAM,MAAM,GAAG,OAAO,CAAC,aAAa,CAAC,QAAQ,CAAC,EAAE,WAAW,EAAE,IAAI,EAAE,IAAI,EAAE,CAAC;YAE1E,IAAI,CAAC,WAAW;gBAAE,SAAS;YAE3B,MAAM,UAAU,GAAG,wCAAwC,EAAE,EAAE,CAAC;YAChE,MAAM,SAAS,GAAG,WAAW,EAAE,YAAY,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;YAC3D,MAAM,IAAI,GAAG,SAAS,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;YAE3C,WAAW,CAAC,IAAI,CAAC;gBAChB,MAAM;gBACN,IAAI;gBACJ,OAAO,EAAE,IAAA,mBAAa,EAAC,WAAW,CAAC;gBACnC,KAAK;gBACL,KAAK,EAAE,MAAM,IAAI,SAAS;gBAC1B,GAAG,EAAE,UAAU;aACf,CAAC,CAAC;QACJ,CAAC;QAED,OAAO,IAAA,2BAAgB,EAAC,WAAW,CAAC,CAAC;IACtC,CAAC;IAEO,SAAS;QAChB,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,KAAK,CAAC,UAAU,CAAC,CAAC;QACzC,OAAO,KAAK,EAAE,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;IACzB,CAAC;IAEO,YAAY;QACnB,IAAI,IAAI,CAAC,aAAa,IAAI,IAAI,CAAC,WAAW,EAAE,CAAC;YAC5C,MAAM,MAAM,GAAG,IAAI,CAAC,WAAW,CAAC,aAAa,CAAC,SAAS,CAAC,EAAE,WAAW,IAAI,WAAW,CAAC;YACrF,MAAM,WAAW,GAAG,IAAI,CAAC,WAAW,CAAC,aAAa,CAAC,WAAW,CAAC,EAAE,WAAW,IAAI,EAAE,CAAC;YACnF,8CAA8C;YAC9C,MAAM,OAAO,GAAG,WAAW,CAAC,IAAI,EAAE,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,GAAG,CAAC,WAAW,CAAC,MAAM,GAAG,EAAE,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC;YACzF,OAAO,cAAc,MAAM,KAAK,OAAO,EAAE,CAAC;QAC3C,CAAC;QACD,OAAO,IAAI,CAAC,QAAQ,EAAE,aAAa,CAAC,YAAY,CAAC,EAAE,WAAW,EAAE,IAAI,EAAE,IAAI,EAAE,CAAC;IAC9E,CAAC;IAEO,aAAa;QACpB,OAAO,IAAI,CAAC,QAAQ,EAAE,aAAa,CAAC,SAAS,CAAC,EAAE,WAAW,EAAE,IAAI,EAAE,IAAI,EAAE,CAAC;IAC3E,CAAC;IAEO,iBAAiB;QACxB,MAAM,KAAK,GAAG,IAAI,CAAC,YAAY,EAAE,CAAC;QAClC,MAAM,MAAM,GAAG,IAAI,CAAC,aAAa,EAAE,CAAC;QACpC,IAAI,IAAI,CAAC,aAAa,EAAE,CAAC;YACxB,OAAO,cAAc,MAAM,iBAAiB,CAAC;QAC9C,CAAC;QACD,OAAO,GAAG,KAAK,SAAS,MAAM,iBAAiB,CAAC;IACjD,CAAC;IAEO,WAAW;QAClB,IAAI,CAAC,IAAI,CAAC,QAAQ;YAAE,OAAO,EAAE,CAAC;QAE9B,MAAM,WAAW,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,MAAM,CAAC,CAAC;QACxD,MAAM,SAAS,GAAG,WAAW,EAAE,YAAY,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;QAC3D,OAAO,SAAS,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;IACtC,CAAC;CACD;AA9KD,kDA8KC"}
|
|
@@ -17,7 +17,6 @@ export declare class RedditExtractor extends BaseExtractor {
|
|
|
17
17
|
private getSubreddit;
|
|
18
18
|
private getPostAuthor;
|
|
19
19
|
private createDescription;
|
|
20
|
-
private
|
|
21
|
-
private renderOldRedditComment;
|
|
20
|
+
private collectOldRedditComments;
|
|
22
21
|
private processComments;
|
|
23
22
|
}
|