@jocmp/mercury-parser 2.4.5 → 2.4.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/generate-custom-parser.js +148 -3
- package/dist/generate-custom-parser.js.map +1 -1
- package/dist/mercury.js +151 -1
- package/dist/mercury.js.map +1 -1
- package/dist/mercury.web.js +1 -1
- package/dist/mercury.web.js.map +1 -1
- package/package.json +1 -1
package/dist/mercury.js
CHANGED
|
@@ -6867,6 +6867,151 @@ var WwwTechpowerupComExtractor = {
|
|
|
6867
6867
|
}
|
|
6868
6868
|
};
|
|
6869
6869
|
|
|
6870
|
+
/**
 * Extraction rules for www.flatpanelshd.com.
 *
 * Title, author, publication date and lead image are each read from the
 * `value` attribute of a single <meta> selector. Article content is taken
 * from `#zephr-anchor`, falling back to `article`.
 */
var WwwFlatpanelshdComExtractor = (function () {
  // Sets the node's class attribute to 'mercury-parser-keep' and returns
  // whatever attr() returns.
  // NOTE(review): presumably this class protects the heading from later
  // content cleaning; confirm against the parser's cleaners.
  function markHeadingKept($node) {
    return $node.attr('class', 'mercury-parser-keep');
  }

  // Builds a selector list holding one [selector, 'value'] attribute lookup.
  function metaValue(selector) {
    return [[selector, 'value']];
  }

  return {
    domain: 'www.flatpanelshd.com',

    title: { selectors: metaValue('meta[name="og:title"]') },

    author: { selectors: metaValue('meta[itemprop="author"]') },

    date_published: { selectors: metaValue('meta[itemprop="datePublished"]') },

    lead_image_url: { selectors: metaValue('meta[name="og:image"]') },

    content: {
      selectors: ['#zephr-anchor', 'article'],

      transforms: {
        h2: markHeadingKept,
        h3: markHeadingKept,
        h4: markHeadingKept,
        // String transform: <pre> elements are mapped to 'div'.
        pre: 'div'
      },

      // No selectors are removed from the extracted content.
      clean: []
    }
  };
})();
|
|
6901
|
+
|
|
6902
|
+
/**
 * Extraction rules for 9to5mac.com.
 *
 * The title is looked up via `title`, then `h1`. Author, publication date
 * and lead image are read from the `value` attribute of <meta> selectors.
 * Content is the `main` element with `.post-meta` removed.
 */
var Nineto5macComExtractor = (function () {
  // Removes the `sizes` attribute from an image node. Returns nothing.
  function stripSizes(node) {
    node.removeAttr('sizes');
  }

  var contentRules = {
    selectors: ['main'],
    transforms: { img: stripSizes },
    clean: ['.post-meta']
  };

  return {
    domain: '9to5mac.com',
    title: { selectors: ['title', 'h1'] },
    author: { selectors: [['meta[name="author"]', 'value']] },
    date_published: {
      selectors: [['meta[name="article:published_time"]', 'value']]
    },
    lead_image_url: { selectors: [['meta[name="og:image"]', 'value']] },
    content: contentRules
  };
})();
|
|
6926
|
+
|
|
6927
|
+
/**
 * Extraction rules for www.notebookcheck.net.
 *
 * Title comes from `h1`, author from `.intro-author a`, and the publication
 * date from the `datetime` attribute of `.intro-author time` (declared
 * timezone: GMT). The lead image is read from the og:image <meta> value.
 * Content is `#content` with several page-chrome selectors removed.
 */
var WwwNotebookcheckNetExtractor = {
  domain: 'www.notebookcheck.net',

  title: { selectors: ['h1'] },

  author: { selectors: ['.intro-author a'] },

  date_published: {
    selectors: [['.intro-author time', 'datetime']],
    timezone: 'GMT'
  },

  lead_image_url: { selectors: [['meta[name="og:image"]', 'value']] },

  content: {
    selectors: ['#content'],

    // One transform per heading level (h2, h3, h4, in that order). Each sets
    // the node's class attribute to 'mercury-parser-keep' and returns the
    // result of attr().
    transforms: ['h2', 'h3', 'h4'].reduce(function (rules, tag) {
      rules[tag] = function ($node) {
        return $node.attr('class', 'mercury-parser-keep');
      };
      return rules;
    }, {}),

    clean: [
      '.ttcl_3',
      '.socialarea',
      '.tx-nbc2fe-relatedarticles',
      'aside'
    ]
  }
};
|
|
6958
|
+
|
|
6959
|
+
/**
 * Extraction rules for www.futura-sciences.com.
 *
 * The title is looked up via `title`, then `h1`. Author, publication date
 * and lead image are read from the `value` attribute of <meta> selectors.
 * Content is `#article-anchor-article-main-content`, falling back to
 * `.article-text`, with `.cWHWfD` removed.
 */
var WwwFuturaSciencesComExtractor = (function () {
  var KEEP_CLASS = 'mercury-parser-keep';

  // Sets the node's class attribute to KEEP_CLASS and returns the result of
  // attr(). Applied to headings and unordered lists below.
  function keep($node) {
    return $node.attr('class', KEEP_CLASS);
  }

  var titleRule = { selectors: ['title', 'h1'] };
  var authorRule = { selectors: [['meta[name="author"]', 'value']] };
  var dateRule = {
    selectors: [['meta[name="article:published_time"]', 'value']]
  };
  var imageRule = { selectors: [['meta[name="og:image"]', 'value']] };

  var contentRule = {
    selectors: ['#article-anchor-article-main-content', '.article-text'],
    transforms: { h2: keep, h3: keep, h4: keep, ul: keep },
    clean: ['.cWHWfD']
  };

  return {
    domain: 'www.futura-sciences.com',
    title: titleRule,
    author: authorRule,
    date_published: dateRule,
    lead_image_url: imageRule,
    content: contentRule
  };
})();
|
|
6992
|
+
|
|
6993
|
+
/**
 * Extraction rules for sg.news.yahoo.com.
 *
 * Title: og:title <meta> value, falling back to `title`.
 * Author: text of `.caas-attr-provider`, falling back to the author <meta>
 * value.
 * Date: text of `time[datetime]`, falling back to the
 * article:published_time <meta> value (declared timezone: UTC).
 * Content: `.caas-body-content`, falling back to `article`, with header,
 * logo, button and advertisement selectors removed.
 */
var SgNewsYahooComExtractor = {
  domain: 'sg.news.yahoo.com',

  title: {
    selectors: [['meta[name="og:title"]', 'value'], 'title']
  },

  author: {
    // A <meta> element has no text content, so the fallback must read an
    // attribute. Uses the same [selector, 'value'] form as the other
    // extractors in this file.
    selectors: ['.caas-attr-provider', ['meta[name="author"]', 'value']]
  },

  date_published: {
    // The <meta> fallback reads the 'value' attribute and uses name= rather
    // than property=, matching the article:published_time selectors used by
    // the other extractors in this file.
    // NOTE(review): the first selector reads the <time> element's text, not
    // its datetime attribute. Confirm whether ['time[datetime]', 'datetime']
    // was intended.
    selectors: [
      'time[datetime]',
      ['meta[name="article:published_time"]', 'value']
    ],
    timezone: 'UTC'
  },

  lead_image_url: {
    selectors: [['meta[name="og:image"]', 'value']]
  },

  content: {
    selectors: ['.caas-body-content', 'article'],

    transforms: {},

    clean: [
      '.caas-header',
      '.caas-logo',
      '.caas-title-wrapper',
      'button',
      '.advertisement',
      // '.sda-*' is not a valid CSS wildcard. These two attribute selectors
      // match any element with a class token beginning with "sda-", whether
      // it is the first token or a later one.
      '[class^="sda-"]',
      '[class*=" sda-"]',
      '[data-content="Advertisement"]'
    ]
  }
};
|
|
7014
|
+
|
|
6870
7015
|
|
|
6871
7016
|
|
|
6872
7017
|
var CustomExtractors = /*#__PURE__*/Object.freeze({
|
|
@@ -7047,7 +7192,12 @@ var CustomExtractors = /*#__PURE__*/Object.freeze({
|
|
|
7047
7192
|
WwwVortezNetExtractor: WwwVortezNetExtractor,
|
|
7048
7193
|
WwwPolygonComExtractor: WwwPolygonComExtractor,
|
|
7049
7194
|
WwwThevergeComExtractor: WwwThevergeComExtractor,
|
|
7050
|
-
WwwTechpowerupComExtractor: WwwTechpowerupComExtractor
|
|
7195
|
+
WwwTechpowerupComExtractor: WwwTechpowerupComExtractor,
|
|
7196
|
+
WwwFlatpanelshdComExtractor: WwwFlatpanelshdComExtractor,
|
|
7197
|
+
Nineto5macComExtractor: Nineto5macComExtractor,
|
|
7198
|
+
WwwNotebookcheckNetExtractor: WwwNotebookcheckNetExtractor,
|
|
7199
|
+
WwwFuturaSciencesComExtractor: WwwFuturaSciencesComExtractor,
|
|
7200
|
+
SgNewsYahooComExtractor: SgNewsYahooComExtractor
|
|
7051
7201
|
});
|
|
7052
7202
|
|
|
7053
7203
|
var Extractors = _Object$keys(CustomExtractors).reduce(function (acc, key) {
|