hdoc-tools 0.8.35 → 0.8.37
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/hdoc-build-pdf.js +15 -11
- package/hdoc-build.js +1 -4
- package/hdoc-module.js +12 -13
- package/hdoc-validate.js +154 -53
- package/hdoc.js +1 -2
- package/package.json +2 -2
package/hdoc-build-pdf.js
CHANGED
@@ -64,17 +64,21 @@
|
|
64
64
|
}).get();
|
65
65
|
imgs.push(...srcs);
|
66
66
|
for (let i = 0; i < imgs.length; i++) {
|
67
|
-
if (hdoc.valid_url(imgs[i])
|
67
|
+
if (hdoc.valid_url(imgs[i])) {
|
68
68
|
// External Link
|
69
|
-
|
70
|
-
|
71
|
-
|
72
|
-
|
73
|
-
|
74
|
-
|
75
|
-
|
76
|
-
|
77
|
-
|
69
|
+
try {
|
70
|
+
const file_response = request('GET', imgs[i]);
|
71
|
+
if (file_response.statusCode === 200) {
|
72
|
+
const image_buffer = file_response.getBody();
|
73
|
+
const mime_type = mime.lookup(imgs[i]);
|
74
|
+
let image_b64 = image_buffer.toString("base64");
|
75
|
+
image_b64 = `data:${mime_type};base64,${image_b64}`;
|
76
|
+
html_source = html_source.replace(imgs[i], image_b64);
|
77
|
+
} else {
|
78
|
+
throw `Unexpected Status ${file_response.statusCode}`;
|
79
|
+
}
|
80
|
+
} catch (err) {
|
81
|
+
console.log(`Error downloading external source [${imgs[i]}] - ${err}`);
|
78
82
|
}
|
79
83
|
} else {
|
80
84
|
// Internal link
|
@@ -86,7 +90,7 @@
|
|
86
90
|
image_b64 = `data:${mime_type};base64,${image_b64}`;
|
87
91
|
html_source = html_source.replace(imgs[i], image_b64);
|
88
92
|
} catch (err) {
|
89
|
-
console.log('Error reading image from HTML source [', image_path, '] -
|
93
|
+
console.log('Error reading image from HTML source [', image_path, '] -', err);
|
90
94
|
return null;
|
91
95
|
}
|
92
96
|
}
|
package/hdoc-build.js
CHANGED
@@ -652,15 +652,12 @@
|
|
652
652
|
});
|
653
653
|
}
|
654
654
|
}
|
655
|
-
|
656
655
|
}
|
657
656
|
}
|
658
657
|
}
|
659
658
|
}
|
660
659
|
}
|
661
|
-
|
662
660
|
}
|
663
|
-
//console.log(JSON.stringify(bc, null, 2));
|
664
661
|
};
|
665
662
|
|
666
663
|
exports.run = async function (source_path, verbose_output, github_api_token) {
|
@@ -765,7 +762,7 @@
|
|
765
762
|
console.log(` Static HTML Files Found: ${static_html_files.length}\n`);
|
766
763
|
|
767
764
|
// Validate content
|
768
|
-
const validation_success = validate.run(work_path, doc_id, verbose);
|
765
|
+
const validation_success = await validate.run(work_path, doc_id, verbose, hdocbook_config, hdocbook_project);
|
769
766
|
if (!validation_success) {
|
770
767
|
process.exit(1);
|
771
768
|
}
|
package/hdoc-module.js
CHANGED
@@ -2,8 +2,8 @@
|
|
2
2
|
'use strict';
|
3
3
|
|
4
4
|
const cheerio = require('cheerio'),
|
5
|
-
request = require('sync-request'),
|
6
5
|
html2text = require('html-to-text'),
|
6
|
+
request = require('sync-request'),
|
7
7
|
wordsCount = require('words-count').default;
|
8
8
|
|
9
9
|
let includesCache = {};
|
@@ -54,18 +54,17 @@
|
|
54
54
|
}
|
55
55
|
};
|
56
56
|
|
57
|
-
exports.valid_url = function (
|
58
|
-
|
59
|
-
|
60
|
-
|
61
|
-
|
62
|
-
|
63
|
-
|
64
|
-
|
65
|
-
|
66
|
-
|
67
|
-
|
68
|
-
return response;
|
57
|
+
exports.valid_url = function (url) {
|
58
|
+
|
59
|
+
const stringIsAValidUrl = (s) => {
|
60
|
+
try {
|
61
|
+
new URL(s);
|
62
|
+
return true;
|
63
|
+
} catch (err) {
|
64
|
+
return false;
|
65
|
+
}
|
66
|
+
};
|
67
|
+
return stringIsAValidUrl(url);
|
69
68
|
};
|
70
69
|
|
71
70
|
exports.expand_variables = function (text, docId = '') {
|
package/hdoc-validate.js
CHANGED
@@ -1,34 +1,79 @@
|
|
1
1
|
(function () {
|
2
2
|
'use strict';
|
3
3
|
|
4
|
-
const
|
4
|
+
const axios = require('axios'),
|
5
|
+
cheerio = require('cheerio'),
|
5
6
|
dree = require('dree'),
|
6
7
|
fs = require('fs'),
|
8
|
+
https = require('https'),
|
7
9
|
path = require('path'),
|
8
|
-
hdoc = require(path.join(__dirname, 'hdoc-module.js'))
|
9
|
-
|
10
|
+
hdoc = require(path.join(__dirname, 'hdoc-module.js'));
|
11
|
+
|
12
|
+
const agent = new https.Agent({
|
13
|
+
rejectUnauthorized: false
|
14
|
+
});
|
10
15
|
|
11
16
|
let errors = {},
|
12
17
|
messages = {},
|
13
18
|
warnings = {},
|
14
19
|
errorcount = 0,
|
15
|
-
|
16
|
-
|
20
|
+
html_files = [],
|
21
|
+
exclude_links = {};
|
17
22
|
|
18
23
|
|
19
|
-
const checkLinks = function (source_path, htmlFile, links) {
|
24
|
+
const checkLinks = async function (source_path, htmlFile, links, hdocbook_config) {
|
20
25
|
for (let i = 0; i < links.length; i++) {
|
21
26
|
|
22
27
|
// Validate that link is a valid URL first
|
23
|
-
if (!hdoc.valid_url(links[i])
|
24
|
-
|
28
|
+
if (!hdoc.valid_url(links[i])) {
|
25
29
|
// Could be a relative path, check
|
26
|
-
|
27
|
-
|
28
|
-
|
30
|
+
isRelativePath(source_path, htmlFile, links[i]);
|
31
|
+
} else {
|
32
|
+
messages[htmlFile.relativePath].push(`Link is a properly formatted external URL: ${links[i]}`);
|
33
|
+
|
34
|
+
// Skip if it's the auto-generated edit url, as these could be part of a private repo which would return a 404
|
35
|
+
if (links[i] === hdoc.get_github_api_path(hdocbook_config.publicSource, htmlFile.relativePath).edit_path.replace(path.extname(htmlFile.relativePath), '.md')) {
|
36
|
+
continue;
|
37
|
+
}
|
38
|
+
|
39
|
+
// Skip if the link is excluded in the project config
|
40
|
+
if (exclude_links[links[i]]) {
|
41
|
+
continue;
|
29
42
|
}
|
43
|
+
|
44
|
+
// Skip mailto links
|
45
|
+
if (links[i].startsWith('mailto:')) {
|
46
|
+
continue;
|
47
|
+
}
|
48
|
+
|
49
|
+
try {
|
50
|
+
await axios.get(links[i], { httpsAgent: agent });
|
51
|
+
messages[htmlFile.relativePath].push(`Link is a valid external URL: ${links[i]}`);
|
52
|
+
} catch (e) {
|
53
|
+
// Handle errors
|
54
|
+
errors[htmlFile.relativePath].push(`Link is not responding: ${links[i]} - [${e.message}]`);
|
55
|
+
}
|
56
|
+
}
|
57
|
+
}
|
58
|
+
};
|
59
|
+
|
60
|
+
const checkImages = async function (source_path, htmlFile, links) {
|
61
|
+
for (let i = 0; i < links.length; i++) {
|
62
|
+
|
63
|
+
// Validate that image is a valid URL first
|
64
|
+
if (!hdoc.valid_url(links[i])) {
|
65
|
+
// Could be a relative path, check image exists
|
66
|
+
doesFileExist(source_path, htmlFile, links[i]);
|
30
67
|
} else {
|
31
|
-
messages[htmlFile.relativePath].push(`
|
68
|
+
messages[htmlFile.relativePath].push(`Image link is a properly formatted external URL: ${links[i]}`);
|
69
|
+
// Do a Get to the URL to see if it exists
|
70
|
+
try {
|
71
|
+
const res = await axios.get(links[i]);
|
72
|
+
messages[htmlFile.relativePath].push(`Image link is a valid external URL: ${links[i]}`);
|
73
|
+
} catch (e) {
|
74
|
+
// Handle errors
|
75
|
+
errors[htmlFile.relativePath].push(`Unexpected Error from external image link: ${links[i]} - ${e.message}`);
|
76
|
+
}
|
32
77
|
}
|
33
78
|
}
|
34
79
|
};
|
@@ -47,16 +92,57 @@
|
|
47
92
|
|
48
93
|
// File callbacks for html file scan
|
49
94
|
const fileCallback = function (element) {
|
50
|
-
|
51
|
-
htmlFiles.push(element);
|
95
|
+
html_files.push(element);
|
52
96
|
};
|
53
97
|
|
54
|
-
const
|
55
|
-
|
56
|
-
let
|
98
|
+
const isRelativePath = function (source_path, html_path, relative_path) {
|
99
|
+
const rel_path_ext = path.extname(relative_path);
|
100
|
+
let response = {
|
101
|
+
is_rel_path: false,
|
102
|
+
has_md_extension: rel_path_ext === '.md'
|
103
|
+
};
|
104
|
+
|
105
|
+
const supported_relpaths = [
|
106
|
+
path.sep + 'index.htm',
|
107
|
+
path.sep + 'index.html',
|
108
|
+
'.htm',
|
109
|
+
'.html',
|
110
|
+
'.md'
|
111
|
+
];
|
57
112
|
|
58
|
-
//
|
59
|
-
|
113
|
+
// Remove explicit anchor links and _books prefix
|
114
|
+
relative_path = relative_path.split('#')[0].replace('_books/', '');
|
115
|
+
|
116
|
+
// Make full file path
|
117
|
+
const file_path = path.join(source_path, relative_path);
|
118
|
+
|
119
|
+
// Does path exist?
|
120
|
+
if (fs.existsSync(file_path)) {
|
121
|
+
response.is_rel_path = true;
|
122
|
+
} else {
|
123
|
+
// Path
|
124
|
+
for (let i = 0; i < supported_relpaths.length; i++) {
|
125
|
+
if (fs.existsSync(`${file_path}${supported_relpaths[i]}`)) {
|
126
|
+
response.is_rel_path = true;
|
127
|
+
break;
|
128
|
+
}
|
129
|
+
}
|
130
|
+
}
|
131
|
+
if (response.has_md_extension) {
|
132
|
+
errors[html_path.relativePath].push(`Relative link contains MD extension, but should not: ${relative_path}`);
|
133
|
+
} else {
|
134
|
+
if (response.is_rel_path) {
|
135
|
+
messages[html_path.relativePath].push(`Relative path exists: ${relative_path}`);
|
136
|
+
} else {
|
137
|
+
errors[html_path.relativePath].push(`Link path does not exist: ${relative_path}`);
|
138
|
+
}
|
139
|
+
}
|
140
|
+
}
|
141
|
+
|
142
|
+
const doesFileExist = function (source_path, html_path, relative_path) {
|
143
|
+
// Remove explicit anchor links and _books prefix
|
144
|
+
relative_path = relative_path.split('#')[0].replace('_books/', '');
|
145
|
+
const file_path = path.join(source_path, relative_path);
|
60
146
|
if (!fs.existsSync(file_path) && !fs.existsSync(file_path + path.sep + 'index.htm') && !fs.existsSync(file_path + 'index.html') && !fs.existsSync(file_path + '.htm') && !fs.existsSync(file_path + '.html')) {
|
61
147
|
errors[html_path.relativePath].push(`Book resource does not exist: ${relative_path}`);
|
62
148
|
return false;
|
@@ -70,7 +156,10 @@
|
|
70
156
|
const getLinks = function (file) {
|
71
157
|
messages[file.relativePath].push('Parsing HTML file');
|
72
158
|
const htmlBody = fs.readFileSync(file.path, 'utf8');
|
73
|
-
let links =
|
159
|
+
let links = {
|
160
|
+
href: [],
|
161
|
+
img: []
|
162
|
+
};
|
74
163
|
const $ = cheerio.load(htmlBody);
|
75
164
|
const hrefs = $('a').map(function (i) {
|
76
165
|
return $(this).attr('href');
|
@@ -78,35 +167,46 @@
|
|
78
167
|
const srcs = $('img').map(function (i) {
|
79
168
|
return $(this).attr('src');
|
80
169
|
}).get();
|
81
|
-
links.push(...hrefs);
|
82
|
-
links.push(...srcs);
|
170
|
+
links.href.push(...hrefs);
|
171
|
+
links.img.push(...srcs);
|
83
172
|
return links;
|
84
173
|
};
|
85
174
|
|
86
|
-
exports.run = function (source_path, doc_id, verbose) {
|
175
|
+
exports.run = async function (source_path, doc_id, verbose, hdocbook_config, hdocbook_project) {
|
87
176
|
// Get a list of HTML files in source_path
|
88
177
|
dree.scan(source_path, dreeOptions, fileCallback);
|
89
178
|
|
179
|
+
if (hdocbook_project.validation && hdocbook_project.validation.exclude_links && hdocbook_project.validation.exclude_links instanceof Array) {
|
180
|
+
hdocbook_project.validation.exclude_links.forEach(function(excl_link) {
|
181
|
+
exclude_links[excl_link] = true;
|
182
|
+
});
|
183
|
+
}
|
184
|
+
|
90
185
|
console.log(`Performing Validation and Building SEO Link List...`);
|
91
186
|
|
92
187
|
let listContent = '';
|
93
|
-
for (let i = 0; i <
|
188
|
+
for (let i = 0; i < html_files.length; i++) {
|
94
189
|
|
95
190
|
// Initiate maps for errors and verbose messages for HTML file
|
96
|
-
errors[
|
97
|
-
messages[
|
98
|
-
warnings[
|
191
|
+
errors[html_files[i].relativePath] = [];
|
192
|
+
messages[html_files[i].relativePath] = [];
|
193
|
+
warnings[html_files[i].relativePath] = [];
|
99
194
|
|
100
|
-
const links = getLinks(
|
101
|
-
if (links.length === 0) {
|
102
|
-
messages[
|
195
|
+
const links = getLinks(html_files[i]);
|
196
|
+
if (links.href.length === 0) {
|
197
|
+
messages[html_files[i].relativePath].push('No links found in file');
|
198
|
+
} else {
|
199
|
+
await checkLinks(source_path, html_files[i], links.href, hdocbook_config);
|
200
|
+
}
|
201
|
+
if (links.img.length === 0) {
|
202
|
+
messages[html_files[i].relativePath].push('No images found in file');
|
103
203
|
} else {
|
104
|
-
|
204
|
+
await checkImages(source_path, html_files[i], links.img);
|
105
205
|
}
|
106
206
|
|
107
207
|
// Build list content for Google
|
108
|
-
listContent += `/${
|
109
|
-
if (i <
|
208
|
+
listContent += `/${html_files[i].relativePath.replace(path.extname(html_files[i].relativePath), '')}`;
|
209
|
+
if (i < html_files.length - 1) {
|
110
210
|
listContent += '\r\n';
|
111
211
|
}
|
112
212
|
}
|
@@ -118,24 +218,6 @@
|
|
118
218
|
} catch (err) {
|
119
219
|
console.error(err);
|
120
220
|
}
|
121
|
-
if (errorcount === 0) {
|
122
|
-
console.log('\r\n---------------');
|
123
|
-
console.log(' No Errors ');
|
124
|
-
console.log('---------------\r\n');
|
125
|
-
} else {
|
126
|
-
console.log('\r\n------------');
|
127
|
-
console.log(' Errors ');
|
128
|
-
console.log('------------');
|
129
|
-
|
130
|
-
for (const key in errors) {
|
131
|
-
if (errors.hasOwnProperty(key) && errors[key].length > 0) {
|
132
|
-
console.log(`\r\n${errors[key].length} error(s) in ${key}`);
|
133
|
-
for (let i = 0; i < errors[key].length; i++) {
|
134
|
-
console.log(` - ${errors[key][i]}`);
|
135
|
-
}
|
136
|
-
}
|
137
|
-
}
|
138
|
-
}
|
139
221
|
|
140
222
|
if (verbose) {
|
141
223
|
console.log('\r\n-------------');
|
@@ -150,7 +232,26 @@
|
|
150
232
|
}
|
151
233
|
}
|
152
234
|
}
|
153
|
-
|
154
|
-
|
235
|
+
|
236
|
+
console.log('\r\n-----------------------');
|
237
|
+
console.log(' Validation Output ');
|
238
|
+
console.log('-----------------------');
|
239
|
+
|
240
|
+
for (const key in errors) {
|
241
|
+
if (errors.hasOwnProperty(key) && errors[key].length > 0) {
|
242
|
+
console.log(`\r\n${errors[key].length} error(s) in ${key}`);
|
243
|
+
for (let i = 0; i < errors[key].length; i++) {
|
244
|
+
console.log(` - ${errors[key][i]}`);
|
245
|
+
errorcount++;
|
246
|
+
}
|
247
|
+
}
|
248
|
+
}
|
249
|
+
|
250
|
+
if (errorcount > 0) {
|
251
|
+
console.log(`\r\n${errorcount} Validation Errors Found\r\n`);
|
252
|
+
return false;
|
253
|
+
}
|
254
|
+
console.log(`\r\nNo Validation Errors Found!\r\n`);
|
255
|
+
return true;
|
155
256
|
};
|
156
257
|
})();
|
package/hdoc.js
CHANGED
package/package.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
{
|
2
2
|
"name": "hdoc-tools",
|
3
|
-
"version": "0.8.
|
3
|
+
"version": "0.8.37",
|
4
4
|
"description": "Hornbill HDocBook Development Support Tool",
|
5
5
|
"main": "hdoc.js",
|
6
6
|
"bin": {
|
@@ -30,6 +30,7 @@
|
|
30
30
|
"author": "Hornbill Technologies Ltd",
|
31
31
|
"license": "ISC",
|
32
32
|
"dependencies": {
|
33
|
+
"axios": "^1.3.2",
|
33
34
|
"better-sqlite3": "^8.0.1",
|
34
35
|
"body-parser": "^1.20.1",
|
35
36
|
"cheerio": "^1.0.0-rc.12",
|
@@ -40,7 +41,6 @@
|
|
40
41
|
"highlight.js": "^11.6.0",
|
41
42
|
"html-to-text": "^8.2.1",
|
42
43
|
"js-yaml": "^4.1.0",
|
43
|
-
"jspdf": "^2.5.1",
|
44
44
|
"markdown-it": "^13.0.1",
|
45
45
|
"markdown-it-container": "^3.0.0",
|
46
46
|
"markdown-it-front-matter": "^0.2.3",
|