@zonuexe/techbook-mcp 0.2.2 → 0.2.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +28 -1
- package/README.md +39 -20
- package/dist/adapters/calil.d.ts +10 -0
- package/dist/adapters/calil.d.ts.map +1 -0
- package/dist/adapters/calil.js +45 -0
- package/dist/adapters/calil.js.map +1 -0
- package/dist/adapters/openbd.d.ts +57 -0
- package/dist/adapters/openbd.d.ts.map +1 -0
- package/dist/adapters/openbd.js +87 -0
- package/dist/adapters/openbd.js.map +1 -0
- package/dist/adapters/publishers/google-books.d.ts +4 -0
- package/dist/adapters/publishers/google-books.d.ts.map +1 -0
- package/dist/adapters/publishers/google-books.js +75 -0
- package/dist/adapters/publishers/google-books.js.map +1 -0
- package/dist/adapters/publishers/isbn-publisher-codes.d.ts +21 -0
- package/dist/adapters/publishers/isbn-publisher-codes.d.ts.map +1 -0
- package/dist/adapters/publishers/isbn-publisher-codes.js +49 -0
- package/dist/adapters/publishers/isbn-publisher-codes.js.map +1 -0
- package/dist/adapters/publishers/juse-p.d.ts +3 -0
- package/dist/adapters/publishers/juse-p.d.ts.map +1 -0
- package/dist/adapters/publishers/juse-p.js +110 -0
- package/dist/adapters/publishers/juse-p.js.map +1 -0
- package/dist/adapters/publishers/registry.d.ts.map +1 -1
- package/dist/adapters/publishers/registry.js +4 -0
- package/dist/adapters/publishers/registry.js.map +1 -1
- package/dist/adapters/publishers/tatsu-zine.d.ts.map +1 -1
- package/dist/adapters/publishers/tatsu-zine.js +6 -18
- package/dist/adapters/publishers/tatsu-zine.js.map +1 -1
- package/dist/application/get-book-by-isbn.d.ts +13 -0
- package/dist/application/get-book-by-isbn.d.ts.map +1 -0
- package/dist/application/get-book-by-isbn.js +61 -0
- package/dist/application/get-book-by-isbn.js.map +1 -0
- package/dist/application/get-book-detail.d.ts.map +1 -1
- package/dist/application/get-book-detail.js +16 -1
- package/dist/application/get-book-detail.js.map +1 -1
- package/dist/application/search-books.d.ts.map +1 -1
- package/dist/application/search-books.js +20 -0
- package/dist/application/search-books.js.map +1 -1
- package/dist/config/credentials.d.ts +8 -0
- package/dist/config/credentials.d.ts.map +1 -0
- package/dist/config/credentials.js +32 -0
- package/dist/config/credentials.js.map +1 -0
- package/dist/main.js +15 -1
- package/dist/main.js.map +1 -1
- package/dist/mcp/server.d.ts.map +1 -1
- package/dist/mcp/server.js +10 -0
- package/dist/mcp/server.js.map +1 -1
- package/dist/mcp/tools.d.ts +13 -0
- package/dist/mcp/tools.d.ts.map +1 -1
- package/dist/mcp/tools.js +16 -0
- package/dist/mcp/tools.js.map +1 -1
- package/dist/setup.d.ts +2 -0
- package/dist/setup.d.ts.map +1 -0
- package/dist/setup.js +43 -0
- package/dist/setup.js.map +1 -0
- package/flake.lock +61 -0
- package/package.json +1 -1
- package/.claude/settings.local.json +0 -36
- package/.codex/skills/techbook-mcp-release-prep/SKILL.md +0 -105
- package/.github/workflows/test.yml +0 -72
- package/.oxlintrc.json +0 -12
- package/AGENTS.md +0 -100
- package/deno.json +0 -3
- package/src/adapters/cache/memory-cache.ts +0 -31
- package/src/adapters/cache/null-cache.ts +0 -8
- package/src/adapters/html/cheerio-parser.ts +0 -50
- package/src/adapters/http/fetch-client.ts +0 -47
- package/src/adapters/http/mock-client.ts +0 -77
- package/src/adapters/publishers/base.ts +0 -279
- package/src/adapters/publishers/book-tech.ts +0 -117
- package/src/adapters/publishers/born-digital.ts +0 -143
- package/src/adapters/publishers/coronasha.ts +0 -139
- package/src/adapters/publishers/gihyo.ts +0 -120
- package/src/adapters/publishers/impress.ts +0 -103
- package/src/adapters/publishers/lambdanote.ts +0 -146
- package/src/adapters/publishers/manatee.ts +0 -113
- package/src/adapters/publishers/maruzen-publishing.ts +0 -129
- package/src/adapters/publishers/optronics.ts +0 -113
- package/src/adapters/publishers/oreilly-japan.ts +0 -133
- package/src/adapters/publishers/peaks.ts +0 -98
- package/src/adapters/publishers/personal-media.ts +0 -168
- package/src/adapters/publishers/registry.ts +0 -38
- package/src/adapters/publishers/rutles.ts +0 -149
- package/src/adapters/publishers/saiensu.ts +0 -136
- package/src/adapters/publishers/seshop.ts +0 -121
- package/src/adapters/publishers/tatsu-zine.ts +0 -154
- package/src/adapters/publishers/techbookfest.ts +0 -179
- package/src/application/get-book-detail.ts +0 -24
- package/src/application/search-books.ts +0 -44
- package/src/domain/book.ts +0 -35
- package/src/domain/publisher.ts +0 -18
- package/src/main.ts +0 -14
- package/src/mcp/server.ts +0 -103
- package/src/mcp/tools.ts +0 -54
- package/src/ports/cache.ts +0 -5
- package/src/ports/html-parser.ts +0 -15
- package/src/ports/http.ts +0 -17
- package/tests/fixtures/book-tech-detail.html +0 -51
- package/tests/fixtures/book-tech-search.html +0 -91
- package/tests/fixtures/born-digital-detail.html +0 -62
- package/tests/fixtures/born-digital-search.html +0 -51
- package/tests/fixtures/coronasha-detail.html +0 -41
- package/tests/fixtures/coronasha-search.html +0 -61
- package/tests/fixtures/gihyo-detail.html +0 -42
- package/tests/fixtures/gihyo-search.json +0 -54
- package/tests/fixtures/impress-detail-epub.html +0 -746
- package/tests/fixtures/impress-detail-social.html +0 -689
- package/tests/fixtures/lambdanote-search.html +0 -66
- package/tests/fixtures/manatee-detail.html +0 -53
- package/tests/fixtures/manatee-search.html +0 -59
- package/tests/fixtures/maruzen-detail.html +0 -51
- package/tests/fixtures/maruzen-search.html +0 -60
- package/tests/fixtures/optronics-detail.html +0 -30
- package/tests/fixtures/optronics-search.html +0 -75
- package/tests/fixtures/oreilly-detail.html +0 -52
- package/tests/fixtures/oreilly-ebook-list.html +0 -53
- package/tests/fixtures/peaks-detail.html +0 -39
- package/tests/fixtures/peaks-top.html +0 -50
- package/tests/fixtures/personal-media-detail.html +0 -32
- package/tests/fixtures/personal-media-search.html +0 -39
- package/tests/fixtures/rutles-detail.html +0 -32
- package/tests/fixtures/rutles-search.html +0 -62
- package/tests/fixtures/saiensu-detail.html +0 -41
- package/tests/fixtures/saiensu-search.html +0 -65
- package/tests/fixtures/seshop-detail.html +0 -45
- package/tests/fixtures/seshop-search.html +0 -58
- package/tests/fixtures/tatsu-zine-detail-free.html +0 -22
- package/tests/fixtures/tatsu-zine-search.html +0 -40
- package/tests/fixtures/techbookfest-search.json +0 -73
- package/tests/unit/adapters/base.test.ts +0 -441
- package/tests/unit/adapters/publishers/book-tech.test.ts +0 -186
- package/tests/unit/adapters/publishers/born-digital.test.ts +0 -194
- package/tests/unit/adapters/publishers/coronasha.test.ts +0 -207
- package/tests/unit/adapters/publishers/gihyo.test.ts +0 -137
- package/tests/unit/adapters/publishers/impress.test.ts +0 -129
- package/tests/unit/adapters/publishers/lambdanote.test.ts +0 -85
- package/tests/unit/adapters/publishers/manatee.test.ts +0 -165
- package/tests/unit/adapters/publishers/maruzen-publishing.test.ts +0 -179
- package/tests/unit/adapters/publishers/optronics.test.ts +0 -208
- package/tests/unit/adapters/publishers/oreilly-japan.test.ts +0 -194
- package/tests/unit/adapters/publishers/peaks.test.ts +0 -177
- package/tests/unit/adapters/publishers/personal-media.test.ts +0 -199
- package/tests/unit/adapters/publishers/rutles.test.ts +0 -173
- package/tests/unit/adapters/publishers/saiensu.test.ts +0 -169
- package/tests/unit/adapters/publishers/seshop.test.ts +0 -174
- package/tests/unit/adapters/publishers/tatsu-zine.test.ts +0 -172
- package/tests/unit/adapters/publishers/techbookfest.test.ts +0 -94
- package/tests/unit/adapters/registry.test.ts +0 -37
- package/tests/unit/application/get-book-detail.test.ts +0 -102
- package/tests/unit/application/search-books.test.ts +0 -137
- package/tsconfig.json +0 -17
|
@@ -1,120 +0,0 @@
|
|
|
1
|
-
import type { PublisherAdapter, PublisherDeps } from "../../domain/publisher.js";
|
|
2
|
-
import type { BookRecord, SearchQuery } from "../../domain/book.js";
|
|
3
|
-
import { fetchText, stripHtmlTags, resolveUrl, extractAsin, extractEbookStoresFromDoc } from "./base.js";
|
|
4
|
-
|
|
5
|
-
const BASE_URL = "https://gihyo.jp";
|
|
6
|
-
|
|
7
|
-
// --- API レスポンス型 ---
|
|
8
|
-
|
|
9
|
-
interface GihyoSearchResponse {
|
|
10
|
-
lname: string;
|
|
11
|
-
total: number;
|
|
12
|
-
list: Record<string, GihyoBookEntry>;
|
|
13
|
-
next: boolean;
|
|
14
|
-
query: string;
|
|
15
|
-
}
|
|
16
|
-
|
|
17
|
-
interface GihyoBookEntry {
|
|
18
|
-
series: string;
|
|
19
|
-
title: string;
|
|
20
|
-
subtitle: string;
|
|
21
|
-
/** キー: 役割 ("著", "監修" など)、値: { 著者名: markup } */
|
|
22
|
-
author: Record<string, Record<string, string>>;
|
|
23
|
-
/** [定価, 割引価格] */
|
|
24
|
-
price: [number, number];
|
|
25
|
-
stock: number;
|
|
26
|
-
/** ["YYYY.M.D", ""] */
|
|
27
|
-
release: [string, string];
|
|
28
|
-
/** 相対URL: "/book/YYYY/978-4-..." */
|
|
29
|
-
url: string;
|
|
30
|
-
upcoming: boolean;
|
|
31
|
-
support: boolean;
|
|
32
|
-
/** [thumb_url, width, height, full_url] */
|
|
33
|
-
cover: [string, number, number, string];
|
|
34
|
-
}
|
|
35
|
-
|
|
36
|
-
// --- 変換ヘルパー ---
|
|
37
|
-
|
|
38
|
-
function parseAuthors(authorField: Record<string, Record<string, string>>): string[] {
|
|
39
|
-
return Object.values(authorField).flatMap(roleEntries =>
|
|
40
|
-
Object.keys(roleEntries).map(name => stripHtmlTags(name).trim()),
|
|
41
|
-
);
|
|
42
|
-
}
|
|
43
|
-
|
|
44
|
-
function parseReleaseDate(release: [string, string]): string | undefined {
|
|
45
|
-
const raw = release[0];
|
|
46
|
-
if (!raw) return undefined;
|
|
47
|
-
// "2025.9.29" → "2025-09-29"
|
|
48
|
-
const parts = raw.split(".");
|
|
49
|
-
if (parts.length !== 3) return raw;
|
|
50
|
-
const [y, m, d] = parts;
|
|
51
|
-
return `${y}-${m.padStart(2, "0")}-${d.padStart(2, "0")}`;
|
|
52
|
-
}
|
|
53
|
-
|
|
54
|
-
function entryToBookRecord(isbn: string, entry: GihyoBookEntry): BookRecord {
|
|
55
|
-
const title = entry.subtitle
|
|
56
|
-
? `${entry.title} ${entry.subtitle}`
|
|
57
|
-
: entry.title;
|
|
58
|
-
|
|
59
|
-
return {
|
|
60
|
-
title,
|
|
61
|
-
authors: parseAuthors(entry.author),
|
|
62
|
-
publisher: "技術評論社",
|
|
63
|
-
publishedAt: parseReleaseDate(entry.release),
|
|
64
|
-
isbn: isbn.replace(/-/g, ""),
|
|
65
|
-
url: resolveUrl(BASE_URL, entry.url),
|
|
66
|
-
price: entry.price[0] > 0 ? entry.price[0] : undefined,
|
|
67
|
-
coverImageUrl: entry.cover[3] ? resolveUrl(BASE_URL, entry.cover[3]) : undefined,
|
|
68
|
-
};
|
|
69
|
-
}
|
|
70
|
-
|
|
71
|
-
// --- アダプター実装 ---
|
|
72
|
-
|
|
73
|
-
export const gihyoAdapter: PublisherAdapter = {
|
|
74
|
-
id: "gihyo",
|
|
75
|
-
name: "技術評論社",
|
|
76
|
-
baseUrl: BASE_URL,
|
|
77
|
-
|
|
78
|
-
async search(query: SearchQuery, deps: PublisherDeps): Promise<BookRecord[]> {
|
|
79
|
-
const word = [query.title, query.author].filter(Boolean).join(" ");
|
|
80
|
-
if (!word) return [];
|
|
81
|
-
|
|
82
|
-
const limit = query.limit ?? 10;
|
|
83
|
-
const url = `${BASE_URL}/api_gh/site/search?search=${encodeURIComponent(word)}&limit=${limit}`;
|
|
84
|
-
const text = await fetchText(url, deps);
|
|
85
|
-
const data: GihyoSearchResponse = JSON.parse(text);
|
|
86
|
-
|
|
87
|
-
return Object.entries(data.list).map(([isbn, entry]) => entryToBookRecord(isbn, entry));
|
|
88
|
-
},
|
|
89
|
-
|
|
90
|
-
async getDetail(url: string, deps: PublisherDeps): Promise<BookRecord> {
|
|
91
|
-
// URL例: https://gihyo.jp/book/2022/978-4-297-12815-2
|
|
92
|
-
const isbnMatch = url.match(/\/(978-[\d-]+)\s*$/);
|
|
93
|
-
if (!isbnMatch) throw new Error(`URLからISBNを取得できません: ${url}`);
|
|
94
|
-
|
|
95
|
-
const isbn = isbnMatch[1];
|
|
96
|
-
const apiUrl = `${BASE_URL}/api_gh/site/search?search=${encodeURIComponent(isbn)}&limit=1`;
|
|
97
|
-
|
|
98
|
-
// JSONメタデータとebook store情報(HTML)を並列取得
|
|
99
|
-
const [apiText, htmlText] = await Promise.all([
|
|
100
|
-
fetchText(apiUrl, deps),
|
|
101
|
-
fetchText(url, deps),
|
|
102
|
-
]);
|
|
103
|
-
|
|
104
|
-
const data: GihyoSearchResponse = JSON.parse(apiText);
|
|
105
|
-
const entry = data.list[isbn];
|
|
106
|
-
if (!entry) throw new Error(`書籍が見つかりません: ${isbn}`);
|
|
107
|
-
|
|
108
|
-
const base = entryToBookRecord(isbn, entry);
|
|
109
|
-
|
|
110
|
-
const doc = deps.parser.parse(htmlText);
|
|
111
|
-
const ebookStores = extractEbookStoresFromDoc(doc);
|
|
112
|
-
const asin = extractAsin(htmlText);
|
|
113
|
-
|
|
114
|
-
return {
|
|
115
|
-
...base,
|
|
116
|
-
asin,
|
|
117
|
-
ebookStores: ebookStores.length > 0 ? ebookStores : undefined,
|
|
118
|
-
};
|
|
119
|
-
},
|
|
120
|
-
};
|
|
@@ -1,103 +0,0 @@
|
|
|
1
|
-
import type { PublisherAdapter, PublisherDeps } from "../../domain/publisher.js";
|
|
2
|
-
import type { BookRecord, SearchQuery, DrmType } from "../../domain/book.js";
|
|
3
|
-
import { fetchText, parseJapanesePrice, stripAuthorRole } from "./base.js";
|
|
4
|
-
|
|
5
|
-
const BASE_URL = "https://book.impress.co.jp";
|
|
6
|
-
|
|
7
|
-
/** "2026/1/22" → "2026-01-22" */
|
|
8
|
-
function parseImpressDate(text: string): string | undefined {
|
|
9
|
-
const m = text.trim().match(/(\d{4})\/(\d{1,2})\/(\d{1,2})/);
|
|
10
|
-
if (!m) return undefined;
|
|
11
|
-
return `${m[1]}-${m[2].padStart(2, "0")}-${m[3].padStart(2, "0")}`;
|
|
12
|
-
}
|
|
13
|
-
|
|
14
|
-
/**
|
|
15
|
-
* 著者文字列から著者名配列を返す。
|
|
16
|
-
* 例: "山本康太 著" → ["山本康太"]
|
|
17
|
-
* 複数著者は「、」または改行で区切られる。
|
|
18
|
-
*/
|
|
19
|
-
function parseAuthors(text: string): string[] {
|
|
20
|
-
return text
|
|
21
|
-
.split(/[、,\n]/)
|
|
22
|
-
.map(s => stripAuthorRole(s.trim()))
|
|
23
|
-
.filter(Boolean);
|
|
24
|
-
}
|
|
25
|
-
|
|
26
|
-
/**
|
|
27
|
-
* 電子書籍ガイドのテキストから DRM 種別を判定する。
|
|
28
|
-
* 明示されていない場合はインプレスの公式方針に基づき social を返す。
|
|
29
|
-
*/
|
|
30
|
-
function parseDrmType(text: string): DrmType {
|
|
31
|
-
if (/ソーシャルDRM/i.test(text)) return "social";
|
|
32
|
-
if (/DRM-?free|DRMフリー/i.test(text)) return "free";
|
|
33
|
-
if (/パスワード/i.test(text)) return "password_pdf";
|
|
34
|
-
return "social";
|
|
35
|
-
}
|
|
36
|
-
|
|
37
|
-
export const impressBooksAdapter: PublisherAdapter = {
|
|
38
|
-
id: "impress-books",
|
|
39
|
-
name: "インプレスブックス",
|
|
40
|
-
baseUrl: BASE_URL,
|
|
41
|
-
|
|
42
|
-
async search(_query: SearchQuery, _deps: PublisherDeps): Promise<BookRecord[]> {
|
|
43
|
-
// 検索ページは Google Custom Search Engine による JavaScript レンダリングのためスクレイピング不可
|
|
44
|
-
return [];
|
|
45
|
-
},
|
|
46
|
-
|
|
47
|
-
async getDetail(url: string, deps: PublisherDeps): Promise<BookRecord> {
|
|
48
|
-
const html = await fetchText(url, deps);
|
|
49
|
-
const doc = deps.parser.parse(html);
|
|
50
|
-
|
|
51
|
-
// タイトル(ページ内最初の h2)
|
|
52
|
-
const title = doc.selectOne("h2")?.text().trim() ?? "";
|
|
53
|
-
|
|
54
|
-
// dl.module-book-data の dt/dd を順序でペアリング
|
|
55
|
-
const dts = doc.select("dl.module-book-data dt");
|
|
56
|
-
const dds = doc.select("dl.module-book-data dd");
|
|
57
|
-
const bookDataMap = new Map<string, string>();
|
|
58
|
-
for (let i = 0; i < dts.length; i++) {
|
|
59
|
-
const key = dts[i].text().trim();
|
|
60
|
-
const val = dds[i]?.text().trim() ?? "";
|
|
61
|
-
if (key) bookDataMap.set(key, val);
|
|
62
|
-
}
|
|
63
|
-
|
|
64
|
-
const authors = parseAuthors(bookDataMap.get("著者") ?? "");
|
|
65
|
-
const isbn = bookDataMap.get("ISBN")?.replace(/\s/g, "") || undefined;
|
|
66
|
-
const publishedAt = parseImpressDate(bookDataMap.get("発売日") ?? "");
|
|
67
|
-
|
|
68
|
-
// カバー画像(img.ips.co.jp のプロトコル相対URLに https: を補完)
|
|
69
|
-
const coverSrc = doc.selectOne(".block-book-detail-img img")?.attr("src");
|
|
70
|
-
const coverImageUrl = coverSrc
|
|
71
|
-
? (coverSrc.startsWith("//") ? `https:${coverSrc}` : coverSrc)
|
|
72
|
-
: undefined;
|
|
73
|
-
|
|
74
|
-
// 電子版価格・DRM
|
|
75
|
-
const ebookGuide = doc.selectOne(".module-e-book-buy-guide-txt");
|
|
76
|
-
const ebookBuyBtn = doc.selectOne(".module-e-book-buy-guide-btn a");
|
|
77
|
-
|
|
78
|
-
let price: number | undefined;
|
|
79
|
-
let drm: DrmType = "social";
|
|
80
|
-
|
|
81
|
-
if (ebookGuide) {
|
|
82
|
-
const priceText = ebookGuide.find(".module-e-book-price")[0]?.text();
|
|
83
|
-
if (priceText) price = parseJapanesePrice(priceText);
|
|
84
|
-
drm = parseDrmType(ebookGuide.text());
|
|
85
|
-
}
|
|
86
|
-
|
|
87
|
-
const ebookStores = ebookBuyBtn
|
|
88
|
-
? [{ name: "インプレスブックス", url, drm }]
|
|
89
|
-
: [];
|
|
90
|
-
|
|
91
|
-
return {
|
|
92
|
-
title,
|
|
93
|
-
authors,
|
|
94
|
-
publisher: "インプレスブックス",
|
|
95
|
-
url,
|
|
96
|
-
isbn,
|
|
97
|
-
price,
|
|
98
|
-
publishedAt,
|
|
99
|
-
coverImageUrl,
|
|
100
|
-
ebookStores,
|
|
101
|
-
};
|
|
102
|
-
},
|
|
103
|
-
};
|
|
@@ -1,146 +0,0 @@
|
|
|
1
|
-
import type { PublisherAdapter, PublisherDeps } from "../../domain/publisher.js";
|
|
2
|
-
import type { BookRecord, SearchQuery } from "../../domain/book.js";
|
|
3
|
-
import { fetchText, parseJapanesePrice, resolveUrl, extractAsin, extractEbookStoresFromDoc } from "./base.js";
|
|
4
|
-
import type { EbookStore } from "../../domain/book.js";
|
|
5
|
-
|
|
6
|
-
const BASE_URL = "https://www.lambdanote.com";
|
|
7
|
-
|
|
8
|
-
function extractIsbn(text: string): string | undefined {
|
|
9
|
-
const match = text.match(/97[89]-[\d-]{10,}/);
|
|
10
|
-
return match ? match[0].replace(/-/g, "") : undefined;
|
|
11
|
-
}
|
|
12
|
-
|
|
13
|
-
/**
|
|
14
|
-
* Shopify ページに埋め込まれた product JSON を取得する。
|
|
15
|
-
* <script type="application/json" id="ProductJson-..."> または
|
|
16
|
-
* data-product-json 属性を探す。
|
|
17
|
-
*/
|
|
18
|
-
function parseShopifyProductJson(html: string): Record<string, unknown> | null {
|
|
19
|
-
const match = html.match(
|
|
20
|
-
/<script[^>]+type=["']application\/json["'][^>]*id=["']ProductJson[^"']*["'][^>]*>([\s\S]*?)<\/script>/i,
|
|
21
|
-
);
|
|
22
|
-
if (match?.[1]) {
|
|
23
|
-
try {
|
|
24
|
-
return JSON.parse(match[1]) as Record<string, unknown>;
|
|
25
|
-
} catch {
|
|
26
|
-
// fall through
|
|
27
|
-
}
|
|
28
|
-
}
|
|
29
|
-
return null;
|
|
30
|
-
}
|
|
31
|
-
|
|
32
|
-
export const lambdanoteAdapter: PublisherAdapter = {
|
|
33
|
-
id: "lambdanote",
|
|
34
|
-
name: "ラムダノート",
|
|
35
|
-
baseUrl: BASE_URL,
|
|
36
|
-
|
|
37
|
-
async search(query: SearchQuery, deps: PublisherDeps): Promise<BookRecord[]> {
|
|
38
|
-
const word = [query.title, query.author].filter(Boolean).join(" ");
|
|
39
|
-
if (!word) return [];
|
|
40
|
-
|
|
41
|
-
const url = `${BASE_URL}/search?q=${encodeURIComponent(word)}&type=product`;
|
|
42
|
-
const html = await fetchText(url, deps);
|
|
43
|
-
const doc = deps.parser.parse(html);
|
|
44
|
-
|
|
45
|
-
const results: BookRecord[] = [];
|
|
46
|
-
|
|
47
|
-
// Shopify Dawn テーマ系の検索結果セレクター
|
|
48
|
-
const items = doc.select(
|
|
49
|
-
".search-results__list-item, li.search-result-product",
|
|
50
|
-
);
|
|
51
|
-
|
|
52
|
-
for (const item of items) {
|
|
53
|
-
const titleEl =
|
|
54
|
-
item.find(".card__heading a")[0] ??
|
|
55
|
-
item.find("h2 a")[0] ??
|
|
56
|
-
item.find("h3 a")[0] ??
|
|
57
|
-
item.find("a.full-unstyled-link")[0];
|
|
58
|
-
|
|
59
|
-
if (!titleEl) continue;
|
|
60
|
-
|
|
61
|
-
const title = titleEl.text();
|
|
62
|
-
const href = titleEl.attr("href");
|
|
63
|
-
if (!title || !href) continue;
|
|
64
|
-
|
|
65
|
-
const bookUrl = resolveUrl(BASE_URL, href);
|
|
66
|
-
|
|
67
|
-
const priceEl =
|
|
68
|
-
item.find(".price__regular .price-item")[0] ??
|
|
69
|
-
item.find(".price-item")[0] ??
|
|
70
|
-
item.find(".price")[0];
|
|
71
|
-
const price = priceEl ? parseJapanesePrice(priceEl.text()) : undefined;
|
|
72
|
-
|
|
73
|
-
const imgEl = item.find("img")[0];
|
|
74
|
-
const imgSrc = imgEl?.attr("src") ?? imgEl?.attr("data-src");
|
|
75
|
-
const coverImageUrl = imgSrc ? resolveUrl(BASE_URL, imgSrc) : undefined;
|
|
76
|
-
|
|
77
|
-
results.push({
|
|
78
|
-
title,
|
|
79
|
-
authors: [],
|
|
80
|
-
publisher: "ラムダノート",
|
|
81
|
-
url: bookUrl,
|
|
82
|
-
price,
|
|
83
|
-
coverImageUrl,
|
|
84
|
-
});
|
|
85
|
-
}
|
|
86
|
-
|
|
87
|
-
return results.slice(0, query.limit ?? 10);
|
|
88
|
-
},
|
|
89
|
-
|
|
90
|
-
async getDetail(url: string, deps: PublisherDeps): Promise<BookRecord> {
|
|
91
|
-
const html = await fetchText(url, deps);
|
|
92
|
-
const doc = deps.parser.parse(html);
|
|
93
|
-
|
|
94
|
-
const title =
|
|
95
|
-
doc.selectOne("h1.product__title")?.text() ??
|
|
96
|
-
doc.selectOne("h1")?.text() ??
|
|
97
|
-
"";
|
|
98
|
-
|
|
99
|
-
const priceEl =
|
|
100
|
-
doc.selectOne(".price__regular .price-item") ??
|
|
101
|
-
doc.selectOne(".price-item--regular") ??
|
|
102
|
-
doc.selectOne("[class*='price']");
|
|
103
|
-
const price = priceEl ? parseJapanesePrice(priceEl.text()) : undefined;
|
|
104
|
-
|
|
105
|
-
const descEl =
|
|
106
|
-
doc.selectOne(".product__description") ??
|
|
107
|
-
doc.selectOne("[class*='description']");
|
|
108
|
-
const description = descEl?.text() || undefined;
|
|
109
|
-
|
|
110
|
-
const isbn = extractIsbn(html);
|
|
111
|
-
const asin = extractAsin(html);
|
|
112
|
-
|
|
113
|
-
// vendor フィールドに著者が入っている場合がある
|
|
114
|
-
const productJson = parseShopifyProductJson(html);
|
|
115
|
-
const vendor = typeof productJson?.["vendor"] === "string" ? productJson["vendor"] : null;
|
|
116
|
-
const authors: string[] = vendor
|
|
117
|
-
? vendor.split(/[,、//]/).map((a: string) => a.trim()).filter(Boolean)
|
|
118
|
-
: [];
|
|
119
|
-
|
|
120
|
-
const imgEl =
|
|
121
|
-
doc.selectOne(".product__media img") ??
|
|
122
|
-
doc.selectOne(".product-featured-image") ??
|
|
123
|
-
doc.selectOne("[class*='product'] img");
|
|
124
|
-
const imgSrc = imgEl?.attr("src") ?? imgEl?.attr("data-src");
|
|
125
|
-
const coverImageUrl = imgSrc ? resolveUrl(BASE_URL, imgSrc) : undefined;
|
|
126
|
-
|
|
127
|
-
// ラムダノートは購入時生成の一意IDをPDF欄外に印字 (ソーシャルDRM)
|
|
128
|
-
const ebookStores: EbookStore[] = [
|
|
129
|
-
{ name: "ラムダノート", url, drm: "social" },
|
|
130
|
-
...extractEbookStoresFromDoc(doc).filter(s => s.name !== "ラムダノート"),
|
|
131
|
-
];
|
|
132
|
-
|
|
133
|
-
return {
|
|
134
|
-
title,
|
|
135
|
-
authors,
|
|
136
|
-
publisher: "ラムダノート",
|
|
137
|
-
url,
|
|
138
|
-
price,
|
|
139
|
-
description,
|
|
140
|
-
isbn,
|
|
141
|
-
asin,
|
|
142
|
-
coverImageUrl,
|
|
143
|
-
ebookStores,
|
|
144
|
-
};
|
|
145
|
-
},
|
|
146
|
-
};
|
|
@@ -1,113 +0,0 @@
|
|
|
1
|
-
import type { PublisherAdapter, PublisherDeps } from "../../domain/publisher.js";
|
|
2
|
-
import type { BookRecord, SearchQuery } from "../../domain/book.js";
|
|
3
|
-
import type { HtmlDocument } from "../../ports/html-parser.js";
|
|
4
|
-
import { fetchText, parseJapanesePrice, resolveUrl } from "./base.js";
|
|
5
|
-
|
|
6
|
-
const BASE_URL = "https://book.mynavi.jp/manatee";
|
|
7
|
-
const BOOKS_URL = `${BASE_URL}/books/`;
|
|
8
|
-
|
|
9
|
-
/**
|
|
10
|
-
* `.attribute li` 内の著者リンクを配列にする。
|
|
11
|
-
* 各 <a> のテキストが著者名(役割は括弧内テキストで付記されているが名前は <a> 内)。
|
|
12
|
-
*/
|
|
13
|
-
function parseAuthors(doc: HtmlDocument): string[] {
|
|
14
|
-
return doc
|
|
15
|
-
.select(".attribute li a")
|
|
16
|
-
.map(el => el.text().trim())
|
|
17
|
-
.filter(Boolean);
|
|
18
|
-
}
|
|
19
|
-
|
|
20
|
-
export const manateeAdapter: PublisherAdapter = {
|
|
21
|
-
id: "manatee",
|
|
22
|
-
name: "マナティ",
|
|
23
|
-
baseUrl: BASE_URL,
|
|
24
|
-
|
|
25
|
-
async search(query: SearchQuery, deps: PublisherDeps): Promise<BookRecord[]> {
|
|
26
|
-
const word = [query.title, query.author].filter(Boolean).join(" ");
|
|
27
|
-
if (!word) return [];
|
|
28
|
-
|
|
29
|
-
const url = `${BOOKS_URL}?topics_keyword=${encodeURIComponent(word)}`;
|
|
30
|
-
const html = await fetchText(url, deps);
|
|
31
|
-
const doc = deps.parser.parse(html);
|
|
32
|
-
|
|
33
|
-
const results: BookRecord[] = [];
|
|
34
|
-
const limit = query.limit ?? 10;
|
|
35
|
-
|
|
36
|
-
// 書籍アイテムは <!-- item --> コメントで区切られた <li> 内
|
|
37
|
-
for (const li of doc.select("ul.category_list li")) {
|
|
38
|
-
const titleEl = li.find("dl.detail dt a")[0];
|
|
39
|
-
if (!titleEl) continue;
|
|
40
|
-
|
|
41
|
-
const title = titleEl.text().trim();
|
|
42
|
-
if (!title) continue;
|
|
43
|
-
|
|
44
|
-
const href = titleEl.attr("href");
|
|
45
|
-
if (!href) continue;
|
|
46
|
-
const bookUrl = href.startsWith("http") ? href : resolveUrl(BASE_URL, href);
|
|
47
|
-
|
|
48
|
-
const priceText = li.find(".detail__price")[0]?.text().trim();
|
|
49
|
-
const price = priceText ? parseJapanesePrice(priceText) : undefined;
|
|
50
|
-
|
|
51
|
-
const imgEl = li.find(".image img")[0];
|
|
52
|
-
const imgSrc = imgEl?.attr("src");
|
|
53
|
-
const coverImageUrl = imgSrc ? resolveUrl(BASE_URL, imgSrc) : undefined;
|
|
54
|
-
|
|
55
|
-
results.push({
|
|
56
|
-
title,
|
|
57
|
-
authors: [],
|
|
58
|
-
publisher: "マナティ",
|
|
59
|
-
url: bookUrl,
|
|
60
|
-
price,
|
|
61
|
-
coverImageUrl,
|
|
62
|
-
ebookStores: [{ name: "マナティ", url: bookUrl, drm: "social" }],
|
|
63
|
-
});
|
|
64
|
-
|
|
65
|
-
if (results.length >= limit) break;
|
|
66
|
-
}
|
|
67
|
-
|
|
68
|
-
return results;
|
|
69
|
-
},
|
|
70
|
-
|
|
71
|
-
async getDetail(url: string, deps: PublisherDeps): Promise<BookRecord> {
|
|
72
|
-
const html = await fetchText(url, deps);
|
|
73
|
-
const doc = deps.parser.parse(html);
|
|
74
|
-
|
|
75
|
-
const title = doc.selectOne("h1.title")?.text().trim() ?? "";
|
|
76
|
-
|
|
77
|
-
// `.intro` の最初の <p> が出版社名
|
|
78
|
-
const publisher = doc.selectOne(".intro p")?.text().trim() ?? "マナティ";
|
|
79
|
-
|
|
80
|
-
const authors = parseAuthors(doc);
|
|
81
|
-
|
|
82
|
-
// 購入形態テーブルの最初の行から価格取得
|
|
83
|
-
const priceText = doc.selectOne("#item_selectlist table .price")?.text().trim();
|
|
84
|
-
const price = priceText ? parseJapanesePrice(priceText) : undefined;
|
|
85
|
-
|
|
86
|
-
// 表紙画像の alt 属性が "ISBN.jpg" 形式(例: "9784839984274.jpg")
|
|
87
|
-
const imgEl = doc.selectOne("div.item_meta_image img");
|
|
88
|
-
const imgSrc = imgEl?.attr("src");
|
|
89
|
-
const coverImageUrl = imgSrc ? resolveUrl(BASE_URL, imgSrc) : undefined;
|
|
90
|
-
const imgAlt = imgEl?.attr("alt") ?? "";
|
|
91
|
-
const isbn = imgAlt.replace(/\.jpg$/i, "").replace(/-/g, "") || undefined;
|
|
92
|
-
|
|
93
|
-
// 発売日: "発売日:2024-03-22"
|
|
94
|
-
const dateText = doc.selectOne("p.date")?.text().trim();
|
|
95
|
-
const publishedAt = dateText?.match(/(\d{4}-\d{2}-\d{2})/)?.[1] ?? undefined;
|
|
96
|
-
|
|
97
|
-
const descEl = doc.selectOne(".item_desc p:not(.date):not(.pages)");
|
|
98
|
-
const description = descEl?.text().trim() || undefined;
|
|
99
|
-
|
|
100
|
-
return {
|
|
101
|
-
title,
|
|
102
|
-
authors,
|
|
103
|
-
publisher,
|
|
104
|
-
url,
|
|
105
|
-
isbn,
|
|
106
|
-
price,
|
|
107
|
-
publishedAt,
|
|
108
|
-
description,
|
|
109
|
-
coverImageUrl,
|
|
110
|
-
ebookStores: [{ name: "マナティ", url, drm: "social" }],
|
|
111
|
-
};
|
|
112
|
-
},
|
|
113
|
-
};
|
|
@@ -1,129 +0,0 @@
|
|
|
1
|
-
import type { PublisherAdapter, PublisherDeps } from "../../domain/publisher.js";
|
|
2
|
-
import type { BookRecord, SearchQuery } from "../../domain/book.js";
|
|
3
|
-
import { fetchText, resolveUrl, extractEbookStoresFromDoc, parseJapaneseDateToISO, stripAuthorRole } from "./base.js";
|
|
4
|
-
|
|
5
|
-
const BASE_URL = "https://www.maruzen-publishing.co.jp";
|
|
6
|
-
const SEARCH_URL = `${BASE_URL}/search/`;
|
|
7
|
-
|
|
8
|
-
/** 403回避のために自サイトをRefererとして付与する必要がある */
|
|
9
|
-
const EXTRA_HEADERS = { Referer: `${BASE_URL}/` };
|
|
10
|
-
|
|
11
|
-
/**
|
|
12
|
-
* "ボリス・チェルニー 著 折山文哉 訳" → ["ボリス・チェルニー", "折山文哉"]
|
|
13
|
-
* 役割語(著・訳・編・監訳・監修など)を除去する。
|
|
14
|
-
*/
|
|
15
|
-
function parseAuthorsFromText(text: string): string[] {
|
|
16
|
-
return text.split(/[ \s]+(?=\S)/).map(stripAuthorRole).filter(Boolean);
|
|
17
|
-
}
|
|
18
|
-
|
|
19
|
-
/**
|
|
20
|
-
* div.author 内の各リンクから役割語を除去して著者名のみ返す。
|
|
21
|
-
*/
|
|
22
|
-
function parseAuthorLinks(authors: string[]): string[] {
|
|
23
|
-
return authors.map(stripAuthorRole).filter(Boolean);
|
|
24
|
-
}
|
|
25
|
-
|
|
26
|
-
/**
|
|
27
|
-
* "2020/03/31" → "2020-03-31"
|
|
28
|
-
* "2020年3月31日" → "2020-03-31"
|
|
29
|
-
*/
|
|
30
|
-
function parseDate(text: string): string | undefined {
|
|
31
|
-
const m1 = text.match(/(\d{4})\/(\d{1,2})\/(\d{1,2})/);
|
|
32
|
-
if (m1) {
|
|
33
|
-
return `${m1[1]}-${m1[2].padStart(2, "0")}-${m1[3].padStart(2, "0")}`;
|
|
34
|
-
}
|
|
35
|
-
return parseJapaneseDateToISO(text);
|
|
36
|
-
}
|
|
37
|
-
|
|
38
|
-
export const maruzenPublishingAdapter: PublisherAdapter = {
|
|
39
|
-
id: "maruzen-publishing",
|
|
40
|
-
name: "丸善出版",
|
|
41
|
-
baseUrl: BASE_URL,
|
|
42
|
-
|
|
43
|
-
async search(query: SearchQuery, deps: PublisherDeps): Promise<BookRecord[]> {
|
|
44
|
-
const word = [query.title, query.author].filter(Boolean).join(" ");
|
|
45
|
-
if (!word) return [];
|
|
46
|
-
|
|
47
|
-
const url = `${SEARCH_URL}?search_keyword=${encodeURIComponent(word)}&format=1`;
|
|
48
|
-
const html = await fetchText(url, deps, EXTRA_HEADERS);
|
|
49
|
-
const doc = deps.parser.parse(html);
|
|
50
|
-
|
|
51
|
-
const results: BookRecord[] = [];
|
|
52
|
-
const limit = query.limit ?? 10;
|
|
53
|
-
|
|
54
|
-
for (const item of doc.select("div.booklist div.item")) {
|
|
55
|
-
const linkEl = item.find("div.ttl a")[0];
|
|
56
|
-
if (!linkEl) continue;
|
|
57
|
-
|
|
58
|
-
const title = linkEl.text().trim();
|
|
59
|
-
const href = linkEl.attr("href");
|
|
60
|
-
if (!title || !href) continue;
|
|
61
|
-
|
|
62
|
-
const bookUrl = href.startsWith("http") ? href : `${BASE_URL}${href}`;
|
|
63
|
-
|
|
64
|
-
const authorLinks = item.find("div.author a").map(el => el.text().trim());
|
|
65
|
-
const authors = parseAuthorLinks(authorLinks);
|
|
66
|
-
|
|
67
|
-
const imgEl = item.find("div.image img")[0];
|
|
68
|
-
const imgSrc = imgEl?.attr("src");
|
|
69
|
-
const coverImageUrl = imgSrc ? resolveUrl(BASE_URL, imgSrc) : undefined;
|
|
70
|
-
|
|
71
|
-
results.push({
|
|
72
|
-
title,
|
|
73
|
-
authors,
|
|
74
|
-
publisher: "丸善出版",
|
|
75
|
-
url: bookUrl,
|
|
76
|
-
coverImageUrl,
|
|
77
|
-
});
|
|
78
|
-
|
|
79
|
-
if (results.length >= limit) break;
|
|
80
|
-
}
|
|
81
|
-
|
|
82
|
-
return results;
|
|
83
|
-
},
|
|
84
|
-
|
|
85
|
-
async getDetail(url: string, deps: PublisherDeps): Promise<BookRecord> {
|
|
86
|
-
const html = await fetchText(url, deps, EXTRA_HEADERS);
|
|
87
|
-
const doc = deps.parser.parse(html);
|
|
88
|
-
|
|
89
|
-
// タイトルは <title> タグ、またはh1など(サイト構造に依存)
|
|
90
|
-
// div#bookData table の th/td からメタデータを取得
|
|
91
|
-
const table = doc.selectOne("div#bookData table");
|
|
92
|
-
let authors: string[] = [];
|
|
93
|
-
let publisher = "丸善出版";
|
|
94
|
-
let publishedAt: string | undefined;
|
|
95
|
-
|
|
96
|
-
if (table) {
|
|
97
|
-
for (const row of table.find("tr")) {
|
|
98
|
-
const th = row.find("th")[0]?.text().trim() ?? "";
|
|
99
|
-
const tdText = row.find("td")[0]?.text().trim() ?? "";
|
|
100
|
-
|
|
101
|
-
if (th === "著者") {
|
|
102
|
-
authors = parseAuthorsFromText(tdText);
|
|
103
|
-
} else if (th === "発行元") {
|
|
104
|
-
publisher = tdText || "丸善出版";
|
|
105
|
-
} else if (th === "出版年月日") {
|
|
106
|
-
publishedAt = parseDate(tdText);
|
|
107
|
-
}
|
|
108
|
-
}
|
|
109
|
-
}
|
|
110
|
-
|
|
111
|
-
// ページタイトルから書籍タイトルを取得(" | 丸善出版" を除去)
|
|
112
|
-
const pageTitle = doc.selectOne("title")?.text().trim() ?? "";
|
|
113
|
-
const title = pageTitle.replace(/\s*[||]\s*丸善出版.*$/, "").trim();
|
|
114
|
-
|
|
115
|
-
// 電子書籍ストア(kw.maruzen.co.jp は機関向けなので除外)
|
|
116
|
-
const ebookStores = extractEbookStoresFromDoc(doc).filter(
|
|
117
|
-
store => !store.url.includes("kw.maruzen.co.jp"),
|
|
118
|
-
);
|
|
119
|
-
|
|
120
|
-
return {
|
|
121
|
-
title,
|
|
122
|
-
authors,
|
|
123
|
-
publisher,
|
|
124
|
-
url,
|
|
125
|
-
publishedAt,
|
|
126
|
-
ebookStores: ebookStores.length > 0 ? ebookStores : undefined,
|
|
127
|
-
};
|
|
128
|
-
},
|
|
129
|
-
};
|