Compare commits

...

2 commits

Author SHA1 Message Date
55cfb54d09
no-headless 2024-06-30 23:43:40 +09:00
f5d2728526
fix dlsite-maniax 2024-06-30 23:43:25 +09:00
6 changed files with 123 additions and 49 deletions

View file

@ -10,7 +10,7 @@ $ npx https://git.fogtype.com/nebel/gadl/archive/main.tar.gz --help
- Google Play ブックス (漫画) - Google Play ブックス (漫画)
- DMM ブックス (漫画) - DMM ブックス (漫画)
- DLsite 同人 - DLsite 同人/がるまに/成年コミック
- FANZA 同人 - FANZA 同人
## License ## License

View file

@ -1,8 +1,10 @@
import * as Playwright from "playwright"; import type * as Playwright from "playwright";
import { chromium, devices } from "playwright"; import { chromium, devices } from "playwright";
import type { Database } from "./database"; import type { Database } from "./database";
import type { TPlatform } from "./platform"; import type { TPlatform } from "./platform";
/** Either a Playwright page or a Playwright frame; the target type accepted by `Browser.drawImage`. */
export type PageOrFrame = Playwright.Page | Playwright.Frame;
export type ImageFile = { export type ImageFile = {
url: string; url: string;
blocks?: Array<Record<string, number>>; blocks?: Array<Record<string, number>>;
@ -10,6 +12,16 @@ export type ImageFile = {
height?: number; height?: number;
}; };
/**
 * Browser facade; `createBrowser` resolves to a value of this shape.
 *
 * NOTE(review): the member implementations are outside this view, so the
 * per-member notes below are read off the signatures only — confirm against
 * the implementation before relying on them.
 */
export type Browser = {
/** Resolves a Playwright browser context for the given platform (presumably restoring previously saved state — TODO confirm). */
loadBrowserContext(platform: TPlatform): Promise<Playwright.BrowserContext>;
/** Takes a platform and a browser context and resolves with no value (presumably persists the context's state — TODO confirm). */
saveBrowserContext(platform: TPlatform, ctx: BrowserContext): Promise<void>;
/** Resolves a Playwright browser context; takes no platform argument. */
newContext(): Promise<Playwright.BrowserContext>;
/** Closes the browser. */
close(): Promise<void>;
/** Resolves a `Blob` for `imageFile`, using the given page or frame. */
drawImage(pageOrFrame: PageOrFrame, imageFile: ImageFile): Promise<Blob>;
};
/** Alias of Playwright's `BrowserContext`, re-exported under this module's own name. */
export type BrowserContext = Playwright.BrowserContext;
async function drawImage(imageFile: ImageFile): Promise<string> { async function drawImage(imageFile: ImageFile): Promise<string> {
const canvas = Object.assign(document.createElement("canvas"), { const canvas = Object.assign(document.createElement("canvas"), {
width: imageFile.width, width: imageFile.width,
@ -71,25 +83,12 @@ async function dataUrlToBlob(dataUrl: string): Promise<Blob> {
return await res.blob(); return await res.blob();
} }
export type Browser = {
loadBrowserContext(platform: TPlatform): Promise<Playwright.BrowserContext>;
saveBrowserContext(platform: TPlatform, ctx: BrowserContext): Promise<void>;
newContext(): Promise<Playwright.BrowserContext>;
close(): Promise<void>;
drawImage(
pageOrFrame: Playwright.Page | Playwright.Frame,
imageFile: ImageFile,
): Promise<Blob>;
};
export type BrowserContext = Playwright.BrowserContext;
export async function createBrowser({ export async function createBrowser({
db, db,
headless = true, headless,
}: { }: {
db: Database; db: Database;
headless?: boolean; headless: boolean;
}): Promise<Browser> { }): Promise<Browser> {
const { userAgent } = devices["Desktop Chrome"]; const { userAgent } = devices["Desktop Chrome"];
const browser = await chromium.launch({ const browser = await chromium.launch({
@ -127,7 +126,7 @@ export async function createBrowser({
close: () => browser.close(), close: () => browser.close(),
async drawImage( async drawImage(
pageOrFrame: Playwright.Page | Playwright.Frame, pageOrFrame: PageOrFrame,
imageFile: ImageFile, imageFile: ImageFile,
): Promise<Blob> { ): Promise<Blob> {
if (Array.isArray(imageFile.blocks) && imageFile.blocks.length > 0) { if (Array.isArray(imageFile.blocks) && imageFile.blocks.length > 0) {

27
main.ts
View file

@ -4,9 +4,9 @@ import path from "node:path";
import util from "node:util"; import util from "node:util";
import { createBrowser } from "./browser"; import { createBrowser } from "./browser";
import { createDatabase } from "./database"; import { createDatabase } from "./database";
import { type Book, createLibrary } from "./library"; import { createLibrary, type Book } from "./library";
import { type TPlatform, createPlatform, platforms } from "./platform";
import * as pkg from "./package.json"; import * as pkg from "./package.json";
import { createPlatform, platforms, type TPlatform } from "./platform";
const options = { const options = {
db: { db: {
@ -30,6 +30,10 @@ const options = {
return `<output_authors_limit> (default: ${this.default})`; return `<output_authors_limit> (default: ${this.default})`;
}, },
}, },
"no-headless": {
type: "boolean",
default: false,
},
login: { login: {
type: "string", type: "string",
toString() { toString() {
@ -53,8 +57,9 @@ const options = {
return [...Object.keys(platforms)].join("|"); return [...Object.keys(platforms)].join("|");
}, },
async run() { async run() {
const db = await createDatabase(args.values.db!); const db = await createDatabase(args.values.db!),
const browser = await createBrowser({ db }); headless = !args.values["no-headless"];
const browser = await createBrowser({ db, headless });
const platform = createPlatform({ const platform = createPlatform({
platform: args.values.logout as TPlatform, platform: args.values.logout as TPlatform,
db, db,
@ -128,9 +133,10 @@ const options = {
return [...Object.keys(platforms)].join("|"); return [...Object.keys(platforms)].join("|");
}, },
async run() { async run() {
const db = await createDatabase(args.values.db!); const db = await createDatabase(args.values.db!),
const library = createLibrary(db); library = createLibrary(db),
const browser = await createBrowser({ db }); headless = !args.values["no-headless"];
const browser = await createBrowser({ db, headless });
const platform = createPlatform({ const platform = createPlatform({
platform: args.values.pull as TPlatform, platform: args.values.pull as TPlatform,
db, db,
@ -150,8 +156,9 @@ const options = {
return `all|<reader_url_or_id>`; return `all|<reader_url_or_id>`;
}, },
async run() { async run() {
const db = await createDatabase(args.values.db!); const db = await createDatabase(args.values.db!),
const library = createLibrary(db); library = createLibrary(db),
headless = !args.values["no-headless"];
const books: Array<Book> = []; const books: Array<Book> = [];
if (args.values.download === "all") { if (args.values.download === "all") {
@ -171,7 +178,7 @@ const options = {
} }
for (const book of books) { for (const book of books) {
const browser = await createBrowser({ db }); const browser = await createBrowser({ db, headless });
const platform = createPlatform({ const platform = createPlatform({
platform: book.platform, platform: book.platform,
db, db,

4
package-lock.json generated
View file

@ -1,12 +1,12 @@
{ {
"name": "@fogtype/gadl", "name": "@fogtype/gadl",
"version": "1.5.0", "version": "1.6.0",
"lockfileVersion": 3, "lockfileVersion": 3,
"requires": true, "requires": true,
"packages": { "packages": {
"": { "": {
"name": "@fogtype/gadl", "name": "@fogtype/gadl",
"version": "1.5.0", "version": "1.6.0",
"license": "AGPL-3.0", "license": "AGPL-3.0",
"dependencies": { "dependencies": {
"fflate": "^0.8.1", "fflate": "^0.8.1",

View file

@ -1,6 +1,6 @@
{ {
"name": "@fogtype/gadl", "name": "@fogtype/gadl",
"version": "1.5.0", "version": "1.6.0",
"license": "AGPL-3.0", "license": "AGPL-3.0",
"type": "module", "type": "module",
"bin": "bin/run.js", "bin": "bin/run.js",

View file

@ -1,5 +1,41 @@
import type {
Browser,
BrowserContext,
ImageFile,
PageOrFrame,
} from "../browser";
import type { Book } from "../library"; import type { Book } from "../library";
import type { Browser, BrowserContext, ImageFile } from "../browser";
// リーダーのページ要素
const workTreeItemsSelector = `[class^=_worktree_] li[class^=_item_]`;
/**
 * Wraps a DLsite Play reader page for a single work.
 *
 * The work id is taken from `readerUrl`, which must start with
 * `https://play.dlsite.com/#/work/<workId>`.
 *
 * @param page - Page or frame used to open and inspect the reader.
 * @param readerUrl - Reader URL of the work.
 * @returns An object with `load()` and `downloadUrl()`.
 * @throws Error when no work id can be extracted from `readerUrl`.
 */
function Reader(page: PageOrFrame, readerUrl: string) {
  const workIdPattern = /^https:[/][/]play[.]dlsite[.]com[/]#[/]work[/]([^/]+)/;
  const matched = workIdPattern.exec(readerUrl);
  const workId = matched?.[1];

  if (!workId) {
    throw new Error(`workId is not included: ${readerUrl}`);
  }

  // Work ids starting with "B" are treated as books, which need the PDF check.
  const isBook = workId.startsWith("B");
  const downloadPageUrl = `https://www.dlsite.com/home/download/=/product_id/${workId}.html`;

  return {
    /** Navigates the page to the reader URL. */
    load: async (): Promise<void> => {
      await page.goto(readerUrl);
    },

    /**
     * Resolves the download page URL of the work, or `null` when the work is
     * a book whose work-tree item text does not mention "PDF".
     */
    downloadUrl: async (): Promise<null | string> => {
      if (!isBook) {
        return downloadPageUrl;
      }

      // Check whether the work-tree item is a PDF file.
      const treeItem = await page.waitForSelector(workTreeItemsSelector);
      const label = await treeItem.textContent();

      return label?.match(/PDF/u) ? downloadPageUrl : null;
    },
  };
}
export function DlsiteManiax(browser: Browser) { export function DlsiteManiax(browser: Browser) {
async function* getAllBooks(ctx: BrowserContext): AsyncGenerator<Book> { async function* getAllBooks(ctx: BrowserContext): AsyncGenerator<Book> {
@ -37,6 +73,7 @@ export function DlsiteManiax(browser: Browser) {
ja_JP: string; ja_JP: string;
}; };
}; };
author_name: string | null;
}>; }>;
} = await res.json(); } = await res.json();
@ -46,7 +83,7 @@ export function DlsiteManiax(browser: Browser) {
platform: "dlsite-maniax", platform: "dlsite-maniax",
readerUrl: `https://play.dlsite.com/#/work/${work.workno}`, readerUrl: `https://play.dlsite.com/#/work/${work.workno}`,
title: work.name.ja_JP || "", title: work.name.ja_JP || "",
authors: [work.maker.name.ja_JP || ""], authors: [work.author_name || work.maker.name.ja_JP || ""],
}; };
process.stderr.write("."); process.stderr.write(".");
@ -69,30 +106,61 @@ export function DlsiteManiax(browser: Browser) {
async getFiles(book: Book): Promise<Array<() => Promise<Blob>>> { async getFiles(book: Book): Promise<Array<() => Promise<Blob>>> {
const ctx = await browser.loadBrowserContext("dlsite-maniax"); const ctx = await browser.loadBrowserContext("dlsite-maniax");
const page = await ctx.newPage(); const page = await ctx.newPage();
const reader = Reader(page, book.readerUrl);
await page.goto(book.readerUrl); await reader.load();
const downloadUrl = await reader.downloadUrl();
const [, workId] = if (downloadUrl) {
/^https:[/][/]play[.]dlsite[.]com[/]#[/]work[/]([^/]+)/.exec( const imageFile: ImageFile = { url: downloadUrl };
book.readerUrl,
) ?? [];
if (!workId) { return [
throw new Error(`workId is not included: ${book.readerUrl}`); async () => {
const blob = await browser.drawImage(page, imageFile);
process.stderr.write(".");
return blob;
},
];
} }
const url = `https://www.dlsite.com/home/download/=/product_id/${workId}.html`; // ページ数 … 画面に表示されている要素を辿る
const imageFile = { url }; await page.waitForSelector(workTreeItemsSelector);
const workTreeItems = await page.locator(workTreeItemsSelector).count();
await page.click(workTreeItemsSelector);
return [ // 見開き表示の無効化 … 初回: 右下見開きボタンをクリックして無効化
async () => { const spreadButton = page.getByRole("button", { name: "見開き" });
const blob = await browser.drawImage(page, imageFile); await spreadButton.click();
await Promise.all([
spreadButton.waitFor({ state: "detached" }),
page.mouse.click(0, 720 / 2),
]);
await page.keyboard.press("ArrowRight");
process.stderr.write("."); // ページ数だけ画面送りを繰り返し行い、canvasをそのままキャプチャしていく
const files: Array<() => Promise<Blob>> = [];
while (files.length < workTreeItems) {
await page.waitForTimeout(1000);
const n = Math.min(2, Math.max(0, workTreeItems - 1 - files.length));
const canvas = page.locator("canvas").nth(n);
await canvas.waitFor({ state: "visible" });
const [width, height] = await Promise.all(
["width", "height"].map((d) => canvas.getAttribute(d).then(Number)),
);
await page.setViewportSize({ width, height });
await page.waitForTimeout(500);
const buff = await canvas.screenshot();
files.push(async () => new Blob([buff], { type: "image/png" }));
return blob; process.stderr.write(".");
},
]; await page.keyboard.press("ArrowLeft");
}
// TODO: $ gadl --download=1498 # pdf のとき
return files;
}, },
loginEndpoints: ["https://www.dlsite.com/home/login"], loginEndpoints: ["https://www.dlsite.com/home/login"],
loginSuccessUrl: (url: URL) => url.origin === "https://www.dlsite.com", loginSuccessUrl: (url: URL) => url.origin === "https://www.dlsite.com",