@letsscrapedata/controller 0.0.21 → 0.0.23

This diff shows the changes between publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
package/dist/index.cjs CHANGED
@@ -16990,9 +16990,18 @@ var CheerioElement = class _CheerioElement {
16990
16990
  // src/cheerio/page.ts
16991
16991
  var CheerioPage = class extends import_node_events7.default {
16992
16992
  #document;
16993
- constructor(html3 = "") {
16993
+ /**
16994
+ *
16995
+ * @param html default ""
16996
+ * @param isHtml default true
16997
+ */
16998
+ constructor(html3 = "", isHtml2 = true) {
16994
16999
  super();
16995
- this.#document = load(html3).root();
17000
+ if (isHtml2) {
17001
+ this.#document = load(html3).root();
17002
+ } else {
17003
+ this.#document = load(html3, { xml: true }).root();
17004
+ }
16996
17005
  }
16997
17006
  async bringToFront() {
16998
17007
  throw new Error("Not supported in CheerioPage.");
@@ -17077,8 +17086,12 @@ var CheerioPage = class extends import_node_events7.default {
17077
17086
  isFree() {
17078
17087
  throw new Error("Not supported in CheerioPage.");
17079
17088
  }
17080
- load(html3) {
17081
- this.#document = load(html3).root();
17089
+ load(html3, isHtml2 = true) {
17090
+ if (isHtml2) {
17091
+ this.#document = load(html3).root();
17092
+ } else {
17093
+ this.#document = load(html3, { xml: true }).root();
17094
+ }
17082
17095
  return true;
17083
17096
  }
17084
17097
  async localStroage() {
@@ -17213,6 +17226,7 @@ var LsdBrowserController = class _LsdBrowserController {
17213
17226
  maxBrowserContextsPerBrowser = 10,
17214
17227
  maxPagesPerBrowserContext = 20,
17215
17228
  maxPageFreeSeconds = 900,
17229
+ maxViewportOfNewPage = false,
17216
17230
  proxy = null,
17217
17231
  timeout = 3e4,
17218
17232
  args = [],
@@ -17225,7 +17239,7 @@ var LsdBrowserController = class _LsdBrowserController {
17225
17239
  userAgent = ""
17226
17240
  } = options ? options : {};
17227
17241
  const incognito = typeof options?.incognito === "boolean" ? options.incognito : browserControllerType === "puppeteer" ? false : true;
17228
- const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, proxy, timeout, args, executablePath, headless, minBrowserContexts, incognito, proxyPerBrowserContext, userDataDir, userAgent };
17242
+ const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, maxViewportOfNewPage, proxy, timeout, args, executablePath, headless, minBrowserContexts, incognito, proxyPerBrowserContext, userDataDir, userAgent };
17229
17243
  let idx = args.findIndex((arg) => arg.toLowerCase().startsWith("--incoginto"));
17230
17244
  if (idx >= 0) {
17231
17245
  (0, import_utils15.logwarn)(`Please use options.incognito instead when launching new browser.`);
@@ -17308,6 +17322,7 @@ var LsdBrowserController = class _LsdBrowserController {
17308
17322
  maxBrowserContextsPerBrowser = 10,
17309
17323
  maxPagesPerBrowserContext = 20,
17310
17324
  maxPageFreeSeconds = 900,
17325
+ maxViewportOfNewPage = false,
17311
17326
  proxy = null,
17312
17327
  timeout = 3e4,
17313
17328
  browserUrl,
@@ -17319,7 +17334,7 @@ var LsdBrowserController = class _LsdBrowserController {
17319
17334
  if (typeof browserUrl !== "string" || !browserUrl.toLowerCase().startsWith("http://")) {
17320
17335
  throw new Error(`Invalid browserUrl ${browserUrl} in connect`);
17321
17336
  }
17322
- const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, proxy, timeout, browserUrl, executablePath, headless, incognito, userAgent };
17337
+ const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, maxViewportOfNewPage, proxy, timeout, browserUrl, executablePath, headless, incognito, userAgent };
17323
17338
  if (browserControllerType === "playwright") {
17324
17339
  const playwrightBrowserType = this.#playwrightBrowserType(browserType, true);
17325
17340
  const browser = await playwrightBrowserType.connectOverCDP(browserUrl);
package/dist/index.d.cts CHANGED
@@ -811,8 +811,10 @@ interface LsdPage extends EventEmitter {
811
811
  isFree(): boolean;
812
812
  /**
813
813
  * valid only in CheerioPage
814
+ * @param html
815
+ * @param isHtml default true
814
816
  */
815
- load(html: string): boolean;
817
+ load(html: string, isHtml?: boolean): boolean;
816
818
  localStroage(): Promise<LocalStorageOrigin[]>;
817
819
  mainFrame(): AllFrame;
818
820
  maximizeViewport(): Promise<boolean>;
@@ -1174,7 +1176,12 @@ declare class PuppeteerElement implements LsdElement {
1174
1176
 
1175
1177
  declare class CheerioPage extends EventEmitter implements LsdPage {
1176
1178
  #private;
1177
- constructor(html?: string);
1179
+ /**
1180
+ *
1181
+ * @param html default ""
1182
+ * @param isHtml default true
1183
+ */
1184
+ constructor(html?: string, isHtml?: boolean);
1178
1185
  bringToFront(): Promise<boolean>;
1179
1186
  browserContext(): LsdBrowserContext;
1180
1187
  clearCookies(): Promise<boolean>;
@@ -1191,7 +1198,7 @@ declare class CheerioPage extends EventEmitter implements LsdPage {
1191
1198
  goto(): Promise<boolean>;
1192
1199
  id(): string;
1193
1200
  isFree(): boolean;
1194
- load(html: string): boolean;
1201
+ load(html: string, isHtml?: boolean): boolean;
1195
1202
  localStroage(): Promise<LocalStorageOrigin[]>;
1196
1203
  mainFrame(): AllFrame;
1197
1204
  maximizeViewport(): Promise<boolean>;
package/dist/index.d.ts CHANGED
@@ -811,8 +811,10 @@ interface LsdPage extends EventEmitter {
811
811
  isFree(): boolean;
812
812
  /**
813
813
  * valid only in CheerioPage
814
+ * @param html
815
+ * @param isHtml default true
814
816
  */
815
- load(html: string): boolean;
817
+ load(html: string, isHtml?: boolean): boolean;
816
818
  localStroage(): Promise<LocalStorageOrigin[]>;
817
819
  mainFrame(): AllFrame;
818
820
  maximizeViewport(): Promise<boolean>;
@@ -1174,7 +1176,12 @@ declare class PuppeteerElement implements LsdElement {
1174
1176
 
1175
1177
  declare class CheerioPage extends EventEmitter implements LsdPage {
1176
1178
  #private;
1177
- constructor(html?: string);
1179
+ /**
1180
+ *
1181
+ * @param html default ""
1182
+ * @param isHtml default true
1183
+ */
1184
+ constructor(html?: string, isHtml?: boolean);
1178
1185
  bringToFront(): Promise<boolean>;
1179
1186
  browserContext(): LsdBrowserContext;
1180
1187
  clearCookies(): Promise<boolean>;
@@ -1191,7 +1198,7 @@ declare class CheerioPage extends EventEmitter implements LsdPage {
1191
1198
  goto(): Promise<boolean>;
1192
1199
  id(): string;
1193
1200
  isFree(): boolean;
1194
- load(html: string): boolean;
1201
+ load(html: string, isHtml?: boolean): boolean;
1195
1202
  localStroage(): Promise<LocalStorageOrigin[]>;
1196
1203
  mainFrame(): AllFrame;
1197
1204
  maximizeViewport(): Promise<boolean>;
package/dist/index.js CHANGED
@@ -16970,9 +16970,18 @@ var CheerioElement = class _CheerioElement {
16970
16970
  // src/cheerio/page.ts
16971
16971
  var CheerioPage = class extends EventEmitter7 {
16972
16972
  #document;
16973
- constructor(html3 = "") {
16973
+ /**
16974
+ *
16975
+ * @param html default ""
16976
+ * @param isHtml default true
16977
+ */
16978
+ constructor(html3 = "", isHtml2 = true) {
16974
16979
  super();
16975
- this.#document = load(html3).root();
16980
+ if (isHtml2) {
16981
+ this.#document = load(html3).root();
16982
+ } else {
16983
+ this.#document = load(html3, { xml: true }).root();
16984
+ }
16976
16985
  }
16977
16986
  async bringToFront() {
16978
16987
  throw new Error("Not supported in CheerioPage.");
@@ -17057,8 +17066,12 @@ var CheerioPage = class extends EventEmitter7 {
17057
17066
  isFree() {
17058
17067
  throw new Error("Not supported in CheerioPage.");
17059
17068
  }
17060
- load(html3) {
17061
- this.#document = load(html3).root();
17069
+ load(html3, isHtml2 = true) {
17070
+ if (isHtml2) {
17071
+ this.#document = load(html3).root();
17072
+ } else {
17073
+ this.#document = load(html3, { xml: true }).root();
17074
+ }
17062
17075
  return true;
17063
17076
  }
17064
17077
  async localStroage() {
@@ -17193,6 +17206,7 @@ var LsdBrowserController = class _LsdBrowserController {
17193
17206
  maxBrowserContextsPerBrowser = 10,
17194
17207
  maxPagesPerBrowserContext = 20,
17195
17208
  maxPageFreeSeconds = 900,
17209
+ maxViewportOfNewPage = false,
17196
17210
  proxy = null,
17197
17211
  timeout = 3e4,
17198
17212
  args = [],
@@ -17205,7 +17219,7 @@ var LsdBrowserController = class _LsdBrowserController {
17205
17219
  userAgent = ""
17206
17220
  } = options ? options : {};
17207
17221
  const incognito = typeof options?.incognito === "boolean" ? options.incognito : browserControllerType === "puppeteer" ? false : true;
17208
- const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, proxy, timeout, args, executablePath, headless, minBrowserContexts, incognito, proxyPerBrowserContext, userDataDir, userAgent };
17222
+ const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, maxViewportOfNewPage, proxy, timeout, args, executablePath, headless, minBrowserContexts, incognito, proxyPerBrowserContext, userDataDir, userAgent };
17209
17223
  let idx = args.findIndex((arg) => arg.toLowerCase().startsWith("--incoginto"));
17210
17224
  if (idx >= 0) {
17211
17225
  logwarn6(`Please use options.incognito instead when launching new browser.`);
@@ -17288,6 +17302,7 @@ var LsdBrowserController = class _LsdBrowserController {
17288
17302
  maxBrowserContextsPerBrowser = 10,
17289
17303
  maxPagesPerBrowserContext = 20,
17290
17304
  maxPageFreeSeconds = 900,
17305
+ maxViewportOfNewPage = false,
17291
17306
  proxy = null,
17292
17307
  timeout = 3e4,
17293
17308
  browserUrl,
@@ -17299,7 +17314,7 @@ var LsdBrowserController = class _LsdBrowserController {
17299
17314
  if (typeof browserUrl !== "string" || !browserUrl.toLowerCase().startsWith("http://")) {
17300
17315
  throw new Error(`Invalid browserUrl ${browserUrl} in connect`);
17301
17316
  }
17302
- const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, proxy, timeout, browserUrl, executablePath, headless, incognito, userAgent };
17317
+ const actOptions = { closeFreePagesIntervalSeconds, maxBrowserContextsPerBrowser, maxPagesPerBrowserContext, maxPageFreeSeconds, maxViewportOfNewPage, proxy, timeout, browserUrl, executablePath, headless, incognito, userAgent };
17303
17318
  if (browserControllerType === "playwright") {
17304
17319
  const playwrightBrowserType = this.#playwrightBrowserType(browserType, true);
17305
17320
  const browser = await playwrightBrowserType.connectOverCDP(browserUrl);
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@letsscrapedata/controller",
3
- "version": "0.0.21",
3
+ "version": "0.0.23",
4
4
  "description": "Unified browser / HTML controller interfaces that support playwright, puppeteer and cheerio",
5
5
  "type": "module",
6
6
  "main": "./dist/index.mjs",