
Commit f56e69c

update example for each platform

1 parent 41ba5a2 commit f56e69c

File tree

12 files changed: +594 -19 lines changed

examples/README.md

Lines changed: 6 additions & 19 deletions
@@ -1,22 +1,9 @@
 # Scrapfly Typescript SDK Examples
 
-This directory contains commonly used examples for the Scrapfly Typescript SDK which is available in Typescript runtimes (bun, deno) as well as javascript ones like Nodejs.
+In this directory, examples are grouped by JavaScript runtime platform, as Scrapfly's Typescript SDK supports several:
 
-You can use `node` to run the `.js` examples:
-
-```
-node examples/basic-get.js
-```
-
-Or compile `.ts` examples to `.js`:
-
-```
-tsc examples/scrape/basic-get.ts -o examples/basic-get.js
-node examples/scrape/basic-get.js
-```
-
-Or run `.ts` typescript examples directly through runtimes:
-
-```
-bun examples/scrape/basic-get.ts
-```
+- [node_commonjs](./node_commonjs) - Examples for NodeJS with the CommonJS module system.
+- [node_esm](./node_esm) - Examples for NodeJS with the ECMAScript Modules (ESM) module system.
+- [bun](./bun) - Examples for the Bun Typescript runtime.
+- [deno](./deno) - Examples for the Deno Typescript runtime.
+- [serverless: cloudflare workers, aws lambda, supabase](./cloudflareworker_awslambda_supabase) - Examples for serverless platforms like Cloudflare Workers, AWS Lambda and Supabase.

examples/bun/README.md

Lines changed: 17 additions & 0 deletions
# Scrapfly SDK with Bun

Bun is a modern JavaScript runtime that can execute both JavaScript and Typescript without transpilation.

These examples demonstrate Typescript SDK usage with Bun. To start, install the SDK from jsr.io, which distributes the Typescript source files:

```bash
$ bunx jsr add @scrapfly/scrapfly-sdk
```

Then see `bun_examples.ts` for the examples; each one can be run by passing the example function name:

```bash
$ bun run bun_examples.ts <example_name> <scrapfly_api_key>
# for example
$ bun run bun_examples.ts basicGet scp-test-123
```
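
After installing from jsr, the SDK is imported by its jsr scope. A minimal sketch (assuming the default `@scrapfly/scrapfly-sdk` alias that `bunx jsr add` writes to package.json):

```typescript
// minimal sketch: assumes the package alias created by `bunx jsr add @scrapfly/scrapfly-sdk`
import { ScrapflyClient, ScrapeConfig } from '@scrapfly/scrapfly-sdk';

const client = new ScrapflyClient({ key: 'scp-test-123' }); // replace with your API key
const result = await client.scrape(new ScrapeConfig({ url: 'https://httpbin.dev/html' }));
console.log(result.result.content); // raw page HTML
```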

examples/bun/bun_examples.ts

Lines changed: 111 additions & 0 deletions
import { ScrapflyClient, ScrapeConfig, ScreenshotConfig, ExtractionConfig } from '@scrapfly/scrapfly-sdk';


/* To start, you can always get your account information using the .account() method
*/
export async function getAccount(apiKey: string) {
    const client = new ScrapflyClient({ key: apiKey });
    const account = await client.account();
    console.log('account');
    console.log(account);
}

/* For a basic scrape, the only required parameter is the URL
*/
export async function basicGet(apiKey: string) {
    const client = new ScrapflyClient({ key: apiKey });

    let scrape_result = await client.scrape(
        new ScrapeConfig({
            url: 'https://httpbin.dev/html',
            // Anti Scraping Protection bypass - enable this when scraping protected targets
            asp: true,
            // server side cache - great for repeated requests
            cache: true,
            cache_ttl: 3600, // in seconds
            // cache_clear: true, // you can always clear the cache explicitly!
        }),
    );

    // scrape_result.result contains all result details
    console.log('web log url:'); // you can check the web UI for request details:
    console.log(scrape_result.result.log_url);

    console.log('page content:');
    console.log(scrape_result.result.content);

    console.log('response headers:');
    console.log(scrape_result.result.response_headers);

    console.log('response cookies:');
    console.log(scrape_result.result.cookies);
}

/* Enabling js_render runs scrapfly cloud browsers, which enables
 * a bunch of other features like browser control, js execution, screenshots, etc.
*/
export async function JSRender(apiKey: string) {
    const client = new ScrapflyClient({ key: apiKey });

    let scrape_result = await client.scrape(
        new ScrapeConfig({
            url: 'https://web-scraping.dev/product/1',
            // enable browsers:
            render_js: true,
            // this enables more options
            // you can wait for some element to appear:
            wait_for_selector: '.review',
            // you can wait explicitly for N milliseconds
            rendering_wait: 3000, // 3 seconds
            // you can control the browser through scenarios:
            // https://scrapfly.io/docs/scrape-api/javascript-scenario
            js_scenario: [
                { click: { selector: '#load-more-reviews' } },
                { wait: 2000 },
            ],
            // or even run any custom JS code!
            js: 'return document.querySelector(".review").innerText',
        }),
    );

    // scrape_result.result contains all result details:
    console.log('web log url:'); // you can check the web UI for request details:
    console.log(scrape_result.result.log_url);

    console.log('page content:');
    console.log(scrape_result.result.content.substring(0, 1000) + '...');

    console.log('browser data capture:');
    console.log(scrape_result.result.browser_data);
}


// CLI entry point
async function main(): Promise<void> {
    if (process.argv.length < 4) {
        console.log(
            `Usage: bun run bun_examples.ts <functionName> <apiKey>\n` +
                `getAccount - Get account information\n` +
                `basicGet - Basic scrape\n` +
                `JSRender - Scrape with JS rendering\n`,
        );
        return;
    }
    const args = process.argv.slice(2);
    const functionName = args[0];
    const apiKey = args[1];

    // Dynamically import the current module
    const module = await import('./bun_examples.ts');

    if (module[functionName]) {
        await (module[functionName] as Function)(apiKey);
    } else {
        console.log(`Function ${functionName} not found.`);
    }
}

// Check if the script is being run directly
if (import.meta.url === `file://${process.argv[1]}`) {
    main();
}

Lines changed: 11 additions & 0 deletions
{
    "$schema": "https://raw.githubusercontent.com/skymethod/denoflare/v0.6.0/common/config.schema.json",
    "scripts": {
        "example": {
            "path": "index.ts",
            "localPort": 3030
        }
    },
    "profiles": {}
}

Lines changed: 32 additions & 0 deletions
# Scrapfly SDK with Cloudflare Workers or AWS Lambda or Supabase

There are many serverless platforms that can run JavaScript or Typescript code, which fits well with Scrapfly.io. This directory contains examples for Cloudflare Workers, AWS Lambda and Supabase.

The easiest way is to use [Denoflare](https://denoflare.dev/), which lets you easily develop, test and deploy Typescript workers to Cloudflare Workers, AWS Lambda or Supabase.

To start, install denoflare:

```bash
deno install --unstable-worker-options --allow-read --allow-net --allow-env --allow-run --name denoflare --force https://raw.githubusercontent.com/skymethod/denoflare/master/cli/cli.ts
```

Then see `index.ts` for your worker code and configure the `key` with your Scrapfly API key.

To test your worker locally, use the `serve` command:

```bash
denoflare serve example --bundle backend=esbuild
```
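
With the local server running, you can exercise the worker from another terminal (assuming the default `localPort` of 3030 from the Denoflare config above):

```bash
# the worker scrapes web-scraping.dev/product/1 and returns the extracted fields as JSON
curl http://localhost:3030/
```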

Finally, to push your worker, use one of the `push` commands:

```bash
# for cloudflare workers
denoflare push example --bundle backend=esbuild
# for aws lambda
denoflare push-lambda example --bundle backend=esbuild
# for supabase
denoflare push-supabase example --bundle backend=esbuild
```

For more, see https://denoflare.dev/
Lines changed: 33 additions & 0 deletions
import { ScrapflyClient, ScrapeConfig, ScreenshotConfig, ExtractionConfig } from 'jsr:@scrapfly/scrapfly-sdk';

const key = 'YOUR SCRAPFLY KEY';
const client = new ScrapflyClient({ key });

export default {
    async fetch(request: Request, env: any) {
        try {
            const result = await client.scrape(
                new ScrapeConfig({
                    url: 'https://web-scraping.dev/product/1',
                }),
            );
            const data = {
                "url": "https://web-scraping.dev/product/1",
                "price": result.selector(".product-price").text(),
                "title": result.selector(".product-title").text(),
                "description": result.selector(".product-description").text(),
            };
            return new Response(JSON.stringify(data), {
                headers: {
                    "content-type": "application/json",
                },
            });
        } catch (e) {
            return new Response(JSON.stringify({ "error": e.message }), {
                headers: {
                    "content-type": "application/json",
                },
            });
        }
    },
};

examples/deno/README.md

Lines changed: 19 additions & 0 deletions
# Scrapfly SDK with Deno

Deno is a modern and secure runtime for JavaScript and TypeScript that uses V8 and is built in Rust.

These examples demonstrate Typescript SDK usage with Deno. To start, install the SDK from jsr.io, which distributes the Typescript source files:

```bash
deno add jsr:@scrapfly/scrapfly-sdk
```

Then see `deno_examples.ts` for the examples; each one can be run by passing the example function name:

```bash
$ deno run -A deno_examples.ts <example_name> <scrapfly_api_key>
# for example
$ deno run -A deno_examples.ts basicGet scp-test-123
```

examples/deno/deno_examples.ts

Lines changed: 108 additions & 0 deletions
import { ScrapflyClient, ScrapeConfig, ScreenshotConfig, ExtractionConfig } from 'jsr:@scrapfly/scrapfly-sdk';


/* To start, you can always get your account information using the .account() method
*/
export async function getAccount(apiKey: string) {
    const client = new ScrapflyClient({ key: apiKey });
    const account = await client.account();
    console.log('account');
    console.log(account);
}

/* For a basic scrape, the only required parameter is the URL
*/
export async function basicGet(apiKey: string) {
    const client = new ScrapflyClient({ key: apiKey });

    let scrape_result = await client.scrape(
        new ScrapeConfig({
            url: 'https://httpbin.dev/html',
            // Anti Scraping Protection bypass - enable this when scraping protected targets
            asp: true,
            // server side cache - great for repeated requests
            cache: true,
            cache_ttl: 3600, // in seconds
            // cache_clear: true, // you can always clear the cache explicitly!
        }),
    );

    // scrape_result.result contains all result details
    console.log('web log url:'); // you can check the web UI for request details:
    console.log(scrape_result.result.log_url);

    console.log('page content:');
    console.log(scrape_result.result.content);

    console.log('response headers:');
    console.log(scrape_result.result.response_headers);

    console.log('response cookies:');
    console.log(scrape_result.result.cookies);
}

/* Enabling js_render runs scrapfly cloud browsers, which enables
 * a bunch of other features like browser control, js execution, screenshots, etc.
*/
export async function JSRender(apiKey: string) {
    const client = new ScrapflyClient({ key: apiKey });

    let scrape_result = await client.scrape(
        new ScrapeConfig({
            url: 'https://web-scraping.dev/product/1',
            // enable browsers:
            render_js: true,
            // this enables more options
            // you can wait for some element to appear:
            wait_for_selector: '.review',
            // you can wait explicitly for N milliseconds
            rendering_wait: 3000, // 3 seconds
            // you can control the browser through scenarios:
            // https://scrapfly.io/docs/scrape-api/javascript-scenario
            js_scenario: [
                { click: { selector: '#load-more-reviews' } },
                { wait: 2000 },
            ],
            // or even run any custom JS code!
            js: 'return document.querySelector(".review").innerText',
        }),
    );

    // scrape_result.result contains all result details:
    console.log('web log url:'); // you can check the web UI for request details:
    console.log(scrape_result.result.log_url);

    console.log('page content:');
    console.log(scrape_result.result.content.substring(0, 1000) + '...');

    console.log('browser data capture:');
    console.log(scrape_result.result.browser_data);
}

// CLI entry point
async function main(): Promise<void> {
    if (Deno.args.length < 2) {
        console.log(
            `Usage: deno run -A deno_examples.ts <functionName> <apiKey>\n` +
                `getAccount - Get account information\n` +
                `basicGet - Basic scrape\n` +
                `JSRender - Scrape with JS rendering\n`,
        );
        return;
    }
    const [functionName, apiKey] = Deno.args;

    // Dynamically import the current module
    const module = await import('./deno_examples.ts');

    if (module[functionName]) {
        await (module[functionName] as Function)(apiKey);
    } else {
        console.log(`Function ${functionName} not found.`);
    }
}

// Check if the script is being run directly
if (import.meta.main) {
    main();
}

examples/node_commonjs/README.md

Lines changed: 18 additions & 0 deletions
# Scrapfly SDK with CommonJS (NodeJS)

CommonJS is the NodeJS module system that lets you import modules using the `require` function.

The examples in `commonjs_examples.cjs` demonstrate how to use the Scrapfly SDK with CommonJS. To start, init a project and install the SDK using npm:

```bash
$ npm init -y
$ npm install scrapfly-sdk
```

Then see `commonjs_examples.cjs` for the examples; each one can be run by passing the example function name:

```bash
$ node commonjs_examples.cjs <example_name> <scrapfly_api_key>
# for example
$ node commonjs_examples.cjs basicGet scp-test-123
```
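
The CommonJS entry point mirrors the Typescript examples above. A minimal sketch of the pattern (illustrative only: the actual contents of `commonjs_examples.cjs` are not shown in this diff):

```javascript
// illustrative CommonJS sketch, assuming the same ScrapeConfig options as the Typescript examples
const { ScrapflyClient, ScrapeConfig } = require('scrapfly-sdk');

async function basicGet(apiKey) {
    const client = new ScrapflyClient({ key: apiKey });
    const scrape_result = await client.scrape(
        new ScrapeConfig({ url: 'https://httpbin.dev/html' }),
    );
    console.log(scrape_result.result.content);
}

// dispatch on the function name passed on the CLI:
// node commonjs_examples.cjs basicGet scp-test-123
const [functionName, apiKey] = process.argv.slice(2);
if (functionName === 'basicGet') {
    basicGet(apiKey);
}
```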
