Commit 3544fff: first commit (0 parents)

15 files changed: 8,910 additions, 0 deletions

.actor/Dockerfile

Lines changed: 57 additions & 0 deletions
# Specify the base Docker image. You can read more about
# the available images at https://crawlee.dev/docs/guides/docker-images
# You can also use any other image from Docker Hub.
FROM apify/actor-node:20 AS builder

# Check preinstalled packages
RUN npm ls crawlee apify puppeteer playwright

# Copy just package.json and package-lock.json
# to speed up the build using Docker layer cache.
COPY package*.json ./

# Install all dependencies. Don't audit to speed up the installation.
RUN npm install --include=dev --audit=false

# Next, copy the source files using the user set
# in the base image.
COPY . ./

# Build the project.
RUN npm run build

# Create final image
FROM apify/actor-node:20

# Check preinstalled packages
RUN npm ls crawlee apify puppeteer playwright

# Copy just package.json and package-lock.json
# to speed up the build using Docker layer cache.
COPY package*.json ./

# Install NPM packages, skip optional and development dependencies to
# keep the image small. Avoid logging too much and print the dependency
# tree for debugging.
RUN npm --quiet set progress=false \
    && npm install --omit=dev --omit=optional \
    && echo "Installed NPM packages:" \
    && (npm list --omit=dev --all || true) \
    && echo "Node.js version:" \
    && node --version \
    && echo "NPM version:" \
    && npm --version \
    && rm -r ~/.npm

# Copy built JS files from builder image
COPY --from=builder /usr/src/app/dist ./dist

# Next, copy the remaining files and directories with the source code.
# Since we do this after NPM install, quick build will be really fast
# for most source file changes.
COPY . ./

# Run the image.
CMD npm run start:prod --silent
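
To try the image locally, the repository root is the build context, so a build along these lines should work (the image tag is an arbitrary placeholder):

```
docker build -f .actor/Dockerfile -t dynamic-web-scraper .
```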

.actor/actor.json

Lines changed: 9 additions & 0 deletions
{
    "actorSpecification": 1,
    "name": "store-dynamic-web-scraper",
    "title": "Dynamic Web Scraper",
    "description": "Dynamically crawls websites based on their content",
    "version": "0.0",
    "input": "./input_schema.json",
    "dockerfile": "./Dockerfile"
}

.actor/input_schema.json

Lines changed: 32 additions & 0 deletions
{
    "title": "Dynamic Web Scraper",
    "type": "object",
    "schemaVersion": 1,
    "properties": {
        "startSources": {
            "title": "Start Sources",
            "type": "array",
            "description": "Sources to start with; these can be URLs or Google queries.",
            "editor": "stringList",
            "prefill": ["Lucerna Bar Cafe, Prague"],
            "minItems": 1
        },
        "prompt": {
            "title": "Prompt",
            "type": "string",
            "editor": "textarea",
            "description": "Prompt to evaluate against the page content.",
            "prefill": "Look for the food menu items and if you find it look for a chicken option"
        },
        "maxDepth": {
            "title": "Max Depth",
            "type": "integer",
            "description": "Maximum depth to scrape.",
            "default": 3
        }
    },
    "required": [
        "startSources",
        "prompt"
    ]
}
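
For reference, an input that matches this schema (using the prefill values above) could look like:

```
{
    "startSources": ["Lucerna Bar Cafe, Prague"],
    "prompt": "Look for the food menu items and if you find it look for a chicken option",
    "maxDepth": 3
}
```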

.dockerignore

Lines changed: 14 additions & 0 deletions
# configurations
.idea
.vscode

# crawlee and apify storage folders
apify_storage
crawlee_storage
storage

# installed files
node_modules

# git folder
.git

.editorconfig

Lines changed: 9 additions & 0 deletions
root = true

[*]
indent_style = space
indent_size = 4
charset = utf-8
trim_trailing_whitespace = true
insert_final_newline = true
end_of_line = lf

.eslintrc

Lines changed: 20 additions & 0 deletions
{
    "root": true,
    "env": {
        "browser": true,
        "es2020": true,
        "node": true
    },
    "extends": [
        "@apify/eslint-config-ts"
    ],
    "parserOptions": {
        "project": "./tsconfig.json",
        "ecmaVersion": 2020
    },
    "ignorePatterns": [
        "node_modules",
        "dist",
        "**/*.d.ts"
    ]
}

.gitignore

Lines changed: 12 additions & 0 deletions
# This file tells Git which files shouldn't be added to source control

.DS_Store
.idea
.vscode
dist
node_modules
apify_storage
storage

# Added by Apify CLI
.venv

README.md

Lines changed: 35 additions & 0 deletions
## What does Dynamic Web Scraper do?
Dynamic Web Scraper is an Apify Actor that gathers information online by simulating user browsing behavior on the web. It reduces both the scraping time and the number of pages scraped by using a model (ChatGPT) to make decisions about browser navigation and result evaluation.

Dynamic Web Scraper takes as input a prompt and a list of initial URLs or Google queries. The model then decides which URLs should be visited in order to provide the best answer to the prompt.

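Conceptually, the navigation loop looks something like the sketch below. This is only an illustration, not the Actor's actual source; `fetchPage` and `askModel` are hypothetical stand-ins for the crawler and the ChatGPT call.

```
// Illustration only: fetchPage and askModel are hypothetical stand-ins
// for the real crawler and the ChatGPT call.
type ModelDecision = { answer?: string; followUrls: string[] };

declare function fetchPage(url: string): Promise<{ text: string; links: string[] }>;
declare function askModel(prompt: string, page: { text: string; links: string[] }): Promise<ModelDecision>;

async function crawl(prompt: string, startUrls: string[], maxDepth: number) {
    const queue = startUrls.map((url) => ({ url, depth: 0 }));
    const visited = new Set<string>();

    while (queue.length > 0) {
        const { url, depth } = queue.shift()!;
        if (visited.has(url) || depth > maxDepth) continue;
        visited.add(url);

        const page = await fetchPage(url);
        // The model either answers the prompt from this page, or picks
        // which of the page's links are worth visiting next.
        const decision = await askModel(prompt, page);
        if (decision.answer) return { url, depth, response: decision.answer };
        queue.push(...decision.followUrls.map((next) => ({ url: next, depth: depth + 1 })));
    }
    return null; // no page answered the prompt within maxDepth
}
```
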
## Why scrape websites dynamically?
Dynamic web scraping allows for more efficient data extraction by automating the browsing process. It can help gather specific information from websites that may not be easily accessible through traditional scraping methods.

## How to use Dynamic Web Scraper
To use Dynamic Web Scraper, follow these steps:
1. Click on Try for free.
2. Enter the prompt and a list of initial URLs or Google queries.
3. Click on Run.
4. Once the actor has finished, preview or download your data from the Dataset tab.
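
If you prefer to run the Actor programmatically, here is a sketch using the `apify-client` npm package (the Actor ID and token are placeholders; the input values are the prefills from the input schema):

```
import { ApifyClient } from 'apify-client';

// Placeholders: supply your own API token and the Actor's real ID.
const client = new ApifyClient({ token: '<YOUR_APIFY_TOKEN>' });

const run = await client.actor('<ACTOR_ID>').call({
    startSources: ['Lucerna Bar Cafe, Prague'],
    prompt: 'Look for the food menu items and if you find it look for a chicken option',
    maxDepth: 3,
});

// Fetch the results from the run's default dataset.
const { items } = await client.dataset(run.defaultDatasetId).listItems();
console.dir(items);
```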

## How much will it cost to use Dynamic Web Scraper?
Apify provides $5 of free usage credits every month on the Apify Free plan. For more extensive data extraction needs, consider upgrading to a paid Apify subscription.

## Results
An example of the JSON results produced by the actor:
```
{
    "url": "https://www.example.com",
    "inputSource": "Example input",
    "depth": 3,
    "response": <Response based on input>
}
```
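
In TypeScript terms, each dataset record might be typed roughly as below. This is a sketch inferred from the example above; in particular, `response` is assumed to be a string here, but it is whatever the model returns for your prompt.

```
// Sketch of a dataset record's shape, inferred from the example above.
interface ScraperResult {
    url: string;         // page the answer was found on
    inputSource: string; // the start source (URL or Google query) it came from
    depth: number;       // number of navigation steps from the start source
    response: string;    // assumed string: the model's answer to the prompt
}
```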

## Tips for using Dynamic Web Scraper
- Ensure that your prompt is clear and specific to get accurate results.
- Monitor the actor's progress to ensure it is navigating the web effectively.

## Is it legal to use Dynamic Web Scraper?
It is important to be aware of legal considerations when scraping websites, especially regarding data privacy regulations such as GDPR. Ensure that you have a legitimate reason for scraping and consult legal advice if needed.
For more information on the legality of web scraping, read our blog post: [Is Web Scraping Legal?](https://blog.apify.com/is-web-scraping-legal/)
