573 lines
16 KiB
JSON
573 lines
16 KiB
JSON
{
|
||
"id": "UuuCIDvTNnloIlvq",
|
||
"meta": {
|
||
"instanceId": "885b4fb4a6a9c2cb5621429a7b972df0d05bb724c20ac7dac7171b62f1c7ef40",
|
||
"templateCredsSetupCompleted": true
|
||
},
|
||
"name": "Automate Etsy Data Mining with Bright Data Scrape & Google Gemini",
|
||
"tags": [
|
||
{
|
||
"id": "Kujft2FOjmOVQAmJ",
|
||
"name": "Engineering",
|
||
"createdAt": "2025-04-09T01:31:00.558Z",
|
||
"updatedAt": "2025-04-09T01:31:00.558Z"
|
||
},
|
||
{
|
||
"id": "ddPkw7Hg5dZhQu2w",
|
||
"name": "AI",
|
||
"createdAt": "2025-04-13T05:38:08.053Z",
|
||
"updatedAt": "2025-04-13T05:38:08.053Z"
|
||
}
|
||
],
|
||
"nodes": [
|
||
{
|
||
"id": "f369feaf-4782-4411-9d08-fe91b9ffd97e",
|
||
"name": "When clicking ‘Test workflow’",
|
||
"type": "n8n-nodes-base.manualTrigger",
|
||
"position": [
|
||
200,
|
||
-555
|
||
],
|
||
"parameters": {},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "231bae3c-c27e-49fc-b878-2d5cc1e14c5a",
|
||
"name": "Sticky Note",
|
||
"type": "n8n-nodes-base.stickyNote",
|
||
"position": [
|
||
200,
|
||
-1020
|
||
],
|
||
"parameters": {
|
||
"width": 400,
|
||
"height": 300,
|
||
"content": "## Note\n\nDeals with the Esty web scraping by utilizing the Bright Data Web Unlocker Product.\n\nThe Information Extraction node being used to demonstrate the usage of the N8N AI capabilities.\n\n**Please make sure to set the Indeed search query and update the Webhook Notification URL**"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "f568de40-b389-41f9-afe9-5e09a291c367",
|
||
"name": "Sticky Note1",
|
||
"type": "n8n-nodes-base.stickyNote",
|
||
"position": [
|
||
640,
|
||
-1020
|
||
],
|
||
"parameters": {
|
||
"width": 480,
|
||
"height": 300,
|
||
"content": "## LLM Usages\n\nGoogle Gemini Flash Exp model is being used.\n\nBasic LLM Chain Data Extractor."
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "4f1db865-a0cb-4978-9c7d-fde448bd978a",
|
||
"name": "Set Esty Search Query",
|
||
"type": "n8n-nodes-base.set",
|
||
"position": [
|
||
420,
|
||
-555
|
||
],
|
||
"parameters": {
|
||
"options": {},
|
||
"assignments": {
|
||
"assignments": [
|
||
{
|
||
"id": "3aedba66-f447-4d7a-93c0-8158c5e795f9",
|
||
"name": "url",
|
||
"type": "string",
|
||
"value": "https://www.etsy.com/search?q=wall+art+for+mum&order=date_desc&page=1&ref=pagination"
|
||
},
|
||
{
|
||
"id": "4e7ee31d-da89-422f-8079-2ff2d357a0ba",
|
||
"name": "zone",
|
||
"type": "string",
|
||
"value": "web_unlocker1"
|
||
}
|
||
]
|
||
}
|
||
},
|
||
"typeVersion": 3.4
|
||
},
|
||
{
|
||
"id": "4cb51368-bb69-4d99-a0b6-e8e8013f1dfd",
|
||
"name": "Perform Esty Web Request",
|
||
"type": "n8n-nodes-base.httpRequest",
|
||
"position": [
|
||
640,
|
||
-680
|
||
],
|
||
"parameters": {
|
||
"url": "https://api.brightdata.com/request",
|
||
"method": "POST",
|
||
"options": {},
|
||
"sendBody": true,
|
||
"sendHeaders": true,
|
||
"authentication": "genericCredentialType",
|
||
"bodyParameters": {
|
||
"parameters": [
|
||
{
|
||
"name": "zone",
|
||
"value": "={{ $json.zone }}"
|
||
},
|
||
{
|
||
"name": "url",
|
||
"value": "={{ $json.url }}?product=unlocker&method=api"
|
||
},
|
||
{
|
||
"name": "format",
|
||
"value": "raw"
|
||
},
|
||
{
|
||
"name": "data_format",
|
||
"value": "markdown"
|
||
}
|
||
]
|
||
},
|
||
"genericAuthType": "httpHeaderAuth",
|
||
"headerParameters": {
|
||
"parameters": [
|
||
{}
|
||
]
|
||
}
|
||
},
|
||
"credentials": {
|
||
"httpHeaderAuth": {
|
||
"id": "kdbqXuxIR8qIxF7y",
|
||
"name": "Header Auth account"
|
||
}
|
||
},
|
||
"typeVersion": 4.2
|
||
},
|
||
{
|
||
"id": "9fb7bdc5-ba64-4df4-89b4-a3207e7f6d0e",
|
||
"name": "Google Gemini Chat Model",
|
||
"type": "@n8n/n8n-nodes-langchain.lmChatGoogleGemini",
|
||
"position": [
|
||
948,
|
||
-460
|
||
],
|
||
"parameters": {
|
||
"options": {},
|
||
"modelName": "models/gemini-2.0-flash-exp"
|
||
},
|
||
"credentials": {
|
||
"googlePalmApi": {
|
||
"id": "YeO7dHZnuGBVQKVZ",
|
||
"name": "Google Gemini(PaLM) Api account"
|
||
}
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "1f95576d-e243-481d-9d5f-308764d8ea4b",
|
||
"name": "Loop Over Items",
|
||
"type": "n8n-nodes-base.splitInBatches",
|
||
"position": [
|
||
1460,
|
||
-680
|
||
],
|
||
"parameters": {
|
||
"options": {}
|
||
},
|
||
"typeVersion": 3
|
||
},
|
||
{
|
||
"id": "47f23aa1-63ee-49e3-a465-283c7ab71b76",
|
||
"name": "Perform Esty web request over the loop",
|
||
"type": "n8n-nodes-base.httpRequest",
|
||
"position": [
|
||
1680,
|
||
-560
|
||
],
|
||
"parameters": {
|
||
"url": "https://api.brightdata.com/request",
|
||
"method": "POST",
|
||
"options": {},
|
||
"sendBody": true,
|
||
"sendHeaders": true,
|
||
"authentication": "genericCredentialType",
|
||
"bodyParameters": {
|
||
"parameters": [
|
||
{
|
||
"name": "zone",
|
||
"value": "=web_unlocker1"
|
||
},
|
||
{
|
||
"name": "url",
|
||
"value": "={{ $json.url }}&product=unlocker"
|
||
},
|
||
{
|
||
"name": "format",
|
||
"value": "raw"
|
||
},
|
||
{
|
||
"name": "data_format",
|
||
"value": "markdown"
|
||
}
|
||
]
|
||
},
|
||
"genericAuthType": "httpHeaderAuth",
|
||
"headerParameters": {
|
||
"parameters": [
|
||
{}
|
||
]
|
||
}
|
||
},
|
||
"credentials": {
|
||
"httpHeaderAuth": {
|
||
"id": "kdbqXuxIR8qIxF7y",
|
||
"name": "Header Auth account"
|
||
}
|
||
},
|
||
"typeVersion": 4.2
|
||
},
|
||
{
|
||
"id": "0b5ea206-a5a0-49b5-8f53-10b4dec5806c",
|
||
"name": "Initiate a Webhook Notification for the extracted data",
|
||
"type": "n8n-nodes-base.httpRequest",
|
||
"position": [
|
||
2320,
|
||
-560
|
||
],
|
||
"parameters": {
|
||
"url": "https://webhook.site/3c36d7d1-de1b-4171-9fd3-643ea2e4dd76",
|
||
"options": {},
|
||
"sendBody": true,
|
||
"bodyParameters": {
|
||
"parameters": [
|
||
{
|
||
"name": "summary",
|
||
"value": "={{ $json.output }}"
|
||
}
|
||
]
|
||
}
|
||
},
|
||
"typeVersion": 4.2
|
||
},
|
||
{
|
||
"id": "a164b90b-f44c-4862-b010-d515926774c7",
|
||
"name": "Extract Item List with the Product Info",
|
||
"type": "@n8n/n8n-nodes-langchain.informationExtractor",
|
||
"position": [
|
||
1920,
|
||
-560
|
||
],
|
||
"parameters": {
|
||
"text": "=Extract the product info in JSON\n\n{{ $json.data }}",
|
||
"options": {},
|
||
"schemaType": "fromJson",
|
||
"jsonSchemaExample": "[{\n \"image\": \"https://i.etsystatic.com/34923795/r/il/8f3bba/5855230678/il_fullxfull.5855230678_n9el.jpg\",\n \"name\": \"Custom Coffee Mug with Photo\",\n \"url\": \"https://www.etsy.com/listing/1193808036/custom-coffee-mug-with-photo\",\n \"brand\": {\n \"@type\": \"Brand\",\n \"name\": \"TheGiftBucks\"\n },\n \"offers\": {\n \"@type\": \"Offer\",\n \"price\": \"14.99\",\n \"priceCurrency\": \"USD\"\n }\n}]"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "c3798c64-ac53-44c8-ba91-8fe33377113d",
|
||
"name": "Google Gemini Chat Model for product info",
|
||
"type": "@n8n/n8n-nodes-langchain.lmChatGoogleGemini",
|
||
"position": [
|
||
2000,
|
||
-300
|
||
],
|
||
"parameters": {
|
||
"options": {},
|
||
"modelName": "models/gemini-2.0-flash-exp"
|
||
},
|
||
"credentials": {
|
||
"googlePalmApi": {
|
||
"id": "YeO7dHZnuGBVQKVZ",
|
||
"name": "Google Gemini(PaLM) Api account"
|
||
}
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "11e4ae42-d2e1-4a4b-adcf-382f9e494431",
|
||
"name": "Extract Paginated Resultset",
|
||
"type": "@n8n/n8n-nodes-langchain.informationExtractor",
|
||
"position": [
|
||
860,
|
||
-680
|
||
],
|
||
"parameters": {
|
||
"text": "=Analyze and Extract the below content. Make sure to produce a unique resultset. Exclude page_numbers which are not numbers.\n\n {{ $json.data }}",
|
||
"options": {},
|
||
"schemaType": "manual",
|
||
"inputSchema": "{\n \"$schema\": \"http://json-schema.org/schema#\",\n \"title\": \"PagedResultSetSchema\",\n \"type\": \"array\",\n \"items\": {\n \"type\": \"object\",\n \"properties\": {\n \"page_number\": {\n \"type\": \"string\",\n \"description\": \"Page number, typically a string (e.g., '1', '2', 'next').\"\n },\n \"url\": {\n \"type\": \"string\",\n \"format\": \"uri\",\n \"description\": \"URL pointing to the page.\"\n }\n },\n \"required\": [\"page_number\", \"url\"],\n \"additionalProperties\": false\n }\n}\n"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "28c1822b-d51c-4f8e-b98e-2e12324397be",
|
||
"name": "Sticky Note2",
|
||
"type": "n8n-nodes-base.stickyNote",
|
||
"position": [
|
||
1400,
|
||
-780
|
||
],
|
||
"parameters": {
|
||
"color": 5,
|
||
"width": 1340,
|
||
"height": 620,
|
||
"content": "## Loop and Perform Paginated Esty Data Extraction\n"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "d4f18f2b-9825-4320-addb-c02bfdc4da97",
|
||
"name": "Write the scraped content to disk",
|
||
"type": "n8n-nodes-base.readWriteFile",
|
||
"position": [
|
||
2560,
|
||
-760
|
||
],
|
||
"parameters": {
|
||
"options": {},
|
||
"fileName": "=d:\\Esty-Scraped-Content-{{ $('Loop Over Items').item.json.page_number }}.json",
|
||
"operation": "write"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "5555407d-c7dd-4e5c-83ab-ef6ba9c46da3",
|
||
"name": "Create a binary data",
|
||
"type": "n8n-nodes-base.function",
|
||
"position": [
|
||
2360,
|
||
-760
|
||
],
|
||
"parameters": {
|
||
"functionCode": "items[0].binary = {\n data: {\n data: new Buffer(JSON.stringify(items[0].json, null, 2)).toString('base64')\n }\n};\nreturn items;"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "2f7a5fab-a2f4-422e-8f83-ce50fbe2a738",
|
||
"name": "Split Out",
|
||
"type": "n8n-nodes-base.splitOut",
|
||
"position": [
|
||
1240,
|
||
-680
|
||
],
|
||
"parameters": {
|
||
"options": {},
|
||
"fieldToSplitOut": "output"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "3d7a8992-b8d4-4a86-b60b-a92a7d63e31b",
|
||
"name": "Extract Paginated Resultset With OpenAI",
|
||
"type": "@n8n/n8n-nodes-langchain.informationExtractor",
|
||
"position": [
|
||
880,
|
||
-120
|
||
],
|
||
"parameters": {
|
||
"text": "=Analyze and Extract the below content. Make sure to produce a unique resultset. Exclude page_numbers which are not numbers.\n\n {{ $json.data }}",
|
||
"options": {},
|
||
"schemaType": "manual",
|
||
"inputSchema": "{\n \"$schema\": \"http://json-schema.org/schema#\",\n \"title\": \"PagedResultSetSchema\",\n \"type\": \"array\",\n \"items\": {\n \"type\": \"object\",\n \"properties\": {\n \"page_number\": {\n \"type\": \"string\",\n \"description\": \"Page number, typically a string (e.g., '1', '2', 'next').\"\n },\n \"url\": {\n \"type\": \"string\",\n \"format\": \"uri\",\n \"description\": \"URL pointing to the page.\"\n }\n },\n \"required\": [\"page_number\", \"url\"],\n \"additionalProperties\": false\n }\n}\n"
|
||
},
|
||
"typeVersion": 1
|
||
},
|
||
{
|
||
"id": "aa42d335-67bc-4dc5-a68a-4ce93e05464a",
|
||
"name": "OpenAI Chat Model",
|
||
"type": "@n8n/n8n-nodes-langchain.lmChatOpenAi",
|
||
"position": [
|
||
880,
|
||
80
|
||
],
|
||
"parameters": {
|
||
"model": {
|
||
"__rl": true,
|
||
"mode": "list",
|
||
"value": "gpt-4o-mini"
|
||
},
|
||
"options": {}
|
||
},
|
||
"credentials": {
|
||
"openAiApi": {
|
||
"id": "vPKynKbDzJ5ZU4cU",
|
||
"name": "OpenAi account"
|
||
}
|
||
},
|
||
"typeVersion": 1.2
|
||
},
|
||
{
|
||
"id": "82df0ccc-3065-4bb5-a48e-90e4dbf2162f",
|
||
"name": "Sticky Note3",
|
||
"type": "n8n-nodes-base.stickyNote",
|
||
"position": [
|
||
640,
|
||
-260
|
||
],
|
||
"parameters": {
|
||
"color": 6,
|
||
"width": 660,
|
||
"height": 460,
|
||
"content": "## Open AI Extraction (Optional)\nNote - Replace the above workflow with the Open AI Chat Model if needed\nPlease make sure to set the OpenAI Chat Model -> Credential to connect with **OpenAi Account**"
|
||
},
|
||
"typeVersion": 1
|
||
}
|
||
],
|
||
"active": false,
|
||
"pinData": {},
|
||
"settings": {
|
||
"executionOrder": "v1"
|
||
},
|
||
"versionId": "40a1bbd5-05b2-41c2-8b3c-72e3f16fd13a",
|
||
"connections": {
|
||
"Split Out": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Loop Over Items",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Loop Over Items": {
|
||
"main": [
|
||
[],
|
||
[
|
||
{
|
||
"node": "Perform Esty web request over the loop",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"OpenAI Chat Model": {
|
||
"ai_languageModel": [
|
||
[
|
||
{
|
||
"node": "Extract Paginated Resultset With OpenAI",
|
||
"type": "ai_languageModel",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Create a binary data": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Write the scraped content to disk",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Set Esty Search Query": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Perform Esty Web Request",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Google Gemini Chat Model": {
|
||
"ai_languageModel": [
|
||
[
|
||
{
|
||
"node": "Extract Paginated Resultset",
|
||
"type": "ai_languageModel",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Perform Esty Web Request": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Extract Paginated Resultset",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Extract Paginated Resultset": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Split Out",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"When clicking ‘Test workflow’": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Set Esty Search Query",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Perform Esty web request over the loop": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Extract Item List with the Product Info",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Extract Item List with the Product Info": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Initiate a Webhook Notification for the extracted data",
|
||
"type": "main",
|
||
"index": 0
|
||
},
|
||
{
|
||
"node": "Create a binary data",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Google Gemini Chat Model for product info": {
|
||
"ai_languageModel": [
|
||
[
|
||
{
|
||
"node": "Extract Item List with the Product Info",
|
||
"type": "ai_languageModel",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
},
|
||
"Initiate a Webhook Notification for the extracted data": {
|
||
"main": [
|
||
[
|
||
{
|
||
"node": "Loop Over Items",
|
||
"type": "main",
|
||
"index": 0
|
||
}
|
||
]
|
||
]
|
||
}
|
||
}
|
||
} |