diff --git a/workflows/Automate Etsy Data Mining with Bright Data Scrape & Google Gemini-3851/automate_etsy_data_mining_with_bright_data_scrape_google_gemini.json b/workflows/Automate Etsy Data Mining with Bright Data Scrape & Google Gemini-3851/automate_etsy_data_mining_with_bright_data_scrape_google_gemini.json new file mode 100644 index 000000000..55b9ee4b2 --- /dev/null +++ b/workflows/Automate Etsy Data Mining with Bright Data Scrape & Google Gemini-3851/automate_etsy_data_mining_with_bright_data_scrape_google_gemini.json @@ -0,0 +1 @@ +{"id":"UuuCIDvTNnloIlvq","meta":{"instanceId":"885b4fb4a6a9c2cb5621429a7b972df0d05bb724c20ac7dac7171b62f1c7ef40","templateCredsSetupCompleted":true},"name":"Automate Etsy Data Mining with Bright Data Scrape & Google Gemini","tags":[{"id":"Kujft2FOjmOVQAmJ","name":"Engineering","createdAt":"2025-04-09T01:31:00.558Z","updatedAt":"2025-04-09T01:31:00.558Z"},{"id":"ddPkw7Hg5dZhQu2w","name":"AI","createdAt":"2025-04-13T05:38:08.053Z","updatedAt":"2025-04-13T05:38:08.053Z"}],"nodes":[{"id":"f369feaf-4782-4411-9d08-fe91b9ffd97e","name":"When clicking ‘Test workflow’","type":"n8n-nodes-base.manualTrigger","position":[200,-555],"parameters":{},"typeVersion":1},{"id":"231bae3c-c27e-49fc-b878-2d5cc1e14c5a","name":"Sticky Note","type":"n8n-nodes-base.stickyNote","position":[200,-1020],"parameters":{"width":400,"height":300,"content":"## Note\n\nDeals with Etsy web scraping by utilizing the Bright Data Web Unlocker Product.\n\nThe Information Extraction node is being used to demonstrate the usage of the N8N AI capabilities.\n\n**Please make sure to set the Etsy search query and update the Webhook Notification URL**"},"typeVersion":1},{"id":"f568de40-b389-41f9-afe9-5e09a291c367","name":"Sticky Note1","type":"n8n-nodes-base.stickyNote","position":[640,-1020],"parameters":{"width":480,"height":300,"content":"## LLM Usages\n\nGoogle Gemini Flash Exp model is being used.\n\nBasic LLM Chain Data 
Extractor."},"typeVersion":1},{"id":"4f1db865-a0cb-4978-9c7d-fde448bd978a","name":"Set Esty Search Query","type":"n8n-nodes-base.set","position":[420,-555],"parameters":{"options":{},"assignments":{"assignments":[{"id":"3aedba66-f447-4d7a-93c0-8158c5e795f9","name":"url","type":"string","value":"https://www.etsy.com/search?q=wall+art+for+mum&order=date_desc&page=1&ref=pagination"},{"id":"4e7ee31d-da89-422f-8079-2ff2d357a0ba","name":"zone","type":"string","value":"web_unlocker1"}]}},"typeVersion":3.4},{"id":"4cb51368-bb69-4d99-a0b6-e8e8013f1dfd","name":"Perform Esty Web Request","type":"n8n-nodes-base.httpRequest","position":[640,-680],"parameters":{"url":"https://api.brightdata.com/request","method":"POST","options":{},"sendBody":true,"sendHeaders":true,"authentication":"genericCredentialType","bodyParameters":{"parameters":[{"name":"zone","value":"={{ $json.zone }}"},{"name":"url","value":"={{ $json.url }}?product=unlocker&method=api"},{"name":"format","value":"raw"},{"name":"data_format","value":"markdown"}]},"genericAuthType":"httpHeaderAuth","headerParameters":{"parameters":[{}]}},"credentials":{"httpHeaderAuth":{"id":"kdbqXuxIR8qIxF7y","name":"Header Auth account"}},"typeVersion":4.2},{"id":"9fb7bdc5-ba64-4df4-89b4-a3207e7f6d0e","name":"Google Gemini Chat Model","type":"@n8n/n8n-nodes-langchain.lmChatGoogleGemini","position":[948,-460],"parameters":{"options":{},"modelName":"models/gemini-2.0-flash-exp"},"credentials":{"googlePalmApi":{"id":"YeO7dHZnuGBVQKVZ","name":"Google Gemini(PaLM) Api account"}},"typeVersion":1},{"id":"1f95576d-e243-481d-9d5f-308764d8ea4b","name":"Loop Over Items","type":"n8n-nodes-base.splitInBatches","position":[1460,-680],"parameters":{"options":{}},"typeVersion":3},{"id":"47f23aa1-63ee-49e3-a465-283c7ab71b76","name":"Perform Esty web request over the 
loop","type":"n8n-nodes-base.httpRequest","position":[1680,-560],"parameters":{"url":"https://api.brightdata.com/request","method":"POST","options":{},"sendBody":true,"sendHeaders":true,"authentication":"genericCredentialType","bodyParameters":{"parameters":[{"name":"zone","value":"=web_unlocker1"},{"name":"url","value":"={{ $json.url }}&product=unlocker"},{"name":"format","value":"raw"},{"name":"data_format","value":"markdown"}]},"genericAuthType":"httpHeaderAuth","headerParameters":{"parameters":[{}]}},"credentials":{"httpHeaderAuth":{"id":"kdbqXuxIR8qIxF7y","name":"Header Auth account"}},"typeVersion":4.2},{"id":"0b5ea206-a5a0-49b5-8f53-10b4dec5806c","name":"Initiate a Webhook Notification for the extracted data","type":"n8n-nodes-base.httpRequest","position":[2320,-560],"parameters":{"url":"https://webhook.site/3c36d7d1-de1b-4171-9fd3-643ea2e4dd76","options":{},"sendBody":true,"bodyParameters":{"parameters":[{"name":"summary","value":"={{ $json.output }}"}]}},"typeVersion":4.2},{"id":"a164b90b-f44c-4862-b010-d515926774c7","name":"Extract Item List with the Product Info","type":"@n8n/n8n-nodes-langchain.informationExtractor","position":[1920,-560],"parameters":{"text":"=Extract the product info in JSON\n\n{{ $json.data }}","options":{},"schemaType":"fromJson","jsonSchemaExample":"[{\n \"image\": \"https://i.etsystatic.com/34923795/r/il/8f3bba/5855230678/il_fullxfull.5855230678_n9el.jpg\",\n \"name\": \"Custom Coffee Mug with Photo\",\n \"url\": \"https://www.etsy.com/listing/1193808036/custom-coffee-mug-with-photo\",\n \"brand\": {\n \"@type\": \"Brand\",\n \"name\": \"TheGiftBucks\"\n },\n \"offers\": {\n \"@type\": \"Offer\",\n \"price\": \"14.99\",\n \"priceCurrency\": \"USD\"\n }\n}]"},"typeVersion":1},{"id":"c3798c64-ac53-44c8-ba91-8fe33377113d","name":"Google Gemini Chat Model for product 
info","type":"@n8n/n8n-nodes-langchain.lmChatGoogleGemini","position":[2000,-300],"parameters":{"options":{},"modelName":"models/gemini-2.0-flash-exp"},"credentials":{"googlePalmApi":{"id":"YeO7dHZnuGBVQKVZ","name":"Google Gemini(PaLM) Api account"}},"typeVersion":1},{"id":"11e4ae42-d2e1-4a4b-adcf-382f9e494431","name":"Extract Paginated Resultset","type":"@n8n/n8n-nodes-langchain.informationExtractor","position":[860,-680],"parameters":{"text":"=Analyze and Extract the below content. Make sure to produce a unique resultset. Exclude page_numbers which are not numbers.\n\n {{ $json.data }}","options":{},"schemaType":"manual","inputSchema":"{\n \"$schema\": \"http://json-schema.org/schema#\",\n \"title\": \"PagedResultSetSchema\",\n \"type\": \"array\",\n \"items\": {\n \"type\": \"object\",\n \"properties\": {\n \"page_number\": {\n \"type\": \"string\",\n \"description\": \"Page number, typically a string (e.g., '1', '2', 'next').\"\n },\n \"url\": {\n \"type\": \"string\",\n \"format\": \"uri\",\n \"description\": \"URL pointing to the page.\"\n }\n },\n \"required\": [\"page_number\", \"url\"],\n \"additionalProperties\": false\n }\n}\n"},"typeVersion":1},{"id":"28c1822b-d51c-4f8e-b98e-2e12324397be","name":"Sticky Note2","type":"n8n-nodes-base.stickyNote","position":[1400,-780],"parameters":{"color":5,"width":1340,"height":620,"content":"## Loop and Perform Paginated Etsy Data Extraction\n"},"typeVersion":1},{"id":"d4f18f2b-9825-4320-addb-c02bfdc4da97","name":"Write the scraped content to disk","type":"n8n-nodes-base.readWriteFile","position":[2560,-760],"parameters":{"options":{},"fileName":"=d:\\Esty-Scraped-Content-{{ $('Loop Over Items').item.json.page_number }}.json","operation":"write"},"typeVersion":1},{"id":"5555407d-c7dd-4e5c-83ab-ef6ba9c46da3","name":"Create a binary data","type":"n8n-nodes-base.function","position":[2360,-760],"parameters":{"functionCode":"items[0].binary = {\n data: {\n data: new Buffer(JSON.stringify(items[0].json, null, 
2)).toString('base64')\n }\n};\nreturn items;"},"typeVersion":1},{"id":"2f7a5fab-a2f4-422e-8f83-ce50fbe2a738","name":"Split Out","type":"n8n-nodes-base.splitOut","position":[1240,-680],"parameters":{"options":{},"fieldToSplitOut":"output"},"typeVersion":1},{"id":"3d7a8992-b8d4-4a86-b60b-a92a7d63e31b","name":"Extract Paginated Resultset With OpenAI","type":"@n8n/n8n-nodes-langchain.informationExtractor","position":[880,-120],"parameters":{"text":"=Analyze and Extract the below content. Make sure to produce a unique resultset. Exclude page_numbers which are not numbers.\n\n {{ $json.data }}","options":{},"schemaType":"manual","inputSchema":"{\n \"$schema\": \"http://json-schema.org/schema#\",\n \"title\": \"PagedResultSetSchema\",\n \"type\": \"array\",\n \"items\": {\n \"type\": \"object\",\n \"properties\": {\n \"page_number\": {\n \"type\": \"string\",\n \"description\": \"Page number, typically a string (e.g., '1', '2', 'next').\"\n },\n \"url\": {\n \"type\": \"string\",\n \"format\": \"uri\",\n \"description\": \"URL pointing to the page.\"\n }\n },\n \"required\": [\"page_number\", \"url\"],\n \"additionalProperties\": false\n }\n}\n"},"typeVersion":1},{"id":"aa42d335-67bc-4dc5-a68a-4ce93e05464a","name":"OpenAI Chat Model","type":"@n8n/n8n-nodes-langchain.lmChatOpenAi","position":[880,80],"parameters":{"model":{"__rl":true,"mode":"list","value":"gpt-4o-mini"},"options":{}},"credentials":{"openAiApi":{"id":"vPKynKbDzJ5ZU4cU","name":"OpenAi account"}},"typeVersion":1.2},{"id":"82df0ccc-3065-4bb5-a48e-90e4dbf2162f","name":"Sticky Note3","type":"n8n-nodes-base.stickyNote","position":[640,-260],"parameters":{"color":6,"width":660,"height":460,"content":"## Open AI Extraction (Optional)\nNote - Replace the above workflow with the Open AI Chat Model if needed\nPlease make sure to set the OpenAI Chat Model -> Credential to connect with **OpenAi 
Account**"},"typeVersion":1}],"active":false,"pinData":{},"settings":{"executionOrder":"v1"},"versionId":"40a1bbd5-05b2-41c2-8b3c-72e3f16fd13a","connections":{"Split Out":{"main":[[{"node":"Loop Over Items","type":"main","index":0}]]},"Loop Over Items":{"main":[[],[{"node":"Perform Esty web request over the loop","type":"main","index":0}]]},"OpenAI Chat Model":{"ai_languageModel":[[{"node":"Extract Paginated Resultset With OpenAI","type":"ai_languageModel","index":0}]]},"Create a binary data":{"main":[[{"node":"Write the scraped content to disk","type":"main","index":0}]]},"Set Esty Search Query":{"main":[[{"node":"Perform Esty Web Request","type":"main","index":0}]]},"Google Gemini Chat Model":{"ai_languageModel":[[{"node":"Extract Paginated Resultset","type":"ai_languageModel","index":0}]]},"Perform Esty Web Request":{"main":[[{"node":"Extract Paginated Resultset","type":"main","index":0}]]},"Extract Paginated Resultset":{"main":[[{"node":"Split Out","type":"main","index":0}]]},"When clicking ‘Test workflow’":{"main":[[{"node":"Set Esty Search Query","type":"main","index":0}]]},"Perform Esty web request over the loop":{"main":[[{"node":"Extract Item List with the Product Info","type":"main","index":0}]]},"Extract Item List with the Product Info":{"main":[[{"node":"Initiate a Webhook Notification for the extracted data","type":"main","index":0},{"node":"Create a binary data","type":"main","index":0}]]},"Google Gemini Chat Model for product info":{"ai_languageModel":[[{"node":"Extract Item List with the Product Info","type":"ai_languageModel","index":0}]]},"Initiate a Webhook Notification for the extracted data":{"main":[[{"node":"Loop Over Items","type":"main","index":0}]]}}} \ No newline at end of file