使用 Dumpling AI 从 URL 抓取书籍,清理 HTML,保存到 Sheets,通过邮件发送 CSV
中级
这是一个面向工程、其他、人工智能、IT 运维领域的自动化工作流,包含 11 个节点。主要使用 Html、Sort、Gmail、SplitOut、HttpRequest 等节点,结合人工智能技术实现智能自动化。使用 Dumpling AI 从 URL 抓取书籍,清理 HTML,保存到表格,并通过邮件发送 CSV。
前置要求
- Google 账号和 Gmail API 凭证
- Dumpling AI API 密钥(在 n8n 中配置为 HTTP Header Auth 凭证)
- Google Sheets API 凭证
工作流预览
可视化展示节点连接关系,支持缩放和平移
导出工作流
复制以下 JSON 配置到 n8n 导入,即可使用此工作流
{
"id": "DswhuYzoemjA6iNN",
"meta": {
"instanceId": "a1ae5c8dc6c65e674f9c3947d083abcc749ef2546dff9f4ff01de4d6a36ebfe6",
"templateCredsSetupCompleted": true
},
"name": "使用 Dumpling AI 从 URL 抓取书籍,清理 HTML,保存到 Sheets,通过邮件发送 CSV",
"tags": [
{
"id": "TlcNkmb96fUfZ2eA",
"name": "Tutorials",
"createdAt": "2025-04-15T17:02:00.249Z",
"updatedAt": "2025-04-15T17:02:00.249Z"
}
],
"nodes": [
{
"id": "2e4f64a5-353c-4dd3-9822-62df795d4940",
"name": "转换为 CSV 文件",
"type": "n8n-nodes-base.convertToFile",
"position": [
1640,
340
],
"parameters": {
"options": {}
},
"typeVersion": 1.1
},
{
"id": "472442d3-a691-4310-93f8-019579d0c473",
"name": "从页面提取所有书籍",
"type": "n8n-nodes-base.html",
"position": [
760,
340
],
"parameters": {
"options": {},
"operation": "extractHtmlContent",
"dataPropertyName": "content",
"extractionValues": {
"values": [
{
"key": "books",
"cssSelector": ".row > li",
"returnArray": true,
"returnValue": "html"
}
]
}
},
"typeVersion": 1.2
},
{
"id": "92765257-d64d-47c9-bd57-50914342138b",
"name": "按价格排序",
"type": "n8n-nodes-base.sort",
"position": [
1420,
340
],
"parameters": {
"options": {},
"sortFieldsUi": {
"sortField": [
{
"order": "descending",
"fieldName": "price"
}
]
}
},
"typeVersion": 1
},
{
"id": "efc2f33f-1bef-4906-b3b7-b02868080a54",
"name": "提取单个书籍价格",
"type": "n8n-nodes-base.html",
"position": [
1200,
340
],
"parameters": {
"options": {},
"operation": "extractHtmlContent",
"dataPropertyName": "books",
"extractionValues": {
"values": [
{
"key": "title",
"attribute": "title",
"cssSelector": "h3 > a",
"returnValue": "attribute"
},
{
"key": "price",
"cssSelector": ".price_color"
}
]
}
},
"typeVersion": 1.2
},
{
"id": "74c7c3af-d63c-4b6c-95a0-15f45b19134b",
"name": "通过电子邮件发送 CSV",
"type": "n8n-nodes-base.gmail",
"position": [
1860,
340
],
"webhookId": "40f2d609-52ed-40bf-b190-1f1cebbe3fb7",
"parameters": {
"sendTo": "",
"message": "Hey, here's the scraped data from the online bookstore!",
"options": {
"attachmentsUi": {
"attachmentsBinary": [
{}
]
}
},
"subject": "bookstore csv",
"emailType": "text"
},
"credentials": {
"gmailOAuth2": {
"id": "j70r3RTMED1pgN3R",
"name": "Gmail account 2"
}
},
"typeVersion": 2.1
},
{
"id": "95c7998b-ece0-4dea-b99e-97ac22fb8a59",
"name": "便签3",
"type": "n8n-nodes-base.stickyNote",
"position": [
140,
-260
],
"parameters": {
"width": 619,
"height": 297,
"content": "### 使用 Dumpling AI 从 URL 抓取书籍,清理 HTML,保存到 Sheets,通过邮件发送 CSV"
},
"typeVersion": 1
},
{
"id": "f599028a-49a9-4b85-b484-5abf1229e373",
"name": "便签",
"type": "n8n-nodes-base.stickyNote",
"position": [
140,
60
],
"parameters": {
"color": 4,
"width": 900,
"height": 300,
"content": "### 🔁 触发器到原始书籍 HTML"
},
"typeVersion": 1
},
{
"id": "bc6ab72c-de03-4e79-9da0-ca12ddf31811",
"name": "便签1",
"type": "n8n-nodes-base.stickyNote",
"position": [
1140,
60
],
"parameters": {
"color": 6,
"width": 840,
"height": 300,
"content": "### 📦 解析、排序、导出和发送邮件"
},
"typeVersion": 1
},
{
"id": "a1246b4e-212f-4bd3-970b-b0ff8db2f834",
"name": "触发器 - 监视电子表格中的新 URL",
"type": "n8n-nodes-base.googleSheetsTrigger",
"position": [
320,
340
],
"parameters": {
"event": "rowAdded",
"options": {},
"pollTimes": {
"item": [
{
"mode": "everyMinute"
}
]
},
"sheetName": {
"__rl": true,
"mode": "list",
"value": "",
"cachedResultUrl": "https://docs.google.com/spreadsheets/d/1pb4WLqv2EruLM1z9-utehcINolSj0vlUqZionyLoRUs/edit#gid=0",
"cachedResultName": "Sheet1"
},
"documentId": {
"__rl": true,
"mode": "list",
"value": "",
"cachedResultUrl": "https://docs.google.com/spreadsheets/d/1pb4WLqv2EruLM1z9-utehcINolSj0vlUqZionyLoRUs/edit?usp=drivesdk",
"cachedResultName": "URLs"
}
},
"credentials": {
"googleSheetsTriggerOAuth2Api": {
"id": "qDzHSzTkclwDHpSR",
"name": "Google Sheets Trigger account"
}
},
"typeVersion": 1
},
{
  "id": "b19aa287-3be4-4e16-908d-b0cb484519e3",
  "name": "使用 Dumpling AI 抓取网站内容",
  "type": "n8n-nodes-base.httpRequest",
  "position": [
    540,
    340
  ],
  "parameters": {
    "url": "https://app.dumplingai.com/api/v1/scrape",
    "method": "POST",
    "options": {},
    "jsonBody": "={\n  \"url\": \"{{ $('触发器 - 监视电子表格中的新 URL').item.json.URL }}\",\n  \"format\": \"html\",\n  \"cleaned\": true\n}",
    "sendBody": true,
    "sendHeaders": true,
    "specifyBody": "json",
    "authentication": "genericCredentialType",
    "genericAuthType": "httpHeaderAuth",
    "headerParameters": {
      "parameters": [
        {
          "name": "Content-Type",
          "value": "application/json"
        }
      ]
    }
  },
  "credentials": {
    "httpBasicAuth": {
      "id": "mznexGH3YDtrUTAk",
      "name": "Unnamed credential"
    },
    "httpHeaderAuth": {
      "id": "xamyMqCpAech5BeT",
      "name": "Header Auth account"
    }
  },
  "typeVersion": 4.1
},
{
"id": "02cbc6f9-bdcb-45fc-9973-ded42346ffbc",
"name": "将 HTML 数组拆分为单个书籍",
"type": "n8n-nodes-base.splitOut",
"position": [
980,
340
],
"parameters": {
"options": {},
"fieldToSplitOut": "books"
},
"typeVersion": 1
}
],
"active": false,
"pinData": {},
"settings": {
"executionOrder": "v1"
},
"versionId": "264412ff-9d74-443c-a2ff-69be1e042a82",
"connections": {
"Sort by price": {
"main": [
[
{
"node": "Convert to CSV File",
"type": "main",
"index": 0
}
]
]
},
"Convert to CSV File": {
"main": [
[
{
"node": "Send CSV via e-mail",
"type": "main",
"index": 0
}
]
]
},
"Extract individual book price": {
"main": [
[
{
"node": "Sort by price",
"type": "main",
"index": 0
}
]
]
},
"Extract all books from the page": {
"main": [
[
{
"node": "Split HTML Array into Individual Books",
"type": "main",
"index": 0
}
]
]
},
"Split HTML Array into Individual Books": {
"main": [
[
{
"node": "Extract individual book price",
"type": "main",
"index": 0
}
]
]
},
"Scrape Website Content with Dumpling AI": {
"main": [
[
{
"node": "Extract all books from the page",
"type": "main",
"index": 0
}
]
]
},
"Trigger- Watches For new URL in Spreadsheet": {
"main": [
[
{
"node": "Scrape Website Content with Dumpling AI",
"type": "main",
"index": 0
}
]
]
}
}
}
常见问题
如何使用这个工作流?
复制上方的 JSON 配置代码,在您的 n8n 实例中创建新工作流并选择「从 JSON 导入」,粘贴配置后根据需要修改凭证设置即可。
这个工作流适合什么场景?
适合中级用户,适用于工程、其他、人工智能、IT 运维等领域的自动化场景。
需要付费吗?
本工作流完全免费,您可以直接导入使用。但请注意,工作流中使用的第三方服务(如 Dumpling AI API)可能需要您自行付费。
相关工作流推荐
在可视化参考库中探索n8n节点
在可视化参考库中探索n8n节点
If
Ftp
Set
+93
113 节点 · I versus AI
其他
使用正则表达式和 AI 发现隐藏的网站 API 端点
使用正则表达式和人工智能发现隐藏的网站API端点
If
Set
Html
+19
58 节点 · Yulia
工程
使用Dumpling AI从Google Drive提取发票数据至Sheets
使用Dumpling AI从Google Drive提取发票数据并保存至Sheets
Code
Split Out
Google Drive
+5
8 节点 · Yang
人工智能
通过 Dumpling AI 抓取 Google Places 并自动保存到 Google Sheets
通过 Dumpling AI 抓取 Google Places 并自动保存到 Google Sheets
Split Out
Http Request
Google Sheets
+2
6 节点 · Yang
人工智能
使用 Dumpling AI 抓取 TikTok 个人资料和文字记录并保存到 Google Sheets
使用 Dumpling AI 抓取 TikTok 个人资料和文字记录并保存到 Google Sheets
Set
Http Request
Google Sheets
+2
6 节点 · Yang
人工智能
AI新闻简报构建器:使用Dumpling AI抓取网站,GPT-4o摘要
AI新闻简报构建器:Dumpling AI抓取网站,GPT-4o摘要
Set
Code
Gmail
+6
10 节点 · Yang
人工智能