๐ก๐ Jina.ai ๊ธฐ๋ฐ ๋ค์ค ํ์ด์ง ์น ํฌ๋กค๋ฌ
์ด๊ฒ์AI๋ถ์ผ์์๋ํ ์ํฌํ๋ก์ฐ๋ก, 16๊ฐ์ ๋ ธ๋๋ฅผ ํฌํจํฉ๋๋ค.์ฃผ๋ก Set, Xml, Code, Wait, Limit ๋ฑ์ ๋ ธ๋๋ฅผ ์ฌ์ฉํ๋ฉฐ์ธ๊ณต์ง๋ฅ ๊ธฐ์ ์ ๊ฒฐํฉํ์ฌ ์ค๋งํธ ์๋ํ๋ฅผ ๊ตฌํํฉ๋๋ค. ๐ก๐ Jina.ai์ ๋ค์ค ํ์ด์ง ์น ํฌ๋กค๋ง ๋๊ตฌ ์ฌ์ฉ
- โขGoogle Drive API ์ธ์ฆ ์ ๋ณด
- โข๋์ API์ ์ธ์ฆ ์ ๋ณด๊ฐ ํ์ํ ์ ์์
์ฌ์ฉ๋ ๋ ธ๋ (16)
์นดํ ๊ณ ๋ฆฌ
{
"id": "xEij0kj2I1DHbL3I",
"meta": {
"instanceId": "31e69f7f4a77bf465b805824e303232f0227212ae922d12133a0f96ffeab4fef",
"templateCredsSetupCompleted": true
},
"name": "๐ก๐ Essential Multipage Website Scraper with Jina.ai",
"tags": [],
"nodes": [
{
"id": "3a503859-ef0a-492d-81c6-37e4f0c4c25e",
"name": "์คํฐํค ๋
ธํธ",
"type": "n8n-nodes-base.stickyNote",
"position": [
-840,
0
],
"parameters": {
"color": 3,
"width": 340,
"height": 320,
"content": "## Jina.ai Web Scraper\n### No API Key Required\n"
},
"typeVersion": 1
},
{
"id": "c5217a1a-f074-409b-8340-72afdc5fc8b5",
"name": "'์ํฌํ๋ก ํ
์คํธ' ํด๋ฆญ ์",
"type": "n8n-nodes-base.manualTrigger",
"position": [
-1500,
-300
],
"parameters": {},
"typeVersion": 1
},
{
"id": "72af3b00-2632-4877-a0b6-7477e2f468f7",
"name": "ํญ๋ชฉ ๋ฐ๋ณต",
"type": "n8n-nodes-base.splitInBatches",
"position": [
-1080,
20
],
"parameters": {
"options": {}
},
"typeVersion": 3
},
{
"id": "11f0fa02-51f8-41cc-b789-5c452b6899aa",
"name": "๋๊ธฐ",
"type": "n8n-nodes-base.wait",
"position": [
80,
220
],
"webhookId": "081ce124-0cbf-4a21-a1e7-2c465f460448",
"parameters": {},
"typeVersion": 1.1
},
{
"id": "cf3b5887-8ff2-46e0-ab33-384ab0987cbb",
"name": "์ ํ",
"type": "n8n-nodes-base.limit",
"position": [
80,
-300
],
"parameters": {
"maxItems": 20
},
"typeVersion": 1
},
{
"id": "c4f04d82-aa33-46cf-a8e2-0b4e717e754a",
"name": "์น์ฌ์ดํธ URL ๋ชฉ๋ก ๊ฐ์ ธ์ค๊ธฐ",
"type": "n8n-nodes-base.httpRequest",
"position": [
-780,
-300
],
"parameters": {
"url": "={{ $json.sitemap_url }}",
"options": {}
},
"typeVersion": 4.2
},
{
"id": "7f507c38-1e9e-4c46-8dea-bd6daf65dc55",
"name": "JSON๋ก ๋ณํ",
"type": "n8n-nodes-base.xml",
"position": [
-560,
-300
],
"parameters": {
"options": {}
},
"typeVersion": 1
},
{
"id": "e21b55c2-8b0d-4c7c-ba91-a2d563a4c966",
"name": "์น์ฌ์ดํธ URL ๋ชฉ๋ก ์์ฑ",
"type": "n8n-nodes-base.splitOut",
"position": [
-340,
-300
],
"parameters": {
"options": {},
"fieldToSplitOut": "urlset.url"
},
"typeVersion": 1
},
{
"id": "61555239-8a16-424e-8a60-700f6ebaa270",
"name": "์ฃผ์ ๋๋ ํ์ด์ง๋ณ ํํฐ๋ง",
"type": "n8n-nodes-base.filter",
"position": [
-120,
-300
],
"parameters": {
"options": {},
"conditions": {
"options": {
"version": 2,
"leftValue": "",
"caseSensitive": true,
"typeValidation": "strict"
},
"combinator": "or",
"conditions": [
{
"id": "d66c304d-879a-4dc4-908f-ab0665093672",
"operator": {
"name": "filter.operator.equals",
"type": "string",
"operation": "equals"
},
"leftValue": "={{ $json.loc }}",
"rightValue": "=https://ai.pydantic.dev/"
},
{
"id": "3c930950-bee4-442b-82e6-4437fd39a933",
"operator": {
"type": "string",
"operation": "contains"
},
"leftValue": "={{ $json.loc.toLowerCase() }}",
"rightValue": "agent"
},
{
"id": "aaeaf34e-ad5a-4673-b3bd-8bddf3500988",
"operator": {
"type": "string",
"operation": "contains"
},
"leftValue": "={{ $json.loc.toLowerCase() }}",
"rightValue": "tool"
}
]
}
},
"typeVersion": 2.2
},
{
"id": "dd25fb57-64a3-4c47-be04-6eb66d16520a",
"name": "์น์ฌ์ดํธ URL ์ค์ ",
"type": "n8n-nodes-base.set",
"position": [
-1080,
-300
],
"parameters": {
"options": {},
"assignments": {
"assignments": [
{
"id": "1601dc3e-8024-4e19-b592-93a4e4f77641",
"name": "sitemap_url",
"type": "string",
"value": "https://ai.pydantic.dev/sitemap.xml"
}
]
}
},
"typeVersion": 3.4
},
{
"id": "14ac1c87-29fe-44c8-9c1e-f247a292dde5",
"name": "Jina.ai ์น ์คํฌ๋ํผ",
"type": "n8n-nodes-base.httpRequest",
"position": [
-720,
120
],
"parameters": {
"url": "=https://r.jina.ai/{{ $json.loc }}",
"options": {}
},
"typeVersion": 4.2
},
{
"id": "be253ec2-f088-4895-8ef2-61a3720cf68b",
"name": "Google ๋๋ผ์ด๋ธ์ ์นํ์ด์ง ๋ด์ฉ ์ ์ฅ",
"type": "n8n-nodes-base.googleDrive",
"position": [
-120,
120
],
"parameters": {
"name": "={{ $('Loop Over Items').item.json.loc }} - {{ $json.title }}",
"content": "={{ $json.markdown }}",
"driveId": {
"__rl": true,
"mode": "list",
"value": "My Drive"
},
"options": {},
"folderId": {
"__rl": true,
"mode": "list",
"value": "root",
"cachedResultName": "/ (Root folder)"
},
"operation": "createFromText"
},
"credentials": {
"googleDriveOAuth2Api": {
"id": "UhdXGYLTAJbsa0xX",
"name": "Google Drive account"
}
},
"typeVersion": 3
},
{
"id": "95d808c7-a3ca-4f59-a385-cc77bdff322e",
"name": "์ ๋ชฉ ๋ฐ ๋งํฌ๋ค์ด ์ฝํ
์ธ ์ถ์ถ",
"type": "n8n-nodes-base.code",
"position": [
-380,
120
],
"parameters": {
"jsCode": "// Get the text output from the previous node\nconst data = $input.first().json.data;\n\n// Regular expression to capture the title line\nconst titleRegex = /^Title:\\s*(.+)$/m;\n// Regular expression to capture everything after \"Markdown Content:\"\nconst markdownRegex = /Markdown Content:\\n([\\s\\S]+)/;\n\n// Extract the title using the first capture group\nconst titleMatch = data.match(titleRegex);\nconst title = titleMatch ? titleMatch[1].trim() : '';\n\n// Extract the markdown content using the first capture group\nconst markdownMatch = data.match(markdownRegex);\nconst markdown = markdownMatch ? markdownMatch[1].trim() : '';\n\n// Return a single object with title and markdown as unique values\nreturn { title, markdown };"
},
"typeVersion": 2
},
{
"id": "2fb86c81-c144-4450-908c-559855deadef",
"name": "์คํฐํค ๋
ธํธ1",
"type": "n8n-nodes-base.stickyNote",
"position": [
-1240,
-580
],
"parameters": {
"color": 7,
"width": 1540,
"height": 1080,
"content": "# ๐ก๐ Essential Multipage Website Scraper with Jina.ai\n## Scrape entire websites with this workflow\n**Use responsibly and follow local rules and regulations**"
},
"typeVersion": 1
},
{
"id": "b470b294-95d0-4e51-a9cc-2fe17316a771",
"name": "์คํฐํค ๋
ธํธ2",
"type": "n8n-nodes-base.stickyNote",
"position": [
-1580,
-400
],
"parameters": {
"color": 4,
"width": 280,
"height": 300,
"content": "## ๐Try Me!"
},
"typeVersion": 1
},
{
"id": "fafd0623-a423-4e73-9609-cee8e81f5c13",
"name": "์คํฐํค ๋
ธํธ3",
"type": "n8n-nodes-base.stickyNote",
"position": [
-1180,
-400
],
"parameters": {
"width": 300,
"height": 300,
"content": "## ๐Add Website Sitemap URL"
},
"typeVersion": 1
}
],
"active": false,
"pinData": {},
"settings": {
"executionOrder": "v1"
},
"versionId": "2e815787-d83b-4ab7-a959-2f33006a37a5",
"connections": {
"11f0fa02-51f8-41cc-b789-5c452b6899aa": {
"main": [
[
{
"node": "72af3b00-2632-4877-a0b6-7477e2f468f7",
"type": "main",
"index": 0
}
]
]
},
"cf3b5887-8ff2-46e0-ab33-384ab0987cbb": {
"main": [
[
{
"node": "72af3b00-2632-4877-a0b6-7477e2f468f7",
"type": "main",
"index": 0
}
]
]
},
"7f507c38-1e9e-4c46-8dea-bd6daf65dc55": {
"main": [
[
{
"node": "e21b55c2-8b0d-4c7c-ba91-a2d563a4c966",
"type": "main",
"index": 0
}
]
]
},
"72af3b00-2632-4877-a0b6-7477e2f468f7": {
"main": [
[],
[
{
"node": "14ac1c87-29fe-44c8-9c1e-f247a292dde5",
"type": "main",
"index": 0
}
]
]
},
"dd25fb57-64a3-4c47-be04-6eb66d16520a": {
"main": [
[
{
"node": "c4f04d82-aa33-46cf-a8e2-0b4e717e754a",
"type": "main",
"index": 0
}
]
]
},
"14ac1c87-29fe-44c8-9c1e-f247a292dde5": {
"main": [
[
{
"node": "95d808c7-a3ca-4f59-a385-cc77bdff322e",
"type": "main",
"index": 0
}
]
]
},
"c4f04d82-aa33-46cf-a8e2-0b4e717e754a": {
"main": [
[
{
"node": "7f507c38-1e9e-4c46-8dea-bd6daf65dc55",
"type": "main",
"index": 0
}
]
]
},
"61555239-8a16-424e-8a60-700f6ebaa270": {
"main": [
[
{
"node": "cf3b5887-8ff2-46e0-ab33-384ab0987cbb",
"type": "main",
"index": 0
}
]
]
},
"e21b55c2-8b0d-4c7c-ba91-a2d563a4c966": {
"main": [
[
{
"node": "61555239-8a16-424e-8a60-700f6ebaa270",
"type": "main",
"index": 0
}
]
]
},
"95d808c7-a3ca-4f59-a385-cc77bdff322e": {
"main": [
[
{
"node": "be253ec2-f088-4895-8ef2-61a3720cf68b",
"type": "main",
"index": 0
}
]
]
},
"c5217a1a-f074-409b-8340-72afdc5fc8b5": {
"main": [
[
{
"node": "dd25fb57-64a3-4c47-be04-6eb66d16520a",
"type": "main",
"index": 0
}
]
]
},
"be253ec2-f088-4895-8ef2-61a3720cf68b": {
"main": [
[
{
"node": "11f0fa02-51f8-41cc-b789-5c452b6899aa",
"type": "main",
"index": 0
}
]
]
}
}
}์ด ์ํฌํ๋ก์ฐ๋ฅผ ์ด๋ป๊ฒ ์ฌ์ฉํ๋์?
์์ JSON ๊ตฌ์ฑ ์ฝ๋๋ฅผ ๋ณต์ฌํ์ฌ n8n ์ธ์คํด์ค์์ ์ ์ํฌํ๋ก์ฐ๋ฅผ ์์ฑํ๊ณ "JSON์์ ๊ฐ์ ธ์ค๊ธฐ"๋ฅผ ์ ํํ ํ, ๊ตฌ์ฑ์ ๋ถ์ฌ๋ฃ๊ณ ํ์์ ๋ฐ๋ผ ์ธ์ฆ ์ค์ ์ ์์ ํ์ธ์.
์ด ์ํฌํ๋ก์ฐ๋ ์ด๋ค ์๋๋ฆฌ์ค์ ์ ํฉํ๊ฐ์?
๊ณ ๊ธ - ์ธ๊ณต์ง๋ฅ
์ ๋ฃ์ธ๊ฐ์?
์ด ์ํฌํ๋ก์ฐ๋ ์์ ํ ๋ฌด๋ฃ์ด๋ฉฐ ์ง์ ๊ฐ์ ธ์ ์ฌ์ฉํ ์ ์์ต๋๋ค. ๋ค๋ง, ์ํฌํ๋ก์ฐ์์ ์ฌ์ฉํ๋ ํ์ฌ ์๋น์ค(์: OpenAI API)๋ ์ฌ์ฉ์ ์ง์ ๋น์ฉ์ ์ง๋ถํด์ผ ํ ์ ์์ต๋๋ค.
๊ด๋ จ ์ํฌํ๋ก์ฐ ์ถ์ฒ
Joseph LePage
@joeAs an AI Automation consultant based in Canada, I partner with forward-thinking organizations to implement AI solutions that streamline operations and drive growth.
์ด ์ํฌํ๋ก์ฐ ๊ณต์