清理和标准化 CSV 上传以导入 Google Sheets 和 Drive
中级
这是一个Document Extraction, Multimodal AI领域的自动化工作流,包含 10 个节点。主要使用 Code, Webhook, GoogleDrive, GoogleSheets 等节点。 清理和标准化 CSV 上传以导入 Google Sheets 和 Drive
前置要求
- •HTTP Webhook 端点(n8n 会自动生成)
- •Google Drive API 凭证
- •Google Sheets API 凭证
工作流预览
可视化展示节点连接关系,支持缩放和平移
导出工作流
复制以下 JSON 配置到 n8n 导入,即可使用此工作流
{
"meta": {
"instanceId": "2000c64071c20843606b95c63795bb0797c41036047055a6586498e855b96efc"
},
"nodes": [
{
"id": "24e5fd68-0441-4541-b543-fcaef4f8ec6c",
"name": "设置说明",
"type": "n8n-nodes-base.stickyNote",
"position": [
-496,
-112
],
"parameters": {
"width": 760,
"height": 696,
"content": "🧹 **需要设置:**"
},
"typeVersion": 1
},
{
"id": "b452e138-2c91-4934-8be6-e3c190407db3",
"name": "CSV 上传 Webhook",
"type": "n8n-nodes-base.webhook",
"position": [
-160,
160
],
"webhookId": "csv-upload-webhook",
"parameters": {
"path": "csv-upload",
"options": {
"noResponseBody": false
},
"httpMethod": "POST"
},
"typeVersion": 1
},
{
"id": "e6a91fe0-7d79-4e45-900b-5200b6af7cbf",
"name": "提取 CSV 内容",
"type": "n8n-nodes-base.code",
"position": [
48,
160
],
"parameters": {
"jsCode": "// Extract and validate CSV upload\nconst requestData = $input.first();\nlet csvContent = '';\nlet filename = 'uploaded_file.csv';\n\nif (requestData.binary && requestData.binary.data) {\n csvContent = requestData.binary.data.toString();\n filename = requestData.binary.data.filename || filename;\n} else if (requestData.json.csv_content) {\n csvContent = requestData.json.csv_content;\n filename = requestData.json.filename || filename;\n} else if (requestData.json.file_base64) {\n csvContent = Buffer.from(requestData.json.file_base64, 'base64').toString();\n filename = requestData.json.filename || filename;\n} else {\n throw new Error('No CSV content found in request');\n}\n\nif (!csvContent || csvContent.length < 10) {\n throw new Error('Invalid or empty CSV file');\n}\n\nconst initialRows = csvContent.split('\\n').length - 1;\n\nreturn {\n json: {\n filename,\n original_content: csvContent,\n file_size_bytes: csvContent.length,\n initial_row_count: initialRows,\n upload_timestamp: new Date().toISOString(),\n processing_started: true\n }\n};"
},
"typeVersion": 2
},
{
"id": "57875349-1fa5-454b-aa02-1255a1c87fb4",
"name": "解析 CSV 数据",
"type": "n8n-nodes-base.code",
"position": [
240,
160
],
"parameters": {
"jsCode": "// Parse and clean CSV data\nconst uploadInfo = $input.first().json;\nconst csvContent = uploadInfo.original_content;\n\nconst lines = csvContent.split('\\n').map(line => line.trim()).filter(line => line.length > 0);\nif (lines.length === 0) throw new Error('No valid rows found in CSV');\n\nconst headers = lines[0].split(',').map(header => header.replace(/\"/g, '').trim().toLowerCase().replace(/\\s+/g, '_'));\n\nconst rawRows = [];\nfor (let i = 1; i < lines.length; i++) {\n const values = lines[i].split(',').map(val => val.replace(/\"/g, '').trim());\n if (values.length === headers.length && values.some(val => val.length > 0)) {\n const row = {};\n headers.forEach((header, index) => row[header] = values[index] || '');\n rawRows.push(row);\n }\n}\n\nreturn {\n json: {\n ...uploadInfo,\n headers,\n raw_rows: rawRows,\n parsed_row_count: rawRows.length\n }\n};"
},
"typeVersion": 2
},
{
"id": "275eb9f3-40bc-4c2e-bd8e-7dd707f9dc21",
"name": "清理和标准化数据",
"type": "n8n-nodes-base.code",
"position": [
448,
160
],
"parameters": {
"jsCode": "// Clean CSV rows\nconst data = $input.first().json;\nlet cleanedRows = [...data.raw_rows];\n\nconst cleanEmail = e => e ? (e.toLowerCase().trim().match(/^[^\\s@]+@[^\\s@]+\\.[^\\s@]+$/) ? e : '') : '';\nconst cleanPhone = p => p ? p.replace(/\\D/g, '') : '';\nconst cleanName = n => n ? n.trim().split(' ').map(w => w.charAt(0).toUpperCase() + w.slice(1).toLowerCase()).join(' ') : '';\nconst cleanText = t => t ? t.trim().replace(/\\s+/g, ' ') : '';\n\ncleanedRows = cleanedRows.map(row => {\n const cleaned = {};\n Object.keys(row).forEach(key => {\n let value = row[key];\n if (key.includes('email')) cleaned[key] = cleanEmail(value);\n else if (key.includes('phone')) cleaned[key] = cleanPhone(value);\n else if (key.includes('name')) cleaned[key] = cleanName(value);\n else cleaned[key] = cleanText(value);\n });\n cleaned._data_quality_score = Math.round((Object.values(cleaned).filter(v => v).length / Object.keys(cleaned).length) * 100);\n return cleaned;\n});\n\nconst highQualityRows = cleanedRows.filter(r => r._data_quality_score >= 30);\n\nreturn {\n json: {\n ...data,\n cleaned_rows: highQualityRows,\n cleaning_summary: {\n original_count: data.parsed_row_count,\n after_cleaning: highQualityRows.length,\n average_quality_score: Math.round(highQualityRows.reduce((s, r) => s + r._data_quality_score, 0) / highQualityRows.length)\n },\n processing_completed: new Date().toISOString()\n }\n};"
},
"typeVersion": 2
},
{
"id": "c5d3faa0-0c48-4782-b436-2c51c39ec39a",
"name": "生成干净 CSV",
"type": "n8n-nodes-base.code",
"position": [
640,
160
],
"parameters": {
"jsCode": "// Generate cleaned CSV\nconst data = $input.first().json;\nconst headers = data.headers;\nconst cleanedRows = data.cleaned_rows;\n\nlet csvContent = headers.join(',') + '\\n';\ncsvContent += cleanedRows.map(r => headers.map(h => r[h] || '').join(',')).join('\\n');\n\nconst cleanedFilename = `cleaned_${Date.now()}_${data.filename}`;\n\nreturn {\n json: { ...data, cleaned_csv_content: csvContent, cleaned_filename: cleanedFilename },\n binary: {\n data: Buffer.from(csvContent, 'utf8'),\n fileName: cleanedFilename,\n mimeType: 'text/csv'\n }\n};"
},
"typeVersion": 2
},
{
"id": "56a06147-0e57-44aa-8c24-20e284486bbe",
"name": "保存到 Google Drive",
"type": "n8n-nodes-base.googleDrive",
"position": [
848,
80
],
"parameters": {
"name": "={{ $json.cleaned_filename }}",
"driveId": {
"__rl": true,
"mode": "list",
"value": "My Drive"
},
"options": {},
"folderId": {
"__rl": true,
"mode": "list",
"value": "root",
"cachedResultName": "/ (Root folder)"
}
},
"credentials": {
"googleDriveOAuth2Api": {
"id": "IPz4dCJVFC8uaoHw",
"name": "Google Drive account 2"
}
},
"typeVersion": 3
},
{
"id": "3b1b4bd8-3c65-4ed9-b87c-f6a5885d1712",
"name": "清空现有表格",
"type": "n8n-nodes-base.googleSheets",
"position": [
848,
240
],
"parameters": {
"operation": "clear",
"sheetName": "Sheet1",
"documentId": "YOUR_GOOGLE_SHEET_ID"
},
"typeVersion": 4
},
{
"id": "a856710d-317a-4d97-92f0-2946c91511ec",
"name": "准备表格数据",
"type": "n8n-nodes-base.code",
"position": [
1040,
240
],
"parameters": {
"jsCode": "// Prepare data for Google Sheets\nconst data = $input.first().json;\nreturn data.cleaned_rows.map(r => ({ json: r }));"
},
"typeVersion": 2
},
{
"id": "d1e73fbe-6d7c-47df-8e74-02d4b3ce7fa8",
"name": "导入到 Google Sheets",
"type": "n8n-nodes-base.googleSheets",
"position": [
1248,
240
],
"parameters": {
"options": {},
"operation": "append",
"sheetName": "Sheet1",
"documentId": "YOUR_GOOGLE_SHEET_ID"
},
"typeVersion": 4
}
],
"pinData": {},
"connections": {
"Parse CSV Data": {
"main": [
[
{
"node": "Clean & Standardize Data",
"type": "main",
"index": 0
}
]
]
},
"CSV Upload Webhook": {
"main": [
[
{
"node": "Extract CSV Content",
"type": "main",
"index": 0
}
]
]
},
"Generate Clean CSV": {
"main": [
[
{
"node": "Save to Google Drive",
"type": "main",
"index": 0
},
{
"node": "Clear Existing Sheet",
"type": "main",
"index": 0
}
]
]
},
"Prepare for Sheets": {
"main": [
[
{
"node": "Import to Google Sheets",
"type": "main",
"index": 0
}
]
]
},
"Extract CSV Content": {
"main": [
[
{
"node": "Parse CSV Data",
"type": "main",
"index": 0
}
]
]
},
"Clear Existing Sheet": {
"main": [
[
{
"node": "Prepare for Sheets",
"type": "main",
"index": 0
}
]
]
},
"Clean & Standardize Data": {
"main": [
[
{
"node": "Generate Clean CSV",
"type": "main",
"index": 0
}
]
]
}
}
}常见问题
如何使用这个工作流?
复制上方的 JSON 配置代码,在您的 n8n 实例中创建新工作流并选择「从 JSON 导入」,粘贴配置后根据需要修改凭证设置即可。
这个工作流适合什么场景?
中级 - 文档提取, 多模态 AI
需要付费吗?
本工作流完全免费,您可以直接导入使用。但请注意,工作流中使用的第三方服务(如 OpenAI API)可能需要您自行付费。
相关工作流推荐
自动将新Calendly预约添加到Google表格
自动将新Calendly预约添加到Google表格
Code
Webhook
Google Sheets
+1
5 节点David Olusola
客户关系管理
自动保存Instagram潜在客户到Google表格
自动保存Instagram潜在客户到Google表格
Code
Webhook
Google Sheets
+1
4 节点David Olusola
潜在客户开发
自动保存Zoom录制到Google云端硬盘并在Airtable记录会议
自动保存Zoom录制到Google云端硬盘并在Airtable记录会议
Code
Webhook
Airtable
+3
7 节点David Olusola
文件管理
使用Google套件、PDF和邮件自动化商业保险提交
通过Google套件、PDF和邮件自动化商业保险提交流程
If
Set
Code
+10
37 节点David Olusola
文档提取
使用Postiz自动创建AI新闻视频并发布到社交媒体
使用GPT-4o和HeyGen创建AI新闻视频并发布到社交媒体
Set
Code
Wait
+10
37 节点David Olusola
内容创作
太阳能潜在客户资质审核
使用Google Sheets和Gmail自动化太阳能潜在客户资质审核与跟进
If
Code
Gmail
+6
17 节点David Olusola
销售
工作流信息
难度等级
中级
节点数量10
分类2
节点类型5
作者
David Olusola
@dae221I help ambitious businesses eliminate operational bottlenecks and scale faster with AI automation. My clients typically see 40-60% efficiency gains within 90 days. Currently accepting 3 new projects this quarter - david@daexai.com
外部链接
在 n8n.io 查看 →
分享此工作流