From aa81562716a6863e4f9eaba7a926bdac8ceafee1 Mon Sep 17 00:00:00 2001 From: Li Liu Date: Mon, 3 Sep 2018 11:08:57 +0800 Subject: [PATCH] add solution template examples --- .../ForeachFilePartitionCopy.json | 231 ++++++++++++++++++ .../ForeachFilePartitionCopy/manifest.json | 5 + .../ForeachTablePartitionCopy.json | 215 ++++++++++++++++ .../ForeachTablePartitionCopy/manifest.json | 5 + 4 files changed, 456 insertions(+) create mode 100644 templates/ForeachFilePartitionCopy/ForeachFilePartitionCopy.json create mode 100644 templates/ForeachFilePartitionCopy/manifest.json create mode 100644 templates/ForeachTablePartitionCopy/ForeachTablePartitionCopy.json create mode 100644 templates/ForeachTablePartitionCopy/manifest.json diff --git a/templates/ForeachFilePartitionCopy/ForeachFilePartitionCopy.json b/templates/ForeachFilePartitionCopy/ForeachFilePartitionCopy.json new file mode 100644 index 0000000..e5f2a65 --- /dev/null +++ b/templates/ForeachFilePartitionCopy/ForeachFilePartitionCopy.json @@ -0,0 +1,231 @@ +{ + "$schema": "http://schema.management.azure.com/schemas/2015-01-01/deploymentTemplate.json#", + "contentVersion": "1.0.0.0", + "parameters": { + "factoryName": { + "type": "string", + "metadata": "Data Factory Name", + "defaultValue": "liliuMadridTestGit" + }, + "AzureBlobSource_properties_typeProperties_fileName": { + "type": "string", + "defaultValue": "@dataset().file" + }, + "AzureBlobSource_properties_typeProperties_folderPath": { + "type": "string", + "defaultValue": "@dataset().folder" + }, + "AzureBlobSink_properties_typeProperties_fileName": { + "type": "string", + "defaultValue": "" + }, + "AzureBlobSink_properties_typeProperties_folderPath": { + "type": "string", + "defaultValue": "@dataset().folder" + }, + "AzureBlobSource_properties_linkedServiceName": { + "type": "string", + "metadata": { + "linkedServiceType": "AzureBlobStorage" + } + }, + "AzureBlobSink_properties_linkedServiceName": { + "type": "string", + "metadata": { + "linkedServiceType": "AzureBlobStorage" + } + } + }, + "variables": { + "factoryId": "[concat('Microsoft.DataFactory/factories/', parameters('factoryName'))]" + }, + "resources": [ + { + "name": "[concat(parameters('factoryName'), '/ForeachFilePartitionCopy')]", + "type": "Microsoft.DataFactory/factories/pipelines", + "apiVersion": "2018-06-01", + "properties": { + "description": "Copying a large number of files between file-based storages template", + "activities": [ + { + "name": "GetPartitionList", + "description": "get item list", + "type": "GetMetadata", + "policy": { + "timeout": "7.00:00:00", + "retry": 0, + "retryIntervalInSeconds": 30, + "secureOutput": false, + "secureInput": false + }, + "typeProperties": { + "dataset": { + "referenceName": "AzureBlobSource", + "type": "DatasetReference", + "parameters": { + "folder": { + "value": "@pipeline().parameters.sourceFolder", + "type": "Expression" + }, + "file": " " + } + }, + "fieldList": [ + "childItems" + ] + } + }, + { + "name": "ForEachPartition", + "description": "copy for each item", + "type": "ForEach", + "dependsOn": [ + { + "activity": "GetPartitionList", + "dependencyConditions": [ + "Succeeded" + ] + } + ], + "typeProperties": { + "items": { + "value": "@activity('GetPartitionList').output.childItems", + "type": "Expression" + }, + "batchCount": 10, + "activities": [ + { + "name": "CopyOnePartition", + "description": "Do the copy", + "type": "Copy", + "policy": { + "timeout": "7.00:00:00", + "retry": 0, + "retryIntervalInSeconds": 30, + "secureOutput": false, + "secureInput": false + }, + "userProperties": [ + { + "name": "Source", + "value": "@{item().name}/" + }, + { + "name": "Destination", + "value": "@{item().name}/" + } + ], + "typeProperties": { + "source": { + "type": "BlobSource", + "recursive": true + }, + "sink": { + "type": "BlobSink" + }, + "enableStaging": false, + "dataIntegrationUnits": 0 + }, + "inputs": [ + { + "referenceName": "AzureBlobSource", + "type": "DatasetReference", + "parameters": { + "folder": { + "value": "@pipeline().parameters.sourceFolder", + "type": "Expression" + }, + "file": { + "value": "@item().name", + "type": "Expression" + } + } + } + ], + "outputs": [ + { + "referenceName": "AzureBlobSink", + "type": "DatasetReference", + "parameters": { + "folder": { + "value": "@pipeline().parameters.sinkFolder", + "type": "Expression" + } + } + } + ] + } + ] + } + } + ], + "parameters": { + "sourceFolder": { + "type": "String" + }, + "sinkFolder": { + "type": "String" + } + } + }, + "dependsOn": [ + "[concat(variables('factoryId'), '/datasets/AzureBlobSource')]", + "[concat(variables('factoryId'), '/datasets/AzureBlobSink')]" + ] + }, + { + "name": "[concat(parameters('factoryName'), '/AzureBlobSource')]", + "type": "Microsoft.DataFactory/factories/datasets", + "apiVersion": "2018-06-01", + "properties": { + "linkedServiceName": { + "referenceName": "[parameters('AzureBlobSource_properties_linkedServiceName')]", + "type": "LinkedServiceReference" + }, + "parameters": { + "folder": { + "type": "String" + }, + "file": { + "type": "String" + } + }, + "type": "AzureBlob", + "typeProperties": { + "fileName": { + "value": "[parameters('AzureBlobSource_properties_typeProperties_fileName')]", + "type": "Expression" + }, + "folderPath": { + "value": "[parameters('AzureBlobSource_properties_typeProperties_folderPath')]", + "type": "Expression" + } + } + } + }, + { + "name": "[concat(parameters('factoryName'), '/AzureBlobSink')]", + "type": "Microsoft.DataFactory/factories/datasets", + "apiVersion": "2018-06-01", + "properties": { + "linkedServiceName": { + "referenceName": "[parameters('AzureBlobSink_properties_linkedServiceName')]", + "type": "LinkedServiceReference" + }, + "parameters": { + "folder": { + "type": "String" + } + }, + "type": "AzureBlob", + "typeProperties": { + "fileName": "[parameters('AzureBlobSink_properties_typeProperties_fileName')]", + "folderPath": { + "value": "[parameters('AzureBlobSink_properties_typeProperties_folderPath')]", + "type": "Expression" + } + } + } + } + ] +} \ No newline at end of file diff --git a/templates/ForeachFilePartitionCopy/manifest.json b/templates/ForeachFilePartitionCopy/manifest.json new file mode 100644 index 0000000..c139a82 --- /dev/null +++ b/templates/ForeachFilePartitionCopy/manifest.json @@ -0,0 +1,5 @@ +{ + "name": "ForeachFilePartitionCopy", + "description": "Copying a large number of files between file-based storages template", + "image": "" +} \ No newline at end of file diff --git a/templates/ForeachTablePartitionCopy/ForeachTablePartitionCopy.json b/templates/ForeachTablePartitionCopy/ForeachTablePartitionCopy.json new file mode 100644 index 0000000..317c58f --- /dev/null +++ b/templates/ForeachTablePartitionCopy/ForeachTablePartitionCopy.json @@ -0,0 +1,215 @@ +{ + "$schema": "http://schema.management.azure.com/schemas/2015-01-01/deploymentTemplate.json#", + "contentVersion": "1.0.0.0", + "parameters": { + "factoryName": { + "type": "string", + "metadata": "Data Factory Name", + "defaultValue": "liliuMadridTestGit" + }, + "AzureBlobDestination_properties_typeProperties_folderPath": { + "type": "string", + "defaultValue": "@dataset().folder" + }, + "AzureSqlTableLookup_properties_linkedServiceName": { + "type": "string", + "metadata": { + "linkedServiceType": "AzureSqlDatabase" + } + }, + "AzureSqlTableSource_properties_linkedServiceName": { + "type": "string", + "metadata": { + "linkedServiceType": "AzureSqlDatabase" + } + }, + "AzureBlobDestination_properties_linkedServiceName": { + "type": "string", + "metadata": { + "linkedServiceType": "AzureBlobStorage" + } + } + }, + "variables": { + "factoryId": "[concat('Microsoft.DataFactory/factories/', parameters('factoryName'))]" + }, + "resources": [ + { + "name": "[concat(parameters('factoryName'), '/ForeachTablePartitionCopy')]", + "type": "Microsoft.DataFactory/factories/pipelines", + "apiVersion": "2018-06-01", + "properties": { + "activities": [ + { + "name": "ForEachPartition", + "type": "ForEach", + "dependsOn": [ + { + "activity": "GetPartitionList", + "dependencyConditions": [ + "Succeeded" + ] + } + ], + "typeProperties": { + "items": { + "value": "@activity('GetPartitionList').output.value", + "type": "Expression" + }, + "batchCount": 10, + "activities": [ + { + "name": "CopyOnePartition", + "description": "Do the real copy", + "type": "Copy", + "policy": { + "timeout": "7.00:00:00", + "retry": 0, + "retryIntervalInSeconds": 30, + "secureOutput": false, + "secureInput": false + }, + "typeProperties": { + "source": { + "type": "SqlSource" + }, + "sink": { + "type": "BlobSink" + }, + "enableStaging": false, + "dataIntegrationUnits": 0 + }, + "inputs": [ + { + "referenceName": "AzureSqlTableSource", + "type": "DatasetReference", + "parameters": { + "tableName": { + "value": "[concat('[', '@{item().TABLE_SCHEMA}].[@{item().TABLE_NAME}]')]", + "type": "Expression" + } + } + } + ], + "outputs": [ + { + "referenceName": "AzureBlobDestination", + "type": "DatasetReference", + "parameters": { + "folder": { + "value": "@pipeline().parameters.sinkFolder", + "type": "Expression" + } + } + } + ] + } + ] + } + }, + { + "name": "GetPartitionList", + "type": "Lookup", + "policy": { + "timeout": "7.00:00:00", + "retry": 0, + "retryIntervalInSeconds": 30, + "secureOutput": false, + "secureInput": false + }, + "typeProperties": { + "source": { + "type": "SqlSource", + "sqlReaderQuery": "SELECT TABLE_SCHEMA, TABLE_NAME FROM information_schema.TABLES" + }, + "dataset": { + "referenceName": "AzureSqlTableLookup", + "type": "DatasetReference" + }, + "firstRowOnly": false + } + } + ], + "parameters": { + "sinkFolder": { + "type": "String" + } + } + }, + "dependsOn": [ + "[concat(variables('factoryId'), '/datasets/AzureSqlTableLookup')]", + "[concat(variables('factoryId'), '/datasets/AzureSqlTableSource')]", + "[concat(variables('factoryId'), '/datasets/AzureBlobDestination')]" + ] + }, + { + "name": "[concat(parameters('factoryName'), '/AzureSqlTableLookup')]", + "type": "Microsoft.DataFactory/factories/datasets", + "apiVersion": "2018-06-01", + "properties": { + "description": "Data source for lookup activity, should has the same linked service with AzureSqlTableSource", + "linkedServiceName": { + "referenceName": "[parameters('AzureSqlTableLookup_properties_linkedServiceName')]", + "type": "LinkedServiceReference" + }, + "type": "AzureSqlTable" + } + }, + { + "name": "[concat(parameters('factoryName'), '/AzureSqlTableSource')]", + "type": "Microsoft.DataFactory/factories/datasets", + "apiVersion": "2018-06-01", + "properties": { + "description": "Data source for copy activity, should has the same linked service with AzureSqlTableLookup", + "linkedServiceName": { + "referenceName": "[parameters('AzureSqlTableSource_properties_linkedServiceName')]", + "type": "LinkedServiceReference" + }, + "parameters": { + "tableName": { + "type": "String" + } + }, + "type": "AzureSqlTable", + "typeProperties": { + "tableName": { + "value": "@dataset().tableName", + "type": "Expression" + } + } + } + }, + { + "name": "[concat(parameters('factoryName'), '/AzureBlobDestination')]", + "type": "Microsoft.DataFactory/factories/datasets", + "apiVersion": "2018-06-01", + "properties": { + "linkedServiceName": { + "referenceName": "[parameters('AzureBlobDestination_properties_linkedServiceName')]", + "type": "LinkedServiceReference" + }, + "parameters": { + "folder": { + "type": "String" + } + }, + "type": "AzureBlob", + "typeProperties": { + "format": { + "type": "TextFormat", + "columnDelimiter": ",", + "rowDelimiter": "", + "nullValue": "\\N", + "treatEmptyAsNull": true, + "skipLineCount": 0, + "firstRowAsHeader": false + }, + "folderPath": { + "value": "[parameters('AzureBlobDestination_properties_typeProperties_folderPath')]", + "type": "Expression" + } + } + } + } + ] +} \ No newline at end of file diff --git a/templates/ForeachTablePartitionCopy/manifest.json b/templates/ForeachTablePartitionCopy/manifest.json new file mode 100644 index 0000000..84e6065 --- /dev/null +++ b/templates/ForeachTablePartitionCopy/manifest.json @@ -0,0 +1,5 @@ +{ + "name": "ForeachTablePartitionCopy", + "description": "Table partition foreach", + "image": "" +} \ No newline at end of file