Skip to content

Commit

Permalink
Update Data Downloader Sample
Browse files: browse the repository at this point in the history
Align with latest SDK release
  • Loading branch information
gauravmalhot committed Jul 21, 2015
1 parent 3814571 commit 0fd9dd1
Show file tree
Hide file tree
Showing 4 changed files with 78 additions and 77 deletions.
Original file line number | Diff line number | Diff line change
@@ -1,11 +1,12 @@
{
"name": "HDInsightLinkedService",
"properties":
{
"type": "HDInsightBYOCLinkedService",
"clusterUri": "<>",
"userName": "<>",
"password": "<>",
"linkedServiceName": "RawEventsLinkedService"
"name": "HDInsightLinkedService",
"properties": {
"type": "HDInsight",
"typeProperties": {
"clusterUri": "<>",
"userName": "<>",
"password": "<>",
"linkedServiceName": "RawEventsLinkedService"
}
}
}
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,9 @@
{
"name": "RawEventsLinkedService",
"properties":
{
"type": "AzureStorageLinkedService",
"connectionString": "DefaultEndpointsProtocol=https;AccountName=<>;AccountKey=<>"
"name": "RawEventsLinkedService",
"properties": {
"type": "AzureStorage",
"typeProperties": {
"connectionString": "DefaultEndpointsProtocol=https;AccountName=<>;AccountKey=<>"
}
}
}
}
Original file line number | Diff line number | Diff line change
@@ -1,41 +1,40 @@
{
"name": "DataDownloaderSamplePipeline",
"properties":
{
"description" : "Custom Data Downloader from an HTTP EndPoint Sample Pipeline",
"activities":
[
{
"name": "DownloadData",
"description": "Download raw data from an http endpoint",
"outputs": [ {"name": "RawEventsTable"} ],
"linkedServiceName": "HDInsightLinkedService",
"type": "DotNetActivity",
"transformation":
{
"assemblyName": "DataDownloaderActivity.dll",
"entryPoint": "DataDownloaderActivityNS.DataDownloaderActivity",
"packageLinkedService": "RawEventsLinkedService",
"packageFile": "<container>/package/DataDownloaderActivity.zip",
"extendedProperties":
{
"sliceStart": "$$Text.Format('{0:yyyyMMddHHmm}', Time.AddMinutes(SliceStart, 0))",
"urlFormat": "http://dumps.wikimedia.org/other/pagecounts-raw/{0}/{0}-{1}/pagecounts-{0}{1}{2}-{3}00{4}.gz",
"dataStorageAccountName": "<>",
"dataStorageAccountKey": "<>",
"dataStorageContainer": "<>",
}
},
"policy":
{
"concurrency": 1,
"executionPriorityOrder": "OldestFirst",
"retry": 2,
"timeout": "00:30:00"
},
},
"name": "DataDownloaderSamplePipeline",
"properties": {
"description": "Custom Data Downloader from an HTTP EndPoint Sample Pipeline",
"activities": [
{
"name": "DownloadData",
"description": "Download raw data from an http endpoint",
"outputs": [
{
"name": "RawEventsTable"
}
],
"start": "2015-03-08T00:00:00Z",
"end": "9999-09-09T00:00:00Z"
}
}
"linkedServiceName": "HDInsightLinkedService",
"type": "DotNetActivity",
"typeProperties": {
"assemblyName": "DataDownloaderActivity.dll",
"entryPoint": "DataDownloaderActivityNS.DataDownloaderActivity",
"packageLinkedService": "RawEventsLinkedService",
"packageFile": "<container>/package/DataDownloaderActivity.zip",
"defines": {
"sliceStart": "$$Text.Format('{0:yyyyMMddHHmm}', Time.AddMinutes(SliceStart, 0))",
"urlFormat": "http://dumps.wikimedia.org/other/pagecounts-raw/{0}/{0}-{1}/pagecounts-{0}{1}{2}-{3}00{4}.gz",
"dataStorageAccountName": "<>",
"dataStorageAccountKey": "<>",
"dataStorageContainer": "<>"
}
},
"policy": {
"concurrency": 1,
"executionPriorityOrder": "OldestFirst",
"retry": 2,
"timeout": "00:30:00"
}
}
],
"start": "2015-03-08T00:00:00Z",
"end": "9999-09-09T00:00:00Z"
}
}
48 changes: 24 additions & 24 deletions Samples/HttpDataDownloaderSample/Tables/RawEventsTable.json
Original file line number | Diff line number | Diff line change
@@ -1,24 +1,24 @@
{
"name":"RawEventsTable",
"properties":{
"location":{
"type":"AzureBlobLocation",
"folderPath":"<Container>/httpDownloadDataIn/{Slice}/",
"partitionedBy":[
{
"name":"Slice",
"value":{
"type":"DateTime",
"date":"SliceStart",
"format":"yyyyMMddHHmm"
}
}
],
"linkedServiceName":"RawEventsLinkedService"
},
"availability":{
"frequency":"Hour",
"interval":1
}
}
}
{
"name": "RawEventsTable",
"properties": {
"type": "AzureBlob",
"linkedServiceName": "RawEventsLinkedService",
"typeProperties": {
"folderPath": "<Container>/httpDownloadDataIn/{Slice}/",
"partitionedBy": [
{
"name": "Slice",
"value": {
"type": "DateTime",
"date": "SliceStart",
"format": "yyyyMMddHHmm"
}
}
]
},
"availability": {
"frequency": "Hour",
"interval": 1
}
}
}

0 comments on commit 0fd9dd1

Please sign in to comment.