Skip to content

Instantly share code, notes, and snippets.

@tdonovic
Created March 18, 2018 21:49
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save tdonovic/fa9a6d47c6761e3930ebe951706d0fa6 to your computer and use it in GitHub Desktop.
Save tdonovic/fa9a6d47c6761e3930ebe951706d0fa6 to your computer and use it in GitHub Desktop.
{
"schemaVersion": 5,
"version": 8,
"pipelineId": "yb321a43a-70ce-446a-af31-d18bfbaf5094",
"title": "y",
"description": "",
"uuid": "76e17b70-b7ea-4782-a37d-32802ce1b27c",
"configuration": [
{
"name": "executionMode",
"value": "STANDALONE"
},
{
"name": "deliveryGuarantee",
"value": "AT_LEAST_ONCE"
},
{
"name": "startEventStage",
"value": "streamsets-datacollector-basic-lib::com_streamsets_pipeline_stage_destination_devnull_ToErrorNullDTarget::1"
},
{
"name": "stopEventStage",
"value": "streamsets-datacollector-basic-lib::com_streamsets_pipeline_stage_destination_devnull_ToErrorNullDTarget::1"
},
{
"name": "shouldRetry",
"value": true
},
{
"name": "retryAttempts",
"value": -1
},
{
"name": "memoryLimit",
"value": "${jvm:maxMemoryMB() * 0.85}"
},
{
"name": "memoryLimitExceeded",
"value": "LOG"
},
{
"name": "notifyOnStates",
"value": [
"RUN_ERROR",
"STOPPED",
"FINISHED"
]
},
{
"name": "emailIDs",
"value": []
},
{
"name": "constants",
"value": []
},
{
"name": "badRecordsHandling",
"value": "streamsets-datacollector-basic-lib::com_streamsets_pipeline_stage_destination_devnull_ToErrorNullDTarget::1"
},
{
"name": "errorRecordPolicy",
"value": "ORIGINAL_RECORD"
},
{
"name": "workerCount",
"value": 0
},
{
"name": "clusterSlaveMemory",
"value": 2048
},
{
"name": "clusterSlaveJavaOpts",
"value": "-XX:+UseConcMarkSweepGC -XX:+UseParNewGC -Dlog4j.debug"
},
{
"name": "clusterLauncherEnv",
"value": []
},
{
"name": "mesosDispatcherURL",
"value": null
},
{
"name": "hdfsS3ConfDir",
"value": null
},
{
"name": "rateLimit",
"value": 0
},
{
"name": "maxRunners",
"value": 0
},
{
"name": "shouldCreateFailureSnapshot",
"value": true
},
{
"name": "webhookConfigs",
"value": []
},
{
"name": "sparkConfigs",
"value": []
},
{
"name": "statsAggregatorStage",
"value": ""
}
],
"uiInfo": {
"previewConfig": {
"previewSource": "CONFIGURED_SOURCE",
"batchSize": 10,
"timeout": 10000,
"writeToDestinations": false,
"executeLifecycleEvents": false,
"showHeader": false,
"showFieldType": true,
"rememberMe": false
}
},
"stages": [
{
"instanceName": "Directory_01",
"library": "streamsets-datacollector-basic-lib",
"stageName": "com_streamsets_pipeline_stage_origin_spooldir_SpoolDirDSource",
"stageVersion": "9",
"configuration": [
{
"name": "conf.dataFormatConfig.compression",
"value": "NONE"
},
{
"name": "conf.dataFormatConfig.filePatternInArchive",
"value": "*"
},
{
"name": "conf.dataFormatConfig.charset",
"value": "UTF-8"
},
{
"name": "conf.dataFormatConfig.removeCtrlChars",
"value": false
},
{
"name": "conf.dataFormatConfig.textMaxLineLen",
"value": 1024
},
{
"name": "conf.dataFormatConfig.useCustomDelimiter",
"value": false
},
{
"name": "conf.dataFormatConfig.customDelimiter",
"value": "\\r\\n"
},
{
"name": "conf.dataFormatConfig.includeCustomDelimiterInTheText",
"value": false
},
{
"name": "conf.dataFormatConfig.jsonContent",
"value": "MULTIPLE_OBJECTS"
},
{
"name": "conf.dataFormatConfig.jsonMaxObjectLen",
"value": 4096
},
{
"name": "conf.dataFormatConfig.csvFileFormat",
"value": "CSV"
},
{
"name": "conf.dataFormatConfig.csvHeader",
"value": "NO_HEADER"
},
{
"name": "conf.dataFormatConfig.csvAllowExtraColumns",
"value": false
},
{
"name": "conf.dataFormatConfig.csvExtraColumnPrefix",
"value": "_extra_"
},
{
"name": "conf.dataFormatConfig.csvMaxObjectLen",
"value": 1024
},
{
"name": "conf.dataFormatConfig.csvCustomDelimiter",
"value": "|"
},
{
"name": "conf.dataFormatConfig.csvCustomEscape",
"value": "\\"
},
{
"name": "conf.dataFormatConfig.csvCustomQuote",
"value": "\""
},
{
"name": "conf.dataFormatConfig.csvEnableComments",
"value": false
},
{
"name": "conf.dataFormatConfig.csvCommentMarker",
"value": "#"
},
{
"name": "conf.dataFormatConfig.csvIgnoreEmptyLines",
"value": true
},
{
"name": "conf.dataFormatConfig.csvRecordType",
"value": "LIST_MAP"
},
{
"name": "conf.dataFormatConfig.csvSkipStartLines",
"value": 0
},
{
"name": "conf.dataFormatConfig.parseNull",
"value": false
},
{
"name": "conf.dataFormatConfig.nullConstant",
"value": "\\\\N"
},
{
"name": "conf.dataFormatConfig.xmlRecordElement",
"value": null
},
{
"name": "conf.dataFormatConfig.includeFieldXpathAttributes",
"value": false
},
{
"name": "conf.dataFormatConfig.xPathNamespaceContext",
"value": []
},
{
"name": "conf.dataFormatConfig.outputFieldAttributes",
"value": false
},
{
"name": "conf.dataFormatConfig.xmlMaxObjectLen",
"value": 4096
},
{
"name": "conf.dataFormatConfig.logMode",
"value": "COMMON_LOG_FORMAT"
},
{
"name": "conf.dataFormatConfig.logMaxObjectLen",
"value": 1024
},
{
"name": "conf.dataFormatConfig.retainOriginalLine",
"value": false
},
{
"name": "conf.dataFormatConfig.customLogFormat",
"value": "%h %l %u %t \"%r\" %>s %b"
},
{
"name": "conf.dataFormatConfig.regex",
"value": "^(\\S+) (\\S+) (\\S+) \\[([\\w:/]+\\s[+\\-]\\d{4})\\] \"(\\S+) (\\S+) (\\S+)\" (\\d{3}) (\\d+)"
},
{
"name": "conf.dataFormatConfig.fieldPathsToGroupName",
"value": [
{
"fieldPath": "/",
"group": 1
}
]
},
{
"name": "conf.dataFormatConfig.grokPatternDefinition",
"value": null
},
{
"name": "conf.dataFormatConfig.grokPattern",
"value": "%{COMMONAPACHELOG}"
},
{
"name": "conf.dataFormatConfig.onParseError",
"value": "ERROR"
},
{
"name": "conf.dataFormatConfig.maxStackTraceLines",
"value": 50
},
{
"name": "conf.dataFormatConfig.enableLog4jCustomLogFormat",
"value": false
},
{
"name": "conf.dataFormatConfig.log4jCustomLogFormat",
"value": "%r [%t] %-5p %c %x - %m%n"
},
{
"name": "conf.dataFormatConfig.avroSchema",
"value": null
},
{
"name": "conf.dataFormatConfig.schemaRegistryUrls",
"value": []
},
{
"name": "conf.dataFormatConfig.schemaLookupMode",
"value": "SUBJECT"
},
{
"name": "conf.dataFormatConfig.subject",
"value": null
},
{
"name": "conf.dataFormatConfig.schemaId",
"value": null
},
{
"name": "conf.dataFormatConfig.protoDescriptorFile",
"value": null
},
{
"name": "conf.dataFormatConfig.messageType",
"value": null
},
{
"name": "conf.dataFormatConfig.isDelimited",
"value": true
},
{
"name": "conf.dataFormatConfig.binaryMaxObjectLen",
"value": 1024
},
{
"name": "conf.dataFormatConfig.datagramMode",
"value": "SYSLOG"
},
{
"name": "conf.dataFormatConfig.typesDbPath",
"value": null
},
{
"name": "conf.dataFormatConfig.convertTime",
"value": false
},
{
"name": "conf.dataFormatConfig.excludeInterval",
"value": true
},
{
"name": "conf.dataFormatConfig.authFilePath",
"value": null
},
{
"name": "conf.dataFormatConfig.netflowOutputValuesMode",
"value": "RAW_AND_INTERPRETED"
},
{
"name": "conf.dataFormatConfig.maxTemplateCacheSize",
"value": -1
},
{
"name": "conf.dataFormatConfig.templateCacheTimeoutMs",
"value": -1
},
{
"name": "conf.dataFormatConfig.netflowOutputValuesModeDatagram",
"value": "RAW_AND_INTERPRETED"
},
{
"name": "conf.dataFormatConfig.maxTemplateCacheSizeDatagram",
"value": -1
},
{
"name": "conf.dataFormatConfig.templateCacheTimeoutMsDatagram",
"value": -1
},
{
"name": "conf.dataFormatConfig.wholeFileMaxObjectLen",
"value": 8192
},
{
"name": "conf.dataFormatConfig.rateLimit",
"value": "-1"
},
{
"name": "conf.dataFormat",
"value": "WHOLE_FILE"
},
{
"name": "conf.spoolDir",
"value": "/opt/streamsets-datacollector-3.1.0.0/resources"
},
{
"name": "conf.numberOfThreads",
"value": 1
},
{
"name": "conf.pathMatcherMode",
"value": "GLOB"
},
{
"name": "conf.filePattern",
"value": "*"
},
{
"name": "conf.useLastModified",
"value": "LEXICOGRAPHICAL"
},
{
"name": "conf.processSubdirectories",
"value": false
},
{
"name": "conf.allowLateDirectory",
"value": false
},
{
"name": "conf.overrunLimit",
"value": 128
},
{
"name": "conf.batchSize",
"value": 1000
},
{
"name": "conf.poolingTimeoutSecs",
"value": 60
},
{
"name": "conf.maxSpoolFiles",
"value": 1000
},
{
"name": "conf.initialFileToProcess",
"value": null
},
{
"name": "conf.errorArchiveDir",
"value": null
},
{
"name": "conf.postProcessing",
"value": "NONE"
},
{
"name": "conf.archiveDir",
"value": null
},
{
"name": "conf.retentionTimeMins",
"value": 0
},
{
"name": "stageOnRecordError",
"value": "TO_ERROR"
}
],
"uiInfo": {
"yPos": 50,
"stageType": "SOURCE",
"rawSource": {
"configuration": [
{
"name": "fileName"
}
]
},
"description": "",
"label": "Directory 1",
"xPos": 60
},
"inputLanes": [],
"outputLanes": [
"Directory_01OutputLane15210041827250"
],
"eventLanes": [],
"services": []
},
{
"instanceName": "SampleProcessor_01",
"library": "streamsets-datacollector-dev-lib",
"stageName": "com_example_stage_processor_sample_SampleDProcessor",
"stageVersion": "1",
"configuration": [
{
"name": "config",
"value": "default"
},
{
"name": "stageOnRecordError",
"value": "TO_ERROR"
},
{
"name": "stageRequiredFields",
"value": []
},
{
"name": "stageRecordPreconditions",
"value": []
}
],
"uiInfo": {
"description": "",
"label": "Sample Processor 1",
"xPos": 280,
"yPos": 50,
"stageType": "PROCESSOR"
},
"inputLanes": [
"Directory_01OutputLane15210041827250"
],
"outputLanes": [
"SampleProcessor_01OutputLane15210041887930"
],
"eventLanes": [],
"services": []
},
{
"instanceName": "FieldRemover_01",
"library": "streamsets-datacollector-basic-lib",
"stageName": "com_streamsets_pipeline_stage_processor_fieldfilter_FieldFilterDProcessor",
"stageVersion": "1",
"configuration": [
{
"name": "filterOperation",
"value": "REMOVE"
},
{
"name": "fields",
"value": [
"/fileRef"
]
},
{
"name": "stageRequiredFields",
"value": []
},
{
"name": "stageRecordPreconditions",
"value": []
}
],
"uiInfo": {
"description": "",
"label": "Field Remover 1",
"xPos": 479,
"yPos": 59,
"stageType": "PROCESSOR"
},
"inputLanes": [
"SampleProcessor_01OutputLane15210041887930"
],
"outputLanes": [
"FieldRemover_01OutputLane15210043027480"
],
"eventLanes": [],
"services": []
},
{
"instanceName": "LocalFS_01",
"library": "streamsets-datacollector-basic-lib",
"stageName": "com_streamsets_pipeline_stage_destination_localfilesystem_LocalFileSystemDTarget",
"stageVersion": "3",
"configuration": [
{
"name": "configs.uniquePrefix",
"value": "sdc-${sdc:id()}"
},
{
"name": "configs.fileNameSuffix",
"value": null
},
{
"name": "configs.dirPathTemplateInHeader",
"value": false
},
{
"name": "configs.dirPathTemplate",
"value": "/opt/streamsets-datacollector-3.1.0.0/streamsets-libs/tmp/out/${YYYY()}-${MM()}-${DD()}-${hh()}"
},
{
"name": "configs.timeZoneID",
"value": "UTC"
},
{
"name": "configs.timeDriver",
"value": "${time:now()}"
},
{
"name": "configs.maxRecordsPerFile",
"value": 0
},
{
"name": "configs.maxFileSize",
"value": 0
},
{
"name": "configs.idleTimeout",
"value": "${1 * HOURS}"
},
{
"name": "configs.compression",
"value": "NONE"
},
{
"name": "configs.otherCompression",
"value": null
},
{
"name": "configs.fileType",
"value": "TEXT"
},
{
"name": "configs.keyEl",
"value": "${uuid()}"
},
{
"name": "configs.lateRecordsLimit",
"value": "${1 * HOURS}"
},
{
"name": "configs.rollIfHeader",
"value": false
},
{
"name": "configs.rollHeaderName",
"value": "roll"
},
{
"name": "configs.lateRecordsAction",
"value": "SEND_TO_ERROR"
},
{
"name": "configs.lateRecordsDirPathTemplate",
"value": "/tmp/late/${YYYY()}-${MM()}-${DD()}"
},
{
"name": "configs.dataFormat",
"value": "JSON"
},
{
"name": "configs.hdfsPermissionCheck",
"value": true
},
{
"name": "configs.permissionEL",
"value": null
},
{
"name": "configs.skipOldTempFileRecovery",
"value": false
},
{
"name": "configs.dataGeneratorFormatConfig.charset",
"value": "UTF-8"
},
{
"name": "configs.dataGeneratorFormatConfig.csvFileFormat",
"value": "CSV"
},
{
"name": "configs.dataGeneratorFormatConfig.csvHeader",
"value": "NO_HEADER"
},
{
"name": "configs.dataGeneratorFormatConfig.csvReplaceNewLines",
"value": true
},
{
"name": "configs.dataGeneratorFormatConfig.csvReplaceNewLinesString",
"value": " "
},
{
"name": "configs.dataGeneratorFormatConfig.csvCustomDelimiter",
"value": "|"
},
{
"name": "configs.dataGeneratorFormatConfig.csvCustomEscape",
"value": "\\"
},
{
"name": "configs.dataGeneratorFormatConfig.csvCustomQuote",
"value": "\""
},
{
"name": "configs.dataGeneratorFormatConfig.jsonMode",
"value": "MULTIPLE_OBJECTS"
},
{
"name": "configs.dataGeneratorFormatConfig.textFieldPath",
"value": "/text"
},
{
"name": "configs.dataGeneratorFormatConfig.textRecordSeparator",
"value": "\\n"
},
{
"name": "configs.dataGeneratorFormatConfig.textFieldMissingAction",
"value": "ERROR"
},
{
"name": "configs.dataGeneratorFormatConfig.textEmptyLineIfNull",
"value": false
},
{
"name": "configs.dataGeneratorFormatConfig.avroSchemaSource",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.avroSchema",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.registerSchema",
"value": false
},
{
"name": "configs.dataGeneratorFormatConfig.schemaRegistryUrlsForRegistration",
"value": []
},
{
"name": "configs.dataGeneratorFormatConfig.schemaRegistryUrls",
"value": []
},
{
"name": "configs.dataGeneratorFormatConfig.schemaLookupMode",
"value": "SUBJECT"
},
{
"name": "configs.dataGeneratorFormatConfig.subject",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.subjectToRegister",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.schemaId",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.avroCompression",
"value": "NULL"
},
{
"name": "configs.dataGeneratorFormatConfig.binaryFieldPath",
"value": "/"
},
{
"name": "configs.dataGeneratorFormatConfig.protoDescriptorFile",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.messageType",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.fileNameEL",
"value": null
},
{
"name": "configs.dataGeneratorFormatConfig.wholeFileExistsAction",
"value": "TO_ERROR"
},
{
"name": "configs.dataGeneratorFormatConfig.includeChecksumInTheEvents",
"value": false
},
{
"name": "configs.dataGeneratorFormatConfig.checksumAlgorithm",
"value": "MD5"
},
{
"name": "configs.dataGeneratorFormatConfig.xmlPrettyPrint",
"value": true
},
{
"name": "configs.dataGeneratorFormatConfig.xmlValidateSchema",
"value": false
},
{
"name": "configs.dataGeneratorFormatConfig.xmlSchema",
"value": null
},
{
"name": "stageOnRecordError",
"value": "TO_ERROR"
},
{
"name": "stageRequiredFields",
"value": []
},
{
"name": "stageRecordPreconditions",
"value": []
}
],
"uiInfo": {
"description": "",
"label": "Local FS 1",
"xPos": 716,
"yPos": 50,
"stageType": "TARGET"
},
"inputLanes": [
"FieldRemover_01OutputLane15210043027480"
],
"outputLanes": [],
"eventLanes": [],
"services": []
}
],
"errorStage": {
"instanceName": "Discard_ErrorStage",
"library": "streamsets-datacollector-basic-lib",
"stageName": "com_streamsets_pipeline_stage_destination_devnull_ToErrorNullDTarget",
"stageVersion": "1",
"configuration": [],
"uiInfo": {
"description": "",
"label": "Error Records - Discard",
"xPos": 936,
"yPos": 50,
"stageType": "TARGET"
},
"inputLanes": [],
"outputLanes": [],
"eventLanes": [],
"services": []
},
"info": {
"pipelineId": "yb321a43a-70ce-446a-af31-d18bfbaf5094",
"title": "y",
"description": "",
"created": 1521004179115,
"lastModified": 1521004372840,
"creator": "admin",
"lastModifier": "admin",
"lastRev": "0",
"uuid": "76e17b70-b7ea-4782-a37d-32802ce1b27c",
"valid": true,
"metadata": {
"labels": []
},
"name": "yb321a43a-70ce-446a-af31-d18bfbaf5094",
"sdcVersion": "3.1.0.0",
"sdcId": "c81ab400-2745-11e8-a37e-819939cc1bbe"
},
"metadata": {
"labels": []
},
"statsAggregatorStage": null,
"startEventStages": [
{
"instanceName": "Discard_StartEventStage",
"library": "streamsets-datacollector-basic-lib",
"stageName": "com_streamsets_pipeline_stage_destination_devnull_ToErrorNullDTarget",
"stageVersion": "1",
"configuration": [],
"uiInfo": {
"description": "",
"label": "Start Event - Discard",
"xPos": 280,
"yPos": 50,
"stageType": "TARGET"
},
"inputLanes": [],
"outputLanes": [],
"eventLanes": [],
"services": []
}
],
"stopEventStages": [
{
"instanceName": "Discard_StopEventStage",
"library": "streamsets-datacollector-basic-lib",
"stageName": "com_streamsets_pipeline_stage_destination_devnull_ToErrorNullDTarget",
"stageVersion": "1",
"configuration": [],
"uiInfo": {
"description": "",
"label": "Stop Event - Discard",
"xPos": 280,
"yPos": 50,
"stageType": "TARGET"
},
"inputLanes": [],
"outputLanes": [],
"eventLanes": [],
"services": []
}
],
"valid": true,
"issues": {
"pipelineIssues": [],
"stageIssues": {},
"issueCount": 0
},
"previewable": true
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment