Options
- Mark as New
- Bookmark
- Subscribe
- Mute
- Subscribe to RSS Feed
- Permalink
- Report Inappropriate Content
05-21-2024 07:20 AM
File notification would only impact any new arriving files
Yes, all 3 million files are newly arriving files, because I generate synthetic data files for performance testing.
From the logs you shared it shows that there are no outstanding bytes or files.
I think that was the last batch of the stream, but please look at the metrics in the log below.
There, "numBytesOutstanding" : "2605258897" and "numFilesOutstanding" : "60310" look wrong to me, because the numbers increase or decrease when the next batch runs.
{
"id" : "d49e1e9c-ac58-4da0-8ccb-9aa1790a7e40",
"runId" : "6d3ac39b-42c1-4bd8-99c7-8477817b278e",
"name" : null,
"timestamp" : "2024-05-21T14:16:10.155Z",
"batchId" : 1478,
"batchDuration" : 35581,
"numInputRows" : 998,
"inputRowsPerSecond" : 0.0,
"processedRowsPerSecond" : 28.04867766504595,
"durationMs" : {
"addBatch" : 25634,
"commitOffsets" : 202,
"getBatch" : 246,
"latestOffset" : 2295,
"queryPlanning" : 5687,
"triggerExecution" : 35568,
"walCommit" : 180
},
"stateOperators" : [ ],
"sources" : [ {
"description" : "CloudFilesSource[abfss://5f540a60-11bb-4db9-9246-14bb346f1ad2@dtmsplztestscudlsdvc001.dfs.core.windows.net/data/15012/1/]",
"startOffset" : {
"seqNum" : 18875879,
"sourceVersion" : 1,
"lastBackfillStartTimeMs" : 1715782085477,
"lastBackfillFinishTimeMs" : 1715782478832,
"lastInputPath" : "abfss://5f540a60-11bb-4db9-9246-14bb346f1ad2@dtmsplztestscudlsdvc001.dfs.core.windows.net/data/15012/1/"
},
"endOffset" : {
"seqNum" : 18877451,
"sourceVersion" : 1,
"lastBackfillStartTimeMs" : 1715782085477,
"lastBackfillFinishTimeMs" : 1715782478832,
"lastInputPath" : "abfss://5f540a60-11bb-4db9-9246-14bb346f1ad2@dtmsplztestscudlsdvc001.dfs.core.windows.net/data/15012/1/"
},
"latestOffset" : null,
"numInputRows" : 998,
"inputRowsPerSecond" : 0.0,
"processedRowsPerSecond" : 28.04867766504595,
"metrics" : {
"approximateQueueSize" : "5869492",
"numBytesOutstanding" : "2605258897",
"numFilesOutstanding" : "60310"
}
} ],
"sink" : {
"description" : "ForeachBatchSink",
"numOutputRows" : -1
},
"observedMetrics" : {
"15012_5f540a60-11bb-4db9-9246-14bb346f1ad2_compress" : {
"PipelineRunID" : "5ba763c1-4e6f-4b8e-8555-9f42935fd6a3",
"BatchStatus" : "Fail",
"AppId" : "5f540a60-11bb-4db9-9246-14bb346f1ad2",
"SchemaId" : 15012,
"SchemaVersion" : 1,
"Priority" : 10,
"InputRecordCount" : 998,
"OutputRecordCount" : 998
}
}
}