-
Notifications
You must be signed in to change notification settings - Fork 130
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Fix Partitioned SessionWindow bug, where restoring from checkpoint tr…
…iggers an exception. Cause of the Issue: The PartitionedSessionWindowPipe keeps multiple dictionary states. One of the dictionary does not have a [DataMember] attribute, Because the value type is a LinkedList which does not support serialization. On checkpoint and then Restore, this dictionary is re-created using other data members in UpdatePointers callback. During this, the scenario of empty LinkedList value is missed and not restored. When next data event appears for the partition, the partitionKey is indexed on the dictionary resulting in KeyNotFoundException Regression No, this existed for a long time. The customer hit the bug now because of workaround suggested (for another bug) to use 'timestamp by .. over' clause. ReproSteps: Added as a Testcase. Fix: Added code to restore key with empty LinkedList. Verified that this was the exact state just before checkpoint. Added a testcase that triggers this bug and with the fix the testcase passes.
- Loading branch information
Showing
2 changed files
with
110 additions
and
1 deletion.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
101 changes: 101 additions & 0 deletions
101
Sources/Test/SimpleTesting/Partitioned/PartitionedStreamCheckpointTests.cs
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,101 @@ | ||
// ********************************************************************* | ||
// Copyright (c) Microsoft Corporation. All rights reserved. | ||
// Licensed under the MIT License | ||
// ********************************************************************* | ||
using System; | ||
using System.Collections.Generic; | ||
using System.IO; | ||
using System.Linq; | ||
using System.Reactive.Linq; | ||
using System.Reactive.Subjects; | ||
using Microsoft.StreamProcessing; | ||
using Microsoft.VisualStudio.TestTools.UnitTesting; | ||
|
||
namespace SimpleTesting | ||
{ | ||
/* This test case verifies fix for | ||
* Bug 944724: Exception in Trill SessionWindow when Partition (substreams) is used and restored from checkpoint | ||
* | ||
* Cause of the Bug: | ||
* The PartitionedSessionWindowPipe keeps multiple dictionary states. | ||
* One of the dictionary does not have a [DataMember] attribute, Because the value type is a LinkedList which does not support serialization. | ||
* On checkpoint and then Restore, this dictionary is re-created using other data members in UpdatePointers callback. | ||
* During this, the scenario of empty LinkedList value is missed and not restored. | ||
* When next data event appears for the partition, the partitionKey is indexed on the dictionary resulting in KeyNotFoundException | ||
*/ | ||
[TestClass] | ||
public class PartitionedStreamCheckpointTests : TestWithConfigSettingsWithoutMemoryLeakDetection | ||
{ | ||
[TestMethod, TestCategory("Gated")] | ||
public void CheckpointPartitionedSessionWindow() | ||
{ | ||
Config.DataBatchSize = 1; | ||
|
||
var data = new PartitionedStreamEvent<int, double>[] | ||
{ | ||
PartitionedStreamEvent.CreatePoint(0, 5, 1.0), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 8), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 11), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 14), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 17), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 21), | ||
PartitionedStreamEvent.CreatePoint(0, 24, 1.0), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 100), | ||
}; | ||
|
||
var expected = new PartitionedStreamEvent<int, double>[] | ||
{ | ||
PartitionedStreamEvent.CreateStart(0, 5, 1.0), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 8), | ||
PartitionedStreamEvent.CreateEnd(0, 9, 5, 1.0), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 11), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 14), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 17), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 21), | ||
PartitionedStreamEvent.CreateStart(0, 24, 1.0), | ||
PartitionedStreamEvent.CreateEnd(0, 28, 24, 1.0), | ||
PartitionedStreamEvent.CreatePunctuation<int, double>(0, 100), | ||
}; | ||
|
||
// This index represents the point when the checkpoint restore needs to happen to trigger the bug. | ||
const int checkpointIndex = 6; | ||
|
||
var subject = new Subject<PartitionedStreamEvent<int, double>>(); | ||
var output = new List<PartitionedStreamEvent<int, double>>(); | ||
var process = CreateQueryContainerForPartitionedStream(subject, output); | ||
|
||
for (int i = 0; i < data.Length; i++) | ||
{ | ||
if (i == checkpointIndex) | ||
{ | ||
using (var ms = new MemoryStream()) | ||
{ | ||
process.Checkpoint(ms); | ||
ms.Seek(0, SeekOrigin.Begin); | ||
|
||
subject = new Subject<PartitionedStreamEvent<int, double>>(); | ||
process = CreateQueryContainerForPartitionedStream(subject, output, ms); | ||
} | ||
} | ||
|
||
subject.OnNext(data[i]); | ||
} | ||
|
||
Assert.IsTrue(expected.SequenceEqual(output)); | ||
} | ||
|
||
private Process CreateQueryContainerForPartitionedStream( | ||
Subject<PartitionedStreamEvent<int, double>> subject, | ||
List<PartitionedStreamEvent<int, double>> output, | ||
Stream stream = null) | ||
{ | ||
var qc = new QueryContainer(); | ||
var input = qc.RegisterInput(subject); | ||
var streamableOutput = input.SessionTimeoutWindow(4, 5).Sum(o => o); | ||
var egress = qc.RegisterOutput(streamableOutput).ForEachAsync(o => output.Add(o)); | ||
var process = qc.Restore(stream); | ||
|
||
return process; | ||
} | ||
} | ||
} |