aboutsummaryrefslogtreecommitdiff
path: root/weed/query/engine/timestamp_integration_test.go
diff options
context:
space:
mode:
Diffstat (limited to 'weed/query/engine/timestamp_integration_test.go')
-rw-r--r--weed/query/engine/timestamp_integration_test.go202
1 files changed, 202 insertions, 0 deletions
diff --git a/weed/query/engine/timestamp_integration_test.go b/weed/query/engine/timestamp_integration_test.go
new file mode 100644
index 000000000..2f53e6d6e
--- /dev/null
+++ b/weed/query/engine/timestamp_integration_test.go
@@ -0,0 +1,202 @@
+package engine
+
+import (
+ "strconv"
+ "testing"
+
+ "github.com/seaweedfs/seaweedfs/weed/pb/schema_pb"
+ "github.com/stretchr/testify/assert"
+)
+
+// TestTimestampIntegrationScenarios tests complete end-to-end scenarios
+func TestTimestampIntegrationScenarios(t *testing.T) {
+ engine := NewTestSQLEngine()
+
+ // Simulate the exact timestamps that were failing in production
+ timestamps := []struct {
+ timestamp int64
+ id int64
+ name string
+ }{
+ {1756947416566456262, 897795, "original_failing_1"},
+ {1756947416566439304, 715356, "original_failing_2"},
+ {1756913789829292386, 82460, "current_data"},
+ }
+
+ t.Run("EndToEndTimestampEquality", func(t *testing.T) {
+ for _, ts := range timestamps {
+ t.Run(ts.name, func(t *testing.T) {
+ // Create a test record
+ record := &schema_pb.RecordValue{
+ Fields: map[string]*schema_pb.Value{
+ "_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.timestamp}},
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.id}},
+ },
+ }
+
+ // Build SQL query
+ sql := "SELECT id, _timestamp_ns FROM test WHERE _timestamp_ns = " + strconv.FormatInt(ts.timestamp, 10)
+ stmt, err := ParseSQL(sql)
+ assert.NoError(t, err)
+
+ selectStmt := stmt.(*SelectStatement)
+
+ // Test time filter extraction (Fix #2 and #5)
+ startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)
+ assert.Equal(t, ts.timestamp-1, startTimeNs, "Should set startTimeNs to avoid scan boundary bug")
+ assert.Equal(t, int64(0), stopTimeNs, "Should not set stopTimeNs to avoid premature termination")
+
+ // Test predicate building (Fix #1)
+ predicate, err := engine.buildPredicate(selectStmt.Where.Expr)
+ assert.NoError(t, err)
+
+ // Test predicate evaluation (Fix #1 - precision)
+ result := predicate(record)
+ assert.True(t, result, "Should match exact timestamp without precision loss")
+
+ // Test that close but different timestamps don't match
+ closeRecord := &schema_pb.RecordValue{
+ Fields: map[string]*schema_pb.Value{
+ "_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.timestamp + 1}},
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.id}},
+ },
+ }
+ result = predicate(closeRecord)
+ assert.False(t, result, "Should not match timestamp that differs by 1 nanosecond")
+ })
+ }
+ })
+
+ t.Run("ComplexRangeQueries", func(t *testing.T) {
+ // Test range queries that combine multiple fixes
+ testCases := []struct {
+ name string
+ sql string
+ shouldSet struct{ start, stop bool }
+ }{
+ {
+ name: "RangeWithDifferentBounds",
+ sql: "SELECT * FROM test WHERE _timestamp_ns >= 1756913789829292386 AND _timestamp_ns <= 1756947416566456262",
+ shouldSet: struct{ start, stop bool }{true, true},
+ },
+ {
+ name: "RangeWithSameBounds",
+ sql: "SELECT * FROM test WHERE _timestamp_ns >= 1756913789829292386 AND _timestamp_ns <= 1756913789829292386",
+ shouldSet: struct{ start, stop bool }{true, false}, // Fix #4: equal bounds should not set stop
+ },
+ {
+ name: "OpenEndedRange",
+ sql: "SELECT * FROM test WHERE _timestamp_ns >= 1756913789829292386",
+ shouldSet: struct{ start, stop bool }{true, false},
+ },
+ }
+
+ for _, tc := range testCases {
+ t.Run(tc.name, func(t *testing.T) {
+ stmt, err := ParseSQL(tc.sql)
+ assert.NoError(t, err)
+
+ selectStmt := stmt.(*SelectStatement)
+ startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)
+
+ if tc.shouldSet.start {
+ assert.NotEqual(t, int64(0), startTimeNs, "Should set startTimeNs for range query")
+ } else {
+ assert.Equal(t, int64(0), startTimeNs, "Should not set startTimeNs")
+ }
+
+ if tc.shouldSet.stop {
+ assert.NotEqual(t, int64(0), stopTimeNs, "Should set stopTimeNs for bounded range")
+ } else {
+ assert.Equal(t, int64(0), stopTimeNs, "Should not set stopTimeNs")
+ }
+ })
+ }
+ })
+
+ t.Run("ProductionScenarioReproduction", func(t *testing.T) {
+ // This test reproduces the exact production scenario that was failing
+
+ // Original failing query: WHERE _timestamp_ns = 1756947416566456262
+ sql := "SELECT id, _timestamp_ns FROM ecommerce.user_events WHERE _timestamp_ns = 1756947416566456262"
+ stmt, err := ParseSQL(sql)
+ assert.NoError(t, err, "Should parse the production query that was failing")
+
+ selectStmt := stmt.(*SelectStatement)
+
+ // Verify time filter extraction works correctly (fixes scan termination issue)
+ startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)
+ assert.Equal(t, int64(1756947416566456261), startTimeNs, "Should set startTimeNs to target-1") // Fix #5
+ assert.Equal(t, int64(0), stopTimeNs, "Should not set stopTimeNs") // Fix #2
+
+ // Verify predicate handles the large timestamp correctly
+ predicate, err := engine.buildPredicate(selectStmt.Where.Expr)
+ assert.NoError(t, err, "Should build predicate for production query")
+
+ // Test with the actual record that exists in production
+ productionRecord := &schema_pb.RecordValue{
+ Fields: map[string]*schema_pb.Value{
+ "_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: 1756947416566456262}},
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 897795}},
+ },
+ }
+
+ result := predicate(productionRecord)
+ assert.True(t, result, "Should match the production record that was failing before") // Fix #1
+
+ // Verify precision - test that a timestamp differing by just 1 nanosecond doesn't match
+ slightlyDifferentRecord := &schema_pb.RecordValue{
+ Fields: map[string]*schema_pb.Value{
+ "_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: 1756947416566456263}},
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 897795}},
+ },
+ }
+
+ result = predicate(slightlyDifferentRecord)
+ assert.False(t, result, "Should NOT match record with timestamp differing by 1 nanosecond")
+ })
+}
+
+// TestRegressionPrevention ensures the fixes don't break normal cases
+func TestRegressionPrevention(t *testing.T) {
+ engine := NewTestSQLEngine()
+
+ t.Run("SmallTimestamps", func(t *testing.T) {
+ // Ensure small timestamps still work normally
+ smallTimestamp := int64(1234567890)
+
+ record := &schema_pb.RecordValue{
+ Fields: map[string]*schema_pb.Value{
+ "_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: smallTimestamp}},
+ },
+ }
+
+ result := engine.valuesEqual(record.Fields["_timestamp_ns"], smallTimestamp)
+ assert.True(t, result, "Small timestamps should continue to work")
+ })
+
+ t.Run("NonTimestampColumns", func(t *testing.T) {
+ // Ensure non-timestamp columns aren't affected by timestamp fixes
+ sql := "SELECT * FROM test WHERE id = 12345"
+ stmt, err := ParseSQL(sql)
+ assert.NoError(t, err)
+
+ selectStmt := stmt.(*SelectStatement)
+ startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)
+
+ assert.Equal(t, int64(0), startTimeNs, "Non-timestamp queries should not set startTimeNs")
+ assert.Equal(t, int64(0), stopTimeNs, "Non-timestamp queries should not set stopTimeNs")
+ })
+
+ t.Run("StringComparisons", func(t *testing.T) {
+ // Ensure string comparisons aren't affected
+ record := &schema_pb.RecordValue{
+ Fields: map[string]*schema_pb.Value{
+ "name": {Kind: &schema_pb.Value_StringValue{StringValue: "test"}},
+ },
+ }
+
+ result := engine.valuesEqual(record.Fields["name"], "test")
+ assert.True(t, result, "String comparisons should continue to work")
+ })
+}