github-mirrors
/
mirror-seaweedfs


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202
							package engine

import (
	"strconv"
	"testing"

	"github.com/seaweedfs/seaweedfs/weed/pb/schema_pb"
	"github.com/stretchr/testify/assert"
)

// TestTimestampIntegrationScenarios tests complete end-to-end scenarios
func TestTimestampIntegrationScenarios(t *testing.T) {
	engine := NewTestSQLEngine()

	// Simulate the exact timestamps that were failing in production
	timestamps := []struct {
		timestamp int64
		id        int64
		name      string
	}{
		{1756947416566456262, 897795, "original_failing_1"},
		{1756947416566439304, 715356, "original_failing_2"},
		{1756913789829292386, 82460, "current_data"},
	}

	t.Run("EndToEndTimestampEquality", func(t *testing.T) {
		for _, ts := range timestamps {
			t.Run(ts.name, func(t *testing.T) {
				// Create a test record
				record := &schema_pb.RecordValue{
					Fields: map[string]*schema_pb.Value{
						"_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.timestamp}},
						"id":            {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.id}},
					},
				}

				// Build SQL query
				sql := "SELECT id, _timestamp_ns FROM test WHERE _timestamp_ns = " + strconv.FormatInt(ts.timestamp, 10)
				stmt, err := ParseSQL(sql)
				assert.NoError(t, err)

				selectStmt := stmt.(*SelectStatement)

				// Test time filter extraction (Fix #2 and #5)
				startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)
				assert.Equal(t, ts.timestamp-1, startTimeNs, "Should set startTimeNs to avoid scan boundary bug")
				assert.Equal(t, int64(0), stopTimeNs, "Should not set stopTimeNs to avoid premature termination")

				// Test predicate building (Fix #1)
				predicate, err := engine.buildPredicate(selectStmt.Where.Expr)
				assert.NoError(t, err)

				// Test predicate evaluation (Fix #1 - precision)
				result := predicate(record)
				assert.True(t, result, "Should match exact timestamp without precision loss")

				// Test that close but different timestamps don't match
				closeRecord := &schema_pb.RecordValue{
					Fields: map[string]*schema_pb.Value{
						"_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.timestamp + 1}},
						"id":            {Kind: &schema_pb.Value_Int64Value{Int64Value: ts.id}},
					},
				}
				result = predicate(closeRecord)
				assert.False(t, result, "Should not match timestamp that differs by 1 nanosecond")
			})
		}
	})

	t.Run("ComplexRangeQueries", func(t *testing.T) {
		// Test range queries that combine multiple fixes
		testCases := []struct {
			name      string
			sql       string
			shouldSet struct{ start, stop bool }
		}{
			{
				name:      "RangeWithDifferentBounds",
				sql:       "SELECT * FROM test WHERE _timestamp_ns >= 1756913789829292386 AND _timestamp_ns <= 1756947416566456262",
				shouldSet: struct{ start, stop bool }{true, true},
			},
			{
				name:      "RangeWithSameBounds",
				sql:       "SELECT * FROM test WHERE _timestamp_ns >= 1756913789829292386 AND _timestamp_ns <= 1756913789829292386",
				shouldSet: struct{ start, stop bool }{true, false}, // Fix #4: equal bounds should not set stop
			},
			{
				name:      "OpenEndedRange",
				sql:       "SELECT * FROM test WHERE _timestamp_ns >= 1756913789829292386",
				shouldSet: struct{ start, stop bool }{true, false},
			},
		}

		for _, tc := range testCases {
			t.Run(tc.name, func(t *testing.T) {
				stmt, err := ParseSQL(tc.sql)
				assert.NoError(t, err)

				selectStmt := stmt.(*SelectStatement)
				startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)

				if tc.shouldSet.start {
					assert.NotEqual(t, int64(0), startTimeNs, "Should set startTimeNs for range query")
				} else {
					assert.Equal(t, int64(0), startTimeNs, "Should not set startTimeNs")
				}

				if tc.shouldSet.stop {
					assert.NotEqual(t, int64(0), stopTimeNs, "Should set stopTimeNs for bounded range")
				} else {
					assert.Equal(t, int64(0), stopTimeNs, "Should not set stopTimeNs")
				}
			})
		}
	})

	t.Run("ProductionScenarioReproduction", func(t *testing.T) {
		// This test reproduces the exact production scenario that was failing

		// Original failing query: WHERE _timestamp_ns = 1756947416566456262
		sql := "SELECT id, _timestamp_ns FROM ecommerce.user_events WHERE _timestamp_ns = 1756947416566456262"
		stmt, err := ParseSQL(sql)
		assert.NoError(t, err, "Should parse the production query that was failing")

		selectStmt := stmt.(*SelectStatement)

		// Verify time filter extraction works correctly (fixes scan termination issue)
		startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)
		assert.Equal(t, int64(1756947416566456261), startTimeNs, "Should set startTimeNs to target-1") // Fix #5
		assert.Equal(t, int64(0), stopTimeNs, "Should not set stopTimeNs")                             // Fix #2

		// Verify predicate handles the large timestamp correctly
		predicate, err := engine.buildPredicate(selectStmt.Where.Expr)
		assert.NoError(t, err, "Should build predicate for production query")

		// Test with the actual record that exists in production
		productionRecord := &schema_pb.RecordValue{
			Fields: map[string]*schema_pb.Value{
				"_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: 1756947416566456262}},
				"id":            {Kind: &schema_pb.Value_Int64Value{Int64Value: 897795}},
			},
		}

		result := predicate(productionRecord)
		assert.True(t, result, "Should match the production record that was failing before") // Fix #1

		// Verify precision - test that a timestamp differing by just 1 nanosecond doesn't match
		slightlyDifferentRecord := &schema_pb.RecordValue{
			Fields: map[string]*schema_pb.Value{
				"_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: 1756947416566456263}},
				"id":            {Kind: &schema_pb.Value_Int64Value{Int64Value: 897795}},
			},
		}

		result = predicate(slightlyDifferentRecord)
		assert.False(t, result, "Should NOT match record with timestamp differing by 1 nanosecond")
	})
}

// TestRegressionPrevention ensures the fixes don't break normal cases
func TestRegressionPrevention(t *testing.T) {
	engine := NewTestSQLEngine()

	t.Run("SmallTimestamps", func(t *testing.T) {
		// Ensure small timestamps still work normally
		smallTimestamp := int64(1234567890)

		record := &schema_pb.RecordValue{
			Fields: map[string]*schema_pb.Value{
				"_timestamp_ns": {Kind: &schema_pb.Value_Int64Value{Int64Value: smallTimestamp}},
			},
		}

		result := engine.valuesEqual(record.Fields["_timestamp_ns"], smallTimestamp)
		assert.True(t, result, "Small timestamps should continue to work")
	})

	t.Run("NonTimestampColumns", func(t *testing.T) {
		// Ensure non-timestamp columns aren't affected by timestamp fixes
		sql := "SELECT * FROM test WHERE id = 12345"
		stmt, err := ParseSQL(sql)
		assert.NoError(t, err)

		selectStmt := stmt.(*SelectStatement)
		startTimeNs, stopTimeNs := engine.extractTimeFilters(selectStmt.Where.Expr)

		assert.Equal(t, int64(0), startTimeNs, "Non-timestamp queries should not set startTimeNs")
		assert.Equal(t, int64(0), stopTimeNs, "Non-timestamp queries should not set stopTimeNs")
	})

	t.Run("StringComparisons", func(t *testing.T) {
		// Ensure string comparisons aren't affected
		record := &schema_pb.RecordValue{
			Fields: map[string]*schema_pb.Value{
				"name": {Kind: &schema_pb.Value_StringValue{StringValue: "test"}},
			},
		}

		result := engine.valuesEqual(record.Fields["name"], "test")
		assert.True(t, result, "String comparisons should continue to work")
	})
}