| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216 |
- package engine
- import (
- "time"
- "github.com/seaweedfs/seaweedfs/weed/pb/schema_pb"
- )
- // generateSampleHybridData creates sample data that simulates both live and archived messages
- // This function is only used for testing and is not included in production builds
- func generateSampleHybridData(topicName string, options HybridScanOptions) []HybridScanResult {
- now := time.Now().UnixNano()
- // Generate different sample data based on topic name
- var sampleData []HybridScanResult
- switch topicName {
- case "user_events":
- sampleData = []HybridScanResult{
- // Simulated live log data (recent)
- // Generate more test data to support LIMIT/OFFSET testing
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 82460}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 9465}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "live_login"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"ip": "10.0.0.1", "live": true}`}},
- "status": {Kind: &schema_pb.Value_StringValue{StringValue: "active"}},
- "action": {Kind: &schema_pb.Value_StringValue{StringValue: "login"}},
- "user_type": {Kind: &schema_pb.Value_StringValue{StringValue: "premium"}},
- "amount": {Kind: &schema_pb.Value_DoubleValue{DoubleValue: 43.619326294957126}},
- },
- Timestamp: now - 300000000000, // 5 minutes ago
- Key: []byte("live-user-9465"),
- Source: "live_log",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 841256}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 2336}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "live_action"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"action": "click", "live": true}`}},
- "status": {Kind: &schema_pb.Value_StringValue{StringValue: "pending"}},
- "action": {Kind: &schema_pb.Value_StringValue{StringValue: "click"}},
- "user_type": {Kind: &schema_pb.Value_StringValue{StringValue: "standard"}},
- "amount": {Kind: &schema_pb.Value_DoubleValue{DoubleValue: 550.0278410655299}},
- },
- Timestamp: now - 120000000000, // 2 minutes ago
- Key: []byte("live-user-2336"),
- Source: "live_log",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 55537}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 6912}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "purchase"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"amount": 25.99, "item": "book"}`}},
- },
- Timestamp: now - 90000000000, // 1.5 minutes ago
- Key: []byte("live-user-6912"),
- Source: "live_log",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 65143}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 5102}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "page_view"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"page": "/home", "duration": 30}`}},
- },
- Timestamp: now - 80000000000, // 80 seconds ago
- Key: []byte("live-user-5102"),
- Source: "live_log",
- },
- // Simulated archived Parquet data (older)
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 686003}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 2759}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "archived_login"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"ip": "192.168.1.1", "archived": true}`}},
- },
- Timestamp: now - 3600000000000, // 1 hour ago
- Key: []byte("archived-user-2759"),
- Source: "parquet_archive",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 417224}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 7810}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "archived_logout"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"duration": 1800, "archived": true}`}},
- },
- Timestamp: now - 1800000000000, // 30 minutes ago
- Key: []byte("archived-user-7810"),
- Source: "parquet_archive",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 424297}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 8897}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "purchase"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"amount": 45.50, "item": "electronics"}`}},
- },
- Timestamp: now - 1500000000000, // 25 minutes ago
- Key: []byte("archived-user-8897"),
- Source: "parquet_archive",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 431189}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 3400}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "signup"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"referral": "google", "plan": "free"}`}},
- },
- Timestamp: now - 1200000000000, // 20 minutes ago
- Key: []byte("archived-user-3400"),
- Source: "parquet_archive",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 413249}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 5175}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "update_profile"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"field": "email", "new_value": "user@example.com"}`}},
- },
- Timestamp: now - 900000000000, // 15 minutes ago
- Key: []byte("archived-user-5175"),
- Source: "parquet_archive",
- },
- {
- Values: map[string]*schema_pb.Value{
- "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 120612}},
- "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 5429}},
- "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "comment"}},
- "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"post_id": 123, "comment": "Great post!"}`}},
- },
- Timestamp: now - 600000000000, // 10 minutes ago
- Key: []byte("archived-user-5429"),
- Source: "parquet_archive",
- },
- }
- case "system_logs":
- sampleData = []HybridScanResult{
- // Simulated live system logs (recent)
- {
- Values: map[string]*schema_pb.Value{
- "level": {Kind: &schema_pb.Value_StringValue{StringValue: "INFO"}},
- "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Live system startup completed"}},
- "service": {Kind: &schema_pb.Value_StringValue{StringValue: "auth-service"}},
- },
- Timestamp: now - 240000000000, // 4 minutes ago
- Key: []byte("live-sys-001"),
- Source: "live_log",
- },
- {
- Values: map[string]*schema_pb.Value{
- "level": {Kind: &schema_pb.Value_StringValue{StringValue: "WARN"}},
- "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Live high memory usage detected"}},
- "service": {Kind: &schema_pb.Value_StringValue{StringValue: "monitor-service"}},
- },
- Timestamp: now - 180000000000, // 3 minutes ago
- Key: []byte("live-sys-002"),
- Source: "live_log",
- },
- // Simulated archived system logs (older)
- {
- Values: map[string]*schema_pb.Value{
- "level": {Kind: &schema_pb.Value_StringValue{StringValue: "ERROR"}},
- "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Archived database connection failed"}},
- "service": {Kind: &schema_pb.Value_StringValue{StringValue: "db-service"}},
- },
- Timestamp: now - 7200000000000, // 2 hours ago
- Key: []byte("archived-sys-001"),
- Source: "parquet_archive",
- },
- {
- Values: map[string]*schema_pb.Value{
- "level": {Kind: &schema_pb.Value_StringValue{StringValue: "INFO"}},
- "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Archived batch job completed"}},
- "service": {Kind: &schema_pb.Value_StringValue{StringValue: "batch-service"}},
- },
- Timestamp: now - 3600000000000, // 1 hour ago
- Key: []byte("archived-sys-002"),
- Source: "parquet_archive",
- },
- }
- default:
- // For unknown topics, return empty data
- sampleData = []HybridScanResult{}
- }
- // Apply predicate filtering if specified
- if options.Predicate != nil {
- var filtered []HybridScanResult
- for _, result := range sampleData {
- // Convert to RecordValue for predicate testing
- recordValue := &schema_pb.RecordValue{Fields: make(map[string]*schema_pb.Value)}
- for k, v := range result.Values {
- recordValue.Fields[k] = v
- }
- recordValue.Fields[SW_COLUMN_NAME_TIMESTAMP] = &schema_pb.Value{Kind: &schema_pb.Value_Int64Value{Int64Value: result.Timestamp}}
- recordValue.Fields[SW_COLUMN_NAME_KEY] = &schema_pb.Value{Kind: &schema_pb.Value_BytesValue{BytesValue: result.Key}}
- if options.Predicate(recordValue) {
- filtered = append(filtered, result)
- }
- }
- sampleData = filtered
- }
- return sampleData
- }
|