aboutsummaryrefslogtreecommitdiff
path: root/weed/query/engine/test_sample_data_test.go
diff options
context:
space:
mode:
Diffstat (limited to 'weed/query/engine/test_sample_data_test.go')
-rw-r--r--weed/query/engine/test_sample_data_test.go216
1 files changed, 216 insertions, 0 deletions
diff --git a/weed/query/engine/test_sample_data_test.go b/weed/query/engine/test_sample_data_test.go
new file mode 100644
index 000000000..e4a19b431
--- /dev/null
+++ b/weed/query/engine/test_sample_data_test.go
@@ -0,0 +1,216 @@
+package engine
+
+import (
+ "time"
+
+ "github.com/seaweedfs/seaweedfs/weed/pb/schema_pb"
+)
+
+// generateSampleHybridData creates sample data that simulates both live and archived messages
+// This function is only used for testing and is not included in production builds
+func generateSampleHybridData(topicName string, options HybridScanOptions) []HybridScanResult {
+ now := time.Now().UnixNano()
+
+ // Generate different sample data based on topic name
+ var sampleData []HybridScanResult
+
+ switch topicName {
+ case "user_events":
+ sampleData = []HybridScanResult{
+ // Simulated live log data (recent)
+ // Generate more test data to support LIMIT/OFFSET testing
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 82460}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 9465}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "live_login"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"ip": "10.0.0.1", "live": true}`}},
+ "status": {Kind: &schema_pb.Value_StringValue{StringValue: "active"}},
+ "action": {Kind: &schema_pb.Value_StringValue{StringValue: "login"}},
+ "user_type": {Kind: &schema_pb.Value_StringValue{StringValue: "premium"}},
+ "amount": {Kind: &schema_pb.Value_DoubleValue{DoubleValue: 43.619326294957126}},
+ },
+ Timestamp: now - 300000000000, // 5 minutes ago
+ Key: []byte("live-user-9465"),
+ Source: "live_log",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 841256}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 2336}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "live_action"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"action": "click", "live": true}`}},
+ "status": {Kind: &schema_pb.Value_StringValue{StringValue: "pending"}},
+ "action": {Kind: &schema_pb.Value_StringValue{StringValue: "click"}},
+ "user_type": {Kind: &schema_pb.Value_StringValue{StringValue: "standard"}},
+ "amount": {Kind: &schema_pb.Value_DoubleValue{DoubleValue: 550.0278410655299}},
+ },
+ Timestamp: now - 120000000000, // 2 minutes ago
+ Key: []byte("live-user-2336"),
+ Source: "live_log",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 55537}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 6912}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "purchase"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"amount": 25.99, "item": "book"}`}},
+ },
+ Timestamp: now - 90000000000, // 1.5 minutes ago
+ Key: []byte("live-user-6912"),
+ Source: "live_log",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 65143}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 5102}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "page_view"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"page": "/home", "duration": 30}`}},
+ },
+ Timestamp: now - 80000000000, // 80 seconds ago
+ Key: []byte("live-user-5102"),
+ Source: "live_log",
+ },
+
+ // Simulated archived Parquet data (older)
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 686003}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 2759}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "archived_login"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"ip": "192.168.1.1", "archived": true}`}},
+ },
+ Timestamp: now - 3600000000000, // 1 hour ago
+ Key: []byte("archived-user-2759"),
+ Source: "parquet_archive",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 417224}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 7810}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "archived_logout"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"duration": 1800, "archived": true}`}},
+ },
+ Timestamp: now - 1800000000000, // 30 minutes ago
+ Key: []byte("archived-user-7810"),
+ Source: "parquet_archive",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 424297}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 8897}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "purchase"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"amount": 45.50, "item": "electronics"}`}},
+ },
+ Timestamp: now - 1500000000000, // 25 minutes ago
+ Key: []byte("archived-user-8897"),
+ Source: "parquet_archive",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 431189}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 3400}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "signup"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"referral": "google", "plan": "free"}`}},
+ },
+ Timestamp: now - 1200000000000, // 20 minutes ago
+ Key: []byte("archived-user-3400"),
+ Source: "parquet_archive",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 413249}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 5175}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "update_profile"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"field": "email", "new_value": "user@example.com"}`}},
+ },
+ Timestamp: now - 900000000000, // 15 minutes ago
+ Key: []byte("archived-user-5175"),
+ Source: "parquet_archive",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "id": {Kind: &schema_pb.Value_Int64Value{Int64Value: 120612}},
+ "user_id": {Kind: &schema_pb.Value_Int32Value{Int32Value: 5429}},
+ "event_type": {Kind: &schema_pb.Value_StringValue{StringValue: "comment"}},
+ "data": {Kind: &schema_pb.Value_StringValue{StringValue: `{"post_id": 123, "comment": "Great post!"}`}},
+ },
+ Timestamp: now - 600000000000, // 10 minutes ago
+ Key: []byte("archived-user-5429"),
+ Source: "parquet_archive",
+ },
+ }
+
+ case "system_logs":
+ sampleData = []HybridScanResult{
+ // Simulated live system logs (recent)
+ {
+ Values: map[string]*schema_pb.Value{
+ "level": {Kind: &schema_pb.Value_StringValue{StringValue: "INFO"}},
+ "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Live system startup completed"}},
+ "service": {Kind: &schema_pb.Value_StringValue{StringValue: "auth-service"}},
+ },
+ Timestamp: now - 240000000000, // 4 minutes ago
+ Key: []byte("live-sys-001"),
+ Source: "live_log",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "level": {Kind: &schema_pb.Value_StringValue{StringValue: "WARN"}},
+ "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Live high memory usage detected"}},
+ "service": {Kind: &schema_pb.Value_StringValue{StringValue: "monitor-service"}},
+ },
+ Timestamp: now - 180000000000, // 3 minutes ago
+ Key: []byte("live-sys-002"),
+ Source: "live_log",
+ },
+
+ // Simulated archived system logs (older)
+ {
+ Values: map[string]*schema_pb.Value{
+ "level": {Kind: &schema_pb.Value_StringValue{StringValue: "ERROR"}},
+ "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Archived database connection failed"}},
+ "service": {Kind: &schema_pb.Value_StringValue{StringValue: "db-service"}},
+ },
+ Timestamp: now - 7200000000000, // 2 hours ago
+ Key: []byte("archived-sys-001"),
+ Source: "parquet_archive",
+ },
+ {
+ Values: map[string]*schema_pb.Value{
+ "level": {Kind: &schema_pb.Value_StringValue{StringValue: "INFO"}},
+ "message": {Kind: &schema_pb.Value_StringValue{StringValue: "Archived batch job completed"}},
+ "service": {Kind: &schema_pb.Value_StringValue{StringValue: "batch-service"}},
+ },
+ Timestamp: now - 3600000000000, // 1 hour ago
+ Key: []byte("archived-sys-002"),
+ Source: "parquet_archive",
+ },
+ }
+
+ default:
+ // For unknown topics, return empty data
+ sampleData = []HybridScanResult{}
+ }
+
+ // Apply predicate filtering if specified
+ if options.Predicate != nil {
+ var filtered []HybridScanResult
+ for _, result := range sampleData {
+ // Convert to RecordValue for predicate testing
+ recordValue := &schema_pb.RecordValue{Fields: make(map[string]*schema_pb.Value)}
+ for k, v := range result.Values {
+ recordValue.Fields[k] = v
+ }
+ recordValue.Fields[SW_COLUMN_NAME_TIMESTAMP] = &schema_pb.Value{Kind: &schema_pb.Value_Int64Value{Int64Value: result.Timestamp}}
+ recordValue.Fields[SW_COLUMN_NAME_KEY] = &schema_pb.Value{Kind: &schema_pb.Value_BytesValue{BytesValue: result.Key}}
+
+ if options.Predicate(recordValue) {
+ filtered = append(filtered, result)
+ }
+ }
+ sampleData = filtered
+ }
+
+ return sampleData
+}