jrmccluskey commented on a change in pull request #15253: URL: https://github.com/apache/beam/pull/15253#discussion_r681094769
########## File path: sdks/go/pkg/beam/testing/teststream/teststream.go ########## @@ -0,0 +1,150 @@ +// Licensed to the Apache Software Foundation (ASF) under one or more +// contributor license agreements. See the NOTICE file distributed with +// this work for additional information regarding copyright ownership. +// The ASF licenses this file to You under the Apache License, Version 2.0 +// (the "License"); you may not use this file except in compliance with +// the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +// Package teststream contains code configuring the TestStream primitive for +// use in testing code that is meant to be run on streaming data sources. +// See https://beam.apache.org/blog/test-stream/ for more information. +// TestStream is supported on Flink. +package teststream + +import ( + "bytes" + "fmt" + "reflect" + + "github.com/apache/beam/sdks/go/pkg/beam" + "github.com/apache/beam/sdks/go/pkg/beam/core/graph/coder" + "github.com/apache/beam/sdks/go/pkg/beam/core/graph/mtime" + "github.com/apache/beam/sdks/go/pkg/beam/core/util/protox" + + pipepb "github.com/apache/beam/sdks/go/pkg/beam/model/pipeline_v1" +) + +const urn = "beam:transform:teststream:v1" + +// Config holds information used to create a TestStreamPayload object. +type Config struct { + elmCoder *coder.Coder + events []*pipepb.TestStreamPayload_Event + endpoint *pipepb.ApiServiceDescriptor + watermark int64 +} + +// MakeConfig initializes a Config struct to begin inserting TestStream events/endpoints into. +// Requires that users provide the coder for the elements they are trying to emit. 
+func NewConfig() Config { + return Config{elmCoder: nil, + events: []*pipepb.TestStreamPayload_Event{}, + endpoint: &pipepb.ApiServiceDescriptor{}, + watermark: 0, + } +} + +// SetEndpoint sets a URL for a TestStreamService that will emit events instead of having them +// defined manually. Currently does not support authentication, so the TestStreamService should +// be accessed in a trusted context. +func (c *Config) SetEndpoint(url string) { + c.endpoint.Url = url +} + +// createPayload converts the Config object into a TestStreamPayload to be sent to the runner. +func (c *Config) createPayload() *pipepb.TestStreamPayload { + return &pipepb.TestStreamPayload{CoderId: "c0", Events: c.events, Endpoint: c.endpoint} +} + +// AdvanceWatermark adds an event to the Config Events struct advancing the watermark for the PCollection +// to the given timestamp. Timestamp is in milliseconds +func (c *Config) AdvanceWatermark(timestamp int64) error { + if c.watermark >= timestamp { + return fmt.Errorf("watermark must be monotonally increasing, is at %v, got %v", c.watermark, timestamp) + } + watermarkAdvance := &pipepb.TestStreamPayload_Event_AdvanceWatermark{NewWatermark: timestamp} + watermarkEvent := &pipepb.TestStreamPayload_Event_WatermarkEvent{WatermarkEvent: watermarkAdvance} + c.events = append(c.events, &pipepb.TestStreamPayload_Event{Event: watermarkEvent}) + c.watermark = timestamp + return nil +} + +// AdvanceWatermarkToInfinity advances the watermark to the maximum timestamp. +func (c *Config) AdvanceWatermarkToInfinity() error { + return c.AdvanceWatermark(mtime.MaxTimestamp.Milliseconds()) +} + +// AdvanceProcessingTime adds an event advancing the processing time by a given duration. +// This advancement is applied to all of the PCollections output by the TestStream. 
+func (c *Config) AdvanceProcessingTime(duration int64) { + processingAdvance := &pipepb.TestStreamPayload_Event_AdvanceProcessingTime{AdvanceDuration: duration} + processingEvent := &pipepb.TestStreamPayload_Event_ProcessingTimeEvent{ProcessingTimeEvent: processingAdvance} + c.events = append(c.events, &pipepb.TestStreamPayload_Event{Event: processingEvent}) +} + +// AdvanceProcessingTimeToInfinity moves the TestStream processing time to the largest possible +// timestamp. +func (c *Config) AdvanceProcessingTimeToInfinity() { + c.AdvanceProcessingTime(mtime.MaxTimestamp.Milliseconds()) +} + +// AddElements adds a number of elements to the Config object at the specified event timestamp. +// The encoder will panic if there is a type mismatch between the provided coder and the +// elements. +func (c *Config) AddElements(timestamp int64, elements ...interface{}) error { + if c.elmCoder == nil { + elmType := reflect.TypeOf(elements[0]) Review comment: Looking at it now, I think we could completely stop tracking the coder and instead track the element type passed into `AddElements`. `beam.Create` just gets the type of the first element and defines the encoder off of that using `beam.NewElementEncoder`, in the same way I have now. The end result is that we can remove any references to coders in `AddElements`. -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: [email protected] For queries about this service, please contact Infrastructure at: [email protected]
