| // Copyright 2016 Google LLC |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| package pubsub |
| |
| import ( |
| "context" |
| "errors" |
| "fmt" |
| "runtime" |
| "strings" |
| "sync" |
| "time" |
| |
| "cloud.google.com/go/iam" |
| "github.com/golang/protobuf/proto" |
| gax "github.com/googleapis/gax-go/v2" |
| "google.golang.org/api/support/bundler" |
| pb "google.golang.org/genproto/googleapis/pubsub/v1" |
| fmpb "google.golang.org/genproto/protobuf/field_mask" |
| "google.golang.org/grpc" |
| "google.golang.org/grpc/codes" |
| ) |
| |
| const ( |
| // MaxPublishRequestCount is the maximum number of messages that can be in a single publish request, as |
| // defined by the PubSub service. |
| MaxPublishRequestCount = 1000 |
| |
| // MaxPublishRequestBytes is the maximum size of a single publish request in bytes, as defined by the PubSub |
| // service. |
| MaxPublishRequestBytes = 1e7 |
| |
| maxInt = int(^uint(0) >> 1) |
| ) |
| |
| // ErrOversizedMessage indicates that a message's size exceeds MaxPublishRequestBytes. |
| var ErrOversizedMessage = bundler.ErrOversizedItem |
| |
| // Topic is a reference to a PubSub topic. |
| // |
| // The methods of Topic are safe for use by multiple goroutines. |
| type Topic struct { |
| c *Client |
| // The fully qualified identifier for the topic, in the format "projects/<projid>/topics/<name>" |
| name string |
| |
| // Settings for publishing messages. All changes must be made before the |
| // first call to Publish. The default is DefaultPublishSettings. |
| PublishSettings PublishSettings |
| |
| mu sync.RWMutex |
| stopped bool |
| bundler *bundler.Bundler |
| } |
| |
| // PublishSettings control the bundling of published messages. |
| type PublishSettings struct { |
| |
| // Publish a non-empty batch after this delay has passed. |
| DelayThreshold time.Duration |
| |
| // Publish a batch when it has this many messages. The maximum is |
| // MaxPublishRequestCount. |
| CountThreshold int |
| |
| // Publish a batch when its size in bytes reaches this value. |
| ByteThreshold int |
| |
| // The number of goroutines that invoke the Publish RPC concurrently. |
| // Defaults to a multiple of GOMAXPROCS. |
| NumGoroutines int |
| |
| // The maximum time that the client will attempt to publish a bundle of messages. |
| Timeout time.Duration |
| } |
| |
| // DefaultPublishSettings holds the default values for topics' PublishSettings. |
| var DefaultPublishSettings = PublishSettings{ |
| DelayThreshold: 1 * time.Millisecond, |
| CountThreshold: 100, |
| ByteThreshold: 1e6, |
| Timeout: 60 * time.Second, |
| } |
| |
| // CreateTopic creates a new topic. |
| // The specified topic ID must start with a letter, and contain only letters |
| // ([A-Za-z]), numbers ([0-9]), dashes (-), underscores (_), periods (.), |
| // tildes (~), plus (+) or percent signs (%). It must be between 3 and 255 |
| // characters in length, and must not start with "goog". |
| // If the topic already exists an error will be returned. |
| func (c *Client) CreateTopic(ctx context.Context, id string) (*Topic, error) { |
| t := c.Topic(id) |
| _, err := c.pubc.CreateTopic(ctx, &pb.Topic{Name: t.name}) |
| if err != nil { |
| return nil, err |
| } |
| return t, nil |
| } |
| |
| // Topic creates a reference to a topic in the client's project. |
| // |
| // If a Topic's Publish method is called, it has background goroutines |
| // associated with it. Clean them up by calling Topic.Stop. |
| // |
| // Avoid creating many Topic instances if you use them to publish. |
| func (c *Client) Topic(id string) *Topic { |
| return c.TopicInProject(id, c.projectID) |
| } |
| |
| // TopicInProject creates a reference to a topic in the given project. |
| // |
| // If a Topic's Publish method is called, it has background goroutines |
| // associated with it. Clean them up by calling Topic.Stop. |
| // |
| // Avoid creating many Topic instances if you use them to publish. |
| func (c *Client) TopicInProject(id, projectID string) *Topic { |
| return newTopic(c, fmt.Sprintf("projects/%s/topics/%s", projectID, id)) |
| } |
| |
| func newTopic(c *Client, name string) *Topic { |
| return &Topic{ |
| c: c, |
| name: name, |
| PublishSettings: DefaultPublishSettings, |
| } |
| } |
| |
| // TopicConfig describes the configuration of a topic. |
| type TopicConfig struct { |
| // The set of labels for the topic. |
| Labels map[string]string |
| // The topic's message storage policy. |
| MessageStoragePolicy MessageStoragePolicy |
| } |
| |
| // TopicConfigToUpdate describes how to update a topic. |
| type TopicConfigToUpdate struct { |
| // If non-nil, the current set of labels is completely |
| // replaced by the new set. |
| // This field has beta status. It is not subject to the stability guarantee |
| // and may change. |
| Labels map[string]string |
| } |
| |
| func protoToTopicConfig(pbt *pb.Topic) TopicConfig { |
| return TopicConfig{ |
| Labels: pbt.Labels, |
| MessageStoragePolicy: protoToMessageStoragePolicy(pbt.MessageStoragePolicy), |
| } |
| } |
| |
| // MessageStoragePolicy constrains how messages published to the topic may be stored. It |
| // is determined when the topic is created based on the policy configured at |
| // the project level. |
| type MessageStoragePolicy struct { |
| // The list of GCP regions where messages that are published to the topic may |
| // be persisted in storage. Messages published by publishers running in |
| // non-allowed GCP regions (or running outside of GCP altogether) will be |
| // routed for storage in one of the allowed regions. An empty list indicates a |
| // misconfiguration at the project or organization level, which will result in |
| // all Publish operations failing. |
| AllowedPersistenceRegions []string |
| } |
| |
| func protoToMessageStoragePolicy(msp *pb.MessageStoragePolicy) MessageStoragePolicy { |
| if msp == nil { |
| return MessageStoragePolicy{} |
| } |
| return MessageStoragePolicy{AllowedPersistenceRegions: msp.AllowedPersistenceRegions} |
| } |
| |
| // Config returns the TopicConfig for the topic. |
| func (t *Topic) Config(ctx context.Context) (TopicConfig, error) { |
| pbt, err := t.c.pubc.GetTopic(ctx, &pb.GetTopicRequest{Topic: t.name}) |
| if err != nil { |
| return TopicConfig{}, err |
| } |
| return protoToTopicConfig(pbt), nil |
| } |
| |
| // Update changes an existing topic according to the fields set in cfg. It returns |
| // the new TopicConfig. |
| // |
| // Any call to Update (even with an empty TopicConfigToUpdate) will update the |
| // MessageStoragePolicy for the topic from the organization's settings. |
| func (t *Topic) Update(ctx context.Context, cfg TopicConfigToUpdate) (TopicConfig, error) { |
| req := t.updateRequest(cfg) |
| if len(req.UpdateMask.Paths) == 0 { |
| return TopicConfig{}, errors.New("pubsub: UpdateTopic call with nothing to update") |
| } |
| rpt, err := t.c.pubc.UpdateTopic(ctx, req) |
| if err != nil { |
| return TopicConfig{}, err |
| } |
| return protoToTopicConfig(rpt), nil |
| } |
| |
| func (t *Topic) updateRequest(cfg TopicConfigToUpdate) *pb.UpdateTopicRequest { |
| pt := &pb.Topic{Name: t.name} |
| paths := []string{"message_storage_policy"} // always fetch |
| if cfg.Labels != nil { |
| pt.Labels = cfg.Labels |
| paths = append(paths, "labels") |
| } |
| return &pb.UpdateTopicRequest{ |
| Topic: pt, |
| UpdateMask: &fmpb.FieldMask{Paths: paths}, |
| } |
| } |
| |
| // Topics returns an iterator which returns all of the topics for the client's project. |
| func (c *Client) Topics(ctx context.Context) *TopicIterator { |
| it := c.pubc.ListTopics(ctx, &pb.ListTopicsRequest{Project: c.fullyQualifiedProjectName()}) |
| return &TopicIterator{ |
| c: c, |
| next: func() (string, error) { |
| topic, err := it.Next() |
| if err != nil { |
| return "", err |
| } |
| return topic.Name, nil |
| }, |
| } |
| } |
| |
| // TopicIterator is an iterator that returns a series of topics. |
| type TopicIterator struct { |
| c *Client |
| next func() (string, error) |
| } |
| |
| // Next returns the next topic. If there are no more topics, iterator.Done will be returned. |
| func (tps *TopicIterator) Next() (*Topic, error) { |
| topicName, err := tps.next() |
| if err != nil { |
| return nil, err |
| } |
| return newTopic(tps.c, topicName), nil |
| } |
| |
| // ID returns the unique identifier of the topic within its project. |
| func (t *Topic) ID() string { |
| slash := strings.LastIndex(t.name, "/") |
| if slash == -1 { |
| // name is not a fully-qualified name. |
| panic("bad topic name") |
| } |
| return t.name[slash+1:] |
| } |
| |
| // String returns the printable globally unique name for the topic. |
| func (t *Topic) String() string { |
| return t.name |
| } |
| |
| // Delete deletes the topic. |
| func (t *Topic) Delete(ctx context.Context) error { |
| return t.c.pubc.DeleteTopic(ctx, &pb.DeleteTopicRequest{Topic: t.name}) |
| } |
| |
| // Exists reports whether the topic exists on the server. |
| func (t *Topic) Exists(ctx context.Context) (bool, error) { |
| if t.name == "_deleted-topic_" { |
| return false, nil |
| } |
| _, err := t.c.pubc.GetTopic(ctx, &pb.GetTopicRequest{Topic: t.name}) |
| if err == nil { |
| return true, nil |
| } |
| if grpc.Code(err) == codes.NotFound { |
| return false, nil |
| } |
| return false, err |
| } |
| |
| // IAM returns the topic's IAM handle. |
| func (t *Topic) IAM() *iam.Handle { |
| return iam.InternalNewHandle(t.c.pubc.Connection(), t.name) |
| } |
| |
| // Subscriptions returns an iterator which returns the subscriptions for this topic. |
| // |
| // Some of the returned subscriptions may belong to a project other than t. |
| func (t *Topic) Subscriptions(ctx context.Context) *SubscriptionIterator { |
| it := t.c.pubc.ListTopicSubscriptions(ctx, &pb.ListTopicSubscriptionsRequest{ |
| Topic: t.name, |
| }) |
| return &SubscriptionIterator{ |
| c: t.c, |
| next: it.Next, |
| } |
| } |
| |
| var errTopicStopped = errors.New("pubsub: Stop has been called for this topic") |
| |
| // Publish publishes msg to the topic asynchronously. Messages are batched and |
| // sent according to the topic's PublishSettings. Publish never blocks. |
| // |
| // Publish returns a non-nil PublishResult which will be ready when the |
| // message has been sent (or has failed to be sent) to the server. |
| // |
| // Publish creates goroutines for batching and sending messages. These goroutines |
| // need to be stopped by calling t.Stop(). Once stopped, future calls to Publish |
| // will immediately return a PublishResult with an error. |
| func (t *Topic) Publish(ctx context.Context, msg *Message) *PublishResult { |
| // TODO(jba): if this turns out to take significant time, try to approximate it. |
| // Or, convert the messages to protos in Publish, instead of in the service. |
| msg.size = proto.Size(&pb.PubsubMessage{ |
| Data: msg.Data, |
| Attributes: msg.Attributes, |
| }) |
| r := &PublishResult{ready: make(chan struct{})} |
| t.initBundler() |
| t.mu.RLock() |
| defer t.mu.RUnlock() |
| // TODO(aboulhosn) [from bcmills] consider changing the semantics of bundler to perform this logic so we don't have to do it here |
| if t.stopped { |
| r.set("", errTopicStopped) |
| return r |
| } |
| |
| // TODO(jba) [from bcmills] consider using a shared channel per bundle |
| // (requires Bundler API changes; would reduce allocations) |
| // The call to Add should never return an error because the bundler's |
| // BufferedByteLimit is set to maxInt; we do not perform any flow |
| // control in the client. |
| err := t.bundler.Add(&bundledMessage{msg, r}, msg.size) |
| if err != nil { |
| r.set("", err) |
| } |
| return r |
| } |
| |
| // Stop sends all remaining published messages and stop goroutines created for handling |
| // publishing. Returns once all outstanding messages have been sent or have |
| // failed to be sent. |
| func (t *Topic) Stop() { |
| t.mu.Lock() |
| noop := t.stopped || t.bundler == nil |
| t.stopped = true |
| t.mu.Unlock() |
| if noop { |
| return |
| } |
| t.bundler.Flush() |
| } |
| |
| // A PublishResult holds the result from a call to Publish. |
| type PublishResult struct { |
| ready chan struct{} |
| serverID string |
| err error |
| } |
| |
| // Ready returns a channel that is closed when the result is ready. |
| // When the Ready channel is closed, Get is guaranteed not to block. |
| func (r *PublishResult) Ready() <-chan struct{} { return r.ready } |
| |
| // Get returns the server-generated message ID and/or error result of a Publish call. |
| // Get blocks until the Publish call completes or the context is done. |
| func (r *PublishResult) Get(ctx context.Context) (serverID string, err error) { |
| // If the result is already ready, return it even if the context is done. |
| select { |
| case <-r.Ready(): |
| return r.serverID, r.err |
| default: |
| } |
| select { |
| case <-ctx.Done(): |
| return "", ctx.Err() |
| case <-r.Ready(): |
| return r.serverID, r.err |
| } |
| } |
| |
| func (r *PublishResult) set(sid string, err error) { |
| r.serverID = sid |
| r.err = err |
| close(r.ready) |
| } |
| |
| type bundledMessage struct { |
| msg *Message |
| res *PublishResult |
| } |
| |
| func (t *Topic) initBundler() { |
| t.mu.RLock() |
| noop := t.stopped || t.bundler != nil |
| t.mu.RUnlock() |
| if noop { |
| return |
| } |
| t.mu.Lock() |
| defer t.mu.Unlock() |
| // Must re-check, since we released the lock. |
| if t.stopped || t.bundler != nil { |
| return |
| } |
| |
| timeout := t.PublishSettings.Timeout |
| t.bundler = bundler.NewBundler(&bundledMessage{}, func(items interface{}) { |
| // TODO(jba): use a context detached from the one passed to NewClient. |
| ctx := context.TODO() |
| if timeout != 0 { |
| var cancel func() |
| ctx, cancel = context.WithTimeout(ctx, timeout) |
| defer cancel() |
| } |
| t.publishMessageBundle(ctx, items.([]*bundledMessage)) |
| }) |
| t.bundler.DelayThreshold = t.PublishSettings.DelayThreshold |
| t.bundler.BundleCountThreshold = t.PublishSettings.CountThreshold |
| if t.bundler.BundleCountThreshold > MaxPublishRequestCount { |
| t.bundler.BundleCountThreshold = MaxPublishRequestCount |
| } |
| t.bundler.BundleByteThreshold = t.PublishSettings.ByteThreshold |
| t.bundler.BufferedByteLimit = maxInt |
| t.bundler.BundleByteLimit = MaxPublishRequestBytes |
| // Unless overridden, allow many goroutines per CPU to call the Publish RPC concurrently. |
| // The default value was determined via extensive load testing (see the loadtest subdirectory). |
| if t.PublishSettings.NumGoroutines > 0 { |
| t.bundler.HandlerLimit = t.PublishSettings.NumGoroutines |
| } else { |
| t.bundler.HandlerLimit = 25 * runtime.GOMAXPROCS(0) |
| } |
| } |
| |
| func (t *Topic) publishMessageBundle(ctx context.Context, bms []*bundledMessage) { |
| pbMsgs := make([]*pb.PubsubMessage, len(bms)) |
| for i, bm := range bms { |
| pbMsgs[i] = &pb.PubsubMessage{ |
| Data: bm.msg.Data, |
| Attributes: bm.msg.Attributes, |
| } |
| bm.msg = nil // release bm.msg for GC |
| } |
| res, err := t.c.pubc.Publish(ctx, &pb.PublishRequest{ |
| Topic: t.name, |
| Messages: pbMsgs, |
| }, gax.WithGRPCOptions(grpc.MaxCallSendMsgSize(maxSendRecvBytes))) |
| for i, bm := range bms { |
| if err != nil { |
| bm.res.set("", err) |
| } else { |
| bm.res.set(res.MessageIds[i], nil) |
| } |
| } |
| } |