From fcd0a8252e3ab27662be2a781073b80a03f31573 Mon Sep 17 00:00:00 2001 From: Rasmus Dahlberg Date: Sun, 11 May 2025 20:54:16 +0200 Subject: monitor: Retry get-sth and proof fetching Should ensure we don't get into a position where we always fail to get 3x queries that succeed in a row when trying to persist chunks. --- internal/monitor/backoff.go | 83 +++++++++++++++++++++++++++++++++++++++++++-- 1 file changed, 80 insertions(+), 3 deletions(-) (limited to 'internal') diff --git a/internal/monitor/backoff.go b/internal/monitor/backoff.go index 63c5f55..3bfff7e 100644 --- a/internal/monitor/backoff.go +++ b/internal/monitor/backoff.go @@ -2,6 +2,7 @@ package monitor import ( "context" + "time" ct "github.com/google/certificate-transparency-go" "github.com/google/certificate-transparency-go/client" @@ -15,6 +16,10 @@ import ( // // For reference on this issue, see: // https://github.com/google/certificate-transparency-go/issues/898 +// +// Update: retries was added for get-sth and proof fetching. +// Only because we need 3x queries that succeed in a row, and some logs seem to +// rate limit globally for all endpoints rather than per endpoint. type backoffClient struct { cli *client.LogClient } @@ -24,15 +29,75 @@ func (bc *backoffClient) BaseURI() string { } func (bc *backoffClient) GetSTH(ctx context.Context) (*ct.SignedTreeHead, error) { - return bc.cli.GetSTH(ctx) + backoff := 1 + for { + rsp, err := bc.cli.GetSTH(ctx) + if err == nil { + return rsp, nil + } + + jcErr, ok := err.(jsonclient.RspError) + if !ok { + return rsp, err + } + if jcErr.StatusCode != 429 { + return rsp, err + } + if err := sleep(ctx, time.Duration(backoff)*time.Second); err != nil { + return nil, err + } + if backoff < 32 { + backoff = 2 * backoff + } + } } func (bc *backoffClient) GetSTHConsistency(ctx context.Context, first, second uint64) ([][]byte, error) { - return bc.cli.GetSTHConsistency(ctx, first, second) + backoff := 1 + for { + rsp, err := bc.cli.GetSTHConsistency(ctx, first, second) + if err == nil { + return rsp, nil + } + + jcErr, ok := err.(jsonclient.RspError) + if !ok { + return rsp, err + } + if jcErr.StatusCode != 429 { + return rsp, err + } + if err := sleep(ctx, time.Duration(backoff)*time.Second); err != nil { + return nil, err + } + if backoff < 32 { + backoff = 2 * backoff + } + } } func (bc *backoffClient) GetProofByHash(ctx context.Context, hash []byte, treeSize uint64) (*ct.GetProofByHashResponse, error) { - return bc.cli.GetProofByHash(ctx, hash, treeSize) + backoff := 1 + for { + rsp, err := bc.cli.GetProofByHash(ctx, hash, treeSize) + if err == nil { + return rsp, nil + } + + jcErr, ok := err.(jsonclient.RspError) + if !ok { + return rsp, err + } + if jcErr.StatusCode != 429 { + return rsp, err + } + if err := sleep(ctx, time.Duration(backoff)*time.Second); err != nil { + return nil, err + } + if backoff < 32 { + backoff = 2 * backoff + } + } } func (bc *backoffClient) GetRawEntries(ctx context.Context, start, end int64) (*ct.GetEntriesResponse, error) { @@ -54,3 +119,15 @@ func (bc *backoffClient) GetRawEntries(ctx context.Context, start, end int64) (* } return rsp, err } + +func sleep(ctx context.Context, d time.Duration) error { + timer := time.NewTimer(d) + defer timer.Stop() + + select { + case <-ctx.Done(): + return ctx.Err() + case <-timer.C: + return nil + } +} -- cgit v1.2.3