mirror of
https://github.com/coder/coder.git
synced 2025-07-03 16:13:58 +00:00
chore: track disabled telemetry (#16347)
Addresses https://github.com/coder/nexus/issues/116. ## Core Concept Send one final telemetry report after the user disables telemetry with the message that the telemetry was disabled. No other information about the deployment is sent in this report. This final report is submitted only if the deployment ever had telemetry on. ## Changes 1. Refactored how our telemetry is initialized. 2. Introduced the `TelemetryEnabled` telemetry item, which allows to decide whether a final report should be sent. 3. Added the `RecordTelemetryStatus` telemetry method, which decides whether a final report should be sent and updates the telemetry item. 4. Added tests to ensure the implementation is correct.
This commit is contained in:
@ -15,6 +15,7 @@ import (
|
||||
"regexp"
|
||||
"runtime"
|
||||
"slices"
|
||||
"strconv"
|
||||
"strings"
|
||||
"sync"
|
||||
"time"
|
||||
@ -42,6 +43,7 @@ const (
|
||||
)
|
||||
|
||||
type Options struct {
|
||||
Disabled bool
|
||||
Database database.Store
|
||||
Logger slog.Logger
|
||||
// URL is an endpoint to direct telemetry towards!
|
||||
@ -116,8 +118,8 @@ type remoteReporter struct {
|
||||
shutdownAt *time.Time
|
||||
}
|
||||
|
||||
func (*remoteReporter) Enabled() bool {
|
||||
return true
|
||||
func (r *remoteReporter) Enabled() bool {
|
||||
return !r.options.Disabled
|
||||
}
|
||||
|
||||
func (r *remoteReporter) Report(snapshot *Snapshot) {
|
||||
@ -161,10 +163,12 @@ func (r *remoteReporter) Close() {
|
||||
close(r.closed)
|
||||
now := dbtime.Now()
|
||||
r.shutdownAt = &now
|
||||
// Report a final collection of telemetry prior to close!
|
||||
// This could indicate final actions a user has taken, and
|
||||
// the time the deployment was shutdown.
|
||||
r.reportWithDeployment()
|
||||
if r.Enabled() {
|
||||
// Report a final collection of telemetry prior to close!
|
||||
// This could indicate final actions a user has taken, and
|
||||
// the time the deployment was shutdown.
|
||||
r.reportWithDeployment()
|
||||
}
|
||||
r.closeFunc()
|
||||
}
|
||||
|
||||
@ -177,7 +181,74 @@ func (r *remoteReporter) isClosed() bool {
|
||||
}
|
||||
}
|
||||
|
||||
// See the corresponding test in telemetry_test.go for a truth table.
|
||||
func ShouldReportTelemetryDisabled(recordedTelemetryEnabled *bool, telemetryEnabled bool) bool {
|
||||
return recordedTelemetryEnabled != nil && *recordedTelemetryEnabled && !telemetryEnabled
|
||||
}
|
||||
|
||||
// RecordTelemetryStatus records the telemetry status in the database.
|
||||
// If the status changed from enabled to disabled, returns a snapshot to
|
||||
// be sent to the telemetry server.
|
||||
func RecordTelemetryStatus( //nolint:revive
|
||||
ctx context.Context,
|
||||
logger slog.Logger,
|
||||
db database.Store,
|
||||
telemetryEnabled bool,
|
||||
) (*Snapshot, error) {
|
||||
item, err := db.GetTelemetryItem(ctx, string(TelemetryItemKeyTelemetryEnabled))
|
||||
if err != nil && !errors.Is(err, sql.ErrNoRows) {
|
||||
return nil, xerrors.Errorf("get telemetry enabled: %w", err)
|
||||
}
|
||||
var recordedTelemetryEnabled *bool
|
||||
if !errors.Is(err, sql.ErrNoRows) {
|
||||
value, err := strconv.ParseBool(item.Value)
|
||||
if err != nil {
|
||||
logger.Debug(ctx, "parse telemetry enabled", slog.Error(err))
|
||||
}
|
||||
// If ParseBool fails, value will default to false.
|
||||
// This may happen if an admin manually edits the telemetry item
|
||||
// in the database.
|
||||
recordedTelemetryEnabled = &value
|
||||
}
|
||||
|
||||
if err := db.UpsertTelemetryItem(ctx, database.UpsertTelemetryItemParams{
|
||||
Key: string(TelemetryItemKeyTelemetryEnabled),
|
||||
Value: strconv.FormatBool(telemetryEnabled),
|
||||
}); err != nil {
|
||||
return nil, xerrors.Errorf("upsert telemetry enabled: %w", err)
|
||||
}
|
||||
|
||||
shouldReport := ShouldReportTelemetryDisabled(recordedTelemetryEnabled, telemetryEnabled)
|
||||
if !shouldReport {
|
||||
return nil, nil //nolint:nilnil
|
||||
}
|
||||
// If any of the following calls fail, we will never report that telemetry changed
|
||||
// from enabled to disabled. This is okay. We only want to ping the telemetry server
|
||||
// once, and never again. If that attempt fails, so be it.
|
||||
item, err = db.GetTelemetryItem(ctx, string(TelemetryItemKeyTelemetryEnabled))
|
||||
if err != nil {
|
||||
return nil, xerrors.Errorf("get telemetry enabled after upsert: %w", err)
|
||||
}
|
||||
return &Snapshot{
|
||||
TelemetryItems: []TelemetryItem{
|
||||
ConvertTelemetryItem(item),
|
||||
},
|
||||
}, nil
|
||||
}
|
||||
|
||||
func (r *remoteReporter) runSnapshotter() {
|
||||
telemetryDisabledSnapshot, err := RecordTelemetryStatus(r.ctx, r.options.Logger, r.options.Database, r.Enabled())
|
||||
if err != nil {
|
||||
r.options.Logger.Debug(r.ctx, "record and maybe report telemetry status", slog.Error(err))
|
||||
}
|
||||
if telemetryDisabledSnapshot != nil {
|
||||
r.reportSync(telemetryDisabledSnapshot)
|
||||
}
|
||||
r.options.Logger.Debug(r.ctx, "finished telemetry status check")
|
||||
if !r.Enabled() {
|
||||
return
|
||||
}
|
||||
|
||||
first := true
|
||||
ticker := time.NewTicker(r.options.SnapshotFrequency)
|
||||
defer ticker.Stop()
|
||||
@ -1567,6 +1638,7 @@ type telemetryItemKey string
|
||||
//revive:disable:exported
|
||||
const (
|
||||
TelemetryItemKeyHTMLFirstServedAt telemetryItemKey = "html_first_served_at"
|
||||
TelemetryItemKeyTelemetryEnabled telemetryItemKey = "telemetry_enabled"
|
||||
)
|
||||
|
||||
type TelemetryItem struct {
|
||||
@ -1578,6 +1650,8 @@ type TelemetryItem struct {
|
||||
|
||||
type noopReporter struct{}
|
||||
|
||||
func (*noopReporter) Report(_ *Snapshot) {}
|
||||
func (*noopReporter) Enabled() bool { return false }
|
||||
func (*noopReporter) Close() {}
|
||||
func (*noopReporter) Report(_ *Snapshot) {}
|
||||
func (*noopReporter) Enabled() bool { return false }
|
||||
func (*noopReporter) Close() {}
|
||||
func (*noopReporter) RunSnapshotter() {}
|
||||
func (*noopReporter) ReportDisabledIfNeeded() error { return nil }
|
||||
|
@ -131,7 +131,8 @@ func TestTelemetry(t *testing.T) {
|
||||
require.Len(t, snapshot.WorkspaceProxies, 1)
|
||||
require.Len(t, snapshot.WorkspaceModules, 1)
|
||||
require.Len(t, snapshot.Organizations, 1)
|
||||
require.Len(t, snapshot.TelemetryItems, 1)
|
||||
// We create one item manually above. The other is TelemetryEnabled, created by the snapshotter.
|
||||
require.Len(t, snapshot.TelemetryItems, 2)
|
||||
wsa := snapshot.WorkspaceAgents[0]
|
||||
require.Len(t, wsa.Subsystems, 2)
|
||||
require.Equal(t, string(database.WorkspaceAgentSubsystemEnvbox), wsa.Subsystems[0])
|
||||
@ -361,31 +362,112 @@ func TestTelemetryItem(t *testing.T) {
|
||||
require.Equal(t, item.Value, "new_value")
|
||||
}
|
||||
|
||||
func collectSnapshot(t *testing.T, db database.Store, addOptionsFn func(opts telemetry.Options) telemetry.Options) (*telemetry.Deployment, *telemetry.Snapshot) {
|
||||
func TestShouldReportTelemetryDisabled(t *testing.T) {
|
||||
t.Parallel()
|
||||
// Description | telemetryEnabled (db) | telemetryEnabled (is) | Report Telemetry Disabled |
|
||||
//----------------------------------------|-----------------------|-----------------------|---------------------------|
|
||||
// New deployment | <null> | true | No |
|
||||
// New deployment with telemetry disabled | <null> | false | No |
|
||||
// Telemetry was enabled, and still is | true | true | No |
|
||||
// Telemetry was enabled but now disabled | true | false | Yes |
|
||||
// Telemetry was disabled, now is enabled | false | true | No |
|
||||
// Telemetry was disabled, still disabled | false | false | No |
|
||||
boolTrue := true
|
||||
boolFalse := false
|
||||
require.False(t, telemetry.ShouldReportTelemetryDisabled(nil, true))
|
||||
require.False(t, telemetry.ShouldReportTelemetryDisabled(nil, false))
|
||||
require.False(t, telemetry.ShouldReportTelemetryDisabled(&boolTrue, true))
|
||||
require.True(t, telemetry.ShouldReportTelemetryDisabled(&boolTrue, false))
|
||||
require.False(t, telemetry.ShouldReportTelemetryDisabled(&boolFalse, true))
|
||||
require.False(t, telemetry.ShouldReportTelemetryDisabled(&boolFalse, false))
|
||||
}
|
||||
|
||||
func TestRecordTelemetryStatus(t *testing.T) {
|
||||
t.Parallel()
|
||||
for _, testCase := range []struct {
|
||||
name string
|
||||
recordedTelemetryEnabled string
|
||||
telemetryEnabled bool
|
||||
shouldReport bool
|
||||
}{
|
||||
{name: "New deployment", recordedTelemetryEnabled: "nil", telemetryEnabled: true, shouldReport: false},
|
||||
{name: "Telemetry disabled", recordedTelemetryEnabled: "nil", telemetryEnabled: false, shouldReport: false},
|
||||
{name: "Telemetry was enabled and still is", recordedTelemetryEnabled: "true", telemetryEnabled: true, shouldReport: false},
|
||||
{name: "Telemetry was enabled but now disabled", recordedTelemetryEnabled: "true", telemetryEnabled: false, shouldReport: true},
|
||||
{name: "Telemetry was disabled now is enabled", recordedTelemetryEnabled: "false", telemetryEnabled: true, shouldReport: false},
|
||||
{name: "Telemetry was disabled still disabled", recordedTelemetryEnabled: "false", telemetryEnabled: false, shouldReport: false},
|
||||
{name: "Telemetry was disabled still disabled, invalid value", recordedTelemetryEnabled: "invalid", telemetryEnabled: false, shouldReport: false},
|
||||
} {
|
||||
testCase := testCase
|
||||
t.Run(testCase.name, func(t *testing.T) {
|
||||
t.Parallel()
|
||||
|
||||
db, _ := dbtestutil.NewDB(t)
|
||||
ctx := testutil.Context(t, testutil.WaitMedium)
|
||||
logger := testutil.Logger(t)
|
||||
if testCase.recordedTelemetryEnabled != "nil" {
|
||||
db.UpsertTelemetryItem(ctx, database.UpsertTelemetryItemParams{
|
||||
Key: string(telemetry.TelemetryItemKeyTelemetryEnabled),
|
||||
Value: testCase.recordedTelemetryEnabled,
|
||||
})
|
||||
}
|
||||
snapshot1, err := telemetry.RecordTelemetryStatus(ctx, logger, db, testCase.telemetryEnabled)
|
||||
require.NoError(t, err)
|
||||
|
||||
if testCase.shouldReport {
|
||||
require.NotNil(t, snapshot1)
|
||||
require.Equal(t, snapshot1.TelemetryItems[0].Key, string(telemetry.TelemetryItemKeyTelemetryEnabled))
|
||||
require.Equal(t, snapshot1.TelemetryItems[0].Value, "false")
|
||||
} else {
|
||||
require.Nil(t, snapshot1)
|
||||
}
|
||||
|
||||
for i := 0; i < 3; i++ {
|
||||
// Whatever happens, subsequent calls should not report if telemetryEnabled didn't change
|
||||
snapshot2, err := telemetry.RecordTelemetryStatus(ctx, logger, db, testCase.telemetryEnabled)
|
||||
require.NoError(t, err)
|
||||
require.Nil(t, snapshot2)
|
||||
}
|
||||
})
|
||||
}
|
||||
}
|
||||
|
||||
func mockTelemetryServer(t *testing.T) (*url.URL, chan *telemetry.Deployment, chan *telemetry.Snapshot) {
|
||||
t.Helper()
|
||||
deployment := make(chan *telemetry.Deployment, 64)
|
||||
snapshot := make(chan *telemetry.Snapshot, 64)
|
||||
r := chi.NewRouter()
|
||||
r.Post("/deployment", func(w http.ResponseWriter, r *http.Request) {
|
||||
require.Equal(t, buildinfo.Version(), r.Header.Get(telemetry.VersionHeader))
|
||||
w.WriteHeader(http.StatusAccepted)
|
||||
dd := &telemetry.Deployment{}
|
||||
err := json.NewDecoder(r.Body).Decode(dd)
|
||||
require.NoError(t, err)
|
||||
deployment <- dd
|
||||
// Ensure the header is sent only after deployment is sent
|
||||
w.WriteHeader(http.StatusAccepted)
|
||||
})
|
||||
r.Post("/snapshot", func(w http.ResponseWriter, r *http.Request) {
|
||||
require.Equal(t, buildinfo.Version(), r.Header.Get(telemetry.VersionHeader))
|
||||
w.WriteHeader(http.StatusAccepted)
|
||||
ss := &telemetry.Snapshot{}
|
||||
err := json.NewDecoder(r.Body).Decode(ss)
|
||||
require.NoError(t, err)
|
||||
snapshot <- ss
|
||||
// Ensure the header is sent only after snapshot is sent
|
||||
w.WriteHeader(http.StatusAccepted)
|
||||
})
|
||||
server := httptest.NewServer(r)
|
||||
t.Cleanup(server.Close)
|
||||
serverURL, err := url.Parse(server.URL)
|
||||
require.NoError(t, err)
|
||||
|
||||
return serverURL, deployment, snapshot
|
||||
}
|
||||
|
||||
func collectSnapshot(t *testing.T, db database.Store, addOptionsFn func(opts telemetry.Options) telemetry.Options) (*telemetry.Deployment, *telemetry.Snapshot) {
|
||||
t.Helper()
|
||||
|
||||
serverURL, deployment, snapshot := mockTelemetryServer(t)
|
||||
|
||||
options := telemetry.Options{
|
||||
Database: db,
|
||||
Logger: testutil.Logger(t),
|
||||
|
Reference in New Issue
Block a user