trufflesecurity · ap00rv · Sep 5, 2025 · Oct 7, 2025 · Oct 8, 2025 · Oct 9, 2025
@@ -35,6 +35,8 @@ func (s Scanner) Keywords() []string {
 	return []string{"confluent"}
 }
 
+// Version reports the version number of this detector implementation (1).
+// The same value is published in each result's ExtraData under "version".
+func (s Scanner) Version() int {
+	return 1
+}
+
 // FromData will find and optionally verify Confluent secrets in a given set of bytes.
 func (s Scanner) FromData(ctx context.Context, verify bool, data []byte) (results []detectors.Result, err error) {
 	dataStr := string(data)
@@ -52,6 +54,10 @@ func (s Scanner) FromData(ctx context.Context, verify bool, data []byte) (result
 				DetectorType: detectorspb.DetectorType_Confluent,
 				Raw:          []byte(resMatch),
 				RawV2:        []byte(resMatch + resSecret),
+				ExtraData: map[string]string{
+					"rotation_guide": "https://docs.confluent.io/cloud/current/security/authenticate/workload-identities/service-accounts/api-keys/best-practices-api-keys.html#rotate-api-keys-regularly",
+					"version":        fmt.Sprintf("%d", s.Version()),
+				},
 			}
 
 			if verify {

@@ -0,0 +1,118 @@
+package confluent
+
+import (
+	"context"
+	b64 "encoding/base64"
+	"fmt"
+	"hash/crc32"
+	"strings"
+
+	regexp "github.com/wasilibs/go-re2"
+
+	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors"
+	"github.com/trufflesecurity/trufflehog/v3/pkg/pb/detectorspb"
+)
+
+// Scanner is the Confluent detector for API secrets in the "cflt"-prefixed
+// format. It embeds detectors.DefaultMultiPartCredentialProvider.
+type Scanner struct {
+	detectors.DefaultMultiPartCredentialProvider
+}
+
+// Ensure the Scanner satisfies the interface at compile time.
+var _ detectors.Detector = (*Scanner)(nil)
+
+var (
+	// keyPat captures a 16-character API key made of A-Z and 0-9, preceded by
+	// whatever detectors.PrefixRegex generates for the "confluent" keyword.
+	keyPat = regexp.MustCompile(detectors.PrefixRegex([]string{"confluent"}) + `\b([A-Z0-9]{16})\b`)
+	// secretPat captures an API secret: the literal "cflt" prefix followed by
+	// 60 characters consisting of A-Z, a-z, 0-9, + or /.
+	// See https://docs.confluent.io/cloud/current/security/authenticate/workload-identities/service-accounts/api-keys/overview.html#api-secret-format
+	secretPat = regexp.MustCompile(`\b(cflt[A-Za-z0-9+/]{60})\b`)
+)
+
+// Keywords lists the substrings used to pre-filter chunks efficiently before
+// the regular expressions run. The "cflt" secret prefix is used because it is
+// an identifier contained in the secret itself.
+func (s Scanner) Keywords() []string {
+	keywords := []string{"cflt"}
+	return keywords
+}
+
+// Version reports the version number of this detector implementation (2).
+// FromData publishes the same value in each result's ExtraData under "version".
+func (s Scanner) Version() int {
+	return 2
+}
+
+// FromData scans data for Confluent API keys and "cflt"-prefixed API secrets
+// and emits one result for every key/secret combination found, so nothing is
+// reported unless at least one key and one secret are both present.
+//
+// When verify is true, each result's Verified field holds the outcome of
+// verifyConfluentSecret for its secret; otherwise it stays false. The returned
+// error is always nil.
+func (s Scanner) FromData(ctx context.Context, verify bool, data []byte) (results []detectors.Result, err error) {
+	text := string(data)
+	version := fmt.Sprintf("%d", s.Version())
+
+	keyHits := keyPat.FindAllStringSubmatch(text, -1)
+	secretHits := secretPat.FindAllStringSubmatch(text, -1)
+
+	for _, keyHit := range keyHits {
+		apiKey := strings.TrimSpace(keyHit[1]) // capture group 1 is the key itself
+
+		for _, secretHit := range secretHits {
+			apiSecret := strings.TrimSpace(secretHit[1]) // capture group 1 is the secret itself
+
+			results = append(results, detectors.Result{
+				DetectorType: detectorspb.DetectorType_Confluent,
+				Raw:          []byte(apiKey),
+				RawV2:        []byte(apiKey + apiSecret),
+				ExtraData: map[string]string{
+					"rotation_guide": "https://docs.confluent.io/cloud/current/security/authenticate/workload-identities/service-accounts/api-keys/best-practices-api-keys.html#rotate-api-keys-regularly",
+					"version":        version,
+				},
+				// The checksum is only evaluated when verification was requested.
+				Verified: verify && verifyConfluentSecret(apiSecret),
+			})
+		}
+	}
+
+	return results, nil
+}
+
+// verifyConfluentSecret verifies the Confluent secret by checking the CRC32 checksum
+func verifyConfluentSecret(secret string) bool {
+	if len(secret) != 64 { // cflt + 60 characters
+		return false
+	}
+
+	if !strings.HasPrefix(secret, "cflt") {
+		return false
+	}
+
+	// Extract the first 54 characters after 'cflt' prefix (58 total - 4 for cflt)
+	payload := secret[4:58] // Characters 5-58 (54 characters)
+
+	// Extract the last 6 characters as the checksum
+	checksumEncoded := secret[58:64]
+
+	// Decode the checksum from base64
+	checksumBytes, err := b64.StdEncoding.DecodeString(checksumEncoded + "==") // Add padding if needed
+	if err != nil {
+		// Try without padding
+		checksumBytes, err = b64.StdEncoding.DecodeString(checksumEncoded)
+		if err != nil {
+			return false
+		}
+	}
+
+	if len(checksumBytes) < 4 {
+		return false
+	}
+
+	// Calculate CRC32 checksum of the payload
+	expectedChecksum := crc32.ChecksumIEEE([]byte(payload))
+
+	// Convert received checksum bytes to uint32 (little endian to match the encoding)
+	receivedChecksum := uint32(checksumBytes[3])<<24 | uint32(checksumBytes[2])<<16 |
+		uint32(checksumBytes[1])<<8 | uint32(checksumBytes[0])
+
+	return expectedChecksum == receivedChecksum
+}
+
+// Type reports the detector type associated with this scanner, which is the
+// same DetectorType that FromData stamps on every result.
+func (s Scanner) Type() detectorspb.DetectorType {
+	detectorType := detectorspb.DetectorType_Confluent
+	return detectorType
+}
+
+func (s Scanner) Description() string {
+	return "Confluent provides a streaming platform based on Apache Kafka to help companies harness their data in real-time. Confluent Cloud API keys can be used to access and manage Confluent Cloud control plane APIs and resources."
+}
@@ -0,0 +1,123 @@
+//go:build detectors
+// +build detectors
+
+package confluent
+
+import (
+	"context"
+	"fmt"
+	"testing"
+
+	"github.com/kylelemons/godebug/pretty"
+	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors"
+
+	"github.com/trufflesecurity/trufflehog/v3/pkg/pb/detectorspb"
+)
+
+// TestConfluent_FromChunk runs FromData with verification enabled against a
+// secret with a valid checksum, a secret with an invalid checksum, and input
+// without any secret, and compares the results with the expected ones.
+func TestConfluent_FromChunk(t *testing.T) {
+	// Valid secret with proper CRC32 checksum
+	validSecret := "cfltT8d8RzkNseTMEDKcjNM1BZTFPHqRn/dQm9q7w6SjzZ12wZfwjaJdipHZtDjw"
+	// Invalid secret with wrong checksum
+	invalidSecret := "cfltT8d8RzkNseTMEDKcjNM1BZTFPHqRn/dQm9q7w6SjzZ12wZfwjaJdipHZtDje"
+	key := "JSAOOCIC74SGECCP"
+
+	type args struct {
+		ctx    context.Context
+		data   []byte
+		verify bool
+	}
+	tests := []struct {
+		name    string
+		s       Scanner
+		args    args
+		want    []detectors.Result
+		wantErr bool
+	}{
+		{
+			name: "found, verified",
+			s:    Scanner{},
+			args: args{
+				ctx:    context.Background(),
+				data:   []byte(fmt.Sprintf("You can find a confluent secret %s with key %s", validSecret, key)),
+				verify: true,
+			},
+			want: []detectors.Result{
+				{
+					DetectorType: detectorspb.DetectorType_Confluent,
+					Verified:     true,
+					ExtraData: map[string]string{
+						"rotation_guide": "https://docs.confluent.io/cloud/current/security/authenticate/workload-identities/service-accounts/api-keys/best-practices-api-keys.html#rotate-api-keys-regularly",
+						"version":        "2",
+					},
+				},
+			},
+			wantErr: false,
+		},
+		{
+			name: "found, unverified",
+			s:    Scanner{},
+			args: args{
+				ctx:    context.Background(),
+				data:   []byte(fmt.Sprintf("You can find a confluent secret %s with %s key but not valid", invalidSecret, key)), // the secret would satisfy the regex but not pass validation
+				verify: true,
+			},
+			want: []detectors.Result{
+				{
+					DetectorType: detectorspb.DetectorType_Confluent,
+					Verified:     false,
+					ExtraData: map[string]string{
+						"rotation_guide": "https://docs.confluent.io/cloud/current/security/authenticate/workload-identities/service-accounts/api-keys/best-practices-api-keys.html#rotate-api-keys-regularly",
+						"version":        "2",
+					},
+				},
+			},
+			wantErr: false,
+		},
+		{
+			name: "not found",
+			s:    Scanner{},
+			args: args{
+				ctx:    context.Background(),
+				data:   []byte("You cannot find the secret within"),
+				verify: true,
+			},
+			want:    nil,
+			wantErr: false,
+		},
+	}
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			// Use the scanner declared by the test case rather than a fresh one.
+			got, err := tt.s.FromData(tt.args.ctx, tt.args.verify, tt.args.data)
+			if (err != nil) != tt.wantErr {
+				t.Errorf("Confluent.FromData() error = %v, wantErr %v", err, tt.wantErr)
+				return
+			}
+			for i := range got {
+				if len(got[i].Raw) == 0 {
+					t.Fatalf("no raw secret present: \n %+v", got[i])
+				}
+				// The expected results carry no raw material, so clear both raw
+				// fields set by FromData before comparing.
+				got[i].Raw = nil
+				got[i].RawV2 = nil
+			}
+			if diff := pretty.Compare(got, tt.want); diff != "" {
+				t.Errorf("Confluent.FromData() %s diff: (-got +want)\n%s", tt.name, diff)
+			}
+		})
+	}
+}
+
+// BenchmarkFromData measures FromData with verification disabled, running one
+// sub-benchmark per entry returned by detectors.MustGetBenchmarkData.
+func BenchmarkFromData(benchmark *testing.B) {
+	scanner := Scanner{}
+	ctx := context.Background()
+
+	for name, data := range detectors.MustGetBenchmarkData() {
+		benchmark.Run(name, func(b *testing.B) {
+			b.ResetTimer()
+			for n := 0; n < b.N; n++ {
+				if _, err := scanner.FromData(ctx, false, data); err != nil {
+					b.Fatal(err)
+				}
+			}
+		})
+	}
+}
@@ -0,0 +1,87 @@
+package confluent
+
+import (
+	"context"
+	"testing"
+
+	"github.com/google/go-cmp/cmp"
+
+	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors"
+	"github.com/trufflesecurity/trufflehog/v3/pkg/engine/ahocorasick"
+)
+
+var (
+	// validPattern is sample input that contains one API key and one API secret.
+	validPattern = `
+		=== Confluent Cloud API key ===
+
+		API key:
+		JSAOOCIC74SGECCP
+
+		API secret:
+		cfltT8d8RzkNseTMEDKcjNM1BZTFPHqRn/dQm9q7w6SjzZ12wZfwjaJdipHZtDjw
+
+		Resource scope:
+		Cloud resource management
+
+	`
+	// secret is the value expected for validPattern: the API key immediately
+	// followed by the API secret.
+	secret = "JSAOOCIC74SGECCPcfltT8d8RzkNseTMEDKcjNM1BZTFPHqRn/dQm9q7w6SjzZ12wZfwjaJdipHZtDjw"
+)
+
+// TestConfluent_Pattern checks that the detector's keywords match the sample
+// input and that FromData, with verification disabled, yields exactly the
+// expected set of raw values (RawV2 when present, otherwise Raw).
+func TestConfluent_Pattern(t *testing.T) {
+	scanner := Scanner{}
+	core := ahocorasick.NewAhoCorasickCore([]detectors.Detector{scanner})
+
+	cases := []struct {
+		name  string
+		input string
+		want  []string
+	}{
+		{
+			name:  "valid pattern",
+			input: validPattern,
+			want:  []string{secret},
+		},
+	}
+
+	for _, tc := range cases {
+		t.Run(tc.name, func(t *testing.T) {
+			// The keyword pre-filter must select this detector for the input.
+			if matched := core.FindDetectorMatches([]byte(tc.input)); len(matched) == 0 {
+				t.Errorf("keywords '%v' not matched by: %s", scanner.Keywords(), tc.input)
+				return
+			}
+
+			results, err := scanner.FromData(context.Background(), false, []byte(tc.input))
+			if err != nil {
+				t.Errorf("error = %v", err)
+				return
+			}
+
+			switch {
+			case len(results) == len(tc.want):
+				// Counts agree; the contents are compared below.
+			case len(results) == 0:
+				t.Errorf("did not receive result")
+				return
+			default:
+				t.Errorf("expected %d results, only received %d", len(tc.want), len(results))
+				return
+			}
+
+			// Compare as sets so that result order does not matter.
+			actual := make(map[string]struct{}, len(results))
+			for _, r := range results {
+				raw := r.Raw
+				if len(r.RawV2) > 0 {
+					raw = r.RawV2
+				}
+				actual[string(raw)] = struct{}{}
+			}
+			expected := make(map[string]struct{}, len(tc.want))
+			for _, w := range tc.want {
+				expected[w] = struct{}{}
+			}
+
+			if diff := cmp.Diff(expected, actual); diff != "" {
+				t.Errorf("%s diff: (-want +got)\n%s", tc.name, diff)
+			}
+		})
+	}
+}
@@ -183,7 +183,8 @@ import (
 	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/commercejs"
 	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/commodities"
 	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/companyhub"
-	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/confluent"
+	confluentv1 "github.com/trufflesecurity/trufflehog/v3/pkg/detectors/confluent/v1"
+	confluentv2 "github.com/trufflesecurity/trufflehog/v3/pkg/detectors/confluent/v2"
 	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/contentfulpersonalaccesstoken"
 	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/conversiontools"
 	"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/convertapi"
@@ -1047,7 +1048,8 @@ func buildDetectorList() []detectors.Detector {
 		&commercejs.Scanner{},
 		&commodities.Scanner{},
 		&companyhub.Scanner{},
-		&confluent.Scanner{},
+		&confluentv1.Scanner{},
+		&confluentv2.Scanner{},
 		&contentfulpersonalaccesstoken.Scanner{},
 		&conversiontools.Scanner{},
 		&convertapi.Scanner{},