Skip to content

Commit

Permalink
Added Twitter v2 Detector (#3016)
Browse files Browse the repository at this point in the history
* Implemented a newer version of the Twitter detector and included a test.
Moved the old Twitter detector to v1.

* added version information in twitter test
  • Loading branch information
abmussani authored Jul 18, 2024
1 parent 68ec7a2 commit c20ca0d
Show file tree
Hide file tree
Showing 5 changed files with 263 additions and 24 deletions.
101 changes: 101 additions & 0 deletions pkg/detectors/twitter/v1/twitter_v1.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,101 @@
package twitter

import (
"context"
"fmt"
"net/http"
"strings"

regexp "github.com/wasilibs/go-re2"

"github.com/trufflesecurity/trufflehog/v3/pkg/common"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors"
"github.com/trufflesecurity/trufflehog/v3/pkg/pb/detectorspb"
)

// Scanner is the version 1 Twitter detector: it finds Twitter tokens in raw data
// and can optionally verify them against the Twitter API.
type Scanner struct {
detectors.DefaultMultiPartCredentialProvider

// client is the HTTP client used for verification; when it is nil, FromData
// falls back to the package-level defaultClient.
client *http.Client
}

// Compile-time assertions that *Scanner implements the Detector and Versioner interfaces.
var _ detectors.Detector = (*Scanner)(nil)
var _ detectors.Versioner = (*Scanner)(nil)

var (
// defaultClient is the HTTP client used for verification when Scanner.client is nil.
defaultClient = common.SaneHttpClient()

// keyPat is the prefix expression produced by detectors.PrefixRegex for the keyword
// "twitter", followed by a word-bounded capture group holding the token. The token
// is six '%'-separated segments: 22 uppercase letters, then segments of 23, 6, 3, 9
// and 52 characters.
// NOTE(review): in `[a-zA-Z-0-9]` the `-` after `Z` looks like a literal hyphen, so
// those segments would also accept '-'; confirm that this is intended.
keyPat = regexp.MustCompile(detectors.PrefixRegex([]string{"twitter"}) + `\b([A-Z]{22}%[a-zA-Z-0-9]{23}%[a-zA-Z-0-9]{6}%[a-zA-Z-0-9]{3}%[a-zA-Z-0-9]{9}%[a-zA-Z-0-9]{52})\b`)
)

// Version reports the version number of this detector, which is 1.
//
// It uses a value receiver, like every other Scanner method, so that the method
// belongs to the method set of both Scanner and *Scanner. With a pointer receiver
// a Scanner value stored in an interface would not satisfy detectors.Versioner.
func (s Scanner) Version() int { return 1 }

// Keywords returns the strings used to pre-filter chunks efficiently.
// For this detector the only keyword is the provider name.
func (s Scanner) Keywords() []string {
	keywords := []string{"twitter"}
	return keywords
}

// FromData will find and optionally verify Twitter secrets in a given set of bytes.
//
// Every distinct token captured by keyPat yields one Result whose Raw field holds
// the token and whose ExtraData records the detector version. Results are returned
// in the order in which the tokens first appear in data, so the output is
// deterministic. When verify is true each token is checked with VerifyTwitterToken,
// using s.client or, if that is nil, defaultClient; the verification outcome and
// any verification error are stored on the Result. The returned error is always nil.
func (s Scanner) FromData(ctx context.Context, verify bool, data []byte) (results []detectors.Result, err error) {
	dataStr := string(data)

	// De-duplicate the captured tokens while remembering first-seen order; ranging
	// over a map directly would emit the results in an unspecified order.
	seen := make(map[string]struct{})
	var tokens []string
	for _, match := range keyPat.FindAllStringSubmatch(dataStr, -1) {
		token := strings.TrimSpace(match[1])
		if _, dup := seen[token]; dup {
			continue
		}
		seen[token] = struct{}{}
		tokens = append(tokens, token)
	}

	for _, token := range tokens {
		s1 := detectors.Result{
			DetectorType: detectorspb.DetectorType_Twitter,
			Raw:          []byte(token),
			ExtraData: map[string]string{
				"version": fmt.Sprintf("%d", s.Version()),
			},
		}

		if verify {
			client := s.client
			if client == nil {
				client = defaultClient
			}
			// A distinct name avoids shadowing the named result err.
			isVerified, verifyErr := s.VerifyTwitterToken(ctx, client, token)
			s1.Verified = isVerified
			s1.SetVerificationError(verifyErr)
		}

		results = append(results, s1)
	}

	return results, nil
}

// Type returns the detector type of this scanner, DetectorType_Twitter.
func (s Scanner) Type() detectorspb.DetectorType {
	detectorType := detectorspb.DetectorType_Twitter
	return detectorType
}

// VerifyTwitterToken sends a GET request for a fixed tweet to the Twitter v2 API,
// presenting token as a Bearer credential, and interprets the response status.
//
// It returns (true, nil) on 200 OK, (false, nil) on 401 Unauthorized, and
// (false, err) when the request cannot be built or sent, or when any other
// status code comes back.
func (s Scanner) VerifyTwitterToken(ctx context.Context, client *http.Client, token string) (bool, error) {
	const endpoint = "https://api.twitter.com/2/tweets/20"

	request, err := http.NewRequestWithContext(ctx, http.MethodGet, endpoint, nil)
	if err != nil {
		return false, err
	}
	request.Header.Add("Authorization", "Bearer "+token)

	response, err := client.Do(request)
	if err != nil {
		return false, err
	}
	defer response.Body.Close()

	status := response.StatusCode
	if status == http.StatusOK {
		return true, nil
	}
	if status == http.StatusUnauthorized {
		return false, nil
	}
	return false, fmt.Errorf("unexpected status code %d", status)
}
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,9 @@ func TestTwitter_FromChunk(t *testing.T) {
{
DetectorType: detectorspb.DetectorType_Twitter,
Verified: true,
ExtraData: map[string]string{
"version": "1",
},
},
},
wantErr: false,
Expand All @@ -66,6 +69,9 @@ func TestTwitter_FromChunk(t *testing.T) {
{
DetectorType: detectorspb.DetectorType_Twitter,
Verified: false,
ExtraData: map[string]string{
"version": "1",
},
},
},
wantErr: false,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,23 +10,29 @@ import (

"github.com/trufflesecurity/trufflehog/v3/pkg/common"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors"
v1 "github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twitter/v1"
"github.com/trufflesecurity/trufflehog/v3/pkg/pb/detectorspb"
)

type Scanner struct {
detectors.DefaultMultiPartCredentialProvider
v1.Scanner

client *http.Client
}

// Ensure the Scanner satisfies the interface at compile time.
var _ detectors.Detector = (*Scanner)(nil)
var _ detectors.Detector = (*v1.Scanner)(nil)
var _ detectors.Versioner = (*v1.Scanner)(nil)

var (
client = common.SaneHttpClient()
defaultClient = common.SaneHttpClient()

// Make sure that your group is surrounded in boundary characters such as below to reduce false positives.
keyPat = regexp.MustCompile(detectors.PrefixRegex([]string{"twitter"}) + `\b([A-Z]{22}%[a-zA-Z-0-9]{23}%[a-zA-Z-0-9]{6}%[a-zA-Z-0-9]{3}%[a-zA-Z-0-9]{9}%[a-zA-Z-0-9]{52})\b`)
keyPat = regexp.MustCompile(detectors.PrefixRegex([]string{"twitter"}) + `\b([a-zA-Z0-9]{20,59}%([a-zA-Z0-9]{3,}%){0,2}[a-zA-Z0-9]{52})\b`)
)

func (s *Scanner) Version() int { return 2 }

// Keywords are used for efficiently pre-filtering chunks.
// Use identifiers in the secret preferably, or the provider name.
func (s Scanner) Keywords() []string {
Expand All @@ -37,32 +43,30 @@ func (s Scanner) Keywords() []string {
func (s Scanner) FromData(ctx context.Context, verify bool, data []byte) (results []detectors.Result, err error) {
dataStr := string(data)

matches := keyPat.FindAllStringSubmatch(dataStr, -1)
keyMatches := make(map[string]struct{})
for _, match := range keyPat.FindAllStringSubmatch(dataStr, -1) {
keyMatches[match[1]] = struct{}{}
}

for _, match := range matches {
if len(match) != 2 {
continue
}
resMatch := strings.TrimSpace(match[1])
for match := range keyMatches {
match = strings.TrimSpace(match)

s1 := detectors.Result{
DetectorType: detectorspb.DetectorType_Twitter,
Raw: []byte(resMatch),
Raw: []byte(match),
ExtraData: map[string]string{
"version": fmt.Sprintf("%d", s.Version()),
},
}

if verify {
req, err := http.NewRequestWithContext(ctx, "GET", "https://api.twitter.com/2/tweets/20", nil)
if err != nil {
continue
}
req.Header.Add("Authorization", fmt.Sprintf("Bearer %s", resMatch))
res, err := client.Do(req)
if err == nil {
defer res.Body.Close()
if res.StatusCode >= 200 && res.StatusCode < 300 {
s1.Verified = true
}
client := s.client
if client == nil {
client = defaultClient
}
isVerified, err := s.VerifyTwitterToken(ctx, client, match)
s1.Verified = isVerified
s1.SetVerificationError(err)
}

results = append(results, s1)
Expand Down
126 changes: 126 additions & 0 deletions pkg/detectors/twitter/v2/twitter_v2_test.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,126 @@
//go:build detectors
// +build detectors

package twitter

import (
"context"
"fmt"
"testing"
"time"

"github.com/kylelemons/godebug/pretty"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors"

"github.com/trufflesecurity/trufflehog/v3/pkg/common"
"github.com/trufflesecurity/trufflehog/v3/pkg/pb/detectorspb"
)

// TestTwitter_FromChunk runs the scanner against data containing an active
// secret, an inactive secret and no secret at all, with verification enabled,
// and compares the results (with Raw cleared) against the expected values.
//
// The secrets are fetched with common.GetSecret, so the test fails immediately
// when they cannot be retrieved.
func TestTwitter_FromChunk(t *testing.T) {
	// The timeout bounds only the secret lookup; each case carries its own context.
	ctx, cancel := context.WithTimeout(context.Background(), time.Second*5)
	defer cancel()
	testSecrets, err := common.GetSecret(ctx, "trufflehog-testing", "detectors5")
	if err != nil {
		t.Fatalf("could not get test secrets from GCP: %s", err)
	}
	secret := testSecrets.MustGetField("TWITTER_V2_ACTIVE")
	inactiveSecret := testSecrets.MustGetField("TWITTER_V2_INACTIVE")

	type args struct {
		ctx    context.Context
		data   []byte
		verify bool
	}
	tests := []struct {
		name    string
		s       Scanner
		args    args
		want    []detectors.Result
		wantErr bool
	}{
		{
			name: "found, verified",
			s:    Scanner{},
			args: args{
				ctx:    context.Background(),
				data:   []byte(fmt.Sprintf("You can find a twitter secret %s within", secret)),
				verify: true,
			},
			want: []detectors.Result{
				{
					DetectorType: detectorspb.DetectorType_Twitter,
					Verified:     true,
					ExtraData: map[string]string{
						"version": "2",
					},
				},
			},
			wantErr: false,
		},
		{
			name: "found, unverified",
			s:    Scanner{},
			args: args{
				ctx:    context.Background(),
				data:   []byte(fmt.Sprintf("You can find a twitter secret %s within but not valid", inactiveSecret)), // the secret would satisfy the regex but not pass validation
				verify: true,
			},
			want: []detectors.Result{
				{
					DetectorType: detectorspb.DetectorType_Twitter,
					Verified:     false,
					ExtraData: map[string]string{
						"version": "2",
					},
				},
			},
			wantErr: false,
		},
		{
			name: "not found",
			s:    Scanner{},
			args: args{
				ctx:    context.Background(),
				data:   []byte("You cannot find the secret within"),
				verify: true,
			},
			want:    nil,
			wantErr: false,
		},
	}
	for _, tt := range tests {
		t.Run(tt.name, func(t *testing.T) {
			// Use the scanner configured for this case rather than a fresh one,
			// so the table's s field is actually honoured.
			got, err := tt.s.FromData(tt.args.ctx, tt.args.verify, tt.args.data)
			if (err != nil) != tt.wantErr {
				t.Errorf("Twitter.FromData() error = %v, wantErr %v", err, tt.wantErr)
				return
			}
			for i := range got {
				if len(got[i].Raw) == 0 {
					t.Fatalf("no raw secret present: \n %+v", got[i])
				}
				// Raw holds the secret itself, which the expectations cannot
				// spell out, so it is cleared before comparing.
				got[i].Raw = nil
			}
			if diff := pretty.Compare(got, tt.want); diff != "" {
				t.Errorf("Twitter.FromData() %s diff: (-got +want)\n%s", tt.name, diff)
			}
		})
	}
}

// BenchmarkFromData measures FromData with verification disabled, running one
// sub-benchmark per named payload returned by detectors.MustGetBenchmarkData.
func BenchmarkFromData(benchmark *testing.B) {
	scanner := Scanner{}
	background := context.Background()
	for label, payload := range detectors.MustGetBenchmarkData() {
		benchmark.Run(label, func(b *testing.B) {
			b.ResetTimer()
			for i := 0; i < b.N; i++ {
				if _, err := scanner.FromData(background, false, payload); err != nil {
					b.Fatal(err)
				}
			}
		})
	}
}
6 changes: 4 additions & 2 deletions pkg/engine/defaults.go
Original file line number Diff line number Diff line change
Expand Up @@ -724,7 +724,8 @@ import (
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twilio"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twist"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twitch"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twitter"
twitterv1 "github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twitter/v1"
twitterv2 "github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twitter/v2"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/twitterconsumerkey"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/tyntec"
"github.com/trufflesecurity/trufflehog/v3/pkg/detectors/typeform"
Expand Down Expand Up @@ -1424,7 +1425,8 @@ func DefaultDetectors() []detectors.Detector {
magicbell.Scanner{},
apitemplate.Scanner{},
knapsackpro.Scanner{},
twitter.Scanner{},
twitterv1.Scanner{},
twitterv2.Scanner{},
timecamp.Scanner{},
signable.Scanner{},
teletype.Scanner{},
Expand Down

0 comments on commit c20ca0d

Please sign in to comment.