From 42e4ff42049a1e4ff1edb5f3434a75f8862e8207 Mon Sep 17 00:00:00 2001 From: daynewlee Date: Sun, 8 Dec 2024 15:11:08 -0600 Subject: [PATCH] epss: add UUID for customized URL Signed-off-by: daynewlee --- enricher/epss/epss.go | 47 ++++++++++++++++++++------------------ enricher/epss/epss_test.go | 16 ++++++------- 2 files changed, 33 insertions(+), 30 deletions(-) diff --git a/enricher/epss/epss.go b/enricher/epss/epss.go index 87fd37a60..9bbb9d02c 100644 --- a/enricher/epss/epss.go +++ b/enricher/epss/epss.go @@ -1,3 +1,4 @@ +// Package epss provides a epss enricher. package epss import ( @@ -16,6 +17,7 @@ import ( "strings" "time" + "github.com/google/uuid" "github.com/quay/zlog" "github.com/quay/claircore" @@ -64,7 +66,7 @@ type Enricher struct { // Config is the configuration for Enricher. type Config struct { - BaseURL *string `json:"url" yaml:"url"` + URL *string `json:"url" yaml:"url"` } func (e *Enricher) Configure(ctx context.Context, f driver.ConfigUnmarshaler, c *http.Client) error { @@ -79,18 +81,18 @@ func (e *Enricher) Configure(ctx context.Context, f driver.ConfigUnmarshaler, c if err := f(&cfg); err != nil { return err } - if cfg.BaseURL != nil { + if cfg.URL != nil { // validate the URL format - if _, err := url.Parse(*cfg.BaseURL); err != nil { - return fmt.Errorf("invalid URL format for BaseURL: %w", err) + if _, err := url.Parse(*cfg.URL); err != nil { + return fmt.Errorf("invalid URL format for URL: %w", err) } // only .gz file is supported - if strings.HasSuffix(*cfg.BaseURL, ".gz") { + if strings.HasSuffix(*cfg.URL, ".gz") { //overwrite feedPath is cfg provides another baseURL path - e.feedPath = *cfg.BaseURL + e.feedPath = *cfg.URL } else { - return fmt.Errorf("invalid baseURL root: expected a '.gz' file, but got '%q'", *cfg.BaseURL) + return fmt.Errorf("invalid baseURL root: expected a '.gz' file, but got '%q'", *cfg.URL) } } @@ -128,14 +130,19 @@ func (e *Enricher) FetchEnrichment(ctx context.Context, prevFingerprint driver.F if err = httputil.CheckResponse(resp, http.StatusOK); err != nil { return nil, "", fmt.Errorf("unable to fetch file: %w", err) } - - etag := resp.Header.Get("etag") - if etag == "" { - return nil, "", fmt.Errorf("ETag not found in response headers") + var str string + var newFingerprint driver.Fingerprint + str = resp.Header.Get("etag") + if str == "" { + newUUID, err := uuid.NewRandom() + if err != nil { + return nil, "", fmt.Errorf("failed to generate UUID: %w", err) + } + // Generate a UUID for customized URL + str = newUUID.String() + zlog.Warn(ctx).Msg("ETag not found; generated UUID for fingerprint") } - - newFingerprint := driver.Fingerprint(etag) - + newFingerprint = driver.Fingerprint(str) if prevFingerprint == newFingerprint { zlog.Info(ctx).Str("fingerprint", string(newFingerprint)).Msg("file unchanged; skipping processing") return nil, prevFingerprint, nil @@ -158,7 +165,6 @@ func (e *Enricher) FetchEnrichment(ctx context.Context, prevFingerprint driver.F var modelVersion, date string for _, field := range record { - field = strings.TrimSpace(field) field = strings.TrimPrefix(strings.TrimSpace(field), "#") key, value, found := strings.Cut(field, ":") if !found { @@ -176,11 +182,8 @@ func (e *Enricher) FetchEnrichment(ctx context.Context, prevFingerprint driver.F return nil, "", fmt.Errorf("missing metadata fields in record: %v", record) } csvReader.Comment = '#' - csvReader.FieldsPerRecord = 3 // Expect exactly 3 fields per record - if modelVersion == "" || date == "" { - return nil, "", fmt.Errorf("missing metadata fields in record: %v", record) - } + csvReader.FieldsPerRecord = 3 // Expect exactly 3 fields per record // Read and validate header line record, err = csvReader.Read() @@ -262,8 +265,8 @@ func (*Enricher) Name() string { } func currentFeedURL() string { - currentDate := time.Now() - formattedDate := currentDate.Format("2006-01-02") + yesterday := time.Now().AddDate(0, 0, -1) // Get yesterday's date + formattedDate := yesterday.Format("2006-01-02") filePath := fmt.Sprintf("epss_scores-%s.csv.gz", formattedDate) feedURL, err := url.Parse(DefaultBaseURL) @@ -354,7 +357,7 @@ func (e *Enricher) Enrich(ctx context.Context, g driver.EnrichmentGetter, r *cla } func newItemFeed(record []string, modelVersion string, scoreDate string) (driver.EnrichmentRecord, error) { - // Assuming record has already been validated to have 3 fields + // Validate the record has the expected length if len(record) != 3 { return driver.EnrichmentRecord{}, fmt.Errorf("unexpected record length: %d", len(record)) } diff --git a/enricher/epss/epss_test.go b/enricher/epss/epss_test.go index 042a6711c..32eeefcbf 100644 --- a/enricher/epss/epss_test.go +++ b/enricher/epss/epss_test.go @@ -38,7 +38,7 @@ func TestConfigure(t *testing.T) { Config: func(i interface{}) error { cfg := i.(*Config) s := "http://example.com/" - cfg.BaseURL = &s + cfg.URL = &s return nil }, Check: func(t *testing.T, err error) { @@ -58,11 +58,11 @@ func TestConfigure(t *testing.T) { }, }, { - Name: "BadURL", // Malformed URL in BaseURL + Name: "BadURL", // Malformed URL in URL Config: func(i interface{}) error { cfg := i.(*Config) s := "http://[notaurl:/" - cfg.BaseURL = &s + cfg.URL = &s return nil }, Check: func(t *testing.T, err error) { @@ -72,11 +72,11 @@ func TestConfigure(t *testing.T) { }, }, { - Name: "ValidGZURL", // Proper .gz URL in BaseURL + Name: "ValidGZURL", // Proper .gz URL in URL Config: func(i interface{}) error { cfg := i.(*Config) s := "http://example.com/epss_scores-2024-10-25.csv.gz" - cfg.BaseURL = &s + cfg.URL = &s return nil }, Check: func(t *testing.T, err error) { @@ -207,7 +207,7 @@ func (tc fetchTestcase) Run(ctx context.Context, srv *httptest.Server) func(*tes t.Fatal("expected Config type for i, but got a different type") } u := srv.URL + "/data.csv.gz" - cfg.BaseURL = &u + cfg.URL = &u return nil } @@ -259,7 +259,7 @@ func (tc parseTestcase) Run(ctx context.Context, srv *httptest.Server) func(*tes t.Fatal("assertion failed") } u := srv.URL + "/data.csv.gz" - cfg.BaseURL = &u + cfg.URL = &u return nil } if err := e.Configure(ctx, f, srv.Client()); err != nil { @@ -313,7 +313,7 @@ func TestEnrich(t *testing.T) { t.Fatal("assertion failed") } u := srv.URL + "/data.csv.gz" - cfg.BaseURL = &u + cfg.URL = &u return nil } if err := e.Configure(ctx, f, srv.Client()); err != nil {