Skip to content

Validator polling #320

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Draft
wants to merge 1 commit into
base: main
Choose a base branch
from
Draft
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
278 changes: 235 additions & 43 deletions validator/validate_cmd.go
Original file line number Diff line number Diff line change
Expand Up @@ -4,104 +4,296 @@ import (
"encoding/json"
"errors"
"flag"
"fmt"
"os"
"path/filepath"
"strings"
"sync"
"time"

sq "github.com/Masterminds/squirrel"

"github.com/interline-io/log"
"github.com/interline-io/transitland-lib/ext"
"github.com/interline-io/transitland-lib/dmfr/store"
"github.com/interline-io/transitland-lib/internal/cli"
"github.com/interline-io/transitland-lib/internal/snakejson"
"github.com/interline-io/transitland-lib/tlcsv"
"github.com/interline-io/transitland-lib/tldb"
"github.com/jmoiron/sqlx"
)

// Command
type Command struct {
Options Options
rtFiles cli.ArrayFlags
OutputFile string
DBURL string
FVID int
extensions cli.ArrayFlags
SaveValidationReport bool
Options Options
OutputFile string
DBURL string
checkRtUrls cli.ArrayFlags
extensions cli.ArrayFlags

//////
CheckRtUrls []string
FeedId string
Timezone string
ValidationReportStorage string
readerPath string
ValidateRtDir string
ValidateStaticPath string
Storage string
RefreshRate int
ForceFvid int

//////
vt *Validator
db sqlx.Ext
checkFvid sync.Mutex
activeFvid int
}

func (cmd *Command) Parse(args []string) error {
fl := flag.NewFlagSet("validate", flag.ExitOnError)
fl.Usage = func() {
log.Print("Usage: validate <reader>")
log.Print("Usage: validate [reader]")
fl.PrintDefaults()
}
fl.Var(&cmd.extensions, "ext", "Include GTFS Extension")
fl.StringVar(&cmd.OutputFile, "o", "", "Write validation report as JSON to file")
fl.IntVar(&cmd.RefreshRate, "refresh", 0, "GTFS-RT URL refresh rate in seconds")
fl.IntVar(&cmd.ForceFvid, "force-fvid", 0, "Force feed version id")
fl.IntVar(&cmd.Options.ErrorLimit, "error-limit", 1000, "Max number of detailed errors per error group")
fl.BoolVar(&cmd.Options.BestPractices, "best-practices", false, "Include Best Practices validations")
fl.BoolVar(&cmd.Options.IncludeRealtimeJson, "rt-json", false, "Include GTFS-RT proto messages as JSON in validation report")
fl.BoolVar(&cmd.SaveValidationReport, "validation-report", false, "Save static validation report in database")
fl.BoolVar(&cmd.Options.UseHeaderTimestamp, "header-timestamp", false, "Use header time")
fl.StringVar(&cmd.Storage, "storage", "", "Static storage")
fl.StringVar(&cmd.ValidationReportStorage, "validation-report-storage", "", "Storage path for saving validation report JSON")
fl.IntVar(&cmd.FVID, "save-fvid", 0, "Save report to feed version ID")
fl.Var(&cmd.rtFiles, "rt", "Include GTFS-RT proto message in validation report")
fl.IntVar(&cmd.Options.ErrorLimit, "error-limit", 1000, "Max number of detailed errors per error group")
fl.StringVar(&cmd.ValidateRtDir, "validate-rt-dir", "", "Validate messages in directory")
fl.StringVar(&cmd.Timezone, "timezone", "America/Los_Angeles", "Timezone")
fl.StringVar(&cmd.FeedId, "feed", "", "Use active feed version for this feed in database")
fl.Var(&cmd.checkRtUrls, "rt", "Include GTFS-RT proto message file or URL in validation report")
err := fl.Parse(args)
if err != nil || fl.NArg() < 1 {
if err != nil {
fl.Usage()
return errors.New("requires input reader")
return err
}
if fl.NArg() > 1 {
return errors.New("unknown argument")
} else if fl.NArg() == 1 {
cmd.ValidateStaticPath = fl.Arg(0)
}
if cmd.DBURL == "" {
cmd.DBURL = os.Getenv("TL_DATABASE_URL")
}
cmd.readerPath = fl.Arg(0)
cmd.Options.ValidateRealtimeMessages = cmd.rtFiles
cmd.Options.Extensions = cmd.extensions
cmd.CheckRtUrls = append(cmd.CheckRtUrls, cmd.checkRtUrls...)
cmd.Options.Extensions = append(cmd.Options.Extensions, cmd.extensions...)
cmd.Options.EvaluateAt = time.Now().In(time.UTC)
return nil
}

func (cmd *Command) Run() error {
log.Infof("Validating: %s", cmd.readerPath)
reader, err := ext.OpenReader(cmd.readerPath)
// Open database if provided
if cmd.DBURL != "" {
r, err := tldb.NewReader(cmd.DBURL)
if err != nil {
return err
}
if err := r.Open(); err != nil {
return err
}
cmd.db = r.Adapter.DBX()
}

// Reset
cmd.activeFvid = -1

// Check local RTs
var initialRtChecks []string
initialRtChecks = append(initialRtChecks, cmd.CheckRtUrls...)
if cmd.ValidateRtDir != "" {
localRtFiles, err := getFiles(cmd.ValidateRtDir)
if err != nil {
return err
}
initialRtChecks = append(initialRtChecks, localRtFiles...)
}

// Initial check feed
staticResult, err := cmd.checkFeed(initialRtChecks)
if err != nil {
return err
}
// staticResult.DisplayErrors()
// staticResult.DisplayWarnings()
// staticResult.DisplaySummary()

// Save to output file
if err := saveResult(staticResult, cmd.OutputFile, cmd.db, cmd.activeFvid, cmd.ValidationReportStorage); err != nil {
log.Error().Err(err).Msg("Failed to save validation report")
return err
}

// Poll RT urls
if cmd.RefreshRate > 0 {
exit := make(chan string)
ticker := time.NewTicker(time.Duration(cmd.RefreshRate) * time.Second)
go func() {
for ; true; <-ticker.C {
if _, err := cmd.checkFeed(nil); err != nil {
log.Error().Err(err).Msg("Failed to check feed")
continue
}
now, nowLocal := cmd.now()
result, err := cmd.vt.ValidateRTs(cmd.CheckRtUrls, now, nowLocal)
if err != nil {
log.Error().Err(err).Msg("Failed to validate RT messages")
continue
}
if err := saveResult(result, "", cmd.db, cmd.activeFvid, cmd.ValidationReportStorage); err != nil {
log.Error().Err(err).Msg("Failed to save RT validation report")
continue
}
log.Info().Msg("Saved report")
}
}()
<-exit
}
return nil
}

func (cmd *Command) checkFeed(rtUrls []string) (*Result, error) {
cmd.checkFvid.Lock()
defer cmd.checkFvid.Unlock()

// Open static GTFS
var reader *tlcsv.Reader
if cmd.ValidateStaticPath != "" {
if cmd.activeFvid == cmd.ForceFvid {
return nil, nil
}
log.Info().Str("url", cmd.ValidateStaticPath).Msg("Checking static feed")
var err error
reader, err = tlcsv.NewReader(cmd.ValidateStaticPath)
if err != nil {
return nil, err
}
cmd.activeFvid = cmd.ForceFvid
} else if cmd.db != nil && cmd.FeedId != "" {
// Check fv
atx := tldb.NewPostgresAdapterFromDBX(cmd.db)
checkFv := struct {
ID int
SHA1 string
}{}
q := atx.Sqrl().Select("feed_versions.id, feed_versions.sha1").From("feed_versions")
if cmd.ForceFvid > 0 {
q = q.Where(sq.Eq{"id": cmd.ForceFvid})
} else {
q = q.Join("feed_states on feed_states.feed_version_id = feed_versions.id").
Join("current_feeds on current_feeds.id = feed_versions.feed_id").
Where("current_feeds.onestop_id = ?", cmd.FeedId)
}
qstr, qargs, _ := q.ToSql()
if err := atx.Get(&checkFv, qstr, qargs...); err != nil {
return nil, err
}
if cmd.activeFvid == checkFv.ID {
return nil, nil
}
log.Info().Int("fvid", checkFv.ID).Str("sha1", checkFv.SHA1).Msg("Checking static feed")
cmd.activeFvid = checkFv.ID
// Fetch from storage
fvFile := fmt.Sprintf("%s.zip", checkFv.SHA1)
tladapter, err := store.NewStoreAdapter(cmd.Storage, fvFile, "")
if err != nil {
return nil, err
}
reader, err = tlcsv.NewReaderFromAdapter(tladapter)
if err != nil {
return nil, err
}
} else {
return nil, errors.New("no static feed")
}

// Open
if err := reader.Open(); err != nil {
return nil, err
}
defer reader.Close()
v, err := NewValidator(reader, cmd.Options)

// Validate
newOpts := cmd.Options
newOpts.ValidateRealtimeMessages = rtUrls
newVt, err := NewValidator(reader, newOpts)
if err != nil {
return err
return nil, err
}
result, err := v.Validate()
staticResult, err := newVt.Validate()
if err != nil {
return err
return nil, err
}
// result.DisplayErrors()
// result.DisplayWarnings()
// result.DisplaySummary()
cmd.vt = newVt
staticResult.FeedVersionID = cmd.activeFvid
staticResult.CreatedAt = time.Now().In(time.UTC)
staticResult.UpdatedAt = time.Now().In(time.UTC)
return staticResult, nil
}

func (cmd *Command) now() (time.Time, time.Time) {
// Get local time
tz, err := time.LoadLocation(cmd.Timezone)
if err != nil {
panic(err)
}
now := time.Now()
nowLocal := now.In(tz)
return now, nowLocal
}

// Write output
if cmd.OutputFile != "" {
f, err := os.Create(cmd.OutputFile)
func saveResult(result *Result, outpath string, db sqlx.Ext, fvid int, validationReportStorage string) error {
// Save report to disk
if outpath != "" {
f, err := os.Create(outpath)
if err != nil {
return err
}
b, err := json.MarshalIndent(snakejson.SnakeMarshaller{Value: result}, "", " ")
if err != nil {
return err
}
f.Write(b)
f.Close()
}

// Save to database
if cmd.SaveValidationReport {
log.Infof("Saving validation report to feed version: %d", cmd.FVID)
writer, err := tldb.OpenWriter(cmd.DBURL, true)
if err != nil {
if _, err := f.Write(b); err != nil {
return err
}
atx := writer.Adapter
defer atx.Close()
if err := SaveValidationReport(atx, result, cmd.FVID, cmd.ValidationReportStorage); err != nil {
if err := f.Close(); err != nil {
return err
}
}

// Save report to database
if db != nil && fvid > 0 {
atx := tldb.NewPostgresAdapterFromDBX(db)
if err := SaveValidationReport(
atx,
result,
fvid,
validationReportStorage,
); err != nil {
return err
}
}
return nil
}

func getFiles(path string) ([]string, error) {
files := []string{}
if err := filepath.Walk(path,
func(path string, info os.FileInfo, err error) error {
if err != nil {
return err
}
if strings.HasSuffix(info.Name(), ".pb") {
files = append(files, path)
}
return nil
}); err != nil {
return nil, err
}
return files, nil
}
Loading