212 lines
4.6 KiB
Go
Raw Normal View History

2015-05-21 08:52:19 +02:00
package main
import (
"database/sql"
"log"
"os"
"time"
2015-07-15 13:23:13 +02:00
_ "github.com/lib/pq"
2015-05-21 08:52:19 +02:00
)
// dbConn is the data source name handed to sql.Open in main. It is taken from
// the UR_DB_URL environment variable; when that variable is unset or empty the
// local development URL below is used instead.
var dbConn = getEnvDefault("UR_DB_URL", "postgres://user:password@localhost/ur?sslmode=disable")
// getEnvDefault returns the value of the environment variable named key, or
// def when that variable is unset or set to the empty string.
func getEnvDefault(key, def string) string {
	val := os.Getenv(key)
	if val == "" {
		return def
	}
	return val
}
// main sends log output to stdout, opens the database named by dbConn, makes
// sure the aggregation schema exists and then aggregates forever: once
// immediately and then again after every sleep. Any database setup failure
// terminates the process.
func main() {
	log.SetOutput(os.Stdout)
	log.SetFlags(log.Ldate | log.Ltime)

	db, err := sql.Open("postgres", dbConn)
	if err != nil {
		log.Fatalln("database:", err)
	}
	if err := setupDB(db); err != nil {
		log.Fatalln("database:", err)
	}

	for {
		runAggregation(db)

		// Wake up again one minute past the next midnight.
		sleepUntilNext(24*time.Hour, time.Minute)
	}
}
func runAggregation(db *sql.DB) {
2015-07-15 13:23:13 +02:00
since := maxIndexedDay(db, "VersionSummary")
log.Println("Aggregating VersionSummary data since", since)
rows, err := aggregateVersionSummary(db, since)
if err != nil {
log.Fatalln("aggregate:", err)
}
log.Println("Inserted", rows, "rows")
log.Println("Aggregating UserMovement data")
rows, err = aggregateUserMovement(db)
2015-05-21 08:52:19 +02:00
if err != nil {
log.Fatalln("aggregate:", err)
}
log.Println("Inserted", rows, "rows")
}
// sleepUntilNext blocks until margin past the next multiple of intv, measured
// from the current UTC time, and logs the wake-up time before sleeping.
func sleepUntilNext(intv, margin time.Duration) {
	now := time.Now().UTC()

	// Round down to the start of the current interval, step to the start of
	// the following one and then add the safety margin.
	boundary := now.Truncate(intv).Add(intv)
	wake := boundary.Add(margin)

	log.Println("Sleeping until", wake)
	time.Sleep(wake.Sub(now))
}
// setupDB creates the VersionSummary and UserMovement tables and their
// indexes when they are missing. It returns the first error encountered, or
// nil once both tables and all three indexes are in place.
func setupDB(db *sql.DB) error {
	_, err := db.Exec(`CREATE TABLE IF NOT EXISTS VersionSummary (
Day TIMESTAMP NOT NULL,
Version VARCHAR(8) NOT NULL,
Count INTEGER NOT NULL
)`)
	if err != nil {
		return err
	}

	_, err = db.Exec(`CREATE TABLE IF NOT EXISTS UserMovement (
Day TIMESTAMP NOT NULL,
Added INTEGER NOT NULL,
Bounced INTEGER NOT NULL,
Removed INTEGER NOT NULL
)`)
	if err != nil {
		return err
	}

	// Each index is probed by casting its name to regclass; when that query
	// fails the index is taken to be missing and is created.
	indexes := []struct {
		probe  string
		create string
	}{
		{
			probe:  `SELECT 'UniqueDayVersionIndex'::regclass`,
			create: `CREATE UNIQUE INDEX UniqueDayVersionIndex ON VersionSummary (Day, Version)`,
		},
		{
			probe:  `SELECT 'DayIndex'::regclass`,
			create: `CREATE INDEX DayIndex ON VersionSummary (Day)`,
		},
		{
			probe:  `SELECT 'MovementDayIndex'::regclass`,
			create: `CREATE INDEX MovementDayIndex ON UserMovement (Day)`,
		},
	}
	for _, idx := range indexes {
		// Scan needs a real destination: with a nil one it always reports an
		// error, which would make every existing index look missing.
		var found string
		if err := db.QueryRow(idx.probe).Scan(&found); err == nil {
			continue // already present
		}
		if _, err := db.Exec(idx.create); err != nil {
			return err
		}
	}
	return nil
}
2015-07-15 13:23:13 +02:00
// maxIndexedDay returns the largest Day value stored in table. It returns the
// zero time when the query or the scan fails for any reason.
//
// The table name is concatenated into the query text, so it must be a trusted
// identifier.
func maxIndexedDay(db *sql.DB, table string) time.Time {
	query := "SELECT MAX(Day) FROM " + table

	var latest time.Time
	if err := db.QueryRow(query).Scan(&latest); err != nil {
		return time.Time{}
	}
	return latest
}
2015-07-15 13:23:13 +02:00
// aggregateVersionSummary inserts per-day, per-version report counts into
// VersionSummary for every day strictly after since and strictly before the
// current day, considering only reports whose version starts with "v0.". It
// returns the number of rows the insert affected.
func aggregateVersionSummary(db *sql.DB, since time.Time) (int64, error) {
	const insertSummary = `INSERT INTO VersionSummary (
SELECT
DATE_TRUNC('day', Received) AS Day,
SUBSTRING(Version FROM '^v\d.\d+') AS Ver,
COUNT(*) AS Count
FROM Reports
WHERE
DATE_TRUNC('day', Received) > $1
AND DATE_TRUNC('day', Received) < DATE_TRUNC('day', NOW())
AND Version like 'v0.%'
GROUP BY Day, Ver
);
`

	result, err := db.Exec(insertSummary, since)
	if err != nil {
		return 0, err
	}
	return result.RowsAffected()
}
2015-07-15 13:23:13 +02:00
// aggregateUserMovement rebuilds the UserMovement table from scratch. It reads
// the day and UniqueID of every "v0." report received before the current day,
// works out on which day each ID was first and last seen, and then, inside a
// single transaction, replaces the table contents with one row per day.
//
// It returns the number of day rows written. Nothing is deleted or written
// when reading the reports fails part way through.
func aggregateUserMovement(db *sql.DB) (int64, error) {
	rows, err := db.Query(`SELECT
DATE_TRUNC('day', Received) AS Day,
UniqueID
FROM Reports
WHERE
DATE_TRUNC('day', Received) < DATE_TRUNC('day', NOW())
AND Version like 'v0.%'
ORDER BY Day
`)
	if err != nil {
		return 0, err
	}
	defer rows.Close()

	firstSeen := make(map[string]time.Time)
	lastSeen := make(map[string]time.Time)
	var minTs time.Time
	for rows.Next() {
		var ts time.Time
		var id string
		if err := rows.Scan(&ts, &id); err != nil {
			return 0, err
		}

		// Rows arrive ordered by day, so the first one carries the earliest
		// day and each later sighting of an ID supersedes the previous one.
		if minTs.IsZero() {
			minTs = ts
		}
		if _, ok := firstSeen[id]; !ok {
			firstSeen[id] = ts
		}
		lastSeen[id] = ts
	}
	// A read error ends the loop just like the end of the data does; without
	// this check the table would be rebuilt from a truncated result set.
	if err := rows.Err(); err != nil {
		return 0, err
	}

	sumRows := summarizeUserMovement(firstSeen, lastSeen, minTs, time.Now())

	tx, err := db.Begin()
	if err != nil {
		return 0, err
	}

	if _, err := tx.Exec("DELETE FROM UserMovement"); err != nil {
		_ = tx.Rollback() // best effort; the Exec error is the one to report
		return 0, err
	}

	for _, r := range sumRows {
		if _, err := tx.Exec("INSERT INTO UserMovement (Day, Added, Removed, Bounced) VALUES ($1, $2, $3, $4)", r.day, r.added, r.removed, r.bounced); err != nil {
			_ = tx.Rollback() // best effort; the Exec error is the one to report
			return 0, err
		}
	}

	return int64(len(sumRows)), tx.Commit()
}

// userMovementRow is one day's worth of UserMovement counters.
type userMovementRow struct {
	day     time.Time
	added   int
	removed int
	bounced int
}

// userMovementTally counts, for a single day, how many IDs were first seen on
// it, last seen on it, and both first and last seen on it.
type userMovementTally struct {
	first, last, both int
}

// summarizeUserMovement turns the per-ID first/last sightings into one row for
// every day from minTs up to, but not including, the day containing now. It
// returns nil when minTs is zero, that is, when no reports were read.
//
// An ID only counts as removed or bounced on days more than 14 days before
// now; on more recent days every ID first seen that day counts as added.
func summarizeUserMovement(firstSeen, lastSeen map[string]time.Time, minTs, now time.Time) []userMovementRow {
	if minTs.IsZero() {
		return nil
	}

	// Tally per day in one pass over the IDs rather than rescanning every ID
	// for every day. Keying by instant gives the same matching as Time.Equal.
	tallies := make(map[int64]*userMovementTally)
	tallyFor := func(t time.Time) *userMovementTally {
		key := t.UnixNano()
		tally := tallies[key]
		if tally == nil {
			tally = &userMovementTally{}
			tallies[key] = tally
		}
		return tally
	}
	for id, first := range firstSeen {
		last := lastSeen[id]
		tallyFor(first).first++
		tallyFor(last).last++
		if first.Equal(last) {
			tallyFor(first).both++
		}
	}

	today := now.Truncate(24 * time.Hour)
	cutoff := now.AddDate(0, 0, -14)

	var sumRows []userMovementRow
	for t := minTs; t.Before(today); t = t.AddDate(0, 0, 1) {
		r := userMovementRow{day: t}
		if tally := tallies[t.UnixNano()]; tally != nil {
			r.added = tally.first
			if t.Before(cutoff) {
				// IDs seen on this day only are bounces, not an add plus a
				// remove.
				r.bounced = tally.both
				r.added = tally.first - tally.both
				r.removed = tally.last - tally.both
			}
		}
		sumRows = append(sumRows, r)
	}
	return sumRows
}