forked from tangled.org/core
Monorepo for Tangled — https://tangled.org
1package state 2 3import ( 4 "context" 5 "encoding/json" 6 "errors" 7 "fmt" 8 "slices" 9 "time" 10 11 "tangled.org/core/api/tangled" 12 "tangled.org/core/appview/cache" 13 "tangled.org/core/appview/config" 14 "tangled.org/core/appview/db" 15 "tangled.org/core/appview/models" 16 ec "tangled.org/core/eventconsumer" 17 "tangled.org/core/eventconsumer/cursor" 18 "tangled.org/core/log" 19 "tangled.org/core/rbac" 20 "tangled.org/core/workflow" 21 22 "github.com/bluesky-social/indigo/atproto/syntax" 23 "github.com/go-git/go-git/v5/plumbing" 24 "github.com/posthog/posthog-go" 25) 26 27func Knotstream(ctx context.Context, c *config.Config, d *db.DB, enforcer *rbac.Enforcer, posthog posthog.Client) (*ec.Consumer, error) { 28 knots, err := db.GetRegistrations( 29 d, 30 db.FilterIsNot("registered", "null"), 31 ) 32 if err != nil { 33 return nil, err 34 } 35 36 srcs := make(map[ec.Source]struct{}) 37 for _, k := range knots { 38 s := ec.NewKnotSource(k.Domain) 39 srcs[s] = struct{}{} 40 } 41 42 logger := log.New("knotstream") 43 cache := cache.New(c.Redis.Addr) 44 cursorStore := cursor.NewRedisCursorStore(cache) 45 46 cfg := ec.ConsumerConfig{ 47 Sources: srcs, 48 ProcessFunc: knotIngester(d, enforcer, posthog, c.Core.Dev), 49 RetryInterval: c.Knotstream.RetryInterval, 50 MaxRetryInterval: c.Knotstream.MaxRetryInterval, 51 ConnectionTimeout: c.Knotstream.ConnectionTimeout, 52 WorkerCount: c.Knotstream.WorkerCount, 53 QueueSize: c.Knotstream.QueueSize, 54 Logger: logger, 55 Dev: c.Core.Dev, 56 CursorStore: &cursorStore, 57 } 58 59 return ec.NewConsumer(cfg), nil 60} 61 62func knotIngester(d *db.DB, enforcer *rbac.Enforcer, posthog posthog.Client, dev bool) ec.ProcessFunc { 63 return func(ctx context.Context, source ec.Source, msg ec.Message) error { 64 switch msg.Nsid { 65 case tangled.GitRefUpdateNSID: 66 return ingestRefUpdate(d, enforcer, posthog, dev, source, msg) 67 case tangled.PipelineNSID: 68 return ingestPipeline(d, source, msg) 69 } 70 71 return nil 72 } 73} 74 75func ingestRefUpdate(d *db.DB, enforcer *rbac.Enforcer, pc posthog.Client, dev bool, source ec.Source, msg ec.Message) error { 76 var record tangled.GitRefUpdate 77 err := json.Unmarshal(msg.EventJson, &record) 78 if err != nil { 79 return err 80 } 81 82 knownKnots, err := enforcer.GetKnotsForUser(record.CommitterDid) 83 if err != nil { 84 return err 85 } 86 if !slices.Contains(knownKnots, source.Key()) { 87 return fmt.Errorf("%s does not belong to %s, something is fishy", record.CommitterDid, source.Key()) 88 } 89 90 err1 := populatePunchcard(d, record) 91 err2 := updateRepoLanguages(d, record) 92 93 var err3 error 94 if !dev { 95 err3 = pc.Enqueue(posthog.Capture{ 96 DistinctId: record.CommitterDid, 97 Event: "git_ref_update", 98 }) 99 } 100 101 return errors.Join(err1, err2, err3) 102} 103 104func populatePunchcard(d *db.DB, record tangled.GitRefUpdate) error { 105 knownEmails, err := db.GetAllEmails(d, record.CommitterDid) 106 if err != nil { 107 return err 108 } 109 110 count := 0 111 for _, ke := range knownEmails { 112 if record.Meta == nil { 113 continue 114 } 115 if record.Meta.CommitCount == nil { 116 continue 117 } 118 for _, ce := range record.Meta.CommitCount.ByEmail { 119 if ce == nil { 120 continue 121 } 122 if ce.Email == ke.Address { 123 count += int(ce.Count) 124 } 125 } 126 } 127 128 punch := models.Punch{ 129 Did: record.CommitterDid, 130 Date: time.Now(), 131 Count: count, 132 } 133 return db.AddPunch(d, punch) 134} 135 136func updateRepoLanguages(d *db.DB, record tangled.GitRefUpdate) error { 137 if record.Meta == nil || record.Meta.LangBreakdown == nil || record.Meta.LangBreakdown.Inputs == nil { 138 return fmt.Errorf("empty language data for repo: %s/%s", record.RepoDid, record.RepoName) 139 } 140 141 repos, err := db.GetRepos( 142 d, 143 0, 144 db.FilterEq("did", record.RepoDid), 145 db.FilterEq("name", record.RepoName), 146 ) 147 if err != nil { 148 return fmt.Errorf("failed to look for repo in DB (%s/%s): %w", record.RepoDid, record.RepoName, err) 149 } 150 if len(repos) != 1 { 151 return fmt.Errorf("incorrect number of repos returned: %d (expected 1)", len(repos)) 152 } 153 repo := repos[0] 154 155 ref := plumbing.ReferenceName(record.Ref) 156 if !ref.IsBranch() { 157 return fmt.Errorf("%s is not a valid reference name", ref) 158 } 159 160 var langs []models.RepoLanguage 161 for _, l := range record.Meta.LangBreakdown.Inputs { 162 if l == nil { 163 continue 164 } 165 166 langs = append(langs, models.RepoLanguage{ 167 RepoAt: repo.RepoAt(), 168 Ref: ref.Short(), 169 IsDefaultRef: record.Meta.IsDefaultRef, 170 Language: l.Lang, 171 Bytes: l.Size, 172 }) 173 } 174 175 return db.InsertRepoLanguages(d, langs) 176} 177 178func ingestPipeline(d *db.DB, source ec.Source, msg ec.Message) error { 179 var record tangled.Pipeline 180 err := json.Unmarshal(msg.EventJson, &record) 181 if err != nil { 182 return err 183 } 184 185 if record.TriggerMetadata == nil { 186 return fmt.Errorf("empty trigger metadata: nsid %s, rkey %s", msg.Nsid, msg.Rkey) 187 } 188 189 if record.TriggerMetadata.Repo == nil { 190 return fmt.Errorf("empty repo: nsid %s, rkey %s", msg.Nsid, msg.Rkey) 191 } 192 193 // does this repo have a spindle configured? 194 repos, err := db.GetRepos( 195 d, 196 0, 197 db.FilterEq("did", record.TriggerMetadata.Repo.Did), 198 db.FilterEq("name", record.TriggerMetadata.Repo.Repo), 199 ) 200 if err != nil { 201 return fmt.Errorf("failed to look for repo in DB: nsid %s, rkey %s, %w", msg.Nsid, msg.Rkey, err) 202 } 203 if len(repos) != 1 { 204 return fmt.Errorf("incorrect number of repos returned: %d (expected 1)", len(repos)) 205 } 206 if repos[0].Spindle == "" { 207 return fmt.Errorf("repo does not have a spindle configured yet: nsid %s, rkey %s", msg.Nsid, msg.Rkey) 208 } 209 210 // trigger info 211 var trigger models.Trigger 212 var sha string 213 trigger.Kind = workflow.TriggerKind(record.TriggerMetadata.Kind) 214 switch trigger.Kind { 215 case workflow.TriggerKindPush: 216 trigger.PushRef = &record.TriggerMetadata.Push.Ref 217 trigger.PushNewSha = &record.TriggerMetadata.Push.NewSha 218 trigger.PushOldSha = &record.TriggerMetadata.Push.OldSha 219 sha = *trigger.PushNewSha 220 case workflow.TriggerKindPullRequest: 221 trigger.PRSourceBranch = &record.TriggerMetadata.PullRequest.SourceBranch 222 trigger.PRTargetBranch = &record.TriggerMetadata.PullRequest.TargetBranch 223 trigger.PRSourceSha = &record.TriggerMetadata.PullRequest.SourceSha 224 trigger.PRAction = &record.TriggerMetadata.PullRequest.Action 225 sha = *trigger.PRSourceSha 226 } 227 228 tx, err := d.Begin() 229 if err != nil { 230 return fmt.Errorf("failed to start txn: %w", err) 231 } 232 233 triggerId, err := db.AddTrigger(tx, trigger) 234 if err != nil { 235 return fmt.Errorf("failed to add trigger entry: %w", err) 236 } 237 238 pipeline := models.Pipeline{ 239 Rkey: msg.Rkey, 240 Knot: source.Key(), 241 RepoOwner: syntax.DID(record.TriggerMetadata.Repo.Did), 242 RepoName: record.TriggerMetadata.Repo.Repo, 243 TriggerId: int(triggerId), 244 Sha: sha, 245 } 246 247 err = db.AddPipeline(tx, pipeline) 248 if err != nil { 249 return fmt.Errorf("failed to add pipeline: %w", err) 250 } 251 252 err = tx.Commit() 253 if err != nil { 254 return fmt.Errorf("failed to commit txn: %w", err) 255 } 256 257 return nil 258}