Brad Fitzpatrick | b1ddf2b | 2017-02-08 06:05:26 +0000 | [diff] [blame] | 1 | // Copyright 2017 The Go Authors. All rights reserved. |
| 2 | // Use of this source code is governed by a BSD-style |
| 3 | // license that can be found in the LICENSE file. |
| 4 | |
| 5 | // Package maintner mirrors, searches, syncs, and serves Git, Github, |
| 6 | // and Gerrit metadata. |
| 7 | // |
| 8 | // Maintner is short for "Maintainer". This package is intended for |
| 9 | // use by many tools. The name of the daemon that serves the maintner |
| 10 | // data to other tools is "maintnerd". |
| 11 | package maintner |
| 12 | |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 13 | import ( |
| 14 | "context" |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 15 | "errors" |
Brad Fitzpatrick | 776028b | 2017-02-15 10:46:56 -0800 | [diff] [blame] | 16 | "fmt" |
Brad Fitzpatrick | 776028b | 2017-02-15 10:46:56 -0800 | [diff] [blame] | 17 | "log" |
Brad Fitzpatrick | 147e896 | 2017-03-08 02:43:47 +0000 | [diff] [blame] | 18 | "regexp" |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 19 | "sync" |
| 20 | "time" |
| 21 | |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 22 | "github.com/golang/protobuf/ptypes" |
| 23 | "github.com/golang/protobuf/ptypes/timestamp" |
| 24 | |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 25 | "golang.org/x/build/maintner/maintpb" |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 26 | "golang.org/x/sync/errgroup" |
Chris Broadfoot | f744882 | 2018-02-23 11:21:05 -0800 | [diff] [blame] | 27 | "golang.org/x/time/rate" |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 28 | ) |
Brad Fitzpatrick | b1ddf2b | 2017-02-08 06:05:26 +0000 | [diff] [blame] | 29 | |
| 30 | // Corpus holds all of a project's metadata. |
| 31 | type Corpus struct { |
Brad Fitzpatrick | 04f8c52 | 2017-04-29 07:39:57 +0000 | [diff] [blame] | 32 | mutationLogger MutationLogger // non-nil when this is a self-updating corpus |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 33 | mutationSource MutationSource // from Initialize |
Brad Fitzpatrick | 04f8c52 | 2017-04-29 07:39:57 +0000 | [diff] [blame] | 34 | verbose bool |
| 35 | dataDir string |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 36 | sawErrSplit bool |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 37 | |
Brad Fitzpatrick | a7d233f | 2017-03-08 16:56:47 -0800 | [diff] [blame] | 38 | mu sync.RWMutex // guards all following fields |
| 39 | // corpus state: |
Brad Fitzpatrick | 1cf306e | 2017-03-27 17:39:01 +0000 | [diff] [blame] | 40 | didInit bool // true after Initialize completes successfully |
Kevin Burke | 8cb8408 | 2017-03-03 11:56:12 -0800 | [diff] [blame] | 41 | debug bool |
Brad Fitzpatrick | 059b908 | 2017-03-29 01:10:53 +0000 | [diff] [blame] | 42 | strIntern map[string]string // interned strings, including binary githashes |
| 43 | |
Brad Fitzpatrick | da737d3 | 2017-04-05 23:30:39 +0000 | [diff] [blame] | 44 | // pubsub: |
| 45 | activityChans map[string]chan struct{} // keyed by topic |
| 46 | |
Brad Fitzpatrick | a7d233f | 2017-03-08 16:56:47 -0800 | [diff] [blame] | 47 | // github-specific |
Brad Fitzpatrick | b3a49f9 | 2017-03-20 19:58:04 +0000 | [diff] [blame] | 48 | github *GitHub |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 49 | gerrit *Gerrit |
Brad Fitzpatrick | 8e7c0db | 2017-03-13 20:51:23 +0000 | [diff] [blame] | 50 | watchedGithubRepos []watchedGithubRepo |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 51 | watchedGerritRepos []watchedGerritRepo |
Chris Broadfoot | f744882 | 2018-02-23 11:21:05 -0800 | [diff] [blame] | 52 | githubLimiter *rate.Limiter |
| 53 | |
Brad Fitzpatrick | a7d233f | 2017-03-08 16:56:47 -0800 | [diff] [blame] | 54 | // git-specific: |
Brad Fitzpatrick | 5bc3f1f | 2017-03-27 18:44:23 +0000 | [diff] [blame] | 55 | lastGitCount time.Time // last time of log spam about loading status |
Brad Fitzpatrick | a7d233f | 2017-03-08 16:56:47 -0800 | [diff] [blame] | 56 | pollGitDirs []polledGitCommits |
Kevin Burke | f2033b7 | 2017-03-27 13:36:47 -0600 | [diff] [blame] | 57 | gitPeople map[string]*GitPerson |
| 58 | gitCommit map[GitHash]*GitCommit |
| 59 | gitCommitTodo map[GitHash]bool // -> true |
| 60 | gitOfHg map[string]GitHash // hg hex hash -> git hash |
Brad Fitzpatrick | a7d233f | 2017-03-08 16:56:47 -0800 | [diff] [blame] | 61 | zoneCache map[string]*time.Location // "+0530" => location |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 62 | } |
| 63 | |
Brad Fitzpatrick | b77708e | 2017-05-16 14:10:39 -0700 | [diff] [blame] | 64 | // RLock grabs the corpus's read lock. Grabbing the read lock prevents |
Chris Broadfoot | 90850ed | 2017-07-08 09:08:42 -0700 | [diff] [blame] | 65 | // any concurrent writes from mutating the corpus. This is only |
Brad Fitzpatrick | b77708e | 2017-05-16 14:10:39 -0700 | [diff] [blame] | 66 | // necessary if the application is querying the corpus and calling its |
| 67 | // Update method concurrently. |
| 68 | func (c *Corpus) RLock() { c.mu.RLock() } |
| 69 | |
| 70 | // RUnlock unlocks the corpus's read lock. |
| 71 | func (c *Corpus) RUnlock() { c.mu.RUnlock() } |
| 72 | |
Brad Fitzpatrick | 147e896 | 2017-03-08 02:43:47 +0000 | [diff] [blame] | 73 | type polledGitCommits struct { |
| 74 | repo *maintpb.GitRepo |
| 75 | dir string |
| 76 | } |
| 77 | |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 78 | // EnableLeaderMode prepares c to be the leader. This should only be |
| 79 | // called by the maintnerd process. |
| 80 | // |
Brad Fitzpatrick | 04f8c52 | 2017-04-29 07:39:57 +0000 | [diff] [blame] | 81 | // The provided scratchDir will store git checkouts. |
| 82 | func (c *Corpus) EnableLeaderMode(logger MutationLogger, scratchDir string) { |
| 83 | c.mutationLogger = logger |
| 84 | c.dataDir = scratchDir |
| 85 | } |
| 86 | |
Brad Fitzpatrick | b77708e | 2017-05-16 14:10:39 -0700 | [diff] [blame] | 87 | // SetVerbose enables or disables verbose logging. |
Brad Fitzpatrick | 04f8c52 | 2017-04-29 07:39:57 +0000 | [diff] [blame] | 88 | func (c *Corpus) SetVerbose(v bool) { c.verbose = v } |
| 89 | |
| 90 | func (c *Corpus) getDataDir() string { |
| 91 | if c.dataDir == "" { |
| 92 | panic("getDataDir called before Corpus.EnableLeaderMode") |
| 93 | } |
| 94 | return c.dataDir |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 95 | } |
| 96 | |
Brad Fitzpatrick | 3dedafe | 2017-03-20 23:22:38 +0000 | [diff] [blame] | 97 | // GitHub returns the corpus's github data. |
| 98 | func (c *Corpus) GitHub() *GitHub { |
| 99 | if c.github != nil { |
| 100 | return c.github |
| 101 | } |
| 102 | return new(GitHub) |
| 103 | } |
| 104 | |
Brad Fitzpatrick | 1eecef3 | 2017-04-03 13:01:31 -0700 | [diff] [blame] | 105 | // Gerrit returns the corpus's Gerrit data. |
| 106 | func (c *Corpus) Gerrit() *Gerrit { |
| 107 | if c.gerrit != nil { |
| 108 | return c.gerrit |
| 109 | } |
| 110 | return new(Gerrit) |
| 111 | } |
| 112 | |
Brad Fitzpatrick | b77708e | 2017-05-16 14:10:39 -0700 | [diff] [blame] | 113 | // Check verifies the internal structure of the Corpus data structures. |
| 114 | // It is intended for tests and debugging. |
| 115 | func (c *Corpus) Check() error { |
Brad Fitzpatrick | ae78535 | 2017-05-24 16:12:44 +0000 | [diff] [blame] | 116 | if err := c.Gerrit().check(); err != nil { |
| 117 | return fmt.Errorf("gerrit: %v", err) |
Brad Fitzpatrick | b77708e | 2017-05-16 14:10:39 -0700 | [diff] [blame] | 118 | } |
Brad Fitzpatrick | 2662697 | 2017-11-16 00:30:55 +0000 | [diff] [blame] | 119 | |
| 120 | for hash, gc := range c.gitCommit { |
| 121 | if gc.Committer == placeholderCommitter { |
| 122 | return fmt.Errorf("corpus git commit %v has placeholder committer", hash) |
| 123 | } |
| 124 | if gc.Hash != hash { |
| 125 | return fmt.Errorf("git commit for key %q had GitCommit.Hash %q", hash, gc.Hash) |
| 126 | } |
| 127 | for _, pc := range gc.Parents { |
| 128 | if _, ok := c.gitCommit[pc.Hash]; !ok { |
| 129 | return fmt.Errorf("git commit %q exists but its parent %q does not", gc.Hash, pc.Hash) |
| 130 | } |
| 131 | } |
| 132 | } |
| 133 | |
Brad Fitzpatrick | b77708e | 2017-05-16 14:10:39 -0700 | [diff] [blame] | 134 | return nil |
| 135 | } |
| 136 | |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 137 | // mustProtoFromTime turns a time.Time into a *timestamp.Timestamp or panics if |
| 138 | // in is invalid. |
| 139 | func mustProtoFromTime(in time.Time) *timestamp.Timestamp { |
| 140 | tp, err := ptypes.TimestampProto(in) |
| 141 | if err != nil { |
| 142 | panic(err) |
| 143 | } |
| 144 | return tp |
| 145 | } |
| 146 | |
Brad Fitzpatrick | d1cc7bf | 2017-03-09 12:48:04 -0800 | [diff] [blame] | 147 | // requires c.mu be held for writing |
| 148 | func (c *Corpus) str(s string) string { |
| 149 | if v, ok := c.strIntern[s]; ok { |
| 150 | return v |
| 151 | } |
| 152 | if c.strIntern == nil { |
| 153 | c.strIntern = make(map[string]string) |
| 154 | } |
| 155 | c.strIntern[s] = s |
| 156 | return s |
| 157 | } |
| 158 | |
Brad Fitzpatrick | eadb1bf | 2017-03-27 18:42:54 +0000 | [diff] [blame] | 159 | func (c *Corpus) strb(b []byte) string { |
| 160 | if v, ok := c.strIntern[string(b)]; ok { |
| 161 | return v |
| 162 | } |
| 163 | return c.str(string(b)) |
| 164 | } |
| 165 | |
Kevin Burke | 8cb8408 | 2017-03-03 11:56:12 -0800 | [diff] [blame] | 166 | func (c *Corpus) SetDebug() { |
| 167 | c.debug = true |
| 168 | } |
| 169 | |
| 170 | func (c *Corpus) debugf(format string, v ...interface{}) { |
| 171 | if c.debug { |
| 172 | log.Printf(format, v...) |
| 173 | } |
| 174 | } |
| 175 | |
// gerritProjNameRx matches the Gerrit project names this package
// accepts: one or more lowercase letters or digits, optionally followed
// by lowercase letters, digits, hyphens, or underscores.
// TODO: figure out if this is accurate.
var gerritProjNameRx = regexp.MustCompile(`^[a-z0-9]+[a-z0-9\-\_]*$`)
| 179 | |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 180 | // TrackGoGitRepo registers a git directory to have its metadata slurped into the corpus. |
Brad Fitzpatrick | 147e896 | 2017-03-08 02:43:47 +0000 | [diff] [blame] | 181 | // The goRepo is a name like "go" or "net". The dir is a path on disk. |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 182 | func (c *Corpus) TrackGoGitRepo(goRepo, dir string) { |
| 183 | if c.mutationLogger == nil { |
| 184 | panic("can't TrackGoGitRepo in non-leader mode") |
| 185 | } |
Brad Fitzpatrick | 147e896 | 2017-03-08 02:43:47 +0000 | [diff] [blame] | 186 | if !gerritProjNameRx.MatchString(goRepo) { |
| 187 | panic(fmt.Sprintf("bogus goRepo value %q", goRepo)) |
| 188 | } |
| 189 | c.mu.Lock() |
| 190 | defer c.mu.Unlock() |
| 191 | c.pollGitDirs = append(c.pollGitDirs, polledGitCommits{ |
| 192 | repo: &maintpb.GitRepo{GoRepo: goRepo}, |
| 193 | dir: dir, |
| 194 | }) |
| 195 | } |
| 196 | |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 197 | // A MutationSource yields a log of mutations that will catch a corpus |
| 198 | // back up to the present. |
| 199 | type MutationSource interface { |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 200 | // GetMutations returns a channel of mutations or related events. |
| 201 | // The channel will never be closed. |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 202 | // All sends on the returned channel should select |
| 203 | // on the provided context. |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 204 | GetMutations(context.Context) <-chan MutationStreamEvent |
| 205 | } |
| 206 | |
| 207 | // MutationStreamEvent represents one of three possible events while |
Dmitri Shuralyov | bb8466f | 2020-02-29 00:13:56 -0500 | [diff] [blame] | 208 | // reading mutations from disk or another source. |
| 209 | // An event is either a mutation, an error, or reaching the current |
| 210 | // end of the log. Exactly one of the three fields will be non-zero. |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 211 | type MutationStreamEvent struct { |
| 212 | Mutation *maintpb.Mutation |
| 213 | |
| 214 | // Err is a fatal error reading the log. No other events will |
| 215 | // follow an Err. |
| 216 | Err error |
| 217 | |
| 218 | // End, if true, means that all mutations have been sent and |
| 219 | // the next event might take some time to arrive (it might not |
| 220 | // have occurred yet). The End event is not a terminal state |
| 221 | // like Err. There may be multiple Ends. |
| 222 | End bool |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 223 | } |
| 224 | |
Brad Fitzpatrick | 021a49d | 2017-04-18 18:17:06 +0000 | [diff] [blame] | 225 | // Initialize populates the Corpus using the data from the |
| 226 | // MutationSource. It returns once it's up-to-date. To incrementally |
| 227 | // update it later, use the Update method. |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 228 | func (c *Corpus) Initialize(ctx context.Context, src MutationSource) error { |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 229 | if c.mutationSource != nil { |
| 230 | panic("duplicate call to Initialize") |
| 231 | } |
| 232 | c.mutationSource = src |
| 233 | log.Printf("Loading data from log %T ...", src) |
Andrew Bonventre | 6990c34 | 2017-07-05 22:24:05 -0400 | [diff] [blame] | 234 | return c.update(ctx, nil) |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 235 | } |
| 236 | |
// ErrSplit is the error returned when the client detects that the
// leader's mutation log has changed underneath it. This can happen if
// the leader restarts with uncommitted transactions. (The leader only
// commits mutations periodically.)
var ErrSplit = errors.New("maintner: leader server's history split, process out of sync")
| 242 | |
| 243 | // Update incrementally updates the corpus from its current state to |
| 244 | // the latest state from the MutationSource passed earlier to |
| 245 | // Initialize. It does not return until there's either a new change or |
| 246 | // the context expires. |
Dmitri Shuralyov | 816bbcc | 2022-06-25 13:12:59 -0400 | [diff] [blame] | 247 | // If Update returns ErrSplit, the corpus can no longer be updated. |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 248 | // |
Chris Broadfoot | 90850ed | 2017-07-08 09:08:42 -0700 | [diff] [blame] | 249 | // Update must not be called concurrently with any other Update calls. If |
| 250 | // reading the corpus concurrently while the corpus is updating, you must hold |
| 251 | // the read lock using Corpus.RLock. |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 252 | func (c *Corpus) Update(ctx context.Context) error { |
| 253 | if c.mutationSource == nil { |
Andrew Bonventre | 6990c34 | 2017-07-05 22:24:05 -0400 | [diff] [blame] | 254 | panic("Update called without call to Initialize") |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 255 | } |
| 256 | if c.sawErrSplit { |
Andrew Bonventre | 6990c34 | 2017-07-05 22:24:05 -0400 | [diff] [blame] | 257 | panic("Update called after previous call returned ErrSplit") |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 258 | } |
| 259 | log.Printf("Updating data from log %T ...", c.mutationSource) |
Andrew Bonventre | 6990c34 | 2017-07-05 22:24:05 -0400 | [diff] [blame] | 260 | err := c.update(ctx, nil) |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 261 | if err == ErrSplit { |
| 262 | c.sawErrSplit = true |
| 263 | } |
| 264 | return err |
| 265 | } |
| 266 | |
Andrew Bonventre | 6990c34 | 2017-07-05 22:24:05 -0400 | [diff] [blame] | 267 | // UpdateWithLocker behaves just like Update, but holds lk when processing |
| 268 | // mutation events. |
| 269 | func (c *Corpus) UpdateWithLocker(ctx context.Context, lk sync.Locker) error { |
| 270 | if c.mutationSource == nil { |
| 271 | panic("UpdateWithLocker called without call to Initialize") |
| 272 | } |
| 273 | if c.sawErrSplit { |
| 274 | panic("UpdateWithLocker called after previous call returned ErrSplit") |
| 275 | } |
| 276 | log.Printf("Updating data from log %T ...", c.mutationSource) |
| 277 | err := c.update(ctx, lk) |
| 278 | if err == ErrSplit { |
| 279 | c.sawErrSplit = true |
| 280 | } |
| 281 | return err |
| 282 | } |
| 283 | |
// noopLocker is a sync.Locker whose Lock and Unlock do nothing. The
// update method substitutes it when the caller supplies no locker.
type noopLocker struct{}

// Compile-time check that noopLocker implements sync.Locker.
var _ sync.Locker = noopLocker{}

// Lock does nothing.
func (noopLocker) Lock() {}

// Unlock does nothing.
func (noopLocker) Unlock() {}
| 288 | |
Andrew Bonventre | 6990c34 | 2017-07-05 22:24:05 -0400 | [diff] [blame] | 289 | // lk optionally specifies a locker to use while processing mutations. |
| 290 | func (c *Corpus) update(ctx context.Context, lk sync.Locker) error { |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 291 | src := c.mutationSource |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 292 | ch := src.GetMutations(ctx) |
| 293 | done := ctx.Done() |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 294 | c.mu.Lock() |
| 295 | defer c.mu.Unlock() |
Brad Fitzpatrick | ee6321b | 2017-11-14 23:25:00 +0000 | [diff] [blame] | 296 | if lk == nil { |
| 297 | lk = noopLocker{} |
| 298 | } |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 299 | for { |
| 300 | select { |
| 301 | case <-done: |
Brad Fitzpatrick | a7d233f | 2017-03-08 16:56:47 -0800 | [diff] [blame] | 302 | err := ctx.Err() |
| 303 | log.Printf("Context expired while loading data from log %T: %v", src, err) |
| 304 | return err |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 305 | case e := <-ch: |
| 306 | if e.Err != nil { |
Brad Fitzpatrick | 1a1ef8e | 2017-04-29 21:15:37 +0000 | [diff] [blame] | 307 | log.Printf("Corpus GetMutations: %v", e.Err) |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 308 | return e.Err |
| 309 | } |
| 310 | if e.End { |
Brad Fitzpatrick | 1cf306e | 2017-03-27 17:39:01 +0000 | [diff] [blame] | 311 | c.didInit = true |
Brad Fitzpatrick | ee6321b | 2017-11-14 23:25:00 +0000 | [diff] [blame] | 312 | lk.Lock() |
| 313 | c.finishProcessing() |
| 314 | lk.Unlock() |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 315 | log.Printf("Reloaded data from log %T.", src) |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 316 | return nil |
| 317 | } |
Brad Fitzpatrick | ee6321b | 2017-11-14 23:25:00 +0000 | [diff] [blame] | 318 | lk.Lock() |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 319 | c.processMutationLocked(e.Mutation) |
Brad Fitzpatrick | ee6321b | 2017-11-14 23:25:00 +0000 | [diff] [blame] | 320 | lk.Unlock() |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 321 | } |
| 322 | } |
| 323 | } |
| 324 | |
Brad Fitzpatrick | 2ceb757 | 2017-03-25 03:56:50 +0000 | [diff] [blame] | 325 | // addMutation adds a mutation to the log and immediately processes it. |
| 326 | func (c *Corpus) addMutation(m *maintpb.Mutation) { |
Brad Fitzpatrick | 04f8c52 | 2017-04-29 07:39:57 +0000 | [diff] [blame] | 327 | if c.verbose { |
Brad Fitzpatrick | 8927fdd | 2017-03-15 17:51:41 +0000 | [diff] [blame] | 328 | log.Printf("mutation: %v", m) |
| 329 | } |
Kevin Burke | 9fd5f30 | 2017-02-28 13:31:57 -0800 | [diff] [blame] | 330 | c.mu.Lock() |
| 331 | c.processMutationLocked(m) |
Brad Fitzpatrick | 02c3a36 | 2017-11-17 21:48:51 +0000 | [diff] [blame] | 332 | c.finishProcessing() |
Kevin Burke | 9fd5f30 | 2017-02-28 13:31:57 -0800 | [diff] [blame] | 333 | c.mu.Unlock() |
Brad Fitzpatrick | 2ceb757 | 2017-03-25 03:56:50 +0000 | [diff] [blame] | 334 | |
Brad Fitzpatrick | 04f8c52 | 2017-04-29 07:39:57 +0000 | [diff] [blame] | 335 | if c.mutationLogger == nil { |
Brad Fitzpatrick | 2ceb757 | 2017-03-25 03:56:50 +0000 | [diff] [blame] | 336 | return |
| 337 | } |
Brad Fitzpatrick | 04f8c52 | 2017-04-29 07:39:57 +0000 | [diff] [blame] | 338 | err := c.mutationLogger.Log(m) |
Brad Fitzpatrick | 2ceb757 | 2017-03-25 03:56:50 +0000 | [diff] [blame] | 339 | if err != nil { |
| 340 | // TODO: handle errors better? failing is only safe option. |
| 341 | log.Fatalf("could not log mutation %v: %v\n", m, err) |
Kevin Burke | 9fd5f30 | 2017-02-28 13:31:57 -0800 | [diff] [blame] | 342 | } |
| 343 | } |
| 344 | |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 345 | // c.mu must be held. |
| 346 | func (c *Corpus) processMutationLocked(m *maintpb.Mutation) { |
| 347 | if im := m.GithubIssue; im != nil { |
| 348 | c.processGithubIssueMutation(im) |
| 349 | } |
Brad Fitzpatrick | 8cf2b3b | 2017-03-18 03:48:31 +0000 | [diff] [blame] | 350 | if gm := m.Github; gm != nil { |
| 351 | c.processGithubMutation(gm) |
| 352 | } |
Brad Fitzpatrick | a7d233f | 2017-03-08 16:56:47 -0800 | [diff] [blame] | 353 | if gm := m.Git; gm != nil { |
| 354 | c.processGitMutation(gm) |
| 355 | } |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 356 | if gm := m.Gerrit; gm != nil { |
| 357 | c.processGerritMutation(gm) |
| 358 | } |
Brad Fitzpatrick | 49a8dd9 | 2017-02-12 07:22:59 +0000 | [diff] [blame] | 359 | } |
| 360 | |
Brad Fitzpatrick | ee6321b | 2017-11-14 23:25:00 +0000 | [diff] [blame] | 361 | // finishProcessing fixes up invariants and data structures before |
| 362 | // returning the Corpus from the Update loop back to the user. |
| 363 | // |
| 364 | // c.mu must be held. |
| 365 | func (c *Corpus) finishProcessing() { |
| 366 | c.gerrit.finishProcessing() |
| 367 | } |
| 368 | |
Brad Fitzpatrick | 8da4ff0 | 2017-03-20 22:18:18 +0000 | [diff] [blame] | 369 | // SyncLoop runs forever (until an error or context expiration) and |
| 370 | // updates the corpus as the tracked sources change. |
| 371 | func (c *Corpus) SyncLoop(ctx context.Context) error { |
| 372 | return c.sync(ctx, true) |
Brad Fitzpatrick | b1ddf2b | 2017-02-08 06:05:26 +0000 | [diff] [blame] | 373 | } |
| 374 | |
Brad Fitzpatrick | 8da4ff0 | 2017-03-20 22:18:18 +0000 | [diff] [blame] | 375 | // Sync updates the corpus from its tracked sources. |
| 376 | func (c *Corpus) Sync(ctx context.Context) error { |
| 377 | return c.sync(ctx, false) |
Brad Fitzpatrick | b1ddf2b | 2017-02-08 06:05:26 +0000 | [diff] [blame] | 378 | } |
| 379 | |
Brad Fitzpatrick | 8da4ff0 | 2017-03-20 22:18:18 +0000 | [diff] [blame] | 380 | func (c *Corpus) sync(ctx context.Context, loop bool) error { |
Brad Fitzpatrick | 73e10fb | 2017-05-16 17:36:42 -0700 | [diff] [blame] | 381 | if _, ok := c.mutationSource.(*netMutSource); ok { |
| 382 | return errors.New("maintner: can't run Corpus.Sync on a Corpus using NetworkMutationSource (did you mean Update?)") |
| 383 | } |
| 384 | |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 385 | group, ctx := errgroup.WithContext(ctx) |
Brad Fitzpatrick | 8927fdd | 2017-03-15 17:51:41 +0000 | [diff] [blame] | 386 | for _, w := range c.watchedGithubRepos { |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 387 | gr, token := w.gr, w.token |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 388 | group.Go(func() error { |
Brad Fitzpatrick | 8927fdd | 2017-03-15 17:51:41 +0000 | [diff] [blame] | 389 | log.Printf("Polling %v ...", gr.id) |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 390 | for { |
| 391 | err := gr.sync(ctx, token, loop) |
| 392 | if loop && isTempErr(err) { |
| 393 | log.Printf("Temporary error from github %v: %v", gr.ID(), err) |
| 394 | time.Sleep(30 * time.Second) |
| 395 | continue |
| 396 | } |
| 397 | log.Printf("github sync ending for %v: %v", gr.ID(), err) |
| 398 | return err |
| 399 | } |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 400 | }) |
| 401 | } |
Brad Fitzpatrick | 147e896 | 2017-03-08 02:43:47 +0000 | [diff] [blame] | 402 | for _, rp := range c.pollGitDirs { |
| 403 | rp := rp |
| 404 | group.Go(func() error { |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 405 | for { |
| 406 | err := c.syncGitCommits(ctx, rp, loop) |
| 407 | if loop && isTempErr(err) { |
| 408 | log.Printf("Temporary error from git repo %v: %v", rp.dir, err) |
| 409 | time.Sleep(30 * time.Second) |
| 410 | continue |
| 411 | } |
| 412 | log.Printf("git sync ending for %v: %v", rp.dir, err) |
| 413 | return err |
| 414 | } |
Brad Fitzpatrick | 147e896 | 2017-03-08 02:43:47 +0000 | [diff] [blame] | 415 | }) |
| 416 | } |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 417 | for _, w := range c.watchedGerritRepos { |
Brad Fitzpatrick | d97cc62 | 2017-03-24 23:23:46 +0000 | [diff] [blame] | 418 | gp := w.project |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 419 | group.Go(func() error { |
Brad Fitzpatrick | d97cc62 | 2017-03-24 23:23:46 +0000 | [diff] [blame] | 420 | log.Printf("Polling gerrit %v ...", gp.proj) |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 421 | for { |
| 422 | err := gp.sync(ctx, loop) |
| 423 | if loop && isTempErr(err) { |
| 424 | log.Printf("Temporary error from gerrit %v: %v", gp.proj, err) |
| 425 | time.Sleep(30 * time.Second) |
| 426 | continue |
| 427 | } |
| 428 | log.Printf("gerrit sync ending for %v: %v", gp.proj, err) |
| 429 | return err |
| 430 | } |
Kevin Burke | 92164ac | 2017-03-18 17:11:31 -0700 | [diff] [blame] | 431 | }) |
| 432 | } |
Kevin Burke | 7ebe3f6 | 2017-02-20 13:59:38 -0800 | [diff] [blame] | 433 | return group.Wait() |
| 434 | } |
Brad Fitzpatrick | 8160f0c | 2017-04-26 22:52:07 +0000 | [diff] [blame] | 435 | |
// isTempErr reports whether err should be treated as temporary, in
// which case the sync loops sleep and then retry the failed operation.
//
// Context cancellation and deadline expiry (including wrapped forms)
// are never temporary: retrying cannot succeed once the context is
// done, and treating them as retryable would keep the sync loops
// spinning after the caller asked them to stop. Every other value,
// including nil, is still reported as temporary, as before.
func isTempErr(err error) bool {
	log.Printf("IS TEMP ERROR? %T %v", err, err)
	if errors.Is(err, context.Canceled) || errors.Is(err, context.DeadlineExceeded) {
		return false
	}
	return true
}