2021-02-27 02:42:37 +03:00
|
|
|
package github
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
2021-03-05 22:06:21 +03:00
|
|
|
"strings"
|
2021-02-27 02:42:37 +03:00
|
|
|
"sync"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/shurcooL/githubv4"
|
|
|
|
)
|
|
|
|
|
2021-03-05 22:06:21 +03:00
|
|
|
const ( // These values influence how fast the github graphql rate limit is exhausted.
|
|
|
|
NUM_ISSUES = 40
|
|
|
|
NUM_ISSUE_EDITS = 100
|
|
|
|
NUM_TIMELINE_ITEMS = 100
|
|
|
|
NUM_COMMENT_EDITS = 100
|
2021-02-27 02:42:37 +03:00
|
|
|
|
|
|
|
CHAN_CAPACITY = 128
|
|
|
|
)
|
|
|
|
|
2021-03-08 09:53:09 +03:00
|
|
|
// importMediator provides a convenient interface to retrieve issues from the Github GraphQL API.
|
2021-02-27 02:42:37 +03:00
|
|
|
type importMediator struct {
|
|
|
|
// Github graphql client
|
2021-03-05 22:06:21 +03:00
|
|
|
gc *githubv4.Client
|
|
|
|
|
|
|
|
// name of the repository owner on Github
|
|
|
|
owner string
|
|
|
|
|
|
|
|
// name of the Github repository
|
2021-02-27 02:42:37 +03:00
|
|
|
project string
|
2021-03-05 22:06:21 +03:00
|
|
|
|
2021-03-08 09:53:09 +03:00
|
|
|
// since specifies which issues to import. Issues that have been updated at or after the
|
|
|
|
// given date should be imported.
|
2021-02-27 02:42:37 +03:00
|
|
|
since time.Time
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
// Issues is a channel holding bundles of Issues to be imported. Each issueEvent
|
|
|
|
// is either a message (type messageEvent) or a struct holding all the data associated with
|
|
|
|
// one issue (type issueData).
|
|
|
|
Issues chan issueEvent
|
2021-03-05 22:06:21 +03:00
|
|
|
|
2021-03-08 09:53:09 +03:00
|
|
|
// Sticky error
|
|
|
|
err error
|
2021-03-05 22:06:21 +03:00
|
|
|
|
2021-03-08 09:53:09 +03:00
|
|
|
// errMut is a mutex to synchronize access to the sticky error variable err.
|
|
|
|
errMut sync.Mutex
|
|
|
|
}
|
2021-03-05 22:06:21 +03:00
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
type issueEvent interface {
|
|
|
|
isIssueEvent()
|
|
|
|
}
|
|
|
|
type timelineEvent interface {
|
|
|
|
isTimelineEvent()
|
|
|
|
}
|
|
|
|
type userContentEditEvent interface {
|
|
|
|
isUserContentEditEvent()
|
2021-03-08 09:53:09 +03:00
|
|
|
}
|
2021-02-27 02:42:37 +03:00
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
type messageEvent struct {
|
|
|
|
msg string
|
2021-03-05 22:06:21 +03:00
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (messageEvent) isIssueEvent() {}
|
|
|
|
func (messageEvent) isUserContentEditEvent() {}
|
|
|
|
func (messageEvent) isTimelineEvent() {}
|
|
|
|
|
|
|
|
type issueData struct {
|
|
|
|
issue
|
|
|
|
issueEdits <-chan userContentEditEvent
|
|
|
|
timelineItems <-chan timelineEvent
|
|
|
|
}
|
|
|
|
|
|
|
|
func (issueData) isIssueEvent() {}
|
|
|
|
|
|
|
|
type timelineData struct {
|
|
|
|
timelineItem
|
|
|
|
userContentEdits <-chan userContentEditEvent
|
|
|
|
}
|
|
|
|
|
|
|
|
func (timelineData) isTimelineEvent() {}
|
|
|
|
|
|
|
|
type userContentEditData struct {
|
|
|
|
userContentEdit
|
|
|
|
}
|
|
|
|
|
|
|
|
// func (userContentEditData) isEvent()
|
|
|
|
func (userContentEditData) isUserContentEditEvent() {}
|
|
|
|
|
2021-03-05 22:06:21 +03:00
|
|
|
func (mm *importMediator) setError(err error) {
|
|
|
|
mm.errMut.Lock()
|
|
|
|
mm.err = err
|
|
|
|
mm.errMut.Unlock()
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
func NewImportMediator(ctx context.Context, client *githubv4.Client, owner, project string, since time.Time) *importMediator {
|
|
|
|
mm := importMediator{
|
2021-03-08 09:53:09 +03:00
|
|
|
gc: client,
|
|
|
|
owner: owner,
|
|
|
|
project: project,
|
|
|
|
since: since,
|
2021-03-17 21:29:39 +03:00
|
|
|
Issues: make(chan issueEvent, CHAN_CAPACITY),
|
2021-03-08 09:53:09 +03:00
|
|
|
err: nil,
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
go func() {
|
2021-03-05 22:06:21 +03:00
|
|
|
mm.fillIssues(ctx)
|
2021-03-17 21:29:39 +03:00
|
|
|
close(mm.Issues)
|
2021-02-27 02:42:37 +03:00
|
|
|
}()
|
|
|
|
return &mm
|
|
|
|
}
|
|
|
|
|
2021-03-08 09:53:09 +03:00
|
|
|
type varmap map[string]interface{}
|
|
|
|
|
2021-03-05 22:06:21 +03:00
|
|
|
func newIssueVars(owner, project string, since time.Time) varmap {
|
|
|
|
return varmap{
|
|
|
|
"owner": githubv4.String(owner),
|
|
|
|
"name": githubv4.String(project),
|
|
|
|
"issueSince": githubv4.DateTime{Time: since},
|
|
|
|
"issueFirst": githubv4.Int(NUM_ISSUES),
|
|
|
|
"issueEditLast": githubv4.Int(NUM_ISSUE_EDITS),
|
|
|
|
"issueEditBefore": (*githubv4.String)(nil),
|
|
|
|
"timelineFirst": githubv4.Int(NUM_TIMELINE_ITEMS),
|
|
|
|
"timelineAfter": (*githubv4.String)(nil),
|
|
|
|
"commentEditLast": githubv4.Int(NUM_COMMENT_EDITS),
|
|
|
|
"commentEditBefore": (*githubv4.String)(nil),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func newIssueEditVars() varmap {
|
|
|
|
return varmap{
|
|
|
|
"issueEditLast": githubv4.Int(NUM_ISSUE_EDITS),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func newTimelineVars() varmap {
|
|
|
|
return varmap{
|
|
|
|
"timelineFirst": githubv4.Int(NUM_TIMELINE_ITEMS),
|
|
|
|
"commentEditLast": githubv4.Int(NUM_COMMENT_EDITS),
|
|
|
|
"commentEditBefore": (*githubv4.String)(nil),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func newCommentEditVars() varmap {
|
|
|
|
return varmap{
|
|
|
|
"commentEditLast": githubv4.Int(NUM_COMMENT_EDITS),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-27 02:42:37 +03:00
|
|
|
func (mm *importMediator) Error() error {
|
2021-03-05 22:06:21 +03:00
|
|
|
mm.errMut.Lock()
|
|
|
|
err := mm.err
|
|
|
|
mm.errMut.Unlock()
|
|
|
|
return err
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
func (mm *importMediator) User(ctx context.Context, loginName string) (*user, error) {
|
|
|
|
query := userQuery{}
|
|
|
|
vars := varmap{"login": githubv4.String(loginName)}
|
2021-03-17 21:29:39 +03:00
|
|
|
// handle message events localy
|
|
|
|
channel := make(chan messageEvent)
|
|
|
|
defer close(channel)
|
|
|
|
// print all messages immediately
|
|
|
|
go func() {
|
|
|
|
for event := range channel {
|
|
|
|
fmt.Println(event.msg)
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
if err := mm.mQuery(ctx, &query, vars, channel); err != nil {
|
2021-02-27 02:42:37 +03:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return &query.User, nil
|
|
|
|
}
|
|
|
|
|
2021-03-05 22:06:21 +03:00
|
|
|
func (mm *importMediator) fillIssues(ctx context.Context) {
|
2021-03-17 21:29:39 +03:00
|
|
|
// First: setup message handling while submitting GraphQL queries.
|
|
|
|
msgs := make(chan messageEvent)
|
|
|
|
defer close(msgs)
|
|
|
|
// forward all the messages to the issue channel. The message will be queued after
|
|
|
|
// all the issues which has been completed.
|
|
|
|
go func() {
|
|
|
|
for msg := range msgs {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
case mm.Issues <- msg:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
// start processing the actual issues
|
2021-03-05 22:06:21 +03:00
|
|
|
initialCursor := githubv4.String("")
|
2021-03-17 21:29:39 +03:00
|
|
|
issues, hasIssues := mm.queryIssue(ctx, initialCursor, msgs)
|
2021-03-05 22:06:21 +03:00
|
|
|
for hasIssues {
|
|
|
|
for _, node := range issues.Nodes {
|
2021-03-08 09:53:09 +03:00
|
|
|
// We need to send an issue-bundle over the issue channel before we start
|
|
|
|
// filling the issue edits and the timeline items to avoid deadlocks.
|
2021-03-17 21:29:39 +03:00
|
|
|
issueEditChan := make(chan userContentEditEvent, CHAN_CAPACITY)
|
|
|
|
timelineBundleChan := make(chan timelineEvent, CHAN_CAPACITY)
|
2021-03-05 22:06:21 +03:00
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
2021-03-17 21:29:39 +03:00
|
|
|
case mm.Issues <- issueData{node.issue, issueEditChan, timelineBundleChan}:
|
2021-03-05 22:06:21 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
// We do not know whether the client reads from the issue edit channel
|
|
|
|
// or the timeline channel first. Since the capacity of any channel is limited
|
|
|
|
// any send operation may block. Hence, in order to avoid deadlocks we need
|
|
|
|
// to send over both these channels concurrently.
|
|
|
|
go func(node issueNode) {
|
|
|
|
mm.fillIssueEdits(ctx, &node, issueEditChan)
|
|
|
|
close(issueEditChan)
|
|
|
|
}(node)
|
|
|
|
go func(node issueNode) {
|
2021-03-08 09:53:09 +03:00
|
|
|
mm.fillTimeline(ctx, &node, timelineBundleChan)
|
|
|
|
close(timelineBundleChan)
|
2021-03-05 22:06:21 +03:00
|
|
|
}(node)
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
2021-03-05 22:06:21 +03:00
|
|
|
if !issues.PageInfo.HasNextPage {
|
|
|
|
break
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
2021-03-17 21:29:39 +03:00
|
|
|
issues, hasIssues = mm.queryIssue(ctx, issues.PageInfo.EndCursor, msgs)
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) fillIssueEdits(ctx context.Context, issueNode *issueNode, channel chan<- userContentEditEvent) {
|
|
|
|
// First: setup message handling while submitting GraphQL queries.
|
|
|
|
msgs := make(chan messageEvent)
|
|
|
|
defer close(msgs)
|
|
|
|
// forward all the messages to the issue-edit channel. The message will be queued after
|
|
|
|
// all the issue edits which have been completed.
|
|
|
|
go func() {
|
|
|
|
for msg := range msgs {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
case channel <- msg:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
2021-02-27 02:42:37 +03:00
|
|
|
edits := &issueNode.UserContentEdits
|
|
|
|
hasEdits := true
|
|
|
|
for hasEdits {
|
|
|
|
for edit := range reverse(edits.Nodes) {
|
|
|
|
if edit.Diff == nil || string(*edit.Diff) == "" {
|
2021-03-05 22:06:21 +03:00
|
|
|
// issueEdit.Diff == nil happen if the event is older than early
|
|
|
|
// 2018, Github doesn't have the data before that. Best we can do is
|
|
|
|
// to ignore the event.
|
2021-02-27 02:42:37 +03:00
|
|
|
continue
|
|
|
|
}
|
2021-03-05 22:06:21 +03:00
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
2021-03-17 21:29:39 +03:00
|
|
|
case channel <- userContentEditData{edit}:
|
2021-03-05 22:06:21 +03:00
|
|
|
}
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
if !edits.PageInfo.HasPreviousPage {
|
|
|
|
break
|
|
|
|
}
|
2021-03-17 21:29:39 +03:00
|
|
|
edits, hasEdits = mm.queryIssueEdits(ctx, issueNode.issue.Id, edits.PageInfo.EndCursor, msgs)
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) fillTimeline(ctx context.Context, issueNode *issueNode, channel chan<- timelineEvent) {
|
|
|
|
// First: setup message handling while submitting GraphQL queries.
|
|
|
|
msgs := make(chan messageEvent)
|
|
|
|
defer close(msgs)
|
|
|
|
// forward all the messages to the timeline channel. The message will be queued after
|
|
|
|
// all the timeline items which have been completed.
|
|
|
|
go func() {
|
|
|
|
for msg := range msgs {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
case channel <- msg:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
2021-02-27 02:42:37 +03:00
|
|
|
items := &issueNode.TimelineItems
|
|
|
|
hasItems := true
|
|
|
|
for hasItems {
|
|
|
|
for _, item := range items.Nodes {
|
2021-03-05 22:06:21 +03:00
|
|
|
if item.Typename == "IssueComment" {
|
2021-03-08 09:53:09 +03:00
|
|
|
// Issue comments are different than other timeline items in that
|
|
|
|
// they may have associated user content edits.
|
|
|
|
//
|
|
|
|
// Send over the timeline-channel before starting to fill the comment
|
|
|
|
// edits.
|
2021-03-17 21:29:39 +03:00
|
|
|
commentEditChan := make(chan userContentEditEvent, CHAN_CAPACITY)
|
2021-03-05 22:06:21 +03:00
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
2021-03-17 21:29:39 +03:00
|
|
|
case channel <- timelineData{item, commentEditChan}:
|
2021-03-05 22:06:21 +03:00
|
|
|
}
|
|
|
|
// We need to create a new goroutine for filling the comment edit
|
|
|
|
// channel.
|
|
|
|
go func(item timelineItem) {
|
|
|
|
mm.fillCommentEdits(ctx, &item, commentEditChan)
|
|
|
|
close(commentEditChan)
|
|
|
|
}(item)
|
|
|
|
} else {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
2021-03-17 21:29:39 +03:00
|
|
|
case channel <- timelineData{item, nil}:
|
2021-03-05 22:06:21 +03:00
|
|
|
}
|
|
|
|
}
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
if !items.PageInfo.HasNextPage {
|
|
|
|
break
|
|
|
|
}
|
2021-03-17 21:29:39 +03:00
|
|
|
items, hasItems = mm.queryTimeline(ctx, issueNode.issue.Id, items.PageInfo.EndCursor, msgs)
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) fillCommentEdits(ctx context.Context, item *timelineItem, channel chan<- userContentEditEvent) {
|
2021-03-05 22:06:21 +03:00
|
|
|
// Here we are only concerned with timeline items of type issueComment.
|
2021-02-27 02:42:37 +03:00
|
|
|
if item.Typename != "IssueComment" {
|
|
|
|
return
|
|
|
|
}
|
2021-03-17 21:29:39 +03:00
|
|
|
// First: setup message handling while submitting GraphQL queries.
|
|
|
|
msgs := make(chan messageEvent)
|
|
|
|
defer close(msgs)
|
|
|
|
// forward all the messages to the user content edit channel. The message will be queued after
|
|
|
|
// all the user content edits which have been completed already.
|
|
|
|
go func() {
|
|
|
|
for msg := range msgs {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
case channel <- msg:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
2021-02-27 02:42:37 +03:00
|
|
|
comment := &item.IssueComment
|
|
|
|
edits := &comment.UserContentEdits
|
|
|
|
hasEdits := true
|
|
|
|
for hasEdits {
|
|
|
|
for edit := range reverse(edits.Nodes) {
|
|
|
|
if edit.Diff == nil || string(*edit.Diff) == "" {
|
2021-03-05 22:06:21 +03:00
|
|
|
// issueEdit.Diff == nil happen if the event is older than early
|
|
|
|
// 2018, Github doesn't have the data before that. Best we can do is
|
|
|
|
// to ignore the event.
|
2021-02-27 02:42:37 +03:00
|
|
|
continue
|
|
|
|
}
|
2021-03-05 22:06:21 +03:00
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
2021-03-17 21:29:39 +03:00
|
|
|
case channel <- userContentEditData{edit}:
|
2021-03-05 22:06:21 +03:00
|
|
|
}
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
if !edits.PageInfo.HasPreviousPage {
|
|
|
|
break
|
|
|
|
}
|
2021-03-17 21:29:39 +03:00
|
|
|
edits, hasEdits = mm.queryCommentEdits(ctx, comment.Id, edits.PageInfo.EndCursor, msgs)
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) queryCommentEdits(ctx context.Context, nid githubv4.ID, cursor githubv4.String, msgs chan<- messageEvent) (*userContentEditConnection, bool) {
|
2021-03-05 22:06:21 +03:00
|
|
|
vars := newCommentEditVars()
|
|
|
|
vars["gqlNodeId"] = nid
|
2021-02-27 02:42:37 +03:00
|
|
|
if cursor == "" {
|
|
|
|
vars["commentEditBefore"] = (*githubv4.String)(nil)
|
|
|
|
} else {
|
|
|
|
vars["commentEditBefore"] = cursor
|
|
|
|
}
|
|
|
|
query := commentEditQuery{}
|
2021-03-17 21:29:39 +03:00
|
|
|
if err := mm.mQuery(ctx, &query, vars, msgs); err != nil {
|
2021-03-05 22:06:21 +03:00
|
|
|
mm.setError(err)
|
2021-02-27 02:42:37 +03:00
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
connection := &query.Node.IssueComment.UserContentEdits
|
|
|
|
if len(connection.Nodes) <= 0 {
|
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
return connection, true
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) queryTimeline(ctx context.Context, nid githubv4.ID, cursor githubv4.String, msgs chan<- messageEvent) (*timelineItemsConnection, bool) {
|
2021-03-05 22:06:21 +03:00
|
|
|
vars := newTimelineVars()
|
|
|
|
vars["gqlNodeId"] = nid
|
2021-02-27 02:42:37 +03:00
|
|
|
if cursor == "" {
|
|
|
|
vars["timelineAfter"] = (*githubv4.String)(nil)
|
|
|
|
} else {
|
|
|
|
vars["timelineAfter"] = cursor
|
|
|
|
}
|
|
|
|
query := timelineQuery{}
|
2021-03-17 21:29:39 +03:00
|
|
|
if err := mm.mQuery(ctx, &query, vars, msgs); err != nil {
|
2021-03-05 22:06:21 +03:00
|
|
|
mm.setError(err)
|
2021-02-27 02:42:37 +03:00
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
connection := &query.Node.Issue.TimelineItems
|
|
|
|
if len(connection.Nodes) <= 0 {
|
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
return connection, true
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) queryIssueEdits(ctx context.Context, nid githubv4.ID, cursor githubv4.String, msgs chan<- messageEvent) (*userContentEditConnection, bool) {
|
2021-03-05 22:06:21 +03:00
|
|
|
vars := newIssueEditVars()
|
|
|
|
vars["gqlNodeId"] = nid
|
2021-02-27 02:42:37 +03:00
|
|
|
if cursor == "" {
|
|
|
|
vars["issueEditBefore"] = (*githubv4.String)(nil)
|
|
|
|
} else {
|
|
|
|
vars["issueEditBefore"] = cursor
|
|
|
|
}
|
|
|
|
query := issueEditQuery{}
|
2021-03-17 21:29:39 +03:00
|
|
|
if err := mm.mQuery(ctx, &query, vars, msgs); err != nil {
|
2021-03-05 22:06:21 +03:00
|
|
|
mm.setError(err)
|
2021-02-27 02:42:37 +03:00
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
connection := &query.Node.Issue.UserContentEdits
|
|
|
|
if len(connection.Nodes) <= 0 {
|
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
return connection, true
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) queryIssue(ctx context.Context, cursor githubv4.String, msgs chan<- messageEvent) (*issueConnection, bool) {
|
2021-03-05 22:06:21 +03:00
|
|
|
vars := newIssueVars(mm.owner, mm.project, mm.since)
|
2021-02-27 02:42:37 +03:00
|
|
|
if cursor == "" {
|
|
|
|
vars["issueAfter"] = (*githubv4.String)(nil)
|
|
|
|
} else {
|
|
|
|
vars["issueAfter"] = githubv4.String(cursor)
|
|
|
|
}
|
|
|
|
query := issueQuery{}
|
2021-03-17 21:29:39 +03:00
|
|
|
if err := mm.mQuery(ctx, &query, vars, msgs); err != nil {
|
2021-03-05 22:06:21 +03:00
|
|
|
mm.setError(err)
|
2021-02-27 02:42:37 +03:00
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
connection := &query.Repository.Issues
|
|
|
|
if len(connection.Nodes) <= 0 {
|
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
return connection, true
|
|
|
|
}
|
|
|
|
|
|
|
|
func reverse(eds []userContentEdit) chan userContentEdit {
|
|
|
|
ret := make(chan userContentEdit)
|
|
|
|
go func() {
|
|
|
|
for i := range eds {
|
|
|
|
ret <- eds[len(eds)-1-i]
|
|
|
|
}
|
|
|
|
close(ret)
|
|
|
|
}()
|
|
|
|
return ret
|
|
|
|
}
|
|
|
|
|
|
|
|
type rateLimiter interface {
|
|
|
|
rateLimit() rateLimit
|
|
|
|
}
|
|
|
|
|
2021-03-05 22:06:21 +03:00
|
|
|
// mQuery executes a single GraphQL query. The variable query is used to derive the GraphQL query
|
|
|
|
// and it is used to populate the response into it. It should be a pointer to a struct that
|
|
|
|
// corresponds to the Github graphql schema and it has to implement the rateLimiter interface. If
|
|
|
|
// there is a Github rate limiting error, then the function sleeps and retries after the rate limit
|
2021-03-09 17:31:58 +03:00
|
|
|
// is expired. If there is another error, then the method will retry before giving up.
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) mQuery(ctx context.Context, query rateLimiter, vars map[string]interface{}, msgs chan<- messageEvent) error {
|
|
|
|
if err := mm.queryOnce(ctx, query, vars, msgs); err == nil {
|
2021-03-09 17:31:58 +03:00
|
|
|
// success: done
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
// failure: we will retry
|
2021-03-17 21:29:39 +03:00
|
|
|
// To retry is important for importing projects with a big number of issues.
|
2021-03-09 17:31:58 +03:00
|
|
|
retries := 3
|
|
|
|
var err error
|
|
|
|
for i := 0; i < retries; i++ {
|
|
|
|
// wait a few seconds before retry
|
|
|
|
sleepTime := 8 * (i + 1)
|
|
|
|
time.Sleep(time.Duration(sleepTime) * time.Second)
|
2021-03-17 21:29:39 +03:00
|
|
|
err = mm.queryOnce(ctx, query, vars, msgs)
|
2021-03-09 17:31:58 +03:00
|
|
|
if err == nil {
|
|
|
|
// success: done
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2021-03-17 21:29:39 +03:00
|
|
|
func (mm *importMediator) queryOnce(ctx context.Context, query rateLimiter, vars map[string]interface{}, msgs chan<- messageEvent) error {
|
2021-03-05 22:06:21 +03:00
|
|
|
// first: just send the query to the graphql api
|
|
|
|
vars["dryRun"] = githubv4.Boolean(false)
|
2021-02-27 02:42:37 +03:00
|
|
|
qctx, cancel := context.WithTimeout(ctx, defaultTimeout)
|
|
|
|
defer cancel()
|
2021-03-05 22:06:21 +03:00
|
|
|
err := mm.gc.Query(qctx, query, vars)
|
|
|
|
if err == nil {
|
|
|
|
// no error: done
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
// matching the error string
|
|
|
|
if !strings.Contains(err.Error(), "API rate limit exceeded") {
|
|
|
|
// an error, but not the API rate limit error: done
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
// a rate limit error
|
|
|
|
// ask the graphql api for rate limiting information
|
|
|
|
vars["dryRun"] = githubv4.Boolean(true)
|
|
|
|
qctx, cancel = context.WithTimeout(ctx, defaultTimeout)
|
|
|
|
defer cancel()
|
2021-02-27 02:42:37 +03:00
|
|
|
if err := mm.gc.Query(qctx, query, vars); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
rateLimit := query.rateLimit()
|
|
|
|
if rateLimit.Cost > rateLimit.Remaining {
|
2021-03-05 22:06:21 +03:00
|
|
|
// sleep
|
2021-02-27 02:42:37 +03:00
|
|
|
resetTime := rateLimit.ResetAt.Time
|
|
|
|
// Add a few seconds (8) for good measure
|
2021-03-05 22:06:21 +03:00
|
|
|
resetTime = resetTime.Add(8 * time.Second)
|
2021-03-17 21:29:39 +03:00
|
|
|
msg := fmt.Sprintf("Github GraphQL API rate limit exhausted. Sleeping until %s", resetTime.String())
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return ctx.Err()
|
|
|
|
case msgs <- messageEvent{msg}:
|
|
|
|
}
|
2021-03-05 22:06:21 +03:00
|
|
|
timer := time.NewTimer(time.Until(resetTime))
|
2021-02-27 02:42:37 +03:00
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
stop(timer)
|
|
|
|
return ctx.Err()
|
|
|
|
case <-timer.C:
|
|
|
|
}
|
|
|
|
}
|
2021-03-05 22:06:21 +03:00
|
|
|
// run the original query again
|
2021-02-27 02:42:37 +03:00
|
|
|
vars["dryRun"] = githubv4.Boolean(false)
|
|
|
|
qctx, cancel = context.WithTimeout(ctx, defaultTimeout)
|
|
|
|
defer cancel()
|
2021-03-05 22:06:21 +03:00
|
|
|
err = mm.gc.Query(qctx, query, vars)
|
|
|
|
return err // might be nil
|
2021-02-27 02:42:37 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
func stop(t *time.Timer) {
|
|
|
|
if !t.Stop() {
|
|
|
|
select {
|
|
|
|
case <-t.C:
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|