Skip to content

Commit 2e5a251

Browse files
rremer (Royce Remer) authored and Royce Remer committed
Make LFS http_client parallel within a batch.
Signed-off-by: Royce Remer <[email protected]>
1 parent 0690cb0 commit 2e5a251

File tree

4 files changed: +79 -67 lines changed

Diff for: go.mod

+1-1
Original file line numberDiff line numberDiff line change
@@ -124,6 +124,7 @@ require (
124124
golang.org/x/image v0.21.0
125125
golang.org/x/net v0.30.0
126126
golang.org/x/oauth2 v0.23.0
127+
golang.org/x/sync v0.8.0
127128
golang.org/x/sys v0.26.0
128129
golang.org/x/text v0.19.0
129130
golang.org/x/tools v0.26.0
@@ -316,7 +317,6 @@ require (
316317
go.uber.org/zap v1.27.0 // indirect
317318
golang.org/x/exp v0.0.0-20241009180824-f66d83c29e7c // indirect
318319
golang.org/x/mod v0.21.0 // indirect
319-
golang.org/x/sync v0.8.0 // indirect
320320
golang.org/x/time v0.7.0 // indirect
321321
google.golang.org/genproto/googleapis/rpc v0.0.0-20241021214115-324edc3d5d38 // indirect
322322
gopkg.in/alexcesaro/quotedprintable.v3 v3.0.0-20150716171945-2caba252f4dc // indirect

Diff for: modules/lfs/http_client.go

+73-51
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,8 @@ import (
1717
"code.gitea.io/gitea/modules/log"
1818
"code.gitea.io/gitea/modules/proxy"
1919
"code.gitea.io/gitea/modules/setting"
20+
21+
"golang.org/x/sync/errgroup"
2022
)
2123

2224
// HTTPClient is used to communicate with the LFS server
@@ -113,6 +115,7 @@ func (c *HTTPClient) Upload(ctx context.Context, objects []Pointer, callback Upl
113115
return c.performOperation(ctx, objects, nil, callback)
114116
}
115117

118+
// performOperation takes a slice of LFS object pointers, batches them, and performs the upload/download operations concurrently in each batch
116119
func (c *HTTPClient) performOperation(ctx context.Context, objects []Pointer, dc DownloadCallback, uc UploadCallback) error {
117120
if len(objects) == 0 {
118121
return nil
@@ -133,71 +136,90 @@ func (c *HTTPClient) performOperation(ctx context.Context, objects []Pointer, dc
133136
return fmt.Errorf("TransferAdapter not found: %s", result.Transfer)
134137
}
135138

139+
errGroup, groupCtx := errgroup.WithContext(ctx)
136140
for _, object := range result.Objects {
137-
if object.Error != nil {
138-
log.Trace("Error on object %v: %v", object.Pointer, object.Error)
139-
if uc != nil {
140-
if _, err := uc(object.Pointer, object.Error); err != nil {
141-
return err
142-
}
143-
} else {
144-
if err := dc(object.Pointer, nil, object.Error); err != nil {
145-
return err
146-
}
147-
}
148-
continue
149-
}
150-
151-
if uc != nil {
152-
if len(object.Actions) == 0 {
153-
log.Trace("%v already present on server", object.Pointer)
154-
continue
155-
}
141+
errGroup.Go(func() error {
142+
err := performSingleOperation(groupCtx, object, dc, uc, transferAdapter)
143+
return err
144+
})
145+
}
156146

157-
link, ok := object.Actions["upload"]
158-
if !ok {
159-
log.Debug("%+v", object)
160-
return errors.New("missing action 'upload'")
161-
}
147+
// Wait blocks until every goroutine in the group has finished and returns only the first non-nil error, matching the pre-concurrency behavior of returning on the first failure
148+
return errGroup.Wait()
149+
}
162150

163-
content, err := uc(object.Pointer, nil)
164-
if err != nil {
165-
return err
166-
}
151+
// performSingleOperation performs an LFS upload or download operation on a single object
152+
func performSingleOperation(ctx context.Context, object *ObjectResponse, dc DownloadCallback, uc UploadCallback, transferAdapter TransferAdapter) error {
153+
// the response from an lfs batch api request for this specific object id contained an error
154+
if object.Error != nil {
155+
log.Trace("Error on object %v: %v", object.Pointer, object.Error)
167156

168-
err = transferAdapter.Upload(ctx, link, object.Pointer, content)
169-
if err != nil {
157+
// an upload callback was supplied, so this object belongs to an 'upload' request: report the per-object error to that callback
158+
if uc != nil {
159+
if _, err := uc(object.Pointer, object.Error); err != nil {
170160
return err
171161
}
172-
173-
link, ok = object.Actions["verify"]
174-
if ok {
175-
if err := transferAdapter.Verify(ctx, link, object.Pointer); err != nil {
176-
return err
177-
}
178-
}
179162
} else {
180-
link, ok := object.Actions["download"]
181-
if !ok {
182-
// no actions block in response, try legacy response schema
183-
link, ok = object.Links["download"]
184-
}
185-
if !ok {
186-
log.Debug("%+v", object)
187-
return errors.New("missing action 'download'")
163+
// no upload callback was supplied, so this object belongs to a 'download' request: report the per-object error to the download callback
164+
err := dc(object.Pointer, nil, object.Error)
165+
if errors.Is(object.Error, ErrObjectNotExist) {
166+
log.Warn("Ignoring missing upstream LFS object %-v: %v", object.Pointer, err)
167+
return nil
188168
}
189169

190-
content, err := transferAdapter.Download(ctx, link)
191-
if err != nil {
192-
return err
193-
}
170+
// any other per-object error on a 'download' request (i.e. not a missing object) is propagated as whatever the download callback returned
171+
return err
172+
}
173+
}
194174

195-
if err := dc(object.Pointer, content, nil); err != nil {
175+
// the response from an lfs batch api request contained necessary upload/download fields to act upon
176+
if uc != nil {
177+
if len(object.Actions) == 0 {
178+
log.Trace("%v already present on server", object.Pointer)
179+
return nil
180+
}
181+
182+
link, ok := object.Actions["upload"]
183+
if !ok {
184+
return errors.New("missing action 'upload'")
185+
}
186+
187+
content, err := uc(object.Pointer, nil)
188+
if err != nil {
189+
return err
190+
}
191+
192+
err = transferAdapter.Upload(ctx, link, object.Pointer, content)
193+
if err != nil {
194+
return err
195+
}
196+
197+
link, ok = object.Actions["verify"]
198+
if ok {
199+
if err := transferAdapter.Verify(ctx, link, object.Pointer); err != nil {
196200
return err
197201
}
198202
}
199-
}
203+
} else {
204+
link, ok := object.Actions["download"]
205+
if !ok {
206+
// no actions block in response, try legacy response schema
207+
link, ok = object.Links["download"]
208+
}
209+
if !ok {
210+
log.Debug("%+v", object)
211+
return errors.New("missing action 'download'")
212+
}
200213

214+
content, err := transferAdapter.Download(ctx, link)
215+
if err != nil {
216+
return err
217+
}
218+
219+
if err := dc(object.Pointer, content, nil); err != nil {
220+
return err
221+
}
222+
}
201223
return nil
202224
}
203225

Diff for: modules/lfs/http_client_test.go

+5-10
Original file line numberDiff line numberDiff line change
@@ -211,36 +211,31 @@ func TestHTTPClientDownload(t *testing.T) {
211211
expectederror: "TransferAdapter not found: ",
212212
},
213213
// case 5
214-
{
215-
endpoint: "https://error-in-response-objects.io",
216-
expectederror: "Object not found",
217-
},
218-
// case 6
219214
{
220215
endpoint: "https://empty-actions-map.io",
221216
expectederror: "missing action 'download'",
222217
},
223-
// case 7
218+
// case 6
224219
{
225220
endpoint: "https://download-actions-map.io",
226221
expectederror: "",
227222
},
228-
// case 8
223+
// case 7
229224
{
230225
endpoint: "https://upload-actions-map.io",
231226
expectederror: "missing action 'download'",
232227
},
233-
// case 9
228+
// case 8
234229
{
235230
endpoint: "https://verify-actions-map.io",
236231
expectederror: "missing action 'download'",
237232
},
238-
// case 10
233+
// case 9
239234
{
240235
endpoint: "https://unknown-actions-map.io",
241236
expectederror: "missing action 'download'",
242237
},
243-
// case 11
238+
// case 10
244239
{
245240
endpoint: "https://legacy-batch-request-download.io",
246241
expectederror: "",

Diff for: modules/repository/repo.go

-5
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,6 @@ package repository
55

66
import (
77
"context"
8-
"errors"
98
"fmt"
109
"io"
1110
"strings"
@@ -182,10 +181,6 @@ func StoreMissingLfsObjectsInRepository(ctx context.Context, repo *repo_model.Re
182181
downloadObjects := func(pointers []lfs.Pointer) error {
183182
err := lfsClient.Download(ctx, pointers, func(p lfs.Pointer, content io.ReadCloser, objectError error) error {
184183
if objectError != nil {
185-
if errors.Is(objectError, lfs.ErrObjectNotExist) {
186-
log.Warn("Repo[%-v]: Ignore missing LFS object %-v: %v", repo, p, objectError)
187-
return nil
188-
}
189184
return objectError
190185
}
191186

0 commit comments

Comments
 (0)