-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathreader.go
More file actions
294 lines (261 loc) · 6.77 KB
/
reader.go
File metadata and controls
294 lines (261 loc) · 6.77 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
package httpreader
import (
"errors"
"fmt"
"io"
"net/http"
"net/url"
"strconv"
"strings"
"sync"
)
// InvalidStatusCodeError is returned when a ranged HTTP request does not return
// the expected status code.
type InvalidStatusCodeError struct {
StatusCode int // StatusCode is the status code returned by the server.
Expected int // Expected is the status code that was required instead.
}
// Error implements the error interface. The message reports the status code
// that was received, followed by the one that was expected.
func (e *InvalidStatusCodeError) Error() string {
	got, want := e.StatusCode, e.Expected
	return fmt.Sprintf("invalid HTTP status code: %d (expected: %d)", got, want)
}
// InvalidHeaderError is returned when a required HTTP header is missing,
// malformed, or has an unexpected value.
type InvalidHeaderError struct {
// Name is the name of the offending header.
Name string
// Reason describes what was wrong with the header.
Reason string
}
// Error implements the error interface. The message contains the quoted
// header name followed by the reason the header was rejected.
func (e *InvalidHeaderError) Error() string {
	name, reason := e.Name, e.Reason
	return fmt.Sprintf("invalid header %q: %s", name, reason)
}
// HTTPRangeReader groups the io.Seeker, io.Reader and io.ReaderAt interfaces.
type HTTPRangeReader interface {
io.Seeker
io.Reader
io.ReaderAt
}
// Compile-time check that *Reader implements HTTPRangeReader.
var _ HTTPRangeReader = (*Reader)(nil)
// Reader implements HTTPRangeReader for an HTTP resource using
// range requests.
//
// Read and Seek share one response body (mainResp) and do not take mu.
// ReadAt uses a separate response body (tempResp) and holds mu for the
// duration of each call.
type Reader struct {
// resourceURL is the URL every range request is issued against.
resourceURL *url.URL
// resourceSize is the reported size of the resource. It is determined by
// the value of the `Content-Range` header returned by the server.
resourceSize int64
// discardWnd is the forward distance, in bytes, that Seek and ReadAt are
// willing to cover by discarding data from an already open response body
// instead of issuing a new request.
discardWnd int
// The headers returned by the server during reader init.
initHeader http.Header
// Primary connection used by Read() and Seek()
mainResp *http.Response
// mainOffset is the absolute offset of the next byte Read will return.
mainOffset int64
// Temporary connection used by ReadAt() to adhere to the interface description.
// - Clients of ReadAt can execute parallel ReadAt calls on the same
// input source
// - If ReadAt is reading from an input source with a seek offset, ReadAt
// should not affect nor be affected by the underlying seek offset
tempResp *http.Response
// tempOffset is the absolute offset of the next byte in tempResp's body.
tempOffset int64
// httpClient performs every request issued by the reader.
httpClient *http.Client
// httpHeader is handed to newRangeRequest for every request.
httpHeader http.Header
// mu is held by ReadAt while it uses tempResp and tempOffset.
mu sync.Mutex
}
// ResourceSize returns the size of the resource as recorded in the reader's
// resourceSize field.
func (r *Reader) ResourceSize() int64 {
	return r.resourceSize
}
// ResourceURL returns a pointer to a copy of the reader's URL, so assigning
// to fields of the result does not change the URL the reader itself uses.
func (r *Reader) ResourceURL() *url.URL {
	clone := new(url.URL)
	*clone = *r.resourceURL
	return clone
}
// InitHeader returns the reader's initHeader field as-is; no copy is made.
func (r *Reader) InitHeader() http.Header {
	return r.initHeader
}
// Seek sets the offset for the next Read to `offset`, interpreted according
// to `whence` (io.SeekStart, io.SeekCurrent or io.SeekEnd), and returns the
// new absolute offset.
//
// Any resulting offset in [0, resource size] is accepted. Seeking exactly to
// the end is valid, so Seek(0, io.SeekEnd) reports the resource size; the
// next Read then returns io.EOF. An unknown whence, a negative offset, or an
// offset past the end returns an error without touching the reader's state.
//
// If the requested offset is ahead of the current one by no more than the
// configured discard window, Seek will discard data from the response body
// to reach the new offset. This is done to avoid initiating another HTTP
// request. Any other move issues a new range request.
func (r *Reader) Seek(offset int64, whence int) (int64, error) {
	switch whence {
	case io.SeekStart:
		// offset is already absolute.
	case io.SeekCurrent:
		offset += r.mainOffset
	case io.SeekEnd:
		offset += r.resourceSize
	default:
		return 0, errors.New("seek: invalid whence")
	}
	if offset > r.resourceSize {
		return 0, errors.New("seek beyond end of resource")
	}
	if offset < 0 {
		return 0, errors.New("seek before beginning of resource")
	}

	if offset == r.resourceSize {
		// A range request that starts at the end of the resource cannot be
		// satisfied, so just park at the end without a connection. Read
		// reports io.EOF for this offset before it looks at mainResp.
		if r.mainResp != nil {
			r.mainResp.Body.Close()
			r.mainResp = nil
		}
		r.mainOffset = offset
		return offset, nil
	}

	distance := offset - r.mainOffset
	if distance >= 0 && distance <= int64(r.discardWnd) {
		// Forward seek within the discard window. Reading through r keeps
		// mainOffset in step with the body. io.CopyN returns a nil error
		// only when exactly `distance` bytes were copied.
		if _, err := io.CopyN(io.Discard, r, distance); err != nil {
			return 0, err
		}
		return offset, nil
	}

	// Backward seek OR forward seek beyond the discard window. On success
	// request records the new offset in mainOffset.
	if err := r.request(offset); err != nil {
		return 0, err
	}
	return offset, nil
}
// Read implements io.Reader on the main connection.
//
// It returns io.EOF without touching the connection once the current offset
// has reached the resource size. If no response is open yet, one is
// requested at the current offset first. Bytes read advance the offset; the
// count and error from the response body are returned unchanged.
func (r *Reader) Read(p []byte) (int, error) {
	if r.mainOffset >= r.resourceSize {
		return 0, io.EOF
	}

	// Lazily open the main connection at the current position.
	if r.mainResp == nil {
		if err := r.request(r.mainOffset); err != nil {
			return 0, err
		}
	}

	body := r.mainResp.Body
	count, err := body.Read(p)
	r.mainOffset += int64(count)
	return count, err
}
// ReadAt implements io.ReaderAt using a connection that is separate from the
// one used by Read and Seek, so it neither affects nor is affected by the
// seek offset. Calls are serialized by r.mu.
//
// As io.ReaderAt requires, ReadAt keeps reading until p is full or an error
// occurs, and returns a non-nil error whenever n < len(p). It returns io.EOF
// when the read reaches the end of the resource, io.ErrUnexpectedEOF when
// the response body ends before that, and an error for a negative offset.
//
// The existing connection is reused when offset lies at or ahead of its
// position by less than the discard window; the gap is skipped by discarding
// data. Otherwise a new range request starting at offset is issued. A
// connection that failed or was read to its end is dropped so the next call
// starts with a fresh request.
func (r *Reader) ReadAt(p []byte, offset int64) (int, error) {
	if offset < 0 {
		return 0, errors.New("read at negative offset")
	}
	if len(p) == 0 {
		return 0, nil
	}
	if offset >= r.resourceSize {
		// Nothing to read; a request here could not be satisfied anyway.
		return 0, io.EOF
	}

	r.mu.Lock()
	defer r.mu.Unlock()

	// If there is no open body, the new offset is behind the current offset,
	// or the new offset is too far ahead of it, start over with a new request.
	if r.tempResp == nil ||
		offset < r.tempOffset ||
		offset >= r.tempOffset+int64(r.discardWnd) {
		if err := r.openTempResp(offset); err != nil {
			return 0, err
		}
	}

	// fail drops the connection (its position can no longer be trusted or it
	// is exhausted) and normalizes end-of-body errors.
	fail := func(err error) error {
		r.tempResp.Body.Close()
		r.tempResp = nil
		if errors.Is(err, io.EOF) || errors.Is(err, io.ErrUnexpectedEOF) {
			if r.tempOffset >= r.resourceSize {
				return io.EOF
			}
			return io.ErrUnexpectedEOF
		}
		return err
	}

	if skip := offset - r.tempOffset; skip > 0 {
		// tempOffset is within the discard window of offset: skip forward.
		discarded, err := io.CopyN(io.Discard, r.tempResp.Body, skip)
		r.tempOffset += discarded
		if err != nil {
			return 0, fail(err)
		}
	}

	n, err := io.ReadFull(r.tempResp.Body, p)
	r.tempOffset += int64(n)
	if err != nil {
		err = fail(err)
	}
	return n, err
}

// openTempResp replaces ReadAt's connection with a validated range response
// that starts at offset. The caller must hold r.mu.
func (r *Reader) openTempResp(offset int64) error {
	if r.tempResp != nil {
		// Forget the old response so a failure below cannot leave a closed
		// body behind for the next call.
		r.tempResp.Body.Close()
		r.tempResp = nil
	}
	req, err := newRangeRequest(
		r.resourceURL,
		r.httpHeader,
		&httpRange{start: offset, end: -1},
	)
	if err != nil {
		return err
	}
	res, err := r.httpClient.Do(req)
	if err != nil {
		return err
	}
	// Same validation the main connection gets: without it the body of an
	// error or full-content response would be returned as range data.
	if err := isRangeResponse(res); err != nil {
		res.Body.Close()
		return err
	}
	r.tempResp = res
	r.tempOffset = offset
	return nil
}
// request replaces the main connection with a new range request that starts
// at offset and runs to the end of the resource.
//
// Any currently open response is closed and forgotten first. On success the
// validated response becomes mainResp and mainOffset is set to offset. On
// failure mainOffset is left unchanged and mainResp stays nil, so a later
// Read opens a fresh connection instead of reading from a closed body.
func (r *Reader) request(offset int64) error {
	if r.mainResp != nil {
		r.mainResp.Body.Close()
		r.mainResp = nil
	}

	req, err := newRangeRequest(
		r.resourceURL,
		r.httpHeader,
		&httpRange{start: offset, end: -1},
	)
	if err != nil {
		return err
	}

	res, err := r.httpClient.Do(req)
	if err != nil {
		return err
	}
	if err := isRangeResponse(res); err != nil {
		res.Body.Close()
		return err
	}

	r.mainOffset = offset
	r.mainResp = res
	return nil
}
// init probes the resource with a range request for bytes 0-511 to determine
// whether the server supports range requests and how large the resource is.
//
// The response must pass isRangeResponse and carry a `Content-Range` header
// of the form "<range>/<size>" with a non-negative integer size; otherwise an
// error (*InvalidHeaderError for header problems) is returned. On success
// the size is stored in resourceSize and the response headers in initHeader.
func (r *Reader) init() error {
	req, err := newRangeRequest(
		r.resourceURL,
		r.httpHeader,
		&httpRange{start: 0, end: 511},
	)
	if err != nil {
		return err
	}

	res, err := r.httpClient.Do(req)
	if err != nil {
		return err
	}
	// Only the status line and headers are inspected.
	res.Body.Close()

	if err := isRangeResponse(res); err != nil {
		return err
	}

	value := res.Header.Get("Content-Range")
	parts := strings.Split(value, "/")
	if len(parts) != 2 {
		return &InvalidHeaderError{
			Name:   "Content-Range",
			Reason: fmt.Sprintf("failed to parse value: %q", value),
		}
	}

	size, err := strconv.ParseInt(parts[1], 10, 64)
	if err != nil {
		// This also covers "*", which servers send when the size is unknown.
		return &InvalidHeaderError{
			Name:   "Content-Range",
			Reason: fmt.Sprintf("failed to parse resource size: %v", err),
		}
	}
	if size < 0 {
		return &InvalidHeaderError{
			Name:   "Content-Range",
			Reason: fmt.Sprintf("negative resource size: %d", size),
		}
	}

	r.resourceSize = size
	// Keep the probe's headers so InitHeader has something to return.
	r.initHeader = res.Header
	return nil
}
// isRangeResponse reports whether res is an acceptable answer to a range
// request. It returns nil when the status is 206 Partial Content and the
// `Accept-Ranges` header equals "bytes"; otherwise it returns an
// *InvalidStatusCodeError or an *InvalidHeaderError, checked in that order.
// The header error message includes res.Request.URL.Host.
func isRangeResponse(res *http.Response) error {
	if got := res.StatusCode; got != http.StatusPartialContent {
		return &InvalidStatusCodeError{
			StatusCode: got,
			Expected:   http.StatusPartialContent,
		}
	}

	acceptRanges := res.Header.Get("Accept-Ranges")
	if acceptRanges == "bytes" {
		return nil
	}

	reason := fmt.Sprintf(
		"server (%s) returned unexpected value: %q (expected: `bytes`)",
		res.Request.URL.Host,
		acceptRanges,
	)
	return &InvalidHeaderError{Name: "Accept-Ranges", Reason: reason}
}
// defaultHTTPClient is the client NewReader assigns to a Reader before any
// options are applied. Its transport only configures proxy selection from
// the environment (http.ProxyFromEnvironment).
// NOTE(review): no timeout is set on the client or on the transport here —
// confirm that this is intentional.
var defaultHTTPClient = &http.Client{
Transport: &http.Transport{
Proxy: http.ProxyFromEnvironment,
},
}
// NewReader creates a Reader for the resource at u.
//
// The reader starts with defaultHTTPClient and a discard window of 512 KiB;
// options are then applied in order and may override these. Finally the
// reader is initialized via init.
//
// A non-nil *Reader is returned only on success. If u is nil, an option
// fails, or init fails, NewReader returns nil and the error.
func NewReader(u *url.URL, options ...Option) (*Reader, error) {
	if u == nil {
		return nil, errors.New("resource URL must not be nil")
	}

	reader := &Reader{
		resourceURL: u,
		httpClient:  defaultHTTPClient,
		discardWnd:  1024 * 512,
	}
	for _, option := range options {
		if err := option(reader); err != nil {
			return nil, err
		}
	}

	// Do not hand out a reader whose initialization failed.
	if err := reader.init(); err != nil {
		return nil, err
	}
	return reader, nil
}