forked from depot/depot.ai
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathregistry.ts
414 lines (343 loc) · 13.9 KB
/
registry.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
import type {HonoRequest} from 'hono'
import {Hono} from 'hono'
import PQueue from 'p-queue'
import {PostHog} from 'posthog-node'
import {z} from 'zod'
// Types **********************************************************************
interface Env {
Bindings: {
storage: R2Bucket
REGISTRY_TOKEN: string
UPSTREAM_REGISTRY: string
POSTHOG_API_KEY: string
}
}
// Routes *********************************************************************
const app = new Hono<Env>()
app.use('*', async (c, next) => {
c.executionCtx.passThroughOnException()
await next()
})
app.use('*', async (c, next) => {
console.log('START', c.req.method, c.req.url)
await next()
console.log('END', c.req.method, c.req.url, c.res.status)
})
app.get('/', ({text}) => text('🔮'))
app.get('/v2/', ({text}) => text('🔮'))
app.get('/v2/:name{.*}/manifests/:reference', async ({req, env, executionCtx}) => {
const name = req.param('name')
const reference = req.param('reference')
const tag = parseTag(reference)
const digest = tag ? await resolveTagToDigest(env, name, tag) : parseDigest(reference)
if (!digest) return json({errors: [{code: 'MANIFEST_UNKNOWN'}]}, {status: 404})
const key = `${name}/manifests/${digest.digest}`
const headers = new Headers({
'Docker-Content-Digest': digest.digest,
'Docker-Distribution-Api-Version': 'registry/2.0',
})
if (tag && env.POSTHOG_API_KEY) {
executionCtx.waitUntil(
(async () => {
const ip = req.headers.get('cf-connecting-ip')
const posthog = getPostHog(env)
posthog.capture({
distinctId: ip ?? 'anonymous',
event: 'depot.ai: pull image',
properties: {reference: `${name}:${tag}`, name, tag, digest: digest.digest, $ip: ip, $geoip_disable: false},
})
await posthog.flushAsync()
})(),
)
}
return pullThroughRegistry(
req,
() => getObject(req, env, key, headers),
() => importManifest(env, name, digest),
)
})
app.get('/v2/:name{.*}/blobs/:digest', async ({req, env}) => {
const name = req.param('name')
const digest = parseDigest(req.param('digest'))
if (!digest) return json({errors: [{code: 'BLOB_UNKNOWN'}]}, {status: 404})
const key = `${name}/blobs/${digest.digest}`
const headers = new Headers({
'Docker-Content-Digest': digest.digest,
'Docker-Distribution-Api-Version': 'registry/2.0',
})
return pullThroughRegistry(
req,
() => getObject(req, env, key, headers),
() => importBlob(env, name, digest),
)
})
app.post('/v2/:name{.*}/manifests/:reference/_import', async ({req, env}) => {
const url = new URL(req.url)
const name = req.param('name')
const reference = req.param('reference')
const tag = parseTag(reference)
if (!tag) return json({errors: [{code: 'MANIFEST_INVALID'}]}, {status: 400})
const res = await fetchFromRegistry(env, `https://registry/v2/${name}/manifests/${tag}`)
if (!res.ok) return res
const digest = parseDigest(res.headers.get('Docker-Content-Digest') ?? '')
if (!digest) return json({errors: [{code: 'MANIFEST_INVALID'}]}, {status: 400})
if (url.searchParams.has('full') || !(await env.storage.head(`${name}/manifests/${digest.digest}`))) {
await importAll(env, name, digest)
}
await env.storage.put(`${name}/tags/${tag}`, digest.digest)
return json({ok: true, name, digest: digest.digest})
})
app.notFound(({json}) => json({errors: [{code: 'NOT_FOUND', message: 'not found'}]}, 404))
app.onError((err, {json}) => {
console.log(err)
return json({errors: [{code: 'INTERNAL_ERROR', message: err.message}]}, 500)
})
export default app
// Utils **********************************************************************
function response(bodyInit?: BodyInit | null | undefined, init: ResponseInit = {}): Response {
const headers = new Headers(init.headers || {})
headers.set('Docker-Distribution-API-Version', 'registry/2.0')
init.headers = headers
return new Response(bodyInit, init)
}
function emptyResponse(responseInit?: ResponseInit): Response {
return response(null, responseInit)
}
function json(data: any, responseInit: ResponseInit = {}): Response {
const headers = new Headers(responseInit.headers ?? {})
headers.set('Content-Type', 'application/json')
responseInit.headers = headers
return response(JSON.stringify(data), responseInit)
}
let upstreamURL: URL | undefined
async function pullThroughRegistry(
req: HonoRequest<any>,
fromR2: () => Promise<Response | null>,
fromRegistry: () => Promise<Response>,
) {
if (req.method === 'HEAD') {
let object = await fromR2()
if (!object) {
const res = await fromRegistry()
if (!res.ok) return res
object = await fromR2()
}
if (!object) return json({errors: [{code: 'BLOB_UNKNOWN'}]}, {status: 404})
return object
}
const object = await fromR2()
if (!object) return fromRegistry()
return object
}
async function importManifest(env: Env['Bindings'], name: string, digest: Digest) {
const res = await fetchFromRegistry(env, `https://registry/v2/${name}/manifests/${digest.digest}`)
if (!res.ok || !res.body) return res
await env.storage.put(`${name}/manifests/${digest.digest}`, res.body, {
sha256: digest.hash,
httpMetadata: {
contentEncoding: res.headers.get('content-encoding') ?? undefined,
contentType: res.headers.get('content-type') ?? undefined,
},
})
const obj = await env.storage.get(`${name}/manifests/${digest.digest}`)
if (!obj) return new Response(null, {status: 404})
return new Response(obj.body, res)
}
async function importBlob(env: Env['Bindings'], name: string, digest: Digest) {
const res = await fetchFromRegistry(env, `https://registry/v2/${name}/blobs/${digest.digest}`)
if (!res.ok || !res.body) return res
const key = `${name}/blobs/${digest.digest}`
const options: R2PutOptions = {
sha256: digest.hash,
httpMetadata: {
contentEncoding: res.headers.get('content-encoding') ?? undefined,
contentType: res.headers.get('content-type') ?? undefined,
},
}
const contentLength = Number(res.headers.get('content-length') ?? 0)
const partSize = 1024 * 1024 * 750 // 500MB
const numberOfParts = Math.ceil(contentLength / partSize)
if (contentLength > partSize) {
const upload = await env.storage.createMultipartUpload(key, options)
console.log(`importing blob ${digest.digest} in ${numberOfParts} parts (ID ${upload.uploadId})`)
try {
const parts: R2UploadedPart[] = new Array(numberOfParts)
const queue = new PQueue({concurrency: 4})
for (let i = 0; i < numberOfParts; i++) {
const idx = i
await queue.add(async () => {
const range = `bytes=${idx * partSize}-${Math.min(contentLength - 1, (idx + 1) * partSize - 1)}`
console.log(`importing blob ${digest.digest} part ${idx + 1} (${range})`)
const res = await fetchFromRegistry(env, `https://registry/v2/${name}/blobs/${digest.digest}`, {
headers: {Range: range},
})
if (!res.ok || !res.body) {
throw new Error(`failed to fetch blob for part ${idx}: ${res.status} ${res.statusText}`)
}
parts[idx] = await upload.uploadPart(idx + 1, res.body)
console.log(`imported blob ${digest.digest} part ${idx + 1} ${res.headers.get('content-length')}`)
})
}
await queue.onEmpty()
await upload.complete(parts)
} catch (err) {
await upload.abort()
throw err
}
} else {
console.log(`importing blob ${digest.digest}`)
await env.storage.put(key, res.body, options)
}
const obj = await env.storage.get(key)
if (!obj) return new Response(null, {status: 404})
return new Response(obj.body, res)
}
async function importAll(env: Env['Bindings'], name: string, digest: Digest) {
const res = await importManifest(env, name, digest)
if (!res.ok) throw new Error(`failed to fetch manifest: ${res.status} ${res.statusText}`)
const content: Manifest = await res.json()
if (!content.mediaType) throw new Error('missing mediaType')
console.log(`importing ${name}@${digest.digest} (${content.mediaType})`)
switch (content.mediaType) {
case 'application/vnd.docker.distribution.manifest.list.v2+json':
case 'application/vnd.oci.image.index.v1+json': {
for (const descriptor of content.manifests) {
const digest = parseDigest(descriptor.digest)
if (!digest) throw new Error(`invalid manifest digest: ${descriptor.digest}`)
await importAll(env, name, digest)
}
return
}
case 'application/vnd.docker.distribution.manifest.v2+json':
case 'application/vnd.oci.image.manifest.v1+json': {
const digest = parseDigest(content.config.digest)
if (!digest) throw new Error(`invalid config digest: ${content.config.digest}`)
if (await env.storage.head(`${name}/blobs/${digest.digest}`)) {
console.log(`already imported ${name}@${digest.digest} (${content.config.mediaType})`)
} else {
console.log(`importing ${name}@${digest.digest} (${content.config.mediaType})`)
await importBlob(env, name, digest)
}
for (const layer of content.layers) {
const digest = parseDigest(layer.digest)
if (!digest) throw new Error(`invalid layer digest: ${layer.digest}`)
if (await env.storage.head(`${name}/blobs/${digest.digest}`)) {
console.log(`already imported ${name}@${digest.digest} (${layer.mediaType}, ${layer.size} bytes)`)
} else {
console.log(`importing ${name}@${digest.digest} (${layer.mediaType}, ${layer.size} bytes)`)
await importBlob(env, name, digest)
}
}
return
}
default:
throw new Error(`unknown content: ${JSON.stringify(content)}`)
}
}
async function resolveTagToDigest(env: Env['Bindings'], name: string, tag: string) {
const obj = await env.storage.get(`${name}/tags/${tag}`)
if (obj) return parseDigest(await obj.text())
const res = await fetchFromRegistry(env, `https://registry/v2/${name}/manifests/${tag}`)
if (!res.ok) return null
const digest = res.headers.get('Docker-Content-Digest')
if (!digest) return null
await env.storage.put(`${name}/tags/${tag}`, digest)
return parseDigest(digest)
}
async function fetchFromRegistry(env: Env['Bindings'], url: string, init: RequestInit = {}) {
upstreamURL = upstreamURL ?? new URL(env.UPSTREAM_REGISTRY)
const registryURL = new URL(url)
registryURL.protocol = upstreamURL.protocol
registryURL.hostname = upstreamURL.hostname
registryURL.pathname = registryURL.pathname.replace(/^\/v2\//, `/v2/${upstreamURL.pathname}/`)
const headers = new Headers(init.headers)
headers.set('accept', '*/*')
headers.set('authorization', `Basic ${env.REGISTRY_TOKEN}`)
return await fetch(registryURL, {...init, headers})
}
async function getObject(req: HonoRequest<any>, env: Env['Bindings'], key: string, headers: Headers) {
if (req.method === 'HEAD') {
const obj = await env.storage.head(key)
if (!obj) return null
obj.writeHttpMetadata(headers)
headers.set('accept-ranges', 'bytes')
headers.set('etag', obj.httpEtag)
headers.set('content-length', obj.size.toString())
return emptyResponse({headers})
}
const obj = await env.storage.get(key, {onlyIf: req.headers, range: req.headers})
if (!obj) return null
obj.writeHttpMetadata(headers)
headers.set('etag', obj.httpEtag)
headers.set('accept-ranges', 'bytes')
if (
req.headers.has('range') &&
obj.range &&
'offset' in obj.range &&
'length' in obj.range &&
obj.range.offset != undefined &&
obj.range.length != undefined
) {
headers.set('content-range', `bytes ${obj.range.offset}-${obj.range.offset + obj.range.length - 1}/${obj.size}`)
headers.set('content-length', (obj.range.length != undefined ? obj.range.length : obj.size).toString())
} else {
headers.set('content-length', obj.size.toString())
}
const body = 'body' in obj && obj.body ? obj.body : null
const status = 'body' in obj && obj.body ? (req.headers.get('range') !== null ? 206 : 200) : 304
console.log('Handling with R2', key, status, obj.range, [...headers.entries()])
return new Response(body, {headers, status})
}
const tagSchema = z.string().regex(/^[\w][\w.-]{0,127}$/)
function parseTag(candidate: string) {
const result = tagSchema.safeParse(candidate)
return result.success ? result.data : null
}
interface Digest {
readonly algorithm: 'sha256' | 'sha384' | 'sha512'
readonly hash: string
readonly digest: string
}
const digestSchema = z.string().regex(/^[a-z0-9]+(?:[.+_-][a-z0-9]+)*:[a-zA-Z0-9=_-]+$/)
function parseDigest(candidate: string): Digest | null {
const result = digestSchema.safeParse(candidate)
if (!result.success) return null
const [algorithm, hash] = result.data.split(':')
if (algorithm !== 'sha256' && algorithm !== 'sha384' && algorithm !== 'sha512') return null
if (!hash) return null
return {algorithm, hash, digest: result.data}
}
// Analytics ******************************************************************
let _posthog: PostHog | undefined
function getPostHog(env: Env['Bindings']): PostHog {
if (!_posthog) {
_posthog = new PostHog(env.POSTHOG_API_KEY, {
fetch: (info: RequestInfo, init?: RequestInit) => fetch(info, init),
flushAt: 1,
flushInterval: 0,
disableGeoip: false,
})
}
return _posthog
}
// Manifest Types *************************************************************
type Manifest = ImageIndex | ImageManifest
interface Descriptor {
mediaType:
| 'application/vnd.docker.distribution.manifest.list.v2+json'
| 'application/vnd.oci.image.index.v1+json'
| 'application/vnd.docker.distribution.manifest.v2+json'
| 'application/vnd.oci.image.manifest.v1+json'
| string
digest: string
size: number
}
interface ImageIndex {
mediaType: 'application/vnd.docker.distribution.manifest.list.v2+json' | 'application/vnd.oci.image.index.v1+json'
manifests: Descriptor[]
}
interface ImageManifest {
mediaType: 'application/vnd.docker.distribution.manifest.v2+json' | 'application/vnd.oci.image.manifest.v1+json'
config: Descriptor
layers: Descriptor[]
}