forked from github/docs
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdynamic-assets.js
151 lines (137 loc) · 5.95 KB
/
dynamic-assets.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
import fs from 'fs/promises'
import sharp from 'sharp'
import { assetCacheControl, defaultCacheControl } from './cache-control.js'
import { setFastlySurrogateKey, SURROGATE_ENUMS } from './set-fastly-surrogate-key.js'
/**
* This is the indicator that is a virtual part of the URL.
* Similar to `/cb-1234/` in asset URLs, it's just there to tell the
* middleware that the image can be aggressively cached. It's not
* part of the actual file-on-disk path.
* Similarly, `/mw-1000/` is virtual and will be observed and removed from
* the pathname before trying to look it up as disk-on-file.
* The exact pattern needs to match how it's set in whatever Markdown
* processing code that might make dynamic asset URLs.
* So if you change this, make sure you change the code that expects
* to be able to inject this into the URL.
*/
const maxWidthPathPartRegex = /\/mw-(\d+)\//
/**
*
* Why not any free number? If we allowed it to be any integer number
* someone would put our backend servers at risk by doing something like:
*
* const makeURL = () => `${BASE}/assets/mw-${Math.floor(Math.random()*1000)}/foo.png`
* await Promise.all([...Array(10000).keys()].map(makeURL))
*
* Which would be lots of distinctly different and valid URLs that the
* CDN can never really "protect us" on because they're too often distinct.
*
* At the moment, the only business need is for 1,000 pixels, so the array
* only has one. But can change in the future and make this sentence moot.
*/
const VALID_MAX_WIDTHS = [1440, 1000]
export default async function dynamicAssets(req, res, next) {
if (!req.url.startsWith('/assets/')) return next()
if (!(req.method === 'GET' || req.method === 'HEAD')) {
return res.status(405).type('text/plain').send('Method Not Allowed')
}
// To protect from possible denial of service, we never allow what
// we're going to do (the image file operation), if the whole thing
// won't be aggressively cached.
// If we didn't do this, someone making 2 requests, ...
//
// > GET /assets/images/site/logo.web?random=10476583
// > GET /assets/images/site/logo.web?random=20196996
//
// ...would be treated as 2 distinct backend requests. Sure, each one
// would be cached in the CDN, but that's not helping if someone does...
//
// while (true) {
// startFetchThread(`/assets/images/site/logo.web?whatever=${rand()}`)
// }
//
// So we "force" any deviation of the URL to a redirect to the canonical
// URL (which, again, is heavily cached).
if (Object.keys(req.query).length > 0) {
// Cache the 404 so it won't be re-attempted over and over
defaultCacheControl(res)
// This redirects to the same URL we're currently on, but with the
// query string part omitted.
// For example:
//
// > GET /assets/images/site/logo.web?foo=bar
// < 302
// < location: /assets/images/site/logo.web
//
return res.redirect(302, req.path)
}
// From PNG to WEBP, if the PNG exists
if (req.path.endsWith('.webp')) {
const { url, maxWidth, error } = deconstructImageURL(req.path)
if (error) {
return res.status(400).type('text/plain').send(error.toString())
}
try {
const originalBuffer = await fs.readFile(url.slice(1).replace(/\.webp$/, '.png'))
const image = sharp(originalBuffer)
if (maxWidth) {
const { width } = await image.metadata()
if (width > maxWidth) {
image.resize({ width: maxWidth })
}
}
// Note that by default, sharp will use a lossy compression.
// (i.e. `{lossless: false}` in the options)
// The difference is that a lossless image is slightly crisper
// but becomes on average 1.8x larger.
// Given how we serve images, no human would be able to tell the
// difference simply by looking at the image as it appears as an
// image tag in the web page.
// Also given that rendering-for-viewing is the "end of the line"
// for the image meaning it just ends up being viewed and not
// resaved as a source file. If we had intention to overwrite all
// original PNG source files to WEBP, we should consier lossless
// to preserve as much quality as possible at the source level.
// The default quality is 80% which, combined with `lossless:false`
// makes our images 2.8x smaller than the average PNG.
const buffer = await image.webp().toBuffer()
assetCacheControl(res)
return res.type('image/webp').send(buffer)
} catch (error) {
if (error.code !== 'ENOENT') {
throw error
}
}
}
// Cache the 404 so it won't be re-attempted over and over
defaultCacheControl(res)
// There's a preceeding middleware that sets the Surrogate-Key to
// "manual-purge" based on the URL possibly having the `/cb-xxxxx/`
// checksum in it. But, if it failed, we don't want that. So
// undo that if it was set.
// It's handy too to not overly cache 404s in the CDN because
// it could be that the next prod deployment fixes the missing image.
// For example, a PR landed that introduced the *reference* to the image
// but forgot to check in the new image, then a follow-up PR adds the image.
setFastlySurrogateKey(res, SURROGATE_ENUMS.DEFAULT)
// Don't use something like `next(404)` because we don't want a fancy
// HTML "Page not found" page response because a failed asset lookup
// is impossibly a typo in the browser address bar or an accidentally
// broken link, like it might be to a regular HTML page.
res.status(404).type('text/plain').send('Asset not found')
}
function deconstructImageURL(url) {
let error
let maxWidth
const match = url.match(maxWidthPathPartRegex)
if (match) {
const [whole, number] = match
maxWidth = parseInt(number)
if (isNaN(maxWidth) || maxWidth <= 0 || !VALID_MAX_WIDTHS.includes(maxWidth)) {
error = new Error(`width number (${maxWidth}) is not a valid number`)
} else {
url = url.replace(whole, '/')
}
}
return { url, maxWidth, error }
}