Skip to content

Commit

Permalink
feat: Introduce asset discovery response caching behind flag (#419)
Browse files Browse the repository at this point in the history
* test: [Spike] Add network caching to asset discovery behind flag

* Only cache 200 status code responses

Keep the caching layer real thin, since its an optimization

* Add inline doc, clean up console.logs

* Pull method out into its own util

Up next is to test

* Add tests for response cache util

* Refactor `getResponseCache` function

* Remove extra early testing snapshots

* Remove `body` from mocked response obj

* Code review: Update test to be more reliable
  • Loading branch information
Robdel12 committed Nov 8, 2019
1 parent 62ddc66 commit 7d7dd52
Show file tree
Hide file tree
Showing 8 changed files with 129 additions and 2 deletions.
2 changes: 1 addition & 1 deletion package.json
Original file line number Diff line number Diff line change
Expand Up @@ -147,7 +147,7 @@
"test": "yarn test:unit && yarn test:client && yarn test:integration && yarn test:command:snapshot && yarn test:command:upload",
"test:unit": "PERCY_TOKEN=abc mocha \"test/**/*.test.ts\" --exclude \"test/percy-agent-client/**/*.test.ts\" --exclude \"test/integration/**/*\"",
"test:client": "karma start ./test/percy-agent-client/karma.conf.js",
"test:integration": "yarn build-client && node ./bin/run exec -h *.localtest.me -c .ci.percy.yml -- mocha test/integration/**/*.test.ts",
"test:integration": "yarn build-client && node ./bin/run exec --cache-responses -h *.localtest.me -c .ci.percy.yml -- mocha test/integration/**/*.test.ts",
"test:command:snapshot": "./bin/run snapshot test/integration/test-static-site -b /dummy-base-url/ -i **/red-keep.** -s **/*.{html}",
"test:command:upload": "./bin/run upload test/integration/test-static-images",
"version": "oclif-dev readme && git add README.md",
Expand Down
6 changes: 6 additions & 0 deletions src/commands/exec.ts
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,12 @@ export default class Exec extends PercyCommand {
'Asset discovery network idle timeout (in milliseconds)',
].join(' '),
}),
'cache-responses': flags.boolean({
description: [
`[default: ${DEFAULT_CONFIGURATION.agent['asset-discovery']['cache-responses']}]`,
'Enable caching network responses for asset discovery (experimental)',
].join(' '),
}),
'port': flags.integer({
char: 'p',
description: [
Expand Down
1 change: 1 addition & 0 deletions src/configuration/asset-discovery-configuration.ts
Original file line number Diff line number Diff line change
Expand Up @@ -4,4 +4,5 @@ export interface AssetDiscoveryConfiguration {
'network-idle-timeout': number,
'page-pool-size-min': number,
'page-pool-size-max': number
'cache-responses': boolean
}
1 change: 1 addition & 0 deletions src/configuration/configuration.ts
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,7 @@ export const DEFAULT_CONFIGURATION: Configuration = {
'network-idle-timeout': 50, // ms
'page-pool-size-min': 1, // pages
'page-pool-size-max': 5, // pages
'cache-responses': false,
},
},
'static-snapshots': {
Expand Down
16 changes: 15 additions & 1 deletion src/services/asset-discovery-service.ts
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@ import { AssetDiscoveryConfiguration } from '../configuration/asset-discovery-co
import { DEFAULT_CONFIGURATION } from '../configuration/configuration'
import { SnapshotOptions } from '../percy-agent-client/snapshot-options'
import { logError, profile } from '../utils/logger'
import { cacheResponse, getResponseCache } from '../utils/response-cache'
import waitForNetworkIdle from '../utils/wait-for-network-idle'
import PercyClientService from './percy-client-service'
import ResponseService from './response-service'
Expand Down Expand Up @@ -189,13 +190,15 @@ export class AssetDiscoveryService extends PercyClientService {
]) as {})

page.on('request', async (request) => {
const requestUrl = request.url()

try {
if (!this.shouldRequestResolve(request)) {
await request.abort()
return
}

if (request.url() === rootResourceUrl) {
if (requestUrl === rootResourceUrl) {
await request.respond({
body: domSnapshot,
contentType: 'text/html',
Expand All @@ -204,6 +207,13 @@ export class AssetDiscoveryService extends PercyClientService {
return
}

if (this.configuration['cache-responses'] === true && getResponseCache(requestUrl)) {
logger.debug(`Asset cache hit for ${requestUrl}`)
await request.respond(getResponseCache(requestUrl))

return
}

await request.continue()
} catch (error) {
logError(error)
Expand All @@ -215,7 +225,11 @@ export class AssetDiscoveryService extends PercyClientService {
// We could also listen on 'response', but then we'd have to check if it was successful.
page.on('requestfinished', async (request) => {
const response = request.response()

if (response) {
if (this.configuration['cache-responses'] === true) {
await cacheResponse(response, logger)
}
// Parallelize the work in processResponse as much as possible, but make sure to
// wait for it to complete before returning from the asset discovery phase.
const promise = this.responseService.processResponse(
Expand Down
1 change: 1 addition & 0 deletions src/utils/configuration.ts
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,7 @@ function transform(flags: any, args: any) {
'asset-discovery': {
'allowed-hostnames': flags['allowed-hostname'],
'network-idle-timeout': flags['network-idle-timeout'],
'cache-responses': flags['cache-responses'],
},
},
'static-snapshots': {
Expand Down
47 changes: 47 additions & 0 deletions src/utils/response-cache.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,47 @@
import { Response } from 'puppeteer'
let responseCache = {} as any

/**
* Keep an in-memory cache of asset responses.
*
* When enabled, asset responses will be kept in memory. When the asset is
* re-requested, it will be responsed with what the cached response. This makes
* it so servers aren't being hounded for the same asset over and over again.
*/
export async function cacheResponse(response: Response, logger: any) {
const responseUrl = response.url()
const statusCode = response.status()

if (!!responseCache[responseUrl]) {
logger.debug(`Asset already in cache ${responseUrl}`)
return
}

if (![200, 201].includes(statusCode)) {
return
}

try {
const buffer = await response.buffer()

responseCache[responseUrl] = {
status: response.status(),
headers: response.headers(),
body: buffer,
}

logger.debug(`Added ${responseUrl} to asset discovery cache`)
} catch (error) {
logger.debug(`Could not cache response ${responseUrl}: ${error}`)
}
}

export function getResponseCache(url: string) {
return responseCache[url]
}

export function _setResponseCache(newResponseCache: any) {
responseCache = newResponseCache

return responseCache
}
57 changes: 57 additions & 0 deletions test/utils/response-cache.test.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,57 @@
import { expect } from 'chai'
import { _setResponseCache, cacheResponse, getResponseCache } from '../../src/utils/response-cache'

// Mock logger
const logger = { debug() { return '' }}
const defaultResponse = {
url() { return 'http://example.com/foo.txt' },
status() { return 200 },
headers() { return 'fake headers' },
buffer() { return 'hello' },
} as any

describe('Response cache util', () => {
beforeEach(() => {
_setResponseCache({})
})

it('200 status code response adds to the cache', async () => {
await cacheResponse(defaultResponse, logger)

expect(getResponseCache('http://example.com/foo.txt')).to.eql({
status: 200,
body: 'hello',
headers: 'fake headers',
})
})

it('201 status code response adds to the cache', async () => {
await cacheResponse({ ...defaultResponse, status() { return 201 } }, logger)

expect(getResponseCache('http://example.com/foo.txt')).to.eql({
status: 201,
body: 'hello',
headers: 'fake headers',
})
})

it('calling the cache with the same URL does nothing', async () => {
await cacheResponse(defaultResponse, logger)
await cacheResponse({ ...defaultResponse, status() { return 201 } }, logger)

expect(getResponseCache('http://example.com/foo.txt')).to.eql({
status: 200,
body: 'hello',
headers: 'fake headers',
})
})

it('non-200 status code response does not add to the cache', async () => {
await cacheResponse({ ...defaultResponse, status() { return 300 } }, logger)
await cacheResponse({ ...defaultResponse, status() { return 500 } }, logger)
await cacheResponse({ ...defaultResponse, status() { return 401 } }, logger)
await cacheResponse({ ...defaultResponse, status() { return 404 } }, logger)

expect(getResponseCache('http://example.com/foo.txt')).to.eql(undefined)
})
})

0 comments on commit 7d7dd52

Please sign in to comment.