diff --git a/CHANGELOG.md b/CHANGELOG.md index 6149992ae92..5a7e3a69e5a 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -10,7 +10,13 @@ The version headers in this history reflect the versions of Apollo Server itself ## vNEXT +## v3.10.4 + +- `apollo-server-core`: Manage memory more efficiently in the usage reporting plugin by allowing large objects to be garbage collected more quickly. [PR #7106](https://github.com/apollographql/apollo-server/pull/7106) +- `apollo-server-core`: The usage reporting plugin now defaults to a 30 second timeout for each attempt to send reports to Apollo Server instead of no timeout; the timeout can be adjusted with the new `requestTimeoutMs` option to `ApolloServerPluginUsageReporting`. (Apollo's servers already enforced a 30 second timeout, so this is unlikely to break any existing use cases.) [PR #7106](https://github.com/apollographql/apollo-server/pull/7106) + ## v3.10.3 + - `apollo-server-core`: Fix memory leak in usage reporting plugin. [Issue #6983](https://github.com/apollographql/apollo-server/issues/6983) [PR #6999](https://github.com/apollographql/apollo-server/[Issue #6983](https://github.com/apollographql/apollo-server/issues/6983)pull/6999) ## v3.10.2 diff --git a/package-lock.json b/package-lock.json index 768d099c859..ebf907c6c4b 100644 --- a/package-lock.json +++ b/package-lock.json @@ -13091,6 +13091,7 @@ "jest-runtime": "^28.1.3", "jest-snapshot": "^28.1.3", "jest-util": "^28.1.3", + "node-abort-controller": "^3.0.1", "p-limit": "^3.1.0", "pretty-format": "^28.1.3", "slash": "^3.0.0", @@ -16498,6 +16499,11 @@ "integrity": "sha512-sGkPx+VjMtmA6MX27oA4FBFELFCZZ4S4XqeGOXCv68tT+jb3vk/RyaKWP0PTKyWtmLSM0b+adUTEvbs1PEaH2w==", "dev": true }, + "node_modules/node-abort-controller": { + "version": "3.0.1", + "resolved": "https://registry.npmjs.org/node-abort-controller/-/node-abort-controller-3.0.1.tgz", + "integrity": "sha512-/ujIVxthRs+7q6hsdjHMaj8hRG9NuWmwrz+JdRwZ14jdFoKSkm+vDsCbF9PLpnSqjaWQJuTmVtcWHNLr+vrOFw==" + }, "node_modules/node-fetch": { "version": "2.6.7", "resolved": "https://registry.npmjs.org/node-fetch/-/node-fetch-2.6.7.tgz", @@ -21026,6 +21032,7 @@ "graphql-tag": "^2.11.0", "loglevel": "^1.6.8", "lru-cache": "^6.0.0", + "node-abort-controller": "^3.0.1", "sha.js": "^2.4.11", "uuid": "^9.0.0", "whatwg-mimetype": "^3.0.0" @@ -27183,6 +27190,7 @@ "graphql-tag": "^2.11.0", "loglevel": "^1.6.8", "lru-cache": "^6.0.0", + "node-abort-controller": "^3.0.1", "sha.js": "^2.4.11", "uuid": "^9.0.0", "whatwg-mimetype": "^3.0.0" @@ -31247,6 +31255,7 @@ "jest-runtime": "^28.1.3", "jest-snapshot": "^28.1.3", "jest-util": "^28.1.3", + "node-abort-controller": "^3.0.1", "p-limit": "^3.1.0", "pretty-format": "^28.1.3", "slash": "^3.0.0", @@ -33800,6 +33809,11 @@ } } }, + "node-abort-controller": { + "version": "3.0.1", + "resolved": "https://registry.npmjs.org/node-abort-controller/-/node-abort-controller-3.0.1.tgz", + "integrity": "sha512-/ujIVxthRs+7q6hsdjHMaj8hRG9NuWmwrz+JdRwZ14jdFoKSkm+vDsCbF9PLpnSqjaWQJuTmVtcWHNLr+vrOFw==" + }, "node-fetch": { "version": "2.6.7", "resolved": "https://registry.npmjs.org/node-fetch/-/node-fetch-2.6.7.tgz", diff --git a/packages/apollo-server-core/package.json b/packages/apollo-server-core/package.json index 91b83428062..1193ca7d549 100644 --- a/packages/apollo-server-core/package.json +++ b/packages/apollo-server-core/package.json @@ -44,6 +44,7 @@ "graphql-tag": "^2.11.0", "loglevel": "^1.6.8", "lru-cache": "^6.0.0", + "node-abort-controller": "^3.0.1", "sha.js": "^2.4.11", "uuid": "^9.0.0", "whatwg-mimetype": "^3.0.0" diff --git a/packages/apollo-server-core/src/plugin/usageReporting/options.ts b/packages/apollo-server-core/src/plugin/usageReporting/options.ts index be070f521cc..b2af01c3086 100644 --- a/packages/apollo-server-core/src/plugin/usageReporting/options.ts +++ b/packages/apollo-server-core/src/plugin/usageReporting/options.ts @@ -258,6 +258,12 @@ export interface ApolloServerPluginUsageReportingOptions { * Minimum back-off for retries. Defaults to 100ms. */ minimumRetryDelayMs?: number; + /** + * Default timeout for each individual attempt to send a report to Apollo. + * (This is for each HTTP POST, not for all potential retries.) Defaults to 30 + * seconds (30000ms). + */ + requestTimeoutMs?: number; /** * A logger interface to be used for output and errors. When not provided * it will default to the server's own `logger` implementation and use diff --git a/packages/apollo-server-core/src/plugin/usageReporting/plugin.ts b/packages/apollo-server-core/src/plugin/usageReporting/plugin.ts index 8bce7bd3d54..7dfcee38711 100644 --- a/packages/apollo-server-core/src/plugin/usageReporting/plugin.ts +++ b/packages/apollo-server-core/src/plugin/usageReporting/plugin.ts @@ -1,8 +1,10 @@ import os from 'os'; +import { promisify } from 'util'; import { gzip } from 'zlib'; import retry from 'async-retry'; import { Report, ReportHeader, Trace } from 'apollo-reporting-protobuf'; -import { Response, fetch, Headers } from 'apollo-server-env'; +import { Response, fetch, Headers, RequestInit } from 'apollo-server-env'; +import { AbortController } from 'node-abort-controller'; import type { GraphQLRequestListener, GraphQLServerListener, @@ -38,6 +40,8 @@ import { } from '@apollo/utils.usagereporting'; import type LRUCache from 'lru-cache'; +const gzipPromise = promisify(gzip); + const reportHeaderDefaults = { hostname: os.hostname(), agentVersion: `apollo-server-core@${ @@ -238,7 +242,7 @@ export function ApolloServerPluginUsageReporting( // Needs to be an arrow function to be confident that key is defined. const sendReport = async (executableSchemaId: string): Promise => { - const report = getAndDeleteReport(executableSchemaId); + let report = getAndDeleteReport(executableSchemaId); if ( !report || (Object.keys(report.tracesPerQuery).length === 0 && @@ -255,9 +259,12 @@ export function ApolloServerPluginUsageReporting( const protobufError = Report.verify(report); if (protobufError) { - throw new Error(`Error encoding report: ${protobufError}`); + throw new Error(`Error verifying report: ${protobufError}`); } - const message = Report.encode(report).finish(); + let message: Uint8Array | null = Report.encode(report).finish(); + // Let the original protobuf object be garbage collected (helpful if the + // HTTP request hangs). + report = null; // Potential follow-up: we can compare message.length to // report.sizeEstimator.bytes and use it to "learn" if our estimation is @@ -282,23 +289,10 @@ export function ApolloServerPluginUsageReporting( ); } - const compressed = await new Promise((resolve, reject) => { - // The protobuf library gives us a Uint8Array. Node 8's zlib lets us - // pass it directly; convert for the sake of Node 6. (No support right - // now for Node 4, which lacks Buffer.from.) - const messageBuffer = Buffer.from( - message.buffer as ArrayBuffer, - message.byteOffset, - message.byteLength, - ); - gzip(messageBuffer, (err, gzipResult) => { - if (err) { - reject(err); - } else { - resolve(gzipResult); - } - }); - }); + const compressed = await gzipPromise(message); + // Let the uncompressed message be garbage collected (helpful if the + // HTTP request is slow). + message = null; // Wrap fetcher with async-retry for automatic retrying const fetcher = options.fetcher ?? fetch; @@ -306,11 +300,15 @@ export function ApolloServerPluginUsageReporting( // Retry on network errors and 5xx HTTP // responses. async () => { - const curResponse = await fetcher( - (options.endpointUrl || - 'https://usage-reporting.api.apollographql.com') + - '/api/ingress/traces', - { + // Note that once we require Node v16 we can use its global + // AbortController instead of the one from `node-abort-controller`. + const controller = new AbortController(); + const abortTimeout = setTimeout(() => { + controller.abort(); + }, options.requestTimeoutMs ?? 30_000); + let curResponse; + try { + const requestInit: RequestInit = { method: 'POST', headers: { 'user-agent': 'ApolloServerPluginUsageReporting', @@ -320,8 +318,26 @@ export function ApolloServerPluginUsageReporting( }, body: compressed, agent: options.requestAgent, - }, - ); + }; + // The apollo-server-env Fetch API doesn't have `signal` in + // RequestInit, but it does work in node-fetch. We've added it + // already to our `Fetcher` interface (`@apollo/utils.fetcher`) + // that we're using in AS4 but making changes to + // `apollo-server-env` that could cause custom AS3 fetchers to not + // compile feels like a bad idea. The worst case scenario of + // passing in an ignored `signal` is the timeout doesn't work, in + // which case you're not getting the new feature but can change + // your fetcher to make it work. + (requestInit as any).signal = controller.signal; + curResponse = await fetcher( + (options.endpointUrl || + 'https://usage-reporting.api.apollographql.com') + + '/api/ingress/traces', + requestInit, + ); + } finally { + clearTimeout(abortTimeout); + } if (curResponse.status >= 500 && curResponse.status < 600) { throw new Error( diff --git a/packages/apollo-server-integration-testsuite/src/ApolloServer.ts b/packages/apollo-server-integration-testsuite/src/ApolloServer.ts index bcfea09861f..863773348be 100644 --- a/packages/apollo-server-integration-testsuite/src/ApolloServer.ts +++ b/packages/apollo-server-integration-testsuite/src/ApolloServer.ts @@ -1983,21 +1983,20 @@ export function testApolloServer( describe('graphql server functions even when Apollo servers are down', () => { async function testWithStatus( - status: number, + status: number | 'cannot-connect' | 'timeout', expectedRequestCount: number, ) { - const networkError = status === 0; - const { closeServer, fakeUsageReportingUrl, writeResponseResolve } = await makeFakeUsageReportingServer({ - status, + // the 444 case shouldn't ever get to actually sending 444 + status: typeof status === 'number' ? status : 444, waitWriteResponse: true, }); try { // To simulate a network error, we create and close the server. // This lets us still generate a port that is hopefully unused. - if (networkError) { + if (status == 'cannot-connect') { await closeServer(); } @@ -2034,6 +2033,8 @@ export function testApolloServer( reportErrorFunction(error: Error) { reportErrorPromiseResolve(error); }, + // Make sure the timeout test actually finishes in time + requestTimeoutMs: status === 'timeout' ? 10 : undefined, }), ], }); @@ -2049,19 +2050,24 @@ export function testApolloServer( }); expect(result.data.something).toBe('hello'); - if (!networkError) { + if (typeof status === 'number') { // Allow reporting to return its response (for every retry). + // (But not if we're intentionally timing out!) writeResponseResolve(); } // Make sure we can get the error from reporting. const sendingError = await reportErrorPromise; expect(sendingError).toBeTruthy(); - if (networkError) { + if (status === 'cannot-connect') { expect(sendingError.message).toContain( 'Error sending report to Apollo servers', ); expect(sendingError.message).toContain('ECONNREFUSED'); + } else if (status === 'timeout') { + expect(sendingError.message).toBe( + 'Error sending report to Apollo servers: The user aborted a request.', + ); } else { expect(sendingError.message).toBe( `Error sending report to Apollo servers: HTTP status ${status}, Important text in the body`, @@ -2069,7 +2075,7 @@ export function testApolloServer( } expect(requestCount).toBe(expectedRequestCount); } finally { - if (!networkError) { + if (status !== 'cannot-connect') { await closeServer(); } } @@ -2079,7 +2085,10 @@ export function testApolloServer( await testWithStatus(500, 3); }); it('with network error', async () => { - await testWithStatus(0, 3); + await testWithStatus('cannot-connect', 3); + }); + it('with timeout', async () => { + await testWithStatus('timeout', 3); }); it('with non-retryable error', async () => { await testWithStatus(400, 1);