fix(tests): improve reliability of performance tests (aws#5492)

jpinkney-aws · web-flow · commit 856102836519 · 2024-08-26T07:37:35.000-04:00
## Problem
- We currently do a one-shot performance test measurement, which can
be impacted by the underlying CPU

## Solution
- Run each performance test 5 times by default and average the results;
this should give us a more accurate reading

### Performance of the last 10 test runs on my computer:
```
{userCpuUsage: 27.763992642839753, systemCpuUsage: 5.8700764000563925, duration: 0.0488549862, heapTotal: 0.15}
{userCpuUsage: 32.432557472712574, systemCpuUsage: 7.287778251185924, duration: 0.0350972354, heapTotal: 0.15}
{userCpuUsage: 36.17269595509756, systemCpuUsage: 8.190125881726889, duration: 0.0313357906, heapTotal: 0.15}
{userCpuUsage: 23.575720185158513, systemCpuUsage: 5.680905138190308, duration: 0.0468292694, heapTotal: 0.05}
{userCpuUsage: 29.722270663855547, systemCpuUsage: 6.725376761131834, duration: 0.044072017399999996, heapTotal: 0.05}
{userCpuUsage: 30.981420694546227, systemCpuUsage: 6.724871937232588, duration: 0.0404778744, heapTotal: 0.05}
{userCpuUsage: 29.15659118178076, systemCpuUsage: 6.544881314879868, duration: 0.0438601896, heapTotal: 0.15}
{userCpuUsage: 29.66190894781342, systemCpuUsage: 6.556456308274413, duration: 0.042828962400000004, heapTotal: 0.1}
{userCpuUsage: 32.209253755861006, systemCpuUsage: 7.245284221753529, duration: 0.036528329, heapTotal: 0.1}
{userCpuUsage: 30.4379237001285, systemCpuUsage: 6.790691656039722, duration: 0.0378142194, heapTotal: 0.1}
{userCpuUsage: 28.075430930361144, systemCpuUsage: 6.952612678963097, duration: 0.042763791, heapTotal: 0.1}
```

<!---
    REMINDER:
    - Read CONTRIBUTING.md first.
    - Add test coverage for your changes.
    - Update the changelog using `npm run newChange`.
    - Link to related issues/commits.
    - Testing: how did you test your changes?
- Screenshots (if the pull request is related to UI/UX then please
include light and dark theme screenshots)
-->

## License

By submitting this pull request, I confirm that my contribution is made
under the terms of the Apache 2.0 license.
diff --git a/packages/core/src/shared/performance/performance.ts b/packages/core/src/shared/performance/performance.ts
@@ -8,7 +8,17 @@ import { getLogger } from '../logger'
 import { isWeb } from '../extensionGlobals'
 
 interface PerformanceMetrics {
-    cpuUsage: number
+    /**
+     * The percentage of CPU time spent executing the user-space portions
+     * of the application (JavaScript and user-space libraries/dependencies)
+     */
+    userCpuUsage: number
+
+    /**
+     * The percentage of CPU time spent executing system-level operations
+     * related to the application (file I/O, network, IPC, other kernel-space tasks)
+     */
+    systemCpuUsage: number
     heapTotal: number
     duration: number
 }
@@ -17,6 +27,7 @@ interface TestOptions {
     darwin?: Partial<PerformanceMetrics>
     win32?: Partial<PerformanceMetrics>
     linux?: Partial<PerformanceMetrics>
+    testRuns?: number
 }
 
 export interface PerformanceSpan<T> {
@@ -55,13 +66,16 @@ export class PerformanceTracker {
 
             const elapsedTime = process.hrtime(this.#startPerformance.duration)
             const duration = elapsedTime[0] + elapsedTime[1] / 1e9 // convert microseconds to seconds
-            const usage = ((userCpuUsage + systemCpuUsage) / duration) * 100 // convert to percentage
+
+            const totalUserUsage = (userCpuUsage / duration) * 100
+            const totalSystemUsage = (systemCpuUsage / duration) * 100
 
             const endMemoryUsage = process.memoryUsage().heapTotal - this.#startPerformance?.memory
             const endMemoryUsageInMB = endMemoryUsage / (1024 * 1024) // converting bytes to MB
 
             return {
-                cpuUsage: usage,
+                userCpuUsage: totalUserUsage,
+                systemCpuUsage: totalSystemUsage,
                 heapTotal: endMemoryUsageInMB,
                 duration,
             }
@@ -71,21 +85,60 @@ export class PerformanceTracker {
     }
 }
 
-export function performanceTest(options: TestOptions, name: string, fn: () => Promise<void>): Mocha.Test
-export function performanceTest(options: TestOptions, name: string, fn: () => void): Mocha.Test
+/**
+ * Generate a Mocha suite that runs fn options.testRuns times (default 5) and asserts on the average performance metrics of all runs. The suite callback is synchronous because Mocha ignores values returned from describe callbacks.
+ */
+export function performanceTest(options: TestOptions, name: string, fn: () => Promise<void>): Mocha.Suite
+export function performanceTest(options: TestOptions, name: string, fn: () => void): Mocha.Suite
 export function performanceTest(options: TestOptions, name: string, fn: () => void | Promise<void>) {
     const testOption = options[process.platform as 'linux' | 'darwin' | 'win32']
 
-    const performanceTracker = new PerformanceTracker(name)
+    const totalTestRuns = options.testRuns ?? 5
+
+    return describe(`${name} performance tests`, () => {
+        let performanceTracker: PerformanceTracker | undefined
+        const testRunMetrics: PerformanceMetrics[] = []
+
+        beforeEach(() => {
+            performanceTracker = new PerformanceTracker(name)
+            performanceTracker.start()
+        })
+
+        afterEach(() => {
+            const metrics = performanceTracker?.stop()
+            if (!metrics) {
+                assert.fail('Performance metrics not found')
+            }
+            testRunMetrics.push(metrics)
+        })
 
-    return it(name, async () => {
-        performanceTracker.start()
-        await fn()
-        const metrics = performanceTracker.stop()
-        if (!metrics) {
-            assert.fail('Performance metrics not found')
+        for (let testRun = 1; testRun <= totalTestRuns; testRun++) {
+            it(`${name} - test run ${testRun}`, async () => {
+                await fn()
+            })
         }
-        assertPerformanceMetrics(metrics, name, testOption)
+
+        after(() => {
+            const totalUserCPUUsage =
+                testRunMetrics.reduce((acc, metric) => acc + metric.userCpuUsage, 0) / testRunMetrics.length
+            const totalSystemCPUUsage =
+                testRunMetrics.reduce((acc, metric) => acc + metric.systemCpuUsage, 0) / testRunMetrics.length
+            const totalMemoryUsage =
+                testRunMetrics.reduce((acc, metric) => acc + metric.heapTotal, 0) / testRunMetrics.length
+            const totalDuration =
+                testRunMetrics.reduce((acc, metric) => acc + metric.duration, 0) / testRunMetrics.length
+
+            assertPerformanceMetrics(
+                {
+                    userCpuUsage: totalUserCPUUsage,
+                    systemCpuUsage: totalSystemCPUUsage,
+                    duration: totalDuration,
+                    heapTotal: totalMemoryUsage,
+                },
+                name,
+                testOption
+            )
+        })
     })
 }
 
@@ -94,12 +147,20 @@ function assertPerformanceMetrics(
     name: string,
     testOption?: Partial<PerformanceMetrics>
 ) {
-    const expectedCPUUsage = testOption?.cpuUsage ?? 50
-    const foundCPUUsage = performanceMetrics.cpuUsage
+    const expectedUserCPUUsage = testOption?.userCpuUsage ?? 50
+    const foundUserCPUUsage = performanceMetrics.userCpuUsage
+
+    assert(
+        foundUserCPUUsage < expectedUserCPUUsage,
+        `Expected total user CPU usage for ${name} to be less than ${expectedUserCPUUsage}. Actual user CPU usage was ${foundUserCPUUsage}`
+    )
+
+    const expectedSystemCPUUsage = testOption?.systemCpuUsage ?? 20
+    const foundSystemCPUUsage = performanceMetrics.systemCpuUsage
 
     assert(
-        foundCPUUsage < expectedCPUUsage,
-        `Expected total CPU usage for ${name} to be less than ${expectedCPUUsage}. Actual CPU usage was ${foundCPUUsage}`
+        foundSystemCPUUsage < expectedSystemCPUUsage,
+        `Expected total system CPU usage for ${name} to be less than ${expectedSystemCPUUsage}. Actual system CPU usage was ${foundSystemCPUUsage}`
     )
 
     const expectedMemoryUsage = testOption?.heapTotal ?? 400
diff --git a/packages/core/src/shared/telemetry/spans.ts b/packages/core/src/shared/telemetry/spans.ts
@@ -224,7 +224,8 @@ export class TelemetrySpan<T extends MetricBase = MetricBase> {
             const performanceMetrics = this.#performance?.stop()
             if (performanceMetrics) {
                 this.record({
-                    cpuUsage: performanceMetrics.cpuUsage,
+                    userCpuUsage: performanceMetrics.userCpuUsage,
+                    systemCpuUsage: performanceMetrics.systemCpuUsage,
                     heapTotal: performanceMetrics.heapTotal,
                     functionName: this.#options.functionId?.name ?? this.name,
                 } as any)
diff --git a/packages/core/src/shared/telemetry/vscodeTelemetry.json b/packages/core/src/shared/telemetry/vscodeTelemetry.json
@@ -277,9 +277,14 @@
             "description": "A detailed state of a specific auth connection. Use `authStatus` for a higher level view of an extension's general connection."
         },
         {
-            "name": "cpuUsage",
+            "name": "userCpuUsage",
             "type": "int",
-            "description": "Percentage of cpu usage"
+            "description": "Percentage of user cpu usage (user space)"
+        },
+        {
+            "name": "systemCpuUsage",
+            "type": "int",
+            "description": "Percentage of system cpu usage (kernal space)"
         },
         {
             "name": "heapTotal",
@@ -1095,7 +1100,11 @@
             "description": "Represents a function call. In most cases this should wrap code with a run(), then you can add context.",
             "metadata": [
                 {
-                    "type": "cpuUsage",
+                    "type": "userCpuUsage",
+                    "required": true
+                },
+                {
+                    "type": "systemCpuUsage",
                     "required": true
                 },
                 {
diff --git a/packages/core/src/test/shared/performance/performance.test.ts b/packages/core/src/test/shared/performance/performance.test.ts
@@ -21,12 +21,14 @@ describe('performance tooling', () => {
 
     describe('PerformanceTracker', () => {
         it('gets performance metrics', () => {
-            const { expectedCpuUsage, expectedHeapTotal, expectedTotalSeconds } = stubPerformance(sandbox)
+            const { expectedUserCpuUsage, expectedSystemCpuUsage, expectedHeapTotal, expectedTotalSeconds } =
+                stubPerformance(sandbox)
             const perf = new PerformanceTracker('foo')
             perf.start()
             const metrics = perf.stop()
 
-            assert.deepStrictEqual(metrics?.cpuUsage, expectedCpuUsage)
+            assert.deepStrictEqual(metrics?.userCpuUsage, expectedUserCpuUsage)
+            assert.deepStrictEqual(metrics?.systemCpuUsage, expectedSystemCpuUsage)
             assert.deepStrictEqual(metrics?.heapTotal, expectedHeapTotal)
             assert.deepStrictEqual(metrics?.duration, expectedTotalSeconds)
         })
diff --git a/packages/core/src/test/shared/telemetry/spans.test.ts b/packages/core/src/test/shared/telemetry/spans.test.ts
@@ -78,15 +78,16 @@ describe('TelemetrySpan', function () {
     })
 
     it('records performance', function () {
-        const { expectedCpuUsage, expectedHeapTotal } = stubPerformance(sandbox)
+        const { expectedUserCpuUsage, expectedSystemCpuUsage, expectedHeapTotal } = stubPerformance(sandbox)
         const span = new TelemetrySpan('function_call', {
             emit: true,
         })
         span.start()
         clock.tick(90)
         span.stop()
         assertTelemetry('function_call', {
-            cpuUsage: expectedCpuUsage,
+            userCpuUsage: expectedUserCpuUsage,
+            systemCpuUsage: expectedSystemCpuUsage,
             heapTotal: expectedHeapTotal,
             duration: 90,
             result: 'Succeeded',
@@ -269,7 +270,7 @@ describe('TelemetryTracer', function () {
 
         it('records performance', function () {
             clock = installFakeClock()
-            const { expectedCpuUsage, expectedHeapTotal } = stubPerformance(sandbox)
+            const { expectedUserCpuUsage, expectedSystemCpuUsage, expectedHeapTotal } = stubPerformance(sandbox)
             tracer.run(
                 'function_call',
                 () => {
@@ -281,7 +282,8 @@ describe('TelemetryTracer', function () {
             )
 
             assertTelemetry('function_call', {
-                cpuUsage: expectedCpuUsage,
+                userCpuUsage: expectedUserCpuUsage,
+                systemCpuUsage: expectedSystemCpuUsage,
                 heapTotal: expectedHeapTotal,
                 duration: 90,
                 result: 'Succeeded',
diff --git a/packages/core/src/test/utilities/performance.ts b/packages/core/src/test/utilities/performance.ts
@@ -6,11 +6,11 @@
 import Sinon from 'sinon'
 
 export function stubPerformance(sandbox: Sinon.SinonSandbox) {
-    const expectedCpuUsage = { user: 10000, system: 2000 }
+    const cpuUsage = { user: 10000, system: 2000 }
     const initialHeapTotal = 1
     const totalNanoseconds = 30000000 // 0.03 seconds
 
-    sandbox.stub(process, 'cpuUsage').returns(expectedCpuUsage)
+    sandbox.stub(process, 'cpuUsage').returns(cpuUsage)
 
     const memoryUsageStub = sandbox.stub(process, 'memoryUsage')
     memoryUsageStub
@@ -21,7 +21,8 @@ export function stubPerformance(sandbox: Sinon.SinonSandbox) {
     sandbox.stub(process, 'hrtime').onCall(0).returns([0, 0]).onCall(1).returns([0, totalNanoseconds])
 
     return {
-        expectedCpuUsage: 40,
+        expectedUserCpuUsage: 33.333333333333336,
+        expectedSystemCpuUsage: 6.666666666666667,
         expectedHeapTotal: 10,
         expectedTotalSeconds: totalNanoseconds / 1e9,
     }