ciphermask/test/e2e/benchmark.js

#!/usr/bin/env node

const path = require('path')
const { promises: fs, constants: fsConstants } = require('fs')
const ttest = require('ttest')
const { By, Key } = require('selenium-webdriver')
const { withFixtures } = require('./helpers')
const { PAGES } = require('./webdriver/driver')

// Number of samples taken per page when no `--samples` argument is given.
const DEFAULT_NUM_SAMPLES = 20
// All values of the driver's PAGES object; `--pages` entries are validated against this list.
const ALL_PAGES = Object.values(PAGES)

/**
 * Takes one metrics sample for a page, running inside the
 * `imported-account` fixture.
 *
 * @param {string} pageName - Page passed to `driver.navigate`.
 * @returns {Promise<object>} Whatever `driver.collectMetrics()` resolves with.
 */
async function measurePage (pageName) {
  let collectedMetrics

  const takeSample = async ({ driver }) => {
    // Submit the password form.
    const passwordInput = await driver.findElement(By.css('#password'))
    await passwordInput.sendKeys('correct horse battery staple')
    await passwordInput.sendKeys(Key.ENTER)

    // Look up the selected account name before navigating
    // (presumably this confirms the unlock finished - TODO confirm).
    await driver.findElement(By.css('.selected-account__name'))

    await driver.navigate(pageName)
    // Fixed pause before metrics are collected.
    await driver.delay(1000)
    collectedMetrics = await driver.collectMetrics()
  }

  await withFixtures({ fixtures: 'imported-account' }, takeSample)
  return collectedMetrics
}

/**
 * Lifts a function over one array of samples into a function over an object
 * of sample arrays.
 *
 * @param {Function} calc - Called once per key with that key's value.
 * @returns {Function} Takes an object and returns a new object with the same
 *   own enumerable keys, each mapped to `calc(value)`. The input is not modified.
 */
function calculateResult (calc) {
  return (result) => Object.keys(result).reduce((summary, metricName) => {
    summary[metricName] = calc(result[metricName])
    return summary
  }, {})
}
/**
 * Sums an array of numbers.
 * The fold is seeded with 0 so that an empty array yields 0 instead of
 * throwing "Reduce of empty array with no initial value".
 *
 * @param {number[]} array - Values to add up.
 * @returns {number} The total, or 0 for an empty array.
 */
const calculateSum = (array) => array.reduce((sum, val) => sum + val, 0)

/**
 * Arithmetic mean of an array of numbers.
 *
 * @param {number[]} array - Values to average.
 * @returns {number} The mean, or NaN for an empty array (0 / 0).
 */
const calculateAverage = (array) => calculateSum(array) / array.length
// Per-metric aggregators built with `calculateResult`: each one takes an
// object of sample arrays and returns an object with the same keys.
const minResult = calculateResult((samples) => Math.min(...samples))
const maxResult = calculateResult((samples) => Math.max(...samples))
const averageResult = calculateResult((samples) => calculateAverage(samples))
// Standard deviation computed as the square root of the mean squared
// deviation from the average (divides by the sample count).
const standardDeviationResult = calculateResult((samples) => {
  const mean = calculateAverage(samples)
  const meanSquaredDeviation = calculateAverage(
    samples.map((sample) => Math.pow(sample - mean, 2)),
  )
  return Math.sqrt(meanSquaredDeviation)
})
// 95% margin of error calculated using Student's t-distribution.
// Computed as the second element of `ttest(...).confidence()` minus the
// sample average.
const calculateMarginOfError = (array) => {
  const confidenceInterval = ttest(array).confidence()
  return confidenceInterval[1] - calculateAverage(array)
}
const marginOfErrorResult = calculateResult((samples) => calculateMarginOfError(samples))

/**
 * Samples page-load metrics for each page and summarizes them.
 *
 * For every page, `measurePage` is awaited `numSamples` times in sequence.
 * Each sample must contain exactly one navigation entry of type `navigate`.
 *
 * @param {string[]} pages - Names of the pages to measure.
 * @param {number} numSamples - How many samples to take per page.
 * @returns {Promise<object>} Object keyed by page name. Each value holds
 *   `min`, `max`, `average`, `standardDeviation` and `marginOfError`, each of
 *   which covers `firstPaint`, `domContentLoaded`, `load` and `domInteractive`.
 * @throws {Error} If any sample has more than one navigation entry, has no
 *   navigation entry, or has a navigation type other than `navigate`.
 */
async function profilePageLoad (pages, numSamples) {
  const results = {}
  for (const pageName of pages) {
    const runResults = []
    for (let i = 0; i < numSamples; i += 1) {
      runResults.push(await measurePage(pageName))
    }

    if (runResults.some((run) => run.navigation.length > 1)) {
      throw new Error(`Multiple navigations not supported`)
    } else if (runResults.some((run) => run.navigation.length === 0)) {
      // Fail with a clear message rather than a TypeError on `navigation[0].type`.
      throw new Error('No navigation entry recorded')
    }

    const unsupportedRun = runResults.find((run) => run.navigation[0].type !== 'navigate')
    if (unsupportedRun) {
      throw new Error(`Navigation type ${unsupportedRun.navigation[0].type} not supported`)
    }

    // Every run is now known to have exactly one navigation entry.
    const result = {
      firstPaint: runResults.map((run) => run.paint['first-paint']),
      domContentLoaded: runResults.map((run) => run.navigation[0].domContentLoaded),
      load: runResults.map((run) => run.navigation[0].load),
      domInteractive: runResults.map((run) => run.navigation[0].domInteractive),
    }

    results[pageName] = {
      min: minResult(result),
      max: maxResult(result),
      average: averageResult(result),
      standardDeviation: standardDeviationResult(result),
      marginOfError: marginOfErrorResult(result),
    }
  }
  return results
}

/**
 * Checks whether the current process may write to a path.
 *
 * @param {string} directory - Path to test with `fs.access` and `W_OK`.
 * @returns {Promise<boolean>} `true` when the access check succeeds, `false`
 *   when it fails with `EACCES`.
 * @throws Any other error from `fs.access` is rethrown unchanged.
 */
async function isWritable (directory) {
  try {
    await fs.access(directory, fsConstants.W_OK)
  } catch (accessError) {
    // Only a permission failure means "not writable"; anything else is unexpected.
    if (accessError.code === 'EACCES') {
      return false
    }
    throw accessError
  }
  return true
}

/**
 * Walks up from a path until it finds one that exists.
 *
 * @param {string} directory - Starting path; it is returned as-is if it exists.
 * @returns {Promise<string>} The first existing path found while moving
 *   towards the root with `path.dirname`.
 * @throws {Error} If the root is reached without finding an existing path.
 *   Errors from `fs.access` other than `ENOENT` are rethrown unchanged.
 */
async function getFirstParentDirectoryThatExists (directory) {
  let candidate = directory
  for (;;) {
    try {
      await fs.access(candidate, fsConstants.F_OK)
      return candidate
    } catch (error) {
      if (error.code !== 'ENOENT') {
        throw error
      }
    }

    // `path.dirname` returns its input unchanged once the root is reached.
    const parent = path.dirname(candidate)
    if (parent === candidate) {
      throw new Error('Failed to find parent directory that exists')
    }
    candidate = parent
  }
}

/**
 * Command-line entry point: parses arguments, runs the benchmark and emits
 * the results as pretty-printed JSON.
 *
 * Recognized arguments (flag names are matched case-insensitively):
 *   --pages, -p    Comma-separated page names; each must be in `ALL_PAGES`.
 *                  Defaults to `home`.
 *   --samples, -s  Samples per page; must be an integer of at least 1.
 *                  Defaults to `DEFAULT_NUM_SAMPLES`.
 *   --out, -o      File to write the results to. Without it the results are
 *                  printed to the console.
 *
 * @returns {Promise<void>}
 * @throws {Error} On a missing, invalid or unrecognized argument, or when the
 *   nearest existing parent of the output directory is not writable.
 */
async function main () {
  const args = process.argv.slice(2)

  let pages = ['home']
  let numSamples = DEFAULT_NUM_SAMPLES
  let outputPath
  let outputDirectory
  let existingParentDirectory

  // Each recognized flag consumes itself and its value.
  while (args.length) {
    if (/^(--pages|-p)$/i.test(args[0])) {
      if (args[1] === undefined) {
        throw new Error('Missing pages argument')
      }
      pages = args[1].split(',')
      for (const page of pages) {
        if (!ALL_PAGES.includes(page)) {
          throw new Error(`Invalid page: '${page}'`)
        }
      }
      args.splice(0, 2)
    } else if (/^(--samples|-s)$/i.test(args[0])) {
      if (args[1] === undefined) {
        throw new Error('Missing number of samples')
      }
      numSamples = Number.parseInt(args[1], 10)
      // Zero or negative counts would leave no samples to compute statistics from.
      if (Number.isNaN(numSamples) || numSamples < 1) {
        throw new Error(`Invalid 'samples' argument given: '${args[1]}'`)
      }
      args.splice(0, 2)
    } else if (/^(--out|-o)$/i.test(args[0])) {
      if (args[1] === undefined) {
        throw new Error('Missing output filename')
      }
      outputPath = path.resolve(args[1])
      outputDirectory = path.dirname(outputPath)
      // Check writability before the benchmark runs, using the nearest
      // ancestor that already exists.
      existingParentDirectory = await getFirstParentDirectoryThatExists(outputDirectory)
      if (!await isWritable(existingParentDirectory)) {
        throw new Error(`Specified directory is not writable: '${args[1]}'`)
      }
      args.splice(0, 2)
    } else {
      throw new Error(`Unrecognized argument: '${args[0]}'`)
    }
  }

  const results = await profilePageLoad(pages, numSamples)
  const serializedResults = JSON.stringify(results, null, 2)

  if (outputPath) {
    // Create the output directory only when it did not already exist.
    if (outputDirectory !== existingParentDirectory) {
      await fs.mkdir(outputDirectory, { recursive: true })
    }
    await fs.writeFile(outputPath, serializedResults)
  } else {
    console.log(serializedResults)
  }
}

// Run the benchmark; on any rejection, log the error and exit with status 1.
main().catch((error) => {
  console.error(error)
  process.exit(1)
})
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`#!/usr/bin/env node`

			`const path = require('path')`
			`const { promises: fs, constants: fsConstants } = require('fs')`
Add margin of error metric (#7877) A margin of error metric has been added, which is calculated from a 95% confidence interval. This confidence interval is calculated using Student's t-distribution, which is generally preferred for smaller sample sizes (< ~30) of populations following a normal distribution. 5 years ago			`const ttest = require('ttest')`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`const { By, Key } = require('selenium-webdriver')`
			`const { withFixtures } = require('./helpers')`
			`const { PAGES } = require('./webdriver/driver')`

Add benchmark to CI (#7871) * Add benchmark to CI The page load benchmark for Chrome is now run during CI, and the results are collected and summarized in the `metamaskbot` comment. Closes #6881 * Double default number of samples The number of default samples was changed from 10 to 20. The results from 10 samples would show statistically significant changes in page load times between builds, so weren't a sufficiently useful metric. 5 years ago			`const DEFAULT_NUM_SAMPLES = 20`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`const ALL_PAGES = Object.values(PAGES)`

			`async function measurePage (pageName) {`
			`let metrics`
			`await withFixtures({ fixtures: 'imported-account' }, async ({ driver }) => {`
			`const passwordField = await driver.findElement(By.css('#password'))`
			`await passwordField.sendKeys('correct horse battery staple')`
			`await passwordField.sendKeys(Key.ENTER)`
Implement new fullscreen design (#8657) The fullscreen UI now shows roughly the same design as the popup UI. A few additional changes depicted in the new fullscreen designs will be implemented in subsequent PRs (e.g. the inline buttons on assets) This was done now to make asset pages easier to implement. Implementing asset pages solely for the popup UI would have been complicated by the fact that we use viewport size to switch between the two layouts, so we would have had to re-route upon resizing the window. 5 years ago			`await driver.findElement(By.css('.selected-account__name'))`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`await driver.navigate(pageName)`
			`await driver.delay(1000)`
			`metrics = await driver.collectMetrics()`
			`})`
			`return metrics`
			`}`

			`function calculateResult (calc) {`
			`return (result) => {`
			`const calculatedResult = {}`
			`for (const key of Object.keys(result)) {`
			`calculatedResult[key] = calc(result[key])`
			`}`
			`return calculatedResult`
			`}`
			`}`
			`const calculateSum = (array) => array.reduce((sum, val) => sum + val)`
			`const calculateAverage = (array) => calculateSum(array) / array.length`
			`const minResult = calculateResult((array) => Math.min(...array))`
			`const maxResult = calculateResult((array) => Math.max(...array))`
Enable arrow-parens ESLint rule 5 years ago			`const averageResult = calculateResult((array) => calculateAverage(array))`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`const standardDeviationResult = calculateResult((array) => {`
			`const average = calculateAverage(array)`
Enable arrow-parens ESLint rule 5 years ago			`const squareDiffs = array.map((value) => Math.pow(value - average, 2))`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`return Math.sqrt(calculateAverage(squareDiffs))`
			`})`
Add margin of error metric (#7877) A margin of error metric has been added, which is calculated from a 95% confidence interval. This confidence interval is calculated using Student's t-distribution, which is generally preferred for smaller sample sizes (< ~30) of populations following a normal distribution. 5 years ago			`// 95% margin of error calculated using Student's t-distrbution`
			`const calculateMarginOfError = (array) => ttest(array).confidence()[1] - calculateAverage(array)`
			`const marginOfErrorResult = calculateResult((array) => calculateMarginOfError(array))`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago
			`async function profilePageLoad (pages, numSamples) {`
			`const results = {}`
			`for (const pageName of pages) {`
			`const runResults = []`
			`for (let i = 0; i < numSamples; i += 1) {`
			`runResults.push(await measurePage(pageName))`
			`}`

Enable arrow-parens ESLint rule 5 years ago			`if (runResults.some((result) => result.navigation.lenth > 1)) {`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			throw new Error(`Multiple navigations not supported`)
Enable arrow-parens ESLint rule 5 years ago			`} else if (runResults.some((result) => result.navigation[0].type !== 'navigate')) {`
			throw new Error(`Navigation type ${runResults.find((result) => result.navigation[0].type !== 'navigate').navigation[0].type} not supported`)
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`}`

			`const result = {`
Enable arrow-parens ESLint rule 5 years ago			`firstPaint: runResults.map((result) => result.paint['first-paint']),`
			`domContentLoaded: runResults.map((result) => result.navigation[0] && result.navigation[0].domContentLoaded),`
			`load: runResults.map((result) => result.navigation[0] && result.navigation[0].load),`
			`domInteractive: runResults.map((result) => result.navigation[0] && result.navigation[0].domInteractive),`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`}`

			`results[pageName] = {`
			`min: minResult(result),`
			`max: maxResult(result),`
			`average: averageResult(result),`
			`standardDeviation: standardDeviationResult(result),`
Add margin of error metric (#7877) A margin of error metric has been added, which is calculated from a 95% confidence interval. This confidence interval is calculated using Student's t-distribution, which is generally preferred for smaller sample sizes (< ~30) of populations following a normal distribution. 5 years ago			`marginOfError: marginOfErrorResult(result),`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`}`
			`}`
			`return results`
			`}`

			`async function isWritable (directory) {`
			`try {`
			`await fs.access(directory, fsConstants.W_OK)`
			`return true`
			`} catch (error) {`
			`if (error.code !== 'EACCES') {`
			`throw error`
			`}`
			`return false`
			`}`
			`}`

			`async function getFirstParentDirectoryThatExists (directory) {`
			`while (true) {`
			`try {`
			`await fs.access(directory, fsConstants.F_OK)`
			`return directory`
			`} catch (error) {`
			`if (error.code !== 'ENOENT') {`
			`throw error`
			`} else if (directory === path.dirname(directory)) {`
			`throw new Error('Failed to find parent directory that exists')`
			`}`
			`directory = path.dirname(directory)`
			`}`
			`}`
			`}`

			`async function main () {`
			`const args = process.argv.slice(2)`

Close notification UI if no unapproved confirmations (#8358) * close notification UI if no pending confirmations * change benchmark page to 'home' 5 years ago			`let pages = ['home']`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`let numSamples = DEFAULT_NUM_SAMPLES`
			`let outputPath`
			`let outputDirectory`
			`let existingParentDirectory`

			`while (args.length) {`
			`if (/^(--pages\|-p)$/i.test(args[0])) {`
			`if (args[1] === undefined) {`
			`throw new Error('Missing pages argument')`
			`}`
			`pages = args[1].split(',')`
			`for (const page of pages) {`
			`if (!ALL_PAGES.includes(page)) {`
			throw new Error(`Invalid page: '${page}`)
			`}`
			`}`
			`args.splice(0, 2)`
			`} else if (/^(--samples\|-s)$/i.test(args[0])) {`
			`if (args[1] === undefined) {`
			`throw new Error('Missing number of samples')`
			`}`
			`numSamples = parseInt(args[1], 10)`
			`if (isNaN(numSamples)) {`
			throw new Error(`Invalid 'samples' argument given: '${args[1]}'`)
			`}`
			`args.splice(0, 2)`
			`} else if (/^(--out\|-o)$/i.test(args[0])) {`
			`if (args[1] === undefined) {`
			`throw new Error('Missing output filename')`
			`}`
			`outputPath = path.resolve(args[1])`
			`outputDirectory = path.dirname(outputPath)`
			`existingParentDirectory = await getFirstParentDirectoryThatExists(outputDirectory)`
			`if (!await isWritable(existingParentDirectory)) {`
			throw new Error(`Specified directory is not writable: '${args[1]}'`)
			`}`
			`args.splice(0, 2)`
			`} else {`
			throw new Error(`Unrecognized argument: '${args[0]}'`)
			`}`
			`}`

			`const results = await profilePageLoad(pages, numSamples)`

			`if (outputPath) {`
			`if (outputDirectory !== existingParentDirectory) {`
			`await fs.mkdir(outputDirectory, { recursive: true })`
			`}`
			`await fs.writeFile(outputPath, JSON.stringify(results, null, 2))`
			`} else {`
			`console.log(JSON.stringify(results, null, 2))`
			`}`
			`}`

			`main()`
Enable arrow-parens ESLint rule 5 years ago			`.catch((e) => {`
Add benchmark script (#7869) The script `benchmark.js` will collect page load metrics from the extension, and print them to a file or the console. A method for collecting metrics was added to the web driver to help with this. This script will calculate the min, max, average, and standard deviation for four metrics: 'firstPaint', 'domContentLoaded', 'load', and 'domInteractive'. The variation between samples is sometimes high, with the results varying between samples if only 3 were taken. However, all tests I've done locally with 5 samples have produced results within one standard deviation of each other. The default number of samples has been set to 10, which should be more than enough to produce consistent results. The benchmark can be run with the npm script `benchmark:chrome` or `benchmark:firefox`, e.g. `yarn benchmark:chrome`. 5 years ago			`console.error(e)`
			`process.exit(1)`
			`})`