impress-2020/api/assetImage.js

/**
 * /api/assetImage renders a canvas movie to PNG! To do this, we use a headless
 * Chromium browser, which renders a special page in the webapp and screenshots
 * the displayed canvas.
 *
 * This is, of course, a relatively heavyweight operation: it's always gonna be
 * a bit slow, and consume significant RAM. So, caching is going to be
 * important, so that we're not calling this all the time and overloading the
 * endpoint!
 *
 * Parameters:
 *   - libraryUrl: A https://images.neopets.com/ URL to a JS movie library
 *   - size: 600, 300, or 150. Determines the output image size.
 */
// Honeycomb tracing client for this endpoint. Production and non-production
// traces go to separate datasets. `disableInstrumentationOnLoad` is passed
// through as-is; presumably it keeps the beeline from installing its
// automatic instrumentation at require time (confirm against the beeline
// source before relying on it).
const beelineOptions = {
  writeKey: process.env.HONEYCOMB_WRITE_KEY,
  dataset:
    process.env.NODE_ENV === "production"
      ? "Dress to Impress (2020)"
      : "Dress to Impress (2020, dev)",
  serviceName: "impress-2020-gql-server",
  disableInstrumentationOnLoad: true,
};
const beeline = require("honeycomb-beeline")(beelineOptions);

// The image is rendered by loading the web app's /internal/assetImage page,
// a small page that exists only to serve this API endpoint. Which host we
// load it from depends on the environment:
//   1. VERCEL_URL set      -> that deployment's own host
//   2. NODE_ENV=development -> the local dev server
//   3. otherwise            -> the public production site
const ASSET_IMAGE_PAGE_BASE_URL = (() => {
  const { VERCEL_URL: vercelHost, NODE_ENV: nodeEnv } = process.env;
  if (vercelHost) {
    return `https://${vercelHost}/internal/assetImage`;
  }
  if (nodeEnv === "development") {
    return "http://localhost:3000/internal/assetImage";
  }
  return "https://impress-2020.openneo.net/internal/assetImage";
})();

// TODO: We used to share a browser instamce, but we couldn't get it to reload
//       correctly after accidental closes, so we're just gonna always load a
//       new one now. What are the perf implications of this? Does it slow down
//       response time substantially?
async function getBrowser() {
  if (process.env["NODE_ENV"] === "production") {
    // In production, we use a special chrome-aws-lambda Chromium.
    const chromium = require("chrome-aws-lambda");
    const playwright = require("playwright-core");
    return await playwright.chromium.launch({
      args: chromium.args,
      executablePath: await chromium.executablePath,
      headless: true,
    });
  } else {
    // In development, we use the standard playwright Chromium.
    const playwright = require("playwright");
    return await playwright.chromium.launch({ headless: true });
  }
}

/**
 * Core request handler: validates the `libraryUrl` and `size` query
 * parameters, renders the movie to a PNG, and sends it with a long-lived
 * cache header.
 *
 * Responds 400 (via `reject`) when a parameter is missing or invalid, and 500
 * when rendering throws.
 *
 * @param req - Incoming request; `req.query` is read for the parameters.
 * @param res - Outgoing response.
 * @returns Whatever `res.send` / `reject` returns.
 */
async function handle(req, res) {
  const { libraryUrl, size } = req.query;

  // Find the first validation problem, checking in a fixed order:
  // presence of libraryUrl, then its origin, then the size.
  let validationProblem = null;
  if (!libraryUrl) {
    validationProblem = "libraryUrl is required";
  } else if (!isNeopetsUrl(libraryUrl)) {
    validationProblem = `libraryUrl must be an HTTPS Neopets URL, but was: ${libraryUrl}`;
  } else if (!["600", "300", "150"].includes(size)) {
    validationProblem = `size must be 600, 300, or 150, but was: ${size}`;
  }
  if (validationProblem !== null) {
    return reject(res, validationProblem);
  }

  let pngBuffer;
  try {
    pngBuffer = await loadAndScreenshotImage(libraryUrl, size);
  } catch (renderError) {
    console.error(renderError);
    return reject(res, `Could not load image: ${renderError.message}`, 500);
  }

  // TODO: Compress the image?

  // Rendering is expensive, so let clients and CDNs cache the result for a
  // year. If the output ever needs to change, we'll flush the cache or add a
  // version param.
  res.setHeader("Cache-Control", "public, max-age=31536000, immutable");
  res.setHeader("Content-Type", "image/png");
  return res.send(pngBuffer);
}

/**
 * Opens the internal asset-image page for the given movie library in a fresh
 * browser, waits for either the rendered canvas or an on-page error message,
 * and returns the canvas screenshot.
 *
 * The browser (and the page, if one was opened) is always closed before this
 * function settles, including when opening the page or navigating fails.
 *
 * @param libraryUrl - URL of the JS movie library, forwarded to the page as
 *   the `libraryUrl` query parameter.
 * @param size - Requested output size, forwarded as the `size` query parameter.
 * @returns The screenshot produced by `screenshotImageFromPage`.
 * @throws {Error} With the page's error message if the page reports one, or
 *   whatever `Promise.any` rejects with if neither result appears.
 */
async function loadAndScreenshotImage(libraryUrl, size) {
  const assetImagePageUrl = new URL(ASSET_IMAGE_PAGE_BASE_URL);
  assetImagePageUrl.search = new URLSearchParams({
    libraryUrl,
    size,
  }).toString();

  console.debug("Opening browser page");
  const browser = await getBrowser();
  // Declared outside the `try` so `finally` can tell whether a page was ever
  // opened. Opening the page happens *inside* the `try`, so that a failure
  // there still closes the browser we just launched.
  let page = null;

  try {
    page = await browser.newPage();
    console.debug(`Page opened, navigating to: ${assetImagePageUrl.toString()}`);

    await page.goto(assetImagePageUrl.toString());
    console.debug("Page loaded, awaiting image");

    // Start looking for the loaded canvas, *and* for an error message.
    // When either one displays, we proceed, either by returning the image if
    // present, or raising the error if present.
    const imageBufferPromise = screenshotImageFromPage(page);
    const errorMessagePromise = readErrorMessageFromPage(page);
    const firstResultFromPage = await Promise.any([
      imageBufferPromise.then((imageBuffer) => ({ imageBuffer })),
      errorMessagePromise.then((errorMessage) => ({ errorMessage })),
    ]);

    if (firstResultFromPage.errorMessage) {
      throw new Error(firstResultFromPage.errorMessage);
    } else if (firstResultFromPage.imageBuffer) {
      return firstResultFromPage.imageBuffer;
    } else {
      throw new Error(
        `Assertion error: Promise.any did not return an errorMessage or an imageBuffer: ` +
          `${JSON.stringify(Object.keys(firstResultFromPage))}`
      );
    }
  } finally {
    // Tear down our resources when we're done! If it fails, log the error, but
    // don't block the success of the image.
    if (page !== null) {
      try {
        await page.close();
      } catch (e) {
        console.warn("Error closing page after image finished", e);
      }
    }
    try {
      await browser.close();
    } catch (e) {
      console.warn("Error closing browser after image finished", e);
    }
  }
}

/**
 * Waits (up to 10 seconds) for the page's canvas to be marked as loaded, then
 * screenshots just that element with the page background omitted.
 *
 * @param page - Playwright page showing the asset-image page.
 * @returns The screenshot returned by the canvas element's `screenshot()`.
 * @throws If the loaded canvas does not appear before the timeout.
 */
async function screenshotImageFromPage(page) {
  // Use the element handle that waitForSelector resolves with, rather than
  // querying the page a second time: a second query is an extra round-trip,
  // and could come back empty if the element changed in between.
  const canvas = await page.waitForSelector(
    "#asset-image-canvas[data-is-loaded=true]",
    { timeout: 10000 }
  );
  console.debug("Image loaded, taking screenshot");

  const imageBuffer = await canvas.screenshot({
    omitBackground: true,
  });
  console.debug(`Screenshot captured, size: ${imageBuffer.length}`);

  return imageBuffer;
}

/**
 * Waits (up to 10 seconds) for the page to display its error-message element,
 * then returns that element's text.
 *
 * @param page - Playwright page showing the asset-image page.
 * @returns The text from the error element's `innerText()`.
 * @throws If the error element does not appear before the timeout.
 */
async function readErrorMessageFromPage(page) {
  // Use the element handle that waitForSelector resolves with, rather than
  // querying the page a second time (which could come back empty if the
  // element changed in between).
  const errorMessageContainer = await page.waitForSelector(
    "#asset-image-error-message",
    { timeout: 10000 }
  );
  return await errorMessageContainer.innerText();
}

/**
 * Checks whether a string is a URL served from the Neopets image host over
 * HTTPS, by comparing its parsed origin to "https://images.neopets.com".
 *
 * @param urlString - Candidate URL.
 * @returns `true` if it parses and has that exact origin; `false` if it has a
 *   different origin or cannot be parsed at all.
 */
function isNeopetsUrl(urlString) {
  try {
    return new URL(urlString).origin === "https://images.neopets.com";
  } catch (parseError) {
    // Unparseable input is simply "not a Neopets URL".
    return false;
  }
}

/**
 * Sends a plain-text error response.
 *
 * @param res - Outgoing response.
 * @param message - Body text to send.
 * @param status - HTTP status code; defaults to 400.
 * @returns Whatever `res.status(status).send(message)` returns.
 */
function reject(res, message, status = 400) {
  res.setHeader("Content-Type", "text/plain");
  const responseWithStatus = res.status(status);
  return responseWithStatus.send(message);
}

// Polyfill Promise.any for older Node, adapted from
// https://github.com/ungap/promise-any

/**
 * Fallback implementation of `Promise.any`: fulfills with the first input to
 * fulfill, or rejects once every input has rejected.
 *
 * The rejection is a real `Error` (named "AggregateError", with the individual
 * reasons on `.errors` in input order), so callers that read `.message` get a
 * meaningful string. An empty input rejects immediately instead of never
 * settling.
 *
 * @param promises - Iterable of promises or plain values.
 * @returns A promise for the first fulfilled value.
 */
function promiseAnyPolyfill(promises) {
  return new Promise((resolve, reject) => {
    const candidates = Array.from(promises);
    const errors = new Array(candidates.length);
    let pendingCount = candidates.length;

    const rejectWithAllErrors = () => {
      const aggregateError = new Error("All promises were rejected");
      aggregateError.name = "AggregateError";
      aggregateError.errors = errors;
      reject(aggregateError);
    };

    if (pendingCount === 0) {
      rejectWithAllErrors();
      return;
    }

    candidates.forEach((candidate, index) => {
      Promise.resolve(candidate).then(resolve, (reason) => {
        errors[index] = reason;
        pendingCount -= 1;
        if (pendingCount === 0) {
          rejectWithAllErrors();
        }
      });
    });
  });
}

// Only install the fallback when the runtime has no native Promise.any.
Promise.any = Promise.any || promiseAnyPolyfill;

/**
 * Exported entry point for the API route: runs `handle` inside a Honeycomb
 * trace named "api/assetImage".
 *
 * The result of `beeline.withTrace` is returned so that this function's
 * promise does not settle until `handle` has finished, and so that a
 * rejection from `handle` reaches the caller instead of being left floating.
 * (This relies on `withTrace` handing back its callback's return value —
 * confirm against the beeline documentation.)
 *
 * @param req - Incoming request, passed through to `handle`.
 * @param res - Outgoing response, passed through to `handle`.
 * @returns Whatever `handle` resolves with.
 */
async function handleWithBeeline(req, res) {
  return beeline.withTrace(
    { name: "api/assetImage", operation_name: "api/assetImage" },
    () => handle(req, res)
  );
}

export default handleWithBeeline;
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`/**`
			`* /api/assetImage renders a canvas movie to PNG! To do this, we use a headless`
			`* Chromium browser, which renders a special page in the webapp and screenshots`
			`* the displayed canvas.`
			`*`
			`* This is, of course, a relatively heavyweight operation: it's always gonna be`
			`* a bit slow, and consume significant RAM. So, caching is going to be`
			`* important, so that we're not calling this all the time and overloading the`
			`* endpoint!`
Use /api/assetImage for all image sizes We update /api/assetImage to accept size as a parameter (I make it mandatory to push people into HTTP caching happy paths), and we update the GraphQL thing to use it in those cases too! This also means that, if these images seem to go well, we could swap Classic DTI over to them… I want to turn off those RAM-heavy image converters on the VPS lol 2021-08-19 17:56:09 -07:00			`*`
			`* Parameters:`
			`* - libraryUrl: A https://images.neopets.com/ URL to a JS movie library`
			`* - size: 600, 300, or 150. Determines the output image size.`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`*/`
			`const beeline = require("honeycomb-beeline")({`
			`writeKey: process.env["HONEYCOMB_WRITE_KEY"],`
			`dataset:`
			`process.env["NODE_ENV"] === "production"`
			`? "Dress to Impress (2020)"`
			`: "Dress to Impress (2020, dev)",`
			`serviceName: "impress-2020-gql-server",`
Trickier disabling honeycomb instrumentation Hm, okay, so the documented way to not instrument anything doesn't actually stop them from patching Module._load. But this undocumented option sure does! So, woo, let's try it! lol 2021-08-08 00:23:57 -07:00			`disableInstrumentationOnLoad: true,`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`});`

			`// To render the image, we load the /internal/assetImage page in the web app,`
			`// a simple page specifically designed for this API endpoint!`
			`const ASSET_IMAGE_PAGE_BASE_URL = process.env.VERCEL_URL`
			? `https://${process.env.VERCEL_URL}/internal/assetImage`
			`: process.env.NODE_ENV === "development"`
			`? "http://localhost:3000/internal/assetImage"`
			`: "https://impress-2020.openneo.net/internal/assetImage";`

Create a new browser for each assetImage request Well, holding onto the browser instance seems to be a source of bugs (my previous fix didn't seem to fix it), and I'm not _sure_ what the perf characteristics are, so let's just try a fresh instance each time! I don't actually know what a browser "instance" in Playwright really is, I'm not sure it even necessarily creates a new process, I just don't know and I saw some Vercel example code take this approach, which is definitely simpler, and I guess must not be _overtly_ bad perf if it's idiomatic? So, like, ok, cool, let's see if this stops 500ing us with "Browser closed"! 😅 2021-09-02 19:25:48 -07:00			`// TODO: We used to share a browser instance, but we couldn't get it to reload`
			`// correctly after accidental closes, so we're just gonna always load a`
			`// new one now. What are the perf implications of this? Does it slow down`
			`// response time substantially?`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`async function getBrowser() {`
Create a new browser for each assetImage request Well, holding onto the browser instance seems to be a source of bugs (my previous fix didn't seem to fix it), and I'm not _sure_ what the perf characteristics are, so let's just try a fresh instance each time! I don't actually know what a browser "instance" in Playwright really is, I'm not sure it even necessarily creates a new process, I just don't know and I saw some Vercel example code take this approach, which is definitely simpler, and I guess must not be _overtly_ bad perf if it's idiomatic? So, like, ok, cool, let's see if this stops 500ing us with "Browser closed"! 😅 2021-09-02 19:25:48 -07:00			`if (process.env["NODE_ENV"] === "production") {`
			`// In production, we use a special chrome-aws-lambda Chromium.`
			`const chromium = require("chrome-aws-lambda");`
			`const playwright = require("playwright-core");`
			`return await playwright.chromium.launch({`
			`args: chromium.args,`
			`executablePath: await chromium.executablePath,`
			`headless: true,`
			`});`
			`} else {`
			`// In development, we use the standard playwright Chromium.`
			`const playwright = require("playwright");`
			`return await playwright.chromium.launch({ headless: true });`
Reboot assetImage browser when it disappears Been seeing this in testing in prod, the first few images worked great, but then eventually they all started saying the browser was disconnected. Here, we add a check to reconnect if it goes missing. This is actually kinda hard to test in dev, because the dev server creates a new process every time the function runs, so fingers crossed! I also added explicit logic to close the page when we're done with it, I'm worried we crashed the browser by exceeding the RAM limit by leaving pages open. Not sure quite how their model works and whether things eventually get flushed out on their own! 2021-08-19 23:38:25 -07:00			`}`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`}`

			`async function handle(req, res) {`
Use /api/assetImage for all image sizes We update /api/assetImage to accept size as a parameter (I make it mandatory to push people into HTTP caching happy paths), and we update the GraphQL thing to use it in those cases too! This also means that, if these images seem to go well, we could swap Classic DTI over to them… I want to turn off those RAM-heavy image converters on the VPS lol 2021-08-19 17:56:09 -07:00			`const { libraryUrl, size } = req.query;`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`if (!libraryUrl) {`
			`return reject(res, "libraryUrl is required");`
			`}`

			`if (!isNeopetsUrl(libraryUrl)) {`
			`return reject(`
			`res,`
			`libraryUrl must be an HTTPS Neopets URL, but was: ${libraryUrl}`
			`);`
			`}`

Use /api/assetImage for all image sizes We update /api/assetImage to accept size as a parameter (I make it mandatory to push people into HTTP caching happy paths), and we update the GraphQL thing to use it in those cases too! This also means that, if these images seem to go well, we could swap Classic DTI over to them… I want to turn off those RAM-heavy image converters on the VPS lol 2021-08-19 17:56:09 -07:00			`if (size !== "600" && size !== "300" && size !== "150") {`
			return reject(res, `size must be 600, 300, or 150, but was: ${size}`);
			`}`

/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`let imageBuffer;`
			`try {`
Use /api/assetImage for all image sizes We update /api/assetImage to accept size as a parameter (I make it mandatory to push people into HTTP caching happy paths), and we update the GraphQL thing to use it in those cases too! This also means that, if these images seem to go well, we could swap Classic DTI over to them… I want to turn off those RAM-heavy image converters on the VPS lol 2021-08-19 17:56:09 -07:00			`imageBuffer = await loadAndScreenshotImage(libraryUrl, size);`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`} catch (e) {`
			`console.error(e);`
			return reject(res, `Could not load image: ${e.message}`, 500);
			`}`

			`// TODO: Compress the image?`

			`// Send a long-term cache header, to avoid running this any more than we have`
			`// to! If we make a big change, we'll flush the cache or add a version param.`
			`res.setHeader("Cache-Control", "public, max-age=31536000, immutable");`
			`res.setHeader("Content-Type", "image/png");`
			`return res.send(imageBuffer);`
			`}`

Use /api/assetImage for all image sizes We update /api/assetImage to accept size as a parameter (I make it mandatory to push people into HTTP caching happy paths), and we update the GraphQL thing to use it in those cases too! This also means that, if these images seem to go well, we could swap Classic DTI over to them… I want to turn off those RAM-heavy image converters on the VPS lol 2021-08-19 17:56:09 -07:00			`async function loadAndScreenshotImage(libraryUrl, size) {`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`const assetImagePageUrl = new URL(ASSET_IMAGE_PAGE_BASE_URL);`
Use /api/assetImage for all image sizes We update /api/assetImage to accept size as a parameter (I make it mandatory to push people into HTTP caching happy paths), and we update the GraphQL thing to use it in those cases too! This also means that, if these images seem to go well, we could swap Classic DTI over to them… I want to turn off those RAM-heavy image converters on the VPS lol 2021-08-19 17:56:09 -07:00			`assetImagePageUrl.search = new URLSearchParams({`
			`libraryUrl,`
			`size,`
			`}).toString();`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00
			`console.debug("Opening browser page");`
			`const browser = await getBrowser();`
			`const page = await browser.newPage();`
			`console.debug("Page opened, navigating to: " + assetImagePageUrl.toString());`

Reboot assetImage browser when it disappears Been seeing this in testing in prod, the first few images worked great, but then eventually they all started saying the browser was disconnected. Here, we add a check to reconnect if it goes missing. This is actually kinda hard to test in dev, because the dev server creates a new process every time the function runs, so fingers crossed! I also added explicit logic to close the page when we're done with it, I'm worried we crashed the browser by exceeding the RAM limit by leaving pages open. Not sure quite how their model works and whether things eventually get flushed out on their own! 2021-08-19 23:38:25 -07:00			`try {`
			`await page.goto(assetImagePageUrl.toString());`
			`console.debug("Page loaded, awaiting image");`

			`// Start looking for the loaded canvas, and for an error message.`
			`// When either one displays, we proceed, either by returning the image if`
			`// present, or raising the error if present.`
			`const imageBufferPromise = screenshotImageFromPage(page);`
			`const errorMessagePromise = readErrorMessageFromPage(page);`
			`const firstResultFromPage = await Promise.any([`
			`imageBufferPromise.then((imageBuffer) => ({ imageBuffer })),`
			`errorMessagePromise.then((errorMessage) => ({ errorMessage })),`
			`]);`

			`if (firstResultFromPage.errorMessage) {`
			`throw new Error(firstResultFromPage.errorMessage);`
			`} else if (firstResultFromPage.imageBuffer) {`
			`return firstResultFromPage.imageBuffer;`
			`} else {`
			`throw new Error(`
			`Assertion error: Promise.any did not return an errorMessage or an imageBuffer: ` +
			`${JSON.stringify(Object.keys(firstResultFromPage))}`
			`);`
			`}`
			`} finally {`
Await closing Playwright before finish request I noticed when loading Your Outfits earlier (before I switched it to just use prod images even on dev), that there was a big memory leak slowing down my machine. My hypothesis is that this is because I wasn't _waiting_ for the resources to tear down before finishing the request, so Vercel terminated the request early, and I further hypothesize that terminating a Playwright session partway through isn't guaranteed to clean up the browser. Not sure about that! Could have just been that we spun up a lot at once, and a bunch of things went into swap! (But I thought it generally handles requests in serial in the dev server? So that feels unlikely.) Anyway, I don't feel like extensively testing this again and maybe messing up my computer session again :p Just, when I first wrote this without awaits, I knew that it was a bit risky, but I wanted to _see_ if it was a problem before slowing down individual requests by awaiting. And now, my "it's likely to be a problem" threshold has been reached, lol! So, I'm not _confident_ this is the best play, I don't know the internals well enough; but it seems like a better side to err on than the other, now that I know more! 2021-09-03 15:43:27 -07:00			`// Tear down our resources when we're done! If it fails, log the error, but`
			`// don't block the success of the image.`
			`try {`
			`await page.close();`
			`} catch (e) {`
			`console.warn("Error closing page after image finished", e);`
			`}`
			`try {`
			`await browser.close();`
			`} catch (e) {`
			`console.warn("Error closing browser after image finished", e);`
			`}`
/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`}`
			`}`

			`async function screenshotImageFromPage(page) {`
			`await page.waitForSelector("#asset-image-canvas[data-is-loaded=true]", {`
			`timeout: 10000,`
			`});`
			`const canvas = await page.$("#asset-image-canvas[data-is-loaded=true]");`
			`console.debug("Image loaded, taking screenshot");`

			`const imageBuffer = await canvas.screenshot({`
			`omitBackground: true,`
			`});`
			console.debug(`Screenshot captured, size: ${imageBuffer.length}`);

			`return imageBuffer;`
			`}`

			`async function readErrorMessageFromPage(page) {`
			`await page.waitForSelector("#asset-image-error-message", {`
			`timeout: 10000,`
			`});`
			`const errorMessageContainer = await page.$("#asset-image-error-message");`
			`const errorMessage = await errorMessageContainer.innerText();`
			`return errorMessage;`
			`}`

			`function isNeopetsUrl(urlString) {`
			`let url;`
			`try {`
			`url = new URL(urlString);`
			`} catch (e) {`
			`return false;`
			`}`

			`return url.origin === "https://images.neopets.com";`
			`}`

			`function reject(res, message, status = 400) {`
			`res.setHeader("Content-Type", "text/plain");`
			`return res.status(status).send(message);`
			`}`

Polyfill Promise.any for Node v14 Oops, Promise.any was added in Node 15, but prod uses Node 14! Polyfill it! 2021-08-17 01:43:39 -07:00			`// Polyfill Promise.any for older Node: https://github.com/ungap/promise-any`
			`Promise.any =`
			`Promise.any \|\|`
			`function ($) {`
			`return new Promise(function (D, E, A, L) {`
			`A = [];`
			`L = $.map(function ($, i) {`
			`return Promise.resolve($).then(D, function (O) {`
			`return ((A[i] = O), --L) \|\| E({ errors: A });`
			`});`
			`}).length;`
			`});`
			`};`

/api/assetImage can render movies! Yeah wow huh, that was much less painful than I expected! I haven't tested this very rigorously, literally just the Floating Negg Faerie Doll: https://images.neopets.com/cp/items/data/000/000/005/5735_a8feda8d08/5735.js 2021-07-02 15:19:11 -07:00			`async function handleWithBeeline(req, res) {`
			`beeline.withTrace(`
			`{ name: "api/assetImage", operation_name: "api/assetImage" },`
			`() => handle(req, res)`
			`);`
			`}`

			`export default handleWithBeeline;`