458 lines
14 KiB
JavaScript
458 lines
14 KiB
JavaScript
/* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
|
|
|
const lazy = {};
|
|
|
|
ChromeUtils.defineESModuleGetters(lazy, {
|
|
SkippableTimer: "resource:///modules/UrlbarUtils.sys.mjs",
|
|
UrlbarPrefs: "resource:///modules/UrlbarPrefs.sys.mjs",
|
|
UrlbarUtils: "resource:///modules/UrlbarUtils.sys.mjs",
|
|
});
|
|
|
|
const SEARCH_PARAMS = {
|
|
CLIENT_VARIANTS: "client_variants",
|
|
PROVIDERS: "providers",
|
|
QUERY: "q",
|
|
SEQUENCE_NUMBER: "seq",
|
|
SESSION_ID: "sid",
|
|
};
|
|
|
|
const SESSION_TIMEOUT_MS = 5 * 60 * 1000; // 5 minutes
|
|
|
|
/**
|
|
* Client class for querying the Merino server. Each instance maintains its own
|
|
* session state including a session ID and sequence number that is included in
|
|
* its requests to Merino.
|
|
*/
|
|
export class MerinoClient {
|
|
/**
|
|
* @returns {object}
|
|
* The names of URL search params.
|
|
*/
|
|
static get SEARCH_PARAMS() {
|
|
return { ...SEARCH_PARAMS };
|
|
}
|
|
|
|
/**
|
|
* @param {string} name
|
|
* An optional name for the client. It will be included in log messages.
|
|
* @param {object} options
|
|
* Options object
|
|
* @param {string} options.cachePeriodMs
|
|
* Enables caching when nonzero. The client will cache the response
|
|
* suggestions from its most recent successful request for the specified
|
|
* period. The client will serve the cached suggestions for all fetches for
|
|
* the same URL until either the cache period elapses or a successful fetch
|
|
* for a different URL is made (ignoring session-related URL params like
|
|
* session ID and sequence number). Caching is per `MerinoClient` instance
|
|
* and is not shared across instances.
|
|
*
|
|
* WARNING: Cached suggestions are only ever evicted when new suggestions
|
|
* are cached. They are not evicted on a timer. If the client has cached
|
|
* some suggestions and no further fetches are made, they'll stay cached
|
|
* indefinitely. If your request URLs contain senstive data that should not
|
|
* stick around in the object graph indefinitely, you should either not use
|
|
* caching or you should implement an eviction mechanism.
|
|
*
|
|
* This cache strategy is intentionally simplistic and designed to be used
|
|
* by the urlbar with very short cache periods to make sure Firefox doesn't
|
|
* repeatedly call the same Merino URL on each keystroke in a urlbar
|
|
* session, which is wasteful and can cause a suggestion to flicker out of
|
|
* and into the urlbar panel as the user matches it again and again,
|
|
* especially when Merino latency is high. It is not designed to be a
|
|
* general caching mechanism. If you need more complex or long-lived
|
|
* caching, try working with the Merino team to add cache headers to the
|
|
* relevant responses so you can leverage Firefox's HTTP cache.
|
|
*/
|
|
constructor(name = "anonymous", { cachePeriodMs = 0 } = {}) {
|
|
this.#name = name;
|
|
this.#cachePeriodMs = cachePeriodMs;
|
|
ChromeUtils.defineLazyGetter(this, "logger", () =>
|
|
lazy.UrlbarUtils.getLogger({ prefix: `MerinoClient [${name}]` })
|
|
);
|
|
}
|
|
|
|
/**
|
|
* @returns {string}
|
|
* The name of the client.
|
|
*/
|
|
get name() {
|
|
return this.#name;
|
|
}
|
|
|
|
/**
|
|
* @returns {number}
|
|
* If `resetSession()` is not called within this timeout period after a
|
|
* session starts, the session will time out and the next fetch will begin a
|
|
* new session.
|
|
*/
|
|
get sessionTimeoutMs() {
|
|
return this.#sessionTimeoutMs;
|
|
}
|
|
set sessionTimeoutMs(value) {
|
|
this.#sessionTimeoutMs = value;
|
|
}
|
|
|
|
/**
|
|
* @returns {number}
|
|
* The current session ID. Null when there is no active session.
|
|
*/
|
|
get sessionID() {
|
|
return this.#sessionID;
|
|
}
|
|
|
|
/**
|
|
* @returns {number}
|
|
* The current sequence number in the current session. Zero when there is no
|
|
* active session.
|
|
*/
|
|
get sequenceNumber() {
|
|
return this.#sequenceNumber;
|
|
}
|
|
|
|
/**
|
|
* @returns {string}
|
|
* A string that indicates the status of the last fetch. Possible values:
|
|
* success, timeout, network_error, http_error
|
|
*/
|
|
get lastFetchStatus() {
|
|
return this.#lastFetchStatus;
|
|
}
|
|
|
|
/**
|
|
* Fetches Merino suggestions.
|
|
*
|
|
* @param {object} options
|
|
* Options object
|
|
* @param {string} options.query
|
|
* The search string.
|
|
* @param {Array} options.providers
|
|
* Array of provider names to request from Merino. If this is given it will
|
|
* override the `merinoProviders` Nimbus variable and its fallback pref
|
|
* `browser.urlbar.merino.providers`.
|
|
* @param {number} options.timeoutMs
|
|
* Timeout in milliseconds. This method will return once the timeout
|
|
* elapses, a response is received, or an error occurs, whichever happens
|
|
* first.
|
|
* @param {object} options.otherParams
|
|
* If specified, the otherParams will be added as a query params. Currently
|
|
* used for accuweather's location autocomplete endpoint
|
|
* @returns {Array}
|
|
* The Merino suggestions or null if there's an error or unexpected
|
|
* response.
|
|
*/
|
|
async fetch({
|
|
query,
|
|
providers = null,
|
|
timeoutMs = lazy.UrlbarPrefs.get("merinoTimeoutMs"),
|
|
otherParams = {},
|
|
}) {
|
|
this.logger.debug("Fetch start", { query });
|
|
|
|
// Get the endpoint URL. It's empty by default when running tests so they
|
|
// don't hit the network.
|
|
let endpointString = lazy.UrlbarPrefs.get("merinoEndpointURL");
|
|
if (!endpointString) {
|
|
return [];
|
|
}
|
|
let url = URL.parse(endpointString);
|
|
if (!url) {
|
|
let error = new Error(`${endpointString} is not a valid URL`);
|
|
this.logger.error("Error creating endpoint URL", error);
|
|
return [];
|
|
}
|
|
|
|
// Start setting search params. Leave session-related params for last.
|
|
url.searchParams.set(SEARCH_PARAMS.QUERY, query);
|
|
|
|
let clientVariants = lazy.UrlbarPrefs.get("merinoClientVariants");
|
|
if (clientVariants) {
|
|
url.searchParams.set(SEARCH_PARAMS.CLIENT_VARIANTS, clientVariants);
|
|
}
|
|
|
|
let providersString;
|
|
if (providers != null) {
|
|
if (!Array.isArray(providers)) {
|
|
throw new Error("providers must be an array if given");
|
|
}
|
|
providersString = providers.join(",");
|
|
} else {
|
|
let value = lazy.UrlbarPrefs.get("merinoProviders");
|
|
if (value) {
|
|
// The Nimbus variable/pref is used only if it's a non-empty string.
|
|
providersString = value;
|
|
}
|
|
}
|
|
|
|
// An empty providers string is a valid value and means Merino should
|
|
// receive the request but not return any suggestions, so do not do a simple
|
|
// `if (providersString)` here.
|
|
if (typeof providersString == "string") {
|
|
url.searchParams.set(SEARCH_PARAMS.PROVIDERS, providersString);
|
|
}
|
|
|
|
// if otherParams are present add them to the url
|
|
for (const [param, value] of Object.entries(otherParams)) {
|
|
url.searchParams.set(param, value);
|
|
}
|
|
|
|
// At this point, all search params should be set except for session-related
|
|
// params.
|
|
|
|
let details = { query, providers, timeoutMs, url: url.toString() };
|
|
this.logger.debug("Fetch details", details);
|
|
|
|
// If caching is enabled, generate the cache key for this request URL.
|
|
let cacheKey;
|
|
if (this.#cachePeriodMs && !MerinoClient._test_disableCache) {
|
|
url.searchParams.sort();
|
|
cacheKey = url.toString();
|
|
|
|
// If we have cached suggestions and they're still valid, return them.
|
|
if (
|
|
this.#cache.suggestions &&
|
|
Date.now() < this.#cache.dateMs + this.#cachePeriodMs &&
|
|
this.#cache.key == cacheKey
|
|
) {
|
|
this.logger.debug("Fetch served from cache");
|
|
return this.#cache.suggestions;
|
|
}
|
|
}
|
|
|
|
// At this point, we're calling Merino.
|
|
|
|
// Set up the Merino session ID and related state. The session ID is a UUID
|
|
// without leading and trailing braces.
|
|
if (!this.#sessionID) {
|
|
let uuid = Services.uuid.generateUUID().toString();
|
|
this.#sessionID = uuid.substring(1, uuid.length - 1);
|
|
this.#sequenceNumber = 0;
|
|
this.#sessionTimer?.cancel();
|
|
|
|
// Per spec, for the user's privacy, the session should time out and a new
|
|
// session ID should be used if the engagement does not end soon.
|
|
this.#sessionTimer = new lazy.SkippableTimer({
|
|
name: "Merino session timeout",
|
|
time: this.#sessionTimeoutMs,
|
|
logger: this.logger,
|
|
callback: () => this.resetSession(),
|
|
});
|
|
}
|
|
url.searchParams.set(SEARCH_PARAMS.SESSION_ID, this.#sessionID);
|
|
url.searchParams.set(SEARCH_PARAMS.SEQUENCE_NUMBER, this.#sequenceNumber);
|
|
this.#sequenceNumber++;
|
|
|
|
let recordResponse = category => {
|
|
this.logger.debug("Fetch done", { status: category });
|
|
this.#lastFetchStatus = category;
|
|
recordResponse = null;
|
|
};
|
|
|
|
// Set up the timeout timer.
|
|
let timer = (this.#timeoutTimer = new lazy.SkippableTimer({
|
|
name: "Merino timeout",
|
|
time: timeoutMs,
|
|
logger: this.logger,
|
|
callback: () => {
|
|
// The fetch timed out.
|
|
this.logger.debug("Fetch timed out", { timeoutMs });
|
|
recordResponse?.("timeout");
|
|
},
|
|
}));
|
|
|
|
// If there's an ongoing fetch, abort it so there's only one at a time. By
|
|
// design we do not abort fetches on timeout or when the query is canceled
|
|
// so we can record their latency.
|
|
try {
|
|
this.#fetchController?.abort();
|
|
} catch (error) {
|
|
this.logger.error("Error aborting previous fetch", error);
|
|
}
|
|
|
|
// Do the fetch.
|
|
let response;
|
|
let controller = (this.#fetchController = new AbortController());
|
|
await Promise.race([
|
|
timer.promise,
|
|
(async () => {
|
|
try {
|
|
// Canceling the timer below resolves its promise, which can resolve
|
|
// the outer promise created by `Promise.race`. This inner async
|
|
// function happens not to await anything after canceling the timer,
|
|
// but if it did, `timer.promise` could win the race and resolve the
|
|
// outer promise without a value. For that reason, we declare
|
|
// `response` in the outer scope and set it here instead of returning
|
|
// the response from this inner function and assuming it will also be
|
|
// returned by `Promise.race`.
|
|
response = await fetch(url, { signal: controller.signal });
|
|
this.logger.debug("Got response", {
|
|
status: response.status,
|
|
...details,
|
|
});
|
|
if (!response.ok) {
|
|
recordResponse?.("http_error");
|
|
}
|
|
} catch (error) {
|
|
if (error.name != "AbortError") {
|
|
this.logger.error("Fetch error", error);
|
|
recordResponse?.("network_error");
|
|
}
|
|
} finally {
|
|
// Now that the fetch is done, cancel the timeout timer so it doesn't
|
|
// fire and record a timeout. If it already fired, which it would have
|
|
// on timeout, or was already canceled, this is a no-op.
|
|
timer.cancel();
|
|
if (controller == this.#fetchController) {
|
|
this.#fetchController = null;
|
|
}
|
|
this.#nextResponseDeferred?.resolve(response);
|
|
this.#nextResponseDeferred = null;
|
|
}
|
|
})(),
|
|
]);
|
|
if (timer == this.#timeoutTimer) {
|
|
this.#timeoutTimer = null;
|
|
}
|
|
|
|
if (!response?.ok) {
|
|
// `recordResponse()` was already called above, no need to call it here.
|
|
return [];
|
|
}
|
|
|
|
if (response.status == 204) {
|
|
// No content. We check for this because `response.json()` (below) throws
|
|
// in this case, and since we log the error it can spam the console.
|
|
recordResponse?.("no_suggestion");
|
|
return [];
|
|
}
|
|
|
|
// Get the response body as an object.
|
|
let body;
|
|
try {
|
|
body = await response.json();
|
|
} catch (error) {
|
|
this.logger.error("Error getting response as JSON", error);
|
|
}
|
|
|
|
if (body) {
|
|
this.logger.debug("Response body", body);
|
|
}
|
|
|
|
if (!body?.suggestions?.length) {
|
|
recordResponse?.("no_suggestion");
|
|
return [];
|
|
}
|
|
|
|
let { suggestions, request_id } = body;
|
|
if (!Array.isArray(suggestions)) {
|
|
this.logger.error("Unexpected response", body);
|
|
recordResponse?.("no_suggestion");
|
|
return [];
|
|
}
|
|
|
|
recordResponse?.("success");
|
|
suggestions = suggestions.map(suggestion => ({
|
|
...suggestion,
|
|
request_id,
|
|
source: "merino",
|
|
}));
|
|
|
|
if (cacheKey) {
|
|
this.#cache = {
|
|
suggestions,
|
|
key: cacheKey,
|
|
dateMs: Date.now(),
|
|
};
|
|
}
|
|
|
|
return suggestions;
|
|
}
|
|
|
|
/**
|
|
* Resets the Merino session ID and related state.
|
|
*/
|
|
resetSession() {
|
|
this.#sessionID = null;
|
|
this.#sequenceNumber = 0;
|
|
this.#sessionTimer?.cancel();
|
|
this.#sessionTimer = null;
|
|
this.#nextSessionResetDeferred?.resolve();
|
|
this.#nextSessionResetDeferred = null;
|
|
}
|
|
|
|
/**
|
|
* Cancels the timeout timer.
|
|
*/
|
|
cancelTimeoutTimer() {
|
|
this.#timeoutTimer?.cancel();
|
|
}
|
|
|
|
/**
|
|
* Returns a promise that's resolved when the next response is received or a
|
|
* network error occurs.
|
|
*
|
|
* @returns {Promise}
|
|
* The promise is resolved with the `Response` object or undefined if a
|
|
* network error occurred.
|
|
*/
|
|
waitForNextResponse() {
|
|
if (!this.#nextResponseDeferred) {
|
|
this.#nextResponseDeferred = Promise.withResolvers();
|
|
}
|
|
return this.#nextResponseDeferred.promise;
|
|
}
|
|
|
|
/**
|
|
* Returns a promise that's resolved when the session is next reset, including
|
|
* on session timeout.
|
|
*
|
|
* @returns {Promise}
|
|
*/
|
|
waitForNextSessionReset() {
|
|
if (!this.#nextSessionResetDeferred) {
|
|
this.#nextSessionResetDeferred = Promise.withResolvers();
|
|
}
|
|
return this.#nextSessionResetDeferred.promise;
|
|
}
|
|
|
|
static _test_disableCache = false;
|
|
|
|
get _test_sessionTimer() {
|
|
return this.#sessionTimer;
|
|
}
|
|
|
|
get _test_timeoutTimer() {
|
|
return this.#timeoutTimer;
|
|
}
|
|
|
|
get _test_fetchController() {
|
|
return this.#fetchController;
|
|
}
|
|
|
|
// State related to the current session.
|
|
#sessionID = null;
|
|
#sequenceNumber = 0;
|
|
#sessionTimer = null;
|
|
#sessionTimeoutMs = SESSION_TIMEOUT_MS;
|
|
|
|
#name;
|
|
#timeoutTimer = null;
|
|
#fetchController = null;
|
|
#lastFetchStatus = null;
|
|
#nextResponseDeferred = null;
|
|
#nextSessionResetDeferred = null;
|
|
#cachePeriodMs = 0;
|
|
|
|
// When caching is enabled, we cache response suggestions from the most recent
|
|
// successful request.
|
|
#cache = {
|
|
// The cached suggestions array.
|
|
suggestions: null,
|
|
// The cache key: the stringified request URL without session-related params
|
|
// (session ID and sequence number).
|
|
key: null,
|
|
// The date the suggestions were cached as returned by `Date.now()`.
|
|
dateMs: 0,
|
|
};
|
|
}
|