rx-player

/** * Copyright 2015 CANAL+ Group * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ import isNonEmptyString from "./is_non_empty_string"; import startsWith from "./starts_with"; // Scheme part of an url (e.g. "http://"). const schemeRe = /^(?:[a-z]+:)?\/\//i; /** * Match the different components of an URL. * * foo://example.com:8042/over/there?name=ferret#nose \_/ \______________/\_________/ \_________/ \__/ | | | | | scheme authority path query fragment * 1st match is the scheme: (e.g. "foo://") * 2nd match is the authority (e.g "example.com:8042") * 3rd match is the path (e.g "/over/there") * 4th match is the query params (e.g "name=ferret") * 5th match is the fragment (e.g "nose") * */ const urlComponentRegex = /^(?:([^:/?#]+):)?(?:\/\/([^/?#]*))?([^?#]*)(?:\?([^#]*))?(?:#(.*))?$/; /** * In a given URL, find the index at which the filename begins. * That is, this function finds the index of the last `/` character and returns * the index after it, returning the length of the whole URL if no `/` was found * after the scheme (i.e. in `http://`, the slashes are not considered). * @param {string} url * @returns {number} */ function getFilenameIndexInUrl(url: string): number { const indexOfLastSlash = url.lastIndexOf("/"); if (indexOfLastSlash < 0) { return url.length; } if (schemeRe.test(url)) { const firstSlashIndex = url.indexOf("/"); if (firstSlashIndex >= 0 && indexOfLastSlash === firstSlashIndex + 1) { // The "/" detected is actually the one from the protocol part of the URL // ("https://") return url.length; } } const indexOfQuestionMark = url.indexOf("?"); if (indexOfQuestionMark >= 0 && indexOfQuestionMark < indexOfLastSlash) { // There are query parameters. Let's ignore them and re-run the logic // without return getFilenameIndexInUrl(url.substring(0, indexOfQuestionMark)); } return indexOfLastSlash + 1; } /** * Take two URLs and try to construct a relative URL for the second (`newUrl`) * relative to the first (`baseUrl`). * * Returns `null` if they appear to be on different domains, depend on * different schemes or if we don't have enough information to compute the * relative URL. * @param {string} baseUrl * @param {string} newUrl * @returns {string} */ function getRelativeUrl(baseUrl: string, newUrl: string): string | null { const baseParts = parseURL(baseUrl); const newParts = parseURL(newUrl); if ( baseParts.scheme !== newParts.scheme || baseParts.authority !== newParts.authority ) { return null; } if ( // if base and new path are mixed between absolute and relative path, return null (baseParts.path[0] !== undefined && baseParts.path[0] !== "/" && newParts.path[0] === "/") || (newParts.path[0] !== undefined && newParts.path[0] !== "/" && baseParts.path[0] === "/") ) { return null; } const baseNormalizedPath = removeDotSegment(baseParts.path); const newNormalizedPath = removeDotSegment(newParts.path); let relativePath: string | undefined; if (baseNormalizedPath === newNormalizedPath) { relativePath = ""; } else { const basePathSplitted = baseNormalizedPath.split("/"); // remove everything after the last trailing / basePathSplitted.pop(); const newPathSplitted = newNormalizedPath.split("/"); while ( basePathSplitted.length > 0 && newPathSplitted.length > 0 && basePathSplitted[0] === newPathSplitted[0] ) { basePathSplitted.shift(); newPathSplitted.shift(); } while (basePathSplitted.length > 0) { basePathSplitted.shift(); newPathSplitted.unshift(".."); } let pathJoined = newPathSplitted.join("/"); if (pathJoined.endsWith("../") || pathJoined.endsWith("./")) { pathJoined = pathJoined.slice(0, pathJoined.length - 1); } relativePath = pathJoined === "" ? "." : pathJoined; } let result = relativePath; if (relativePath === "" && newParts.query === baseParts.query) { // path and query is the same, we don't need to rewrite it } else if (isNonEmptyString(newParts.query)) { result += "?"; result += newParts.query; } if (isNonEmptyString(newParts.fragment)) { result += "#"; result += newParts.fragment; } return result; } /** * Resolve the output URL from the baseURL and the relative reference as * specified by RFC 3986 section 5. * @param base * @param relative * @see https://datatracker.ietf.org/doc/html/rfc3986#section-5 * @example base: http://example.com | relative: /b/c | output: http://example.com/b/c * @returns the resolved url */ function _resolveURL(base: string, relative: string) { const baseParts = parseURL(base); const relativeParts = parseURL(relative); if (isNonEmptyString(relativeParts.scheme)) { return formatURL(relativeParts); } const target: IParsedURL = { scheme: baseParts.scheme, authority: baseParts.authority, path: "", query: relativeParts.query, fragment: relativeParts.fragment, }; if (isNonEmptyString(relativeParts.authority)) { target.authority = relativeParts.authority; target.path = removeDotSegment(relativeParts.path); return formatURL(target); } if (relativeParts.path === "") { target.path = baseParts.path; if (!isNonEmptyString(relativeParts.query)) { target.query = baseParts.query; } } else { if (startsWith(relativeParts.path, "/")) { // path is absolute target.path = removeDotSegment(relativeParts.path); } else { // path is relative target.path = removeDotSegment(mergePaths(baseParts, relativeParts.path)); } } return formatURL(target); } interface IParsedURL { scheme: string; authority: string; path: string; query: string; fragment: string; } /** * Cache to store already parsed URLs to avoid unnecessary computation when parsing the same URL again. */ const parsedUrlCache = new Map<string, IParsedURL>(); /** * Sets the maximum number of entries allowed in the parsedUrlCache map. * This limit helps prevent excessive memory usage. The value is arbitrary. */ const MAX_URL_CACHE_ENTRIES = 200; /** * Parses a URL into its components. * @param {string} url - The URL to parse. * @returns {IParsedURL} The parsed URL components. */ function parseURL(url: string): IParsedURL { if (parsedUrlCache.has(url)) { return parsedUrlCache.get(url) as IParsedURL; } const matches = url.match(urlComponentRegex); let parsed: IParsedURL; if (matches === null) { parsed = { scheme: "", authority: "", path: "", query: "", fragment: "", }; } else { parsed = { scheme: matches[1] ?? "", authority: matches[2] ?? "", path: matches[3] ?? "", query: matches[4] ?? "", fragment: matches[5] ?? "", }; } if (parsedUrlCache.size >= MAX_URL_CACHE_ENTRIES) { parsedUrlCache.clear(); } parsedUrlCache.set(url, parsed); return parsed; } /** * Formats a parsed URL into a string. * @param {IParsedURL} parts - The parsed URL components. * @returns {string} The formatted URL string. */ function formatURL(parts: IParsedURL): string { let url = ""; if (isNonEmptyString(parts.scheme)) { url += parts.scheme + ":"; } if (isNonEmptyString(parts.authority)) { url += "//" + parts.authority; } url += parts.path; if (isNonEmptyString(parts.query)) { url += "?" + parts.query; } if (isNonEmptyString(parts.fragment)) { url += "#" + parts.fragment; } return url; } /** * Removes "." and ".." from the URL path, as described by the algorithm * in RFC 3986 Section 5.2.4. Remove Dot Segments * @param {string} path - The URL path * @see https://datatracker.ietf.org/doc/html/rfc3986#section-5.2.4 * @returns The path with dot segments removed. * @example "/baz/booz/../biz" => "/baz/biz" */ function removeDotSegment(path: string): string { const segments = path.split(/(?=\/)/); const output: string[] = []; for (let i = 0; i < segments.length; i++) { const segment = segments[i]; if (segment === ".." || segment === "." || segment === "") { continue; } if (segment === "/..") { output.pop(); // if it's last segment push a trailing "/" if (i === segments.length - 1) { output.push("/"); } continue; } if (segment === "/.") { // if it's last segment push a trailing "/" if (i === segments.length - 1) { output.push("/"); } continue; } output.push(segment); } return output.join(""); } /** * Merges a base URL path with a relative URL path, as described by * the algorithm merge paths in RFC 3986 Section 5.2.3. Merge Paths * @param {IParsedURL} baseParts - The parsed base URL components. * @param {string} relativePath - The relative URL path. * @returns {string} The merged URL path. * @see https://datatracker.ietf.org/doc/html/rfc3986#section-5.2.3 */ function mergePaths(baseParts: IParsedURL, relativePath: string): string { if (isNonEmptyString(baseParts.authority) && baseParts.path === "") { return "/" + relativePath; } const basePath = baseParts.path; return basePath.substring(0, basePath.lastIndexOf("/") + 1) + relativePath; } /** * Resolves multiple URL segments using the RFC 3986 URL resolution algorithm. * * This function takes a variable number of URL segments and resolves them * sequentially according to the RFC 3986 URL resolution algorithm. * First argument is the base URL. * Empty string arguments are ignored. * * @param {...(string|undefined)} args - The URL segments to resolve. * @returns {string} The resolved URL as a string. */ function resolveURL(...args: Array<string | undefined>): string { const filteredArgs = args.filter((val) => val !== ""); const len = filteredArgs.length; if (len === 0) { return ""; } if (len === 1) { return filteredArgs[0] ?? ""; } else { const basePart = filteredArgs[0] ?? ""; const relativeParts = filteredArgs[1] ?? ""; const resolvedURL = _resolveURL(basePart, relativeParts); const remainingArgs = filteredArgs.slice(2); return resolveURL(resolvedURL, ...remainingArgs); } } export { getFilenameIndexInUrl, getRelativeUrl, resolveURL };