2020-11-05 16:58:23 +00:00
|
|
|
const { rtrimSlashes } = require('./path-utils');
|
|
|
|
const { urlDecode } = require('./string-utils');
|
2018-05-23 12:14:38 +01:00
|
|
|
|
2017-11-08 17:51:55 +00:00
|
|
|
const urlUtils = {};
|
|
|
|
|
|
|
|
urlUtils.hash = function(url) {
|
|
|
|
const s = url.split('#');
|
|
|
|
if (s.length <= 1) return '';
|
|
|
|
return s[s.length - 1];
|
2019-07-29 15:43:53 +02:00
|
|
|
};
|
2017-11-08 17:51:55 +00:00
|
|
|
|
2018-05-23 12:14:38 +01:00
|
|
|
urlUtils.urlWithoutPath = function(url) {
|
|
|
|
const parsed = require('url').parse(url, true);
|
2019-09-19 22:51:18 +01:00
|
|
|
return `${parsed.protocol}//${parsed.host}`;
|
2019-07-29 15:43:53 +02:00
|
|
|
};
|
2018-05-23 12:14:38 +01:00
|
|
|
|
|
|
|
urlUtils.urlProtocol = function(url) {
|
2019-05-10 01:06:06 +01:00
|
|
|
if (!url) return '';
|
2018-05-23 12:14:38 +01:00
|
|
|
const parsed = require('url').parse(url, true);
|
|
|
|
return parsed.protocol;
|
2019-07-29 15:43:53 +02:00
|
|
|
};
|
2018-05-23 12:14:38 +01:00
|
|
|
|
|
|
|
urlUtils.prependBaseUrl = function(url, baseUrl) {
|
|
|
|
baseUrl = rtrimSlashes(baseUrl).trim(); // All the code below assumes that the baseUrl does not end up with a slash
|
|
|
|
url = url.trim();
|
|
|
|
|
|
|
|
if (!url) url = '';
|
|
|
|
if (!baseUrl) return url;
|
2019-06-13 00:26:09 +01:00
|
|
|
if (url.indexOf('#') === 0) return url; // Don't prepend if it's a local anchor
|
2018-05-24 12:44:13 +01:00
|
|
|
if (urlUtils.urlProtocol(url)) return url; // Don't prepend the base URL if the URL already has a scheme
|
2018-05-23 12:14:38 +01:00
|
|
|
|
2019-07-29 15:43:53 +02:00
|
|
|
if (url.length >= 2 && url.indexOf('//') === 0) {
|
|
|
|
// If it starts with // it's a protcol-relative URL
|
2018-05-23 12:14:38 +01:00
|
|
|
return urlUtils.urlProtocol(baseUrl) + url;
|
2019-07-29 15:43:53 +02:00
|
|
|
} else if (url && url[0] === '/') {
|
|
|
|
// If it starts with a slash, it's an absolute URL so it should be relative to the domain (and not to the full baseUrl)
|
2018-05-23 12:14:38 +01:00
|
|
|
return urlUtils.urlWithoutPath(baseUrl) + url;
|
|
|
|
} else {
|
2019-09-19 22:51:18 +01:00
|
|
|
return baseUrl + (url ? `/${url}` : '');
|
2018-05-23 12:14:38 +01:00
|
|
|
}
|
2019-07-29 15:43:53 +02:00
|
|
|
};
|
2018-05-23 12:14:38 +01:00
|
|
|
|
2019-09-12 22:48:10 +01:00
|
|
|
const resourceRegex = /^(joplin:\/\/|:\/)([0-9a-zA-Z]{32})(|#[^\s]*)(|\s".*?")$/;
|
|
|
|
|
2019-09-10 09:25:58 +01:00
|
|
|
urlUtils.isResourceUrl = function(url) {
|
2019-09-12 22:48:10 +01:00
|
|
|
return !!url.match(resourceRegex);
|
2019-09-10 09:25:58 +01:00
|
|
|
};
|
|
|
|
|
2019-09-09 18:16:00 +01:00
|
|
|
urlUtils.parseResourceUrl = function(url) {
|
2019-09-10 09:25:58 +01:00
|
|
|
if (!urlUtils.isResourceUrl(url)) return null;
|
|
|
|
|
2019-09-12 22:48:10 +01:00
|
|
|
const match = url.match(resourceRegex);
|
2019-09-09 18:16:00 +01:00
|
|
|
|
2019-09-12 22:48:10 +01:00
|
|
|
const itemId = match[2];
|
|
|
|
let hash = match[3].trim();
|
2019-09-12 21:57:23 +01:00
|
|
|
|
|
|
|
// In general we want the hash to be decoded so that non-alphabetical languages
|
|
|
|
// appear as-is without being encoded with %.
|
|
|
|
// Fixes https://github.com/laurent22/joplin/issues/1870
|
2019-09-12 22:48:10 +01:00
|
|
|
if (hash) hash = urlDecode(hash.substr(1)); // Remove the first #
|
|
|
|
|
|
|
|
return {
|
|
|
|
itemId: itemId,
|
|
|
|
hash: hash,
|
|
|
|
};
|
|
|
|
};
|
|
|
|
|
|
|
|
urlUtils.extractResourceUrls = function(text) {
|
|
|
|
const markdownLinksRE = /\]\((.*?)\)/g;
|
|
|
|
const output = [];
|
|
|
|
let result = null;
|
|
|
|
|
|
|
|
while ((result = markdownLinksRE.exec(text)) !== null) {
|
|
|
|
const resourceUrlInfo = urlUtils.parseResourceUrl(result[1]);
|
|
|
|
if (resourceUrlInfo) output.push(resourceUrlInfo);
|
|
|
|
}
|
|
|
|
|
|
|
|
const htmlRegexes = [
|
|
|
|
/<img[\s\S]*?src=["']:\/([a-zA-Z0-9]{32})["'][\s\S]*?>/gi,
|
|
|
|
/<a[\s\S]*?href=["']:\/([a-zA-Z0-9]{32})["'][\s\S]*?>/gi,
|
|
|
|
];
|
|
|
|
|
|
|
|
for (const htmlRegex of htmlRegexes) {
|
|
|
|
while (true) {
|
|
|
|
const m = htmlRegex.exec(text);
|
|
|
|
if (!m) break;
|
|
|
|
output.push({ itemId: m[1], hash: '' });
|
|
|
|
}
|
|
|
|
}
|
2019-09-09 18:16:00 +01:00
|
|
|
|
|
|
|
return output;
|
|
|
|
};
|
|
|
|
|
2020-10-28 15:50:34 +00:00
|
|
|
urlUtils.objectToQueryString = function(query) {
|
|
|
|
if (!query) return '';
|
|
|
|
|
|
|
|
let queryString = '';
|
|
|
|
const s = [];
|
|
|
|
for (const k in query) {
|
|
|
|
if (!query.hasOwnProperty(k)) continue;
|
|
|
|
s.push(`${encodeURIComponent(k)}=${encodeURIComponent(query[k])}`);
|
|
|
|
}
|
|
|
|
queryString = s.join('&');
|
|
|
|
|
|
|
|
return queryString;
|
|
|
|
};
|
|
|
|
|
2021-11-23 12:12:27 +00:00
|
|
|
// This is a modified version of the file-uri-to-path package:
|
|
|
|
//
|
|
|
|
// - It removes the dependency to the "path" package, which wouldn't work with
|
|
|
|
// React Native.
|
|
|
|
//
|
|
|
|
// - It always returns paths with forward slashes "/". This is normally handled
|
|
|
|
// properly everywhere.
|
|
|
|
//
|
|
|
|
// - Adds the "platform" parameter to optionall return paths with "\" for win32
|
|
|
|
function fileUriToPath_(uri, platform) {
|
|
|
|
const sep = '/';
|
|
|
|
|
|
|
|
if (
|
|
|
|
typeof uri !== 'string' ||
|
|
|
|
uri.length <= 7 ||
|
|
|
|
uri.substring(0, 7) !== 'file://'
|
|
|
|
) {
|
|
|
|
throw new TypeError(
|
|
|
|
'must pass in a file:// URI to convert to a file path'
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
const rest = decodeURI(uri.substring(7));
|
|
|
|
const firstSlash = rest.indexOf('/');
|
|
|
|
let host = rest.substring(0, firstSlash);
|
|
|
|
let path = rest.substring(firstSlash + 1);
|
|
|
|
|
|
|
|
// 2. Scheme Definition
|
|
|
|
// As a special case, <host> can be the string "localhost" or the empty
|
|
|
|
// string; this is interpreted as "the machine from which the URL is
|
|
|
|
// being interpreted".
|
|
|
|
if (host === 'localhost') {
|
|
|
|
host = '';
|
|
|
|
}
|
|
|
|
|
|
|
|
if (host) {
|
|
|
|
host = sep + sep + host;
|
|
|
|
}
|
|
|
|
|
|
|
|
// 3.2 Drives, drive letters, mount points, file system root
|
|
|
|
// Drive letters are mapped into the top of a file URI in various ways,
|
|
|
|
// depending on the implementation; some applications substitute
|
|
|
|
// vertical bar ("|") for the colon after the drive letter, yielding
|
|
|
|
// "file:///c|/tmp/test.txt". In some cases, the colon is left
|
|
|
|
// unchanged, as in "file:///c:/tmp/test.txt". In other cases, the
|
|
|
|
// colon is simply omitted, as in "file:///c/tmp/test.txt".
|
|
|
|
path = path.replace(/^(.+)\|/, '$1:');
|
|
|
|
|
|
|
|
// for Windows, we need to invert the path separators from what a URI uses
|
|
|
|
// if (sep === '\\') {
|
|
|
|
// path = path.replace(/\//g, '\\');
|
|
|
|
// }
|
|
|
|
|
|
|
|
if (/^.+:/.test(path)) {
|
|
|
|
// has Windows drive at beginning of path
|
|
|
|
} else {
|
|
|
|
// unix path…
|
|
|
|
path = sep + path;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (platform === 'win32') {
|
|
|
|
return (host + path).replace(/\//g, '\\');
|
|
|
|
} else {
|
|
|
|
return host + path;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
urlUtils.fileUriToPath = (path, platform = 'linux') => {
|
|
|
|
const output = fileUriToPath_(path, platform);
|
2021-11-22 17:17:28 +00:00
|
|
|
|
|
|
|
// The file-uri-to-path module converts Windows path such as
|
|
|
|
//
|
|
|
|
// file://c:/autoexec.bat => \\c:\autoexec.bat
|
|
|
|
//
|
|
|
|
// Probably because a file:// that starts with only two slashes is not
|
|
|
|
// quite valid. If we use three slashes, it works:
|
|
|
|
//
|
|
|
|
// file:///c:/autoexec.bat => c:\autoexec.bat
|
|
|
|
//
|
|
|
|
// However there are various places in the app where we can find
|
|
|
|
// paths with only two slashes because paths are often constructed
|
|
|
|
// as `file://${resourcePath}` - which works in all OSes except
|
|
|
|
// Windows.
|
|
|
|
//
|
|
|
|
// So here we introduce a special case - if we detect that we have
|
|
|
|
// an invalid Windows path that starts with \\x:, we just remove
|
|
|
|
// the first two backslashes.
|
|
|
|
//
|
|
|
|
// https://github.com/laurent22/joplin/issues/5693
|
|
|
|
|
2021-11-23 12:12:27 +00:00
|
|
|
if (output.match(/^\/\/[a-zA-Z]:/)) {
|
2021-11-22 17:17:28 +00:00
|
|
|
return output.substr(2);
|
|
|
|
}
|
|
|
|
|
|
|
|
return output;
|
|
|
|
};
|
|
|
|
|
2019-07-29 15:43:53 +02:00
|
|
|
module.exports = urlUtils;
|