2017-09-05 13:24:16 -07:00
|
|
|
import url from 'url';
|
2017-10-03 09:01:06 -06:00
|
|
|
import sanitizeFilename from 'sanitize-filename';
|
2017-10-03 09:48:43 -06:00
|
|
|
import { isString, escapeRegExp, flow, partialRight } from 'lodash';
|
2017-09-05 13:24:16 -07:00
|
|
|
|
2017-03-15 14:32:41 -04:00
|
|
|
/**
 * Build an application URL, optionally in hash-routed ("direct") form.
 *
 * @param {string} url - Route path, e.g. `/collections/posts`.
 * @param {boolean} [direct] - When truthy, the path is prefixed with `/#`.
 * @returns {string} The path, with the `/#` prefix if `direct` was requested.
 */
function getUrl(url, direct) {
  let prefix = '';
  if (direct) {
    prefix = '/#';
  }
  return `${ prefix }${ url }`;
}
|
|
|
|
|
|
|
|
/**
 * URL of a collection's listing page.
 *
 * @param {string} collectionName - Name interpolated into the path as-is.
 * @param {boolean} [direct] - Forwarded to `getUrl`; truthy yields the `/#`-prefixed form.
 * @returns {string} `/collections/<collectionName>`, optionally hash-prefixed.
 */
export function getCollectionUrl(collectionName, direct) {
  const route = `/collections/${ collectionName }`;
  return getUrl(route, direct);
}
|
|
|
|
|
|
|
|
/**
 * URL of the "new entry" page for a collection.
 *
 * @param {string} collectionName - Name interpolated into the path as-is.
 * @param {boolean} [direct] - Forwarded to `getUrl`; truthy yields the `/#`-prefixed form.
 * @returns {string} `/collections/<collectionName>/entries/new`, optionally hash-prefixed.
 */
export function getNewEntryUrl(collectionName, direct) {
  const route = `/collections/${ collectionName }/entries/new`;
  return getUrl(route, direct);
}
|
2017-09-05 13:24:16 -07:00
|
|
|
|
2017-09-30 17:27:07 -06:00
|
|
|
// Unreserved chars from RFC3987.
// ASCII part: letters, digits, `_`, `-`, `.` and `~`.
const uriChars = /[\w\-.~]/i;
// Non-ASCII code point ranges accepted in addition to the ASCII set above.
// The `u` flag is required for the `\u{...}` escapes and astral ranges.
const ucsChars = /[\xA0-\u{D7FF}\u{F900}-\u{FDCF}\u{FDF0}-\u{FFEF}\u{10000}-\u{1FFFD}\u{20000}-\u{2FFFD}\u{30000}-\u{3FFFD}\u{40000}-\u{4FFFD}\u{50000}-\u{5FFFD}\u{60000}-\u{6FFFD}\u{70000}-\u{7FFFD}\u{80000}-\u{8FFFD}\u{90000}-\u{9FFFD}\u{A0000}-\u{AFFFD}\u{B0000}-\u{BFFFD}\u{C0000}-\u{CFFFD}\u{D0000}-\u{DFFFD}\u{E1000}-\u{EFFFD}]/u;

/**
 * Replace every character of `str` that is matched by neither `uriChars`
 * nor `ucsChars` with `replacement`.
 *
 * @param {string} str - Input to sanitize; iterated code point by code point.
 * @param {Object} [options]
 * @param {string} [options.replacement=""] - Text substituted for each
 *   rejected character. Defaults to the empty string, i.e. rejected
 *   characters are dropped.
 * @returns {string} The sanitized string.
 */
export function sanitizeIRI(str, { replacement = "" } = {}) {
  let result = "";
  // `for...of` walks the string by code point. Splitting on '' would break
  // characters such as emoji into surrogate halves that match neither regex.
  for (const char of str) {
    const isAllowed = uriChars.test(char) || ucsChars.test(char);
    result += isAllowed ? char : replacement;
  }
  return result;
}
|
|
|
|
|
2017-10-03 09:01:06 -06:00
|
|
|
/**
 * Sanitize a string for use as a slug: first as an IRI (via `sanitizeIRI`),
 * then as a filename (via `sanitizeFilename`), and finally collapse runs of
 * the replacement text and strip one trailing occurrence of it.
 *
 * @param {string} str - The raw slug.
 * @param {Object} [options]
 * @param {string} [options.replacement='-'] - Text substituted for rejected
 *   characters by both sanitizers.
 * @returns {string} The normalized slug.
 * @throws {Error} If `str` or `replacement` is not a string.
 */
export function sanitizeSlug(str, { replacement = '-' } = {}) {
  if (!isString(str)) {
    throw new Error("`sanitizeSlug` only accepts strings as input.");
  }
  if (!isString(replacement)) {
    throw new Error("the `sanitizeSlug` replacement character must be a string.");
  }

  // Sanitize as IRI (i18n URI) and as filename.
  const sanitize = flow([
    partialRight(sanitizeIRI, { replacement }),
    partialRight(sanitizeFilename, { replacement }),
  ]);
  const sanitizedSlug = sanitize(str);

  // With an empty replacement nothing was inserted, so there is nothing to
  // collapse or trim (and an empty pattern would match at every position).
  if (replacement === '') {
    return sanitizedSlug;
  }

  // Remove any doubled or trailing replacement characters (that were added in the sanitizers).
  const escapedReplacement = escapeRegExp(replacement);
  const doubleReplacement = new RegExp(`(?:${ escapedReplacement })+`, 'g');
  const trailingReplacement = new RegExp(`${ escapedReplacement }$`);

  return sanitizedSlug
    // Collapse to the caller's replacement, not a hard-coded dash. A function
    // replacer keeps `$` sequences in `replacement` from being interpreted.
    .replace(doubleReplacement, () => replacement)
    .replace(trailingReplacement, '');
}
|
|
|
|
|
2017-09-05 13:24:16 -07:00
|
|
|
/**
 * Normalize a string with `makePathSanitized`, then round-trip the result
 * through `url.parse` / `url.format`.
 *
 * @param {string} string - Raw path or title text.
 * @returns {string} The formatted URL string.
 */
export function urlize(string) {
  return url.format(url.parse(makePathSanitized(string)));
}
|
|
|
|
|
|
|
|
/**
 * Lower-case the input and pass it to `makePath`.
 *
 * @param {string} string - Raw path text.
 * @returns {string} Whatever `makePath` returns for the lower-cased input.
 */
function makePathSanitized(string) {
  const lowered = string.toLowerCase();
  return makePath(lowered);
}
|
|
|
|
|
|
|
|
/**
 * Filter the input through `unicodeSanitize`, trim it, turn each whitespace
 * character into a dash, and collapse consecutive dashes into one.
 *
 * @param {string} string - Raw path text.
 * @returns {string} The dash-separated path.
 */
function makePath(string) {
  const trimmed = unicodeSanitize(string).trim();
  const dashed = trimmed.replace(/[\s]/g, '-');
  return dashed.replace(/-+/g, '-');
}
|
|
|
|
|
|
|
|
/**
 * Drop every character that is not allowed in a path, while keeping
 * percent-escapes (`%` followed by two lower-case hex digits) intact.
 *
 * Allowed characters are those matched by `/[\w .\/\\_#\+-]/u`: ASCII
 * letters, digits, underscore, space, `.`, `/`, `\`, `#`, `+` and `-`.
 * NOTE(review): despite the name, non-ASCII letters are removed by this
 * class — confirm whether that is intended.
 *
 * @param {string} string - Text to filter.
 * @returns {string} The filtered text.
 */
function unicodeSanitize(string) {
  const allowedChar = /[\w .\/\\_#\+-]/u;
  const hexPair = /^[0-9a-f]{2}$/;
  const kept = [];

  for (let i = 0; i < string.length; i++) {
    const char = string[i];
    if (char === '%' && hexPair.test(string.slice(i + 1, i + 3))) {
      // Keep the whole escape and skip its two digits; otherwise the loop
      // would visit them again and append them a second time.
      kept.push(string.slice(i, i + 3));
      i += 2;
    } else if (allowedChar.test(char)) {
      kept.push(char);
    }
  }

  return kept.join('');
}
|