// (C) Copyright 2015 Moodle Pty Ltd.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
import { Clipboard, Translate } from '@singletons';
import { CoreToasts } from '@services/toasts';
import { Locutus } from './locutus';
import { CoreError } from '@classes/errors/error';
import { convertTextToHTMLElement } from '../utils/create-html-element';
/**
* Singleton with helper functions for text manipulation.
*/
export class CoreText {
// Avoid creating singleton instances.
private constructor() {
// Nothing to do.
}
/**
* Add ending slash from a path or URL.
*
* @param text Text to treat.
* @returns Treated text.
*/
static addEndingSlash(text: string): string {
if (!text) {
return '';
}
if (text.slice(-1) != '/') {
return text + '/';
}
return text;
}
/**
* Add starting slash to a string if needed.
*
* @param text Text to treat.
* @returns Treated text.
*/
static addStartingSlash(text = ''): string {
if (text[0] === '/') {
return text;
}
return '/' + text;
}
/**
* Given a list of sentences, build a message with all of them wrapped in
.
*
* @param messages Messages to show.
* @returns Message with all the messages.
*/
static buildMessage(messages: string[]): string {
let result = '';
messages.forEach((message) => {
if (message) {
result += `
${message}
`;
}
});
return result;
}
/**
* Convert size in bytes into human readable format
*
* @param bytes Number of bytes to convert.
* @param precision Number of digits after the decimal separator.
* @returns Size in human readable format.
*/
static bytesToSize(bytes: number, precision: number = 2): string {
if (bytes === undefined || bytes === null || bytes < 0) {
return Translate.instant('core.notapplicable');
}
if (precision < 0) {
precision = 2;
}
const keys = ['core.sizeb', 'core.sizekb', 'core.sizemb', 'core.sizegb', 'core.sizetb'];
const units = Translate.instant(keys);
let pos = 0;
if (bytes >= 1024) {
while (bytes >= 1024) {
pos++;
bytes = bytes / 1024;
}
// Round to "precision" decimals if needed.
bytes = Number(Math.round(parseFloat(bytes + 'e+' + precision)) + 'e-' + precision);
}
return Translate.instant('core.humanreadablesize', { size: bytes, unit: units[keys[pos]] });
}
/**
* Copies a text to clipboard and shows a toast message.
*
* @param text Text to be copied
*/
static async copyToClipboard(text: string): Promise {
try {
await Clipboard.copy(text);
} catch {
// Use HTML Copy command.
const virtualInput = document.createElement('textarea');
virtualInput.innerHTML = text;
virtualInput.select();
virtualInput.setSelectionRange(0, 99999);
document.execCommand('copy'); // eslint-disable-line deprecation/deprecation
}
// Show toast using ionicLoading.
CoreToasts.show({
message: 'core.copiedtoclipboard',
translateMessage: true,
});
}
/**
* Count words in a text.
* This function is based on Moodle's count_words.
*
* @param text Text to count.
* @returns Number of words.
*/
static countWords(text?: string | null): number {
if (!text || typeof text != 'string') {
return 0;
}
// Before stripping tags, add a space after the close tag of anything that is not obviously inline.
// Also, br is a special case because it definitely delimits a word, but has no close tag.
text = text.replace(/(<\/(?!a>|b>|del>|em>|i>|ins>|s>|small>|span>|strong>|sub>|sup>|u>)\w+>|
|
)/ig, '$1 ');
// Now remove HTML tags.
text = text.replace(/(<([^>]+)>)/ig, '');
// Decode HTML entities.
text = CoreText.decodeHTMLEntities(text);
// Now, the word count is the number of blocks of characters separated
// by any sort of space. That seems to be the definition used by all other systems.
// To be precise about what is considered to separate words:
// * Anything that Unicode considers a 'Separator'
// * Anything that Unicode considers a 'Control character'
// * An em- or en- dash.
let words: string[];
try {
words = text.split(/[\p{Z}\p{Cc}—–]+/u);
} catch {
// Unicode-aware flag not supported.
words = text.split(/\s+/);
}
// Filter empty words.
return words.filter(word => word).length;
}
/**
* Clean HTML tags.
*
* @param text The text to be cleaned.
* @param options Processing options.
* @param options.singleLine True if new lines should be removed (all the text in a single line).
* @param options.trim True if text should be trimmed.
* @returns Clean text.
*/
static cleanTags(text: string | undefined, options: { singleLine?: boolean; trim?: boolean } = {}): string {
if (!text) {
return '';
}
// First, we use a regexpr.
text = text.replace(/(<([^>]+)>)/ig, '');
// Then, we rely on the browser. We need to wrap the text to be sure is HTML.
text = convertTextToHTMLElement(text).textContent || '';
// Trim text
text = options.trim ? text.trim() : text;
// Recover or remove new lines.
text = CoreText.replaceNewLines(text, options.singleLine ? ' ' : '
');
return text;
}
/**
* Decode an escaped HTML text. This implementation is based on PHP's htmlspecialchars_decode.
*
* @param text Text to decode.
* @returns Decoded text.
*/
static decodeHTML(text: string | number): string {
if (text === undefined || text === null || (typeof text === 'number' && isNaN(text))) {
return '';
} else if (typeof text != 'string') {
return '' + text;
}
return text
.replace(/&/g, '&')
.replace(/</g, '<')
.replace(/>/g, '>')
.replace(/"/g, '"')
.replace(/'/g, '\'')
.replace(/ /g, ' ');
}
/**
* Decode HTML entities in a text. Equivalent to PHP html_entity_decode.
*
* @param text Text to decode.
* @returns Decoded text.
*/
static decodeHTMLEntities(text: string): string {
if (text) {
text = convertTextToHTMLElement(text).textContent || '';
}
return text;
}
/**
* Escapes some characters in a string to be used as a regular expression.
*
* @param text Text to escape.
* @returns Escaped text.
*/
static escapeForRegex(text: string): string {
if (!text || typeof text !== 'string') {
return '';
}
return text.replace(/[-[\]{}()*+?.,\\^$|#\s]/g, '\\$&');
}
/**
* Escape an HTML text. This implementation is based on PHP's htmlspecialchars.
*
* @param text Text to escape.
* @param doubleEncode If false, it will not convert existing html entities. Defaults to true.
* @returns Escaped text.
*/
static escapeHTML(text?: string | number | null, doubleEncode = true): string {
if (text === undefined || text === null || (typeof text === 'number' && isNaN(text))) {
return '';
} else if (typeof text !== 'string') {
return '' + text;
}
if (doubleEncode) {
text = text.replace(/&/g, '&');
} else {
text = text.replace(/&(?!amp;)(?!lt;)(?!gt;)(?!quot;)(?!#039;)/g, '&');
}
return text
.replace(//g, '>')
.replace(/"/g, '"')
.replace(/'/g, ''');
}
/**
* Formats a text, in HTML replacing new lines by correct html new lines.
*
* @param text Text to format.
* @returns Formatted text.
*/
static formatHtmlLines(text: string): string {
const hasHTMLTags = CoreText.hasHTMLTags(text);
if (text.indexOf('') == -1) {
// Wrap the text in
tags.
text = '
' + text + '
';
}
if (!hasHTMLTags) {
// The text doesn't have HTML, replace new lines for
.
return CoreText.replaceNewLines(text, '
');
}
return text;
}
/**
* Check if a text contains HTML tags.
*
* @param text Text to check.
* @returns Whether it has HTML tags.
*/
static hasHTMLTags(text: string): boolean {
return /<[a-z][\s\S]*>/i.test(text);
}
/**
* Check if a text contains Unicode long chars.
* Using as threshold Hex value D800
*
* @param text Text to check.
* @returns True if has Unicode chars, false otherwise.
*/
static hasUnicode(text: string): boolean {
for (let x = 0; x < text.length; x++) {
if (text.charCodeAt(x) > 55295) {
return true;
}
}
return false;
}
/**
* Check if an object has any long Unicode char.
*
* @param data Object to be checked.
* @returns If the data has any long Unicode char on it.
*/
static hasUnicodeData(data: Record): boolean {
for (const el in data) {
if (typeof data[el] === 'object') {
if (CoreText.hasUnicodeData(data[el] as Record)) {
return true;
}
continue;
}
if (typeof data[el] === 'string' && CoreText.hasUnicode(data[el] as string)) {
return true;
}
}
return false;
}
/**
* Highlight all occurrences of a certain text inside another text. It will add some HTML code to highlight it.
*
* @param text Full text.
* @param searchText Text to search and highlight.
* @returns Highlighted text.
*/
static highlightText(text: string, searchText: string): string {
if (!text || typeof text !== 'string') {
return '';
} else if (!searchText) {
return text;
}
const regex = new RegExp('(' + searchText + ')', 'gi');
return text.replace(regex, '$1');
}
/**
* Check whether the given text matches a glob pattern.
*
* @param text Text to match against.
* @param pattern Glob pattern.
* @returns Whether the pattern matches.
*/
static matchesGlob(text: string, pattern: string): boolean {
pattern = pattern
.replace(/\*\*/g, '%RECURSIVE_MATCH%')
.replace(/\*/g, '%LOCAL_MATCH%')
.replace(/\?/g, '%CHARACTER_MATCH%');
pattern = CoreText.escapeForRegex(pattern);
pattern = pattern
.replace(/%RECURSIVE_MATCH%/g, '.*')
.replace(/%LOCAL_MATCH%/g, '[^/]*')
.replace(/%CHARACTER_MATCH%/g, '[^/]');
return new RegExp(`^${pattern}$`).test(text);
}
/**
* Same as Javascript's JSON.parse, but it will handle errors.
*
* @param json JSON text.
* @param defaultValue Default value to return if the parse fails. Defaults to the original value.
* @param logErrorFn An error to call with the exception to log the error. If not supplied, no error.
* @returns JSON parsed as object or what it gets.
*/
static parseJSON(json: string, defaultValue?: T, logErrorFn?: (error?: Error) => void): T {
try {
return JSON.parse(json);
} catch (error) {
// Error, log the error if needed.
if (logErrorFn) {
logErrorFn(error);
}
}
// Error parsing, return the default value or the original value.
if (defaultValue !== undefined) {
return defaultValue;
}
throw new CoreError('JSON cannot be parsed and not default value has been provided');
}
/**
* Process HTML string.
*
* @param text HTML string.
* @param process Method to process the HTML.
* @returns Processed HTML string.
*/
static processHTML(text: string, process: (element: HTMLElement) => unknown): string {
const element = convertTextToHTMLElement(text);
process(element);
return element.innerHTML;
}
/**
* Replace all characters that cause problems with files in Android and iOS.
*
* @param text Text to treat.
* @returns Treated text.
*/
static removeSpecialCharactersForFiles(text: string): string {
if (!text || typeof text !== 'string') {
return '';
}
return text.replace(/[#:/?\\]+/g, '_');
}
/**
* Remove ending slash from a path or URL.
*
* @param text Text to treat.
* @returns Treated text.
*/
static removeEndingSlash(text?: string): string {
if (!text) {
return '';
}
if (text.slice(-1) == '/') {
return text.substring(0, text.length - 1);
}
return text;
}
/**
* Remove starting slash from a string if needed.
*
* @param text Text to treat.
* @returns Treated text.
*/
static removeStartingSlash(text = ''): string {
if (text[0] !== '/') {
return text;
}
return text.substring(1);
}
/**
* Replace {{ARGUMENT}} arguments in the text.
*
* @param text Text to treat.
* @param replacements Argument values.
* @param encoding Encoding to use in values.
* @returns Treated text.
*/
static replaceArguments(text: string, replacements: Record = {}, encoding?: 'uri'): string {
let match: RegExpMatchArray | null = null;
while ((match = text.match(/\{\{([^}]+)\}\}/))) {
const argument = match[1].trim();
const value = replacements[argument] ?? '';
const encodedValue = encoding ? encodeURIComponent(value) : value;
text = text.replace(`{{${argument}}}`, encodedValue);
}
return text;
}
/**
* Replace all the new lines on a certain text.
*
* @param text The text to be treated.
* @param newValue Text to use instead of new lines.
* @returns Treated text.
*/
static replaceNewLines(text: string, newValue: string): string {
if (!text || typeof text !== 'string') {
return '';
}
return text.replace(/(?:\r\n|\r|\n)/g, newValue);
}
/**
* Rounds a number to use a certain amout of decimals or less.
* Difference between this function and float's toFixed:
* 7.toFixed(2) -> 7.00
* roundToDecimals(7, 2) -> 7
*
* @param num Number to round.
* @param decimals Number of decimals. By default, 2.
* @returns Rounded number.
*/
static roundToDecimals(num: number, decimals: number = 2): number {
const multiplier = Math.pow(10, decimals);
return Math.round(num * multiplier) / multiplier;
}
/**
* Add quotes to HTML characters.
*
* Returns text with HTML characters (like "<", ">", etc.) properly quoted.
* Based on Moodle's s() function.
*
* @param text Text to treat.
* @returns Treated text.
*/
static s(text: string): string {
if (!text) {
return '';
}
return CoreText.escapeHTML(text).replace(/&#(\d+|x[0-9a-f]+);/i, '$1;');
}
/**
* Shortens a text to length and adds an ellipsis.
*
* @param text The text to be shortened.
* @param length The desired length.
* @returns Shortened text.
*/
static shortenText(text: string, length: number): string {
if (text.length > length) {
text = text.substring(0, length);
// Now, truncate at the last word boundary (if exists).
const lastWordPos = text.lastIndexOf(' ');
if (lastWordPos > 0) {
text = text.substring(0, lastWordPos);
}
text += '…';
}
return text;
}
/**
* Strip Unicode long char of a given text.
* Using as threshold Hex value D800
*
* @param text Text to check.
* @returns Without the Unicode chars.
*/
static stripUnicode(text: string): string {
let stripped = '';
for (let x = 0; x < text.length; x++) {
if (text.charCodeAt(x) <= 55295) {
stripped += text.charAt(x);
}
}
return stripped;
}
/**
* Replace text within a portion of a string. Equivalent to PHP's substr_replace.
*
* @param str The string to treat.
* @param replace The value to put inside the string.
* @param start The index where to start putting the new string. If negative, it will count from the end of the string.
* @param length Length of the portion of string which is to be replaced. If negative, it represents the number of characters
* from the end of string at which to stop replacing. If not provided, replace until the end of the string.
* @returns Treated string.
*/
static substrReplace(str: string, replace: string, start: number, length?: number): string {
return Locutus.substrReplace(str, replace, start, length);
}
/**
* Remove all ocurrences of a certain character from the start and end of a string.
*
* @param text Text to treat.
* @param character Character to remove.
* @returns Treated text.
*/
static trimCharacter(text: string, character: string): string {
const escaped = CoreText.escapeForRegex(character);
const regExp = new RegExp(`^${escaped}+|${escaped}+$`, 'g');
return text.replace(regExp, '');
}
/**
* If a number has only 1 digit, add a leading zero to it.
*
* @param num Number to convert.
* @returns Number with leading zeros.
*/
static twoDigits(num: string | number): string {
if (Number(num) < 10) {
return '0' + num;
} else {
return '' + num; // Convert to string for coherence.
}
}
/**
* Make a string's first character uppercase.
*
* @param text Text to treat.
* @returns Treated text.
*/
static capitalize(text: string): string {
return text.charAt(0).toUpperCase() + text.slice(1);
}
/**
* Unserialize Array from PHP.
*
* @param data String to unserialize.
* @returns Unserialized data.
*/
static unserialize(data: string): T {
return Locutus.unserialize(data);
}
}
/**
* Define text formatting types.
*/
export enum CoreTextFormat {
FORMAT_MOODLE = 0, // Does all sorts of transformations and filtering.
FORMAT_HTML = 1, // Plain HTML (with some tags stripped). Use it by default.
FORMAT_PLAIN = 2, // Plain text (even tags are printed in full).
// FORMAT_WIKI is deprecated since 2005...
FORMAT_MARKDOWN = 4, // Markdown-formatted text http://daringfireball.net/projects/markdown/
}
export const defaultTextFormat = CoreTextFormat.FORMAT_HTML;