/* * CDDL HEADER START * * The contents of this file are subject to the terms of the * Common Development and Distribution License (the "License"). * You may not use this file except in compliance with the License. * * See LICENSE.txt included in this distribution for the specific * language governing permissions and limitations under the License. * * When distributing Covered Code, include this CDDL HEADER in each * file and include the License file at LICENSE.txt. * If applicable, add the following below this CDDL HEADER, with the * fields enclosed by brackets "[]" replaced with your own identifying * information: Portions Copyright [yyyy] [name of copyright owner] * * CDDL HEADER END */ /* * Copyright (c) 2005, 2021, Oracle and/or its affiliates. All rights reserved. * Portions Copyright (c) 2011, Jens Elkner. * Portions Copyright (c) 2017, 2020, Chris Fraire . * Portions Copyright (c) 2019, Krystof Tulinger . */ package org.opengrok.indexer.web; import static org.opengrok.indexer.index.Indexer.PATH_SEPARATOR; import java.io.BufferedInputStream; import java.io.File; import java.io.FileInputStream; import java.io.IOException; import java.io.InputStream; import java.io.InputStreamReader; import java.io.Reader; import java.io.Writer; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; import java.net.URL; import java.net.URLDecoder; import java.net.URLEncoder; import java.nio.charset.StandardCharsets; import java.text.DecimalFormat; import java.text.NumberFormat; import java.util.Collection; import java.util.HashMap; import java.util.LinkedList; import java.util.List; import java.util.Locale; import java.util.Map; import java.util.Map.Entry; import java.util.TreeMap; import java.util.function.Function; import java.util.logging.Level; import java.util.logging.Logger; import java.util.regex.Matcher; import java.util.regex.Pattern; import java.util.zip.GZIPInputStream; import jakarta.servlet.http.HttpServletRequest; import 
org.apache.commons.lang3.SystemUtils;
import org.apache.lucene.queryparser.classic.QueryParser;
import org.opengrok.indexer.configuration.RuntimeEnvironment;
import org.opengrok.indexer.history.Annotation;
import org.opengrok.indexer.history.HistoryException;
import org.opengrok.indexer.history.HistoryGuru;
import org.opengrok.indexer.logger.LoggerFactory;

/**
 * Class for useful functions.
 * <p>
 * The class is {@code final} and its only constructor is private, so it is
 * used exclusively through its static members.
 */
public final class Util {

    /** Logger used by the static helpers of this class. */
    private static final Logger LOGGER = LoggerFactory.getLogger(Util.class);

    // NOTE(review): no use of this threshold is visible in this part of the
    // file; its meaning should be confirmed at the point of use.
    private static final int BOLD_COUNT_THRESHOLD = 1000;

    // Prepended to every anchor emitted by breadcrumbPath().
    // NOTE(review): the literal is empty here, which looks like markup was
    // lost from it -- confirm against the upstream source.
    private static final String anchorLinkStart = "";

    // Regex alternation matching a literal '?' or '&'.
    // NOTE(review): the second and third alternatives are identical as
    // written; one of them presumably was an HTML-escaped ampersand -- confirm.
    private static final String RE_Q_ESC_AMP_AMP = "\\?|&|&";

    // One of the separators above (or a word boundary) followed by the
    // "count" query parameter prefix and a run of digits.
    private static final String RE_Q_E_A_A_COUNT_EQ_VAL =
            "(" + RE_Q_ESC_AMP_AMP + "|\\b)" + QueryParameters.COUNT_PARAM_EQ + "\\d+";

    // Same shape as above for the "start" query parameter prefix.
    private static final String RE_Q_E_A_A_START_EQ_VAL =
            "(" + RE_Q_ESC_AMP_AMP + "|\\b)" + QueryParameters.START_PARAM_EQ + "\\d+";

    // One of the separators above, anchored at the beginning of the input.
    private static final String RE_A_ANCHOR_Q_E_A_A = "^(" + RE_Q_ESC_AMP_AMP + ")";

    /** Private to enforce static. */
    private Util() {
    }

    /**
     * Return a string that represents s in HTML by calling
     * {@link #htmlize(java.lang.CharSequence, java.lang.Appendable, boolean)}
     * with {@code s}, a transient {@link StringBuilder}, and {@code false}.
     *

* (N.b. if no special characters are present, {@code s} is returned as is, * without the expensive call.) * * @param s a defined string * @return a string representing the character sequence in HTML */ public static String htmlize(String s) { if (!needsHtmlize(s, false)) { return s; } StringBuilder sb = new StringBuilder(s.length() * 2); try { htmlize(s, sb, false); } catch (IOException ioe) { // IOException cannot happen when the destination is a // StringBuilder. Wrap in an AssertionError so that callers // don't have to check for an IOException that should never // happen. throw new AssertionError("StringBuilder threw IOException", ioe); } return sb.toString(); } /** * Return a string which represents a CharSequence in HTML by * calling * {@link #htmlize(java.lang.CharSequence, java.lang.Appendable, boolean)} * with {@code q}, a transient {@link StringBuilder}, and {@code false}. * * @param q a character sequence * @return a string representing the character sequence in HTML */ public static String htmlize(CharSequence q) { StringBuilder sb = new StringBuilder(q.length() * 2); try { htmlize(q, sb, false); } catch (IOException ioe) { // IOException cannot happen when the destination is a // StringBuilder. Wrap in an AssertionError so that callers // don't have to check for an IOException that should never // happen. throw new AssertionError("StringBuilder threw IOException", ioe); } return sb.toString(); } /** * Append a character sequence to the given destination whereby special * characters for HTML or characters that are not printable ASCII are * escaped accordingly. 
* * @param q a character sequence to escape * @param dest where to append the character sequence to * @param pre a value indicating whether the output is pre-formatted -- if * true then LFs will not be converted to elements * @throws IOException if an error occurred when writing to {@code dest} */ public static void htmlize(CharSequence q, Appendable dest, boolean pre) throws IOException { for (int i = 0; i < q.length(); i++) { htmlize(q.charAt(i), dest, pre); } } /** * Calls * {@link #htmlize(java.lang.CharSequence, java.lang.Appendable, boolean)} * with {@code q}, {@code dest}, and {@code false}. * * @param q a character sequence to escape * @param dest where to append the character sequence to * @throws IOException if an error occurred when writing to {@code dest} */ public static void htmlize(CharSequence q, Appendable dest) throws IOException { htmlize(q, dest, false); } /** * Append a character array to the given destination whereby special * characters for HTML or characters that are not printable ASCII are * escaped accordingly. * * @param cs characters to escape * @param length max. number of characters to append, starting from index 0. * @param dest where to append the character sequence to * @throws IOException if an error occurred when writing to {@code dest} */ public static void htmlize(char[] cs, int length, Appendable dest) throws IOException { int len = length; if (cs.length < length) { len = cs.length; } for (int i = 0; i < len; i++) { htmlize(cs[i], dest, false); } } /** * Append a character to the given destination whereby special characters * special for HTML or characters that are not printable ASCII are * escaped accordingly. 
* * @param c the character to append * @param dest where to append the character to * @param pre a value indicating whether the output is pre-formatted -- if * true then LFs will not be converted to elements * @throws IOException if an error occurred when writing to {@code dest} * @see #needsHtmlize(char, boolean) */ private static void htmlize(char c, Appendable dest, boolean pre) throws IOException { switch (c) { case '\'': dest.append("'"); break; case '"': dest.append("""); break; case '&': dest.append("&"); break; case '>': dest.append(">"); break; case '<': dest.append("<"); break; case '\n': if (pre) { dest.append(c); } else { dest.append("
"); } break; default: if ((c >= ' ' && c <= '~') || (c < ' ' && Character.isWhitespace(c))) { dest.append(c); } else { dest.append("&#").append(Integer.toString(c)).append(';'); } break; } } /** * Determine if a character is a special character needing HTML escaping or * is a character that is not printable ASCII. * @param c the character to examine * @param pre a value indicating whether the output is pre-formatted -- if * true then LFs will not be converted to elements * @see #htmlize(char, java.lang.Appendable, boolean) */ private static boolean needsHtmlize(char c, boolean pre) { switch (c) { case '\'': case '"': case '&': case '>': case '<': return true; case '\n': if (!pre) { return true; } default: return (c < ' ' || c > '~') && (c >= ' ' || !Character.isWhitespace(c)); } } private static boolean needsHtmlize(CharSequence q, boolean pre) { for (int i = 0; i < q.length(); ++i) { if (needsHtmlize(q.charAt(i), pre)) { return true; } } return false; } /** * Convenience method for {@code breadcrumbPath(urlPrefix, path, PATH_SEPARATOR)}. * * @param urlPrefix prefix to add to each url * @param path path to crack * @return HTML markup for the breadcrumb or the path itself. * * @see #breadcrumbPath(String, String, char) */ public static String breadcrumbPath(String urlPrefix, String path) { return breadcrumbPath(urlPrefix, path, PATH_SEPARATOR); } /** * Convenience method for * {@code breadcrumbPath(urlPrefix, path, sep, "", false)}. * * @param urlPrefix prefix to add to each url * @param path path to crack * @param sep separator to use to crack the given path * * @return HTML markup fro the breadcrumb or the path itself. * @see #breadcrumbPath(String, String, char, String, boolean, boolean) */ public static String breadcrumbPath(String urlPrefix, String path, char sep) { return breadcrumbPath(urlPrefix, path, sep, "", false); } /** * Convenience method for * {@code breadcrumbPath(urlPrefix, path, sep, "", false, path.endsWith(sep)}. 
* * @param urlPrefix prefix to add to each url * @param path path to crack * @param sep separator to use to crack the given path * @param urlPostfix suffix to add to each url * @param compact if {@code true} the given path gets transformed into its * canonical form (.i.e. all '.' and '..' and double separators removed, but * not always resolves to an absolute path) before processing starts. * @return HTML markup fro the breadcrumb or the path itself. * @see #breadcrumbPath(String, String, char, String, boolean, boolean) * @see #getCanonicalPath(String, char) */ public static String breadcrumbPath(String urlPrefix, String path, char sep, String urlPostfix, boolean compact) { if (path == null || path.length() == 0) { return path; } return breadcrumbPath(urlPrefix, path, sep, urlPostfix, compact, path.charAt(path.length() - 1) == sep); } /** * Create a breadcrumb path to allow navigation to each element of a path. * Consecutive separators (sep) in the given path are * always collapsed into a single separator automatically. If * compact is {@code true} path gets translated into a canonical * path similar to {@link File#getCanonicalPath()}, however the current * working directory is assumed to be "/" and no checks are done (e.g. * neither whether the path [component] exists nor which type it is). * * @param urlPrefix what should be prepend to the constructed URL * @param path the full path from which the breadcrumb path is built. * @param sep the character that separates the path components in * path * @param urlPostfix what should be append to the constructed URL * @param compact if {@code true}, a canonical path gets constructed before * processing. * @param isDir if {@code true} a "/" gets append to the last path * component's link and sep to its name * @return path if it resolves to an empty or "/" or {@code null} * path, the HTML markup for the breadcrumb path otherwise. 
*/
    public static String breadcrumbPath(String urlPrefix, String path, char sep,
            String urlPostfix, boolean compact, boolean isDir) {
        // Nothing to crack: hand null / empty input straight back.
        if (path == null || path.length() == 0) {
            return path;
        }
        // Split on the separator and let normalize() clean up the components.
        // NOTE(review): escapeForRegex() and normalize() are defined outside
        // the visible part of the file; their exact behaviour should be
        // confirmed there.
        String[] pnames = normalize(path.split(escapeForRegex(sep)), compact);
        if (pnames.length == 0) {
            // No component survived, so there is nothing to link.
            return path;
        }
        // Treat missing prefix/postfix as empty strings.
        String prefix = urlPrefix == null ? "" : urlPrefix;
        String postfix = urlPostfix == null ? "" : urlPostfix;
        // pwd accumulates the encoded path up to the current component and is
        // used as the link target of each anchor.
        StringBuilder pwd = new StringBuilder(path.length() + pnames.length);
        // Capacity estimate only; note that '+' binds tighter than '>>', so
        // the first factor is (pnames.length + 3) / 2.
        StringBuilder markup =
                new StringBuilder((pnames.length + 3 >> 1) * path.length()
                        + pnames.length
                        * (17 + prefix.length() + postfix.length()));
        // If a separator occurs at or before the first occurrence of the
        // first component, start both the link path and the markup with one.
        int k = path.indexOf(pnames[0]);
        if (path.lastIndexOf(sep, k) != -1) {
            pwd.append(PATH_SEPARATOR);
            markup.append(sep);
        }
        for (int i = 0; i < pnames.length; i++) {
            pwd.append(uriEncodePath(pnames[i]));
            // Every component except the last one is followed by a separator
            // in its link; the last one only when isDir is set.
            if (isDir || i < pnames.length - 1) {
                pwd.append(PATH_SEPARATOR);
            }
            // One anchor per component: link start, prefix + path so far +
            // postfix as the target, then the component name as link text.
            // NOTE(review): the component name is appended without HTML
            // escaping -- confirm that callers never pass untrusted names.
            markup.append(anchorLinkStart).append(prefix).append(pwd)
                    .append(postfix).append(closeQuotedTag).append(pnames[i])
                    .append(anchorEnd);
            // Same rule as above for the separator shown between the names.
            if (isDir || i < pnames.length - 1) {
                markup.append(sep);
            }
        }
        return markup.toString();
    }

    /**
     * Normalize the given path to its canonical form. I.e. all
     * separators (sep) are replaced with a slash ('/'), all double
     * slashes are replaced by a single slash, all single dot path components
     * (".") of the formed path are removed and all double dot path components
     * (".." ) of the formed path are replaced with its parent or '/' if there
     * is no parent.
     *

Variable	Value
Ignored files	"); printUnorderedList(out, env.getIgnoredNames().getItems()); out.append("

"); htmlize(item, buf); out.append(buf); buf.setLength(0); out.append("

"); } /** * Create a string literal for use in JavaScript functions. * * @param str the string to be represented by the literal * @return a JavaScript string literal */ public static String jsStringLiteral(String str) { StringBuilder sb = new StringBuilder(); sb.append('"'); for (int i = 0; i < str.length(); i++) { char c = str.charAt(i); switch (c) { case '"': sb.append("\\\""); break; case '\\': sb.append("\\\\"); break; case '\n': sb.append("\\n"); break; case '\r': sb.append("\\r"); break; default: sb.append(c); } } sb.append('"'); return sb.toString(); } /** * Make a path relative by stripping off a prefix. If the path does not have * the given prefix, return the full path unchanged. * * @param prefix the prefix to strip off * @param fullPath the path from which to remove the prefix * @return a path relative to {@code prefix} if {@code prefix} is a parent * directory of {@code fullPath}; otherwise, {@code fullPath} */ public static String stripPathPrefix(String prefix, String fullPath) { // Find the length of the prefix to strip off. The prefix should // represent a directory, so it could end with a slash. In case it // doesn't end with a slash, increase the length by one so that we // strip off the leading slash from the relative path. int prefixLength = prefix.length(); if (!prefix.endsWith("/")) { prefixLength++; } // If the full path starts with the prefix, strip off the prefix. if (fullPath.length() > prefixLength && fullPath.startsWith(prefix) && fullPath.charAt(prefixLength - 1) == '/') { return fullPath.substring(prefixLength); } // Otherwise, return the full path. return fullPath; } /** * Creates a HTML slider for pagination. This has the same effect as * invoking createSlider(offset, limit, size, null). 
* * @param offset start of the current page * @param limit max number of items per page * @param size number of total hits to paginate * @return string containing slider html */ public static String createSlider(int offset, int limit, int size) { return createSlider(offset, limit, size, null); } /** * Creates a HTML slider for pagination. * * @param offset start of the current page * @param limit max number of items per page * @param size number of total hits to paginate * @param request request containing URL parameters which should be appended * to the page URL * @return string containing slider html */ public static String createSlider(int offset, int limit, long size, HttpServletRequest request) { String slider = ""; if (limit < size) { final StringBuilder buf = new StringBuilder(4096); int lastPage = (int) Math.ceil((double) size / limit); // startingResult is the number of a first result on the current page int startingResult = offset - limit * (offset / limit % 10 + 1); int myFirstPage = startingResult < 0 ? 1 : startingResult / limit + 1; int myLastPage = Math.min(lastPage, myFirstPage + 10 + (myFirstPage == 1 ? 
0 : 1)); // function taking the page number and appending the desired content into the final buffer Function generatePageLink = page -> { int myOffset = Math.max(0, (page - 1) * limit); if (myOffset <= offset && offset < myOffset + limit) { // do not generate anchor for current page buf.append("").append(page).append(""); } else { buf.append(""); // add << or >> if this link would lead to another section if (page == myFirstPage && page != 1) { buf.append("<<"); } else if (page == myLastPage && myOffset + limit < size) { buf.append(">>"); } else { buf.append(page); } buf.append(""); } return null; }; // slider composition if (myFirstPage != 1) { generatePageLink.apply(1); buf.append("..."); } for (int page = myFirstPage; page <= myLastPage; page++) { generatePageLink.apply(page); } if (myLastPage != lastPage) { buf.append("..."); generatePageLink.apply(lastPage); } return buf.toString(); } return slider; } /** * Check if the string is a HTTP URL. * * @param string the string to check * @return true if it is http URL, false otherwise */ public static boolean isHttpUri(String string) { URL url; try { url = new URL(string); } catch (MalformedURLException ex) { return false; } return url.getProtocol().equals("http") || url.getProtocol().equals("https"); } protected static final String REDACTED_USER_INFO = "redacted_by_OpenGrok"; /** * If given path is a URL, return the string representation with the user-info part filtered out. * @param path path to object * @return either the original string or string representation of URL with the user-info part removed */ public static String redactUrl(String path) { URL url; try { url = new URL(path); } catch (MalformedURLException e) { // not an URL return path; } if (url.getUserInfo() != null) { return url.toString().replace(url.getUserInfo(), REDACTED_USER_INFO); } else { return path; } } /** * Build a HTML link to the given HTTP URL. If the URL is not an http URL * then it is returned as it was received. 
This has the same effect as * invoking linkify(url, true). * * @param url the text to be linkified * @return the linkified string * * @see #linkify(java.lang.String, boolean) */ public static String linkify(String url) { return linkify(url, true); } /** * Build a html link to the given http URL. If the URL is not an http URL * then it is returned as it was received. * * @param url the HTTP URL * @param newTab if the link should open in a new tab * @return HTML code containing the link <a>...</a> */ public static String linkify(String url, boolean newTab) { if (isHttpUri(url)) { try { Map attrs = new TreeMap<>(); attrs.put("href", url); attrs.put("title", String.format("Link to %s", Util.encode(url))); if (newTab) { attrs.put("target", "_blank"); attrs.put("rel", "noreferrer"); } return buildLink(url, attrs); } catch (URISyntaxException | MalformedURLException ex) { return url; } } return url; } /** * Build an anchor with given name and a pack of attributes. Automatically * escapes href attributes and automatically escapes the name into HTML * entities. * * @param name displayed name of the anchor * @param attrs map of attributes for the html element * @return string containing the result * * @throws URISyntaxException URI syntax * @throws MalformedURLException malformed URL */ public static String buildLink(String name, Map attrs) throws URISyntaxException, MalformedURLException { StringBuilder buffer = new StringBuilder(); buffer.append(" attr : attrs.entrySet()) { buffer.append(" "); buffer.append(attr.getKey()); buffer.append("=\""); String value = attr.getValue(); if (attr.getKey().equals("href")) { value = Util.encodeURL(value); } buffer.append(value); buffer.append("\""); } buffer.append(">"); buffer.append(Util.htmlize(name)); buffer.append(""); return buffer.toString(); } /** * Build an anchor with given name and a pack of attributes. Automatically * escapes href attributes and automatically escapes the name into HTML * entities. 
* * @param name displayed name of the anchor * @param url anchor's URL * @return string containing the result * * @throws URISyntaxException URI syntax * @throws MalformedURLException bad URL */ public static String buildLink(String name, String url) throws URISyntaxException, MalformedURLException { Map attrs = new TreeMap<>(); attrs.put("href", url); return buildLink(name, attrs); } /** * Build an anchor with given name and a pack of attributes. Automatically * escapes href attributes and automatically escapes the name into HTML * entities. * * @param name displayed name of the anchor * @param url anchor's URL * @param newTab a flag if the link should be opened in a new tab * @return string containing the result * * @throws URISyntaxException URI syntax * @throws MalformedURLException bad URL */ public static String buildLink(String name, String url, boolean newTab) throws URISyntaxException, MalformedURLException { Map attrs = new TreeMap<>(); attrs.put("href", url); if (newTab) { attrs.put("target", "_blank"); attrs.put("rel", "noreferrer"); } return buildLink(name, attrs); } /** * Replace all occurrences of pattern in the incoming text with the link * named name pointing to an URL. It is possible to use the regexp pattern * groups in name and URL when they are specified in the pattern. * * @param text text to replace all patterns * @param pattern the pattern to match * @param name link display name * @param url link URL * @return the text with replaced links */ public static String linkifyPattern(String text, Pattern pattern, String name, String url) { try { String buildLink = buildLink(name, url, true); return pattern.matcher(text).replaceAll(buildLink); } catch (URISyntaxException | MalformedURLException ex) { LOGGER.log(Level.WARNING, "The given URL ''{0}'' is not valid", url); return text; } } /** * Try to complete the given URL part into full URL with server name, port, * scheme, ... *

for request http://localhost:8080/source/xref/xxx and part * /cgi-bin/user=: http://localhost:8080/cgi-bin/user=
for request http://localhost:8080/source/xref/xxx and part * cgi-bin/user=: http://localhost:8080/source/xref/xxx/cgi-bin/user=
for request http://localhost:8080/source/xref/xxx and part * http://users.com/user=: http://users.com/user=

* * @param url the given URL part, may be already full URL * @param req the request containing the information about the server * @return the converted URL or the input parameter if there was an error */ public static String completeUrl(String url, HttpServletRequest req) { try { if (!isHttpUri(url)) { if (url.startsWith("/")) { return new URI(req.getScheme(), null, req.getServerName(), req.getServerPort(), url, null, null).toString(); } StringBuffer prepUrl = req.getRequestURL(); if (!url.isEmpty()) { prepUrl.append('/').append(url); } return new URI(prepUrl.toString()).toString(); } return url; } catch (URISyntaxException ex) { LOGGER.log(Level.INFO, String.format("Unable to convert given URL part '%s' to complete URL", url), ex); return url; } } /** * Parses the specified URL and returns its query params. * @param url URL to retrieve the query params from * @return query params of {@code url} */ public static Map> getQueryParams(final URL url) { if (url == null) { throw new IllegalArgumentException("Cannot get query params from the null url"); } Map> returnValue = new HashMap<>(); if (url.getQuery() == null) { return returnValue; } String[] pairs = url.getQuery().split("&"); for (String pair : pairs) { if (pair.isEmpty()) { continue; } int idx = pair.indexOf('='); if (idx == -1) { returnValue.computeIfAbsent(pair, k -> new LinkedList<>()); continue; } String key = URLDecoder.decode(pair.substring(0, idx), StandardCharsets.UTF_8); String value = URLDecoder.decode(pair.substring(idx + 1), StandardCharsets.UTF_8); List paramValues = returnValue.computeIfAbsent(key, k -> new LinkedList<>()); paramValues.add(value); } return returnValue; } }