001////////////////////////////////////////////////////////////////////////////////
002// checkstyle: Checks Java source code for adherence to a set of rules.
003// Copyright (C) 2001-2018 the original author or authors.
004//
005// This library is free software; you can redistribute it and/or
006// modify it under the terms of the GNU Lesser General Public
007// License as published by the Free Software Foundation; either
008// version 2.1 of the License, or (at your option) any later version.
009//
010// This library is distributed in the hope that it will be useful,
011// but WITHOUT ANY WARRANTY; without even the implied warranty of
012// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
013// Lesser General Public License for more details.
014//
015// You should have received a copy of the GNU Lesser General Public
016// License along with this library; if not, write to the Free Software
017// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
018////////////////////////////////////////////////////////////////////////////////
019
020package com.puppycrawl.tools.checkstyle.checks.javadoc.utils;
021
022import java.util.ArrayList;
023import java.util.List;
024import java.util.regex.Matcher;
025import java.util.regex.Pattern;
026
027import com.puppycrawl.tools.checkstyle.api.LineColumn;
028
029/**
030 * Tools for extracting inline tags from Javadoc comments.
031 *
032 */
033public final class InlineTagUtils {
034
035    /**
036     * Inline tag pattern.
037     */
038    private static final Pattern INLINE_TAG_PATTERN = Pattern.compile(
039            ".*?\\{@(\\p{Alpha}+)\\b(.*?)}", Pattern.DOTALL);
040
041    /** Pattern to recognize leading "*" characters in Javadoc. */
042    private static final Pattern JAVADOC_PREFIX_PATTERN = Pattern.compile(
043        "^\\s*\\*", Pattern.MULTILINE);
044
045    /** Pattern matching whitespace, used by {@link InlineTagUtils#collapseWhitespace(String)}. */
046    private static final Pattern WHITESPACE_PATTERN = Pattern.compile("\\s+");
047
048    /** Pattern matching a newline. */
049    private static final Pattern NEWLINE_PATTERN = Pattern.compile("\\n");
050
051    /** Line feed character. */
052    private static final String LINE_FEED = "\n";
053
054    /** Carriage return character. */
055    private static final String CARRIAGE_RETURN = "\r";
056
057    /** Prevent instantiation. */
058    private InlineTagUtils() {
059    }
060
061    /**
062     * Extract inline Javadoc tags from the given comment.
063     * @param lines The Javadoc comment (as lines).
064     * @return The extracted inline Javadoc tags.
065     */
066    public static List<TagInfo> extractInlineTags(String... lines) {
067        for (String line : lines) {
068            if (line.contains(LINE_FEED) || line.contains(CARRIAGE_RETURN)) {
069                throw new IllegalArgumentException("comment lines cannot contain newlines");
070            }
071        }
072
073        final String commentText = convertLinesToString(lines);
074        final Matcher inlineTagMatcher = INLINE_TAG_PATTERN.matcher(commentText);
075
076        final List<TagInfo> tags = new ArrayList<>();
077
078        while (inlineTagMatcher.find()) {
079            final String tagName = inlineTagMatcher.group(1);
080
081            // Remove the leading asterisks (in case the tag spans a line) and collapse
082            // the whitespace.
083            String matchedTagValue = inlineTagMatcher.group(2);
084            matchedTagValue = removeLeadingJavaDoc(matchedTagValue);
085            matchedTagValue = collapseWhitespace(matchedTagValue);
086
087            final String tagValue = matchedTagValue;
088
089            final int startIndex = inlineTagMatcher.start(1);
090            final LineColumn position = getLineColumnOfIndex(commentText,
091                // correct start index offset
092                startIndex - 1);
093
094            tags.add(new TagInfo(tagName, tagValue, position));
095        }
096
097        return tags;
098    }
099
100    /**
101     * Convert array of string to single String.
102     * @param lines A number of lines, in order.
103     * @return The lines, joined together with newlines, as a single string.
104     */
105    private static String convertLinesToString(String... lines) {
106        final StringBuilder builder = new StringBuilder(1024);
107        for (String line : lines) {
108            builder.append(line);
109            builder.append(LINE_FEED);
110        }
111        return builder.toString();
112    }
113
114    /**
115     * Get LineColumn from string till index.
116     * @param source Source string.
117     * @param index An index into the string.
118     * @return A position in the source representing what line and column that index appears on.
119     */
120    private static LineColumn getLineColumnOfIndex(String source, int index) {
121        final String precedingText = source.subSequence(0, index).toString();
122        final String[] precedingLines = NEWLINE_PATTERN.split(precedingText);
123        final String lastLine = precedingLines[precedingLines.length - 1];
124        return new LineColumn(precedingLines.length, lastLine.length());
125    }
126
127    /**
128     * Collapse whitespaces.
129     * @param str Source string.
130     * @return The given string with all whitespace collapsed.
131     */
132    private static String collapseWhitespace(String str) {
133        final Matcher matcher = WHITESPACE_PATTERN.matcher(str);
134        return matcher.replaceAll(" ").trim();
135    }
136
137    /**
138     * Remove leading JavaDoc.
139     * @param source A string to remove leading Javadoc from.
140     * @return The given string with leading Javadoc "*" characters from each line removed.
141     */
142    private static String removeLeadingJavaDoc(String source) {
143        final Matcher matcher = JAVADOC_PREFIX_PATTERN.matcher(source);
144        return matcher.replaceAll("");
145    }
146
147}