| 1 | /* |
|---|---|
| 2 | * Copyright (C) 2007-2010 Júlio Vilmar Gesser. |
| 3 | * Copyright (C) 2011, 2013-2020 The JavaParser Team. |
| 4 | * |
| 5 | * This file is part of JavaParser. |
| 6 | * |
| 7 | * JavaParser can be used either under the terms of |
| 8 | * a) the GNU Lesser General Public License as published by |
| 9 | * the Free Software Foundation, either version 3 of the License, or |
| 10 | * (at your option) any later version. |
| 11 | * b) the terms of the Apache License |
| 12 | * |
| 13 | * You should have received a copy of both licenses in LICENCE.LGPL and |
| 14 | * LICENCE.APACHE. Please refer to those files for details. |
| 15 | * |
| 16 | * JavaParser is distributed in the hope that it will be useful, |
| 17 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 18 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 19 | * GNU Lesser General Public License for more details. |
| 20 | */ |
| 21 | |
| 22 | package com.github.javaparser; |
| 23 | |
| 24 | import com.github.javaparser.ast.comments.JavadocComment; |
| 25 | import com.github.javaparser.javadoc.Javadoc; |
| 26 | import com.github.javaparser.javadoc.JavadocBlockTag; |
| 27 | import com.github.javaparser.javadoc.description.JavadocDescription; |
| 28 | import java.util.Arrays; |
| 29 | import java.util.Collections; |
| 30 | import java.util.List; |
| 31 | import java.util.regex.Pattern; |
| 32 | import java.util.stream.Collectors; |
| 33 | |
| 34 | import static com.github.javaparser.utils.Utils.*; |
| 35 | |
| 36 | /** |
| 37 | * The class responsible for parsing the content of JavadocComments and producing JavadocDocuments. |
| 38 | * <a href="https://docs.oracle.com/javase/1.5.0/docs/tooldocs/windows/javadoc.html">The Javadoc specification.</a> |
| 39 | */ |
| 40 | class JavadocParser { |
| 41 | |
| 42 | private static String BLOCK_TAG_PREFIX = "@"; |
| 43 | private static Pattern BLOCK_PATTERN = Pattern.compile("^\\s*" + BLOCK_TAG_PREFIX, Pattern.MULTILINE); |
| 44 | |
| 45 | public static Javadoc parse(JavadocComment comment) { |
| 46 | return parse(comment.getContent()); |
| 47 | } |
| 48 | |
| 49 | public static Javadoc parse(String commentContent) { |
| 50 | List<String> cleanLines = cleanLines(normalizeEolInTextBlock(commentContent, SYSTEM_EOL)); |
| 51 | int indexOfFirstBlockTag = cleanLines.stream() |
| 52 | .filter(JavadocParser::isABlockLine) |
| 53 | .map(cleanLines::indexOf) |
| 54 | .findFirst() |
| 55 | .orElse(-1); |
| 56 | List<String> blockLines; |
| 57 | String descriptionText; |
| 58 | if (indexOfFirstBlockTag == -1) { |
| 59 | descriptionText = trimRight(String.join(SYSTEM_EOL, cleanLines)); |
| 60 | blockLines = Collections.emptyList(); |
| 61 | } else { |
| 62 | descriptionText = trimRight(String.join(SYSTEM_EOL, cleanLines.subList(0, indexOfFirstBlockTag))); |
| 63 | |
| 64 | //Combine cleaned lines, but only starting with the first block tag till the end |
| 65 | //In this combined string it is easier to handle multiple lines which actually belong together |
| 66 | String tagBlock = cleanLines.subList(indexOfFirstBlockTag, cleanLines.size()) |
| 67 | .stream() |
| 68 | .collect(Collectors.joining(SYSTEM_EOL)); |
| 69 | |
| 70 | //Split up the entire tag back again, considering now that some lines belong to the same block tag. |
| 71 | //The pattern splits the block at each new line starting with the '@' symbol, thus the symbol |
| 72 | //then needs to be added again so that the block parsers handles everything correctly. |
| 73 | blockLines = BLOCK_PATTERN |
| 74 | .splitAsStream(tagBlock) |
| 75 | .filter(s1 -> !s1.isEmpty()) |
| 76 | .map(s -> BLOCK_TAG_PREFIX + s) |
| 77 | .collect(Collectors.toList()); |
| 78 | } |
| 79 | Javadoc document = new Javadoc(JavadocDescription.parseText(descriptionText)); |
| 80 | blockLines.forEach(l -> document.addBlockTag(parseBlockTag(l))); |
| 81 | return document; |
| 82 | } |
| 83 | |
| 84 | private static JavadocBlockTag parseBlockTag(String line) { |
| 85 | line = line.trim().substring(1); |
| 86 | String tagName = nextWord(line); |
| 87 | String rest = line.substring(tagName.length()).trim(); |
| 88 | return new JavadocBlockTag(tagName, rest); |
| 89 | } |
| 90 | |
| 91 | private static boolean isABlockLine(String line) { |
| 92 | return line.trim().startsWith(BLOCK_TAG_PREFIX); |
| 93 | } |
| 94 | |
| 95 | private static String trimRight(String string) { |
| 96 | while (!string.isEmpty() && Character.isWhitespace(string.charAt(string.length() - 1))) { |
| 97 | string = string.substring(0, string.length() - 1); |
| 98 | } |
| 99 | return string; |
| 100 | } |
| 101 | |
| 102 | private static List<String> cleanLines(String content) { |
| 103 | String[] lines = content.split(SYSTEM_EOL); |
| 104 | if (lines.length == 0) { |
| 105 | return Collections.emptyList(); |
| 106 | } |
| 107 | |
| 108 | List<String> cleanedLines = Arrays.stream(lines).map(l -> { |
| 109 | int asteriskIndex = startsWithAsterisk(l); |
| 110 | if (asteriskIndex == -1) { |
| 111 | return l; |
| 112 | } else { |
| 113 | // if a line starts with space followed by an asterisk drop to the asterisk |
| 114 | // if there is a space immediately after the asterisk drop it also |
| 115 | if (l.length() > (asteriskIndex + 1)) { |
| 116 | |
| 117 | char c = l.charAt(asteriskIndex + 1); |
| 118 | if (c == ' ' || c == '\t') { |
| 119 | return l.substring(asteriskIndex + 2); |
| 120 | } |
| 121 | } |
| 122 | return l.substring(asteriskIndex + 1); |
| 123 | } |
| 124 | }).collect(Collectors.toList()); |
| 125 | // lines containing only whitespace are normalized to empty lines |
| 126 | cleanedLines = cleanedLines.stream().map(l -> l.trim().isEmpty() ? "" : l).collect(Collectors.toList()); |
| 127 | // if the first starts with a space, remove it |
| 128 | if (!cleanedLines.get(0).isEmpty() && (cleanedLines.get(0).charAt(0) == ' ' || cleanedLines.get(0).charAt(0) == '\t')) { |
| 129 | cleanedLines.set(0, cleanedLines.get(0).substring(1)); |
| 130 | } |
| 131 | // drop empty lines at the beginning and at the end |
| 132 | while (cleanedLines.size() > 0 && cleanedLines.get(0).trim().isEmpty()) { |
| 133 | cleanedLines = cleanedLines.subList(1, cleanedLines.size()); |
| 134 | } |
| 135 | while (cleanedLines.size() > 0 && cleanedLines.get(cleanedLines.size() - 1).trim().isEmpty()) { |
| 136 | cleanedLines = cleanedLines.subList(0, cleanedLines.size() - 1); |
| 137 | } |
| 138 | return cleanedLines; |
| 139 | } |
| 140 | |
| 141 | // Visible for testing |
| 142 | static int startsWithAsterisk(String line) { |
| 143 | if (line.startsWith("*")) { |
| 144 | return 0; |
| 145 | } else if ((line.startsWith(" ") || line.startsWith("\t")) && line.length() > 1) { |
| 146 | int res = startsWithAsterisk(line.substring(1)); |
| 147 | if (res == -1) { |
| 148 | return -1; |
| 149 | } else { |
| 150 | return 1 + res; |
| 151 | } |
| 152 | } else { |
| 153 | return -1; |
| 154 | } |
| 155 | } |
| 156 | } |
| 157 |
Members