/*
 * Copyright (c) 2004, 2020, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.  Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

package com.sun.tools.javac.parser;

import com.sun.tools.javac.parser.Tokens.Comment;
import com.sun.tools.javac.parser.Tokens.Comment.CommentStyle;
import com.sun.tools.javac.util.*;

import java.nio.CharBuffer;
import java.util.Arrays;
import java.util.regex.Pattern;

An extension to the base lexical analyzer (JavaTokenizer) that captures and processes the contents of doc comments. It does so by stripping the leading whitespace and comment starts from each line of the Javadoc comment.

This is NOT part of any supported API. If you write code that depends on this, you do so at your own risk. This code and its internal interfaces are subject to change or deletion without notice.

/** * An extension to the base lexical analyzer (JavaTokenizer) that * captures and processes the contents of doc comments. It does * so by stripping the leading whitespace and comment starts from * each line of the Javadoc comment. * * <p><b>This is NOT part of any supported API. * If you write code that depends on this, you do so at your own risk. * This code and its internal interfaces are subject to change or * deletion without notice.</b> */
public class JavadocTokenizer extends JavaTokenizer {
The factory that created this Scanner.
/** * The factory that created this Scanner. */
final ScannerFactory fac;
Create a tokenizer from the input character buffer. The input buffer content would typically be a Javadoc comment extracted by JavaTokenizer.
Params:
  • fac – the factory which created this Scanner.
  • cb – the input character buffer.
/** * Create a tokenizer from the input character buffer. The input buffer * content would typically be a Javadoc comment extracted by * JavaTokenizer. * * @param fac the factory which created this Scanner. * @param cb the input character buffer. */
protected JavadocTokenizer(ScannerFactory fac, CharBuffer cb) { super(fac, cb); this.fac = fac; }
Create a tokenizer from the input array. The input buffer content would typically be a Javadoc comment extracted by JavaTokenizer.
Params:
  • fac – factory which created this Scanner
  • array – input character array.
  • length – length of the meaningful content in the array.
/** * Create a tokenizer from the input array. The input buffer * content would typically be a Javadoc comment extracted by * JavaTokenizer. * * @param fac factory which created this Scanner * @param array input character array. * @param length length of the meaningful content in the array. */
protected JavadocTokenizer(ScannerFactory fac, char[] array, int length) { super(fac, array, length); this.fac = fac; } @Override protected Comment processComment(int pos, int endPos, CommentStyle style) { char[] buf = getRawCharacters(pos, endPos); return new JavadocComment(style, fac, buf, pos); }
An extension of BasicComment used to extract the relevant portion of a Javadoc comment.
/** * An extension of BasicComment used to extract the relevant portion * of a Javadoc comment. */
protected static class JavadocComment extends BasicComment {
Pattern used to detect a well formed @deprecated tag in a JaavDoc comment.
/** * Pattern used to detect a well formed @deprecated tag in a JaavDoc * comment. */
private static final Pattern DEPRECATED_PATTERN = Pattern.compile("(?sm).*^\\s*@deprecated( |$).*");
The relevant portion of the comment that is of interest to Javadoc. Produced by invoking scanDocComment.
/** * The relevant portion of the comment that is of interest to Javadoc. * Produced by invoking scanDocComment. */
private String docComment = null;
StringBuilder used to extract the relevant portion of the Javadoc comment.
/** * StringBuilder used to extract the relevant portion of the Javadoc comment. */
private final StringBuilder sb;
Map used to map the extracted Javadoc comment's character positions back to the original source.
/** * Map used to map the extracted Javadoc comment's character positions back to * the original source. */
OffsetMap offsetMap = new OffsetMap(); JavadocComment(CommentStyle cs, ScannerFactory sf, char[] array, int offset) { super( cs, sf, array, offset); this.sb = new StringBuilder(); }
Add a character to the extraction buffer.
Params:
  • ch – character to add.
/** * Add a character to the extraction buffer. * * @param ch character to add. */
protected void put(char ch) { offsetMap.add(sb.length(), offsetPosition()); sb.append(ch); }
Add a code point to the extraction buffer.
Params:
  • codePoint – code point to add.
/** * Add a code point to the extraction buffer. * * @param codePoint code point to add. */
protected void putCodePoint(int codePoint) { offsetMap.add(sb.length(), offsetPosition()); sb.appendCodePoint(codePoint); }
Add current character or code point to the extraction buffer.
/** * Add current character or code point to the extraction buffer. */
protected void put() { if (isSurrogate()) { putCodePoint(getCodepoint()); } else { put(get()); } } @Override public String getText() { if (!scanned && cs == CommentStyle.JAVADOC) { scanDocComment(); } return docComment; } @Override public int getSourcePos(int pos) { if (pos == Position.NOPOS) { return Position.NOPOS; } if (pos < 0 || pos > docComment.length()) { throw new StringIndexOutOfBoundsException(String.valueOf(pos)); } return offsetMap.getSourcePos(pos); } @Override protected void scanDocComment() { try { boolean firstLine = true; // Skip over /* accept("/*"); // Consume any number of stars skip('*'); // Is the comment in the form /**/, /***/, /****/, etc. ? if (is('/')) { docComment = ""; return; } // Skip line terminator on the first line of the comment. if (isOneOf('\n', '\r')) { accept('\r'); accept('\n'); firstLine = false; } outerLoop: // The outerLoop processes the doc comment, looping once // for each line. For each line, it first strips off // whitespace, then it consumes any stars, then it // puts the rest of the line into the extraction buffer. while (isAvailable()) { int begin_pos = position(); // Consume whitespace from the beginning of each line. skipWhitespace(); // Are there stars here? If so, consume them all // and check for the end of comment. if (is('*')) { // skip all of the stars skip('*'); // check for the closing slash. if (accept('/')) { // We're done with the Javadoc comment break outerLoop; } } else if (!firstLine) { // The current line does not begin with a '*' so we will // treat it as comment reset(begin_pos); } textLoop: // The textLoop processes the rest of the characters // on the line, adding them to the extraction buffer. while (isAvailable()) { if (accept("*/")) { // This is the end of the comment, return // the contents of the extraction buffer. break outerLoop; } else if (isOneOf('\n', '\r')) { // We've seen a newline. Add it to our // buffer and break out of this loop, // starting fresh on a new line. put('\n'); accept('\r'); accept('\n'); break textLoop; } else if (is('\f')){ next(); break textLoop; // treat as end of line } else { // Add the character to our buffer. put(); next(); } } // end textLoop firstLine = false; } // end outerLoop // If extraction buffer is not empty. if (sb.length() > 0) { // Remove trailing asterisks. int i = sb.length() - 1; while (i > -1 && sb.charAt(i) == '*') { i--; } sb.setLength(i + 1) ; // Store the text of the doc comment docComment = sb.toString(); } else { docComment = ""; } } finally { scanned = true; // Check if comment contains @deprecated comment. if (docComment != null && DEPRECATED_PATTERN.matcher(docComment).matches()) { deprecatedFlag = true; } } } }
Build a map for translating between line numbers and positions in the input. Overridden to expand tabs.
Returns:a LineMap
/** * Build a map for translating between line numbers and positions in the input. * Overridden to expand tabs. * * @return a LineMap */
@Override public Position.LineMap getLineMap() { char[] buf = getRawCharacters(); return Position.makeLineMap(buf, buf.length, true); }
Build an int table to mapping positions in extracted Javadoc comment to positions in the JavaTokenizer source buffer. The array is organized as a series of pairs of integers: the first number in each pair specifies a position in the comment text, the second number in each pair specifies the corresponding position in the source buffer. The pairs are sorted in ascending order. Since the mapping function is generally continuous, with successive positions in the string corresponding to successive positions in the source buffer, the table only needs to record discontinuities in the mapping. The values of intermediate positions can be inferred. Discontinuities may occur in a number of places: when a newline is followed by whitespace and asterisks (which are ignored), when a tab is expanded into spaces, and when unicode escapes are used in the source buffer. Thus, to find the source position of any position, p, in the comment string, find the index, i, of the pair whose string offset (map[i * NOFFSETS + SB_OFFSET] ) is closest to but not greater than p. Then, sourcePos(p) = map[i * NOFFSETS + POS_OFFSET] + (p - map[i * NOFFSETS + SB_OFFSET]) .
/** * Build an int table to mapping positions in extracted Javadoc comment * to positions in the JavaTokenizer source buffer. * * The array is organized as a series of pairs of integers: the first * number in each pair specifies a position in the comment text, * the second number in each pair specifies the corresponding position * in the source buffer. The pairs are sorted in ascending order. * * Since the mapping function is generally continuous, with successive * positions in the string corresponding to successive positions in the * source buffer, the table only needs to record discontinuities in * the mapping. The values of intermediate positions can be inferred. * * Discontinuities may occur in a number of places: when a newline * is followed by whitespace and asterisks (which are ignored), * when a tab is expanded into spaces, and when unicode escapes * are used in the source buffer. * * Thus, to find the source position of any position, p, in the comment * string, find the index, i, of the pair whose string offset * ({@code map[i * NOFFSETS + SB_OFFSET] }) is closest to but not greater * than p. Then, {@code sourcePos(p) = map[i * NOFFSETS + POS_OFFSET] + * (p - map[i * NOFFSETS + SB_OFFSET]) }. */
static class OffsetMap {
map entry offset for comment offset member of pair.
/** * map entry offset for comment offset member of pair. */
private static final int SB_OFFSET = 0;
map entry offset of input offset member of pair.
/** * map entry offset of input offset member of pair. */
private static final int POS_OFFSET = 1;
Number of elements in each entry.
/** * Number of elements in each entry. */
private static final int NOFFSETS = 2;
Array storing entries in map.
/** * Array storing entries in map. */
private int[] map;
Logical size of map (number of valid entries.)
/** * Logical size of map (number of valid entries.) */
private int size;
Constructor.
/** * Constructor. */
OffsetMap() { this.map = new int[128]; this.size = 0; }
Returns true if it is worthwhile adding the entry pair to the map. That is if there is a change in relative offset.
Params:
  • sbOffset – comment offset member of pair.
  • posOffet – input offset member of pair.
Returns:true if it is worthwhile adding the entry pair.
/** * Returns true if it is worthwhile adding the entry pair to the map. That is * if there is a change in relative offset. * * @param sbOffset comment offset member of pair. * @param posOffet input offset member of pair. * * @return true if it is worthwhile adding the entry pair. */
boolean shouldAdd(int sbOffset, int posOffet) { return sbOffset - lastSBOffset() != posOffet - lastPosOffset(); }
Adds entry pair if worthwhile.
Params:
  • sbOffset – comment offset member of pair.
  • posOffet – input offset member of pair.
/** * Adds entry pair if worthwhile. * * @param sbOffset comment offset member of pair. * @param posOffet input offset member of pair. */
void add(int sbOffset, int posOffet) { if (size == 0 || shouldAdd(sbOffset, posOffet)) { ensure(NOFFSETS); map[size + SB_OFFSET] = sbOffset; map[size + POS_OFFSET] = posOffet; size += NOFFSETS; } }
Returns the previous comment offset.
Returns:the previous comment offset.
/** * Returns the previous comment offset. * * @return the previous comment offset. */
private int lastSBOffset() { return size == 0 ? 0 : map[size - NOFFSETS + SB_OFFSET]; }
Returns the previous input offset.
Returns:the previous input offset.
/** * Returns the previous input offset. * * @return the previous input offset. */
private int lastPosOffset() { return size == 0 ? 0 : map[size - NOFFSETS + POS_OFFSET]; }
Ensures there is enough space for a new entry.
Params:
  • need – number of array slots needed.
/** * Ensures there is enough space for a new entry. * * @param need number of array slots needed. */
private void ensure(int need) { need += size; int grow = map.length; while (need > grow) { grow <<= 1; } // Handle overflow. if (grow < map.length) { throw new IndexOutOfBoundsException(); } else if (grow != map.length) { map = Arrays.copyOf(map, grow); } }
Binary search to find the entry for which the string index is less than pos. Since the map is a list of pairs of integers we must make sure the index is always NOFFSETS scaled. If we find an exact match for pos, the other item in the pair gives the source pos; otherwise, compute the source position relative to the best match found in the array.
/** * Binary search to find the entry for which the string index is less * than pos. Since the map is a list of pairs of integers we must make * sure the index is always NOFFSETS scaled. If we find an exact match * for pos, the other item in the pair gives the source pos; otherwise, * compute the source position relative to the best match found in the * array. */
int getSourcePos(int pos) { if (size == 0) { return Position.NOPOS; } int start = 0; int end = size / NOFFSETS; while (start < end - 1) { // find an index midway between start and end int index = (start + end) / 2; int indexScaled = index * NOFFSETS; if (map[indexScaled + SB_OFFSET] < pos) { start = index; } else if (map[indexScaled + SB_OFFSET] == pos) { return map[indexScaled + POS_OFFSET]; } else { end = index; } } int startScaled = start * NOFFSETS; return map[startScaled + POS_OFFSET] + (pos - map[startScaled + SB_OFFSET]); } } }