<?xml version="1.0" encoding="UTF-8"?>
<!--
~ BSD-style license; for more info see http://pmd.sourceforge.net/license.html
-->
<project name="pmd" default="alljavacc" basedir="/">
<!-- Wraps a JavaCC/JJTree task and adapts the generated sources to the PMD
     codebase.

     Input parameters:
       - lang-name:           Capitalized name of the language, e.g. Jsp or Java.
                              By convention the grammar file must be named exactly
                              so, with a .jj[t] extension.
       - lang-name-camelcase: Name of the language in camelcase. Useful for languages
                              whose name is an acronym, e.g. PLSQL (in camelcase, "Plsql").
                              Defaults to lang-name.
       - lang-terse-name:     Terse name, used in the conventional package names.

     It also uses the following Maven properties:
       - javacc.outputDirectory: Directory in which to root the generated package tree
       - javacc.jar:             JAR of JavaCC in the local Maven repository
       - some properties of project.build
-->
<!-- Derived properties shared by all targets below. They are declared in
     dependency order: a property may only reference properties declared
     before it (or supplied by the caller). -->

<!-- lang-name-camelcase falls back to lang-name when the caller did not set it. -->
<condition property="lang-name-camelcase" value="${lang-name}">
    <!-- Eg for "PLSQL": "Plsql" -->
    <not>
        <isset property="lang-name-camelcase" />
    </not>
</condition>

<!-- Directories and bookkeeping files -->
<property name="target-package-dir" value="${javacc.outputDirectory}/net/sourceforge/pmd/lang/${lang-terse-name}/ast" />
<property name="stamp-file" value="${project.build.directory}/last-generated-timestamp" />
<property name="javacc-home.path" value="${project.build.directory}/lib/javacc" />

<!-- Package names -->
<property name="lang-ast-package" value="net.sourceforge.pmd.lang.${lang-terse-name}.ast" />
<property name="ast-api-package" value="net.sourceforge.pmd.lang.ast" />
<property name="ast-impl-package" value="${ast-api-package}.impl.javacc" />
<property name="grammar-file" value="etc/grammar/${lang-name}.jjt" />

<!-- Parser -->
<property name="parser-name" value="${lang-name}ParserImpl" />
<property name="parser-file" value="${target-package-dir}/${parser-name}.java" />

<!-- Nodes and token constants -->
<property name="ast-prefix" value="AST" />
<property name="constants-itf-name" value="${parser-name}Constants" />
<property name="constants-itf-file" value="${target-package-dir}/${constants-itf-name}.java" />
<property name="token-constants-name" value="${lang-name}TokenKinds" />
<property name="token-constants-file" value="${target-package-dir}/${token-constants-name}.java" />
<property name="node-name" value="${lang-name}Node" />
<property name="base-class-name" value="Abstract${lang-name}Node" />

<!-- Token manager -->
<!-- This will be moved to impl package when all language modules have been ported -->
<property name="base-tokenmgr" value="${ast-impl-package}.AbstractTokenManager" />
<property name="charstream-itf" value="${ast-impl-package}.CharStream" />
<property name="tokenmgr-name" value="${parser-name}TokenManager" />
<property name="tokenmgr-file" value="${target-package-dir}/${tokenmgr-name}.java" />

<!-- Visitor names -->
<!-- This is the default name generated by JJTree -->
<property name="gen-visitor-name" value="${parser-name}Visitor" />
<!-- This is the actual name we use -->
<property name="generic-visitor-interface-name" value="${lang-name-camelcase}Visitor" />
<property name="generic-visitor-interface-file"
          value="${target-package-dir}/${generic-visitor-interface-name}.java" />
<!-- TARGETS -->
<!-- Aggregate target: it has no tasks of its own and only chains the
     individual steps through its depends list, in the order given. -->
<target name="alljavacc"
        depends="checkUpToDate,init,jjtree,jjtree-ersatz,javacc,adapt-generated,default-visitor,cleanup"
        description="Generates JavaCC sources and cleans them up" />
<!-- Decides which generation steps can be skipped.
       - javaccBuildNotRequired is set when the stamp file is newer than the
         grammar file(s) of this language and than this build file.
       - jjtreeBuildNotRequired is set when javaccBuildNotRequired is set, or
         when the caller defined no-jjtree. -->
<target description="Checks the input files are up to date"
        name="checkUpToDate">
    <uptodate targetfile="${stamp-file}" property="javaccBuildNotRequired">
        <srcfiles file="${ant.file}" />
        <srcfiles includes="${lang-name}.jj*" dir="etc/grammar" />
    </uptodate>

    <echo message="Up-to-date check: javaccBuildNotRequired=${javaccBuildNotRequired}" />

    <condition property="jjtreeBuildNotRequired">
        <or>
            <isset property="javaccBuildNotRequired" />
            <isset property="no-jjtree" />
        </or>
    </condition>
</target>
<!-- Prepares the working directories; skipped when javaccBuildNotRequired is set. -->
<target description="Initialize build" name="init" unless="javaccBuildNotRequired">
    <!-- Temporary JavaCC home containing a copy of the JavaCC jar -->
    <mkdir dir="${javacc-home.path}" />
    <copy tofile="${javacc-home.path}/javacc.jar" file="${javacc.jar}" />

    <mkdir dir="${javacc.outputDirectory}" />

    <!-- Refresh the stamp file that checkUpToDate compares against.
         NOTE(review): the stamp is updated before generation has run, so a
         failed generation may still look up to date on the next build. -->
    <touch file="${stamp-file}" />

    <!-- Start from an empty package directory -->
    <delete dir="${target-package-dir}" />
    <mkdir dir="${target-package-dir}" />
</target>
<!-- Removes the temporary JavaCC home directory (the one created by init). -->
<target unless="javaccBuildNotRequired" name="cleanup">
    <delete dir="${javacc-home.path}" />
</target>
<!-- Runs JJTree on the .jjt grammar of the language. The output, including
     the .jj file consumed by the javacc target, goes to the target package
     directory. Skipped when jjtreeBuildNotRequired is set. -->
<target name="jjtree" unless="jjtreeBuildNotRequired" description="Runs JJTree">
    <!--
      Token-tracking behavior is implemented in the JJTree builder,
      so the grammar should have TRACK_TOKEN=false; (this is the default value)
    -->
    <jjtree target="etc/grammar/${lang-name}.jjt"
            outputdirectory="${target-package-dir}"
            nodeusesparser="false"
            nodepackage="${lang-ast-package}"
            javacchome="${javacc-home.path}" />
</target>
<!-- Stand-in for the jjtree target, run only when the caller set no-jjtree:
     copies the hand-written .jj grammar into the target directory, which is
     where the javacc target looks for its input. -->
<target unless="javaccBuildNotRequired" if="no-jjtree" name="jjtree-ersatz">
    <copy todir="${target-package-dir}" file="etc/grammar/${lang-name}.jj" />
</target>
<!-- Runs JavaCC on the .jj grammar found in the target package directory
     (put there by either jjtree or jjtree-ersatz) and writes the generated
     parser sources next to it. Skipped when javaccBuildNotRequired is set. -->
<target name="javacc" depends="jjtree" unless="javaccBuildNotRequired">
    <javacc static="false"
            usercharstream="true"
            unicodeinput="true"
            target="${target-package-dir}/${lang-name}.jj"
            outputdirectory="${target-package-dir}"
            javacchome="${javacc-home.path}" />
</target>
<!-- Post-processes the generated sources in place. The steps below are
     order-dependent textual rewrites: the generated support classes are
     deleted first, then the per-file cleanups run, then generic renames are
     applied to every file of the target package directory. -->
<target name="adapt-generated" unless="javaccBuildNotRequired">

    <!-- Generated support classes that are not kept -->
    <delete file="${target-package-dir}/Node.java" />
    <delete file="${target-package-dir}/SimpleNode.java" />
    <delete file="${target-package-dir}/JJT${parser-name}State.java" />
    <delete file="${target-package-dir}/CharStream.java" />
    <delete file="${target-package-dir}/ParseException.java" />
    <delete file="${target-package-dir}/Token.java" />
    <delete file="${target-package-dir}/TokenMgrError.java" />

    <!-- Remove all duplicate files, i.e. generated files that also exist
         at the same relative path under project.build.sourceDirectory -->
    <delete>
        <fileset dir="${javacc.outputDirectory}">
            <present present="both" targetdir="${project.build.sourceDirectory}" />
        </fileset>
    </delete>

    <antcall target="cleanup-token-manager" />
    <antcall target="cleanup-parser" />
    <antcall target="cleanup-nodes" />

    <!-- Map Javacc names to our names -->
    <replaceregexp flags="g">
        <regexp pattern="\bToken\b" />
        <substitution expression="${ast-impl-package}.JavaccToken" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <!-- The lookbehind skips occurrences that are already qualified -->
    <replaceregexp flags="g">
        <regexp pattern="(?&lt;!\.)\bCharStream\b" />
        <substitution expression="${charstream-itf}" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <antcall target="constants-files" />

    <!-- For compatibility: field reads become getter calls. The lookahead
         leaves assignments to .image untouched. -->
    <replaceregexp flags="g">
        <regexp pattern="\.image\b(?! =)" />
        <substitution expression=".getImage()" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <replace token=".beginLine" value=".getBeginLine()">
        <fileset dir="${target-package-dir}" />
    </replace>

    <replace token=".beginColumn" value=".getBeginColumn()">
        <fileset dir="${target-package-dir}" />
    </replace>

    <!-- Used by debug modes -->
    <replace token="TokenMgrError.addEscapes" value="net.sourceforge.pmd.util.StringUtil.escapeJava">
        <fileset dir="${target-package-dir}" />
    </replace>
</target>
<!-- Textual patches applied to the generated parser class (parser-file),
     plus one patch to the generated tree constants interface. -->
<target name="cleanup-parser">

    <!-- Token instances are obtained from the token document instead of
         being constructed directly -->
    <replace value="token_source.input_stream.getTokenDocument().open()" token="new Token()">
        <fileset file="${parser-file}" />
    </replace>

    <!-- Pass a token as second argument when a node scope is opened ... -->
    <replaceregexp flags="g">
        <file name="${parser-file}" />
        <regexp pattern="jjtree.openNodeScope\((jjtn.*?)\);" />
        <substitution expression="jjtree.openNodeScope(\1, getToken(1));" />
    </replaceregexp>

    <!-- ... and when it is closed -->
    <replaceregexp flags="g">
        <file name="${parser-file}" />
        <regexp pattern="jjtree.closeNodeScope\((jjtn.*?)\);" />
        <substitution expression="jjtree.closeNodeScope(\1, getToken(0));" />
    </replaceregexp>

    <!-- The tree builder is generic now -->
    <replaceregexp flags="g">
        <fileset file="${parser-file}" />
        <regexp pattern="\bJJT${parser-name}State\b" />
        <substitution expression="${ast-impl-package}.JjtreeBuilder&lt;${base-class-name}&gt;" />
    </replaceregexp>

    <!-- Drop the tokenImage argument of the ParseException constructor call -->
    <replaceregexp flags="g">
        <fileset file="${parser-file}" />
        <regexp pattern="new ParseException\(token, exptokseq, tokenImage\);" />
        <substitution expression="new ParseException(token, exptokseq);" />
    </replaceregexp>

    <!-- The tree constants interface becomes package-private -->
    <replaceregexp>
        <fileset file="${target-package-dir}/${parser-name}TreeConstants.java" />
        <regexp pattern="public interface" />
        <substitution expression="interface" />
    </replaceregexp>
</target>
<!-- Textual patches applied to the generated token manager (tokenmgr-file).
     The steps are order-dependent. -->
<target name="cleanup-token-manager">

    <!-- The token manager becomes package-private and extends our base class -->
    <replaceregexp>
        <regexp pattern='(public )?class ${tokenmgr-name}' />
        <substitution expression='class ${tokenmgr-name} extends ${base-tokenmgr}' />
        <file name="${tokenmgr-file}" />
    </replaceregexp>

    <!-- This is a programming error and should be caught in tests -->
    <replaceregexp>
        <regexp pattern='throw new TokenMgrError\("Error: Ignoring invalid lexical state.*?\);' />
        <substitution expression='throw new IllegalArgumentException("Invalid lexical state " + lexState);' />
        <file name="${tokenmgr-file}" />
    </replaceregexp>

    <!-- Useless argument, also replace lex state ID with its name -->
    <replaceregexp>
        <regexp pattern='curLexState, error_line, error_column, error_after, curChar, TokenMgrError.LEXICAL_ERROR\)' />
        <substitution expression='lexStateNames[curLexState], error_line, error_column, error_after, curChar)' />
        <file name="${tokenmgr-file}" />
    </replaceregexp>

    <!-- Patch token creation routine, delegates to the token document.
         Everything from the method header up to the curLexState field is replaced. -->
    <replaceregexp flags="s">
        <file name="${tokenmgr-file}" />
        <regexp pattern="protected Token jjFillToken.*?(?=int curLexState = )" />
        <substitution expression="protected Token jjFillToken() {return input_stream.getTokenDocument().createToken(jjmatchedKind, input_stream, jjstrLiteralImages[jjmatchedKind]);}" />
    </replaceregexp>

    <!-- Renamed CharStream methods -->
    <replaceregexp flags="g">
        <file name="${tokenmgr-file}" />
        <regexp pattern="image.append\(input_stream.GetSuffix\(" />
        <substitution expression="input_stream.appendSuffix(image,(" />
    </replaceregexp>

    <replaceregexp flags="g">
        <file name="${tokenmgr-file}" />
        <regexp pattern="input_stream.GetImage" />
        <substitution expression="input_stream.getTokenImage" />
    </replaceregexp>

    <replaceregexp flags="g">
        <file name="${tokenmgr-file}" />
        <regexp pattern="input_stream.BeginToken" />
        <substitution expression="input_stream.markTokenStart" />
    </replaceregexp>

    <!-- This is used to allow for tokens to be immutable. The lexical actions
         return the new token instead of mutating it.
         The substitution is written on one line: line breaks inside an XML
         attribute value are turned into spaces by the parser anyway. -->
    <replaceregexp flags="sg">
        <file name="${tokenmgr-file}" />
        <regexp pattern="void ((Token|Skip)LexicalActions\(Token matchedToken\))\R\{(.*?)}\R(?=(private )?void)" />
        <substitution expression="Token \1 { \3 return matchedToken; }" />
    </replaceregexp>

    <!-- Update call sites for the previous routines.
         The "g" flag is required: without it only the first call in the file
         is rewritten, and any later call would silently discard the token
         returned by the lexical action. -->
    <replaceregexp flags="g">
        <file name="${tokenmgr-file}" />
        <regexp pattern="(Token|Skip)LexicalActions\(matchedToken\);" />
        <substitution expression="matchedToken = \0" />
    </replaceregexp>

    <!-- Fix end column being now exclusive -->
    <!-- JavaCC assumes it's inclusive, uses it for character positions of errors -->
    <!-- This is also used in debug mode -->
    <replaceregexp flags="sg">
        <file name="${tokenmgr-file}" />
        <regexp pattern="input_stream.getEndColumn\(\)" />
        <substitution expression="(input_stream.getEndColumn() - 1)" />
    </replaceregexp>
</target>
<!-- Turns the generated constants interface into a final utility class
     (token-constants-file) and removes the interface from every implements
     clause of the generated sources. The steps are order-dependent.

     Several substitutions below are written on a single line: line breaks
     inside an XML attribute value are turned into spaces by the parser, so
     real line breaks are inserted with ${line.separator} where wanted. -->
<target name="constants-files">

    <!-- Remove the constants interface from implements clauses:
         first position, later position, then sole interface -->
    <replaceregexp flags="g">
        <regexp pattern="implements ${constants-itf-name}," />
        <substitution expression="implements" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <replaceregexp flags="g">
        <regexp pattern=", ${constants-itf-name}\b" />
        <substitution expression="" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <replaceregexp flags="g">
        <regexp pattern="implements ${constants-itf-name}\b" />
        <substitution expression="" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <!-- The constants are no longer inherited, so the token manager and the
         parser import them statically instead -->
    <replaceregexp>
        <regexp pattern="package ${lang-ast-package};" />
        <substitution expression="\0 import static ${lang-ast-package}.${token-constants-name}.*;" />
        <fileset file="${tokenmgr-file}" />
        <fileset file="${parser-file}" />
    </replaceregexp>

    <!-- Create constants file -->
    <move file="${constants-itf-file}" tofile="${token-constants-file}" />

    <!-- Interface header becomes a final class with a private constructor -->
    <replaceregexp>
        <regexp pattern="(public )?interface ${constants-itf-name} \{" />
        <substitution expression="/** Token kinds ({@link ${ast-impl-package}.JavaccToken#kind}) for this language. */${line.separator} public final class ${token-constants-name} \{${line.separator} private ${token-constants-name}() { /* Utility class */ }${line.separator} " />
        <fileset file="${token-constants-file}" />
    </replaceregexp>

    <!-- Interface fields were implicitly public static final; in a class the
         modifiers must be spelled out. They take the place of the generated
         one-line doc comments. -->
    <replaceregexp flags="g">
        <regexp pattern="/\*\* RegularExpression Id. \*/\R" />
        <substitution expression="public static final " />
        <fileset file="${token-constants-file}" />
    </replaceregexp>

    <replaceregexp flags="s">
        <regexp pattern="/\*\* End of File. \*/\R" />
        <substitution expression="public static final " />
        <fileset file="${token-constants-file}" />
    </replaceregexp>

    <!-- Lexical states are kept package-private -->
    <replaceregexp flags="g">
        <regexp pattern="/\*\* Lexical state. \*/\R" />
        <substitution expression="static final " />
        <fileset file="${token-constants-file}" />
    </replaceregexp>

    <!-- Insert helper methods in front of the token image array. The value
         ends with the modifiers of that array, which follows the replaced
         comment in the generated file. The %%%...%%% placeholders are
         filled in by the last two steps of this target. -->
    <replace>
        <replacetoken>/** Literal token values. */</replacetoken>
        <replacevalue><![CDATA[
  /** Returns a string describing the given token kind.
   * Returns null if the kind is unknown.
   *
   * @param kind Kind of token
   *
   * @return A string describing the given kind
   */
  public static @org.checkerframework.checker.nullness.qual.Nullable
  String describe(int kind) {
    return kind < 0 || kind >= tokenImage.length
           ? null
           : tokenImage[kind];
  }

  /** Returns a new token manager for this language. The CharStream
   * should be configured with the correct language-specific escaping
   * and token document. This is not a published API, it's intended to
   * be used as a basis for a CPD Tokenizer.
   */
  @net.sourceforge.pmd.annotation.InternalApi
  public static net.sourceforge.pmd.lang.TokenManager<%%%API_PACK%%%.impl.javacc.JavaccToken> newTokenManager(%%%API_PACK%%%.impl.javacc.CharStream cs) {
    return new %%%TOKEN_MGR_NAME%%%(cs);
  }

  private static final
]]> </replacevalue>
        <fileset file="${token-constants-file}" />
    </replace>

    <!-- Append a public read-only view after the end of the array initializer -->
    <replace>
        <replacetoken>};</replacetoken>
        <replacevalue><![CDATA[
  };

  /** Names of the tokens, each index corresponds to a kind. See also {@link #describe(int)}. */
  public static final java.util.List<String> TOKEN_NAMES = java.util.Collections.unmodifiableList(java.util.Arrays.asList(tokenImage));
]]> </replacevalue>
        <fileset file="${token-constants-file}" />
    </replace>

    <!-- Fill in the placeholders of the inserted code -->
    <replaceregexp>
        <regexp pattern="%%%TOKEN_MGR_NAME%%%" />
        <substitution expression="${tokenmgr-name}" />
        <fileset file="${token-constants-file}" />
    </replaceregexp>

    <replaceregexp flags="g">
        <regexp pattern="%%%API_PACK%%%" />
        <substitution expression="${ast-api-package}" />
        <fileset file="${token-constants-file}" />
    </replaceregexp>
</target>
<!-- Textual patches for the generated node classes. The first two rewrites
     apply to every file of the target package directory, the remaining ones
     only to files whose name starts with ast-prefix. -->
<target name="cleanup-nodes">

    <!-- Qualify ParseException with the AST API package -->
    <replaceregexp flags="g">
        <regexp pattern="\bParseException\b" />
        <substitution expression="${ast-api-package}.ParseException" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <!-- Nodes extend the language-specific base class -->
    <replaceregexp flags="g">
        <regexp pattern="extends SimpleNode\b" />
        <substitution expression="extends ${base-class-name}" />
        <fileset dir="${target-package-dir}" />
    </replaceregexp>

    <!-- Remove constructor with parser -->
    <replaceregexp flags="s">
        <regexp pattern="public \w+\(${parser-name}.*?}" />
        <substitution expression="" />
        <fileset dir="${target-package-dir}">
            <include name="${ast-prefix}*" />
        </fileset>
    </replaceregexp>

    <!-- Make constructor package-private -->
    <replaceregexp>
        <regexp pattern="public (\w+\(int)" />
        <substitution expression="\1" />
        <fileset dir="${target-package-dir}">
            <include name="${ast-prefix}*" />
        </fileset>
    </replaceregexp>

    <!-- Make class public. The lookbehind skips a class keyword that is
         already preceded by "public"; only the first match per file is
         rewritten. -->
    <replaceregexp>
        <regexp pattern="(?&lt;!public(\R| ))class" />
        <substitution expression="public class" />
        <fileset dir="${target-package-dir}">
            <include name="${ast-prefix}*" />
        </fileset>
    </replaceregexp>

    <!-- Drop the generated doc comment of the accept method -->
    <replaceregexp flags="g">
        <regexp pattern="/\*\* Accept the visitor. \*\*/" />
        <substitution expression="" />
        <fileset dir="${target-package-dir}">
            <include name="${ast-prefix}*" />
        </fileset>
    </replaceregexp>
</target>
<!-- Turns the visitor interface generated by JJTree into a generic visitor
     interface with default methods, and rewrites the accept method of the
     node classes accordingly. Skipped when jjtreeBuildNotRequired is set. -->
<target name="default-visitor" depends="jjtree" unless="jjtreeBuildNotRequired">

    <!-- Rename the file to the name we actually use -->
    <move file="${target-package-dir}/${gen-visitor-name}.java" tofile="${generic-visitor-interface-file}" />

    <!-- The filters are listed in the order they are meant to apply: the
         later, more general tokens would otherwise also match the text
         targeted by the earlier ones. -->
    <replace file="${generic-visitor-interface-file}">
        <replacefilter token="${gen-visitor-name}"
                       value="${generic-visitor-interface-name}&lt;P, R&gt; extends ${ast-api-package}.AstVisitor&lt;P, R&gt;" />
        <replacefilter token="SimpleNode" value="${node-name}" />
        <!-- Root method, eg visitJavaNode -->
        <replacefilter token="Object visit(${node-name} node, Object data);"
                       value="default R visit${lang-name-camelcase}Node(${node-name} node, P data) { return visitNode(node, data); }" />
        <replacefilter token="public Object visit(" value="default R visit(" />
        <!-- Every remaining visit method delegates to the root method -->
        <replacefilter token="Object data);"
                       value="P data) { return visit${lang-name-camelcase}Node(node, data); }" />
    </replace>

    <!-- Accept method of the node classes -->
    <replace>
        <replacefilter token="public Object jjtAccept(${gen-visitor-name} visitor, Object data)"
                       value="@Override protected &lt;P, R&gt; R accept${generic-visitor-interface-name}(${generic-visitor-interface-name}&lt;? super P, ? extends R&gt; visitor, P data)" />
        <fileset dir="${target-package-dir}">
            <include name="${ast-prefix}*" />
        </fileset>
    </replace>
</target>
</project>