/* * [BatCharCategory.java] * * Summary: top level enum to define the categories of character for the BatTokenizer. * * Copyright: (c) 2004-2017 Roedy Green, Canadian Mind Products, http://mindprod.com * * Licence: This software may be copied and used freely for any purpose but military. * http://mindprod.com/contact/nonmil.html * * Requires: JDK 1.8+ * * Created with: JetBrains IntelliJ IDEA IDE http://www.jetbrains.com/idea/ * * Version History: * 3.1 2009-04-12 shorter style names, improved highlighting. */ package com.mindprod.jprep; /** * top level enum to define the categories of character for the BatTokenizer. * * @author Roedy Green, Canadian Mind Products * @version 3.1 2009-04-12 shorter style names, improved highlighting. * @since 2004-05-15 */ @SuppressWarnings( { "EnumeratedConstantNamingConvention" } ) public enum BatCharCategory { /** * colon, behaves differently in different contexts: :: - comment start :done - label C:\myfile.txt echo : this * is fine */ COLON, /** * End of line character */ EOL, /** * ignore control chars */ IGNORE, /** * high ascii ` and chars not used in bat language */ OTHER, /** * chars used in identifiers */ PLAIN, /** * punctuation */ PUNCTUATION, /** * " */ QUOTE, /** * needs to go in its own token because it is rendered specially. */ SEPARATOR, /** * space */ SPACE; /** * Categorise one character * * @param theChar character to categorise * * @return category code, e.g. PLAIN QUOTE */ static BatCharCategory categorise( char theChar ) { if ( 'a' <= theChar && theChar <= 'z' ) { return PLAIN; } if ( 'A' <= theChar && theChar <= 'Z' ) { return PLAIN; } if ( '0' <= theChar && theChar <= '9' ) { return PLAIN; } switch ( theChar ) { case '$': case '_': return PLAIN; case ' ': case '\t': case 0xa0://   return SPACE; case '\n': return EOL; case '\"': return QUOTE; case ':': return COLON; case ';': case '\\': case '/': return SEPARATOR; case '!': case '#': case '%': case '&': case '(': case ')': case '*': case '+': case ',': case '-': case '.': case '<': case '=': case '>': case '?': case '@': case '[': case ']': case '^': case '`': case '{': case '|': case '}': case '~': return PUNCTUATION; case '\r': case 127: case 0xfeff: /* bom */ case 0xfffd: /* replaced bom */ return IGNORE; default: if ( 0 <= theChar && theChar <= 31 ) { return IGNORE; } else { return OTHER; } } // end switch } // end categorise } // end BatCharCategory