blob: 2dbf35c62270269459668037efcc22c1927aa1f1 [file] [log] [blame]
// Copyright (C) 2009 Google Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package prettify.lang;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import java.util.regex.Pattern;
import prettify.Lang;
import prettify.Prettify;
/**
* Registers a language handler for Haskell.
*
*
* To use, include prettify.js and this file in your HTML page.
* Then put your code in an HTML tag like
* <pre class="prettyprint lang-hs">(my lisp code)</pre>
* The lang-cl class identifies the language as common lisp.
* This file supports the following language extensions:
* lang-cl - Common Lisp
* lang-el - Emacs Lisp
* lang-lisp - Lisp
* lang-scm - Scheme
*
*
* I used http://www.informatik.uni-freiburg.de/~thiemann/haskell/haskell98-report-html/syntax-iso.html
* as the basis, but ignore the way the ncomment production nests since this
* makes the lexical grammar irregular. It might be possible to support
* ncomments using the lookbehind filter.
*
*
* @author mikesamuel@gmail.com
*/
public class LangHs extends Lang {
public LangHs() {
List<List<Object>> _shortcutStylePatterns = new ArrayList<List<Object>>();
List<List<Object>> _fallthroughStylePatterns = new ArrayList<List<Object>>();
// Whitespace
// whitechar -> newline | vertab | space | tab | uniWhite
// newline -> return linefeed | return | linefeed | formfeed
_shortcutStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_PLAIN, Pattern.compile("^[\\t\\n\\x0B\\x0C\\r ]+"), null, "\t\n" + Character.toString((char) 0x0B) + Character.toString((char) 0x0C) + "\r "}));
// Single line double and single-quoted strings.
// char -> ' (graphic<' | \> | space | escape<\&>) '
// string -> " {graphic<" | \> | space | escape | gap}"
// escape -> \ ( charesc | ascii | decimal | o octal
// | x hexadecimal )
// charesc -> a | b | f | n | r | t | v | \ | " | ' | &
_shortcutStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_STRING, Pattern.compile("^\\\"(?:[^\\\"\\\\\\n\\x0C\\r]|\\\\[\\s\\S])*(?:\\\"|$)"), null, "\""}));
_shortcutStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_STRING, Pattern.compile("^\\'(?:[^\\'\\\\\\n\\x0C\\r]|\\\\[^&])\\'?"), null, "'"}));
// decimal -> digit{digit}
// octal -> octit{octit}
// hexadecimal -> hexit{hexit}
// integer -> decimal
// | 0o octal | 0O octal
// | 0x hexadecimal | 0X hexadecimal
// float -> decimal . decimal [exponent]
// | decimal exponent
// exponent -> (e | E) [+ | -] decimal
_shortcutStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_LITERAL, Pattern.compile("^(?:0o[0-7]+|0x[\\da-f]+|\\d+(?:\\.\\d+)?(?:e[+\\-]?\\d+)?)", Pattern.CASE_INSENSITIVE), null, "0123456789"}));
// Haskell does not have a regular lexical grammar due to the nested
// ncomment.
// comment -> dashes [ any<symbol> {any}] newline
// ncomment -> opencom ANYseq {ncomment ANYseq}closecom
// dashes -> '--' {'-'}
// opencom -> '{-'
// closecom -> '-}'
_fallthroughStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_COMMENT, Pattern.compile("^(?:(?:--+(?:[^\\r\\n\\x0C]*)?)|(?:\\{-(?:[^-]|-+[^-\\}])*-\\}))")}));
// reservedid -> case | class | data | default | deriving | do
// | else | if | import | in | infix | infixl | infixr
// | instance | let | module | newtype | of | then
// | type | where | _
_fallthroughStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_KEYWORD, Pattern.compile("^(?:case|class|data|default|deriving|do|else|if|import|in|infix|infixl|infixr|instance|let|module|newtype|of|then|type|where|_)(?=[^a-zA-Z0-9\\']|$)"), null}));
// qvarid -> [ modid . ] varid
// qconid -> [ modid . ] conid
// varid -> (small {small | large | digit | ' })<reservedid>
// conid -> large {small | large | digit | ' }
// modid -> conid
// small -> ascSmall | uniSmall | _
// ascSmall -> a | b | ... | z
// uniSmall -> any Unicode lowercase letter
// large -> ascLarge | uniLarge
// ascLarge -> A | B | ... | Z
// uniLarge -> any uppercase or titlecase Unicode letter
_fallthroughStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_PLAIN, Pattern.compile("^(?:[A-Z][\\w\\']*\\.)*[a-zA-Z][\\w\\']*")}));
// matches the symbol production
_fallthroughStylePatterns.add(Arrays.asList(new Object[]{Prettify.PR_PUNCTUATION, Pattern.compile("^[^\\t\\n\\x0B\\x0C\\r a-zA-Z0-9\\'\\\"]+")}));
setShortcutStylePatterns(_shortcutStylePatterns);
setFallthroughStylePatterns(_fallthroughStylePatterns);
}
public static List<String> getFileExtensions() {
return Arrays.asList(new String[]{"hs"});
}
}