Coccinelle release-1.0.0-rc11
[bpt/coccinelle.git] / parsing_cocci / lexer_script.mll
1 (*
2 * Copyright 2012, INRIA
3 * Julia Lawall, Gilles Muller
4 * Copyright 2010-2011, INRIA, University of Copenhagen
5 * Julia Lawall, Rene Rydhof Hansen, Gilles Muller, Nicolas Palix
6 * Copyright 2005-2009, Ecole des Mines de Nantes, University of Copenhagen
7 * Yoann Padioleau, Julia Lawall, Rene Rydhof Hansen, Henrik Stuart, Gilles Muller, Nicolas Palix
8 * This file is part of Coccinelle.
9 *
10 * Coccinelle is free software: you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation, according to version 2 of the License.
13 *
14 * Coccinelle is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
18 *
19 * You should have received a copy of the GNU General Public License
20 * along with Coccinelle. If not, see <http://www.gnu.org/licenses/>.
21 *
22 * The authors reserve the right to distribute this or future versions of
23 * Coccinelle under other licenses.
24 *)
25
26
{
(* Prelude copied into the generated lexer ahead of the rules. *)
open Parser_cocci_menhir
module D = Data
module Ast = Ast_cocci

(* Raised by the token rule when it meets input it cannot classify. *)
exception Lexical of string

(* Text matched by the rule that is currently firing. *)
let tok lexbuf = Lexing.lexeme lexbuf

(* Bump the line counter owned by Lexer_cocci by one; the argument is
   ignored. *)
let inc_line _ = incr Lexer_cocci.line
}
35 (* ---------------------------------------------------------------------- *)
36 (* tokens *)
37
(* A single octal digit. *)
let oct = ['0'-'7']
(* A single hexadecimal digit, in either case. *)
let hex = ['0'-'9' 'A'-'F' 'a'-'f']

(* A non-empty run of ordinary characters: anything other than a single or
   double quote, an at sign, a slash, or one of the four characters that the
   token rule counts as a line break (newline, carriage return, and the
   characters with decimal codes 11 and 12, i.e. vertical tab and form
   feed). *)
let myrule = [^ '\'' '"' '@' '/' '\n' '\r' '\011' '\012']+
42
(* Main rule for the body of a script.  Almost everything is handed back
   verbatim as TScriptData; only at signs, SmPL comments and end of input
   are treated specially.  ocamllex picks the longest match, so the
   two-character patterns win over their one-character prefixes, and the
   catch-all must stay last because ties go to the earliest rule. *)
rule token = parse
  | myrule
      { let text = tok lexbuf in
        TScriptData text }
  | ['\n' '\r' '\011' '\012']
      { (* each of these characters counts as one line *)
        let text = tok lexbuf in
        inc_line ();
        TScriptData text }
  | "@@"
      { TArobArob }
  | '@'
      { TArob }
  | '/'
      { TScriptData (tok lexbuf) }
  | "//" [^ '\n']*
      { (* SmPL comment: drop it and carry on with the next token *)
        token lexbuf }
  | '"'
      { (* double-quoted literal: read up to the closing quote, then put
           the quotes back around the contents *)
        let contents = string lexbuf in
        TScriptData (Printf.sprintf "\"%s\"" contents) }
  | '\''
      { (* single-quoted literal, handled the same way *)
        let contents = cstring lexbuf in
        TScriptData (Printf.sprintf "'%s'" contents) }
  | eof
      { EOF }
  | _
      { let offending = tok lexbuf in
        raise (Lexical ("unrecognised symbol, in token rule:" ^ offending)) }
54
(* Contents of a double-quoted literal, entered just after the opening
   quote.  Returns the text up to, but not including, the closing quote;
   the caller puts the quotes back.

   A backslash together with the character that follows it is copied
   through unchanged, so an escaped quote does not end the literal.
   ocamllex prefers the longest match, which is why the two-character
   escape pattern wins over the single-character one.

   Raises Lexical if the input ends before the closing quote, rather than
   letting the generated lexer fail with its generic empty-token error. *)
and string = parse
  | '"'               { "" }
  | ('\\' _) as esc   { esc ^ string lexbuf }
  | (_ as x)          { (String.make 1 x) ^ string lexbuf }
  | eof
      { raise (Lexical "unterminated double-quoted string in script code") }
59
(* Contents of a single-quoted literal, entered just after the opening
   quote.  Returns the text up to, but not including, the closing quote;
   the caller puts the quotes back.

   A backslash together with the character that follows it is copied
   through unchanged, so an escaped quote does not end the literal.
   ocamllex prefers the longest match, which is why the two-character
   escape pattern wins over the single-character one.

   Raises Lexical if the input ends before the closing quote, rather than
   letting the generated lexer fail with its generic empty-token error. *)
and cstring = parse
  | '\''              { "" }
  | ('\\' _) as esc   { esc ^ cstring lexbuf }
  | (_ as x)          { (String.make 1 x) ^ cstring lexbuf }
  | eof
      { raise (Lexical "unterminated single-quoted string in script code") }