Coccinelle release 1.0.0-rc4
[bpt/coccinelle.git] / parsing_cocci / lexer_script.mll
1 (*
2 * Copyright 2010, INRIA, University of Copenhagen
3 * Julia Lawall, Rene Rydhof Hansen, Gilles Muller, Nicolas Palix
4 * Copyright 2005-2009, Ecole des Mines de Nantes, University of Copenhagen
5 * Yoann Padioleau, Julia Lawall, Rene Rydhof Hansen, Henrik Stuart, Gilles Muller, Nicolas Palix
6 * This file is part of Coccinelle.
7 *
8 * Coccinelle is free software: you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation, according to version 2 of the License.
11 *
12 * Coccinelle is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with Coccinelle. If not, see <http://www.gnu.org/licenses/>.
19 *
20 * The authors reserve the right to distribute this or future versions of
21 * Coccinelle under other licenses.
22 *)
23
24
{
(* Prelude copied verbatim into the generated lexer.  The token
   constructors used by the rules below are presumably supplied by the
   opened parser module -- confirm against Parser_cocci_menhir. *)
open Parser_cocci_menhir
module D = Data
module Ast = Ast_cocci

(* Signals a lexical error; the payload is a human-readable message. *)
exception Lexical of string

(* Text matched by the most recent lexer action on [lexbuf]. *)
let tok lexbuf = Lexing.lexeme lexbuf

(* Advance the line counter shared with Lexer_cocci by one; the argument
   is ignored. *)
let inc_line _ = incr Lexer_cocci.line
}
33 (* ---------------------------------------------------------------------- *)
34 (* tokens *)
35
(* One octal digit. *)
let oct = ['0'-'7']
(* One hexadecimal digit, in either case. *)
let hex = ['0'-'9' 'A'-'F' 'a'-'f']

(* A non-empty run of characters that need no special treatment: anything
   except the two quote characters, '@', '/', and the line-break characters
   (codes 10, 13, 11 and 12). *)
let myrule = [^ '\'' '"' '@' '/' '\n' '\r' '\011' '\012']+
40
(* Main entry point.  Script text is handed back mostly verbatim as
   TScriptData chunks; "@" and "@@" get their own tokens, "//" comments are
   dropped, and quoted literals are read by the [string] / [cstring] rules
   and re-wrapped in their quotes. *)
rule token = parse
  | myrule
      { let text = tok lexbuf in
        TScriptData text }
  | ['\n' '\r' '\011' '\012']
      { (* every line-break character bumps the shared line counter *)
        let () = inc_line () in
        TScriptData (tok lexbuf) }
  | "@@"
      { TArobArob }
  | "@"
      { TArob }
  | "/"
      { (* a lone slash is ordinary script text *)
        TScriptData (tok lexbuf) }
  | "//" [^ '\n']*
      { (* skip SmPL comments; the terminating newline is left for the
           next call so that it is still counted *)
        token lexbuf }
  | '"'
      { let body = string lexbuf in
        TScriptData (Printf.sprintf "\"%s\"" body) }
  | "'"
      { let body = cstring lexbuf in
        TScriptData (Printf.sprintf "'%s'" body) }
  | eof
      { EOF }
  | _
      { let msg = "unrecognised symbol, in token rule:" ^ tok lexbuf in
        raise (Lexical msg) }
52
(* Body of a double-quoted literal; the opening quote has already been
   consumed by the caller.  Returns the text up to, but not including, the
   closing quote, with escape sequences kept verbatim.
   - A backslash followed by any character is taken as a unit, so an
     escaped quote does not end the literal.
   - Line-break characters inside the literal bump the line counter, using
     the same character set as the [token] rule.
   - Reaching end of input before the closing quote raises [Lexical]. *)
and string = parse
  | '"'
      { "" }
  | ('\\' ['\n' '\r' '\011' '\012']) as esc
      { (* backslash followed by a line break: still a new line *)
        inc_line ();
        esc ^ string lexbuf }
  | ('\\' _) as esc
      { esc ^ string lexbuf }
  | ['\n' '\r' '\011' '\012'] as nl
      { inc_line ();
        (String.make 1 nl) ^ string lexbuf }
  | eof
      { raise (Lexical "unterminated double-quoted string in script code") }
  | (_ as x)
      { (String.make 1 x) ^ string lexbuf }
57
(* Body of a single-quoted literal; the opening quote has already been
   consumed by the caller.  Returns the text up to, but not including, the
   closing quote, with escape sequences kept verbatim.
   - A backslash followed by any character is taken as a unit, so an
     escaped quote does not end the literal.
   - Line-break characters inside the literal bump the line counter, using
     the same character set as the [token] rule.
   - Reaching end of input before the closing quote raises [Lexical]. *)
and cstring = parse
  | "'"
      { "" }
  | ('\\' ['\n' '\r' '\011' '\012']) as esc
      { (* backslash followed by a line break: still a new line *)
        inc_line ();
        esc ^ cstring lexbuf }
  | ('\\' _) as esc
      { esc ^ cstring lexbuf }
  | ['\n' '\r' '\011' '\012'] as nl
      { inc_line ();
        (String.make 1 nl) ^ cstring lexbuf }
  | eof
      { raise (Lexical "unterminated single-quoted string in script code") }
  | (_ as x)
      { (String.make 1 x) ^ cstring lexbuf }