chiark / gitweb /
New feature: messages with keyword arguments!
[sod] / src / module-parse.lisp
CommitLineData
bf090e02
MW
1;;; -*-lisp-*-
2;;;
3;;; Top-level parser for module syntax
4;;;
5;;; (c) 2010 Straylight/Edgeware
6;;;
7
8;;;----- Licensing notice ---------------------------------------------------
9;;;
e0808c47 10;;; This file is part of the Sensible Object Design, an object system for C.
bf090e02
MW
11;;;
12;;; SOD is free software; you can redistribute it and/or modify
13;;; it under the terms of the GNU General Public License as published by
14;;; the Free Software Foundation; either version 2 of the License, or
15;;; (at your option) any later version.
16;;;
17;;; SOD is distributed in the hope that it will be useful,
18;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
19;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20;;; GNU General Public License for more details.
21;;;
22;;; You should have received a copy of the GNU General Public License
23;;; along with SOD; if not, write to the Free Software Foundation,
24;;; Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
25
26(in-package #:sod)
27
28;;;--------------------------------------------------------------------------
29;;; Toplevel syntax.
30
bf090e02
MW
31;;; Type names.
32
048d0b2d
MW
(define-pluggable-parser module typename (scanner pset)
  ;; Module item declaring identifiers as type names:
  ;;
  ;;   `typename' id ( `,' id )* `;'
  ;;
  ;; Each identifier is looked up in `*module-type-map*'.  A name which is
  ;; already there is reported through `cerror*'; any other name is added
  ;; to `*module*' as a fresh `type-item'.  PSET is not used.
  (declare (ignore pset))
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (and "typename"
                (skip-many (:min 1)
                  (seq ((type-name :id))
                    (cond ((gethash type-name *module-type-map*)
                           (cerror* "Type `~A' already defined" type-name))
                          (t
                           (add-to-module *module*
                                          (make-instance 'type-item
                                                         :name type-name)))))
                  #\,)
                #\;))))
47
48;;; Fragments.
49
(define-pluggable-parser module code (scanner pset)
  ;; `code' id `:' item-name [constraints] `{' c-fragment `}'
  ;;
  ;; constraints ::= `[' constraint-list `]'
  ;; constraint-list ::= constraint ( `,' constraint )*
  ;; constraint ::= item-name+
  ;; item-name ::= id | `(' id+ `)'
  ;;
  ;; The parsed pieces are collected into a `code-fragment-item', which is
  ;; added to `*module*'.  Identifiers are passed through `frob-identifier'
  ;; and interned in the `keyword' package, so an item name is either a
  ;; single keyword or a list of keywords.  PSET is not used.
  (declare (ignore pset))
  (with-parser-context (token-scanner-context :scanner scanner)
    (labels ((parse-kw ()
               ;; A single identifier, converted to a keyword.
               (parse (seq ((id :id))
                        (intern (frob-identifier id) 'keyword))))
             (parse-item-name ()
               ;; Either a lone keyword, or a parenthesized nonempty list of
               ;; them.
               (parse (or (parse-kw)
                          (seq (#\(
                                (keywords (list (:min 1) (parse-kw)))
                                #\))
                            keywords)))))
      (parse (seq ("code"
                   (reason (parse-kw))
                   #\:
                   (name (parse-item-name))
                   (constraints (? (seq (#\[
                                         (constraint-list
                                          (list (:min 1)
                                            (list (:min 1)
                                              (parse-item-name))
                                            #\,))
                                         #\])
                                     constraint-list)))
                   (fragment (parse-delimited-fragment scanner #\{ #\})))
               (add-to-module *module*
                              (make-instance 'code-fragment-item
                                             :name name
                                             :reason reason
                                             :constraints constraints
                                             :fragment fragment)))))))
bf090e02
MW
83
84;;; External files.
85
9ec578d9
MW
(export 'read-module)
(defun read-module (pathname &key (truename nil truep) location)
  "Read and parse the module file named by PATHNAME, returning the module.

   This is the main entry point for parsing module files.  PATHNAME is
   first merged against a default file type of `SOD'.  If the caller already
   knows the file's TRUENAME (e.g., because `probe-file' supplied it) then
   passing it in avoids a second lookup; otherwise it is found by calling
   `truename' on the merged pathname.

   The LOCATION is the thing which wanted the module imported -- usually a
   `file-location' object, though it might be anything other than `t' which
   can be printed in the event of circular imports."

  (let* ((pathname (merge-pathnames pathname
                                    (make-pathname :type "SOD"
                                                   :case :common)))
         (truename (if truep truename (truename pathname))))
    (define-module (pathname :location location :truename truename)
      (with-open-file (input pathname :direction :input)
        ;; Parse with a private copy of the readtable in force.
        (let* ((*readtable* (copy-readtable))
               (chars (make-instance 'charbuf-scanner :stream input))
               (scanner (make-instance 'sod-token-scanner
                                       :char-scanner chars)))
          (with-default-error-location (scanner)
            (with-parser-context (token-scanner-context :scanner scanner)
              ;; A module is a sequence of items, each preceded by a
              ;; property set and handled by the `module' pluggable parsers.
              (parse (skip-many ()
                       (seq ((pset (parse-property-set scanner))
                             (nil (error ()
                                    (plug module scanner pset))))
                         (check-unused-properties pset)))))))))))
115
(define-pluggable-parser module test (scanner pset)
  ;; `demo' string `;'
  ;;
  ;; Print the string literal to standard output on a `;; DEMO' line.  PSET
  ;; is not used.
  (declare (ignore pset))
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (seq ("demo" (text :string) #\;)
             (format t ";; DEMO ~S~%" text)))))
122
048d0b2d
MW
(define-pluggable-parser module file (scanner pset)
  ;; `import' string `;'
  ;; `load' string `;'
  ;;
  ;; In both cases the string names a file, which is merged against a
  ;; default file type (`SOD' for `import', `LISP' for `load') and handed to
  ;; `find-file' together with a function to call on the result.  PSET is
  ;; not used.
  (declare (ignore pset))
  (labels ((find-typed-file (name type what thunk)
             ;; Apply the default file TYPE to NAME and pass the result to
             ;; `find-file', along with the description WHAT and THUNK.
             (let ((defaults (make-pathname :type type :case :common)))
               (find-file scanner (merge-pathnames name defaults)
                          what thunk)))
           (import-found-module (path true)
             ;; Read the module at PATH, import it, and record it among the
             ;; dependencies of `*module*'.  A `file-error' is reported via
             ;; `cerror*' rather than propagated.
             (handler-case
                 (let ((module (read-module path :truename true)))
                   (unless (null module)
                     (module-import module)
                     (pushnew module (module-dependencies *module*))))
               (file-error (condition)
                 (cerror* "Error reading module ~S: ~A" path condition))))
           (load-found-file (path true)
             ;; Quietly `load' the file TRUE; any `error' is reported via
             ;; `cerror*' rather than propagated.
             (handler-case (load true :verbose nil :print nil)
               (error (condition)
                 (cerror* "Error loading Lisp file ~S: ~A"
                          path condition)))))
    (with-parser-context (token-scanner-context :scanner scanner)
      (parse (or (seq ("import" (name :string) #\;)
                   (find-typed-file name "SOD" "module"
                                    #'import-found-module))
                 (seq ("load" (name :string) #\;)
                   (find-typed-file name "LISP" "Lisp file"
                                    #'load-found-file)))))))
157
01e3faf9
MW
158;;; Setting properties.
159
(define-pluggable-parser module set (scanner pset)
  ;; `set' property-list `;'
  ;;
  ;; Properties are stored in the property set of `*module*'.  If a PSET was
  ;; supplied, each of its properties is first copied across (name, value,
  ;; type and location) and marked as seen.  The comma-separated properties
  ;; following the keyword are then handed to `parse-property' with the
  ;; module's property set; after a bad property, the parser skips ahead to
  ;; the next `,' or `;'.
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (and "set"
                (lisp (let ((target (module-pset *module*)))
                        (unless (null pset)
                          (pset-map (lambda (property)
                                      (add-property
                                       target
                                       (p-name property)
                                       (p-value property)
                                       :type (p-type property)
                                       :location (p-location property))
                                      (setf (p-seenp property) t))
                                    pset))
                        (parse (skip-many (:min 0)
                                 (error (:ignore-unconsumed t)
                                   (parse-property scanner target)
                                   (skip-until (:keep-end t) #\, #\;))
                                 #\,))))
                #\;))))
180
bf090e02
MW
181;;; Lisp escape.
182
(define-pluggable-parser module lisp (scanner pset)
  ;; `lisp' s-expression `;'
  ;;
  ;; If the current token is the identifier `lisp', the s-expression is read
  ;; by the Lisp reader from a stream made over SCANNER, and the scanner is
  ;; then stepped on to the next token.  Once the closing `;' has been
  ;; matched, the form is passed to `eval'.  PSET is not used.
  ;;
  ;; NOTE(review): this evaluates arbitrary code taken from the module file,
  ;; so module files must be trusted.
  (declare (ignore pset))
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (seq ((form (if (and (eql (token-type scanner) :id)
                                (string= (token-value scanner) "lisp"))
                           (let ((in (make-scanner-stream scanner)))
                             ;; Read first, then step; the values reported
                             ;; are the form, success, and consumed.
                             (multiple-value-prog1 (values (read in t) t t)
                               (scanner-step scanner)))
                           (values '((:id "lisp")) nil nil)))
                 #\;)
             (eval form)))))
196
197;;;--------------------------------------------------------------------------
198;;; Class declarations.
199
7f2917d2
MW
(export 'class-item)

(defun parse-class-body (scanner pset name supers)
  ;; class-body ::= `{' class-item* `}'
  ;;
  ;; class-item ::= property-set raw-class-item
  ;;
  ;; Register NAME as a class type, make the class itself (handing over the
  ;; classes found for the names in SUPERS, together with PSET), and then
  ;; parse the items between the braces.  Afterwards the class is finalized
  ;; and added to `*module*'.
  (with-parser-context (token-scanner-context :scanner scanner)
    (make-class-type name)
    (let* ((class (make-sod-class name (mapcar #'find-sod-class supers)
                                  pset scanner))
           (class-nick (sod-class-nickname class)))

      (labels ((parse-maybe-dotted-declarator (base-type)
                 ;; Parse a declarator or dotted-declarator, i.e., one whose
                 ;; centre is
                 ;;
                 ;; maybe-dotted-identifier ::= [id `.'] id
                 ;;
                 ;; A plain identifier comes back as the kernel parser found
                 ;; it; a dotted identifier comes back as a cons cell of the
                 ;; two names.
                 (parse-declarator
                  scanner base-type
                  :keywordp t
                  :kernel (parser ()
                            (seq ((head :id)
                                  (tail (? (seq (#\. (id :id)) id))))
                              (cond (tail (cons head tail))
                                    (t head))))))

               (parse-message-item (sub-pset type name)
                 ;; message-item ::=
                 ;;     declspec+ declarator -!- (method-body | `;')
                 ;;
                 ;; A message which takes a varargs list may not have a
                 ;; method-body here, because there would be no name for
                 ;; the `va_list' parameter.
                 (let ((message (make-sod-message class name type
                                                  sub-pset scanner)))
                   (cond ((varargs-message-p message)
                          (parse #\;))
                         (t
                          (parse (or #\;
                                     (parse-method-item sub-pset type
                                                        class-nick name)))))))

               (parse-method-item (sub-pset type sub-nick name)
                 ;; method-item ::=
                 ;;     declspec+ dotted-declarator -!- method-body
                 ;;
                 ;; method-body ::= `{' c-fragment `}' | `extern' `;'
                 ;;
                 ;; An `extern' method is made with a body of nil.
                 (parse (seq ((method-body
                               (or (seq ("extern" #\;) nil)
                                   (parse-delimited-fragment scanner
                                                             #\{ #\}))))
                          (make-sod-method class sub-nick name type
                                           method-body sub-pset scanner))))

               (parse-initializer ()
                 ;; initializer ::= `=' c-fragment | `=' `{' c-fragment `}'
                 ;;
                 ;; Return (VALUE-KIND . VALUE-FORM), ready for passing to a
                 ;; `sod-initializer' constructor.

                 ;; Both layers of the parsing machinery are involved here.
                 ;; The character scanner will already have consumed the
                 ;; lookahead token (which, if there is anything to do, is
                 ;; `=').
                 (let ((chars (token-scanner-char-scanner scanner)))

                   ;; Move the character scanner past any whitespace.  This
                   ;; consumption isn't recorded anywhere.
                   (loop while (and (not (scanner-at-eof-p chars))
                                    (whitespace-char-p
                                     (scanner-current-char chars)))
                         do (scanner-step chars))

                   ;; Now maybe read an initializer.
                   (if (eql (token-type scanner) #\=)
                       (if (and (not (scanner-at-eof-p chars))
                                (char= (scanner-current-char chars) #\{))
                           ;; A brace follows the `=': consume the `=' here
                           ;; and read a compound initializer enclosed in
                           ;; braces.
                           (parse (seq (#\=
                                        (fragment (parse-delimited-fragment
                                                   scanner #\{ #\})))
                                    (cons :compound fragment)))
                           ;; No brace: read from the `=' up to, but not
                           ;; including, the trailing `,' or `;'.
                           (parse (seq ((fragment (parse-delimited-fragment
                                                   scanner #\= '(#\; #\,)
                                                   :keep-end t)))
                                    (cons :simple fragment))))
                       ;; Not an `=' after all, so there is no initializer.
                       (values '(#\=) nil nil))))

               (make-slot-with-initializer (sub-pset type name init)
                 ;; Make the slot NAME of TYPE on the class and, if INIT (a
                 ;; pair as returned by `parse-initializer') is non-nil,
                 ;; an instance initializer for it too.
                 (make-sod-slot class name type sub-pset scanner)
                 (when init
                   (make-sod-instance-initializer
                    class class-nick name (car init) (cdr init)
                    sub-pset scanner)))

               (parse-slot-item (sub-pset base-type type name)
                 ;; slot-item ::=
                 ;;     declspec+ declarator -!- [initializer]
                 ;;             [`,' init-declarator-list] `;'
                 ;;
                 ;; init-declarator-list ::=
                 ;;     declarator [initializer] [`,' init-declarator-list]
                 (parse (and (seq ((init (? (parse-initializer))))
                               (make-slot-with-initializer sub-pset type
                                                           name init))
                             (skip-many ()
                               (seq (#\,
                                     (declarator (parse-declarator
                                                  scanner base-type))
                                     (init (? (parse-initializer))))
                                 ;; The declarator is a (TYPE . NAME) pair.
                                 (make-slot-with-initializer
                                  sub-pset (car declarator)
                                  (cdr declarator) init)))
                             #\;)))

               (parse-initializer-item (sub-pset constructor)
                 ;; initializer-item ::=
                 ;;     [`class'] -!- slot-initializer-list `;'
                 ;;
                 ;; slot-initializer ::= id `.' id initializer
                 ;;
                 ;; CONSTRUCTOR is called once for each slot-initializer.
                 (parse (and (skip-many ()
                               (seq ((left-id :id) #\. (right-id :id)
                                     (init (parse-initializer)))
                                 (funcall constructor class
                                          left-id right-id
                                          (car init) (cdr init)
                                          sub-pset scanner))
                               #\,)
                             #\;)))

               (dispatch-class-item (sub-pset base-type type name)
                 ;; Logically part of `parse-raw-class-item', kept separate
                 ;; to limit the nesting.  We're currently at
                 ;;
                 ;; raw-class-item ::=
                 ;;     declspec+ (declarator | dotted-declarator) -!- ...
                 ;;   | other-items
                 ;;
                 ;; A function type with a dotted name is a method
                 ;; definition, and with a plain name a message.  Anything
                 ;; else is a slot; a dotted name there is reported and
                 ;; its second part used as the slot name.
                 (let ((dottedp (consp name)))
                   (cond ((typep type 'c-function-type)
                          (if dottedp
                              (parse-method-item sub-pset type
                                                 (car name) (cdr name))
                              (parse-message-item sub-pset type name)))
                         (t
                          (when dottedp
                            (cerror*-with-location
                             scanner
                             "Method declarations must have function type."))
                          (parse-slot-item sub-pset base-type type
                                           (if dottedp (cdr name) name))))))

               (parse-raw-class-item (sub-pset)
                 ;; raw-class-item ::=
                 ;;     message-item
                 ;;   | method-item
                 ;;   | slot-item
                 ;;   | initializer-item
                 ;;
                 ;; Most of the above begin with declspecs and a declarator
                 ;; (which might be dotted).  So that much is parsed here,
                 ;; and the rest is chosen based on what was found.
                 (parse (or (plug class-item scanner class sub-pset)
                            (peek
                             (seq ((base-type (parse-c-type scanner))
                                   (declarator
                                    (parse-maybe-dotted-declarator base-type))
                                   (nil (dispatch-class-item
                                         sub-pset base-type
                                         (car declarator)
                                         (cdr declarator))))))
                            (and "class"
                                 (parse-initializer-item
                                  sub-pset #'make-sod-class-initializer))
                            (parse-initializer-item
                             sub-pset #'make-sod-instance-initializer)))))

        (parse (seq (#\{
                     (nil (skip-many ()
                            (seq ((item-pset (parse-property-set scanner))
                                  (nil (parse-raw-class-item item-pset)))
                              (check-unused-properties item-pset))))
                     (nil (error () #\})))
                 (finalize-sod-class class)
                 (add-to-module *module* class)))))))
401
(define-pluggable-parser module class (scanner pset)
  ;; `class' id [`:' id-list] class-body
  ;; `class' id `;'
  ;;
  ;; The second form only registers the name, by calling `make-class-type'.
  ;; The first form collects the optional list of superclass names and
  ;; leaves the rest to `parse-class-body', passing PSET along.
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (seq ("class"
                 (name :id)
                 (nil (or (seq (#\;)
                            (make-class-type name))
                          (seq ((supers (? (seq (#\:
                                                 (super-names
                                                  (list () :id #\,)))
                                             super-names)))
                                (nil (parse-class-body scanner pset
                                                       name supers)))))))))))
415
bf090e02 416;;;----- That's all, folks --------------------------------------------------