| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | IN: xmode.marker | 
					
						
							|  |  |  | USING: kernel namespaces xmode.rules xmode.tokens | 
					
						
							| 
									
										
										
										
											2007-12-08 03:23:14 -05:00
										 |  |  | xmode.marker.state xmode.marker.context xmode.utilities | 
					
						
							|  |  |  | xmode.catalog sequences math assocs combinators combinators.lib | 
					
						
							| 
									
										
										
										
											2008-06-24 14:47:54 -04:00
										 |  |  | strings regexp splitting parser-combinators ascii unicode.case | 
					
						
							|  |  |  | combinators.short-circuit ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | ! Based on org.gjt.sp.jedit.syntax.TokenMarker | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : current-keyword ( -- string )
 | 
					
						
							|  |  |  |     last-offset get position get line get subseq ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : keyword-number? ( keyword -- ? )
 | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         [ current-rule-set rule-set-highlight-digits? ] | 
					
						
							|  |  |  |         [ dup [ digit? ] contains? ] | 
					
						
							|  |  |  |         [ | 
					
						
							|  |  |  |             dup [ digit? ] all? [ | 
					
						
							| 
									
										
										
										
											2007-12-06 00:23:18 -05:00
										 |  |  |                 current-rule-set rule-set-digit-re | 
					
						
							|  |  |  |                 dup [ dupd matches? ] [ drop f ] if
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |             ] unless*
 | 
					
						
							|  |  |  |         ] | 
					
						
							| 
									
										
										
										
											2008-06-10 21:42:55 -04:00
										 |  |  |     } 0&& nip ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | : mark-number ( keyword -- id )
 | 
					
						
							|  |  |  |     keyword-number? DIGIT and ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : mark-keyword ( keyword -- id )
 | 
					
						
							| 
									
										
										
										
											2007-12-10 02:20:36 -05:00
										 |  |  |     current-rule-set rule-set-keywords at ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | : add-remaining-token ( -- )
 | 
					
						
							|  |  |  |     current-rule-set rule-set-default prev-token, ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : mark-token ( -- )
 | 
					
						
							|  |  |  |     current-keyword | 
					
						
							|  |  |  |     dup mark-number [ ] [ mark-keyword ] ?if
 | 
					
						
							|  |  |  |     [ prev-token, ] when* ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : current-char ( -- char )
 | 
					
						
							|  |  |  |     position get line get nth ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | GENERIC: match-position ( rule -- n )
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | M: mark-previous-rule match-position drop last-offset get ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | M: rule match-position drop position get ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : can-match-here? ( matcher rule -- ? )
 | 
					
						
							|  |  |  |     match-position { | 
					
						
							|  |  |  |         [ over ] | 
					
						
							|  |  |  |         [ over matcher-at-line-start?     over zero?                implies ] | 
					
						
							|  |  |  |         [ over matcher-at-whitespace-end? over whitespace-end get = implies ] | 
					
						
							|  |  |  |         [ over matcher-at-word-start?     over last-offset get =    implies ] | 
					
						
							| 
									
										
										
										
											2008-06-10 21:42:55 -04:00
										 |  |  |     } 0&& 2nip ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-08 03:23:14 -05:00
										 |  |  | : rest-of-line ( -- str )
 | 
					
						
							|  |  |  |     line get position get tail-slice ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-08 15:14:33 -05:00
										 |  |  | GENERIC: text-matches? ( string text -- match-count/f )
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-08 03:23:14 -05:00
										 |  |  | M: f text-matches? | 
					
						
							|  |  |  |     2drop f ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-08 03:23:14 -05:00
										 |  |  | M: string-matcher text-matches? | 
					
						
							|  |  |  |     [ | 
					
						
							|  |  |  |         dup string-matcher-string | 
					
						
							|  |  |  |         swap string-matcher-ignore-case? | 
					
						
							|  |  |  |         string-head? | 
					
						
							|  |  |  |     ] keep string-matcher-string length and ;
 | 
					
						
							| 
									
										
										
										
											2007-12-06 00:23:18 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | M: regexp text-matches? | 
					
						
							| 
									
										
										
										
											2007-12-08 15:14:33 -05:00
										 |  |  |     >r >string r> match-head ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | : rule-start-matches? ( rule -- match-count/f )
 | 
					
						
							|  |  |  |     dup rule-start tuck swap can-match-here? [ | 
					
						
							| 
									
										
										
										
											2007-12-08 03:23:14 -05:00
										 |  |  |         rest-of-line swap matcher-text text-matches? | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |     ] [ | 
					
						
							|  |  |  |         drop f
 | 
					
						
							|  |  |  |     ] if ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : rule-end-matches? ( rule -- match-count/f )
 | 
					
						
							|  |  |  |     dup mark-following-rule? [ | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  |         dup rule-start swap can-match-here? 0 and
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |     ] [ | 
					
						
							|  |  |  |         dup rule-end tuck swap can-match-here? [ | 
					
						
							| 
									
										
										
										
											2007-12-08 03:23:14 -05:00
										 |  |  |             rest-of-line | 
					
						
							|  |  |  |             swap matcher-text context get line-context-end or
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |             text-matches? | 
					
						
							|  |  |  |         ] [ | 
					
						
							|  |  |  |             drop f
 | 
					
						
							|  |  |  |         ] if
 | 
					
						
							|  |  |  |     ] if ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  | DEFER: get-rules | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : get-always-rules ( vector/f ruleset -- vector/f )
 | 
					
						
							|  |  |  |     f swap rule-set-rules at ?push-all ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : get-char-rules ( vector/f char ruleset -- vector/f )
 | 
					
						
							|  |  |  |     >r ch>upper r> rule-set-rules at ?push-all ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : get-rules ( char ruleset -- seq )
 | 
					
						
							| 
									
										
										
										
											2007-12-10 02:20:36 -05:00
										 |  |  |     f -rot [ get-char-rules ] keep get-always-rules ;
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | GENERIC: handle-rule-start ( match-count rule -- )
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | GENERIC: handle-rule-end ( match-count rule -- )
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  | : find-escape-rule ( -- rule )
 | 
					
						
							|  |  |  |     context get dup
 | 
					
						
							|  |  |  |     line-context-in-rule-set rule-set-escape-rule [ ] [ | 
					
						
							|  |  |  |         line-context-parent line-context-in-rule-set | 
					
						
							|  |  |  |         dup [ rule-set-escape-rule ] when
 | 
					
						
							|  |  |  |     ] ?if ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : check-escape-rule ( rule -- ? )
 | 
					
						
							|  |  |  |     rule-no-escape? [ f ] [ | 
					
						
							|  |  |  |         find-escape-rule dup [ | 
					
						
							|  |  |  |             dup rule-start-matches? dup [ | 
					
						
							|  |  |  |                 swap handle-rule-start | 
					
						
							|  |  |  |                 delegate-end-escaped? [ not ] change
 | 
					
						
							|  |  |  |                 t
 | 
					
						
							|  |  |  |             ] [ | 
					
						
							|  |  |  |                 2drop f
 | 
					
						
							|  |  |  |             ] if
 | 
					
						
							|  |  |  |         ] when
 | 
					
						
							|  |  |  |     ] if ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | : check-every-rule ( -- ? )
 | 
					
						
							|  |  |  |     current-char current-rule-set get-rules | 
					
						
							|  |  |  |     [ rule-start-matches? ] map-find
 | 
					
						
							|  |  |  |     dup [ handle-rule-start t ] [ 2drop f ] if ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : ?end-rule ( -- )
 | 
					
						
							|  |  |  |     current-rule [ | 
					
						
							|  |  |  |         dup rule-end-matches? | 
					
						
							|  |  |  |         dup [ swap handle-rule-end ] [ 2drop ] if
 | 
					
						
							|  |  |  |     ] when* ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : rule-match-token* ( rule -- id )
 | 
					
						
							|  |  |  |     dup rule-match-token { | 
					
						
							|  |  |  |         { f [ dup rule-body-token ] } | 
					
						
							|  |  |  |         { t [ current-rule-set rule-set-default ] } | 
					
						
							|  |  |  |         [ ] | 
					
						
							|  |  |  |     } case nip ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  | M: escape-rule handle-rule-start | 
					
						
							|  |  |  |     drop
 | 
					
						
							|  |  |  |     ?end-rule | 
					
						
							|  |  |  |     process-escape? get [ | 
					
						
							|  |  |  |         escaped? [ not ] change
 | 
					
						
							|  |  |  |         position [ + ] change
 | 
					
						
							|  |  |  |     ] [ 2drop ] if ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | M: seq-rule handle-rule-start | 
					
						
							|  |  |  |     ?end-rule | 
					
						
							|  |  |  |     mark-token | 
					
						
							|  |  |  |     add-remaining-token | 
					
						
							|  |  |  |     tuck rule-body-token next-token, | 
					
						
							| 
									
										
										
										
											2007-12-10 02:20:36 -05:00
										 |  |  |     rule-delegate [ push-context ] when* ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | UNION: abstract-span-rule span-rule eol-span-rule ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | M: abstract-span-rule handle-rule-start | 
					
						
							|  |  |  |     ?end-rule | 
					
						
							|  |  |  |     mark-token | 
					
						
							|  |  |  |     add-remaining-token | 
					
						
							|  |  |  |     tuck rule-match-token* next-token, | 
					
						
							|  |  |  |     ! ... end subst ... | 
					
						
							|  |  |  |     dup context get set-line-context-in-rule | 
					
						
							| 
									
										
										
										
											2007-12-10 02:20:36 -05:00
										 |  |  |     rule-delegate push-context ;
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  | M: span-rule handle-rule-end | 
					
						
							|  |  |  |     2drop ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | M: mark-following-rule handle-rule-start | 
					
						
							|  |  |  |     ?end-rule | 
					
						
							|  |  |  |     mark-token add-remaining-token | 
					
						
							|  |  |  |     tuck rule-match-token* next-token, | 
					
						
							|  |  |  |     f context get set-line-context-end | 
					
						
							|  |  |  |     context get set-line-context-in-rule ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  | M: mark-following-rule handle-rule-end | 
					
						
							|  |  |  |     nip rule-match-token* prev-token, | 
					
						
							|  |  |  |     f context get set-line-context-in-rule ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | M: mark-previous-rule handle-rule-start | 
					
						
							|  |  |  |     ?end-rule | 
					
						
							|  |  |  |     mark-token | 
					
						
							|  |  |  |     dup rule-body-token prev-token, | 
					
						
							|  |  |  |     rule-match-token* next-token, ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-06-09 03:14:14 -04:00
										 |  |  | : do-escaped ( -- )
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |     escaped? get [ | 
					
						
							|  |  |  |         escaped? off
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  |         ! ... | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |     ] when ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : check-end-delegate ( -- ? )
 | 
					
						
							|  |  |  |     context get line-context-parent [ | 
					
						
							|  |  |  |         line-context-in-rule [ | 
					
						
							|  |  |  |             dup rule-end-matches? dup [ | 
					
						
							|  |  |  |                 [ | 
					
						
							|  |  |  |                     swap handle-rule-end | 
					
						
							|  |  |  |                     ?end-rule | 
					
						
							|  |  |  |                     mark-token | 
					
						
							|  |  |  |                     add-remaining-token | 
					
						
							|  |  |  |                 ] keep context get line-context-parent line-context-in-rule rule-match-token* next-token, | 
					
						
							|  |  |  |                 pop-context | 
					
						
							|  |  |  |                 seen-whitespace-end? on t
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  |             ] [ drop check-escape-rule ] if
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |         ] [ f ] if*
 | 
					
						
							|  |  |  |     ] [ f ] if* ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : handle-no-word-break ( -- )
 | 
					
						
							|  |  |  |     context get line-context-parent [ | 
					
						
							| 
									
										
										
										
											2007-12-10 02:20:36 -05:00
										 |  |  |         line-context-in-rule [ | 
					
						
							|  |  |  |             dup rule-no-word-break? [ | 
					
						
							|  |  |  |                 rule-match-token* prev-token, | 
					
						
							|  |  |  |                 pop-context | 
					
						
							|  |  |  |             ] [ drop ] if
 | 
					
						
							|  |  |  |         ] when*
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |     ] when* ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : check-rule ( -- )
 | 
					
						
							|  |  |  |     ?end-rule | 
					
						
							|  |  |  |     handle-no-word-break | 
					
						
							|  |  |  |     mark-token | 
					
						
							|  |  |  |     add-remaining-token ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : (check-word-break) ( -- )
 | 
					
						
							|  |  |  |     check-rule | 
					
						
							|  |  |  |      | 
					
						
							|  |  |  |     1 current-rule-set rule-set-default next-token, ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  | : rule-set-empty? ( ruleset -- ? )
 | 
					
						
							|  |  |  |     dup rule-set-rules assoc-empty?
 | 
					
						
							|  |  |  |     swap rule-set-keywords assoc-empty? and ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | : check-word-break ( -- ? )
 | 
					
						
							|  |  |  |     current-char dup blank? [ | 
					
						
							|  |  |  |         drop
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         seen-whitespace-end? get [ | 
					
						
							|  |  |  |             position get 1+ whitespace-end set
 | 
					
						
							|  |  |  |         ] unless
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         (check-word-break) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     ] [ | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  |         ! Micro-optimization with incorrect semantics; we keep | 
					
						
							|  |  |  |         ! it here because jEdit mode files depend on it now... | 
					
						
							|  |  |  |         current-rule-set rule-set-empty? [ | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |             drop
 | 
					
						
							|  |  |  |         ] [ | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  |             dup alpha? [ | 
					
						
							|  |  |  |                 drop
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |             ] [ | 
					
						
							| 
									
										
										
										
											2007-12-02 05:25:18 -05:00
										 |  |  |                 current-rule-set rule-set-no-word-sep* member? [ | 
					
						
							|  |  |  |                     (check-word-break) | 
					
						
							|  |  |  |                 ] unless
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |             ] if
 | 
					
						
							|  |  |  |         ] if
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         seen-whitespace-end? on
 | 
					
						
							|  |  |  |     ] if
 | 
					
						
							|  |  |  |     escaped? off
 | 
					
						
							|  |  |  |     delegate-end-escaped? off t ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : mark-token-loop ( -- )
 | 
					
						
							|  |  |  |     position get line get length < [ | 
					
						
							|  |  |  |         { | 
					
						
							|  |  |  |             [ check-end-delegate ] | 
					
						
							|  |  |  |             [ check-every-rule ] | 
					
						
							|  |  |  |             [ check-word-break ] | 
					
						
							| 
									
										
										
										
											2008-06-10 21:42:55 -04:00
										 |  |  |         } 0|| drop
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  | 
 | 
					
						
							|  |  |  |         position inc
 | 
					
						
							|  |  |  |         mark-token-loop | 
					
						
							|  |  |  |     ] when ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : mark-remaining ( -- )
 | 
					
						
							|  |  |  |     line get length position set
 | 
					
						
							|  |  |  |     check-rule ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : unwind-no-line-break ( -- )
 | 
					
						
							|  |  |  |     context get line-context-parent [ | 
					
						
							| 
									
										
										
										
											2007-12-10 02:20:36 -05:00
										 |  |  |         line-context-in-rule [ | 
					
						
							|  |  |  |             rule-no-line-break? [ | 
					
						
							|  |  |  |                 pop-context | 
					
						
							|  |  |  |                 unwind-no-line-break | 
					
						
							|  |  |  |             ] when
 | 
					
						
							|  |  |  |         ] when*
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |     ] when* ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : tokenize-line ( line-context line rules -- line-context' seq )
 | 
					
						
							|  |  |  |     [ | 
					
						
							| 
									
										
										
										
											2007-12-10 02:20:36 -05:00
										 |  |  |         "MAIN" swap at -rot
 | 
					
						
							| 
									
										
										
										
											2007-11-28 23:34:11 -05:00
										 |  |  |         init-token-marker | 
					
						
							|  |  |  |         mark-token-loop | 
					
						
							|  |  |  |         mark-remaining | 
					
						
							|  |  |  |         unwind-no-line-break | 
					
						
							|  |  |  |         context get
 | 
					
						
							|  |  |  |     ] { } make ;
 |