]> git.saurik.com Git - wxWidgets.git/blob - utils/HelpGen/src/cjparser.cpp
offset version by 1 to avoid having compatibility_version of 0.0.0 under Darwin:...
[wxWidgets.git] / utils / HelpGen / src / cjparser.cpp
1 /////////////////////////////////////////////////////////////////////////////
2 // Name: No names yet.
3 // Purpose: Contrib. demo
4 // Author: Aleksandras Gluchovas
5 // Modified by:
6 // Created: 22/09/98
7 // RCS-ID: $Id$
8 // Copyright: (c) Aleskandars Gluchovas
9 // Licence: wxWindows licence
10 /////////////////////////////////////////////////////////////////////////////
11
12 // For compilers that support precompilation, includes "wx/wx.h".
13 #include "wx/wxprec.h"
14
15 #ifdef __BORLANDC__
16 #pragma hdrstop
17 #endif
18
19 #ifndef WX_PRECOMP
20 #include "wx/wx.h"
21 #endif
22
23 #include "cjparser.h"
24
25 #if defined( wxUSE_TEMPLATE_STL )
26
27 #include <map>
28
29 #else
30
31 #include "wxstlac.h"
32
33 #endif
34
35
36 /***** Implementation for class SJParser *****/
37
38 // statics used by inline'ed C helper-functions
39 static char* _gSrcStart = 0;
40 static char* _gSrcEnd = 0;
41 static wxChar* _gLastSuppresedComment = 0;
42 static int _gLineNo = 0;
43
44 // FOR NOW:: comments queue is static
45 #define MAX_CQ_ENTRIES 128
46 static char* _gCommentsQueue[MAX_CQ_ENTRIES];
47 static int _gCQSize = 0;
48
49 /***** keyword map related structures *****/
50
51 struct less_c_str
52 {
53 inline bool operator()( char* x, char* y) const
54 { return ( strcmp( x,y ) < 0 );
55 }
56 };
57
58 //WXSTL_MAP(CharPtrT,CharPtrT, LESS_THEN_FUNCTOR(CharPtrT));
59
60 #if defined( wxUSE_TEMPLATE_STL )
61
62 typedef map< char*, char*, less_c_str > KeywordMapT;
63
64 #else
65
66 typedef char* CharPtrT;
67 typedef WXSTL_MAP( CharPtrT, CharPtrT ,less_c_str) KeywordMapT;
68
69 #endif
70
71 static KeywordMapT __gMultiLangMap;
72 static int __gMapReady = 0;
73
74 static char* __gKeyWords[] =
75 {
76 "public",
77 "protected",
78 "private",
79
80 "class",
81 "struct",
82 "union",
83 "enum",
84 "interface",
85
86 "package",
87 "import",
88
89 "typedef",
90 "template",
91 "friend",
92 "const",
93 "volatile",
94 "mutable",
95 "virtual",
96 "inline",
97 "static",
98 "register",
99
100 "final",
101 "abstract",
102 "native",
103
104 "__stdcall",
105 "extern",
106
107 0
108 };
109
110 static void check_keyword_map()
111 {
112 if ( !__gMapReady )
113 {
114 __gMapReady = 1;
115
116 // "make sure" the address of the first member of non-polimorphic class
117 // coinsides with the address of the instance
118
119 char** keyword = __gKeyWords;
120
121 while ( (*keyword) != 0 )
122 {
123 __gMultiLangMap.insert(
124 KeywordMapT::value_type( *keyword, *keyword )
125 );
126
127 ++keyword;
128 }
129 }
130 }
131
132 /***** helper functions *****/
133
134 static inline void skip_to_eol( char*& cur )
135 {
136 while( *(cur) != 10 && *cur != 13 && cur < _gSrcEnd) ++cur;
137 }
138
139 static inline void skip_eol( char*& cur )
140 {
141 if ( *cur == 13 )
142
143 cur += 2;
144 else
145 cur += 1;
146
147 ++_gLineNo;
148 }
149
150 static inline bool skip_to_next_comment_in_the_line( char*& cur )
151 {
152 do
153 {
154 while( cur < _gSrcEnd &&
155 *cur != 10 &&
156 *cur != 13 &&
157 *cur != '/'
158 ) ++cur;
159
160 if ( cur == _gSrcEnd ) return false;
161
162 if ( *cur == '/' )
163 {
164 if ( (*(cur+1) == '*') ||
165 (*(cur+1) == '/') ) return true;
166 else
167 {
168 ++cur;
169 continue;
170 }
171 }
172
173 return false;
174
175 } while(1);
176 }
177
178 inline static void store_line_no( int& toVar )
179 {
180 toVar = _gLineNo;
181 }
182
183 inline static void restore_line_no( int storedLineNo )
184 {
185 _gLineNo = storedLineNo;
186 }
187
188 inline static int get_line_no()
189 {
190 return _gLineNo;
191 }
192
193 static void skip_to_prev_line( char*& cur )
194 {
195 while( cur >= _gSrcStart &&
196 *cur != 10 &&
197 *cur != 13
198 ) --cur;
199
200 // NOTE:: '\n' is 13,10 for DOS
201 // '\n' is 10 for UNIX
202
203 // NOTE1: '\n' symbol is not used here,
204 // to provide possibility of loading
205 // file as binary
206
207 --cur;
208 if ( *cur == 10 )
209 {
210 ++cur;
211 return;
212 }
213
214 if ( *cur == 13 ) --cur;
215
216 while( cur >= _gSrcStart &&
217 *cur != 10 &&
218 *cur != 13
219 ) --cur;
220
221 ++cur; // move to the first character in the line
222 }
223
224 static inline void skip_comments( char*& cur )
225 {
226 ++cur; // skip '/' token
227
228 if ( *cur != '/' && *cur != '*' ) return;
229
230 // first, store position of the comment into the queue
231 // (which further will be attached to the next context
232 // found)
233
234 if ( cur-1 != _gLastSuppresedComment )
235 {
236 if ( _gCQSize == MAX_CQ_ENTRIES )
237 {
238 size_t i = MAX_CQ_ENTRIES-1;
239
240 while( i != 0 )
241 {
242 _gCommentsQueue[i-1] = _gCommentsQueue[i];
243 --i;
244 }
245
246 --_gCQSize ;
247 }
248
249 _gCommentsQueue[_gCQSize++] = cur-1;
250 }
251
252 // if signle-line comment, skip it now
253 if ( *cur == '/' )
254 {
255 skip_to_eol( cur );
256 skip_eol( cur );
257 return;
258 }
259
260 size_t level = 1;
261
262 // check for multiline comment (handle nested multiline comments!)
263
264 int line_len = 0;
265
266 ++cur;
267 ++cur;
268 do
269 {
270 // TBD:: check eof cond.
271
272 // detect and remove vertical columns of '*''s
273
274 while ( *cur != '/' && cur < _gSrcEnd )
275 {
276 switch (*cur)
277 {
278 case '*' :
279 {
280 if ( *(cur+1) != '/' )
281 {
282 if ( line_len == 1 )
283
284 *cur = ' ';
285 }
286
287 break;
288 }
289
290 case 13 : line_len = 0; break;
291 case 10 : { line_len = 0; ++_gLineNo; } break;
292
293 default : ++line_len;
294 }
295
296 ++cur;
297 }
298
299 if ( cur >= _gSrcEnd ) return;
300
301 ++cur;
302
303 if ( *(cur-2) == '*' )
304 {
305 --level;
306 if ( level == 0 )
307 break;
308 }
309 else
310 if ( *cur == '*' )
311 {
312 ++cur;
313 ++cur;
314
315 ++level;
316 }
317
318 } while(1);
319 }
320
321 static inline void clear_commets_queue()
322 {
323 _gCQSize = 0;
324 }
325
326 static inline void skip_quoted_string( char*& cur )
327 {
328 ++cur; // skip first quote '"'
329
330 // check if quote wasn't prefixed
331 if ( *(cur-2) == '\\' )
332 return;
333
334 do
335 {
336 while ( *cur != '"' && cur < _gSrcEnd )
337 {
338 if ( *cur == 10 ) ++_gLineNo;
339 ++cur;
340 }
341
342 if ( cur >= _gSrcEnd ) return;
343
344 ++cur; // skip the last quote
345
346 // check if it wasn't prefixed
347
348 if ( *(cur-2) != '\\' )
349 break;
350
351 } while (1);
352 }
353
354 // skips subsequent white space and comments
355 // (return false if the end of source code reached)
356
357 static inline bool get_next_token( char*& cur )
358 {
359 for( ; cur < _gSrcEnd; ++cur )
360 {
361 switch( *(cur) )
362 {
363 case ' ' : continue;
364 case '\t': continue;
365 case 13 : continue;
366
367 case 10 : { ++_gLineNo;continue; }
368
369 case '/' : skip_comments( cur );
370 --cur;
371 continue;
372
373 default : break;
374 };
375
376 break;
377 }
378
379 if ( cur >= _gSrcEnd )
380 return false;
381 else
382 return true;
383 }
384
385 static inline void skip_preprocessor_dir( wxChar*& cur )
386 {
387 do
388 {
389 skip_to_eol(cur);
390
391 if ( *(cur-1) != _T('\\') )
392 break;
393
394 if ( cur < _gSrcEnd )
395 skip_eol( cur );
396 else
397 break;
398
399 } while(1);
400 }
401
402 static void skip_token( char*& cur )
403 {
404 if ( *cur == '"' )
405 {
406 skip_quoted_string( cur );
407 return;
408 }
409
410 if ( *cur == ',' ||
411 *cur == ';' ||
412 *cur == ')' ||
413 *cur == '('
414 )
415 {
416 ++cur;
417 return;
418 }
419
420 // special case of "!=", "<=", ... 2 character composite tokens
421 if ( *cur == '<' ||
422 *cur == '>' ||
423 *cur == '=' ||
424 *cur == '!'
425 )
426 {
427 cur++;
428 if ( *cur == '=' )
429 cur++;
430
431 return;
432 }
433
434 ++cur; // leading character is always skipped
435
436 for( ; cur < _gSrcEnd ; ++cur )
437 {
438 switch ( *cur )
439 {
440 case ' ' : break;
441 case '\t': break;
442 case 13 : break;
443 case 10 : break;
444 case ',' : break;
445 case ';' : break;
446 case '<' : break;
447 case '>' : break;
448
449 // FIXME:: QUICK-HACK:: to treat scope resolution
450 // tokens are a part of the string - e.g. SomeSpace::SubName would
451 // become one token
452
453 case ':' : if ( *(cur+1) == ':' )
454 {
455 ++cur;
456 continue;
457 }
458
459 break;
460 case '=' : break;
461 case '(' : break;
462 case ')' : break;
463 case '{' : break;
464 case '}' : break;
465
466 default : continue;
467 };
468 break;
469 }
470 }
471
472 static inline size_t get_token_len( char* tok )
473 {
474 char* start = tok;
475
476 skip_token( tok );
477
478 return size_t( tok - start );
479 }
480
481 // returns true, if given tokens are equel
482
483 static inline bool cmp_tokens( char* tok1, char* tok2 )
484 {
485 // NOTE:: the case one token includes
486 // other in it's entirely is not handled
487
488 size_t len = get_token_len( tok1 );
489
490 // assuming that tokens are non-zero length
491
492 do
493 {
494 if ( *(tok1++) != *(tok2++) )
495 return false;
496
497 --len;
498
499 } while ( --len );
500
501 return true;
502 }
503
504 static inline bool cmp_tokens_fast( char* tok1, char* tok2, size_t len )
505 {
506 do
507 {
508 if ( *(tok1++) != *(tok2++) )
509 return false;
510
511 } while ( --len );
512
513 return true;
514 }
515
516 static inline void skip_tempalate_statement( char*& cur )
517 {
518 size_t level = 0;
519
520 // go one level deeper
521 while( *cur != '<' && cur < _gSrcEnd )
522 {
523 if (*cur == 10 ) ++_gLineNo;
524 ++cur;
525 }
526
527 // FIXME:: template should be checked statement for
528 // comments inside of it
529
530 do
531 {
532 if ( *cur == '<' )
533 ++level;
534 else
535 --level;
536
537 ++cur; // skip '<' or '>' token
538
539 if ( level == 0 )
540 return;
541
542 while( *cur != '<' && *cur != '>' && cur < _gSrcEnd )
543 {
544 if (*cur == 10 ) ++_gLineNo;
545 ++cur;
546 }
547
548 } while (1);
549 }
550
551 static inline void skip_statement( char*& cur )
552 {
553 for( ; cur < _gSrcEnd; ++cur )
554
555 switch (*cur)
556 {
557 case ';' : ++cur; // skip statement-terminator token
558 return;
559
560 case '"' : skip_quoted_string(cur);
561 --cur;
562 continue;
563
564 case 10 : ++_gLineNo;
565
566 continue;
567 case '/' : skip_comments( cur );
568 --cur;
569 continue;
570 default : continue;
571 }
572 }
573
574 // "reversed" versions of skip_token() and get_next_token()
575
576 static inline void skip_token_back( char*& cur )
577 {
578 // FIXME:: now, when moving backwards, neither strings nor
579 // comment blocks are checked
580
581 --cur; // skip to the trailing character
582
583 if ( *cur == ',' ||
584 *cur == ')' ||
585 *cur == '('
586 )
587 return;
588
589
590 for( ; cur < _gSrcEnd ; --cur )
591 {
592 switch ( *cur )
593 {
594 case ' ' : break;
595 case '\t': break;
596 case 13 : break;
597 case 10 : break;
598 case ',' : break;
599 case '(' : break;
600
601 default : continue;
602 };
603
604 break;
605 }
606
607 ++cur; // get to the leading character of the token
608 }
609
610 static inline void skip_next_token_back( char*& cur )
611 {
612 --cur; // skip leading character of the current token
613
614 if ( *cur == ',' ||
615 *cur == ')' ||
616 *cur == '('
617 )
618 {
619 ++cur;
620 return;
621 }
622
623 for( ; cur < _gSrcEnd; --cur )
624 {
625 switch ( *cur )
626 {
627 case ' ' : continue;
628 case '\t': continue;
629 case 13 : continue;
630 case 10 : continue;
631 case ',' : continue;
632 case '(' : continue;
633
634 default : break;
635 };
636
637 break;
638 }
639
640 ++cur; // position after the trailing charcter of the prev token
641 }
642
643 static wxString get_token_str( char* cur )
644 {
645 return wxString( cur, get_token_len( cur ) );
646 }
647
648 // skips token or whole expression which may have
649 // nested expressions between '(' ')' brackets.
650 //
651 // Upon return, the cursor points to the terminating bracket ')',
652 //
653 // Return value is the size of the block
654
655 static size_t skip_block( char*& cur )
656 {
657 size_t level = 0; // nesting level
658
659 char* start = cur;
660
661 // NOTE:: assumed that block not necessarely starts
662 // with bracket rightaway
663
664 if ( *cur == '(' )
665 {
666 ++level;
667 }
668
669 do
670 {
671 skip_token( cur );
672
673 char* savedPos = cur;
674 int tmpLnNo;
675 store_line_no( tmpLnNo );
676
677 get_next_token( cur );
678
679 if ( cur >= _gSrcEnd ) return 0;
680
681 if ( *cur == '(' )
682 {
683 ++level;
684 }
685 else
686 if ( *cur == ')' )
687 {
688 if ( level == 0 )
689 {
690 cur = savedPos;
691 restore_line_no( tmpLnNo );
692
693 return size_t(cur-start);
694 }
695
696 --level;
697
698 if ( level == 0 )
699 {
700 ++cur;
701
702 // QUICK-HACK::to easily handle function prototypes ,
703 // it works, besause theoretically there should
704 // be no cast-expressions in non-implementation
705 // scope (e.g. "time( (long*)(ptr+1) )" should not
706 // appear in the declarations, thus it is most likelly
707 // for the ")(" fragment to be within a function
708 // prototype in the declarations scope
709
710 if ( *cur == '(' )
711 {
712 ++level;
713 continue;
714 }
715
716 else return size_t(cur-start);
717 }
718 }
719 else
720 {
721 if ( level == 0 )
722 {
723 cur = savedPos;
724 restore_line_no( tmpLnNo );
725
726 return size_t(cur-start);
727 }
728 }
729
730 } while(1);
731 }
732
733 // returns 0, if end of source reached
734 static inline bool skip_imp_block( char*& cur )
735 {
736 while( *cur != '{' && cur < _gSrcEnd )
737 {
738 skip_token( cur );
739 if ( !get_next_token( cur ) ) return false;
740 }
741
742 while( *cur != '}' && cur < _gSrcEnd )
743 {
744 skip_token( cur );
745 if ( !get_next_token( cur ) ) return false;
746 }
747
748 ++cur;
749
750 return true;
751 }
752
753 static bool is_class_token( char*& cur )
754 {
755 // FIXME:: the below mess should be cleaned in it's entirely
756
757 if ( *cur == 'i' )
758 if ( *(cur+1) == 'n' )
759
760 return cmp_tokens_fast( cur, "interface", 9 );
761
762 if ( *cur == 'c' )
763 if ( *(cur+1) == 'l' )
764
765 return cmp_tokens_fast( cur, "class", 5 );
766
767 if ( *cur == 's' )
768 if ( *(cur+1) == 't' )
769
770 return cmp_tokens_fast( cur, "struct", 6 );
771
772 if ( *cur == 'u' )
773 if ( *(cur+1) == 'n' )
774
775 return cmp_tokens_fast( cur, "union", 5 );
776
777 return false;
778 }
779
780 inline static bool is_forward_decl( char* cur )
781 {
782 do
783 {
784 switch( *cur )
785 {
786 case ':' : return false;
787 case '{' : return false;
788 case '(' : return false;
789
790 case ';' : return true;
791
792 default : break;
793 };
794
795 ++cur;
796
797 } while (cur < _gSrcEnd); // prevent running out of bounds
798
799 return false;
800 }
801
802 inline static bool is_function( char* cur, bool& isAMacro )
803 {
804 isAMacro = false;
805
806 int tmpLnNo;
807 store_line_no( tmpLnNo );
808
809 // NOTE:: comments and quoted strings are not checked here
810
811 // first,check for "single-line hanginging macros" like:
812 // ___UNICODE
813 //
814
815 char* eol = cur;
816 skip_to_eol( eol );
817
818 skip_token( cur );
819 get_next_token( cur );
820
821 if ( cur > eol )
822 {
823 isAMacro = true;
824 restore_line_no( tmpLnNo );
825
826 return true;
827 }
828
829 // it's not a macro, go to the begining of arg. list
830
831 do
832 {
833 // if bracket found, it's a function or a begining
834 // of some macro
835 if ( *cur == '(' )
836 {
837 restore_line_no( tmpLnNo );
838 return true;
839 }
840
841 // end of statement found without any brackets in it
842 // - it cannot be a function
843
844 if ( *cur == ';' )
845 {
846 restore_line_no( tmpLnNo );
847 return false;
848 }
849
850 ++cur;
851
852 } while( cur < _gSrcEnd);
853
854 isAMacro = 1;
855 restore_line_no( tmpLnNo );
856
857 return false;
858 }
859
860 // upon return the cursor is positioned after the
861 // terminating curly brace
862
863 static inline void skip_scope_block( char*& cur )
864 {
865 size_t level = 0;
866
867 for( ; cur < _gSrcEnd ; ++cur )
868
869 switch( *cur )
870 {
871 case '/' : skip_comments( cur );
872 --cur;
873 continue;
874 case '"' : skip_quoted_string( cur );
875 --cur;
876 continue;
877
878 case '{' : ++level;
879 continue;
880
881 case '}' :--level;
882 if ( level == 0 )
883 {
884 ++cur; // skip final closing curly brace
885 return;
886 }
887
888 case 10 : ++_gLineNo; continue;
889
890 default : continue;
891 };
892 }
893
894 // moves tokens like '*' '**', '***', '&' from the name
895 // to the type
896
897 static void arrange_indirection_tokens_between( wxString& type,
898 wxString& identifier )
899 {
900 // TBD:: FIXME:: return value of operators !
901
902 while ( identifier[0u] == _T('*') ||
903 identifier[0u] == _T('&')
904 )
905 {
906 type += identifier[0u];
907 identifier.erase(0,1);
908
909 if ( !identifier.length() ) return;
910 }
911 }
912
913
914 // the only function where multi-lang keyword map is accessed
915
916 static bool is_keyword( char* cur )
917 {
918 size_t len = get_token_len( cur );
919
920 // put a terminating zero after the given token
921 char tmp = *(cur + len);
922 *(cur+len) = '\0';
923
924 KeywordMapT::iterator i;
925
926 i = __gMultiLangMap.find( cur );
927
928 // restore original character suppresed by terminating zero
929 *(cur + len) = tmp;
930
931 return i == __gMultiLangMap.end() ? false : true;
932 }
933
934 static inline void get_string_between( wxChar* start, wxChar* end,
935 wxString* pStr )
936 {
937 char saved = *end;
938
939 *end = _T('\0');
940 *pStr = start;
941 *end = saved;
942 }
943
944 static wxChar* set_comment_text( wxString& text, wxChar* start )
945 {
946 wxChar* end = start;
947
948 // to avoid poluting the queue with this comment
949 _gLastSuppresedComment = start;
950
951 skip_comments( end );
952
953 if ( *(end-1) == _T('/') )
954 end -= 2;
955
956 start += 2;
957
958 // skip multiple leading '/''s or '*''s
959 while( *start == _T('/') && start < end ) ++start;
960 while( *start == _T('*') && start < end ) ++start;
961
962 get_string_between( start, end, &text );
963
964 return end;
965 }
966
967 /***** Implementation for class CJSourceParser *****/
968
969 CJSourceParser::CJSourceParser( bool collectCommnets, bool collectMacros )
970 : mpStart(0),
971 mpEnd(0),
972 mpCurCtx( 0 ),
973 mCommentsOn( collectCommnets ),
974 mMacrosOn ( collectMacros )
975 {
976 check_keyword_map();
977 }
978
979 spFile* CJSourceParser::Parse( char* start, char* end )
980 {
981 // set up state variables
982 mCurVis = SP_VIS_PRIVATE;
983
984 spFile* pTopCtx = new spFile();
985 mpCurCtx = pTopCtx;
986
987 mIsVirtual = 0;
988 mIsTemplate = 0;
989 mNestingLevel = 0;
990
991 m_cur = start;
992
993 mpStart = start;
994 mpEnd = end;
995
996 _gSrcEnd = mpEnd; // let all the C-functions "smell" the end of file
997 _gSrcStart = start;
998
999 _gLineNo = 0;
1000
1001 clear_commets_queue();
1002
1003 // main parsing loop
1004
1005 do
1006 {
1007 if ( !get_next_token( m_cur ) )
1008 // end of source reached
1009 return pTopCtx;
1010
1011 if ( memcmp( m_cur, "ScriptSection( const string&",
1012 strlen( "ScriptSection( const string&" )
1013 ) == 0
1014 )
1015 {
1016 // int o = 0;
1017 // ++o;
1018 }
1019
1020 switch (*m_cur)
1021 {
1022 case '#' :
1023 {
1024 AddMacroNode( m_cur );
1025 continue;
1026 }
1027
1028 case ':' :
1029 {
1030 skip_token( m_cur );
1031 continue;
1032 }
1033
1034 case ';' :
1035 {
1036 skip_token( m_cur );
1037 continue;
1038 }
1039
1040 case ')' :
1041 {
1042 skip_token( m_cur );
1043 continue;
1044 }
1045
1046 case '=' :
1047 {
1048 skip_token( m_cur );
1049 continue;
1050 }
1051
1052 default: break;
1053 }
1054
1055 // 'const' is a part of the return type, not a keyword here
1056 if ( strncmp(m_cur, "const", 5) != 0 && is_keyword( m_cur ) )
1057 {
1058 // parses, token, if token identifies
1059 // the container context (e.g. class/namespace)
1060 // the corresponding context object is created
1061 // and set as current context
1062
1063 ParseKeyword( m_cur );
1064 continue;
1065 }
1066
1067 if ( *m_cur >= _T('0') && *m_cur <= _T('9') )
1068 {
1069 skip_token( m_cur );
1070 continue;
1071 }
1072
1073 if ( *m_cur == _T('}') )
1074 {
1075 if ( mCurCtxType != SP_CTX_CLASS )
1076 {
1077 // FOR NOW:: disable the below assertion
1078
1079 // DBG:: unexpected closing-bracket found
1080 //ASSERT(0);
1081
1082 skip_token( m_cur ); // just skip it
1083 continue;
1084 }
1085
1086 if ( mpCurCtx->GetType() == SP_CTX_CLASS )
1087 {
1088 int curOfs = ( (m_cur+1) - _gSrcStart );
1089
1090 mpCurCtx->mContextLength = ( curOfs - mpCurCtx->mSrcOffset );
1091 }
1092
1093 --mNestingLevel;
1094
1095 // terminate operation/class/namespace context
1096 // TBD:: check if it's really this type of context
1097
1098 wxASSERT( mpCurCtx );
1099 mpCurCtx = mpCurCtx->GetOutterContext();
1100 wxASSERT( mpCurCtx );
1101
1102 if ( mNestingLevel == 0 )
1103 {
1104
1105 mCurCtxType = SP_CTX_FILE;
1106
1107 // not-nested class delclaration finished,
1108 // rest template flag in any case
1109 mIsTemplate = 0;
1110 }
1111
1112 skip_token( m_cur );
1113 continue;
1114 }
1115
1116 bool isAMacro = false;
1117
1118 if ( is_function( m_cur, isAMacro ) )
1119 {
1120 if ( isAMacro )
1121 {
1122 skip_token( m_cur );
1123 continue;
1124 }
1125
1126 char* savedPos = m_cur;
1127
1128 int tmpLnNo;
1129 store_line_no( tmpLnNo );
1130 wxUnusedVar( tmpLnNo );
1131
1132 isAMacro = false;
1133
1134 if ( !ParseNameAndRetVal( m_cur, isAMacro ) )
1135 {
1136 if ( !isAMacro )
1137 {
1138 m_cur = savedPos;
1139 SkipFunction( m_cur );
1140 }
1141 continue;
1142 }
1143
1144 if ( !ParseArguments( m_cur ) )
1145 {
1146 // failure while parsing arguments,
1147 // remove enclosing operation context
1148
1149 spContext* pFailed = mpCurCtx;
1150 mpCurCtx = mpCurCtx->GetOutterContext();
1151 mpCurCtx->RemoveChild( pFailed );
1152
1153 skip_to_eol( m_cur );
1154 //m_cur = savedPos;
1155 }
1156 else
1157 {
1158 // otherwise, successfully close operation context:
1159
1160 clear_commets_queue();
1161
1162 SkipFunctionBody( m_cur );
1163
1164 mpCurCtx = mpCurCtx->GetOutterContext();
1165
1166 // DBG::
1167 wxASSERT( mpCurCtx );
1168
1169 }
1170 }
1171 else // otherwise it's declaration of a variable;
1172 {
1173 // now, the cursor point to the end of statement (';' token)
1174
1175 if ( mCurCtxType != SP_CTX_CLASS )
1176 {
1177 // non-class members are ignored
1178
1179 skip_token( m_cur ); // skip the end of statement
1180 continue;
1181 }
1182
1183 ParseMemberVar( m_cur );
1184 }
1185
1186 } while( 1 );
1187 }
1188
1189 void CJSourceParser::AttachComments( spContext& ctx, wxChar* cur )
1190 {
1191 if ( !mCommentsOn ) return;
1192
1193 MCommentListT& lst = ctx.GetCommentList();
1194
1195 wxChar* prevComEnd = 0;
1196
1197 int tmpLnNo;
1198 store_line_no( tmpLnNo );
1199
1200 // attach comments which were found before the given context
1201
1202 for( int i = 0; i != _gCQSize; ++i )
1203 {
1204 spComment* pComment = new spComment();
1205 lst.push_back( pComment );
1206
1207 // find the end of comment
1208 wxChar* start = _gCommentsQueue[i];
1209
1210 pComment->mIsMultiline = ( *(start+1) == _T('*') );
1211
1212 // first comment in the queue and multiline
1213 // comments are always treated as a begining
1214 // of the new paragraph in the comment text
1215
1216 if ( i == 0 )
1217 {
1218 pComment->mStartsPar = true;
1219 }
1220 else if ( pComment->mIsMultiline )
1221 {
1222 pComment->mStartsPar = true;
1223 }
1224 else
1225 {
1226 // find out wheather there is a new-line
1227 // between to adjecent comments
1228
1229 wxChar* prevLine = start;
1230 skip_to_prev_line(prevLine);
1231
1232 if ( prevLine >= prevComEnd )
1233 pComment->mStartsPar = true;
1234 else
1235 pComment->mStartsPar = false;
1236 }
1237
1238 prevComEnd = set_comment_text( pComment->m_Text, start );
1239 }
1240
1241 // attach comments which are at the end of the line
1242 // of the given context (if any)
1243
1244 if ( skip_to_next_comment_in_the_line( cur ) )
1245 {
1246 spComment* pComment = new spComment();
1247 lst.push_back( pComment );
1248
1249 set_comment_text( pComment->m_Text, cur );
1250
1251 pComment->mStartsPar = 1;
1252 pComment->mIsMultiline = ( *(cur+1) == _T('*') );
1253
1254 // mark this comment, so that it would not
1255 // get in the comments list of the next context
1256 _gLastSuppresedComment = cur;
1257 }
1258
1259 restore_line_no( tmpLnNo );
1260
1261 clear_commets_queue();
1262 }
1263
1264 void CJSourceParser::AddMacroNode( wxChar*& cur )
1265 {
1266 wxChar* start = cur;
1267
1268 int lineNo = get_line_no();
1269
1270 skip_preprocessor_dir( cur );
1271
1272 int tmpLnNo;
1273 store_line_no( tmpLnNo );
1274
1275 if ( !mMacrosOn ) return;
1276
1277 spPreprocessorLine* pPL = new spPreprocessorLine();
1278 pPL->mSrcLineNo = lineNo;
1279
1280 AttachComments( *pPL, cur );
1281
1282 get_string_between( start, cur, &pPL->m_Line );
1283
1284 ++start; // skip '#'
1285 get_next_token( start );
1286
1287 pPL->mDefType = SP_PREP_DEF_OTHER;
1288
1289 // if we found a definition or redefinition,
1290 // determine the type exactly and assign
1291 // a name to the context
1292
1293 if ( *start == _T('d') )
1294 {
1295 if ( cmp_tokens_fast( start, _T("define"), 6 ) )
1296 {
1297 char* tok = start+6;
1298
1299 get_next_token( tok );
1300
1301 pPL->m_Name = get_token_str( tok );
1302
1303 skip_token( tok );
1304 get_next_token( tok);
1305
1306
1307 if ( tok > cur )
1308 pPL->mDefType = SP_PREP_DEF_DEFINE_SYMBOL;
1309 else
1310 pPL->mDefType = SP_PREP_DEF_REDEFINE_SYMBOL;
1311 }
1312 }
1313 else if ( *start == _T('i') )
1314 {
1315 if ( cmp_tokens_fast( start, _T("include"), 7 ) )
1316 {
1317 pPL->mDefType = SP_PREP_DEF_INCLUDE_FILE;
1318 }
1319 else if ( *++start == _T('f') )
1320 {
1321 // either "#if" or "#ifdef"
1322 cur = start;
1323 skip_token( cur );
1324 get_next_token( cur );
1325
1326 wxString condition = get_token_str( cur );
1327
1328 // currently, everything except '0' is true
1329 if ( condition == _T("0") ) {
1330 // skip until the following else or enif
1331 while ( cur < _gSrcEnd ) {
1332 skip_to_eol( cur );
1333 skip_eol( cur );
1334
1335 get_next_token( cur );
1336 if ( *cur++ == _T('#') && *cur == _T('e') )
1337 break;
1338 }
1339 }
1340
1341 // TODO parse the condition...
1342 }
1343 }
1344 else if ( cmp_tokens_fast( start, _T("else"), 4 ) )
1345 {
1346 // skip until "#endif"
1347 while ( cur < _gSrcEnd ) {
1348 skip_to_eol( cur );
1349 skip_eol( cur );
1350
1351 get_next_token( cur );
1352 if ( *cur++ == _T('#') && cmp_tokens_fast( cur, "endif", 5 ) )
1353 break;
1354 }
1355 }
1356
1357 mpCurCtx->AddMember( pPL );
1358
1359 skip_to_eol( cur );
1360 skip_eol( cur );
1361
1362 restore_line_no( tmpLnNo );
1363
1364 clear_commets_queue();
1365 }
1366
1367 void CJSourceParser::ParseKeyword( char*& cur )
1368 {
1369 // analyze token, which identifies the begining of a new context
1370
1371 if ( CheckVisibilty( cur ) )
1372 {
1373 skip_token( cur );
1374 return;
1375 }
1376
1377 if ( is_class_token( cur ) )
1378 {
1379 if ( is_forward_decl( cur ) )
1380 {
1381 // forward declarations are ignored;
1382 skip_token( cur );
1383 return;
1384 }
1385
1386 if ( mNestingLevel == 0 )
1387 {
1388 // change context form global class context
1389 mCurCtxType = SP_CTX_CLASS;
1390 }
1391
1392 ++mNestingLevel;
1393
1394 // add information about new class (name, inheritance, etc)
1395 AddClassNode( cur );
1396
1397 // the default visiblity for class members is 'private'
1398 mCurVis = SP_VIS_PRIVATE;
1399
1400 return;
1401 }
1402
1403 size_t len = get_token_len( cur );
1404
1405 if ( cmp_tokens_fast( cur, "typedef", len ) )
1406 {
1407 skip_token(cur);
1408 get_next_token(cur);
1409
1410 if ( cmp_tokens_fast( cur, "struct", len ) ||
1411 cmp_tokens_fast( cur, "union", len ) ||
1412 cmp_tokens_fast( cur, "class", len )
1413 )
1414 {
1415 if ( mNestingLevel == 0 )
1416 {
1417 // change context form global class context
1418 mCurCtxType = SP_CTX_CLASS;
1419 }
1420
1421 ++mNestingLevel;
1422
1423 // add information about new class (name, inheritance, etc)
1424 AddClassNode( cur );
1425
1426 // the default visiblity for class members is 'private'
1427 mCurVis = SP_VIS_PRIVATE;
1428
1429 return;
1430
1431 // FOR NOW:: typedef struct, etc are also ignored
1432 //skip_scope_block( cur );
1433 }
1434
1435 if ( cmp_tokens_fast( cur, "enum", len ) )
1436 {
1437 AddEnumNode( cur );
1438 return;
1439 }
1440
1441 AddTypeDefNode( cur );
1442
1443 return;
1444 }
1445
1446 if ( cmp_tokens_fast( cur, "enum", len ) )
1447 {
1448 AddEnumNode( cur );
1449 return;
1450 }
1451
1452 if ( cmp_tokens_fast( cur, "extern", len ) )
1453 {
1454 // extern's are ignored (both extern "C" and extern vars)
1455 while ( *cur != '{' &&
1456 *cur != ';' )
1457 {
1458 skip_token( cur );
1459 get_next_token( cur );
1460 }
1461 return;
1462
1463 }
1464 if ( cmp_tokens_fast( cur, "enum", len ) )
1465 {
1466 // enumeration blocks are ignored
1467
1468 skip_scope_block( cur );
1469
1470 get_next_token( cur );
1471 skip_token( cur ); // skip ';' token;
1472 return;
1473 }
1474
1475 if ( cmp_tokens_fast( cur, "package", len ) )
1476 {
1477 // packages are ignored
1478 skip_statement( cur );
1479 return;
1480 };
1481
1482 if ( cmp_tokens_fast( cur, "import", len ) )
1483 {
1484 // import statements are ignored
1485 skip_statement( cur );
1486 return;
1487 }
1488
1489 if ( cmp_tokens_fast( cur, "virtual", len ) )
1490 {
1491 // probably the virtual method is in front of us;
1492 mIsVirtual = 1;
1493 skip_token( cur );
1494 return;
1495 }
1496
1497 if ( cmp_tokens_fast( cur, "template", len ) )
1498 {
1499 mIsTemplate = 1;
1500 skip_tempalate_statement( cur );
1501 return;
1502 }
1503
1504 if ( cmp_tokens_fast( cur, "friend", len ) )
1505 {
1506 skip_statement( cur );
1507 return;
1508 }
1509
1510 // ingnore "unsigificant" tokens (i.e. which do not
1511 // affect the current parsing context)
1512
1513 skip_token( cur );
1514 }
1515
1516 bool CJSourceParser::ParseNameAndRetVal( char*& cur, bool& isAMacro )
1517 {
1518 isAMacro = false;
1519
1520 // FOR NOW:: all functions in the global
1521 // scope are ignored
1522
1523 int lineNo = get_line_no();
1524
1525 char* start = cur;
1526
1527 bool isVirtual = false;
1528 while( *cur != '(' )
1529 {
1530 if ( get_token_str( cur ) == "virtual" )
1531 isVirtual = true;
1532
1533 skip_token( cur );
1534 if ( !get_next_token( cur ) ) return false;
1535 }
1536
1537 char* bracketPos = cur;
1538 char* savedPos = cur + 1;
1539
1540 int tmpLnNo;
1541 store_line_no( tmpLnNo );
1542
1543 // skip gap between function name and start of paramters list
1544 while ( *(cur-1) == ' ' )
1545 --cur;
1546
1547 // check if it's not a macro, and let plugin handle it, if so
1548
1549 if ( mpPlugin )
1550 {
1551 skip_token_back( cur );
1552
1553 char* tmp = cur;
1554
1555 if ( mpPlugin->CanUnderstandContext( tmp, _gSrcEnd, mpCurCtx ) )
1556 {
1557 cur = tmp;
1558
1559 mpPlugin->ParseContext( _gSrcStart, cur, _gSrcEnd, mpCurCtx );
1560
1561 isAMacro = true;
1562
1563 return false;
1564 }
1565 }
1566
1567 spOperation* pOp = new spOperation();
1568
1569 pOp->mSrcLineNo = lineNo;
1570 pOp->mSrcOffset = int( start - _gSrcStart );
1571 pOp->mHeaderLength = int( bracketPos - start );
1572 if ( mpCurCtx->GetContextType() == SP_CTX_CLASS )
1573 pOp->mScope = mpCurCtx->m_Name;
1574
1575 mpCurCtx->AddMember( pOp );
1576 pOp->mVisibility = mCurVis;
1577 pOp->mIsVirtual = isVirtual;
1578
1579 // add comments about operation
1580 AttachComments( *pOp, cur );
1581
1582 // go backwards to method name
1583 skip_token_back( cur );
1584
1585 pOp->m_Name = get_token_str( cur );
1586
1587 // checker whether it's not an operator
1588 char chFirst = *pOp->m_Name.c_str();
1589 if ( !isalpha(chFirst) && chFirst != '_' && chFirst != '~' ) {
1590 // skip 'operator'
1591 skip_next_token_back( cur );
1592 skip_token_back( cur );
1593
1594 wxString lastToken = get_token_str( cur );
1595 if ( lastToken == "operator" ) {
1596 lastToken += pOp->m_Name;
1597 pOp->m_Name = lastToken;
1598 }
1599 else {
1600 // ok, it wasn't an operator after all
1601 skip_token( cur );
1602 }
1603 }
1604 else if ( pOp->m_Name == "operator" ) {
1605 skip_token( cur );
1606 get_next_token( cur );
1607 wxString oper = get_token_str( cur );
1608
1609 pOp->m_Name += oper;
1610 }
1611
1612 // go backwards to method return type
1613 skip_next_token_back( cur );
1614
1615 if ( cur >= start )
1616 {
1617 wxString rettype = wxString( start, size_t( cur-start ) );
1618 // FIXME just for now...
1619 wxString::size_type pos = 0;
1620 wxString toerase("WXDLLEXPORT ");
1621 while((pos = rettype.find(toerase, pos)) != wxString::npos)
1622 rettype.erase(pos, toerase.length());
1623 pOp->m_RetType = rettype;
1624 }
1625
1626 arrange_indirection_tokens_between( pOp->m_RetType, pOp->m_Name );
1627
1628 cur = savedPos;
1629 restore_line_no( tmpLnNo );
1630
1631 // now, enter operation context
1632 mpCurCtx = pOp;
1633
1634 return true;
1635 }
1636
1637 bool CJSourceParser::ParseArguments( char*& cur )
1638 {
1639 // DANGER-MACROS::
1640
1641 // now cursor position is right after the first opening bracket
1642 // of the function declaration
1643
1644 char* blocks [16]; // used exclusivelly for iterative "lean out"
1645 // of macros and misc. not-obviouse grammar
1646 // (dirty,, but we cannot do it very nice,
1647 // we're not preprocessor-free C/C++ code)
1648 int blockSizes[16];
1649
1650 do
1651 {
1652 size_t blocksSkipped = 0;
1653
1654 get_next_token( cur );
1655
1656 bool first_blk = true;
1657
1658 while( *cur != ')' && *cur != ',' )
1659 {
1660 blocks[blocksSkipped] = cur;
1661
1662 if ( first_blk )
1663 {
1664 char* prev = cur;
1665 skip_token( cur );
1666
1667 blockSizes[blocksSkipped] = size_t(cur-prev);
1668
1669 first_blk = 0;
1670 }
1671 else
1672 blockSizes[blocksSkipped] = skip_block( cur );
1673
1674 get_next_token( cur );
1675 ++blocksSkipped;
1676 }
1677
1678
1679 if ( blocksSkipped == 1 )
1680 {
1681 // check if the empty arg. list stressed with "void" inside
1682 if ( cmp_tokens_fast( blocks[0] , "void", 4 ) )
1683 {
1684 cur++; // skip ')'
1685
1686 break;
1687 }
1688
1689 // FIXME:: TBD:: K&R-style function declarations!
1690
1691 // if only one block enclosed, than it's probably
1692 // some macro, there should be at least two blocks,
1693 // one for argument type and another for it's identifier
1694 return false;
1695 }
1696
1697 if ( blocksSkipped == 0 )
1698 {
1699 if ( *cur == 10 ) ++_gLineNo;
1700 ++cur; // skip ')'
1701
1702 break; // function without paramters
1703 }
1704
1705 // we should be in the operation context now
1706 spOperation* pOp = (spOperation*)mpCurCtx;
1707
1708 spParameter* pPar = new spParameter();
1709
1710 pOp->AddMember( pPar );
1711 // FOR NOW:: line number is not exact if argument list is mutiline
1712 pPar->mSrcLineNo = get_line_no();
1713
1714 size_t nameBlock = blocksSkipped - 1;
1715 size_t typeBlock = nameBlock - 1;
1716
1717 // check if default values present
1718 if ( *blocks[typeBlock] == '=' )
1719 {
1720 // expressions like "int = 5" are ignored,
1721 // since name for paramters is required
1722 if ( blocksSkipped == 3 )
1723 {
1724 if ( *cur == ')' )
1725 {
1726 ++cur;
1727 break;
1728 }
1729 else
1730 continue;
1731 }
1732
1733 pPar->m_InitVal = wxString( blocks[nameBlock], blockSizes[nameBlock] );
1734
1735 nameBlock = nameBlock - 2; // skip '=' token and default value block
1736 typeBlock = nameBlock - 1;
1737 }
1738
1739 // attach comments about the parameter
1740 AttachComments( *pPar, blocks[nameBlock] );
1741
1742 // retrieve argument name
1743 pPar->m_Name = wxString( blocks[nameBlock], blockSizes[nameBlock] );
1744
1745 // retreive argument type
1746
1747 size_t len = blockSizes[ typeBlock ];
1748 len = size_t ( (blocks[ typeBlock ] + len) - blocks[ 0 ] );
1749
1750 pPar->m_Type = wxString( blocks[0], len );
1751
1752 arrange_indirection_tokens_between( pPar->m_Type, pPar->m_Name );
1753
1754 if ( *cur == ')' )
1755 {
1756 ++cur;
1757 break;
1758 }
1759
1760 ++cur; // skip comma
1761 get_next_token(cur);
1762
1763 } while(1);
1764
1765 // skip possible whitespace between ')' and following "const"
1766 while ( isspace(*cur) )
1767 cur++;
1768
1769 // check if it was really a function not a macro,
1770 // if so, than it should be terminated with semicolon ';'
1771 // or opening implemenetaton bracket '{'
1772
1773 char* tok = cur;
1774
1775 int tmpLnNo;
1776 store_line_no( tmpLnNo );
1777
1778 bool result = true;
1779
1780 do
1781 {
1782 if ( *tok == '{' || *tok == ';' )
1783 {
1784 restore_line_no(tmpLnNo);
1785 break;
1786 }
1787
1788 // check for unexpected tokens
1789 if ( *tok == '=' || *tok == '0' )
1790 {
1791 skip_token(tok);
1792 if ( !get_next_token(tok) ) return false;
1793 continue;
1794 }
1795
1796 if ( *tok == '}' ) return false;
1797
1798 // if initialization list found
1799 if ( *tok == ':' )
1800 {
1801 restore_line_no(tmpLnNo);
1802 break;
1803 }
1804
1805 if ( cmp_tokens_fast( tok, "const", 5 ) )
1806 {
1807 ((spOperation*)mpCurCtx)->mIsConstant = true;
1808
1809 skip_token(tok);
1810 if ( !get_next_token(tok) ) return false;
1811 continue;
1812 }
1813
1814 if ( CheckVisibilty( tok ) ) return false;
1815
1816 // if next context found
1817 if ( is_keyword( tok ) ) return false;
1818
1819 skip_token(tok);
1820 if ( !get_next_token(tok) ) return false;
1821
1822 } while(1);
1823
1824 return result;
1825 }
1826
1827 void CJSourceParser::ParseMemberVar( char*& cur )
1828 {
1829 MMemberListT& members = mpCurCtx->GetMembers();
1830
1831 bool firstMember = true;
1832
1833 wxString type;
1834
1835 // jump to the end of statement
1836 // and start collecting same-type varibles
1837 // back-to-front towards the type identifier
1838
1839 skip_statement( cur );
1840 char* savedPos = cur;
1841
1842 int tmpLnNo;
1843 store_line_no( tmpLnNo );
1844
1845 --cur; // rewind back to ';'
1846
1847 do
1848 {
1849 spAttribute* pAttr = new spAttribute();
1850 // FOR NOW:: line not is not exact, if member declaration is multiline
1851 pAttr->mSrcLineNo = get_line_no();
1852
1853 mpCurCtx->AddMember( pAttr );
1854 pAttr->mVisibility = mCurVis;
1855
1856 pAttr->mIsConstant = 0;
1857
1858 if ( firstMember )
1859 {
1860 firstMember = 0;
1861 }
1862
1863 skip_token_back( cur );
1864
1865 // attach comments about the attribute
1866 AttachComments( *pAttr, cur );
1867
1868 pAttr->m_Name = get_token_str( cur );
1869
1870 // guessing that this going to be variable type
1871 skip_next_token_back( cur );
1872 skip_token_back( cur );
1873
1874 pAttr->m_Type = get_token_str( cur );
1875
1876 // if comma, than variable list continues
1877 // otherwise the variable type reached - stop
1878
1879 if ( *cur == _T('=') )
1880 {
1881 // yes, we've mistaken, it was not a identifier,
1882 // but it's default value
1883 pAttr->m_InitVal = pAttr->m_Name;
1884
1885 // skip default value and '=' symbol
1886 skip_next_token_back( cur );
1887 skip_token_back( cur );
1888
1889 pAttr->m_Name = get_token_str( cur );
1890
1891 skip_next_token_back( cur );
1892 skip_token_back( cur );
1893 }
1894
1895 if ( *cur != ',' )
1896 {
1897 type = get_token_str( cur );
1898 break;
1899 }
1900
1901 } while(1);
1902
1903 size_t first = 0;
1904
1905 // set up types for all collected (same-type) attributes;
1906 while ( first != members.size() - 1 )
1907 {
1908 spAttribute* pAttr = members[first++]->CastToAttribute();
1909 if ( !pAttr )
1910 continue;
1911
1912 if ( pAttr->m_Type.empty() )
1913 pAttr->m_Type = type;
1914 pAttr->mVisibility = mCurVis;
1915
1916 if ( !pAttr->m_Name.empty() )
1917 arrange_indirection_tokens_between( pAttr->m_Type, pAttr->m_Name );
1918 }
1919
1920 cur = savedPos;
1921 restore_line_no( tmpLnNo );
1922
1923 clear_commets_queue();
1924
1925
1926 }
1927
1928 void CJSourceParser::SkipFunction( char*& cur )
1929 {
1930 while ( *cur != '(' && cur < _gSrcEnd )
1931 {
1932 if (*cur == 10 ) ++_gLineNo;
1933 ++cur;
1934 }
1935
1936 skip_next_token_back( cur ); // go back and skip function identifier
1937 skip_token_back( cur ); // go back and skip return type
1938
1939 skip_block( cur ); // now, go ahead and skip whole declaration
1940
1941 SkipFunctionBody( cur );
1942
1943 }
1944
1945 void CJSourceParser::SkipFunctionBody( char*& cur )
1946 {
1947 // FIXME:: check for comments and quoted stirngs here
1948
1949 bool hasDefinition = false;
1950
1951 while( *cur != '{' && *cur != ';' )
1952 {
1953 if (*cur == 10 ) ++_gLineNo;
1954 ++cur;
1955 }
1956
1957 if ( *cur == ';' )
1958 {
1959 ++cur;
1960 }
1961 else
1962 {
1963 hasDefinition = true;
1964
1965 skip_scope_block( cur ); // skip the whole imp.
1966 }
1967
1968 if ( mpCurCtx->GetType() == SP_CTX_OPERATION )
1969 {
1970 spOperation& op = *((spOperation*)mpCurCtx);
1971
1972 int curOfs = int ( cur - _gSrcStart );
1973
1974 op.mContextLength = curOfs - mpCurCtx->mSrcOffset;
1975
1976 op.mHasDefinition = hasDefinition;
1977
1978 // separate scope resolution token from the name of operation
1979
1980 for( size_t i = 0; i != op.m_Name.length(); ++i )
1981 {
1982 if ( op.m_Name[i] == ':' && op.m_Name[i+1] == ':' )
1983 {
1984 wxString unscoped( op.m_Name, i+2, op.m_Name.length() - ( i + 2 ) );
1985
1986 op.mScope = wxString( op.m_Name, 0, i );
1987
1988 op.m_Name = unscoped;
1989
1990 break;
1991 }
1992 }
1993 }
1994 }
1995
1996 bool CJSourceParser::CheckVisibilty( char*& cur )
1997 {
1998 size_t len = get_token_len( cur );
1999
2000 if ( cmp_tokens_fast( cur, "public:", len ) )
2001 {
2002 mCurVis = SP_VIS_PUBLIC;
2003 return true;
2004 }
2005
2006 if ( cmp_tokens_fast( cur, "protected:", len ) )
2007 {
2008 mCurVis = SP_VIS_PROTECTED;
2009 return true;
2010 }
2011
2012 if ( cmp_tokens_fast( cur, "private:", len ) )
2013 {
2014 mCurVis = SP_VIS_PRIVATE;
2015 return true;
2016 }
2017
2018 return false;
2019 }
2020
2021 void CJSourceParser::AddClassNode( char*& cur )
2022 {
2023 char* ctxStart = cur;
2024
2025 wxString classkeyword = get_token_str( cur );
2026
2027 skip_token( cur ); // skip 'class' keyword
2028 if ( !get_next_token( cur ) ) return;
2029
2030 // in C++
2031 if ( *cur == ':' )
2032 {
2033 skip_token( cur );
2034 get_next_token( cur );
2035 }
2036
2037 // by default all class members are private
2038 mCurVis = SP_VIS_PRIVATE;
2039
2040 spClass* pClass = new spClass();
2041 if ( classkeyword == "class" )
2042 pClass->mClassSubType = SP_CLTYPE_CLASS;
2043 else if ( classkeyword == "struct" ) {
2044 pClass->mClassSubType = SP_CLTYPE_STRUCTURE;
2045
2046 mCurVis = SP_VIS_PUBLIC;
2047 }
2048 else if ( classkeyword == "union" ) {
2049 pClass->mClassSubType = SP_CLTYPE_UNION;
2050
2051 mCurVis = SP_VIS_PUBLIC;
2052 }
2053 else if ( classkeyword == "interface" )
2054 pClass->mClassSubType = SP_CLTYPE_INTERFACE;
2055 else {
2056 pClass->mClassSubType = SP_CLTYPE_INVALID;
2057
2058 wxFAIL_MSG("unknown class keyword");
2059 }
2060
2061 mpCurCtx->AddMember( pClass );
2062
2063 // attach comments about the class
2064 AttachComments( *pClass, cur );
2065
2066 pClass->mSrcLineNo = get_line_no();
2067
2068 pClass->mSrcOffset = int( ctxStart - _gSrcStart );
2069
2070 char* nameTok = cur;
2071 pClass->m_Name = get_token_str( cur );
2072
2073 bool isDerived = 0;
2074
2075 // DANGER-MACROS::
2076
2077 do
2078 {
2079 skip_token( cur );
2080 if ( !get_next_token( cur ) ) return;
2081
2082 if ( *cur == ':' )
2083 {
2084 isDerived = 1;
2085
2086 char* tok = cur;
2087
2088 int tmpLn;
2089 store_line_no( tmpLn );
2090
2091 skip_next_token_back( tok );
2092 skip_token_back( tok );
2093
2094 restore_line_no( tmpLn );
2095
2096 // class name should precend ':' colon, thus
2097 // the one which was captured before was
2098 // proablty something else (like __dllexport MyClass : ... )
2099
2100 if ( nameTok != tok )
2101 {
2102 pClass->m_Name = get_token_str( tok );
2103 }
2104
2105 }
2106
2107 if ( *cur == '{' )
2108 break;
2109
2110 if ( *cur == ',' )
2111 continue;
2112
2113 size_t len = get_token_len( cur );
2114
2115 // skip neglectable C++ modifieres
2116 if ( cmp_tokens_fast( cur, "public", len ) )
2117 continue;
2118
2119 if ( cmp_tokens_fast( cur, "protected", len ) )
2120 continue;
2121
2122 if ( cmp_tokens_fast( cur, "private", len ) )
2123 continue;
2124
2125 if ( cmp_tokens_fast( cur, "virtual", len ) )
2126 continue;
2127
2128 // skip neglectable JAVA modifieres
2129
2130 if ( cmp_tokens_fast( cur, "extends", len ) )
2131 {
2132 isDerived = 1;
2133 continue;
2134 }
2135
2136 if ( cmp_tokens_fast( cur, "implements", len ) )
2137 {
2138 isDerived = 1;
2139 continue;
2140 }
2141
2142 // all we need to know is superclass or interface
2143
2144 char* tok = cur;
2145 int tmpLn;
2146 store_line_no( tmpLn );
2147
2148 skip_token(tok);
2149 get_next_token(tok);
2150
2151 restore_line_no( tmpLn );
2152
2153 if ( *tok != ':' && *cur != ':' )
2154
2155 pClass->m_SuperClassNames.push_back( wxString( cur, len ) );
2156
2157 } while(1);
2158
2159 if ( !isDerived )
2160 {
2161 int tmpLn;
2162 store_line_no( tmpLn );
2163
2164 while ( pClass->m_SuperClassNames.size() )
2165
2166 pClass->m_SuperClassNames.erase( &pClass->m_SuperClassNames[0] );
2167
2168 char* tok = cur;
2169
2170 // some non-obviouse token was following "class" keyword -
2171 // we've confused it with class name - thus now we're reverting this mistake
2172
2173 skip_next_token_back( tok );
2174 skip_token_back( tok );
2175
2176 pClass->m_Name = get_token_str( tok );
2177
2178 restore_line_no( tmpLn );
2179 }
2180
2181
2182 ++cur; // skip opening curly brace
2183
2184 pClass->mHeaderLength = ( cur - ctxStart );
2185
2186 // now, enter the class context
2187 mpCurCtx = pClass;
2188
2189 clear_commets_queue();
2190 }
2191
2192 void CJSourceParser::AddEnumNode( wxChar*& cur )
2193 {
2194 // now the cursor is at "enum" keyword
2195 wxChar* start = cur;
2196
2197 spEnumeration* pEnum = new spEnumeration();
2198 mpCurCtx->AddMember( pEnum );
2199
2200 pEnum->mSrcLineNo = get_line_no();
2201
2202
2203 AttachComments( *pEnum, cur );
2204
2205 skip_token( cur );
2206 if ( !get_next_token( cur ) ) return;
2207
2208 // check if enumeration has got it's identifier
2209 if ( *cur != '{' )
2210 {
2211 pEnum->m_Name = get_token_str( cur );
2212 }
2213
2214 if ( !skip_imp_block( cur ) ) return;
2215
2216 get_string_between( start, cur, &pEnum->m_EnumContent );
2217
2218 if ( get_next_token(cur) )
2219 {
2220 // check if the identifier if after the {...} block
2221 if ( *cur != ';' )
2222
2223 pEnum->m_Name = get_token_str( cur );
2224 }
2225
2226 clear_commets_queue();
2227 }
2228
2229 void CJSourceParser::AddTypeDefNode( wxChar*& cur )
2230 {
2231 // now the cursor at the token next to "typedef" keyword
2232
2233 if ( !get_next_token(cur) ) return;
2234
2235 wxChar* start = cur;
2236
2237 spTypeDef* pTDef = new spTypeDef();
2238 mpCurCtx->AddMember( pTDef );
2239
2240 pTDef->mSrcLineNo = get_line_no();
2241
2242 AttachComments( *pTDef, cur );
2243
2244 skip_statement( cur );
2245
2246 int tmpLnNo;
2247 store_line_no( tmpLnNo );
2248
2249 wxChar* tok = cur-1;
2250 skip_next_token_back( tok );
2251
2252 wxChar* nameEnd = tok;
2253
2254 skip_token_back( tok );
2255
2256 wxChar* nameStart = tok;
2257
2258 skip_next_token_back( tok );
2259
2260 wxChar* typeEnd = tok;
2261
2262 // check if it's function prototype
2263 if ( *nameStart == ')' )
2264 {
2265 typeEnd = nameStart+1;
2266
2267 // skip argument list
2268 while ( *nameStart != '(' ) --nameStart;
2269
2270 // skip to function type definition
2271 while ( *nameStart != ')' ) --nameStart;
2272
2273 skip_next_token_back( nameStart );
2274
2275 nameEnd = nameStart;
2276
2277 skip_token_back( nameStart );
2278
2279 if ( *nameStart == '*' ) ++nameStart;
2280 }
2281
2282 get_string_between( start, typeEnd, &pTDef->m_OriginalType );
2283
2284 get_string_between( nameStart, nameEnd, &pTDef->m_Name );
2285
2286 clear_commets_queue();
2287
2288 restore_line_no( tmpLnNo );
2289 }