1 // Scintilla source code edit control
3 ** Text document that handles notifications, DBCS, styling, words and end of line.
5 // Copyright 1998-2003 by Neil Hodgson <neilh@scintilla.org>
6 // The License.txt file describes the conditions under which this software may be distributed.
15 #include "Scintilla.h"
17 #include "CellBuffer.h"
// Whitespace test for a single byte: true for space and for the control
// range 0x09..0x0d inclusive.
// This is ASCII specific but is safe with chars >= 0x80: the parameter is
// unsigned, so high bytes compare above 0x0d and are rejected.
static inline bool isspacechar(unsigned char ch) {
	return (ch == ' ') || ((ch >= 0x09) && (ch <= 0x0d));
}
// True when ch is a 7-bit character that ispunct() classifies as punctuation.
// Bytes >= 0x80 are rejected before the classifier is consulted, so ispunct()
// is never handed a negative value even where plain char is signed.
static inline bool IsPunctuation(char ch) {
	const unsigned char uch = static_cast<unsigned char>(ch);
	return (uch < 0x80) && ispunct(uch);
}
// True when ch is a 7-bit character that isdigit() classifies as a digit.
// Bytes >= 0x80 are rejected before the classifier is consulted, so isdigit()
// is never handed a negative value even where plain char is signed.
static inline bool IsADigit(char ch) {
	const unsigned char uch = static_cast<unsigned char>(ch);
	return (uch < 0x80) && isdigit(uch);
}
// True when ch is a 7-bit character that islower() classifies as lower case.
// Bytes >= 0x80 are rejected before the classifier is consulted, so islower()
// is never handed a negative value even where plain char is signed.
static inline bool IsLowerCase(char ch) {
	const unsigned char uch = static_cast<unsigned char>(ch);
	return (uch < 0x80) && islower(uch);
}
// True when ch is a 7-bit character that isupper() classifies as upper case.
// Bytes >= 0x80 are rejected before the classifier is consulted, so isupper()
// is never handed a negative value even where plain char is signed.
static inline bool IsUpperCase(char ch) {
	const unsigned char uch = static_cast<unsigned char>(ch);
	return (uch < 0x80) && isupper(uch);
}
42 Document::Document() {
47 eolMode
= SC_EOL_CRLF
;
51 stylingBitsMask
= 0x1F;
53 SetDefaultCharClasses();
57 enteredReadOnlyCount
= 0;
62 backspaceUnindents
= false;
71 Document::~Document() {
72 for (int i
= 0; i
< lenWatchers
; i
++) {
73 watchers
[i
].watcher
->NotifyDeleted(this, watchers
[i
].userData
);
84 // Increase reference count and return its previous value.
85 int Document::AddRef() {
89 // Decrease reference count and return its previous value.
90 // Delete the document if reference count reaches zero.
91 int Document::Release() {
92 int curRefCount
= --refCount
;
98 void Document::SetSavePoint() {
100 NotifySavePoint(true);
103 int Document::AddMark(int line
, int markerNum
) {
104 int prev
= cb
.AddMark(line
, markerNum
);
105 DocModification
mh(SC_MOD_CHANGEMARKER
, LineStart(line
), 0, 0, 0);
110 void Document::DeleteMark(int line
, int markerNum
) {
111 cb
.DeleteMark(line
, markerNum
);
112 DocModification
mh(SC_MOD_CHANGEMARKER
, LineStart(line
), 0, 0, 0);
116 void Document::DeleteMarkFromHandle(int markerHandle
) {
117 cb
.DeleteMarkFromHandle(markerHandle
);
118 DocModification
mh(SC_MOD_CHANGEMARKER
, 0, 0, 0, 0);
122 void Document::DeleteAllMarks(int markerNum
) {
123 cb
.DeleteAllMarks(markerNum
);
124 DocModification
mh(SC_MOD_CHANGEMARKER
, 0, 0, 0, 0);
128 int Document::LineStart(int line
) {
129 return cb
.LineStart(line
);
132 int Document::LineEnd(int line
) {
133 if (line
== LinesTotal() - 1) {
134 return LineStart(line
+ 1);
136 int position
= LineStart(line
+ 1) - 1;
137 // When line terminator is CR+LF, may need to go back one more
138 if ((position
> LineStart(line
)) && (cb
.CharAt(position
- 1) == '\r')) {
145 int Document::LineFromPosition(int pos
) {
146 return cb
.LineFromPosition(pos
);
149 int Document::LineEndPosition(int position
) {
150 return LineEnd(LineFromPosition(position
));
153 int Document::VCHomePosition(int position
) {
154 int line
= LineFromPosition(position
);
155 int startPosition
= LineStart(line
);
156 int endLine
= LineStart(line
+ 1) - 1;
157 int startText
= startPosition
;
158 while (startText
< endLine
&& (cb
.CharAt(startText
) == ' ' || cb
.CharAt(startText
) == '\t' ) )
160 if (position
== startText
)
161 return startPosition
;
166 int Document::SetLevel(int line
, int level
) {
167 int prev
= cb
.SetLevel(line
, level
);
169 DocModification
mh(SC_MOD_CHANGEFOLD
| SC_MOD_CHANGEMARKER
,
170 LineStart(line
), 0, 0, 0);
172 mh
.foldLevelNow
= level
;
173 mh
.foldLevelPrev
= prev
;
179 static bool IsSubordinate(int levelStart
, int levelTry
) {
180 if (levelTry
& SC_FOLDLEVELWHITEFLAG
)
183 return (levelStart
& SC_FOLDLEVELNUMBERMASK
) < (levelTry
& SC_FOLDLEVELNUMBERMASK
);
186 int Document::GetLastChild(int lineParent
, int level
) {
188 level
= GetLevel(lineParent
) & SC_FOLDLEVELNUMBERMASK
;
189 int maxLine
= LinesTotal();
190 int lineMaxSubord
= lineParent
;
191 while (lineMaxSubord
< maxLine
- 1) {
192 EnsureStyledTo(LineStart(lineMaxSubord
+ 2));
193 if (!IsSubordinate(level
, GetLevel(lineMaxSubord
+ 1)))
197 if (lineMaxSubord
> lineParent
) {
198 if (level
> (GetLevel(lineMaxSubord
+ 1) & SC_FOLDLEVELNUMBERMASK
)) {
199 // Have chewed up some whitespace that belongs to a parent so seek back
200 if (GetLevel(lineMaxSubord
) & SC_FOLDLEVELWHITEFLAG
) {
205 return lineMaxSubord
;
208 int Document::GetFoldParent(int line
) {
209 int level
= GetLevel(line
);
210 int lineLook
= line
- 1;
211 while ((lineLook
> 0) && (
212 (!(GetLevel(lineLook
) & SC_FOLDLEVELHEADERFLAG
)) ||
213 ((GetLevel(lineLook
) & SC_FOLDLEVELNUMBERMASK
) >= level
))
217 if ((GetLevel(lineLook
) & SC_FOLDLEVELHEADERFLAG
) &&
218 ((GetLevel(lineLook
) & SC_FOLDLEVELNUMBERMASK
) < level
)) {
225 int Document::ClampPositionIntoDocument(int pos
) {
226 return Platform::Clamp(pos
, 0, Length());
229 bool Document::IsCrLf(int pos
) {
232 if (pos
>= (Length() - 1))
234 return (cb
.CharAt(pos
) == '\r') && (cb
.CharAt(pos
+ 1) == '\n');
// Size basis for the scratch buffers that hold the bytes of one DBCS character;
// those buffers are declared with one extra byte beyond this value.
static const int maxBytesInDBCSCharacter = 5;
239 int Document::LenChar(int pos
) {
242 } else if (IsCrLf(pos
)) {
244 } else if (SC_CP_UTF8
== dbcsCodePage
) {
245 unsigned char ch
= static_cast<unsigned char>(cb
.CharAt(pos
));
249 if (ch
>= (0x80 + 0x40 + 0x20))
251 int lengthDoc
= Length();
252 if ((pos
+ len
) > lengthDoc
)
253 return lengthDoc
-pos
;
256 } else if (dbcsCodePage
) {
257 char mbstr
[maxBytesInDBCSCharacter
+1];
259 for (i
=0; i
<Platform::DBCSCharMaxLength(); i
++) {
260 mbstr
[i
] = cb
.CharAt(pos
+i
);
263 return Platform::DBCSCharLength(dbcsCodePage
, mbstr
);
269 // Normalise a position so that it is not halfway through a two byte character.
270 // This can occur in two situations -
271 // When lines are terminated with \r\n pairs which should be treated as one character.
272 // When displaying DBCS text such as Japanese.
273 // If moving, move the position in the indicated direction.
274 int Document::MovePositionOutsideChar(int pos
, int moveDir
, bool checkLineEnd
) {
275 //Platform::DebugPrintf("NoCRLF %d %d\n", pos, moveDir);
276 // If out of range, just return minimum/maximum value.
282 // assert pos > 0 && pos < Length()
283 if (checkLineEnd
&& IsCrLf(pos
- 1)) {
290 // Not between CR and LF
293 if (SC_CP_UTF8
== dbcsCodePage
) {
294 unsigned char ch
= static_cast<unsigned char>(cb
.CharAt(pos
));
295 while ((pos
> 0) && (pos
< Length()) && (ch
>= 0x80) && (ch
< (0x80 + 0x40))) {
296 // ch is a trail byte
301 ch
= static_cast<unsigned char>(cb
.CharAt(pos
));
304 // Anchor DBCS calculations at start of line because start of line can
305 // not be a DBCS trail byte.
306 int posCheck
= LineStart(LineFromPosition(pos
));
307 while (posCheck
< pos
) {
308 char mbstr
[maxBytesInDBCSCharacter
+1];
310 for(i
=0;i
<Platform::DBCSCharMaxLength();i
++) {
311 mbstr
[i
] = cb
.CharAt(posCheck
+i
);
315 int mbsize
= Platform::DBCSCharLength(dbcsCodePage
, mbstr
);
316 if (posCheck
+ mbsize
== pos
) {
318 } else if (posCheck
+ mbsize
> pos
) {
320 return posCheck
+ mbsize
;
333 void Document::ModifiedAt(int pos
) {
338 // Document only modified by gateways DeleteChars, InsertStyledString, Undo, Redo, and SetStyleAt.
339 // SetStyleAt does not change the persistent state of a document
341 // Unlike Undo, Redo, and InsertStyledString, the pos argument is a cell number not a char number
342 bool Document::DeleteChars(int pos
, int len
) {
345 if ((pos
+ len
) > Length())
347 if (cb
.IsReadOnly() && enteredReadOnlyCount
== 0) {
348 enteredReadOnlyCount
++;
349 NotifyModifyAttempt();
350 enteredReadOnlyCount
--;
352 if (enteredCount
!= 0) {
356 if (!cb
.IsReadOnly()) {
359 SC_MOD_BEFOREDELETE
| SC_PERFORMED_USER
,
362 int prevLinesTotal
= LinesTotal();
363 bool startSavePoint
= cb
.IsSavePoint();
364 const char *text
= cb
.DeleteChars(pos
* 2, len
* 2);
365 if (startSavePoint
&& cb
.IsCollectingUndo())
366 NotifySavePoint(!startSavePoint
);
367 if ((pos
< Length()) || (pos
== 0))
373 SC_MOD_DELETETEXT
| SC_PERFORMED_USER
,
375 LinesTotal() - prevLinesTotal
, text
));
379 return !cb
.IsReadOnly();
382 bool Document::InsertStyledString(int position
, char *s
, int insertLength
) {
383 if (cb
.IsReadOnly() && enteredReadOnlyCount
== 0) {
384 enteredReadOnlyCount
++;
385 NotifyModifyAttempt();
386 enteredReadOnlyCount
--;
388 if (enteredCount
!= 0) {
392 if (!cb
.IsReadOnly()) {
395 SC_MOD_BEFOREINSERT
| SC_PERFORMED_USER
,
396 position
/ 2, insertLength
/ 2,
398 int prevLinesTotal
= LinesTotal();
399 bool startSavePoint
= cb
.IsSavePoint();
400 const char *text
= cb
.InsertString(position
, s
, insertLength
);
401 if (startSavePoint
&& cb
.IsCollectingUndo())
402 NotifySavePoint(!startSavePoint
);
403 ModifiedAt(position
/ 2);
406 SC_MOD_INSERTTEXT
| SC_PERFORMED_USER
,
407 position
/ 2, insertLength
/ 2,
408 LinesTotal() - prevLinesTotal
, text
));
412 return !cb
.IsReadOnly();
415 int Document::Undo() {
417 if (enteredCount
== 0) {
419 bool startSavePoint
= cb
.IsSavePoint();
420 int steps
= cb
.StartUndo();
421 //Platform::DebugPrintf("Steps=%d\n", steps);
422 for (int step
= 0; step
< steps
; step
++) {
423 int prevLinesTotal
= LinesTotal();
424 const Action
&action
= cb
.GetUndoStep();
425 if (action
.at
== removeAction
) {
426 NotifyModified(DocModification(
427 SC_MOD_BEFOREINSERT
| SC_PERFORMED_UNDO
, action
));
429 NotifyModified(DocModification(
430 SC_MOD_BEFOREDELETE
| SC_PERFORMED_UNDO
, action
));
432 cb
.PerformUndoStep();
433 int cellPosition
= action
.position
/ 2;
434 ModifiedAt(cellPosition
);
435 newPos
= cellPosition
;
437 int modFlags
= SC_PERFORMED_UNDO
;
438 // With undo, an insertion action becomes a deletion notification
439 if (action
.at
== removeAction
) {
440 newPos
+= action
.lenData
;
441 modFlags
|= SC_MOD_INSERTTEXT
;
443 modFlags
|= SC_MOD_DELETETEXT
;
445 if (step
== steps
- 1)
446 modFlags
|= SC_LASTSTEPINUNDOREDO
;
447 NotifyModified(DocModification(modFlags
, cellPosition
, action
.lenData
,
448 LinesTotal() - prevLinesTotal
, action
.data
));
451 bool endSavePoint
= cb
.IsSavePoint();
452 if (startSavePoint
!= endSavePoint
)
453 NotifySavePoint(endSavePoint
);
459 int Document::Redo() {
461 if (enteredCount
== 0) {
463 bool startSavePoint
= cb
.IsSavePoint();
464 int steps
= cb
.StartRedo();
465 for (int step
= 0; step
< steps
; step
++) {
466 int prevLinesTotal
= LinesTotal();
467 const Action
&action
= cb
.GetRedoStep();
468 if (action
.at
== insertAction
) {
469 NotifyModified(DocModification(
470 SC_MOD_BEFOREINSERT
| SC_PERFORMED_REDO
, action
));
472 NotifyModified(DocModification(
473 SC_MOD_BEFOREDELETE
| SC_PERFORMED_REDO
, action
));
475 cb
.PerformRedoStep();
476 ModifiedAt(action
.position
/ 2);
477 newPos
= action
.position
/ 2;
479 int modFlags
= SC_PERFORMED_REDO
;
480 if (action
.at
== insertAction
) {
481 newPos
+= action
.lenData
;
482 modFlags
|= SC_MOD_INSERTTEXT
;
484 modFlags
|= SC_MOD_DELETETEXT
;
486 if (step
== steps
- 1)
487 modFlags
|= SC_LASTSTEPINUNDOREDO
;
489 DocModification(modFlags
, action
.position
/ 2, action
.lenData
,
490 LinesTotal() - prevLinesTotal
, action
.data
));
493 bool endSavePoint
= cb
.IsSavePoint();
494 if (startSavePoint
!= endSavePoint
)
495 NotifySavePoint(endSavePoint
);
501 bool Document::InsertChar(int pos
, char ch
) {
505 return InsertStyledString(pos
*2, chs
, 2);
508 // Insert a null terminated string
509 bool Document::InsertString(int position
, const char *s
) {
510 return InsertString(position
, s
, strlen(s
));
513 // Insert a string with a length
514 bool Document::InsertString(int position
, const char *s
, size_t insertLength
) {
515 bool changed
= false;
516 char *sWithStyle
= new char[insertLength
* 2];
518 for (size_t i
= 0; i
< insertLength
; i
++) {
519 sWithStyle
[i
*2] = s
[i
];
520 sWithStyle
[i
*2 + 1] = 0;
522 changed
= InsertStyledString(position
*2, sWithStyle
,
523 static_cast<int>(insertLength
*2));
529 void Document::ChangeChar(int pos
, char ch
) {
534 void Document::DelChar(int pos
) {
535 DeleteChars(pos
, LenChar(pos
));
538 void Document::DelCharBack(int pos
) {
541 } else if (IsCrLf(pos
- 2)) {
542 DeleteChars(pos
- 2, 2);
543 } else if (dbcsCodePage
) {
544 int startChar
= MovePositionOutsideChar(pos
- 1, -1, false);
545 DeleteChars(startChar
, pos
- startChar
);
547 DeleteChars(pos
- 1, 1);
// True for the two characters treated as indentation: space and tab.
static bool isindentchar(char ch) {
	return (ch == ' ') || (ch == '\t');
}
// Return the first multiple of tabSize that is strictly greater than pos
// (for non-negative pos), i.e. the next tab stop after column pos.
// tabSize must be non-zero because it is used as a divisor.
static int NextTab(int pos, int tabSize) {
	return ((pos / tabSize) + 1) * tabSize;
}
559 static void CreateIndentation(char *linebuf
, int length
, int indent
, int tabSize
, bool insertSpaces
) {
560 length
--; // ensure space for \0
562 while ((indent
>= tabSize
) && (length
> 0)) {
568 while ((indent
> 0) && (length
> 0)) {
576 int Document::GetLineIndentation(int line
) {
578 if ((line
>= 0) && (line
< LinesTotal())) {
579 int lineStart
= LineStart(line
);
580 int length
= Length();
581 for (int i
= lineStart
;i
< length
;i
++) {
582 char ch
= cb
.CharAt(i
);
586 indent
= NextTab(indent
, tabInChars
);
594 void Document::SetLineIndentation(int line
, int indent
) {
595 int indentOfLine
= GetLineIndentation(line
);
598 if (indent
!= indentOfLine
) {
600 CreateIndentation(linebuf
, sizeof(linebuf
), indent
, tabInChars
, !useTabs
);
601 int thisLineStart
= LineStart(line
);
602 int indentPos
= GetLineIndentPosition(line
);
603 DeleteChars(thisLineStart
, indentPos
- thisLineStart
);
604 InsertString(thisLineStart
, linebuf
);
608 int Document::GetLineIndentPosition(int line
) {
611 int pos
= LineStart(line
);
612 int length
= Length();
613 while ((pos
< length
) && isindentchar(cb
.CharAt(pos
))) {
619 int Document::GetColumn(int pos
) {
621 int line
= LineFromPosition(pos
);
622 if ((line
>= 0) && (line
< LinesTotal())) {
623 for (int i
= LineStart(line
);i
< pos
;) {
624 char ch
= cb
.CharAt(i
);
626 column
= NextTab(column
, tabInChars
);
628 } else if (ch
== '\r') {
630 } else if (ch
== '\n') {
634 i
= MovePositionOutsideChar(i
+ 1, 1);
641 int Document::FindColumn(int line
, int column
) {
642 int position
= LineStart(line
);
643 int columnCurrent
= 0;
644 if ((line
>= 0) && (line
< LinesTotal())) {
645 while (columnCurrent
< column
) {
646 char ch
= cb
.CharAt(position
);
648 columnCurrent
= NextTab(columnCurrent
, tabInChars
);
650 } else if (ch
== '\r') {
652 } else if (ch
== '\n') {
656 position
= MovePositionOutsideChar(position
+ 1, 1);
663 void Document::Indent(bool forwards
, int lineBottom
, int lineTop
) {
664 // Dedent - suck white space off the front of the line to dedent by equivalent of a tab
665 for (int line
= lineBottom
; line
>= lineTop
; line
--) {
666 int indentOfLine
= GetLineIndentation(line
);
668 SetLineIndentation(line
, indentOfLine
+ IndentSize());
670 SetLineIndentation(line
, indentOfLine
- IndentSize());
674 void Document::ConvertLineEnds(int eolModeSet
) {
676 for (int pos
= 0; pos
< Length(); pos
++) {
677 if (cb
.CharAt(pos
) == '\r') {
678 if (cb
.CharAt(pos
+ 1) == '\n') {
679 if (eolModeSet
!= SC_EOL_CRLF
) {
681 if (eolModeSet
== SC_EOL_CR
)
682 InsertString(pos
, "\r", 1);
684 InsertString(pos
, "\n", 1);
689 if (eolModeSet
!= SC_EOL_CR
) {
691 if (eolModeSet
== SC_EOL_CRLF
) {
692 InsertString(pos
, "\r\n", 2);
695 InsertString(pos
, "\n", 1);
699 } else if (cb
.CharAt(pos
) == '\n') {
700 if (eolModeSet
!= SC_EOL_LF
) {
702 if (eolModeSet
== SC_EOL_CRLF
) {
703 InsertString(pos
, "\r\n", 2);
706 InsertString(pos
, "\r", 1);
714 int Document::ParaDown(int pos
) {
715 int line
= LineFromPosition(pos
);
716 while (line
< LinesTotal() && LineStart(line
) != LineEnd(line
)) { // skip non-empty lines
719 while (line
< LinesTotal() && LineStart(line
) == LineEnd(line
)) { // skip empty lines
722 if (line
< LinesTotal())
723 return LineStart(line
);
724 else // end of a document
725 return LineEnd(line
-1);
728 int Document::ParaUp(int pos
) {
729 int line
= LineFromPosition(pos
);
731 while (line
>= 0 && LineStart(line
) == LineEnd(line
)) { // skip empty lines
734 while (line
>= 0 && LineStart(line
) != LineEnd(line
)) { // skip non-empty lines
738 return LineStart(line
);
741 Document::charClassification
Document::WordCharClass(unsigned char ch
) {
742 if ((SC_CP_UTF8
== dbcsCodePage
) && (ch
>= 0x80))
744 return charClass
[ch
];
748 * Used by commands that want to select whole words.
749 * Finds the start of word at pos when delta < 0 or the end of the word when delta >= 0.
751 int Document::ExtendWordSelect(int pos
, int delta
, bool onlyWordCharacters
) {
752 charClassification ccStart
= ccWord
;
754 if (!onlyWordCharacters
)
755 ccStart
= WordCharClass(cb
.CharAt(pos
-1));
756 while (pos
> 0 && (WordCharClass(cb
.CharAt(pos
- 1)) == ccStart
))
759 if (!onlyWordCharacters
)
760 ccStart
= WordCharClass(cb
.CharAt(pos
));
761 while (pos
< (Length()) && (WordCharClass(cb
.CharAt(pos
)) == ccStart
))
764 return MovePositionOutsideChar(pos
, delta
);
768 * Find the start of the next word in either a forward (delta >= 0) or backwards direction
770 * This is looking for a transition between character classes although there is also some
771 * additional movement to transit white space.
772 * Used by cursor movement by word commands.
774 int Document::NextWordStart(int pos
, int delta
) {
776 while (pos
> 0 && (WordCharClass(cb
.CharAt(pos
- 1)) == ccSpace
))
779 charClassification ccStart
= WordCharClass(cb
.CharAt(pos
-1));
780 while (pos
> 0 && (WordCharClass(cb
.CharAt(pos
- 1)) == ccStart
)) {
785 charClassification ccStart
= WordCharClass(cb
.CharAt(pos
));
786 while (pos
< (Length()) && (WordCharClass(cb
.CharAt(pos
)) == ccStart
))
788 while (pos
< (Length()) && (WordCharClass(cb
.CharAt(pos
)) == ccSpace
))
795 * Find the end of the next word in either a forward (delta >= 0) or backwards direction
797 * This is looking for a transition between character classes although there is also some
798 * additional movement to transit white space.
799 * Used by cursor movement by word commands.
801 int Document::NextWordEnd(int pos
, int delta
) {
804 charClassification ccStart
= WordCharClass(cb
.CharAt(pos
-1));
805 if (ccStart
!= ccSpace
) {
806 while (pos
> 0 && WordCharClass(cb
.CharAt(pos
- 1)) == ccStart
) {
810 while (pos
> 0 && WordCharClass(cb
.CharAt(pos
- 1)) == ccSpace
) {
815 while (pos
< Length() && WordCharClass(cb
.CharAt(pos
)) == ccSpace
) {
818 if (pos
< Length()) {
819 charClassification ccStart
= WordCharClass(cb
.CharAt(pos
));
820 while (pos
< Length() && WordCharClass(cb
.CharAt(pos
)) == ccStart
) {
829 * Check that the character at the given position is a word or punctuation character and that
830 * the previous character is of a different character class.
832 bool Document::IsWordStartAt(int pos
) {
834 charClassification ccPos
= WordCharClass(CharAt(pos
));
835 return (ccPos
== ccWord
|| ccPos
== ccPunctuation
) &&
836 (ccPos
!= WordCharClass(CharAt(pos
- 1)));
842 * Check that the character before the given position is a word or punctuation character and that
843 * the character at the given position is of a different character class.
845 bool Document::IsWordEndAt(int pos
) {
846 if (pos
< Length() - 1) {
847 charClassification ccPrev
= WordCharClass(CharAt(pos
-1));
848 return (ccPrev
== ccWord
|| ccPrev
== ccPunctuation
) &&
849 (ccPrev
!= WordCharClass(CharAt(pos
)));
855 * Check that the given range is has transitions between character classes at both
856 * ends and where the characters on the inside are word or punctuation characters.
858 bool Document::IsWordAt(int start
, int end
) {
859 return IsWordStartAt(start
) && IsWordEndAt(end
);
862 // The comparison and case changing functions here assume ASCII
863 // or extended ASCII such as the normal Windows code page.
865 static inline char MakeUpperCase(char ch
) {
866 if (ch
< 'a' || ch
> 'z')
869 return static_cast<char>(ch
- 'a' + 'A');
872 static inline char MakeLowerCase(char ch
) {
873 if (ch
< 'A' || ch
> 'Z')
876 return static_cast<char>(ch
- 'A' + 'a');
879 // Define a way for the Regular Expression code to access the document
880 class DocumentIndexer
: public CharacterIndexer
{
884 DocumentIndexer(Document
*pdoc_
, int end_
) :
885 pdoc(pdoc_
), end(end_
) {
888 virtual char CharAt(int index
) {
889 if (index
< 0 || index
>= end
)
892 return pdoc
->CharAt(index
);
897 * Find text in document, supporting both forward and backward
898 * searches (just pass minPos > maxPos to do a backward search)
899 * Has not been tested with backwards DBCS searches yet.
901 long Document::FindText(int minPos
, int maxPos
, const char *s
,
902 bool caseSensitive
, bool word
, bool wordStart
, bool regExp
, bool posix
,
906 pre
= new RESearch();
910 int increment
= (minPos
<= maxPos
) ? 1 : -1;
912 int startPos
= minPos
;
915 // Range endpoints should not be inside DBCS characters, but just in case, move them.
916 startPos
= MovePositionOutsideChar(startPos
, 1, false);
917 endPos
= MovePositionOutsideChar(endPos
, 1, false);
919 const char *errmsg
= pre
->Compile(s
, *length
, caseSensitive
, posix
);
923 // Find a variable in a property file: \$(\([A-Za-z0-9_.]+\))
924 // Replace first '.' with '-' in each property file variable reference:
925 // Search: \$(\([A-Za-z0-9_-]+\)\.\([A-Za-z0-9_.]+\))
927 int lineRangeStart
= LineFromPosition(startPos
);
928 int lineRangeEnd
= LineFromPosition(endPos
);
929 if ((increment
== 1) &&
930 (startPos
>= LineEnd(lineRangeStart
)) &&
931 (lineRangeStart
< lineRangeEnd
)) {
932 // the start position is at end of line or between line end characters.
934 startPos
= LineStart(lineRangeStart
);
938 char searchEnd
= s
[*length
- 1];
939 int lineRangeBreak
= lineRangeEnd
+ increment
;
940 for (int line
= lineRangeStart
; line
!= lineRangeBreak
; line
+= increment
) {
941 int startOfLine
= LineStart(line
);
942 int endOfLine
= LineEnd(line
);
943 if (increment
== 1) {
944 if (line
== lineRangeStart
) {
945 if ((startPos
!= startOfLine
) && (s
[0] == '^'))
946 continue; // Can't match start of line if start position after start of line
947 startOfLine
= startPos
;
949 if (line
== lineRangeEnd
) {
950 if ((endPos
!= endOfLine
) && (searchEnd
== '$'))
951 continue; // Can't match end of line if end position before end of line
955 if (line
== lineRangeEnd
) {
956 if ((endPos
!= startOfLine
) && (s
[0] == '^'))
957 continue; // Can't match start of line if end position after start of line
958 startOfLine
= endPos
;
960 if (line
== lineRangeStart
) {
961 if ((startPos
!= endOfLine
) && (searchEnd
== '$'))
962 continue; // Can't match end of line if start position before end of line
963 endOfLine
= startPos
+1;
967 DocumentIndexer
di(this, endOfLine
);
968 int success
= pre
->Execute(di
, startOfLine
, endOfLine
);
971 lenRet
= pre
->eopat
[0] - pre
->bopat
[0];
972 if (increment
== -1) {
973 // Check for the last match on this line.
974 int repetitions
= 1000; // Break out of infinite loop
975 while (success
&& (pre
->eopat
[0] <= (endOfLine
+1)) && (repetitions
--)) {
976 success
= pre
->Execute(di
, pos
+1, endOfLine
+1);
978 if (pre
->eopat
[0] <= (minPos
+1)) {
980 lenRet
= pre
->eopat
[0] - pre
->bopat
[0];
995 bool forward
= minPos
<= maxPos
;
996 int increment
= forward
? 1 : -1;
998 // Range endpoints should not be inside DBCS characters, but just in case, move them.
999 int startPos
= MovePositionOutsideChar(minPos
, increment
, false);
1000 int endPos
= MovePositionOutsideChar(maxPos
, increment
, false);
1002 // Compute actual search ranges needed
1003 int lengthFind
= *length
;
1004 if (lengthFind
== -1)
1005 lengthFind
= static_cast<int>(strlen(s
));
1006 int endSearch
= endPos
;
1007 if (startPos
<= endPos
) {
1008 endSearch
= endPos
- lengthFind
+ 1;
1010 //Platform::DebugPrintf("Find %d %d %s %d\n", startPos, endPos, ft->lpstrText, lengthFind);
1011 char firstChar
= s
[0];
1013 firstChar
= static_cast<char>(MakeUpperCase(firstChar
));
1015 while (forward
? (pos
< endSearch
) : (pos
>= endSearch
)) {
1016 char ch
= CharAt(pos
);
1017 if (caseSensitive
) {
1018 if (ch
== firstChar
) {
1020 for (int posMatch
= 1; posMatch
< lengthFind
&& found
; posMatch
++) {
1021 ch
= CharAt(pos
+ posMatch
);
1022 if (ch
!= s
[posMatch
])
1026 if ((!word
&& !wordStart
) ||
1027 word
&& IsWordAt(pos
, pos
+ lengthFind
) ||
1028 wordStart
&& IsWordStartAt(pos
))
1033 if (MakeUpperCase(ch
) == firstChar
) {
1035 for (int posMatch
= 1; posMatch
< lengthFind
&& found
; posMatch
++) {
1036 ch
= CharAt(pos
+ posMatch
);
1037 if (MakeUpperCase(ch
) != MakeUpperCase(s
[posMatch
]))
1041 if ((!word
&& !wordStart
) ||
1042 word
&& IsWordAt(pos
, pos
+ lengthFind
) ||
1043 wordStart
&& IsWordStartAt(pos
))
1049 if (dbcsCodePage
&& (pos
>= 0)) {
1050 // Ensure trying to match from start of character
1051 pos
= MovePositionOutsideChar(pos
, increment
, false);
1055 //Platform::DebugPrintf("Not found\n");
1059 const char *Document::SubstituteByPosition(const char *text
, int *length
) {
1062 delete []substituted
;
1064 DocumentIndexer
di(this, Length());
1065 if (!pre
->GrabMatches(di
))
1067 unsigned int lenResult
= 0;
1068 for (int i
= 0; i
< *length
; i
++) {
1069 if (text
[i
] == '\\') {
1070 if (text
[i
+ 1] >= '1' && text
[i
+ 1] <= '9') {
1071 unsigned int patNum
= text
[i
+ 1] - '0';
1072 lenResult
+= pre
->eopat
[patNum
] - pre
->bopat
[patNum
];
1075 switch (text
[i
+ 1]) {
1091 substituted
= new char[lenResult
+ 1];
1094 char *o
= substituted
;
1095 for (int j
= 0; j
< *length
; j
++) {
1096 if (text
[j
] == '\\') {
1097 if (text
[j
+ 1] >= '1' && text
[j
+ 1] <= '9') {
1098 unsigned int patNum
= text
[j
+ 1] - '0';
1099 unsigned int len
= pre
->eopat
[patNum
] - pre
->bopat
[patNum
];
1100 if (pre
->pat
[patNum
]) // Will be null if try for a match that did not occur
1101 memcpy(o
, pre
->pat
[patNum
], len
);
1138 *length
= lenResult
;
1142 int Document::LinesTotal() {
1146 void Document::ChangeCase(Range r
, bool makeUpperCase
) {
1147 for (int pos
= r
.start
; pos
< r
.end
; pos
++) {
1148 int len
= LenChar(pos
);
1149 if (dbcsCodePage
&& (len
> 1)) {
1152 char ch
= CharAt(pos
);
1153 if (makeUpperCase
) {
1154 if (IsLowerCase(ch
)) {
1155 ChangeChar(pos
, static_cast<char>(MakeUpperCase(ch
)));
1158 if (IsUpperCase(ch
)) {
1159 ChangeChar(pos
, static_cast<char>(MakeLowerCase(ch
)));
1166 void Document::SetDefaultCharClasses() {
1167 // Initialize all char classes to default values
1168 for (int ch
= 0; ch
< 256; ch
++) {
1169 if (ch
== '\r' || ch
== '\n')
1170 charClass
[ch
] = ccNewLine
;
1171 else if (ch
< 0x20 || ch
== ' ')
1172 charClass
[ch
] = ccSpace
;
1173 else if (ch
>= 0x80 || isalnum(ch
) || ch
== '_')
1174 charClass
[ch
] = ccWord
;
1176 charClass
[ch
] = ccPunctuation
;
1180 void Document::SetCharClasses(unsigned char *chars
, charClassification newCharClass
) {
1181 // Apply the newCharClass to the specified chars
1184 charClass
[*chars
] = newCharClass
;
1190 void Document::SetStylingBits(int bits
) {
1192 stylingBitsMask
= 0;
1193 for (int bit
= 0; bit
< stylingBits
; bit
++) {
1194 stylingBitsMask
<<= 1;
1195 stylingBitsMask
|= 1;
1199 void Document::StartStyling(int position
, char mask
) {
1201 endStyled
= position
;
1204 bool Document::SetStyleFor(int length
, char style
) {
1205 if (enteredCount
!= 0) {
1209 style
&= stylingMask
;
1210 int prevEndStyled
= endStyled
;
1211 if (cb
.SetStyleFor(endStyled
, length
, style
, stylingMask
)) {
1212 DocModification
mh(SC_MOD_CHANGESTYLE
| SC_PERFORMED_USER
,
1213 prevEndStyled
, length
);
1216 endStyled
+= length
;
1222 bool Document::SetStyles(int length
, char *styles
) {
1223 if (enteredCount
!= 0) {
1227 int prevEndStyled
= endStyled
;
1228 bool didChange
= false;
1230 for (int iPos
= 0; iPos
< length
; iPos
++, endStyled
++) {
1231 PLATFORM_ASSERT(endStyled
< Length());
1232 if (cb
.SetStyleAt(endStyled
, styles
[iPos
], stylingMask
)) {
1238 DocModification
mh(SC_MOD_CHANGESTYLE
| SC_PERFORMED_USER
,
1239 prevEndStyled
, lastChange
);
1247 bool Document::EnsureStyledTo(int pos
) {
1248 if (pos
> GetEndStyled()) {
1250 if (styleClock
> 0x100000) {
1253 // Ask the watchers to style, and stop as soon as one responds.
1254 for (int i
= 0; pos
> GetEndStyled() && i
< lenWatchers
; i
++) {
1255 watchers
[i
].watcher
->NotifyStyleNeeded(this, watchers
[i
].userData
, pos
);
1258 return pos
<= GetEndStyled();
1261 bool Document::AddWatcher(DocWatcher
*watcher
, void *userData
) {
1262 for (int i
= 0; i
< lenWatchers
; i
++) {
1263 if ((watchers
[i
].watcher
== watcher
) &&
1264 (watchers
[i
].userData
== userData
))
1267 WatcherWithUserData
*pwNew
= new WatcherWithUserData
[lenWatchers
+ 1];
1270 for (int j
= 0; j
< lenWatchers
; j
++)
1271 pwNew
[j
] = watchers
[j
];
1272 pwNew
[lenWatchers
].watcher
= watcher
;
1273 pwNew
[lenWatchers
].userData
= userData
;
1280 bool Document::RemoveWatcher(DocWatcher
*watcher
, void *userData
) {
1281 for (int i
= 0; i
< lenWatchers
; i
++) {
1282 if ((watchers
[i
].watcher
== watcher
) &&
1283 (watchers
[i
].userData
== userData
)) {
1284 if (lenWatchers
== 1) {
1289 WatcherWithUserData
*pwNew
= new WatcherWithUserData
[lenWatchers
];
1292 for (int j
= 0; j
< lenWatchers
- 1; j
++) {
1293 pwNew
[j
] = (j
< i
) ? watchers
[j
] : watchers
[j
+ 1];
1305 void Document::NotifyModifyAttempt() {
1306 for (int i
= 0; i
< lenWatchers
; i
++) {
1307 watchers
[i
].watcher
->NotifyModifyAttempt(this, watchers
[i
].userData
);
1311 void Document::NotifySavePoint(bool atSavePoint
) {
1312 for (int i
= 0; i
< lenWatchers
; i
++) {
1313 watchers
[i
].watcher
->NotifySavePoint(this, watchers
[i
].userData
, atSavePoint
);
1317 void Document::NotifyModified(DocModification mh
) {
1318 for (int i
= 0; i
< lenWatchers
; i
++) {
1319 watchers
[i
].watcher
->NotifyModified(this, mh
, watchers
[i
].userData
);
1323 bool Document::IsWordPartSeparator(char ch
) {
1324 return (WordCharClass(ch
) == ccWord
) && IsPunctuation(ch
);
1327 int Document::WordPartLeft(int pos
) {
1330 char startChar
= cb
.CharAt(pos
);
1331 if (IsWordPartSeparator(startChar
)) {
1332 while (pos
> 0 && IsWordPartSeparator(cb
.CharAt(pos
))) {
1337 startChar
= cb
.CharAt(pos
);
1339 if (IsLowerCase(startChar
)) {
1340 while (pos
> 0 && IsLowerCase(cb
.CharAt(pos
)))
1342 if (!IsUpperCase(cb
.CharAt(pos
)) && !IsLowerCase(cb
.CharAt(pos
)))
1344 } else if (IsUpperCase(startChar
)) {
1345 while (pos
> 0 && IsUpperCase(cb
.CharAt(pos
)))
1347 if (!IsUpperCase(cb
.CharAt(pos
)))
1349 } else if (IsADigit(startChar
)) {
1350 while (pos
> 0 && IsADigit(cb
.CharAt(pos
)))
1352 if (!IsADigit(cb
.CharAt(pos
)))
1354 } else if (IsPunctuation(startChar
)) {
1355 while (pos
> 0 && IsPunctuation(cb
.CharAt(pos
)))
1357 if (!IsPunctuation(cb
.CharAt(pos
)))
1359 } else if (isspacechar(startChar
)) {
1360 while (pos
> 0 && isspacechar(cb
.CharAt(pos
)))
1362 if (!isspacechar(cb
.CharAt(pos
)))
1364 } else if (!isascii(startChar
)) {
1365 while (pos
> 0 && !isascii(cb
.CharAt(pos
)))
1367 if (isascii(cb
.CharAt(pos
)))
1377 int Document::WordPartRight(int pos
) {
1378 char startChar
= cb
.CharAt(pos
);
1379 int length
= Length();
1380 if (IsWordPartSeparator(startChar
)) {
1381 while (pos
< length
&& IsWordPartSeparator(cb
.CharAt(pos
)))
1383 startChar
= cb
.CharAt(pos
);
1385 if (!isascii(startChar
)) {
1386 while (pos
< length
&& !isascii(cb
.CharAt(pos
)))
1388 } else if (IsLowerCase(startChar
)) {
1389 while (pos
< length
&& IsLowerCase(cb
.CharAt(pos
)))
1391 } else if (IsUpperCase(startChar
)) {
1392 if (IsLowerCase(cb
.CharAt(pos
+ 1))) {
1394 while (pos
< length
&& IsLowerCase(cb
.CharAt(pos
)))
1397 while (pos
< length
&& IsUpperCase(cb
.CharAt(pos
)))
1400 if (IsLowerCase(cb
.CharAt(pos
)) && IsUpperCase(cb
.CharAt(pos
- 1)))
1402 } else if (IsADigit(startChar
)) {
1403 while (pos
< length
&& IsADigit(cb
.CharAt(pos
)))
1405 } else if (IsPunctuation(startChar
)) {
1406 while (pos
< length
&& IsPunctuation(cb
.CharAt(pos
)))
1408 } else if (isspacechar(startChar
)) {
1409 while (pos
< length
&& isspacechar(cb
.CharAt(pos
)))
// True when c is one of the two line end characters: line feed or carriage return.
bool IsLineEndChar(char c) {
	return (c == '\n' || c == '\r');
}
1421 int Document::ExtendStyleRange(int pos
, int delta
, bool singleLine
) {
1422 int sStart
= cb
.StyleAt(pos
);
1424 while (pos
> 0 && (cb
.StyleAt(pos
) == sStart
) && (!singleLine
|| !IsLineEndChar(cb
.CharAt(pos
))) )
1428 while (pos
< (Length()) && (cb
.StyleAt(pos
) == sStart
) && (!singleLine
|| !IsLineEndChar(cb
.CharAt(pos
))) )