]> git.saurik.com Git - wxWidgets.git/blob - wxPython/samples/stxview/StructuredText/DocumentClass.py
*** empty log message ***
[wxWidgets.git] / wxPython / samples / stxview / StructuredText / DocumentClass.py
1 ##############################################################################
2 #
3 # Zope Public License (ZPL) Version 1.0
4 # -------------------------------------
5 #
6 # Copyright (c) Digital Creations. All rights reserved.
7 #
8 # This license has been certified as Open Source(tm).
9 #
10 # Redistribution and use in source and binary forms, with or without
11 # modification, are permitted provided that the following conditions are
12 # met:
13 #
14 # 1. Redistributions in source code must retain the above copyright
15 # notice, this list of conditions, and the following disclaimer.
16 #
17 # 2. Redistributions in binary form must reproduce the above copyright
18 # notice, this list of conditions, and the following disclaimer in
19 # the documentation and/or other materials provided with the
20 # distribution.
21 #
22 # 3. Digital Creations requests that attribution be given to Zope
23 # in any manner possible. Zope includes a "Powered by Zope"
24 # button that is installed by default. While it is not a license
25 # violation to remove this button, it is requested that the
26 # attribution remain. A significant investment has been put
27 # into Zope, and this effort will continue if the Zope community
28 # continues to grow. This is one way to assure that growth.
29 #
30 # 4. All advertising materials and documentation mentioning
31 # features derived from or use of this software must display
32 # the following acknowledgement:
33 #
34 # "This product includes software developed by Digital Creations
35 # for use in the Z Object Publishing Environment
36 # (http://www.zope.org/)."
37 #
38 # In the event that the product being advertised includes an
39 # intact Zope distribution (with copyright and license included)
40 # then this clause is waived.
41 #
42 # 5. Names associated with Zope or Digital Creations must not be used to
43 # endorse or promote products derived from this software without
44 # prior written permission from Digital Creations.
45 #
46 # 6. Modified redistributions of any form whatsoever must retain
47 # the following acknowledgment:
48 #
49 # "This product includes software developed by Digital Creations
50 # for use in the Z Object Publishing Environment
51 # (http://www.zope.org/)."
52 #
53 # Intact (re-)distributions of any official Zope release do not
54 # require an external acknowledgement.
55 #
56 # 7. Modifications are encouraged but must be packaged separately as
57 # patches to official Zope releases. Distributions that do not
58 # clearly separate the patches from the original work must be clearly
59 # labeled as unofficial distributions. Modifications which do not
60 # carry the name Zope may be packaged in any form, as long as they
61 # conform to all of the clauses above.
62 #
63 #
64 # Disclaimer
65 #
66 # THIS SOFTWARE IS PROVIDED BY DIGITAL CREATIONS ``AS IS'' AND ANY
67 # EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
68 # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
69 # PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL DIGITAL CREATIONS OR ITS
70 # CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
71 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
72 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
73 # USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
74 # ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
75 # OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
76 # OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
77 # SUCH DAMAGE.
78 #
79 #
80 # This software consists of contributions made by Digital Creations and
81 # many individuals on behalf of Digital Creations. Specific
82 # attributions are listed in the accompanying credits file.
83 #
84 ##############################################################################
85
86 import re, ST, STDOM
87 from string import split, join, replace, expandtabs, strip, find, rstrip
88
# Exact built-in types used for type-identity dispatch when colorizing text.
StringType = str
ListType = list
91
class StructuredTextExample(ST.StructuredTextParagraph):
    """Literal (example) text assembled from a list of sub-paragraphs.

    The node values of ``subs`` are joined with blank lines to form the
    paragraph source.  The paragraph is created without sub-paragraphs
    and exposes no colorizable text, so its content is never marked up.
    """

    def __init__(self, subs, **kw):
        source = '\n\n'.join([sub.getNodeValue() for sub in subs])
        ST.StructuredTextParagraph.__init__(self, source, (), **kw)

    def getColorizableTexts(self):
        return ()

    def setColorizableTexts(self, src):
        # Examples are literal text and are never colored.
        pass
104
class StructuredTextBullet(ST.StructuredTextParagraph):
    """Paragraph recognized as a bulleted list item.

    Built by ``DocumentClass.doc_bullet`` from the text that follows the
    bullet marker; the marker itself is passed as the ``bullet`` keyword.
    """
107
class StructuredTextNumbered(ST.StructuredTextParagraph):
    """Paragraph recognized as a numbered list item.

    Built by ``DocumentClass.doc_numbered`` from the text that follows the
    number prefix; the prefix itself is passed as the ``number`` keyword.
    """
110
class StructuredTextDescriptionTitle(ST.StructuredTextParagraph):
    """Title half of a description entry.

    Returned by ``StructuredTextDescription.getChildren`` wrapping the
    description's title text.
    """
113
class StructuredTextDescriptionBody(ST.StructuredTextParagraph):
    """Body half of a description entry.

    Returned by ``StructuredTextDescription.getChildren`` wrapping the
    description's body text and its sub-paragraphs.
    """
116
class StructuredTextDescription(ST.StructuredTextParagraph):
    """Description entry: a title paired with a body paragraph."""

    def __init__(self, title, src, subs, **kw):
        ST.StructuredTextParagraph.__init__(self, src, subs, **kw)
        self._title = title

    def getColorizableTexts(self):
        # Both the title and the body may contain inline markup.
        return (self._title, self._src)

    def setColorizableTexts(self, src):
        title, body = src
        self._title = title
        self._src = body

    def getChildren(self):
        # The title and the body are exposed as two separate child nodes.
        title_node = StructuredTextDescriptionTitle(self._title)
        body_node = StructuredTextDescriptionBody(self._src, self._subs)
        return (title_node, body_node)
130
class StructuredTextSectionTitle(ST.StructuredTextParagraph):
    """Title of a section.

    ``StructuredTextSection`` wraps its source text in an instance of
    this class.
    """
133
class StructuredTextSection(ST.StructuredTextParagraph):
    """Section of a document: a title followed by sub-paragraphs.

    The source text is wrapped in a StructuredTextSectionTitle, which
    becomes the paragraph source of this node.
    """

    def __init__(self, src, subs=None, **kw):
        title = StructuredTextSectionTitle(src)
        ST.StructuredTextParagraph.__init__(self, title, subs, **kw)
140
141 # a StructuredTextTable holds StructuredTextRows
class StructuredTextTable(ST.StructuredTextDocument):
    """Table node holding a list of StructuredTextRow objects.

    ``rows`` is a list of rows; each row is a list of ``(text, span)``
    pairs describing its cells, for example::

        rows = [[('row 1:column1', 1)], [('row2:column1', 1)]]
    """

    def __init__(self, rows, src, subs, **kw):
        """Build one StructuredTextRow per non-empty entry of ``rows``.

        ``src`` is accepted but not used here.  ``kw`` is forwarded to the
        base class as keywords and to each row as a plain dictionary,
        because StructuredTextRow takes it positionally.
        """
        ST.StructuredTextDocument.__init__(self, subs, **kw)
        self._rows = [StructuredTextRow(row, kw) for row in rows if row]

    def getRows(self):
        """Return the row list wrapped in a one-element list."""
        return [self._rows]

    def _getRows(self):
        return self.getRows()

    def getColumns(self):
        """Return ``getColumns()`` of every row, in row order."""
        return [row.getColumns() for row in self._rows]

    def _getColumns(self):
        return self.getColumns()

    def setColumns(self, columns):
        """Give row ``i`` the column list ``columns[i]``."""
        for index, row in enumerate(self._rows):
            row.setColumns(columns[index])

    def _setColumns(self, columns):
        return self.setColumns(columns)

    def getColorizableTexts(self):
        """Return a flat list with the first colorizable text of each cell.

        Cells are listed row by row, e.g.
        ["r1 col1", "r1 col2", "r2 col1", "r2 col2"].
        """
        return [column.getColorizableTexts()[0]
                for row in self._rows
                for column in row.getColumns()[0]]

    def setColorizableTexts(self, texts):
        """Distribute ``texts`` over the cells, row by row.

        ``texts`` is a flat sequence in the order produced by
        ``getColorizableTexts``; each cell receives exactly one item.
        """
        position = 0
        for row in self._rows:
            for column in row._columns:
                column.setColorizableTexts((texts[position],))
                position = position + 1

    def _getColorizableTexts(self):
        return self.getColorizableTexts()

    def _setColorizableTexts(self, texts):
        # The original alias took no argument and called
        # setColorizableTexts() without one, so it always raised TypeError.
        return self.setColorizableTexts(texts)
209
210 # StructuredTextRow holds StructuredTextColumns
class StructuredTextRow(ST.StructuredTextDocument):
    """One table row, holding a list of StructuredTextColumn cells."""

    def __init__(self, row, kw):
        """Create one StructuredTextColumn per entry of ``row``.

        ``row`` is a list of pairs: the raw text of a cell and the span
        of that cell, e.g.
        [('this is column one', 1), ('this is column two', 1)].
        ``kw`` is a dictionary of keyword arguments; it is expanded for
        the base class and handed to every column unchanged.
        """
        ST.StructuredTextDocument.__init__(self, [], **kw)
        self._columns = [StructuredTextColumn(cell[0], cell[1], kw)
                         for cell in row]

    def getColumns(self):
        # The column list is returned wrapped in a one-element list.
        return [self._columns]

    def _getColumns(self):
        return [self._columns]

    def setColumns(self, columns):
        self._columns = columns

    def _setColumns(self, columns):
        return self.setColumns(columns)
238
239 # this holds the text of a table cell
class StructuredTextColumn(ST.StructuredTextParagraph):
    """A single cell (column) of a table row.

    A cell can hold multiple paragraphs.  It is classified as either a
    StructuredTextTableHeader or a StructuredTextTableData.
    """

    def __init__(self, text, span, kw):
        # kw arrives as a plain dictionary and is expanded for the base class.
        ST.StructuredTextParagraph.__init__(self, text, [], **kw)
        self._span = span

    def getSpan(self):
        """Return the span value this cell was created with."""
        return self._span

    def _getSpan(self):
        return self._span
258
class StructuredTextTableHeader(ST.StructuredTextDocument):
    """Node class for a table cell classified as a header."""
260
class StructuredTextTableData(ST.StructuredTextDocument):
    """Node class for a table cell classified as data."""
262
class StructuredTextMarkup(STDOM.Element):
    """Base class for inline markup nodes wrapping a single value.

    The value is a string, a node, or a list of strings and nodes.  Any
    keyword arguments become instance attributes, and their names are
    recorded in ``_attributes``.
    """

    def __init__(self, v, **kw):
        self._value = v
        self._attributes = list(kw.keys())
        for name, value in kw.items():
            setattr(self, name, value)

    def getChildren(self, type=type, lt=type([])):
        """Return the value as a list, wrapping a non-list value."""
        value = self._value
        if type(value) is lt:
            return value
        return [value]

    def getColorizableTexts(self):
        return (self._value,)

    def setColorizableTexts(self, v):
        # Only the first item is kept; the node holds exactly one value.
        self._value = v[0]

    def __repr__(self):
        return '%s(%s)' % (self.__class__.__name__, repr(self._value))
280
class StructuredTextLiteral(StructuredTextMarkup):
    """Inline literal text; its content is never colored further."""

    def getColorizableTexts(self):
        return ()

    def setColorizableTexts(self, v):
        # Nothing to store: literals expose no colorizable text.
        pass
284
class StructuredTextEmphasis(StructuredTextMarkup):
    """Emphasized text, created by ``DocumentClass.doc_emphasize``."""
286
class StructuredTextStrong(StructuredTextMarkup):
    """Strong text, created by ``DocumentClass.doc_strong``."""
288
class StructuredTextInnerLink(StructuredTextMarkup):
    """Bracketed reference, created by ``DocumentClass.doc_inner_link``."""
290
class StructuredTextNamedLink(StructuredTextMarkup):
    """Named link target, created by ``DocumentClass.doc_named_link``."""
292
class StructuredTextUnderline(StructuredTextMarkup):
    """Underlined text, created by ``DocumentClass.doc_underline``."""
294
class StructuredTextSGML(StructuredTextMarkup):
    """Raw SGML tag text, created by ``DocumentClass.doc_sgml``."""
296
class StructuredTextLink(StructuredTextMarkup):
    """Hyperlink, created by ``DocumentClass.doc_href``.

    The link title is the node value; the target is stored in the
    ``href`` attribute.
    """
298
class DocumentClass:
    """Colorizer that turns raw structured-text paragraphs into typed nodes.

    Calling an instance with a string or a structured-text document walks
    every paragraph.  Each plain paragraph is first offered to the
    block-level recognizers named in ``paragraph_types``; the colorizable
    texts of the result are then run through the inline recognizers
    named in ``text_types``.  Every recognized structure is stored as a
    node instance, and markup found inside another markup node is stored
    within that outer node.

    Example: ``*emphasize this*`` becomes a StructuredTextEmphasis
    instance.
    """

    # Block-level recognizers, tried in this order for each paragraph.
    paragraph_types = [
        'doc_bullet',
        'doc_numbered',
        'doc_description',
        'doc_header',
        'doc_table',
        ]

    # Inline recognizers, applied in this order.  doc_inner_link,
    # doc_named_link and doc_underline are defined below but are not
    # enabled here.
    text_types = [
        'doc_href',
        'doc_strong',
        'doc_emphasize',
        'doc_literal',
        'doc_sgml'
        ]

    def __call__(self, doc):
        """Colorize ``doc`` and return the resulting document.

        A plain string is first parsed with ``ST.StructuredText`` and its
        sub-paragraphs are replaced by their colorized versions.  Any
        other object is treated as a document: its sub-paragraphs are
        colorized and wrapped in a new ``ST.StructuredTextDocument``.
        """
        if type(doc) is type(''):
            doc = ST.StructuredText(doc)
            doc.setSubparagraphs(
                self.color_paragraphs(doc.getSubparagraphs()))
            return doc
        return ST.StructuredTextDocument(
            self.color_paragraphs(doc.getSubparagraphs()))

    def parse(self, raw_string, text_type,
              type=type, st=type(''), lt=type([])):
        """Split ``raw_string`` around every match of one inline recognizer.

        ``text_type`` is a recognizer callable, or the name of a method
        of this object.  A recognizer takes a string and returns a false
        value, or a ``(result, start, end)`` triple.  ``result`` may be:

        * a string, which replaces the matched span and is parsed again;
        * a list, whose elements are added to the output;
        * any other object, which is added to the output as a node.

        Returns ``raw_string`` unchanged when nothing matched, the single
        produced item when it is the only output, and otherwise a list of
        strings and nodes in document order.
        """
        pieces = []  # the list to be returned if raw_string is split

        if type(text_type) is st:
            text_type = getattr(self, text_type)

        while 1:
            found = text_type(raw_string)
            if not found:
                break
            # a match was found
            node, start, end = found

            if start:
                pieces.append(raw_string[:start])

            kind = type(node)
            if kind is st:
                # a string result is pushed back onto the text to parse
                raw_string = node + raw_string[end:]
            else:
                if kind is lt:
                    # a list result contributes each of its elements
                    pieces.extend(node)
                else:
                    # normal case, an object
                    pieces.append(node)
                raw_string = raw_string[end:]

        if not pieces:
            return raw_string  # nothing found

        if raw_string:
            pieces.append(raw_string)
        elif len(pieces) == 1:
            return pieces[0]

        return pieces

    def color_text(self, str, types=None):
        """Apply each inline recognizer in ``types`` to ``str``.

        ``str`` may be a string, a list of strings and nodes, or a single
        node.  ``types`` defaults to ``self.text_types``.  Returns the
        colorized value, which may again be a string, a list or a node.
        """
        if types is None:
            types = self.text_types

        for text_type in types:

            if type(str) is StringType:
                str = self.parse(str, text_type)
            elif type(str) is ListType:
                colored = []
                for item in str:
                    if type(item) is StringType:
                        item = self.parse(item, text_type)
                        if type(item) is ListType:
                            colored.extend(item)
                        else:
                            colored.append(item)
                    else:
                        item.setColorizableTexts(
                            [self.color_text(text)
                             for text in item.getColorizableTexts()])
                        colored.append(item)
                str = colored
            else:
                # A single node: color each of its texts with this one
                # recognizer.  The colored result is what gets stored;
                # the original discarded it and stored the raw text back.
                colored = [self.color_text(text, (text_type,))
                           for text in str.getColorizableTexts()]
                str.setColorizableTexts(colored)

        return str

    def color_paragraphs(self, raw_paragraphs,
                         type=type, sequence_types=(type([]), type(())),
                         st=type('')):
        """Return the colorized form of every paragraph in ``raw_paragraphs``.

        Nodes whose node name is not 'StructuredTextParagraph' are passed
        through untouched.  Each plain paragraph is offered to the
        recognizers in ``self.paragraph_types``; the first true result
        replaces it.  If none matches, the paragraph is rebuilt as a
        plain ``ST.StructuredTextParagraph``.  Sub-paragraphs are
        colorized recursively, then inline markup is applied to every
        resulting paragraph.
        """
        result = []
        for paragraph in raw_paragraphs:
            if paragraph.getNodeName() != 'StructuredTextParagraph':
                result.append(paragraph)
                continue

            for pt in self.paragraph_types:
                if type(pt) is st:
                    # grab the corresponding function
                    pt = getattr(self, pt)
                # evaluate the paragraph
                r = pt(paragraph)
                if r:
                    if type(r) not in sequence_types:
                        r = (r,)
                    new_paragraphs = r
                    for new_paragraph in new_paragraphs:
                        new_paragraph.setSubparagraphs(
                            self.color_paragraphs(
                                new_paragraph.getSubparagraphs()))
                    break
            else:
                # No recognizer claimed the paragraph.
                new_paragraphs = (
                    ST.StructuredTextParagraph(
                        paragraph.getColorizableTexts()[0],
                        self.color_paragraphs(paragraph.getSubparagraphs()),
                        indent=paragraph.indent),
                    )

            # color the inline StructuredText types
            # for each StructuredTextParagraph
            for new_paragraph in new_paragraphs:

                # Compare by value: identity of two equal strings is an
                # interpreter detail and must not be relied on.
                if new_paragraph.getNodeName() == "StructuredTextTable":
                    # Each cell text is parsed and colorized as a
                    # document of its own.
                    documents = [ST.StructuredText(text) for text
                                 in new_paragraph.getColorizableTexts()]
                    documents = [self(document) for document in documents]
                    new_paragraph.setColorizableTexts(documents)

                new_paragraph.setColorizableTexts(
                    [self.color_text(text)
                     for text in new_paragraph.getColorizableTexts()])
                result.append(new_paragraph)

        return result

    def doc_table(self, paragraph, expr = re.compile('\s*\|[-]+\|').match):
        """Recognize a table paragraph and return a StructuredTextTable.

        A paragraph qualifies when its text starts with a ``|----|``
        border line.  Returns None otherwise.
        """
        text = paragraph.getColorizableTexts()[0]
        m = expr(text)

        subs = paragraph.getSubparagraphs()

        if not m:
            return None

        TDdivider = re.compile("[\-]+").match
        THdivider = re.compile("[\=]+").match

        # find where the column markers are located
        col = re.compile('\|').search
        text = text.strip()
        rows = [line.strip() for line in text.split('\n')]

        spans = []   # every distinct offset at which some cell ends
        ROWS = []    # per line: list of (cell text, end offset)
        for row in rows:
            tmp = row[1:-1]  # remove leading and trailing |
            offset = 0
            COLS = []
            found = col(tmp)
            while found:
                start, end = found.span()
                if start + offset not in spans:
                    spans.append(start + offset)
                COLS.append((tmp[0:start], start + offset))
                # Pad with a blank in place of the consumed marker.
                tmp = " " + tmp[end:]
                offset = offset + start
                found = col(tmp)
            if offset + len(tmp) not in spans:
                spans.append(offset + len(tmp))
            COLS.append((tmp, offset + len(tmp)))
            ROWS.append(COLS)

        spans.sort()

        # The first line is the opening border matched by expr.
        ROWS = ROWS[1:]

        # find each column span
        cols = [[cell[1] for cell in row] for row in ROWS]

        cur = 1  # the current column span
        C = []   # holds the span of each cell
        for ends in cols:
            widths = []
            for span in spans:
                if span in ends:
                    widths.append(cur)
                    cur = 1
                else:
                    cur = cur + 1
            C.append(widths)

        # make rows contain the cell's text and the span
        # of that cell
        for index in range(len(C)):
            for i in range(len(C[index])):
                ROWS[index][i] = (ROWS[index][i][0], C[index][i])
        rows = ROWS

        # now munge the table cells together: consecutive text lines are
        # accumulated per column until a divider line closes the row
        ROWS = []
        COLS = []
        for row in rows:
            for index in range(len(row)):
                if not COLS:
                    COLS = [["", 1] for i in range(len(row))]
                cell_text = row[index][0]
                if TDdivider(cell_text) or THdivider(cell_text):
                    ROWS.append(COLS)
                    COLS = []
                else:
                    COLS[index][0] = (COLS[index][0]
                                      + cell_text.rstrip() + "\n")
                    COLS[index][1] = row[index][1]
        return StructuredTextTable(ROWS, text, subs, indent=paragraph.indent)

    def doc_bullet(self, paragraph, expr = re.compile('\s*[-*o]\s+').match):
        """Recognize a bulleted item and return a StructuredTextBullet.

        Returns None when the text does not start with a bullet marker.
        A text ending in '::' turns the sub-paragraphs into one
        StructuredTextExample and loses its final colon.
        """
        top = paragraph.getColorizableTexts()[0]
        m = expr(top)

        if not m:
            return None

        subs = paragraph.getSubparagraphs()
        if top[-2:] == '::':
            subs = [StructuredTextExample(subs)]
            top = top[:-1]
        marker_end = m.span()[1]
        return StructuredTextBullet(top[marker_end:], subs,
                                    indent=paragraph.indent,
                                    bullet=top[:marker_end])

    def doc_numbered(
        self, paragraph,
        expr = re.compile('(\s*[a-zA-Z]+\.)|(\s*[0-9]+\.)|(\s*[0-9]+\s+)').match):
        """Recognize a numbered item and return a StructuredTextNumbered.

        Returns None when the text does not start with a number prefix.
        A text ending in '::' turns the sub-paragraphs into one
        StructuredTextExample and loses its final colon.
        """
        # An earlier expression also accepted a single letter without a
        # following period, which grabbed paragraphs that merely began
        # with a one-letter word.

        top = paragraph.getColorizableTexts()[0]
        m = expr(top)
        if not m:
            return None
        subs = paragraph.getSubparagraphs()
        if top[-2:] == '::':
            subs = [StructuredTextExample(subs)]
            top = top[:-1]
        prefix_end = m.span()[1]
        return StructuredTextNumbered(top[prefix_end:], subs,
                                      indent=paragraph.indent,
                                      number=top[:prefix_end])

    def doc_description(
        self, paragraph,
        delim = re.compile('\s+--\s+').search,
        nb=re.compile(r'[^\0- ]').search,
        ):
        """Recognize 'title -- body' and return a StructuredTextDescription.

        Returns None when there is no ' -- ' delimiter, when the title
        spans more than one line, or when the title holds no character
        matched by ``nb``.
        """
        top = paragraph.getColorizableTexts()[0]
        d = delim(top)
        if not d:
            return None
        start, end = d.span()
        title = top[:start]
        if title.find('\n') >= 0:
            return None
        if not nb(title):
            return None
        d = top[start:end]
        top = top[end:]

        subs = paragraph.getSubparagraphs()
        if top[-2:] == '::':
            subs = [StructuredTextExample(subs)]
            top = top[:-1]

        return StructuredTextDescription(
            title, top, subs,
            indent=paragraph.indent,
            delim=d)

    def doc_header(self, paragraph,
                   expr = re.compile('[ a-zA-Z0-9.:/,-_*<>\?\'\"]+').match
                   ):
        """Recognize a section header or an example introduction.

        Only paragraphs that have sub-paragraphs and non-blank text
        qualify.  A text ending in '::' introduces an example: a bare
        '::' yields just the StructuredTextExample, otherwise a paragraph
        holding it.  A single-line text yields a StructuredTextSection.
        Returns None in every other case.  ``expr`` is not used.
        """
        subs = paragraph.getSubparagraphs()
        if not subs:
            return None
        top = paragraph.getColorizableTexts()[0]
        if not top.strip():
            return None
        if top[-2:] == '::':
            subs = StructuredTextExample(subs)
            if top.strip() == '::':
                return subs
            return ST.StructuredTextParagraph(
                top[:-1], [subs], indent=paragraph.indent)

        if top.find('\n') >= 0:
            return None
        return StructuredTextSection(top, subs, indent=paragraph.indent)

    def doc_literal(
        self, s,
        expr=re.compile(
          "(?:\s|^)'"                                               # open
          "([^ \t\n\r\f\v']|[^ \t\n\r\f\v'][^\n']*[^ \t\n\r\f\v'])" # contents
          "'(?:\s|[,.;:!?]|$)"                                      # close
          ).search):
        """Find the first single-quoted literal in ``s``.

        Returns ``(StructuredTextLiteral, start, end)``, where the span
        covers both quote characters, or None.
        """
        r = expr(s)
        if not r:
            return None
        start, end = r.span(1)
        return (StructuredTextLiteral(s[start:end]), start - 1, end + 1)

    def doc_emphasize(
        self, s,
        expr = re.compile('\s*\*([ \na-zA-Z0-9.:/;,\'\"\?]+)\*(?!\*|-)').search
        ):
        """Find the first ``*emphasized*`` run in ``s``.

        Returns ``(StructuredTextEmphasis, start, end)``, where the span
        covers both asterisks, or None.
        """
        r = expr(s)
        if not r:
            return None
        start, end = r.span(1)
        return (StructuredTextEmphasis(s[start:end]), start - 1, end + 1)

    def doc_inner_link(self,
                       s,
                       expr1 = re.compile("\.\.\s*").search,
                       expr2 = re.compile("\[[a-zA-Z0-9]+\]").search):
        """Find the first ``[reference]`` in ``s`` that is not a named link.

        Returns ``(StructuredTextInnerLink, start, end)``, where the node
        value is the text between the brackets and the span covers the
        brackets, or None.
        """
        reference = expr2(s)
        if not reference:
            return None
        start, end = reference.span()

        # make sure we dont grab a named link: a '..' that runs straight
        # into the bracket marks a named link target
        dots = expr1(s)
        if dots and dots.span()[1] == start:
            return None

        # The original indexed s with a tuple and passed start/end to the
        # node constructor, so the "'..' is somewhere else" case always
        # raised TypeError.
        return (StructuredTextInnerLink(s[start + 1:end - 1]), start, end)

    def doc_named_link(self,
                       s,
                       expr=re.compile("(\.\.\s)(\[[a-zA-Z0-9]+\])").search):
        """Find the first ``.. [reference]`` named link in ``s``.

        Returns ``(StructuredTextNamedLink, start, end)``, where the node
        value is '..' immediately followed by the bracketed reference, or
        None.
        """
        result = expr(s)
        if not result:
            return None
        ref_start, ref_end = result.span(2)
        dots_start, dots_end = result.span(1)
        label = s[dots_start:dots_end].strip() + s[ref_start:ref_end]
        start, end = result.span()
        return (StructuredTextNamedLink(label), start, end)

    def doc_underline(self,
                      s,
                      expr=re.compile("\_([a-zA-Z0-9\s\.,\?]+)\_").search):
        """Find the first ``_underlined_`` run in ``s``.

        Returns ``(StructuredTextUnderline, start, end)``, where the span
        covers both underscores, or None.
        """
        result = expr(s)
        if not result:
            return None
        start, end = result.span(1)
        whole_start, whole_end = result.span()
        return (StructuredTextUnderline(s[start:end]), whole_start, whole_end)

    def doc_strong(self,
                   s,
                   expr = re.compile('\s*\*\*([ \na-zA-Z0-9.:/;\-,!\?\'\"]+)\*\*').search
                   ):
        """Find the first ``**strong**`` run in ``s``.

        Returns ``(StructuredTextStrong, start, end)``, where the span
        covers both pairs of asterisks, or None.
        """
        r = expr(s)
        if not r:
            return None
        start, end = r.span(1)
        return (StructuredTextStrong(s[start:end]), start - 2, end + 2)

    def doc_href(

        self, s,
        expr1 = re.compile("(\"[ a-zA-Z0-9\n\-\.\,\;\(\)\/\:\/]+\")(:)([a-zA-Z0-9\:\/\.\~\-]+)([,]*\s*)").search,
        expr2 = re.compile('(\"[ a-zA-Z0-9\n\-\.\:\;\(\)\/]+\")([,]+\s+)([a-zA-Z0-9\@\.\,\?\!\/\:\;\-\#]+)(\s*)').search):
        """Find the first ``"title":target`` or ``"title", target`` link.

        Returns ``(StructuredTextLink, start, end)`` or None.  The node
        value is the title without its quotes and the target is stored as
        the ``href`` attribute.  The span runs from the opening quote to
        the end of the target; one trailing punctuation character is left
        out of both the target and the span.
        """
        punctuation = re.compile("[\,\.\?\!\;]+").match
        r = expr1(s) or expr2(s)
        if not r:
            return None

        # name is the href title, link is the target of the href
        start, title_end = r.span(1)
        name = s[start:title_end].replace('"', '', 2)

        link_start, end = r.span(3)
        if punctuation(s[end - 1:end]):
            end = end - 1
        link = s[link_start:end]

        return (StructuredTextLink(name, href=link), start, end)

    def doc_sgml(self,s,expr=re.compile("\<[a-zA-Z0-9\.\=\'\"\:\/\-\#\+\s]+\>").search):
        """Find the first SGML tag in ``s``.

        SGML text is ignored by the colorizer and output as-is.  Returns
        ``(StructuredTextSGML, start, end)`` or None.
        """
        r = expr(s)
        if not r:
            return None
        start, end = r.span()
        return (StructuredTextSGML(s[start:end]), start, end)