##// END OF EJS Templates
Fixed: https urls in the wiki are not displayed as external (closes #943)....
Jean-Philippe Lang -
r1286:85858cebe64a
parent child
Show More
@@ -1,1140 +1,1140
1 1 # vim:ts=4:sw=4:
2 2 # = RedCloth - Textile and Markdown Hybrid for Ruby
3 3 #
4 4 # Homepage:: http://whytheluckystiff.net/ruby/redcloth/
5 5 # Author:: why the lucky stiff (http://whytheluckystiff.net/)
6 6 # Copyright:: (cc) 2004 why the lucky stiff (and his puppet organizations.)
7 7 # License:: BSD
8 8 #
9 9 # (see http://hobix.com/textile/ for a Textile Reference.)
10 10 #
11 11 # Based on (and also inspired by) both:
12 12 #
13 13 # PyTextile: http://diveintomark.org/projects/textile/textile.py.txt
14 14 # Textism for PHP: http://www.textism.com/tools/textile/
15 15 #
16 16 #
17 17
18 18 # = RedCloth
19 19 #
20 20 # RedCloth is a Ruby library for converting Textile and/or Markdown
21 21 # into HTML. You can use either format, intermingled or separately.
22 22 # You can also extend RedCloth to honor your own custom text stylings.
23 23 #
24 24 # RedCloth users are encouraged to use Textile if they are generating
25 25 # HTML and to use Markdown if others will be viewing the plain text.
26 26 #
27 27 # == What is Textile?
28 28 #
29 29 # Textile is a simple formatting style for text
30 30 # documents, loosely based on some HTML conventions.
31 31 #
32 32 # == Sample Textile Text
33 33 #
34 34 # h2. This is a title
35 35 #
36 36 # h3. This is a subhead
37 37 #
38 38 # This is a bit of paragraph.
39 39 #
40 40 # bq. This is a blockquote.
41 41 #
42 42 # = Writing Textile
43 43 #
44 44 # A Textile document consists of paragraphs. Paragraphs
45 45 # can be specially formatted by adding a small instruction
46 46 # to the beginning of the paragraph.
47 47 #
48 48 # h[n]. Header of size [n].
49 49 # bq. Blockquote.
50 50 # # Numeric list.
51 51 # * Bulleted list.
52 52 #
53 53 # == Quick Phrase Modifiers
54 54 #
55 55 # Quick phrase modifiers are also included, to allow formatting
56 56 # of small portions of text within a paragraph.
57 57 #
58 58 # \_emphasis\_
59 59 # \_\_italicized\_\_
60 60 # \*strong\*
61 61 # \*\*bold\*\*
62 62 # ??citation??
63 63 # -deleted text-
64 64 # +inserted text+
65 65 # ^superscript^
66 66 # ~subscript~
67 67 # @code@
68 68 # %(classname)span%
69 69 #
70 70 # ==notextile== (leave text alone)
71 71 #
72 72 # == Links
73 73 #
74 74 # To make a hypertext link, put the link text in "quotation
75 75 # marks" followed immediately by a colon and the URL of the link.
76 76 #
77 77 # Optional: text in (parentheses) following the link text,
78 78 # but before the closing quotation mark, will become a Title
79 79 # attribute for the link, visible as a tool tip when a cursor is above it.
80 80 #
81 81 # Example:
82 82 #
83 83 # "This is a link (This is a title) ":http://www.textism.com
84 84 #
85 85 # Will become:
86 86 #
87 87 # <a href="http://www.textism.com" title="This is a title">This is a link</a>
88 88 #
89 89 # == Images
90 90 #
91 91 # To insert an image, put the URL for the image inside exclamation marks.
92 92 #
93 93 # Optional: text that immediately follows the URL in (parentheses) will
94 94 # be used as the Alt text for the image. Images on the web should always
95 95 # have descriptive Alt text for the benefit of readers using non-graphical
96 96 # browsers.
97 97 #
98 98 # Optional: place a colon followed by a URL immediately after the
99 99 # closing ! to make the image into a link.
100 100 #
101 101 # Example:
102 102 #
103 103 # !http://www.textism.com/common/textist.gif(Textist)!
104 104 #
105 105 # Will become:
106 106 #
107 107 # <img src="http://www.textism.com/common/textist.gif" alt="Textist" />
108 108 #
109 109 # With a link:
110 110 #
111 111 # !/common/textist.gif(Textist)!:http://textism.com
112 112 #
113 113 # Will become:
114 114 #
115 115 # <a href="http://textism.com"><img src="/common/textist.gif" alt="Textist" /></a>
116 116 #
117 117 # == Defining Acronyms
118 118 #
119 119 # HTML allows authors to define acronyms via the <acronym> tag. The definition appears as a
120 120 # tool tip when a cursor hovers over the acronym. A crucial aid to clear writing,
121 121 # this should be used at least once for each acronym in documents where they appear.
122 122 #
123 123 # To quickly define an acronym in Textile, place the full text in (parentheses)
124 124 # immediately following the acronym.
125 125 #
126 126 # Example:
127 127 #
128 128 # ACLU(American Civil Liberties Union)
129 129 #
130 130 # Will become:
131 131 #
132 132 # <acronym title="American Civil Liberties Union">ACLU</acronym>
133 133 #
134 134 # == Adding Tables
135 135 #
136 136 # In Textile, simple tables can be added by separating each column by
137 137 # a pipe.
138 138 #
139 139 # |a|simple|table|row|
140 140 # |And|Another|table|row|
141 141 #
142 142 # Attributes are defined by style definitions in parentheses.
143 143 #
144 144 # table(border:1px solid black).
145 145 # (background:#ddd;color:red). |{}| | | |
146 146 #
147 147 # == Using RedCloth
148 148 #
149 149 # RedCloth is simply an extension of the String class, which can handle
150 150 # Textile formatting. Use it like a String and output HTML with its
151 151 # RedCloth#to_html method.
152 152 #
153 153 # doc = RedCloth.new "
154 154 #
155 155 # h2. Test document
156 156 #
157 157 # Just a simple test."
158 158 #
159 159 # puts doc.to_html
160 160 #
161 161 # By default, RedCloth uses both Textile and Markdown formatting, with
162 162 # Textile formatting taking precedence. If you want to turn off Markdown
163 163 # formatting, to boost speed and limit the processor:
164 164 #
165 165 # class RedCloth::Textile.new( str )
166 166
167 167 class RedCloth < String
168 168
169 169 VERSION = '3.0.4'
170 170 DEFAULT_RULES = [:textile, :markdown]
171 171
172 172 #
173 173 # Two accessors for setting security restrictions.
174 174 #
175 175 # This is a nice thing if you're using RedCloth for
176 176 # formatting in public places (e.g. Wikis) where you
177 177 # don't want users to abuse HTML for bad things.
178 178 #
179 179 # If +:filter_html+ is set, HTML which wasn't
180 180 # created by the Textile processor will be escaped.
181 181 #
182 182 # If +:filter_styles+ is set, it will also disable
183 183 # the style markup specifier. ('{color: red}')
184 184 #
185 185 attr_accessor :filter_html, :filter_styles
186 186
187 187 #
188 188 # Accessor for toggling hard breaks.
189 189 #
190 190 # If +:hard_breaks+ is set, single newlines will
191 191 # be converted to HTML break tags. This is the
192 192 # default behavior for traditional RedCloth.
193 193 #
194 194 attr_accessor :hard_breaks
195 195
196 196 # Accessor for toggling lite mode.
197 197 #
198 198 # In lite mode, block-level rules are ignored. This means
199 199 # that tables, paragraphs, lists, and such aren't available.
200 200 # Only the inline markup for bold, italics, entities and so on.
201 201 #
202 202 # r = RedCloth.new( "And then? She *fell*!", [:lite_mode] )
203 203 # r.to_html
204 204 # #=> "And then? She <strong>fell</strong>!"
205 205 #
206 206 attr_accessor :lite_mode
207 207
208 208 #
209 209 # Accessor for toggling span caps.
210 210 #
211 211 # Textile places `span' tags around capitalized
212 212 # words by default, but this wreaks havoc on Wikis.
213 213 # If +:no_span_caps+ is set, this will be
214 214 # suppressed.
215 215 #
216 216 attr_accessor :no_span_caps
217 217
218 218 #
219 219 # Establishes the markup precedence. Available rules include:
220 220 #
221 221 # == Textile Rules
222 222 #
223 223 # The following textile rules can be set individually. Or add the complete
224 224 # set of rules with the single :textile rule, which supplies the rule set in
225 225 # the following precedence:
226 226 #
227 227 # refs_textile:: Textile references (i.e. [hobix]http://hobix.com/)
228 228 # block_textile_table:: Textile table block structures
229 229 # block_textile_lists:: Textile list structures
230 230 # block_textile_prefix:: Textile blocks with prefixes (i.e. bq., h2., etc.)
231 231 # inline_textile_image:: Textile inline images
232 232 # inline_textile_link:: Textile inline links
233 233 # inline_textile_span:: Textile inline spans
234 234 # glyphs_textile:: Textile entities (such as em-dashes and smart quotes)
235 235 #
236 236 # == Markdown
237 237 #
238 238 # refs_markdown:: Markdown references (for example: [hobix]: http://hobix.com/)
239 239 # block_markdown_setext:: Markdown setext headers
240 240 # block_markdown_atx:: Markdown atx headers
241 241 # block_markdown_rule:: Markdown horizontal rules
242 242 # block_markdown_bq:: Markdown blockquotes
243 243 # block_markdown_lists:: Markdown lists
244 244 # inline_markdown_link:: Markdown links
245 245 attr_accessor :rules
246 246
# Creates a RedCloth document from _string_.
#
# Each symbol in _restrictions_ names one of the boolean accessors
# declared on this class (for instance +:filter_html+ or +:lite_mode+);
# the matching writer is called with +true+ before the string contents
# are stored.
#
#   r = RedCloth.new( "h1. A <b>bold</b> man", [:filter_html] )
#   r.to_html
#     #=>"<h1>A &lt;b&gt;bold&lt;/b&gt; man</h1>"
#
def initialize( string, restrictions = [] )
    restrictions.each do |restriction|
        writer = method( "#{ restriction }=" )
        writer.call( true )
    end
    super( string )
end
258 258
259 259 #
260 260 # Generates HTML from the Textile contents.
261 261 #
# Any +rules+ given replace DEFAULT_RULES.  The :textile and :markdown
# symbols expand to their full rule lists; any other symbol is kept as
# an individual rule name.  All work happens on a copy of the receiver.
#
262 262 # r = RedCloth.new( "And then? She *fell*!" )
263 263 # r.to_html
264 264 # #=>"<p>And then? She <strong>fell</strong>!</p>"
265 265 #
266 266 def to_html( *rules )
267 267 rules = DEFAULT_RULES if rules.empty?
268 268 # make our working copy
269 269 text = self.dup
270 270
# per-run state: reference table filled by the refs_* rules, and the
# shelf of strings parked by shelve until retrieve puts them back
271 271 @urlrefs = {}
272 272 @shelf = []
273 273 textile_rules = [:refs_textile, :block_textile_table, :block_textile_lists,
274 274 :block_textile_prefix, :inline_textile_image, :inline_textile_link,
275 275 :inline_textile_code, :inline_textile_span]
276 276 markdown_rules = [:refs_markdown, :block_markdown_setext, :block_markdown_atx, :block_markdown_rule,
277 277 :block_markdown_bq, :block_markdown_lists,
278 278 :inline_markdown_reflink, :inline_markdown_link]
# expand the :markdown / :textile shorthands into one flat rule list
279 279 @rules = rules.collect do |rule|
280 280 case rule
281 281 when :markdown
282 282 markdown_rules
283 283 when :textile
284 284 textile_rules
285 285 else
286 286 rule
287 287 end
288 288 end.flatten
289 289
290 290 # standard clean up
291 291 incoming_entities text
292 292 clean_white_space text
293 293
294 294 # start processor
# @pre_list collects the content that rip_offtags pulls out of the text;
# smooth_offtags re-inserts it below
295 295 @pre_list = []
296 296 rip_offtags text
297 297 no_textile text
298 298 escape_html_tags text
299 299 hard_break text
# lite mode skips reference collection and all block-level rules
300 300 unless @lite_mode
301 301 refs text
302 302 blocks text
303 303 end
304 304 inline text
305 305 smooth_offtags text
306 306
307 307 retrieve text
308 308
309 309 text.gsub!( /<\/?notextile>/, '' )
# restore the ampersands that incoming_entities masked as "x%x%"
310 310 text.gsub!( /x%x%/, '&#38;' )
311 311 clean_html text if filter_html
312 312 text.strip!
313 313 text
314 314
315 315 end
316 316
317 317 #######
318 318 private
319 319 #######
#
# Mapping of the 8-bit codes 128..159 to HTML numerical entity
# equivalents (from PyTextile).  Each element is a two-item array:
# the single-byte character and its replacement text.  Codes paired
# with 0 have no equivalent and map to an empty string.
#
TEXTILE_TAGS =

    [[128, 8364], [129, 0], [130, 8218], [131, 402], [132, 8222], [133, 8230],
     [134, 8224], [135, 8225], [136, 710], [137, 8240], [138, 352], [139, 8249],
     [140, 338], [141, 0], [142, 0], [143, 0], [144, 0], [145, 8216], [146, 8217],
     [147, 8220], [148, 8221], [149, 8226], [150, 8211], [151, 8212], [152, 732],
     [153, 8482], [154, 353], [155, 8250], [156, 339], [157, 0], [158, 0], [159, 376]].
    collect! do |code, entity|
        # "&##{ entity };" keeps the literal '#' of the numeric entity; a
        # bare "&#{ entity };" is parsed as interpolation and drops it.
        [code.chr, ( entity.zero? ? "" : "&##{ entity };" )]
    end
335 335
336 336 #
337 337 # Regular expressions to convert to HTML.
338 338 #
# A_HLGN / A_VLGN: horizontal and vertical alignment markers (their
# values are looked up through H_ALGN_VALS / V_ALGN_VALS); A_HLGN also
# accepts runs of parentheses, which pba reads as padding.
339 339 A_HLGN = /(?:(?:<>|<|>|\=|[()]+)+)/
340 340 A_VLGN = /[\-^~]/
# C_CLAS "(class)", C_LNGE "[lang]", C_STYL "{style}" modifier fragments.
341 341 C_CLAS = '(?:\([^)]+\))'
342 342 C_LNGE = '(?:\[[^\]]+\])'
343 343 C_STYL = '(?:\{[^}]+\})'
# S_CSPN backslash+digits and S_RSPN slash+digits: the column / row span
# markers that pba parses for 'td' elements.
344 344 S_CSPN = '(?:\\\\\d+)'
345 345 S_RSPN = '(?:/\d+)'
# Composite fragments: A = alignment, S = spans, C = class/style/lang in
# any of three accepted orders.  All are non-capturing, so embedding them
# does not shift the group numbers of the enclosing pattern.
346 346 A = "(?:#{A_HLGN}?#{A_VLGN}?|#{A_VLGN}?#{A_HLGN}?)"
347 347 S = "(?:#{S_CSPN}?#{S_RSPN}|#{S_RSPN}?#{S_CSPN}?)"
348 348 C = "(?:#{C_CLAS}?#{C_STYL}?#{C_LNGE}?|#{C_STYL}?#{C_LNGE}?#{C_CLAS}?|#{C_LNGE}?#{C_STYL}?#{C_CLAS}?)"
# Regexp-quoted punctuation sets, meant for use inside character classes.
349 349 # PUNCT = Regexp::quote( '!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~' )
350 350 PUNCT = Regexp::quote( '!"#$%&\'*+,-./:;=?@\\^_`|~' )
351 351 PUNCT_NOQ = Regexp::quote( '!"#$&\',./:;=?@\\`|' )
352 352 PUNCT_Q = Regexp::quote( '*-_+^~%' )
# HYPERLINK adds two capture groups wherever it is embedded: the URL body
# and any trailing punctuation; it must be followed by whitespace, '<' or
# end of line.
353 353 HYPERLINK = '(\S+?)([^\w\s/;=\?]*?)(?=\s|<|$)'
354 354
# Text markup tags, don't conflict with block tags.
# +blocks+ still processes a block that opens with one of these tags;
# a block opening with any other tag is passed through untouched.
SIMPLE_HTML_TAGS = [
    'tt', 'b', 'i', 'big', 'small', 'em', 'strong', 'dfn', 'code',
    'samp', 'kbd', 'var', 'cite', 'abbr', 'acronym', 'a', 'img', 'br',
    'map', 'q', 'sub', 'sup', 'span', 'bdo'
]
361 361
# Quick phrase modifiers.  Each entry starts as
# [textile marker, HTML tag, rule type]; the collect! below rewrites it to
# [marker, tag, compiled regexp, rule type], which is the shape that
# inline_textile_span iterates over.
# Two-character markers are listed before their one-character prefixes.
362 362 QTAGS = [
363 363 ['**', 'b', :limit],
364 364 ['*', 'strong', :limit],
365 365 ['??', 'cite', :limit],
366 366 ['-', 'del', :limit],
367 367 ['__', 'i', :limit],
368 368 ['_', 'em', :limit],
369 369 ['%', 'span', :limit],
370 370 ['+', 'ins', :limit],
371 371 ['^', 'sup', :limit],
372 372 ['~', 'sub', :limit]
373 373 ]
# :limit patterns capture (1) the preceding start-of-line, '>' or
# whitespace, (2) the marker, (3) attribute modifiers, (4) an optional
# ":cite" and (5) the content.  Every entry above is :limit, so the else
# branch (no leading-context group) is currently unused.
374 374 QTAGS.collect! do |rc, ht, rtype|
375 375 rcq = Regexp::quote rc
376 376 re =
377 377 case rtype
378 378 when :limit
379 379 /(^|[>\s])
380 380 (#{rcq})
381 381 (#{C})
382 382 (?::(\S+?))?
383 383 ([^\s\-].*?[^\s\-]|\w)
384 384 #{rcq}
385 385 (?=[[:punct:]]|\s|$)/x
386 386 else
387 387 /(#{rcq})
388 388 (#{C})
389 389 (?::(\S+))?
390 390 ([^\s\-].*?[^\s\-]|\w)
391 391 #{rcq}/xm
392 392 end
393 393 [rc, ht, re, rtype]
394 394 end
395 395
396 396 # Elements to handle
# Each entry is [pattern, replacement] with an optional third symbol.
# pgl applies the entries in order and skips an entry when the accessor
# named by that symbol returns true (only the caps rule has one).
# The quote rules are commented out, so quotes are left untouched here.
397 397 GLYPHS = [
398 398 # [ /([^\s\[{(>])?\'([dmst]\b|ll\b|ve\b|\s|:|$)/, '\1&#8217;\2' ], # single closing
399 399 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)\'/, '\1&#8217;' ], # single closing
400 400 # [ /\'(?=[#{PUNCT_Q}]*(s\b|[\s#{PUNCT_NOQ}]))/, '&#8217;' ], # single closing
401 401 # [ /\'/, '&#8216;' ], # single opening
402 402 [ /</, '&lt;' ], # less-than
403 403 [ />/, '&gt;' ], # greater-than
404 404 # [ /([^\s\[{(])?"(\s|:|$)/, '\1&#8221;\2' ], # double closing
405 405 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)"/, '\1&#8221;' ], # double closing
406 406 # [ /"(?=[#{PUNCT_Q}]*[\s#{PUNCT_NOQ}])/, '&#8221;' ], # double closing
407 407 # [ /"/, '&#8220;' ], # double opening
408 408 [ /\b( )?\.{3}/, '\1&#8230;' ], # ellipsis
409 409 [ /\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/, '<acronym title="\2">\1</acronym>' ], # 3+ uppercase acronym
410 410 [ /(^|[^"][>\s])([A-Z][A-Z0-9 ]+[A-Z0-9])([^<A-Za-z0-9]|$)/, '\1<span class="caps">\2</span>\3', :no_span_caps ], # 3+ uppercase caps
411 411 [ /(\.\s)?\s?--\s?/, '\1&#8212;' ], # em dash
412 412 [ /\s->\s/, ' &rarr; ' ], # right arrow
413 413 [ /\s-\s/, ' &#8211; ' ], # en dash
414 414 [ /(\d+) ?x ?(\d+)/, '\1&#215;\2' ], # dimension sign
415 415 [ /\b ?[(\[]TM[\])]/i, '&#8482;' ], # trademark
416 416 [ /\b ?[(\[]R[\])]/i, '&#174;' ], # registered
417 417 [ /\b ?[(\[]C[\])]/i, '&#169;' ] # copyright
418 418 ]
419 419
# Horizontal alignment marker => keyword, looked up by h_align.  The
# keyword is emitted by pba as a text-align value and by
# inline_textile_image as a float value.
420 420 H_ALGN_VALS = {
421 421 '<' => 'left',
422 422 '=' => 'center',
423 423 '>' => 'right',
424 424 '<>' => 'justify'
425 425 }
426 426
# Vertical alignment marker => keyword, looked up by v_align and emitted
# by pba as a vertical-align value for table cells.
427 427 V_ALGN_VALS = {
428 428 '^' => 'top',
429 429 '-' => 'middle',
430 430 '~' => 'bottom'
431 431 }
432 432
#
# Flexible HTML escaping.
#
# Escapes +str+ in place and returns it.  '&', '<' and '>' are always
# escaped.  Double quotes are escaped unless +mode+ is :NoQuotes; single
# quotes are escaped only when +mode+ is :Quotes.
#
def htmlesc( str, mode )
    # '&' must go first so the entities produced below are not re-escaped
    str.gsub!( '&', '&amp;' )
    str.gsub!( '"', '&quot;' ) unless mode == :NoQuotes
    str.gsub!( "'", '&#039;' ) if mode == :Quotes
    str.gsub!( '<', '&lt;' )
    str.gsub!( '>', '&gt;' )
    # gsub! yields nil when nothing matched; always hand back the string
    str
end
443 443
# Applies every GLYPHS substitution to +text+ in place (dashes, ellipsis,
# acronyms and other symbols).  An entry carrying a toggle symbol is
# skipped when the accessor of that name returns a true value.
def pgl( text )
    GLYPHS.each do |pattern, replacement, toggle|
        suppressed = toggle && method( toggle ).call
        text.gsub!( pattern, replacement ) unless suppressed
    end
end
451 451
# Parses a Textile attribute list and builds an HTML attribute string.
#
# +text_in+ is the raw modifier text (for example "(cls#id){color:red}[en]")
# or nil.  +element+ is the tag being decorated; only 'td' enables the
# colspan / rowspan / vertical-align parsing.
#
# Returns '' for nil input, otherwise a string such as
# ' style="..." class="..."' ready to be placed right after a tag name.
# Double quotes inside user-supplied values are escaped so that a value
# cannot close its attribute early and inject further attributes.
def pba( text_in, element = "" )

    return '' unless text_in

    quote = lambda { |value| value.to_s.gsub( '"', '&quot;' ) }

    style = []
    text = text_in.dup
    if element == 'td'
        colspan = $1 if text =~ /\\(\d+)/
        rowspan = $1 if text =~ /\/(\d+)/
        style << "vertical-align:#{ v_align( $& ) };" if text =~ A_VLGN
    end

    # {css}: when styles are filtered the braces are deliberately left in
    # the text, exactly as before
    if !filter_styles && text.sub!( /\{([^}]*)\}/, '' )
        style << "#{ $1 };"
    end

    # [lang]: same character class as C_LNGE
    lang = $1 if text.sub!( /\[([^\]]+?)\]/, '' )

    # (class) or (class#id)
    cls = $1 if text.sub!( /\(([^()]+?)\)/, '' )

    # any parentheses still left are padding markers, one em per paren
    style << "padding-left:#{ $1.length }em;" if text.sub!( /([(]+)/, '' )
    style << "padding-right:#{ $1.length }em;" if text.sub!( /([)]+)/, '' )

    style << "text-align:#{ h_align( $& ) };" if text =~ A_HLGN

    cls, id = $1, $2 if cls =~ /^(.*?)#(.*)$/

    atts = ''
    atts << " style=\"#{ quote.call( style.join ) }\"" unless style.empty?
    atts << " class=\"#{ quote.call( cls ) }\"" unless cls.to_s.empty?
    atts << " lang=\"#{ quote.call( lang ) }\"" if lang
    atts << " id=\"#{ quote.call( id ) }\"" if id
    atts << " colspan=\"#{ colspan }\"" if colspan
    atts << " rowspan=\"#{ rowspan }\"" if rowspan

    atts
end
493 493
# TABLE_RE captures: $1 the modifiers of an optional leading "table....."
# line, $2 the rows (from the first row's optional modifiers through the
# last '|' before a blank line or end of text), $3 the terminator.
494 494 TABLE_RE = /^(?:table(_?#{S}#{A}#{C})\. ?\n)?^(#{A}#{C}\.? ?\|.*?\|)(\n\n|\Z)/m
495 495
496 496 # Parses a Textile table block, building HTML from the result.
# Replaces each table in +text+ in place.  Attribute strings are parked
# with shelve, so the markup holds placeholders until retrieve runs.
497 497 def block_textile_table( text )
498 498 text.gsub!( TABLE_RE ) do |matches|
499 499
500 500 tatts, fullrow = $~[1..2]
501 501 tatts = pba( tatts, 'table' )
502 502 tatts = shelve( tatts ) if tatts
503 503 rows = []
504 504
# rows are separated by a '|' at the end of a line
505 505 fullrow.
506 506 split( /\|$/m ).
507 507 delete_if { |x| x.empty? }.
508 508 each do |row|
509 509
# optional row modifiers ("(class). ") before the first cell
510 510 ratts, row = pba( $1, 'tr' ), $2 if row =~ /^(#{A}#{C}\. )(.*)/m
511 511
512 512 cells = []
513 513 #row.split( /\(?!\[\[[^\]])|(?![^\[]\]\])/ ).each do |cell|
# split on '|' unless the pipe is followed by "]]" with no '[' or '|'
# in between (i.e. it sits inside a [[...|...]] construct)
514 514 row.split( /\|(?![^\[\|]*\]\])/ ).each do |cell|
# a leading '_' marks a header cell (<th>), otherwise <td>
515 515 ctyp = 'd'
516 516 ctyp = 'h' if cell =~ /^_/
517 517
518 518 catts = ''
519 519 catts, cell = pba( $1, 'td' ), $2 if cell =~ /^(_?#{S}#{A}#{C}\. ?)(.*)/
520 520
# cells that are empty after stripping are dropped
521 521 unless cell.strip.empty?
522 522 catts = shelve( catts ) if catts
523 523 cells << "\t\t\t<t#{ ctyp }#{ catts }>#{ cell }</t#{ ctyp }>"
524 524 end
525 525 end
526 526 ratts = shelve( ratts ) if ratts
527 527 rows << "\t\t<tr#{ ratts }>\n#{ cells.join( "\n" ) }\n\t\t</tr>"
528 528 end
529 529 "\t<table#{ tatts }>\n#{ rows.join( "\n" ) }\n\t</table>\n\n"
530 530 end
531 531 end
532 532
# LISTS_RE grabs a run of lines that starts with a '#'/'*' marker;
# LISTS_CONTENT_RE splits one such line into $1 marker run, $2 modifiers
# and $3 content.
533 533 LISTS_RE = /^([#*]+?#{C} .*?)$(?![^#*])/m
534 534 LISTS_CONTENT_RE = /^([#*]+)(#{A}#{C}) (.*)$/m
535 535
536 536 # Parses Textile lists and generates HTML
# Rewrites each list in +text+ in place.  +depth+ is a stack of the marker
# strings of the lists currently open; lT turns a marker into 'o' or 'u'.
537 537 def block_textile_lists( text )
538 538 text.gsub!( LISTS_RE ) do |match|
539 539 lines = match.split( /\n/ )
540 540 last_line = -1
541 541 depth = []
542 542 lines.each_with_index do |line, line_id|
543 543 if line =~ LISTS_CONTENT_RE
544 544 tl,atts,content = $~[1..3]
545 545 if depth.last
# shallower marker than the open list: close lists (appending to the
# previous line) until one with the same marker length is on top
546 546 if depth.last.length > tl.length
547 547 (depth.length - 1).downto(0) do |i|
548 548 break if depth[i].length == tl.length
549 549 lines[line_id - 1] << "</li>\n\t</#{ lT( depth[i] ) }l>\n\t"
550 550 depth.pop
551 551 end
552 552 end
# same level as the open list: just close the previous item
553 553 if depth.last and depth.last.length == tl.length
554 554 lines[line_id - 1] << '</li>'
555 555 end
556 556 end
# a marker different from the one on top opens a new (nested) list
557 557 unless depth.last == tl
558 558 depth << tl
559 559 atts = pba( atts )
560 560 atts = shelve( atts ) if atts
561 561 lines[line_id] = "\t<#{ lT(tl) }l#{ atts }>\n\t<li>#{ content }"
562 562 else
563 563 lines[line_id] = "\t\t<li>#{ content }"
564 564 end
565 565 last_line = line_id
566 566
567 567 else
568 568 last_line = line_id
569 569 end
# on the final line, close every list that is still open; the block's
# value (the appended string) is truthy, so delete_if also empties depth
570 570 if line_id - last_line > 1 or line_id == lines.length - 1
571 571 depth.delete_if do |v|
572 572 lines[last_line] << "</li>\n\t</#{ lT( v ) }l>"
573 573 end
574 574 end
575 575 end
576 576 lines.join( "\n" )
577 577 end
578 578 end
579 579
# Matches an inline @code@ span, optionally tagged as @|lang|code@.
# $1 is the non-word character before the opening '@', $2 the optional
# language and $3 the code.  The character after the closing '@' is only
# looked at (lookahead), never consumed.
CODE_RE = /(\W)
    @
    (?:\|(\w+?)\|)?
    (.+?)
    @
    (?=\W)/x

# Replaces every @code@ span in +text+ with a <code> element and passes
# the generated markup through rip_offtags.  Modifies +text+ in place and
# returns gsub!'s result (nil when nothing matched).
def inline_textile_code( text )
    text.gsub!( CODE_RE ) do
        before, lang, code = $~[1..3]
        lang = " lang=\"#{ lang }\"" if lang
        rip_offtags( "#{ before }<code#{ lang }>#{ code }</code>" )
    end
end
594 594
# Returns the list-type letter for a list marker: 'o' (ordered) when the
# marker ends in '#', 'u' (unordered) otherwise.  Callers append 'l' to
# form the tag name.
def lT( text )
    if text =~ /\#$/
        'o'
    else
        'u'
    end
end
598 598
# When hard_breaks is enabled, replaces a newline that follows some
# character with a break tag, in place.  A newline is kept when it ends
# the text, or when the next line starts (after optional spaces) with a
# run of '#', '*' or '=' followed by whitespace or end of line, or with
# '{' or '|'.
def hard_break( text )
    return unless hard_breaks
    text.gsub!( /(.)\n(?!\Z| *([#*=]+(\s|$)|[{|]))/, "\\1<br />" )
end
602 602
# Blocks are separated by two or more newlines not followed by a space.
603 603 BLOCKS_GROUP_RE = /\n{2,}(?! )/m
604 604
# Splits +text+ into blocks, runs the block_* rules from @rules on each
# and replaces the contents of +text+ with the re-joined result.  A block
# that no rule claimed is wrapped in <p>, or in <pre><code> when
# +deep_code+ is set (the recursive call for indented sub-blocks).
605 605 def blocks( text, deep_code = false )
606 606 text.replace( text.split( BLOCKS_GROUP_RE ).collect do |blk|
# "plain" = the block does not start with '#', '*', '>' or a space
607 607 plain = blk !~ /\A[#*> ]/
608 608
609 609 # skip blocks that are complex HTML
610 610 if blk =~ /^<\/?(\w+).*>/ and not SIMPLE_HTML_TAGS.include? $1
611 611 blk
612 612 else
613 613 # search for indentation levels
614 614 blk.strip!
615 615 if blk.empty?
616 616 blk
617 617 else
618 618 code_blk = nil
# indented sub-blocks are flushed left and processed recursively; inside
# a plain block they are pulled out and re-attached after the block
619 619 blk.gsub!( /((?:\n(?:\n^ +[^\n]*)+)+)/m ) do |iblk|
620 620 flush_left iblk
621 621 blocks iblk, plain
# NOTE(review): non-bang gsub, its result is discarded -- confirm
# whether gsub! was intended here
622 622 iblk.gsub( /^(\S)/, "\t\\1" )
623 623 if plain
624 624 code_blk = iblk; ""
625 625 else
626 626 iblk
627 627 end
628 628 end
629 629
# count the block_* rules whose method returned a true value
630 630 block_applied = 0
631 631 @rules.each do |rule_name|
632 632 block_applied += 1 if ( rule_name.to_s.match /^block_/ and method( rule_name ).call( blk ) )
633 633 end
634 634 if block_applied.zero?
635 635 if deep_code
636 636 blk = "\t<pre><code>#{ blk }</code></pre>"
637 637 else
638 638 blk = "\t<p>#{ blk }</p>"
639 639 end
640 640 end
641 641 # hard_break blk
642 642 blk + "\n#{ code_blk }"
643 643 end
644 644 end
645 645
646 646 end.join( "\n\n" ) )
647 647 end
648 648
# Handler for "bq." blocks: wraps +content+ in <blockquote><p>.
# +cite+ is resolved through check_refs and, when present, emitted as the
# blockquote's cite attribute; +atts+ is shelved and attached to the inner
# paragraph.  +tag+ is accepted for handler-signature compatibility only.
def textile_bq( tag, atts, cite, content )
    cite_url = check_refs( cite ).first
    cite_attr = cite_url ? " cite=\"#{ cite_url }\"" : cite_url
    shelved = atts ? shelve( atts ) : atts
    "\t<blockquote#{ cite_attr }>\n\t\t<p#{ shelved }>#{ content }</p>\n\t</blockquote>"
end
655 655
# Handler for simple prefixed blocks: wraps +content+ in <tag>...</tag>
# with the shelved +atts+.  +cite+ is accepted for handler-signature
# compatibility and ignored.
def textile_p( tag, atts, cite, content )
    shelved = atts && shelve( atts )
    "\t<#{ tag }#{ shelved }>#{ content }</#{ tag }>"
end

# Headings share the paragraph handler; the tag name is passed in.
alias textile_h1 textile_p
alias textile_h2 textile_p
alias textile_h3 textile_p
alias textile_h4 textile_p
alias textile_h5 textile_p
alias textile_h6 textile_p
667 667
# Handler for footnote blocks ("fn1. text"): emits a paragraph whose id is
# "fn<num>" and whose content is prefixed with the number in <sup>.
# The id attribute is appended to the +atts+ string passed in, which is
# then shelved.  +tag+ and +cite+ are accepted for handler-signature
# compatibility only.
def textile_fn_( tag, num, atts, cite, content )
    atts << " id=\"fn#{ num }\""
    placeholder = atts ? shelve( atts ) : atts
    "\t<p#{ placeholder }><sup>#{ num }</sup> #{ content }</p>"
end
674 674
# Matches a prefixed block such as "h2. Title", "bq.:cite text" or
# "fn1. note".  $1 full tag, $2 its alphabetic part, $3 trailing digits,
# $4 attribute modifiers, $5 optional cite given after ".:", $6 content
# (multi-line, the pattern is compiled with /m).
675 675 BLOCK_RE = /^(([a-z]+)(\d*))(#{A}#{C})\.(?::(\S+))? (.*)$/m
676 676
# Rewrites a block that starts with a Textile prefix ("p.", "h2.", "bq.",
# "fn1." ...) by dispatching to the matching handler: textile_<tag> when
# one exists, otherwise textile_<alpha>_ (which also receives the digits).
#
# Modifies +text+ in place.  Returns nil when +text+ has no prefix or no
# handler exists for it, so +blocks+ does not count the rule as applied.
def block_textile_prefix( text )
    return unless text =~ BLOCK_RE

    matched = $&
    tag, tagpre, num, atts, cite, content = $~[1..6]
    atts = pba( atts )

    # pass to prefix handler
    replacement =
        if respond_to? "textile_#{ tag }", true
            method( "textile_#{ tag }" ).call( tag, atts, cite, content )
        elsif respond_to? "textile_#{ tagpre }_", true
            method( "textile_#{ tagpre }_" ).call( tagpre, num, atts, cite, content )
        end
    return unless replacement

    # Block form: the handler output is inserted verbatim.  Given as a
    # replacement *string*, backslash sequences in user content (\0, \1,
    # \\) would be interpreted as backreferences.
    text.gsub!( matched ) { replacement }
end
690 690
# A first line underlined with '=' or '-' characters (Markdown setext).
SETEXT_RE = /\A(.+?)\n([=-])[=-]* *$/m

# Turns a setext header at the top of +text+ into <h1> ('=' underline) or
# <h2> ('-' underline).  Whatever follows the underline is run through
# +blocks+ and appended.  Returns nil when +text+ has no setext header.
def block_markdown_setext( text )
    return unless text =~ SETEXT_RE

    title, underline, remainder = $1, $2, $'
    tag = ( underline == "=" ) ? "h1" : "h2"
    blocks remainder
    text.replace( "<#{ tag }>#{ title }</#{ tag }>" + remainder )
end
700 700
# A Markdown atx header: one to six '#' characters, the header text and
# optional closing '#' characters.
ATX_RE = /\A(\#{1,6}) # $1 = string of #'s
    [ ]*
    (.+?) # $2 = Header text
    [ ]*
    \#* # optional closing #'s (not counted)
    $/x

# Turns an atx header at the top of +text+ into <h1>..<h6>, the level
# being the number of leading '#' characters.  Whatever follows is run
# through +blocks+ and appended after a blank line.  Returns nil when
# +text+ does not start with an atx header.
def block_markdown_atx( text )
    return unless text =~ ATX_RE

    level, heading, remainder = $1.length, $2, $'
    tag = "h#{ level }"
    blocks remainder
    text.replace( "<#{ tag }>#{ heading }</#{ tag }>\n\n" + remainder )
end
715 715
# A run of '>'-prefixed lines (plus their continuation lines) at the very
# start of the block.
MARKDOWN_BQ_RE = /\A(^ *> ?.+$(.+\n)*\n*)+/m

# Converts a Markdown blockquote at the start of +text+ into <blockquote>.
# The '>' prefixes are stripped, the quoted text is flushed left and run
# through +blocks+, then each line that starts with a non-space character
# is indented with a tab.  Modifies +text+ in place.
def block_markdown_bq( text )
    text.gsub!( MARKDOWN_BQ_RE ) do |quoted|
        quoted.gsub!( /^ *> ?/, '' )
        flush_left quoted
        blocks quoted
        quoted.gsub!( /^(\S)/, "\t\\1" )
        "<blockquote>\n#{ quoted }\n</blockquote>\n\n"
    end
end
727 727
# A line made of three or more '*', '-' or '_' characters, each optionally
# surrounded by single spaces.
MARKDOWN_RULE_RE = /^(#{
    ['*', '-', '_'].map { |ch| "( ?#{ Regexp.escape( ch ) } ?){3,}" }.join( '|' )
})$/

# Replaces every Markdown horizontal-rule line in +text+ with an <hr />
# tag, in place.  Returns nil when no rule line was found.
def block_markdown_rule( text )
    text.gsub!( MARKDOWN_RULE_RE ) { "<hr />" }
end
737 737
738 738 # XXX TODO XXX
# Placeholder for Markdown list support: the body is empty, so the method
# returns nil and +blocks+ never counts this rule as applied.
739 739 def block_markdown_lists( text )
740 740 end
741 741
# Applies every quick phrase modifier in QTAGS (*strong*, _em_, ...) to
# +text+ in place.  Each match becomes <tag>content</tag>; the attribute
# string (modifiers plus an optional cite) is shelved.
def inline_textile_span( text )
    QTAGS.each do |_marker, html_tag, pattern, rule_type|
        text.gsub!( pattern ) do
            captures = $~.captures
            # :limit patterns carry an extra leading-context group
            lead = ( rule_type == :limit ) ? captures.shift : ''
            _qtag, atts, cite, content = captures[0, 4]

            atts = pba( atts )
            atts << " cite=\"#{ cite }\"" if cite
            atts = shelve( atts ) if atts

            "#{ lead }<#{ html_tag }#{ atts }>#{ content }</#{ html_tag }>"
        end
    end
end
762 762
# Textile link: "text (title)":url
# Capture groups, in order: $1 pre, $2 atts, $3 text, $4 title, $5 url,
# $6 slash, $7 post -- the order inline_textile_link destructures them in.
763 763 LINK_RE = /
764 764 ([\s\[{(]|[#{PUNCT}])? # $pre
765 765 " # start
766 766 (#{C}) # $atts
767 767 ([^"]+?) # $text
768 768 \s?
769 769 (?:\(([^)]+?)\)(?="))? # $title
770 770 ":
771 771 (\S+?) # $url
772 772 (\/)? # $slash
773 773 ([^\w\/;]*?) # $post
774 774 (?=<|\s|$)
775 775 /x
776 776
# Converts Textile links ("text (title)":url) in +text+ into anchors, in
# place.  The URL may be a reference name defined elsewhere in the
# document, in which case check_refs supplies the real URL and a fallback
# title.  Links whose URL starts with http:// or https:// get
# class="external".  The href/title attribute string is shelved.
def inline_textile_link( text )
    text.gsub!( LINK_RE ) do
        pre, atts, link_text, title, url, slash, post = $~[1..7]

        url, url_title = check_refs( url )
        title ||= url_title

        atts = pba( atts )
        atts = " href=\"#{ url }#{ slash }\"#{ atts }"
        atts << " title=\"#{ title }\"" if title
        atts = shelve( atts ) if atts

        external = (url =~ /^https?:\/\//) ? ' class="external"' : ''

        "#{ pre }<a#{ atts }#{ external }>#{ link_text }</a>#{ post }"
    end
end
794 794
# Markdown reference link: [text][id], with an optional space or newline
# between the two bracket pairs.
MARKDOWN_REFLINK_RE = /
    \[([^\[\]]+)\] # $text
    [ ]? # opt. space
    (?:\n[ ]*)? # one optional newline followed by spaces
    \[(.*?)\] # $id
    /x

# Converts Markdown reference links in +text+ into anchors, in place.
# The id (or the link text itself when the id is empty) is looked up with
# check_refs, which yields the URL and an optional title.  The attribute
# string is shelved.
def inline_markdown_reflink( text )
    text.gsub!( MARKDOWN_REFLINK_RE ) do
        # named +label+ so the +text+ parameter is not overwritten
        label, id = $~[1..2]

        url, title = check_refs( id.empty? ? label : id )

        atts = " href=\"#{ url }\""
        atts << " title=\"#{ title }\"" if title
        atts = shelve( atts )

        "<a#{ atts }>#{ label }</a>"
    end
end
819 819
# Markdown inline link: [text](href "title"), the title being optional
# and quoted with either quote character.
MARKDOWN_LINK_RE = /
    \[([^\[\]]+)\] # $text
    \( # open paren
    [ \t]* # opt space
    <?(.+?)>? # $href
    [ \t]* # opt space
    (?: # whole title
    (['"]) # $quote
    (.*?) # $title
    \3 # matching quote
    )? # title is optional
    \)
    /x

# Converts Markdown inline links in +text+ into anchors, in place.  The
# attribute string is shelved.
def inline_markdown_link( text )
    text.gsub!( MARKDOWN_LINK_RE ) do
        # named +label+ so the +text+ parameter is not overwritten;
        # group 3 (the quote character) is not needed
        label, url, _quote, title = $~[1..4]

        atts = " href=\"#{ url }\""
        atts << " title=\"#{ title }\"" if title
        atts = shelve( atts )

        "<a#{ atts }>#{ label }</a>"
    end
end
845 845
# Reference definitions.  In both patterns $1 is the leading spaces, $2
# the reference name and $3 the whole URL; HYPERLINK contributes $4 and
# $5, which makes the optional quoted Markdown title $6.
846 846 TEXTILE_REFS_RE = /(^ *)\[([^\[\n]+?)\](#{HYPERLINK})(?=\s|$)/
847 847 MARKDOWN_REFS_RE = /(^ *)\[([^\n]+?)\]:\s+<?(#{HYPERLINK})>?(?:\s+"((?:[^"]|\\")+)")?(?=\s|$)/m
848 848
# Runs every rule in @rules whose name starts with "refs_" on +text+.
# Those rules collect link reference definitions and remove them from
# the text.
def refs( text )
    @rules.each do |rule_name|
        # parenthesised like the call in +inline+; a bare `match /re/`
        # triggers Ruby's "ambiguous first argument" warning
        method( rule_name ).call( text ) if rule_name.to_s.match( /^refs_/ )
    end
end
854 854
# Collects Textile reference definitions ("[name]url") from +text+ into
# @urlrefs, keyed by the lower-cased name, and removes them from the
# text.  Textile references carry no title.
def refs_textile( text )
    text.gsub!( TEXTILE_REFS_RE ) do
        name, url = $~[2], $~[3]
        @urlrefs[name.downcase] = [url, nil]
        nil
    end
end
862 862
# Collects Markdown reference definitions ('[name]: url "title"') from
# +text+ into @urlrefs, keyed by the lower-cased name, and removes them
# from the text.  The title is nil when none was given.
def refs_markdown( text )
    text.gsub!( MARKDOWN_REFS_RE ) do
        found = $~
        @urlrefs[found[2].downcase] = [found[3], found[6]]
        nil
    end
end
871 871
# Resolves +text+ against the collected link references.  Returns the
# stored [url, title] pair when +text+ (case-insensitively) names a
# reference, otherwise [text, nil].  A nil +text+ yields [nil, nil].
def check_refs( text )
    known = text ? @urlrefs[text.downcase] : nil
    known || [text, nil]
end
876 876
# Textile image: !src(title)! optionally followed by :href.
# Capture groups: $1 preceding "<p>"/character/line start, $2 alignment,
# $3 modifiers, $4 src, $5 title, then the two HYPERLINK groups of the
# optional href ($6 URL body, $7 trailing punctuation).
877 877 IMAGE_RE = /
878 878 (<p>|.|^) # start of line?
879 879 \! # opening
880 880 (\<|\=|\>)? # optional alignment atts
881 881 (#{C}) # optional style,class atts
882 882 (?:\. )? # optional dot-space
883 883 ([^\s(!]+?) # presume this is the src
884 884 \s? # optional space
885 885 (?:\(((?:[^\(\)]|\([^\)]+\))+?)\))? # optional title
886 886 \! # closing
887 887 (?::#{ HYPERLINK })? # optional href
888 888 /x
889 889
# Converts Textile images in +text+ into <img> tags, in place, wrapped
# in a link when an href follows and in a floated container when an
# alignment marker is present.  Attribute strings are shelved.
890 890 def inline_textile_image( text )
891 891 text.gsub!( IMAGE_RE ) do |m|
# IMAGE_RE has seven groups, so the eighth name (href_a2) is always nil
892 892 stln,algn,atts,url,title,href,href_a1,href_a2 = $~[1..8]
893 893 atts = pba( atts )
894 894 atts = " src=\"#{ url }\"#{ atts }"
895 895 atts << " title=\"#{ title }\"" if title
# alt is always emitted; it is empty when no title was given
896 896 atts << " alt=\"#{ title }\""
897 897 # size = @getimagesize($url);
898 898 # if($size) $atts.= " $size[3]";
899 899
900 900 href, alt_title = check_refs( href ) if href
# NOTE(review): the src attribute was already built above, so the
# result of this lookup is never used -- confirm whether image URLs
# were meant to be resolvable references
901 901 url, url_title = check_refs( url )
902 902
903 903 out = ''
904 904 out << "<a#{ shelve( " href=\"#{ href }\"" ) }>" if href
905 905 out << "<img#{ shelve( atts ) } />"
906 906 out << "</a>#{ href_a1 }#{ href_a2 }" if href
907 907
908 908 if algn
909 909 algn = h_align( algn )
# an image right after "<p>" floats the paragraph itself; otherwise
# the image is wrapped in a floated <div>
910 910 if stln == "<p>"
911 911 out = "<p style=\"float:#{ algn }\">#{ out }"
912 912 else
913 913 out = "#{ stln }<div style=\"float:#{ algn }\">#{ out }</div>"
914 914 end
915 915 else
916 916 out = stln + out
917 917 end
918 918
919 919 out
920 920 end
921 921 end
922 922
# Parks +val+ on @shelf and returns the placeholder that stands in for it
# in the text until +retrieve+ swaps it back.  Placeholders are numbered
# from 1 and start with a space.
def shelve( val )
    @shelf.push( val )
    " :redsh##{ @shelf.size }:"
end
927 927
# Puts every shelved string back into +text+, replacing the placeholders
# produced by +shelve+ (numbered from 1, in shelving order).
def retrieve( text )
    @shelf.each_with_index do |shelved, index|
        # Block form inserts the value verbatim.  As a replacement
        # *string*, sequences such as \0, \1 or \\ inside a shelved URL
        # or title would be interpreted as backreferences.
        text.gsub!( " :redsh##{ index + 1 }:" ) { shelved }
    end
end
933 933
# Masks every bare ampersand in +text+ as the dummy sequence "x%x%", in
# place.  An ampersand is left alone when it is followed by a run of '#',
# letters or digits and a semicolon, i.e. when it already starts an
# entity.
def incoming_entities( text )
    text.gsub!( /&(?![#a-z0-9]+;)/i ) { "x%x%" }
end
941 941
# Wraps ==double-equals== spans in <notextile> tags, in place.
#
# The first pass handles spans that follow a line start or whitespace and
# whose body does not cross a newline after its first '='.  The second
# pass handles spans at the start of a line (after optional spaces) that
# run across lines.
def no_textile( text )
    text.gsub!( /(^|\s)==([^=]+.*?)==(\s|$)?/,
        '\1<notextile>\2</notextile>\3' )
    # This pattern has a single capture group: the content goes *inside*
    # the tags.  Referencing \2 and \3 here put it in front of an empty
    # <notextile></notextile> pair.
    text.gsub!( /^ *==([^=]+.*?)==/m,
        '<notextile>\1</notextile>' )
end
948 948
# Normalises whitespace in +text+, in place: line breaks become "\n",
# tabs become spaces, space-only lines are emptied, runs of three or more
# newlines collapse to two, and a double quote at the end of a line gets
# a trailing space.  Finally a document that is indented as a whole is
# flushed to the left side.
def clean_white_space( text )
    [
        [/\r\n/, "\n"],
        [/\r/, "\n"],
        [/\t/, ' '],
        [/^ +$/, ''],
        [/\n{3,}/, "\n\n"],
        [/"$/, "\" "]
    ].each { |pattern, replacement| text.gsub!( pattern, replacement ) }

    flush_left text
end
962 962
# Removes the common leading indentation from +text+, in place.
#
# The amount removed is the smallest number of leading spaces found on
# any line whose indentation is directly followed by a non-whitespace
# character.  Nothing happens when no line starts with a space, when some
# such line is not indented at all, or when no line has content to
# measure against.
def flush_left( text )
    return unless text =~ /^ /

    widths = text.scan( /^( *)\S/ ).map { |captured| captured.first.length }
    indt = widths.min

    # No measurable line (e.g. only space-only lines): counting upwards
    # until some line matched never terminated in that case.
    return if indt.nil? || indt.zero?

    text.gsub!( /^ {#{indt}}/, '' )
end
974 974
# Turns footnote markers such as "word[1]" into superscripted links to
# "#fn1", in place.  The bracket must directly follow a word character;
# one whitespace character after the marker is preserved.
def footnote_ref( text )
    text.gsub!( /\b\[([0-9]+?)\](\s)?/ ) do
        "<sup><a href=\"#fn#{ $1 }\">#{ $1 }</a></sup>#{ $2 }"
    end
end
979 979
# Tags whose content is protected from Textile processing.
980 980 OFFTAGS = /(code|pre|kbd|notextile)/
# OFFTAG_MATCH groups: $1 a closing offtag and $2 its name, or $3 an
# opening offtag and $4 its name; $5 is the text up to the next offtag
# (or end of text).
# NOTE(review): OFFTAGS is interpolated as a Regexp, which embeds its own
# option flags, so the /i here may not apply to the tag names -- confirm.
981 981 OFFTAG_MATCH = /(?:(<\/#{ OFFTAGS }>)|(<#{ OFFTAGS }[^>]*>))(.*?)(?=<\/?#{ OFFTAGS }|\Z)/mi
982 982 OFFTAG_OPEN = /<#{ OFFTAGS }/
# the slash is optional, so this also matches opening tags; glyphs_textile
# only tests it after OFFTAG_OPEN has failed
983 983 OFFTAG_CLOSE = /<\/?#{ OFFTAGS }/
# HASTAG_MATCH: any single-line tag.  ALLTAG_MATCH: either one tag ($1)
# or the text up to the next tag / end of line.
984 984 HASTAG_MATCH = /(<\/?\w[^\n]*?>)/m
985 985 ALLTAG_MATCH = /(<\/?\w[^\n]*?>)|.*?(?=<\/?\w[^\n]*?>|$)/m
986 986
# Applies glyph substitutions (pgl) and footnote references to the parts
# of +text+ that lie outside HTML tags, in place.  Text between
# code/pre/kbd/notextile tags is HTML-escaped instead.
# +level+ is the recursion depth; it is only referenced by the
# commented-out debug line.
987 987 def glyphs_textile( text, level = 0 )
# no tags at all: process the whole text directly
988 988 if text !~ HASTAG_MATCH
989 989 pgl text
990 990 footnote_ref text
991 991 else
# codepre counts the offtags currently open
992 992 codepre = 0
993 993 text.gsub!( ALLTAG_MATCH ) do |line|
994 994 ## matches are off if we're between <code>, <pre> etc.
# $1 is set when the match is a tag rather than a stretch of text
995 995 if $1
996 996 if line =~ OFFTAG_OPEN
997 997 codepre += 1
998 998 elsif line =~ OFFTAG_CLOSE
999 999 codepre -= 1
1000 1000 codepre = 0 if codepre < 0
1001 1001 end
1002 1002 elsif codepre.zero?
1003 1003 glyphs_textile( line, level + 1 )
1004 1004 else
1005 1005 htmlesc( line, :NoQuotes )
1006 1006 end
1007 1007 # p [level, codepre, line]
1008 1008
# both helpers modify line in place; it becomes the replacement
1009 1009 line
1010 1010 end
1011 1011 end
1012 1012 end
1013 1013
# Pulls the content of <code>, <pre>, <kbd> and <notextile> sections out of
# +text+ (in place) and stores it in @pre_list.
#
# An opening tag and the text after it are stored as a new @pre_list entry and
# replaced in +text+ by a "<redpre#N>" placeholder, N being the entry's index.
# When the same tag name is opened again inside an open section, the nested
# chunks are appended to the most recent entry and removed from +text+.
# Stored text is passed through htmlesc with :NoQuotes unless a <notextile>
# tag has been seen in the current section.
#
# Returns +text+.
def rip_offtags( text )
    return text unless text =~ /<.*>/

    depth, seen = 0, {}
    text.gsub!( OFFTAG_MATCH ) do |chunk|
        # take all captures first; later calls must not be relied on to keep them
        closer, opener, tag_name, body = $1, $3, $4, $5
        if opener
            depth += 1
            seen[tag_name] = true
            if depth > seen.length
                # a tag name that is already open: fold into the current entry
                htmlesc( chunk, :NoQuotes ) unless seen['notextile']
                @pre_list.last << chunk
                chunk = ""
            else
                htmlesc( body, :NoQuotes ) if body and not seen['notextile']
                chunk = "<redpre##{ @pre_list.length }>"
                @pre_list << "#{ opener }#{ body }"
            end
        elsif closer and depth > 0
            if depth > seen.length
                htmlesc( chunk, :NoQuotes ) unless seen['notextile']
                @pre_list.last << chunk
                chunk = ""
            end
            depth -= 1
            # leaving the outermost section starts a fresh bookkeeping round
            seen = {} if depth.zero?
        end
        chunk
    end
    text
end
1046 1046
# Puts stored sections back: every "<redpre#N>" placeholder in +text+ is
# replaced, in place, by entry N of @pre_list. Does nothing when @pre_list is
# empty.
#
# Returns the gsub! result, or nil when nothing was done.
def smooth_offtags( text )
    return if @pre_list.empty?

    text.gsub!( /<redpre#(\d+)>/ ) do
        slot = $1.to_i
        @pre_list[slot]
    end
end
1053 1053
# Runs the inline rules on +text+: first every entry of @rules whose name
# starts with "inline_", then every entry whose name starts with "glyphs_".
# Within each group the order of @rules is kept. Each rule is invoked as a
# method of this object with +text+ as its only argument.
def inline( text )
    [/^inline_/, /^glyphs_/].each do |meth_re|
        selected = @rules.select { |rule_name| rule_name.to_s =~ meth_re }
        selected.each { |rule_name| send( rule_name, text ) }
    end
end
1061 1061
# Looks +text+ up in the H_ALGN_VALS table and returns the entry found there.
# NOTE(review): the table is defined outside this section; presumably it maps
# textile horizontal-alignment markers to alignment names -- confirm there.
def h_align( text )
    H_ALGN_VALS[ text ]
end
1065 1065
# Looks +text+ up in the V_ALGN_VALS table and returns the entry found there.
# NOTE(review): the table is defined outside this section; presumably it maps
# textile vertical-alignment markers to alignment names -- confirm there.
def v_align( text )
    V_ALGN_VALS[ text ]
end
1069 1069
# Builds the HTML for a help link that opens the Textile reference in a popup
# window.
#
# name::    link text
# windowW:: popup width (string or number)
# windowH:: popup height (string or number)
# helpvar:: anchor inside the reference page; defaults to +name+
#
# Returns the link markup as a String. The values are inserted as given,
# without HTML escaping.
def textile_popup_help( name, windowW, windowH, helpvar = name )
    # to_s lets numeric sizes be passed; String#+ accepts only strings
    ' <a target="_blank" href="http://hobix.com/textile/#' + helpvar.to_s +
        '" onclick="window.open(this.href, \'popupwindow\', \'width=' + windowW.to_s +
        ',height=' + windowH.to_s + ',scrollbars,resizable\'); return false;">' +
        name.to_s + '</a><br />'
end
1073 1073
# HTML cleansing stuff
#
# Default whitelist for clean_html: each key is an allowed tag name, each
# value the list of attributes kept on that tag (nil or an empty list keeps
# none).
BASIC_TAGS = {
    'a' => ['href', 'title'],
    'img' => ['src', 'alt', 'title'],
    'br' => [],
    'code' => ['lang'],
    'td' => ['colspan', 'rowspan'],
    'blockquote' => ['cite']
}
# tags that are allowed but keep no attributes at all
%w(i u b pre kbd cite strong em ins sup sub del
   table tr th ol ul li p h1 h2 h3 h4 h5 h6).each do |tag_name|
    BASIC_TAGS[tag_name] = nil
end
1108 1108
# Reduces the HTML in +text+ (in place) to a whitelist of tags and attributes.
#
# text:: the HTML string to clean
# tags:: hash mapping a lower-case tag name to the array of attribute names
#        kept on that tag; nil keeps no attributes
#
# "<![CDATA[" openers are removed. A tag that is not a key of +tags+ is
# replaced by a single space. A listed tag is rebuilt with its name in lower
# case and only the listed attributes, each written with double quotes.
#
# Returns the result of the last gsub! (nil when +text+ contains no tag).
#
# NOTE(review): only src values are checked for their URL scheme; href values
# are copied as they are.
def clean_html( text, tags = BASIC_TAGS )
    text.gsub!( /<!\[CDATA\[/, '' )
    text.gsub!( /<(\/*)(\w+)([^>]*)>/ ) do
        raw = $~
        tag = raw[2].downcase
        if tags.has_key? tag
            pcs = [tag]
            ( tags[tag] || [] ).each do |prop|
                # look for a double-quoted, then single-quoted, then bare value
                ['"', "'", ''].each do |q|
                    q2 = ( q != '' ? q : '\s' )
                    next unless raw[3] =~ /#{prop}\s*=\s*#{q}([^#{q2}]+)#{q}/i
                    # Keep the value in a local: the scheme test below is
                    # another match and resets $1.
                    attrv = $1
                    # A src with a scheme that does not start with "http" is
                    # dropped for good; trying the laxer quote styles would
                    # match the same value again with its quotes attached.
                    break if prop == 'src' and attrv =~ %r{^(?!http)\w+:}
                    # &quot; is the HTML escape for a quote inside a
                    # double-quoted attribute; a backslash does not escape it.
                    pcs << "#{prop}=\"#{attrv.gsub('"', '&quot;')}\""
                    break
                end
            end
            "<#{raw[1]}#{pcs.join " "}>"
        else
            " "
        end
    end
end
1133 1133
# Tag names that escape_html_tags leaves untouched.
ALLOWED_TAGS = %w(redpre pre code)

# Neutralizes HTML tags in +text+ (in place): the '<' that starts an opening
# or closing tag becomes "&lt;" unless the tag name is listed in ALLOWED_TAGS.
# The comparison is case-sensitive. A '<' that is not followed by a tag name
# is not touched.
#
# Returns the gsub! result (nil when nothing looked like a tag).
def escape_html_tags(text)
    text.gsub!(%r{<((\/?)(\w+))}) do
        bracket = ALLOWED_TAGS.include?($3) ? "<" : "&lt;"
        "#{bracket}#{$1}"
    end
end
1139 1139 end
1140 1140
General Comments 0
You need to be logged in to leave comments. Login now