##// END OF EJS Templates
Fixes a regexp for ruby1.9....
Jean-Philippe Lang -
r2901:668ec7f69421
parent child
Show More
@@ -1,1182 +1,1182
1 # vim:ts=4:sw=4:
1 # vim:ts=4:sw=4:
2 # = RedCloth - Textile and Markdown Hybrid for Ruby
2 # = RedCloth - Textile and Markdown Hybrid for Ruby
3 #
3 #
4 # Homepage:: http://whytheluckystiff.net/ruby/redcloth/
4 # Homepage:: http://whytheluckystiff.net/ruby/redcloth/
5 # Author:: why the lucky stiff (http://whytheluckystiff.net/)
5 # Author:: why the lucky stiff (http://whytheluckystiff.net/)
6 # Copyright:: (cc) 2004 why the lucky stiff (and his puppet organizations.)
6 # Copyright:: (cc) 2004 why the lucky stiff (and his puppet organizations.)
7 # License:: BSD
7 # License:: BSD
8 #
8 #
9 # (see http://hobix.com/textile/ for a Textile Reference.)
9 # (see http://hobix.com/textile/ for a Textile Reference.)
10 #
10 #
11 # Based on (and also inspired by) both:
11 # Based on (and also inspired by) both:
12 #
12 #
13 # PyTextile: http://diveintomark.org/projects/textile/textile.py.txt
13 # PyTextile: http://diveintomark.org/projects/textile/textile.py.txt
14 # Textism for PHP: http://www.textism.com/tools/textile/
14 # Textism for PHP: http://www.textism.com/tools/textile/
15 #
15 #
16 #
16 #
17
17
18 # = RedCloth
18 # = RedCloth
19 #
19 #
20 # RedCloth is a Ruby library for converting Textile and/or Markdown
20 # RedCloth is a Ruby library for converting Textile and/or Markdown
21 # into HTML. You can use either format, intermingled or separately.
21 # into HTML. You can use either format, intermingled or separately.
22 # You can also extend RedCloth to honor your own custom text stylings.
22 # You can also extend RedCloth to honor your own custom text stylings.
23 #
23 #
24 # RedCloth users are encouraged to use Textile if they are generating
24 # RedCloth users are encouraged to use Textile if they are generating
25 # HTML and to use Markdown if others will be viewing the plain text.
25 # HTML and to use Markdown if others will be viewing the plain text.
26 #
26 #
27 # == What is Textile?
27 # == What is Textile?
28 #
28 #
29 # Textile is a simple formatting style for text
29 # Textile is a simple formatting style for text
30 # documents, loosely based on some HTML conventions.
30 # documents, loosely based on some HTML conventions.
31 #
31 #
32 # == Sample Textile Text
32 # == Sample Textile Text
33 #
33 #
34 # h2. This is a title
34 # h2. This is a title
35 #
35 #
36 # h3. This is a subhead
36 # h3. This is a subhead
37 #
37 #
38 # This is a bit of paragraph.
38 # This is a bit of paragraph.
39 #
39 #
40 # bq. This is a blockquote.
40 # bq. This is a blockquote.
41 #
41 #
42 # = Writing Textile
42 # = Writing Textile
43 #
43 #
44 # A Textile document consists of paragraphs. Paragraphs
44 # A Textile document consists of paragraphs. Paragraphs
45 # can be specially formatted by adding a small instruction
45 # can be specially formatted by adding a small instruction
46 # to the beginning of the paragraph.
46 # to the beginning of the paragraph.
47 #
47 #
48 # h[n]. Header of size [n].
48 # h[n]. Header of size [n].
49 # bq. Blockquote.
49 # bq. Blockquote.
50 # # Numeric list.
50 # # Numeric list.
51 # * Bulleted list.
51 # * Bulleted list.
52 #
52 #
53 # == Quick Phrase Modifiers
53 # == Quick Phrase Modifiers
54 #
54 #
55 # Quick phrase modifiers are also included, to allow formatting
55 # Quick phrase modifiers are also included, to allow formatting
56 # of small portions of text within a paragraph.
56 # of small portions of text within a paragraph.
57 #
57 #
58 # \_emphasis\_
58 # \_emphasis\_
59 # \_\_italicized\_\_
59 # \_\_italicized\_\_
60 # \*strong\*
60 # \*strong\*
61 # \*\*bold\*\*
61 # \*\*bold\*\*
62 # ??citation??
62 # ??citation??
63 # -deleted text-
63 # -deleted text-
64 # +inserted text+
64 # +inserted text+
65 # ^superscript^
65 # ^superscript^
66 # ~subscript~
66 # ~subscript~
67 # @code@
67 # @code@
68 # %(classname)span%
68 # %(classname)span%
69 #
69 #
70 # ==notextile== (leave text alone)
70 # ==notextile== (leave text alone)
71 #
71 #
72 # == Links
72 # == Links
73 #
73 #
74 # To make a hypertext link, put the link text in "quotation
74 # To make a hypertext link, put the link text in "quotation
75 # marks" followed immediately by a colon and the URL of the link.
75 # marks" followed immediately by a colon and the URL of the link.
76 #
76 #
77 # Optional: text in (parentheses) following the link text,
77 # Optional: text in (parentheses) following the link text,
78 # but before the closing quotation mark, will become a Title
78 # but before the closing quotation mark, will become a Title
79 # attribute for the link, visible as a tool tip when a cursor is above it.
79 # attribute for the link, visible as a tool tip when a cursor is above it.
80 #
80 #
81 # Example:
81 # Example:
82 #
82 #
83 # "This is a link (This is a title) ":http://www.textism.com
83 # "This is a link (This is a title) ":http://www.textism.com
84 #
84 #
85 # Will become:
85 # Will become:
86 #
86 #
87 # <a href="http://www.textism.com" title="This is a title">This is a link</a>
87 # <a href="http://www.textism.com" title="This is a title">This is a link</a>
88 #
88 #
89 # == Images
89 # == Images
90 #
90 #
91 # To insert an image, put the URL for the image inside exclamation marks.
91 # To insert an image, put the URL for the image inside exclamation marks.
92 #
92 #
93 # Optional: text that immediately follows the URL in (parentheses) will
93 # Optional: text that immediately follows the URL in (parentheses) will
94 # be used as the Alt text for the image. Images on the web should always
94 # be used as the Alt text for the image. Images on the web should always
95 # have descriptive Alt text for the benefit of readers using non-graphical
95 # have descriptive Alt text for the benefit of readers using non-graphical
96 # browsers.
96 # browsers.
97 #
97 #
98 # Optional: place a colon followed by a URL immediately after the
98 # Optional: place a colon followed by a URL immediately after the
99 # closing ! to make the image into a link.
99 # closing ! to make the image into a link.
100 #
100 #
101 # Example:
101 # Example:
102 #
102 #
103 # !http://www.textism.com/common/textist.gif(Textist)!
103 # !http://www.textism.com/common/textist.gif(Textist)!
104 #
104 #
105 # Will become:
105 # Will become:
106 #
106 #
107 # <img src="http://www.textism.com/common/textist.gif" alt="Textist" />
107 # <img src="http://www.textism.com/common/textist.gif" alt="Textist" />
108 #
108 #
109 # With a link:
109 # With a link:
110 #
110 #
111 # !/common/textist.gif(Textist)!:http://textism.com
111 # !/common/textist.gif(Textist)!:http://textism.com
112 #
112 #
113 # Will become:
113 # Will become:
114 #
114 #
115 # <a href="http://textism.com"><img src="/common/textist.gif" alt="Textist" /></a>
115 # <a href="http://textism.com"><img src="/common/textist.gif" alt="Textist" /></a>
116 #
116 #
117 # == Defining Acronyms
117 # == Defining Acronyms
118 #
118 #
119 # HTML allows authors to define acronyms via the tag. The definition appears as a
119 # HTML allows authors to define acronyms via the tag. The definition appears as a
120 # tool tip when a cursor hovers over the acronym. A crucial aid to clear writing,
120 # tool tip when a cursor hovers over the acronym. A crucial aid to clear writing,
121 # this should be used at least once for each acronym in documents where they appear.
121 # this should be used at least once for each acronym in documents where they appear.
122 #
122 #
123 # To quickly define an acronym in Textile, place the full text in (parentheses)
123 # To quickly define an acronym in Textile, place the full text in (parentheses)
124 # immediately following the acronym.
124 # immediately following the acronym.
125 #
125 #
126 # Example:
126 # Example:
127 #
127 #
128 # ACLU(American Civil Liberties Union)
128 # ACLU(American Civil Liberties Union)
129 #
129 #
130 # Will become:
130 # Will become:
131 #
131 #
132 # <acronym title="American Civil Liberties Union">ACLU</acronym>
132 # <acronym title="American Civil Liberties Union">ACLU</acronym>
133 #
133 #
134 # == Adding Tables
134 # == Adding Tables
135 #
135 #
136 # In Textile, simple tables can be added by seperating each column by
136 # In Textile, simple tables can be added by seperating each column by
137 # a pipe.
137 # a pipe.
138 #
138 #
139 # |a|simple|table|row|
139 # |a|simple|table|row|
140 # |And|Another|table|row|
140 # |And|Another|table|row|
141 #
141 #
142 # Attributes are defined by style definitions in parentheses.
142 # Attributes are defined by style definitions in parentheses.
143 #
143 #
144 # table(border:1px solid black).
144 # table(border:1px solid black).
145 # (background:#ddd;color:red). |{}| | | |
145 # (background:#ddd;color:red). |{}| | | |
146 #
146 #
147 # == Using RedCloth
147 # == Using RedCloth
148 #
148 #
149 # RedCloth is simply an extension of the String class, which can handle
149 # RedCloth is simply an extension of the String class, which can handle
150 # Textile formatting. Use it like a String and output HTML with its
150 # Textile formatting. Use it like a String and output HTML with its
151 # RedCloth#to_html method.
151 # RedCloth#to_html method.
152 #
152 #
153 # doc = RedCloth.new "
153 # doc = RedCloth.new "
154 #
154 #
155 # h2. Test document
155 # h2. Test document
156 #
156 #
157 # Just a simple test."
157 # Just a simple test."
158 #
158 #
159 # puts doc.to_html
159 # puts doc.to_html
160 #
160 #
161 # By default, RedCloth uses both Textile and Markdown formatting, with
161 # By default, RedCloth uses both Textile and Markdown formatting, with
162 # Textile formatting taking precedence. If you want to turn off Markdown
162 # Textile formatting taking precedence. If you want to turn off Markdown
163 # formatting, to boost speed and limit the processor:
163 # formatting, to boost speed and limit the processor:
164 #
164 #
165 # class RedCloth::Textile.new( str )
165 # class RedCloth::Textile.new( str )
166
166
167 class RedCloth3 < String
167 class RedCloth3 < String
168
168
169 VERSION = '3.0.4'
169 VERSION = '3.0.4'
170 DEFAULT_RULES = [:textile, :markdown]
170 DEFAULT_RULES = [:textile, :markdown]
171
171
172 #
172 #
173 # Two accessor for setting security restrictions.
173 # Two accessor for setting security restrictions.
174 #
174 #
175 # This is a nice thing if you're using RedCloth for
175 # This is a nice thing if you're using RedCloth for
176 # formatting in public places (e.g. Wikis) where you
176 # formatting in public places (e.g. Wikis) where you
177 # don't want users to abuse HTML for bad things.
177 # don't want users to abuse HTML for bad things.
178 #
178 #
179 # If +:filter_html+ is set, HTML which wasn't
179 # If +:filter_html+ is set, HTML which wasn't
180 # created by the Textile processor will be escaped.
180 # created by the Textile processor will be escaped.
181 #
181 #
182 # If +:filter_styles+ is set, it will also disable
182 # If +:filter_styles+ is set, it will also disable
183 # the style markup specifier. ('{color: red}')
183 # the style markup specifier. ('{color: red}')
184 #
184 #
185 attr_accessor :filter_html, :filter_styles
185 attr_accessor :filter_html, :filter_styles
186
186
187 #
187 #
188 # Accessor for toggling hard breaks.
188 # Accessor for toggling hard breaks.
189 #
189 #
190 # If +:hard_breaks+ is set, single newlines will
190 # If +:hard_breaks+ is set, single newlines will
191 # be converted to HTML break tags. This is the
191 # be converted to HTML break tags. This is the
192 # default behavior for traditional RedCloth.
192 # default behavior for traditional RedCloth.
193 #
193 #
194 attr_accessor :hard_breaks
194 attr_accessor :hard_breaks
195
195
196 # Accessor for toggling lite mode.
196 # Accessor for toggling lite mode.
197 #
197 #
198 # In lite mode, block-level rules are ignored. This means
198 # In lite mode, block-level rules are ignored. This means
199 # that tables, paragraphs, lists, and such aren't available.
199 # that tables, paragraphs, lists, and such aren't available.
200 # Only the inline markup for bold, italics, entities and so on.
200 # Only the inline markup for bold, italics, entities and so on.
201 #
201 #
202 # r = RedCloth.new( "And then? She *fell*!", [:lite_mode] )
202 # r = RedCloth.new( "And then? She *fell*!", [:lite_mode] )
203 # r.to_html
203 # r.to_html
204 # #=> "And then? She <strong>fell</strong>!"
204 # #=> "And then? She <strong>fell</strong>!"
205 #
205 #
206 attr_accessor :lite_mode
206 attr_accessor :lite_mode
207
207
208 #
208 #
209 # Accessor for toggling span caps.
209 # Accessor for toggling span caps.
210 #
210 #
211 # Textile places `span' tags around capitalized
211 # Textile places `span' tags around capitalized
212 # words by default, but this wreaks havoc on Wikis.
212 # words by default, but this wreaks havoc on Wikis.
213 # If +:no_span_caps+ is set, this will be
213 # If +:no_span_caps+ is set, this will be
214 # suppressed.
214 # suppressed.
215 #
215 #
216 attr_accessor :no_span_caps
216 attr_accessor :no_span_caps
217
217
218 #
218 #
219 # Establishes the markup predence. Available rules include:
219 # Establishes the markup predence. Available rules include:
220 #
220 #
221 # == Textile Rules
221 # == Textile Rules
222 #
222 #
223 # The following textile rules can be set individually. Or add the complete
223 # The following textile rules can be set individually. Or add the complete
224 # set of rules with the single :textile rule, which supplies the rule set in
224 # set of rules with the single :textile rule, which supplies the rule set in
225 # the following precedence:
225 # the following precedence:
226 #
226 #
227 # refs_textile:: Textile references (i.e. [hobix]http://hobix.com/)
227 # refs_textile:: Textile references (i.e. [hobix]http://hobix.com/)
228 # block_textile_table:: Textile table block structures
228 # block_textile_table:: Textile table block structures
229 # block_textile_lists:: Textile list structures
229 # block_textile_lists:: Textile list structures
230 # block_textile_prefix:: Textile blocks with prefixes (i.e. bq., h2., etc.)
230 # block_textile_prefix:: Textile blocks with prefixes (i.e. bq., h2., etc.)
231 # inline_textile_image:: Textile inline images
231 # inline_textile_image:: Textile inline images
232 # inline_textile_link:: Textile inline links
232 # inline_textile_link:: Textile inline links
233 # inline_textile_span:: Textile inline spans
233 # inline_textile_span:: Textile inline spans
234 # glyphs_textile:: Textile entities (such as em-dashes and smart quotes)
234 # glyphs_textile:: Textile entities (such as em-dashes and smart quotes)
235 #
235 #
236 # == Markdown
236 # == Markdown
237 #
237 #
238 # refs_markdown:: Markdown references (for example: [hobix]: http://hobix.com/)
238 # refs_markdown:: Markdown references (for example: [hobix]: http://hobix.com/)
239 # block_markdown_setext:: Markdown setext headers
239 # block_markdown_setext:: Markdown setext headers
240 # block_markdown_atx:: Markdown atx headers
240 # block_markdown_atx:: Markdown atx headers
241 # block_markdown_rule:: Markdown horizontal rules
241 # block_markdown_rule:: Markdown horizontal rules
242 # block_markdown_bq:: Markdown blockquotes
242 # block_markdown_bq:: Markdown blockquotes
243 # block_markdown_lists:: Markdown lists
243 # block_markdown_lists:: Markdown lists
244 # inline_markdown_link:: Markdown links
244 # inline_markdown_link:: Markdown links
245 attr_accessor :rules
245 attr_accessor :rules
246
246
247 # Returns a new RedCloth object, based on _string_ and
247 # Returns a new RedCloth object, based on _string_ and
248 # enforcing all the included _restrictions_.
248 # enforcing all the included _restrictions_.
249 #
249 #
250 # r = RedCloth.new( "h1. A <b>bold</b> man", [:filter_html] )
250 # r = RedCloth.new( "h1. A <b>bold</b> man", [:filter_html] )
251 # r.to_html
251 # r.to_html
252 # #=>"<h1>A &lt;b&gt;bold&lt;/b&gt; man</h1>"
252 # #=>"<h1>A &lt;b&gt;bold&lt;/b&gt; man</h1>"
253 #
253 #
254 def initialize( string, restrictions = [] )
254 def initialize( string, restrictions = [] )
255 restrictions.each { |r| method( "#{ r }=" ).call( true ) }
255 restrictions.each { |r| method( "#{ r }=" ).call( true ) }
256 super( string )
256 super( string )
257 end
257 end
258
258
259 #
259 #
260 # Generates HTML from the Textile contents.
260 # Generates HTML from the Textile contents.
261 #
261 #
262 # r = RedCloth.new( "And then? She *fell*!" )
262 # r = RedCloth.new( "And then? She *fell*!" )
263 # r.to_html( true )
263 # r.to_html( true )
264 # #=>"And then? She <strong>fell</strong>!"
264 # #=>"And then? She <strong>fell</strong>!"
265 #
265 #
266 def to_html( *rules )
266 def to_html( *rules )
267 rules = DEFAULT_RULES if rules.empty?
267 rules = DEFAULT_RULES if rules.empty?
268 # make our working copy
268 # make our working copy
269 text = self.dup
269 text = self.dup
270
270
271 @urlrefs = {}
271 @urlrefs = {}
272 @shelf = []
272 @shelf = []
273 textile_rules = [:refs_textile, :block_textile_table, :block_textile_lists,
273 textile_rules = [:refs_textile, :block_textile_table, :block_textile_lists,
274 :block_textile_prefix, :inline_textile_image, :inline_textile_link,
274 :block_textile_prefix, :inline_textile_image, :inline_textile_link,
275 :inline_textile_code, :inline_textile_span, :glyphs_textile]
275 :inline_textile_code, :inline_textile_span, :glyphs_textile]
276 markdown_rules = [:refs_markdown, :block_markdown_setext, :block_markdown_atx, :block_markdown_rule,
276 markdown_rules = [:refs_markdown, :block_markdown_setext, :block_markdown_atx, :block_markdown_rule,
277 :block_markdown_bq, :block_markdown_lists,
277 :block_markdown_bq, :block_markdown_lists,
278 :inline_markdown_reflink, :inline_markdown_link]
278 :inline_markdown_reflink, :inline_markdown_link]
279 @rules = rules.collect do |rule|
279 @rules = rules.collect do |rule|
280 case rule
280 case rule
281 when :markdown
281 when :markdown
282 markdown_rules
282 markdown_rules
283 when :textile
283 when :textile
284 textile_rules
284 textile_rules
285 else
285 else
286 rule
286 rule
287 end
287 end
288 end.flatten
288 end.flatten
289
289
290 # standard clean up
290 # standard clean up
291 incoming_entities text
291 incoming_entities text
292 clean_white_space text
292 clean_white_space text
293
293
294 # start processor
294 # start processor
295 @pre_list = []
295 @pre_list = []
296 rip_offtags text
296 rip_offtags text
297 no_textile text
297 no_textile text
298 escape_html_tags text
298 escape_html_tags text
299 hard_break text
299 hard_break text
300 unless @lite_mode
300 unless @lite_mode
301 refs text
301 refs text
302 # need to do this before text is split by #blocks
302 # need to do this before text is split by #blocks
303 block_textile_quotes text
303 block_textile_quotes text
304 blocks text
304 blocks text
305 end
305 end
306 inline text
306 inline text
307 smooth_offtags text
307 smooth_offtags text
308
308
309 retrieve text
309 retrieve text
310
310
311 text.gsub!( /<\/?notextile>/, '' )
311 text.gsub!( /<\/?notextile>/, '' )
312 text.gsub!( /x%x%/, '&#38;' )
312 text.gsub!( /x%x%/, '&#38;' )
313 clean_html text if filter_html
313 clean_html text if filter_html
314 text.strip!
314 text.strip!
315 text
315 text
316
316
317 end
317 end
318
318
319 #######
319 #######
320 private
320 private
321 #######
321 #######
322 #
322 #
323 # Mapping of 8-bit ASCII codes to HTML numerical entity equivalents.
323 # Mapping of 8-bit ASCII codes to HTML numerical entity equivalents.
324 # (from PyTextile)
324 # (from PyTextile)
325 #
325 #
326 TEXTILE_TAGS =
326 TEXTILE_TAGS =
327
327
328 [[128, 8364], [129, 0], [130, 8218], [131, 402], [132, 8222], [133, 8230],
328 [[128, 8364], [129, 0], [130, 8218], [131, 402], [132, 8222], [133, 8230],
329 [134, 8224], [135, 8225], [136, 710], [137, 8240], [138, 352], [139, 8249],
329 [134, 8224], [135, 8225], [136, 710], [137, 8240], [138, 352], [139, 8249],
330 [140, 338], [141, 0], [142, 0], [143, 0], [144, 0], [145, 8216], [146, 8217],
330 [140, 338], [141, 0], [142, 0], [143, 0], [144, 0], [145, 8216], [146, 8217],
331 [147, 8220], [148, 8221], [149, 8226], [150, 8211], [151, 8212], [152, 732],
331 [147, 8220], [148, 8221], [149, 8226], [150, 8211], [151, 8212], [152, 732],
332 [153, 8482], [154, 353], [155, 8250], [156, 339], [157, 0], [158, 0], [159, 376]].
332 [153, 8482], [154, 353], [155, 8250], [156, 339], [157, 0], [158, 0], [159, 376]].
333
333
334 collect! do |a, b|
334 collect! do |a, b|
335 [a.chr, ( b.zero? and "" or "&#{ b };" )]
335 [a.chr, ( b.zero? and "" or "&#{ b };" )]
336 end
336 end
337
337
338 #
338 #
339 # Regular expressions to convert to HTML.
339 # Regular expressions to convert to HTML.
340 #
340 #
341 A_HLGN = /(?:(?:<>|<|>|\=|[()]+)+)/
341 A_HLGN = /(?:(?:<>|<|>|\=|[()]+)+)/
342 A_VLGN = /[\-^~]/
342 A_VLGN = /[\-^~]/
343 C_CLAS = '(?:\([^)]+\))'
343 C_CLAS = '(?:\([^)]+\))'
344 C_LNGE = '(?:\[[^\[\]]+\])'
344 C_LNGE = '(?:\[[^\[\]]+\])'
345 C_STYL = '(?:\{[^}]+\})'
345 C_STYL = '(?:\{[^}]+\})'
346 S_CSPN = '(?:\\\\\d+)'
346 S_CSPN = '(?:\\\\\d+)'
347 S_RSPN = '(?:/\d+)'
347 S_RSPN = '(?:/\d+)'
348 A = "(?:#{A_HLGN}?#{A_VLGN}?|#{A_VLGN}?#{A_HLGN}?)"
348 A = "(?:#{A_HLGN}?#{A_VLGN}?|#{A_VLGN}?#{A_HLGN}?)"
349 S = "(?:#{S_CSPN}?#{S_RSPN}|#{S_RSPN}?#{S_CSPN}?)"
349 S = "(?:#{S_CSPN}?#{S_RSPN}|#{S_RSPN}?#{S_CSPN}?)"
350 C = "(?:#{C_CLAS}?#{C_STYL}?#{C_LNGE}?|#{C_STYL}?#{C_LNGE}?#{C_CLAS}?|#{C_LNGE}?#{C_STYL}?#{C_CLAS}?)"
350 C = "(?:#{C_CLAS}?#{C_STYL}?#{C_LNGE}?|#{C_STYL}?#{C_LNGE}?#{C_CLAS}?|#{C_LNGE}?#{C_STYL}?#{C_CLAS}?)"
351 # PUNCT = Regexp::quote( '!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~' )
351 # PUNCT = Regexp::quote( '!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~' )
352 PUNCT = Regexp::quote( '!"#$%&\'*+,-./:;=?@\\^_`|~' )
352 PUNCT = Regexp::quote( '!"#$%&\'*+,-./:;=?@\\^_`|~' )
353 PUNCT_NOQ = Regexp::quote( '!"#$&\',./:;=?@\\`|' )
353 PUNCT_NOQ = Regexp::quote( '!"#$&\',./:;=?@\\`|' )
354 PUNCT_Q = Regexp::quote( '*-_+^~%' )
354 PUNCT_Q = Regexp::quote( '*-_+^~%' )
355 HYPERLINK = '(\S+?)([^\w\s/;=\?]*?)(?=\s|<|$)'
355 HYPERLINK = '(\S+?)([^\w\s/;=\?]*?)(?=\s|<|$)'
356
356
357 # Text markup tags, don't conflict with block tags
357 # Text markup tags, don't conflict with block tags
358 SIMPLE_HTML_TAGS = [
358 SIMPLE_HTML_TAGS = [
359 'tt', 'b', 'i', 'big', 'small', 'em', 'strong', 'dfn', 'code',
359 'tt', 'b', 'i', 'big', 'small', 'em', 'strong', 'dfn', 'code',
360 'samp', 'kbd', 'var', 'cite', 'abbr', 'acronym', 'a', 'img', 'br',
360 'samp', 'kbd', 'var', 'cite', 'abbr', 'acronym', 'a', 'img', 'br',
361 'br', 'map', 'q', 'sub', 'sup', 'span', 'bdo'
361 'br', 'map', 'q', 'sub', 'sup', 'span', 'bdo'
362 ]
362 ]
363
363
364 QTAGS = [
364 QTAGS = [
365 ['**', 'b', :limit],
365 ['**', 'b', :limit],
366 ['*', 'strong', :limit],
366 ['*', 'strong', :limit],
367 ['??', 'cite', :limit],
367 ['??', 'cite', :limit],
368 ['-', 'del', :limit],
368 ['-', 'del', :limit],
369 ['__', 'i', :limit],
369 ['__', 'i', :limit],
370 ['_', 'em', :limit],
370 ['_', 'em', :limit],
371 ['%', 'span', :limit],
371 ['%', 'span', :limit],
372 ['+', 'ins', :limit],
372 ['+', 'ins', :limit],
373 ['^', 'sup', :limit],
373 ['^', 'sup', :limit],
374 ['~', 'sub', :limit]
374 ['~', 'sub', :limit]
375 ]
375 ]
376 QTAGS.collect! do |rc, ht, rtype|
376 QTAGS.collect! do |rc, ht, rtype|
377 rcq = Regexp::quote rc
377 rcq = Regexp::quote rc
378 re =
378 re =
379 case rtype
379 case rtype
380 when :limit
380 when :limit
381 /(^|[>\s\(])
381 /(^|[>\s\(])
382 (#{rcq})
382 (#{rcq})
383 (#{C})
383 (#{C})
384 (?::(\S+?))?
384 (?::(\S+?))?
385 (\w|[^\s\-].*?[^\s\-])
385 (\w|[^\s\-].*?[^\s\-])
386 #{rcq}
386 #{rcq}
387 (?=[[:punct:]]|\s|\)|$)/x
387 (?=[[:punct:]]|\s|\)|$)/x
388 else
388 else
389 /(#{rcq})
389 /(#{rcq})
390 (#{C})
390 (#{C})
391 (?::(\S+))?
391 (?::(\S+))?
392 (\w|[^\s\-].*?[^\s\-])
392 (\w|[^\s\-].*?[^\s\-])
393 #{rcq}/xm
393 #{rcq}/xm
394 end
394 end
395 [rc, ht, re, rtype]
395 [rc, ht, re, rtype]
396 end
396 end
397
397
398 # Elements to handle
398 # Elements to handle
399 GLYPHS = [
399 GLYPHS = [
400 # [ /([^\s\[{(>])?\'([dmst]\b|ll\b|ve\b|\s|:|$)/, '\1&#8217;\2' ], # single closing
400 # [ /([^\s\[{(>])?\'([dmst]\b|ll\b|ve\b|\s|:|$)/, '\1&#8217;\2' ], # single closing
401 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)\'/, '\1&#8217;' ], # single closing
401 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)\'/, '\1&#8217;' ], # single closing
402 # [ /\'(?=[#{PUNCT_Q}]*(s\b|[\s#{PUNCT_NOQ}]))/, '&#8217;' ], # single closing
402 # [ /\'(?=[#{PUNCT_Q}]*(s\b|[\s#{PUNCT_NOQ}]))/, '&#8217;' ], # single closing
403 # [ /\'/, '&#8216;' ], # single opening
403 # [ /\'/, '&#8216;' ], # single opening
404 # [ /</, '&lt;' ], # less-than
404 # [ /</, '&lt;' ], # less-than
405 # [ />/, '&gt;' ], # greater-than
405 # [ />/, '&gt;' ], # greater-than
406 # [ /([^\s\[{(])?"(\s|:|$)/, '\1&#8221;\2' ], # double closing
406 # [ /([^\s\[{(])?"(\s|:|$)/, '\1&#8221;\2' ], # double closing
407 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)"/, '\1&#8221;' ], # double closing
407 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)"/, '\1&#8221;' ], # double closing
408 # [ /"(?=[#{PUNCT_Q}]*[\s#{PUNCT_NOQ}])/, '&#8221;' ], # double closing
408 # [ /"(?=[#{PUNCT_Q}]*[\s#{PUNCT_NOQ}])/, '&#8221;' ], # double closing
409 # [ /"/, '&#8220;' ], # double opening
409 # [ /"/, '&#8220;' ], # double opening
410 # [ /\b( )?\.{3}/, '\1&#8230;' ], # ellipsis
410 # [ /\b( )?\.{3}/, '\1&#8230;' ], # ellipsis
411 # [ /\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/, '<acronym title="\2">\1</acronym>' ], # 3+ uppercase acronym
411 # [ /\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/, '<acronym title="\2">\1</acronym>' ], # 3+ uppercase acronym
412 # [ /(^|[^"][>\s])([A-Z][A-Z0-9 ]+[A-Z0-9])([^<A-Za-z0-9]|$)/, '\1<span class="caps">\2</span>\3', :no_span_caps ], # 3+ uppercase caps
412 # [ /(^|[^"][>\s])([A-Z][A-Z0-9 ]+[A-Z0-9])([^<A-Za-z0-9]|$)/, '\1<span class="caps">\2</span>\3', :no_span_caps ], # 3+ uppercase caps
413 # [ /(\.\s)?\s?--\s?/, '\1&#8212;' ], # em dash
413 # [ /(\.\s)?\s?--\s?/, '\1&#8212;' ], # em dash
414 # [ /\s->\s/, ' &rarr; ' ], # right arrow
414 # [ /\s->\s/, ' &rarr; ' ], # right arrow
415 # [ /\s-\s/, ' &#8211; ' ], # en dash
415 # [ /\s-\s/, ' &#8211; ' ], # en dash
416 # [ /(\d+) ?x ?(\d+)/, '\1&#215;\2' ], # dimension sign
416 # [ /(\d+) ?x ?(\d+)/, '\1&#215;\2' ], # dimension sign
417 # [ /\b ?[(\[]TM[\])]/i, '&#8482;' ], # trademark
417 # [ /\b ?[(\[]TM[\])]/i, '&#8482;' ], # trademark
418 # [ /\b ?[(\[]R[\])]/i, '&#174;' ], # registered
418 # [ /\b ?[(\[]R[\])]/i, '&#174;' ], # registered
419 # [ /\b ?[(\[]C[\])]/i, '&#169;' ] # copyright
419 # [ /\b ?[(\[]C[\])]/i, '&#169;' ] # copyright
420 ]
420 ]
421
421
422 H_ALGN_VALS = {
422 H_ALGN_VALS = {
423 '<' => 'left',
423 '<' => 'left',
424 '=' => 'center',
424 '=' => 'center',
425 '>' => 'right',
425 '>' => 'right',
426 '<>' => 'justify'
426 '<>' => 'justify'
427 }
427 }
428
428
429 V_ALGN_VALS = {
429 V_ALGN_VALS = {
430 '^' => 'top',
430 '^' => 'top',
431 '-' => 'middle',
431 '-' => 'middle',
432 '~' => 'bottom'
432 '~' => 'bottom'
433 }
433 }
434
434
435 #
435 #
436 # Flexible HTML escaping
436 # Flexible HTML escaping
437 #
437 #
438 def htmlesc( str, mode=:Quotes )
438 def htmlesc( str, mode=:Quotes )
439 if str
439 if str
440 str.gsub!( '&', '&amp;' )
440 str.gsub!( '&', '&amp;' )
441 str.gsub!( '"', '&quot;' ) if mode != :NoQuotes
441 str.gsub!( '"', '&quot;' ) if mode != :NoQuotes
442 str.gsub!( "'", '&#039;' ) if mode == :Quotes
442 str.gsub!( "'", '&#039;' ) if mode == :Quotes
443 str.gsub!( '<', '&lt;')
443 str.gsub!( '<', '&lt;')
444 str.gsub!( '>', '&gt;')
444 str.gsub!( '>', '&gt;')
445 end
445 end
446 str
446 str
447 end
447 end
448
448
449 # Search and replace for Textile glyphs (quotes, dashes, other symbols)
449 # Search and replace for Textile glyphs (quotes, dashes, other symbols)
450 def pgl( text )
450 def pgl( text )
451 #GLYPHS.each do |re, resub, tog|
451 #GLYPHS.each do |re, resub, tog|
452 # next if tog and method( tog ).call
452 # next if tog and method( tog ).call
453 # text.gsub! re, resub
453 # text.gsub! re, resub
454 #end
454 #end
455 text.gsub!(/\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/) do |m|
455 text.gsub!(/\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/) do |m|
456 "<acronym title=\"#{htmlesc $2}\">#{$1}</acronym>"
456 "<acronym title=\"#{htmlesc $2}\">#{$1}</acronym>"
457 end
457 end
458 end
458 end
459
459
460 # Parses Textile attribute lists and builds an HTML attribute string
460 # Parses Textile attribute lists and builds an HTML attribute string
461 def pba( text_in, element = "" )
461 def pba( text_in, element = "" )
462
462
463 return '' unless text_in
463 return '' unless text_in
464
464
465 style = []
465 style = []
466 text = text_in.dup
466 text = text_in.dup
467 if element == 'td'
467 if element == 'td'
468 colspan = $1 if text =~ /\\(\d+)/
468 colspan = $1 if text =~ /\\(\d+)/
469 rowspan = $1 if text =~ /\/(\d+)/
469 rowspan = $1 if text =~ /\/(\d+)/
470 style << "vertical-align:#{ v_align( $& ) };" if text =~ A_VLGN
470 style << "vertical-align:#{ v_align( $& ) };" if text =~ A_VLGN
471 end
471 end
472
472
473 style << "#{ htmlesc $1 };" if text.sub!( /\{([^}]*)\}/, '' ) && !filter_styles
473 style << "#{ htmlesc $1 };" if text.sub!( /\{([^}]*)\}/, '' ) && !filter_styles
474
474
475 lang = $1 if
475 lang = $1 if
476 text.sub!( /\[([^)]+?)\]/, '' )
476 text.sub!( /\[([^)]+?)\]/, '' )
477
477
478 cls = $1 if
478 cls = $1 if
479 text.sub!( /\(([^()]+?)\)/, '' )
479 text.sub!( /\(([^()]+?)\)/, '' )
480
480
481 style << "padding-left:#{ $1.length }em;" if
481 style << "padding-left:#{ $1.length }em;" if
482 text.sub!( /([(]+)/, '' )
482 text.sub!( /([(]+)/, '' )
483
483
484 style << "padding-right:#{ $1.length }em;" if text.sub!( /([)]+)/, '' )
484 style << "padding-right:#{ $1.length }em;" if text.sub!( /([)]+)/, '' )
485
485
486 style << "text-align:#{ h_align( $& ) };" if text =~ A_HLGN
486 style << "text-align:#{ h_align( $& ) };" if text =~ A_HLGN
487
487
488 cls, id = $1, $2 if cls =~ /^(.*?)#(.*)$/
488 cls, id = $1, $2 if cls =~ /^(.*?)#(.*)$/
489
489
490 atts = ''
490 atts = ''
491 atts << " style=\"#{ style.join }\"" unless style.empty?
491 atts << " style=\"#{ style.join }\"" unless style.empty?
492 atts << " class=\"#{ cls }\"" unless cls.to_s.empty?
492 atts << " class=\"#{ cls }\"" unless cls.to_s.empty?
493 atts << " lang=\"#{ lang }\"" if lang
493 atts << " lang=\"#{ lang }\"" if lang
494 atts << " id=\"#{ id }\"" if id
494 atts << " id=\"#{ id }\"" if id
495 atts << " colspan=\"#{ colspan }\"" if colspan
495 atts << " colspan=\"#{ colspan }\"" if colspan
496 atts << " rowspan=\"#{ rowspan }\"" if rowspan
496 atts << " rowspan=\"#{ rowspan }\"" if rowspan
497
497
498 atts
498 atts
499 end
499 end
500
500
501 TABLE_RE = /^(?:table(_?#{S}#{A}#{C})\. ?\n)?^(#{A}#{C}\.? ?\|.*?\|)(\n\n|\Z)/m
501 TABLE_RE = /^(?:table(_?#{S}#{A}#{C})\. ?\n)?^(#{A}#{C}\.? ?\|.*?\|)(\n\n|\Z)/m
502
502
503 # Parses a Textile table block, building HTML from the result.
503 # Parses a Textile table block, building HTML from the result.
504 def block_textile_table( text )
504 def block_textile_table( text )
505 text.gsub!( TABLE_RE ) do |matches|
505 text.gsub!( TABLE_RE ) do |matches|
506
506
507 tatts, fullrow = $~[1..2]
507 tatts, fullrow = $~[1..2]
508 tatts = pba( tatts, 'table' )
508 tatts = pba( tatts, 'table' )
509 tatts = shelve( tatts ) if tatts
509 tatts = shelve( tatts ) if tatts
510 rows = []
510 rows = []
511
511
512 fullrow.each_line do |row|
512 fullrow.each_line do |row|
513 ratts, row = pba( $1, 'tr' ), $2 if row =~ /^(#{A}#{C}\. )(.*)/m
513 ratts, row = pba( $1, 'tr' ), $2 if row =~ /^(#{A}#{C}\. )(.*)/m
514 cells = []
514 cells = []
515 row.split( /(\|)(?![^\[\|]*\]\])/ )[1..-2].each do |cell|
515 row.split( /(\|)(?![^\[\|]*\]\])/ )[1..-2].each do |cell|
516 next if cell == '|'
516 next if cell == '|'
517 ctyp = 'd'
517 ctyp = 'd'
518 ctyp = 'h' if cell =~ /^_/
518 ctyp = 'h' if cell =~ /^_/
519
519
520 catts = ''
520 catts = ''
521 catts, cell = pba( $1, 'td' ), $2 if cell =~ /^(_?#{S}#{A}#{C}\. ?)(.*)/
521 catts, cell = pba( $1, 'td' ), $2 if cell =~ /^(_?#{S}#{A}#{C}\. ?)(.*)/
522
522
523 catts = shelve( catts ) if catts
523 catts = shelve( catts ) if catts
524 cells << "\t\t\t<t#{ ctyp }#{ catts }>#{ cell }</t#{ ctyp }>"
524 cells << "\t\t\t<t#{ ctyp }#{ catts }>#{ cell }</t#{ ctyp }>"
525 end
525 end
526 ratts = shelve( ratts ) if ratts
526 ratts = shelve( ratts ) if ratts
527 rows << "\t\t<tr#{ ratts }>\n#{ cells.join( "\n" ) }\n\t\t</tr>"
527 rows << "\t\t<tr#{ ratts }>\n#{ cells.join( "\n" ) }\n\t\t</tr>"
528 end
528 end
529 "\t<table#{ tatts }>\n#{ rows.join( "\n" ) }\n\t</table>\n\n"
529 "\t<table#{ tatts }>\n#{ rows.join( "\n" ) }\n\t</table>\n\n"
530 end
530 end
531 end
531 end
532
532
533 LISTS_RE = /^([#*]+?#{C} .*?)$(?![^#*])/m
533 LISTS_RE = /^([#*]+?#{C} .*?)$(?![^#*])/m
534 LISTS_CONTENT_RE = /^([#*]+)(#{A}#{C}) (.*)$/m
534 LISTS_CONTENT_RE = /^([#*]+)(#{A}#{C}) (.*)$/m
535
535
536 # Parses Textile lists and generates HTML
536 # Parses Textile lists and generates HTML
537 def block_textile_lists( text )
537 def block_textile_lists( text )
538 text.gsub!( LISTS_RE ) do |match|
538 text.gsub!( LISTS_RE ) do |match|
539 lines = match.split( /\n/ )
539 lines = match.split( /\n/ )
540 last_line = -1
540 last_line = -1
541 depth = []
541 depth = []
542 lines.each_with_index do |line, line_id|
542 lines.each_with_index do |line, line_id|
543 if line =~ LISTS_CONTENT_RE
543 if line =~ LISTS_CONTENT_RE
544 tl,atts,content = $~[1..3]
544 tl,atts,content = $~[1..3]
545 if depth.last
545 if depth.last
546 if depth.last.length > tl.length
546 if depth.last.length > tl.length
547 (depth.length - 1).downto(0) do |i|
547 (depth.length - 1).downto(0) do |i|
548 break if depth[i].length == tl.length
548 break if depth[i].length == tl.length
549 lines[line_id - 1] << "</li>\n\t</#{ lT( depth[i] ) }l>\n\t"
549 lines[line_id - 1] << "</li>\n\t</#{ lT( depth[i] ) }l>\n\t"
550 depth.pop
550 depth.pop
551 end
551 end
552 end
552 end
553 if depth.last and depth.last.length == tl.length
553 if depth.last and depth.last.length == tl.length
554 lines[line_id - 1] << '</li>'
554 lines[line_id - 1] << '</li>'
555 end
555 end
556 end
556 end
557 unless depth.last == tl
557 unless depth.last == tl
558 depth << tl
558 depth << tl
559 atts = pba( atts )
559 atts = pba( atts )
560 atts = shelve( atts ) if atts
560 atts = shelve( atts ) if atts
561 lines[line_id] = "\t<#{ lT(tl) }l#{ atts }>\n\t<li>#{ content }"
561 lines[line_id] = "\t<#{ lT(tl) }l#{ atts }>\n\t<li>#{ content }"
562 else
562 else
563 lines[line_id] = "\t\t<li>#{ content }"
563 lines[line_id] = "\t\t<li>#{ content }"
564 end
564 end
565 last_line = line_id
565 last_line = line_id
566
566
567 else
567 else
568 last_line = line_id
568 last_line = line_id
569 end
569 end
570 if line_id - last_line > 1 or line_id == lines.length - 1
570 if line_id - last_line > 1 or line_id == lines.length - 1
571 depth.delete_if do |v|
571 depth.delete_if do |v|
572 lines[last_line] << "</li>\n\t</#{ lT( v ) }l>"
572 lines[last_line] << "</li>\n\t</#{ lT( v ) }l>"
573 end
573 end
574 end
574 end
575 end
575 end
576 lines.join( "\n" )
576 lines.join( "\n" )
577 end
577 end
578 end
578 end
579
579
580 QUOTES_RE = /(^>+([^\n]*?)\n?)+/m
580 QUOTES_RE = /(^>+([^\n]*?)(\n|$))+/m
581 QUOTES_CONTENT_RE = /^([> ]+)(.*)$/m
581 QUOTES_CONTENT_RE = /^([> ]+)(.*)$/m
582
582
583 def block_textile_quotes( text )
583 def block_textile_quotes( text )
584 text.gsub!( QUOTES_RE ) do |match|
584 text.gsub!( QUOTES_RE ) do |match|
585 lines = match.split( /\n/ )
585 lines = match.split( /\n/ )
586 quotes = ''
586 quotes = ''
587 indent = 0
587 indent = 0
588 lines.each do |line|
588 lines.each do |line|
589 line =~ QUOTES_CONTENT_RE
589 line =~ QUOTES_CONTENT_RE
590 bq,content = $1, $2
590 bq,content = $1, $2
591 l = bq.count('>')
591 l = bq.count('>')
592 if l != indent
592 if l != indent
593 quotes << ("\n\n" + (l>indent ? '<blockquote>' * (l-indent) : '</blockquote>' * (indent-l)) + "\n\n")
593 quotes << ("\n\n" + (l>indent ? '<blockquote>' * (l-indent) : '</blockquote>' * (indent-l)) + "\n\n")
594 indent = l
594 indent = l
595 end
595 end
596 quotes << (content + "\n")
596 quotes << (content + "\n")
597 end
597 end
598 quotes << ("\n" + '</blockquote>' * indent + "\n\n")
598 quotes << ("\n" + '</blockquote>' * indent + "\n\n")
599 quotes
599 quotes
600 end
600 end
601 end
601 end
602
602
603 CODE_RE = /(\W)
603 CODE_RE = /(\W)
604 @
604 @
605 (?:\|(\w+?)\|)?
605 (?:\|(\w+?)\|)?
606 (.+?)
606 (.+?)
607 @
607 @
608 (?=\W)/x
608 (?=\W)/x
609
609
610 def inline_textile_code( text )
610 def inline_textile_code( text )
611 text.gsub!( CODE_RE ) do |m|
611 text.gsub!( CODE_RE ) do |m|
612 before,lang,code,after = $~[1..4]
612 before,lang,code,after = $~[1..4]
613 lang = " lang=\"#{ lang }\"" if lang
613 lang = " lang=\"#{ lang }\"" if lang
614 rip_offtags( "#{ before }<code#{ lang }>#{ code }</code>#{ after }" )
614 rip_offtags( "#{ before }<code#{ lang }>#{ code }</code>#{ after }" )
615 end
615 end
616 end
616 end
617
617
618 def lT( text )
618 def lT( text )
619 text =~ /\#$/ ? 'o' : 'u'
619 text =~ /\#$/ ? 'o' : 'u'
620 end
620 end
621
621
622 def hard_break( text )
622 def hard_break( text )
623 text.gsub!( /(.)\n(?!\Z| *([#*=]+(\s|$)|[{|]))/, "\\1<br />" ) if hard_breaks
623 text.gsub!( /(.)\n(?!\Z| *([#*=]+(\s|$)|[{|]))/, "\\1<br />" ) if hard_breaks
624 end
624 end
625
625
626 BLOCKS_GROUP_RE = /\n{2,}(?! )/m
626 BLOCKS_GROUP_RE = /\n{2,}(?! )/m
627
627
628 def blocks( text, deep_code = false )
628 def blocks( text, deep_code = false )
629 text.replace( text.split( BLOCKS_GROUP_RE ).collect do |blk|
629 text.replace( text.split( BLOCKS_GROUP_RE ).collect do |blk|
630 plain = blk !~ /\A[#*> ]/
630 plain = blk !~ /\A[#*> ]/
631
631
632 # skip blocks that are complex HTML
632 # skip blocks that are complex HTML
633 if blk =~ /^<\/?(\w+).*>/ and not SIMPLE_HTML_TAGS.include? $1
633 if blk =~ /^<\/?(\w+).*>/ and not SIMPLE_HTML_TAGS.include? $1
634 blk
634 blk
635 else
635 else
636 # search for indentation levels
636 # search for indentation levels
637 blk.strip!
637 blk.strip!
638 if blk.empty?
638 if blk.empty?
639 blk
639 blk
640 else
640 else
641 code_blk = nil
641 code_blk = nil
642 blk.gsub!( /((?:\n(?:\n^ +[^\n]*)+)+)/m ) do |iblk|
642 blk.gsub!( /((?:\n(?:\n^ +[^\n]*)+)+)/m ) do |iblk|
643 flush_left iblk
643 flush_left iblk
644 blocks iblk, plain
644 blocks iblk, plain
645 iblk.gsub( /^(\S)/, "\t\\1" )
645 iblk.gsub( /^(\S)/, "\t\\1" )
646 if plain
646 if plain
647 code_blk = iblk; ""
647 code_blk = iblk; ""
648 else
648 else
649 iblk
649 iblk
650 end
650 end
651 end
651 end
652
652
653 block_applied = 0
653 block_applied = 0
654 @rules.each do |rule_name|
654 @rules.each do |rule_name|
655 block_applied += 1 if ( rule_name.to_s.match /^block_/ and method( rule_name ).call( blk ) )
655 block_applied += 1 if ( rule_name.to_s.match /^block_/ and method( rule_name ).call( blk ) )
656 end
656 end
657 if block_applied.zero?
657 if block_applied.zero?
658 if deep_code
658 if deep_code
659 blk = "\t<pre><code>#{ blk }</code></pre>"
659 blk = "\t<pre><code>#{ blk }</code></pre>"
660 else
660 else
661 blk = "\t<p>#{ blk }</p>"
661 blk = "\t<p>#{ blk }</p>"
662 end
662 end
663 end
663 end
664 # hard_break blk
664 # hard_break blk
665 blk + "\n#{ code_blk }"
665 blk + "\n#{ code_blk }"
666 end
666 end
667 end
667 end
668
668
669 end.join( "\n\n" ) )
669 end.join( "\n\n" ) )
670 end
670 end
671
671
672 def textile_bq( tag, atts, cite, content )
672 def textile_bq( tag, atts, cite, content )
673 cite, cite_title = check_refs( cite )
673 cite, cite_title = check_refs( cite )
674 cite = " cite=\"#{ cite }\"" if cite
674 cite = " cite=\"#{ cite }\"" if cite
675 atts = shelve( atts ) if atts
675 atts = shelve( atts ) if atts
676 "\t<blockquote#{ cite }>\n\t\t<p#{ atts }>#{ content }</p>\n\t</blockquote>"
676 "\t<blockquote#{ cite }>\n\t\t<p#{ atts }>#{ content }</p>\n\t</blockquote>"
677 end
677 end
678
678
679 def textile_p( tag, atts, cite, content )
679 def textile_p( tag, atts, cite, content )
680 atts = shelve( atts ) if atts
680 atts = shelve( atts ) if atts
681 "\t<#{ tag }#{ atts }>#{ content }</#{ tag }>"
681 "\t<#{ tag }#{ atts }>#{ content }</#{ tag }>"
682 end
682 end
683
683
684 alias textile_h1 textile_p
684 alias textile_h1 textile_p
685 alias textile_h2 textile_p
685 alias textile_h2 textile_p
686 alias textile_h3 textile_p
686 alias textile_h3 textile_p
687 alias textile_h4 textile_p
687 alias textile_h4 textile_p
688 alias textile_h5 textile_p
688 alias textile_h5 textile_p
689 alias textile_h6 textile_p
689 alias textile_h6 textile_p
690
690
691 def textile_fn_( tag, num, atts, cite, content )
691 def textile_fn_( tag, num, atts, cite, content )
692 atts << " id=\"fn#{ num }\" class=\"footnote\""
692 atts << " id=\"fn#{ num }\" class=\"footnote\""
693 content = "<sup>#{ num }</sup> #{ content }"
693 content = "<sup>#{ num }</sup> #{ content }"
694 atts = shelve( atts ) if atts
694 atts = shelve( atts ) if atts
695 "\t<p#{ atts }>#{ content }</p>"
695 "\t<p#{ atts }>#{ content }</p>"
696 end
696 end
697
697
698 BLOCK_RE = /^(([a-z]+)(\d*))(#{A}#{C})\.(?::(\S+))? (.*)$/m
698 BLOCK_RE = /^(([a-z]+)(\d*))(#{A}#{C})\.(?::(\S+))? (.*)$/m
699
699
700 def block_textile_prefix( text )
700 def block_textile_prefix( text )
701 if text =~ BLOCK_RE
701 if text =~ BLOCK_RE
702 tag,tagpre,num,atts,cite,content = $~[1..6]
702 tag,tagpre,num,atts,cite,content = $~[1..6]
703 atts = pba( atts )
703 atts = pba( atts )
704
704
705 # pass to prefix handler
705 # pass to prefix handler
706 if respond_to? "textile_#{ tag }", true
706 if respond_to? "textile_#{ tag }", true
707 text.gsub!( $&, method( "textile_#{ tag }" ).call( tag, atts, cite, content ) )
707 text.gsub!( $&, method( "textile_#{ tag }" ).call( tag, atts, cite, content ) )
708 elsif respond_to? "textile_#{ tagpre }_", true
708 elsif respond_to? "textile_#{ tagpre }_", true
709 text.gsub!( $&, method( "textile_#{ tagpre }_" ).call( tagpre, num, atts, cite, content ) )
709 text.gsub!( $&, method( "textile_#{ tagpre }_" ).call( tagpre, num, atts, cite, content ) )
710 end
710 end
711 end
711 end
712 end
712 end
713
713
714 SETEXT_RE = /\A(.+?)\n([=-])[=-]* *$/m
714 SETEXT_RE = /\A(.+?)\n([=-])[=-]* *$/m
715 def block_markdown_setext( text )
715 def block_markdown_setext( text )
716 if text =~ SETEXT_RE
716 if text =~ SETEXT_RE
717 tag = if $2 == "="; "h1"; else; "h2"; end
717 tag = if $2 == "="; "h1"; else; "h2"; end
718 blk, cont = "<#{ tag }>#{ $1 }</#{ tag }>", $'
718 blk, cont = "<#{ tag }>#{ $1 }</#{ tag }>", $'
719 blocks cont
719 blocks cont
720 text.replace( blk + cont )
720 text.replace( blk + cont )
721 end
721 end
722 end
722 end
723
723
724 ATX_RE = /\A(\#{1,6}) # $1 = string of #'s
724 ATX_RE = /\A(\#{1,6}) # $1 = string of #'s
725 [ ]*
725 [ ]*
726 (.+?) # $2 = Header text
726 (.+?) # $2 = Header text
727 [ ]*
727 [ ]*
728 \#* # optional closing #'s (not counted)
728 \#* # optional closing #'s (not counted)
729 $/x
729 $/x
730 def block_markdown_atx( text )
730 def block_markdown_atx( text )
731 if text =~ ATX_RE
731 if text =~ ATX_RE
732 tag = "h#{ $1.length }"
732 tag = "h#{ $1.length }"
733 blk, cont = "<#{ tag }>#{ $2 }</#{ tag }>\n\n", $'
733 blk, cont = "<#{ tag }>#{ $2 }</#{ tag }>\n\n", $'
734 blocks cont
734 blocks cont
735 text.replace( blk + cont )
735 text.replace( blk + cont )
736 end
736 end
737 end
737 end
738
738
739 MARKDOWN_BQ_RE = /\A(^ *> ?.+$(.+\n)*\n*)+/m
739 MARKDOWN_BQ_RE = /\A(^ *> ?.+$(.+\n)*\n*)+/m
740
740
741 def block_markdown_bq( text )
741 def block_markdown_bq( text )
742 text.gsub!( MARKDOWN_BQ_RE ) do |blk|
742 text.gsub!( MARKDOWN_BQ_RE ) do |blk|
743 blk.gsub!( /^ *> ?/, '' )
743 blk.gsub!( /^ *> ?/, '' )
744 flush_left blk
744 flush_left blk
745 blocks blk
745 blocks blk
746 blk.gsub!( /^(\S)/, "\t\\1" )
746 blk.gsub!( /^(\S)/, "\t\\1" )
747 "<blockquote>\n#{ blk }\n</blockquote>\n\n"
747 "<blockquote>\n#{ blk }\n</blockquote>\n\n"
748 end
748 end
749 end
749 end
750
750
751 MARKDOWN_RULE_RE = /^(#{
751 MARKDOWN_RULE_RE = /^(#{
752 ['*', '-', '_'].collect { |ch| ' ?(' + Regexp::quote( ch ) + ' ?){3,}' }.join( '|' )
752 ['*', '-', '_'].collect { |ch| ' ?(' + Regexp::quote( ch ) + ' ?){3,}' }.join( '|' )
753 })$/
753 })$/
754
754
755 def block_markdown_rule( text )
755 def block_markdown_rule( text )
756 text.gsub!( MARKDOWN_RULE_RE ) do |blk|
756 text.gsub!( MARKDOWN_RULE_RE ) do |blk|
757 "<hr />"
757 "<hr />"
758 end
758 end
759 end
759 end
760
760
761 # XXX TODO XXX
761 # XXX TODO XXX
762 def block_markdown_lists( text )
762 def block_markdown_lists( text )
763 end
763 end
764
764
765 def inline_textile_span( text )
765 def inline_textile_span( text )
766 QTAGS.each do |qtag_rc, ht, qtag_re, rtype|
766 QTAGS.each do |qtag_rc, ht, qtag_re, rtype|
767 text.gsub!( qtag_re ) do |m|
767 text.gsub!( qtag_re ) do |m|
768
768
769 case rtype
769 case rtype
770 when :limit
770 when :limit
771 sta,qtag,atts,cite,content = $~[1..5]
771 sta,qtag,atts,cite,content = $~[1..5]
772 else
772 else
773 qtag,atts,cite,content = $~[1..4]
773 qtag,atts,cite,content = $~[1..4]
774 sta = ''
774 sta = ''
775 end
775 end
776 atts = pba( atts )
776 atts = pba( atts )
777 atts << " cite=\"#{ cite }\"" if cite
777 atts << " cite=\"#{ cite }\"" if cite
778 atts = shelve( atts ) if atts
778 atts = shelve( atts ) if atts
779
779
780 "#{ sta }<#{ ht }#{ atts }>#{ content }</#{ ht }>"
780 "#{ sta }<#{ ht }#{ atts }>#{ content }</#{ ht }>"
781
781
782 end
782 end
783 end
783 end
784 end
784 end
785
785
786 LINK_RE = /
786 LINK_RE = /
787 (
787 (
788 ([\s\[{(]|[#{PUNCT}])? # $pre
788 ([\s\[{(]|[#{PUNCT}])? # $pre
789 " # start
789 " # start
790 (#{C}) # $atts
790 (#{C}) # $atts
791 ([^"\n]+?) # $text
791 ([^"\n]+?) # $text
792 \s?
792 \s?
793 (?:\(([^)]+?)\)(?="))? # $title
793 (?:\(([^)]+?)\)(?="))? # $title
794 ":
794 ":
795 ( # $url
795 ( # $url
796 (\/|[a-zA-Z]+:\/\/|www\.|mailto:) # $proto
796 (\/|[a-zA-Z]+:\/\/|www\.|mailto:) # $proto
797 [\w\/]\S+?
797 [\w\/]\S+?
798 )
798 )
799 (\/)? # $slash
799 (\/)? # $slash
800 ([^\w\=\/;\(\)]*?) # $post
800 ([^\w\=\/;\(\)]*?) # $post
801 )
801 )
802 (?=<|\s|$)
802 (?=<|\s|$)
803 /x
803 /x
804 #"
804 #"
805 def inline_textile_link( text )
805 def inline_textile_link( text )
806 text.gsub!( LINK_RE ) do |m|
806 text.gsub!( LINK_RE ) do |m|
807 all,pre,atts,text,title,url,proto,slash,post = $~[1..9]
807 all,pre,atts,text,title,url,proto,slash,post = $~[1..9]
808 if text.include?('<br />')
808 if text.include?('<br />')
809 all
809 all
810 else
810 else
811 url, url_title = check_refs( url )
811 url, url_title = check_refs( url )
812 title ||= url_title
812 title ||= url_title
813
813
814 # Idea below : an URL with unbalanced parethesis and
814 # Idea below : an URL with unbalanced parethesis and
815 # ending by ')' is put into external parenthesis
815 # ending by ')' is put into external parenthesis
816 if ( url[-1]==?) and ((url.count("(") - url.count(")")) < 0 ) )
816 if ( url[-1]==?) and ((url.count("(") - url.count(")")) < 0 ) )
817 url=url[0..-2] # discard closing parenth from url
817 url=url[0..-2] # discard closing parenth from url
818 post = ")"+post # add closing parenth to post
818 post = ")"+post # add closing parenth to post
819 end
819 end
820 atts = pba( atts )
820 atts = pba( atts )
821 atts = " href=\"#{ url }#{ slash }\"#{ atts }"
821 atts = " href=\"#{ url }#{ slash }\"#{ atts }"
822 atts << " title=\"#{ htmlesc title }\"" if title
822 atts << " title=\"#{ htmlesc title }\"" if title
823 atts = shelve( atts ) if atts
823 atts = shelve( atts ) if atts
824
824
825 external = (url =~ /^https?:\/\//) ? ' class="external"' : ''
825 external = (url =~ /^https?:\/\//) ? ' class="external"' : ''
826
826
827 "#{ pre }<a#{ atts }#{ external }>#{ text }</a>#{ post }"
827 "#{ pre }<a#{ atts }#{ external }>#{ text }</a>#{ post }"
828 end
828 end
829 end
829 end
830 end
830 end
831
831
832 MARKDOWN_REFLINK_RE = /
832 MARKDOWN_REFLINK_RE = /
833 \[([^\[\]]+)\] # $text
833 \[([^\[\]]+)\] # $text
834 [ ]? # opt. space
834 [ ]? # opt. space
835 (?:\n[ ]*)? # one optional newline followed by spaces
835 (?:\n[ ]*)? # one optional newline followed by spaces
836 \[(.*?)\] # $id
836 \[(.*?)\] # $id
837 /x
837 /x
838
838
839 def inline_markdown_reflink( text )
839 def inline_markdown_reflink( text )
840 text.gsub!( MARKDOWN_REFLINK_RE ) do |m|
840 text.gsub!( MARKDOWN_REFLINK_RE ) do |m|
841 text, id = $~[1..2]
841 text, id = $~[1..2]
842
842
843 if id.empty?
843 if id.empty?
844 url, title = check_refs( text )
844 url, title = check_refs( text )
845 else
845 else
846 url, title = check_refs( id )
846 url, title = check_refs( id )
847 end
847 end
848
848
849 atts = " href=\"#{ url }\""
849 atts = " href=\"#{ url }\""
850 atts << " title=\"#{ title }\"" if title
850 atts << " title=\"#{ title }\"" if title
851 atts = shelve( atts )
851 atts = shelve( atts )
852
852
853 "<a#{ atts }>#{ text }</a>"
853 "<a#{ atts }>#{ text }</a>"
854 end
854 end
855 end
855 end
856
856
857 MARKDOWN_LINK_RE = /
857 MARKDOWN_LINK_RE = /
858 \[([^\[\]]+)\] # $text
858 \[([^\[\]]+)\] # $text
859 \( # open paren
859 \( # open paren
860 [ \t]* # opt space
860 [ \t]* # opt space
861 <?(.+?)>? # $href
861 <?(.+?)>? # $href
862 [ \t]* # opt space
862 [ \t]* # opt space
863 (?: # whole title
863 (?: # whole title
864 (['"]) # $quote
864 (['"]) # $quote
865 (.*?) # $title
865 (.*?) # $title
866 \3 # matching quote
866 \3 # matching quote
867 )? # title is optional
867 )? # title is optional
868 \)
868 \)
869 /x
869 /x
870
870
871 def inline_markdown_link( text )
871 def inline_markdown_link( text )
872 text.gsub!( MARKDOWN_LINK_RE ) do |m|
872 text.gsub!( MARKDOWN_LINK_RE ) do |m|
873 text, url, quote, title = $~[1..4]
873 text, url, quote, title = $~[1..4]
874
874
875 atts = " href=\"#{ url }\""
875 atts = " href=\"#{ url }\""
876 atts << " title=\"#{ title }\"" if title
876 atts << " title=\"#{ title }\"" if title
877 atts = shelve( atts )
877 atts = shelve( atts )
878
878
879 "<a#{ atts }>#{ text }</a>"
879 "<a#{ atts }>#{ text }</a>"
880 end
880 end
881 end
881 end
882
882
883 TEXTILE_REFS_RE = /(^ *)\[([^\[\n]+?)\](#{HYPERLINK})(?=\s|$)/
883 TEXTILE_REFS_RE = /(^ *)\[([^\[\n]+?)\](#{HYPERLINK})(?=\s|$)/
884 MARKDOWN_REFS_RE = /(^ *)\[([^\n]+?)\]:\s+<?(#{HYPERLINK})>?(?:\s+"((?:[^"]|\\")+)")?(?=\s|$)/m
884 MARKDOWN_REFS_RE = /(^ *)\[([^\n]+?)\]:\s+<?(#{HYPERLINK})>?(?:\s+"((?:[^"]|\\")+)")?(?=\s|$)/m
885
885
886 def refs( text )
886 def refs( text )
887 @rules.each do |rule_name|
887 @rules.each do |rule_name|
888 method( rule_name ).call( text ) if rule_name.to_s.match /^refs_/
888 method( rule_name ).call( text ) if rule_name.to_s.match /^refs_/
889 end
889 end
890 end
890 end
891
891
892 def refs_textile( text )
892 def refs_textile( text )
893 text.gsub!( TEXTILE_REFS_RE ) do |m|
893 text.gsub!( TEXTILE_REFS_RE ) do |m|
894 flag, url = $~[2..3]
894 flag, url = $~[2..3]
895 @urlrefs[flag.downcase] = [url, nil]
895 @urlrefs[flag.downcase] = [url, nil]
896 nil
896 nil
897 end
897 end
898 end
898 end
899
899
900 def refs_markdown( text )
900 def refs_markdown( text )
901 text.gsub!( MARKDOWN_REFS_RE ) do |m|
901 text.gsub!( MARKDOWN_REFS_RE ) do |m|
902 flag, url = $~[2..3]
902 flag, url = $~[2..3]
903 title = $~[6]
903 title = $~[6]
904 @urlrefs[flag.downcase] = [url, title]
904 @urlrefs[flag.downcase] = [url, title]
905 nil
905 nil
906 end
906 end
907 end
907 end
908
908
909 def check_refs( text )
909 def check_refs( text )
910 ret = @urlrefs[text.downcase] if text
910 ret = @urlrefs[text.downcase] if text
911 ret || [text, nil]
911 ret || [text, nil]
912 end
912 end
913
913
914 IMAGE_RE = /
914 IMAGE_RE = /
915 (>|\s|^) # start of line?
915 (>|\s|^) # start of line?
916 \! # opening
916 \! # opening
917 (\<|\=|\>)? # optional alignment atts
917 (\<|\=|\>)? # optional alignment atts
918 (#{C}) # optional style,class atts
918 (#{C}) # optional style,class atts
919 (?:\. )? # optional dot-space
919 (?:\. )? # optional dot-space
920 ([^\s(!]+?) # presume this is the src
920 ([^\s(!]+?) # presume this is the src
921 \s? # optional space
921 \s? # optional space
922 (?:\(((?:[^\(\)]|\([^\)]+\))+?)\))? # optional title
922 (?:\(((?:[^\(\)]|\([^\)]+\))+?)\))? # optional title
923 \! # closing
923 \! # closing
924 (?::#{ HYPERLINK })? # optional href
924 (?::#{ HYPERLINK })? # optional href
925 /x
925 /x
926
926
927 def inline_textile_image( text )
927 def inline_textile_image( text )
928 text.gsub!( IMAGE_RE ) do |m|
928 text.gsub!( IMAGE_RE ) do |m|
929 stln,algn,atts,url,title,href,href_a1,href_a2 = $~[1..8]
929 stln,algn,atts,url,title,href,href_a1,href_a2 = $~[1..8]
930 htmlesc title
930 htmlesc title
931 atts = pba( atts )
931 atts = pba( atts )
932 atts = " src=\"#{ url }\"#{ atts }"
932 atts = " src=\"#{ url }\"#{ atts }"
933 atts << " title=\"#{ title }\"" if title
933 atts << " title=\"#{ title }\"" if title
934 atts << " alt=\"#{ title }\""
934 atts << " alt=\"#{ title }\""
935 # size = @getimagesize($url);
935 # size = @getimagesize($url);
936 # if($size) $atts.= " $size[3]";
936 # if($size) $atts.= " $size[3]";
937
937
938 href, alt_title = check_refs( href ) if href
938 href, alt_title = check_refs( href ) if href
939 url, url_title = check_refs( url )
939 url, url_title = check_refs( url )
940
940
941 out = ''
941 out = ''
942 out << "<a#{ shelve( " href=\"#{ href }\"" ) }>" if href
942 out << "<a#{ shelve( " href=\"#{ href }\"" ) }>" if href
943 out << "<img#{ shelve( atts ) } />"
943 out << "<img#{ shelve( atts ) } />"
944 out << "</a>#{ href_a1 }#{ href_a2 }" if href
944 out << "</a>#{ href_a1 }#{ href_a2 }" if href
945
945
946 if algn
946 if algn
947 algn = h_align( algn )
947 algn = h_align( algn )
948 if stln == "<p>"
948 if stln == "<p>"
949 out = "<p style=\"float:#{ algn }\">#{ out }"
949 out = "<p style=\"float:#{ algn }\">#{ out }"
950 else
950 else
951 out = "#{ stln }<div style=\"float:#{ algn }\">#{ out }</div>"
951 out = "#{ stln }<div style=\"float:#{ algn }\">#{ out }</div>"
952 end
952 end
953 else
953 else
954 out = stln + out
954 out = stln + out
955 end
955 end
956
956
957 out
957 out
958 end
958 end
959 end
959 end
960
960
961 def shelve( val )
961 def shelve( val )
962 @shelf << val
962 @shelf << val
963 " :redsh##{ @shelf.length }:"
963 " :redsh##{ @shelf.length }:"
964 end
964 end
965
965
966 def retrieve( text )
966 def retrieve( text )
967 @shelf.each_with_index do |r, i|
967 @shelf.each_with_index do |r, i|
968 text.gsub!( " :redsh##{ i + 1 }:", r )
968 text.gsub!( " :redsh##{ i + 1 }:", r )
969 end
969 end
970 end
970 end
971
971
972 def incoming_entities( text )
972 def incoming_entities( text )
973 ## turn any incoming ampersands into a dummy character for now.
973 ## turn any incoming ampersands into a dummy character for now.
974 ## This uses a negative lookahead for alphanumerics followed by a semicolon,
974 ## This uses a negative lookahead for alphanumerics followed by a semicolon,
975 ## implying an incoming html entity, to be skipped
975 ## implying an incoming html entity, to be skipped
976
976
977 text.gsub!( /&(?![#a-z0-9]+;)/i, "x%x%" )
977 text.gsub!( /&(?![#a-z0-9]+;)/i, "x%x%" )
978 end
978 end
979
979
980 def no_textile( text )
980 def no_textile( text )
981 text.gsub!( /(^|\s)==([^=]+.*?)==(\s|$)?/,
981 text.gsub!( /(^|\s)==([^=]+.*?)==(\s|$)?/,
982 '\1<notextile>\2</notextile>\3' )
982 '\1<notextile>\2</notextile>\3' )
983 text.gsub!( /^ *==([^=]+.*?)==/m,
983 text.gsub!( /^ *==([^=]+.*?)==/m,
984 '\1<notextile>\2</notextile>\3' )
984 '\1<notextile>\2</notextile>\3' )
985 end
985 end
986
986
987 def clean_white_space( text )
987 def clean_white_space( text )
988 # normalize line breaks
988 # normalize line breaks
989 text.gsub!( /\r\n/, "\n" )
989 text.gsub!( /\r\n/, "\n" )
990 text.gsub!( /\r/, "\n" )
990 text.gsub!( /\r/, "\n" )
991 text.gsub!( /\t/, ' ' )
991 text.gsub!( /\t/, ' ' )
992 text.gsub!( /^ +$/, '' )
992 text.gsub!( /^ +$/, '' )
993 text.gsub!( /\n{3,}/, "\n\n" )
993 text.gsub!( /\n{3,}/, "\n\n" )
994 text.gsub!( /"$/, "\" " )
994 text.gsub!( /"$/, "\" " )
995
995
996 # if entire document is indented, flush
996 # if entire document is indented, flush
997 # to the left side
997 # to the left side
998 flush_left text
998 flush_left text
999 end
999 end
1000
1000
1001 def flush_left( text )
1001 def flush_left( text )
1002 indt = 0
1002 indt = 0
1003 if text =~ /^ /
1003 if text =~ /^ /
1004 while text !~ /^ {#{indt}}\S/
1004 while text !~ /^ {#{indt}}\S/
1005 indt += 1
1005 indt += 1
1006 end unless text.empty?
1006 end unless text.empty?
1007 if indt.nonzero?
1007 if indt.nonzero?
1008 text.gsub!( /^ {#{indt}}/, '' )
1008 text.gsub!( /^ {#{indt}}/, '' )
1009 end
1009 end
1010 end
1010 end
1011 end
1011 end
1012
1012
1013 def footnote_ref( text )
1013 def footnote_ref( text )
1014 text.gsub!( /\b\[([0-9]+?)\](\s)?/,
1014 text.gsub!( /\b\[([0-9]+?)\](\s)?/,
1015 '<sup><a href="#fn\1">\1</a></sup>\2' )
1015 '<sup><a href="#fn\1">\1</a></sup>\2' )
1016 end
1016 end
1017
1017
1018 OFFTAGS = /(code|pre|kbd|notextile)/
1018 OFFTAGS = /(code|pre|kbd|notextile)/
1019 OFFTAG_MATCH = /(?:(<\/#{ OFFTAGS }>)|(<#{ OFFTAGS }[^>]*>))(.*?)(?=<\/?#{ OFFTAGS }|\Z)/mi
1019 OFFTAG_MATCH = /(?:(<\/#{ OFFTAGS }>)|(<#{ OFFTAGS }[^>]*>))(.*?)(?=<\/?#{ OFFTAGS }|\Z)/mi
1020 OFFTAG_OPEN = /<#{ OFFTAGS }/
1020 OFFTAG_OPEN = /<#{ OFFTAGS }/
1021 OFFTAG_CLOSE = /<\/?#{ OFFTAGS }/
1021 OFFTAG_CLOSE = /<\/?#{ OFFTAGS }/
1022 HASTAG_MATCH = /(<\/?\w[^\n]*?>)/m
1022 HASTAG_MATCH = /(<\/?\w[^\n]*?>)/m
1023 ALLTAG_MATCH = /(<\/?\w[^\n]*?>)|.*?(?=<\/?\w[^\n]*?>|$)/m
1023 ALLTAG_MATCH = /(<\/?\w[^\n]*?>)|.*?(?=<\/?\w[^\n]*?>|$)/m
1024
1024
1025 def glyphs_textile( text, level = 0 )
1025 def glyphs_textile( text, level = 0 )
1026 if text !~ HASTAG_MATCH
1026 if text !~ HASTAG_MATCH
1027 pgl text
1027 pgl text
1028 footnote_ref text
1028 footnote_ref text
1029 else
1029 else
1030 codepre = 0
1030 codepre = 0
1031 text.gsub!( ALLTAG_MATCH ) do |line|
1031 text.gsub!( ALLTAG_MATCH ) do |line|
1032 ## matches are off if we're between <code>, <pre> etc.
1032 ## matches are off if we're between <code>, <pre> etc.
1033 if $1
1033 if $1
1034 if line =~ OFFTAG_OPEN
1034 if line =~ OFFTAG_OPEN
1035 codepre += 1
1035 codepre += 1
1036 elsif line =~ OFFTAG_CLOSE
1036 elsif line =~ OFFTAG_CLOSE
1037 codepre -= 1
1037 codepre -= 1
1038 codepre = 0 if codepre < 0
1038 codepre = 0 if codepre < 0
1039 end
1039 end
1040 elsif codepre.zero?
1040 elsif codepre.zero?
1041 glyphs_textile( line, level + 1 )
1041 glyphs_textile( line, level + 1 )
1042 else
1042 else
1043 htmlesc( line, :NoQuotes )
1043 htmlesc( line, :NoQuotes )
1044 end
1044 end
1045 # p [level, codepre, line]
1045 # p [level, codepre, line]
1046
1046
1047 line
1047 line
1048 end
1048 end
1049 end
1049 end
1050 end
1050 end
1051
1051
1052 def rip_offtags( text )
1052 def rip_offtags( text )
1053 if text =~ /<.*>/
1053 if text =~ /<.*>/
1054 ## strip and encode <pre> content
1054 ## strip and encode <pre> content
1055 codepre, used_offtags = 0, {}
1055 codepre, used_offtags = 0, {}
1056 text.gsub!( OFFTAG_MATCH ) do |line|
1056 text.gsub!( OFFTAG_MATCH ) do |line|
1057 if $3
1057 if $3
1058 offtag, aftertag = $4, $5
1058 offtag, aftertag = $4, $5
1059 codepre += 1
1059 codepre += 1
1060 used_offtags[offtag] = true
1060 used_offtags[offtag] = true
1061 if codepre - used_offtags.length > 0
1061 if codepre - used_offtags.length > 0
1062 htmlesc( line, :NoQuotes )
1062 htmlesc( line, :NoQuotes )
1063 @pre_list.last << line
1063 @pre_list.last << line
1064 line = ""
1064 line = ""
1065 else
1065 else
1066 htmlesc( aftertag, :NoQuotes ) if aftertag
1066 htmlesc( aftertag, :NoQuotes ) if aftertag
1067 line = "<redpre##{ @pre_list.length }>"
1067 line = "<redpre##{ @pre_list.length }>"
1068 $3.match(/<#{ OFFTAGS }([^>]*)>/)
1068 $3.match(/<#{ OFFTAGS }([^>]*)>/)
1069 tag = $1
1069 tag = $1
1070 $2.to_s.match(/(class\=\S+)/i)
1070 $2.to_s.match(/(class\=\S+)/i)
1071 tag << " #{$1}" if $1
1071 tag << " #{$1}" if $1
1072 @pre_list << "<#{ tag }>#{ aftertag }"
1072 @pre_list << "<#{ tag }>#{ aftertag }"
1073 end
1073 end
1074 elsif $1 and codepre > 0
1074 elsif $1 and codepre > 0
1075 if codepre - used_offtags.length > 0
1075 if codepre - used_offtags.length > 0
1076 htmlesc( line, :NoQuotes )
1076 htmlesc( line, :NoQuotes )
1077 @pre_list.last << line
1077 @pre_list.last << line
1078 line = ""
1078 line = ""
1079 end
1079 end
1080 codepre -= 1 unless codepre.zero?
1080 codepre -= 1 unless codepre.zero?
1081 used_offtags = {} if codepre.zero?
1081 used_offtags = {} if codepre.zero?
1082 end
1082 end
1083 line
1083 line
1084 end
1084 end
1085 end
1085 end
1086 text
1086 text
1087 end
1087 end
1088
1088
1089 def smooth_offtags( text )
1089 def smooth_offtags( text )
1090 unless @pre_list.empty?
1090 unless @pre_list.empty?
1091 ## replace <pre> content
1091 ## replace <pre> content
1092 text.gsub!( /<redpre#(\d+)>/ ) { @pre_list[$1.to_i] }
1092 text.gsub!( /<redpre#(\d+)>/ ) { @pre_list[$1.to_i] }
1093 end
1093 end
1094 end
1094 end
1095
1095
1096 def inline( text )
1096 def inline( text )
1097 [/^inline_/, /^glyphs_/].each do |meth_re|
1097 [/^inline_/, /^glyphs_/].each do |meth_re|
1098 @rules.each do |rule_name|
1098 @rules.each do |rule_name|
1099 method( rule_name ).call( text ) if rule_name.to_s.match( meth_re )
1099 method( rule_name ).call( text ) if rule_name.to_s.match( meth_re )
1100 end
1100 end
1101 end
1101 end
1102 end
1102 end
1103
1103
1104 def h_align( text )
1104 def h_align( text )
1105 H_ALGN_VALS[text]
1105 H_ALGN_VALS[text]
1106 end
1106 end
1107
1107
1108 def v_align( text )
1108 def v_align( text )
1109 V_ALGN_VALS[text]
1109 V_ALGN_VALS[text]
1110 end
1110 end
1111
1111
1112 def textile_popup_help( name, windowW, windowH )
1112 def textile_popup_help( name, windowW, windowH )
1113 ' <a target="_blank" href="http://hobix.com/textile/#' + helpvar + '" onclick="window.open(this.href, \'popupwindow\', \'width=' + windowW + ',height=' + windowH + ',scrollbars,resizable\'); return false;">' + name + '</a><br />'
1113 ' <a target="_blank" href="http://hobix.com/textile/#' + helpvar + '" onclick="window.open(this.href, \'popupwindow\', \'width=' + windowW + ',height=' + windowH + ',scrollbars,resizable\'); return false;">' + name + '</a><br />'
1114 end
1114 end
1115
1115
1116 # HTML cleansing stuff
1116 # HTML cleansing stuff
1117 BASIC_TAGS = {
1117 BASIC_TAGS = {
1118 'a' => ['href', 'title'],
1118 'a' => ['href', 'title'],
1119 'img' => ['src', 'alt', 'title'],
1119 'img' => ['src', 'alt', 'title'],
1120 'br' => [],
1120 'br' => [],
1121 'i' => nil,
1121 'i' => nil,
1122 'u' => nil,
1122 'u' => nil,
1123 'b' => nil,
1123 'b' => nil,
1124 'pre' => nil,
1124 'pre' => nil,
1125 'kbd' => nil,
1125 'kbd' => nil,
1126 'code' => ['lang'],
1126 'code' => ['lang'],
1127 'cite' => nil,
1127 'cite' => nil,
1128 'strong' => nil,
1128 'strong' => nil,
1129 'em' => nil,
1129 'em' => nil,
1130 'ins' => nil,
1130 'ins' => nil,
1131 'sup' => nil,
1131 'sup' => nil,
1132 'sub' => nil,
1132 'sub' => nil,
1133 'del' => nil,
1133 'del' => nil,
1134 'table' => nil,
1134 'table' => nil,
1135 'tr' => nil,
1135 'tr' => nil,
1136 'td' => ['colspan', 'rowspan'],
1136 'td' => ['colspan', 'rowspan'],
1137 'th' => nil,
1137 'th' => nil,
1138 'ol' => nil,
1138 'ol' => nil,
1139 'ul' => nil,
1139 'ul' => nil,
1140 'li' => nil,
1140 'li' => nil,
1141 'p' => nil,
1141 'p' => nil,
1142 'h1' => nil,
1142 'h1' => nil,
1143 'h2' => nil,
1143 'h2' => nil,
1144 'h3' => nil,
1144 'h3' => nil,
1145 'h4' => nil,
1145 'h4' => nil,
1146 'h5' => nil,
1146 'h5' => nil,
1147 'h6' => nil,
1147 'h6' => nil,
1148 'blockquote' => ['cite']
1148 'blockquote' => ['cite']
1149 }
1149 }
1150
1150
1151 def clean_html( text, tags = BASIC_TAGS )
1151 def clean_html( text, tags = BASIC_TAGS )
1152 text.gsub!( /<!\[CDATA\[/, '' )
1152 text.gsub!( /<!\[CDATA\[/, '' )
1153 text.gsub!( /<(\/*)(\w+)([^>]*)>/ ) do
1153 text.gsub!( /<(\/*)(\w+)([^>]*)>/ ) do
1154 raw = $~
1154 raw = $~
1155 tag = raw[2].downcase
1155 tag = raw[2].downcase
1156 if tags.has_key? tag
1156 if tags.has_key? tag
1157 pcs = [tag]
1157 pcs = [tag]
1158 tags[tag].each do |prop|
1158 tags[tag].each do |prop|
1159 ['"', "'", ''].each do |q|
1159 ['"', "'", ''].each do |q|
1160 q2 = ( q != '' ? q : '\s' )
1160 q2 = ( q != '' ? q : '\s' )
1161 if raw[3] =~ /#{prop}\s*=\s*#{q}([^#{q2}]+)#{q}/i
1161 if raw[3] =~ /#{prop}\s*=\s*#{q}([^#{q2}]+)#{q}/i
1162 attrv = $1
1162 attrv = $1
1163 next if prop == 'src' and attrv =~ %r{^(?!http)\w+:}
1163 next if prop == 'src' and attrv =~ %r{^(?!http)\w+:}
1164 pcs << "#{prop}=\"#{$1.gsub('"', '\\"')}\""
1164 pcs << "#{prop}=\"#{$1.gsub('"', '\\"')}\""
1165 break
1165 break
1166 end
1166 end
1167 end
1167 end
1168 end if tags[tag]
1168 end if tags[tag]
1169 "<#{raw[1]}#{pcs.join " "}>"
1169 "<#{raw[1]}#{pcs.join " "}>"
1170 else
1170 else
1171 " "
1171 " "
1172 end
1172 end
1173 end
1173 end
1174 end
1174 end
1175
1175
1176 ALLOWED_TAGS = %w(redpre pre code notextile)
1176 ALLOWED_TAGS = %w(redpre pre code notextile)
1177
1177
1178 def escape_html_tags(text)
1178 def escape_html_tags(text)
1179 text.gsub!(%r{<(\/?([!\w]+)[^<>\n]*)(>?)}) {|m| ALLOWED_TAGS.include?($2) ? "<#{$1}#{$3}" : "&lt;#{$1}#{'&gt;' unless $3.blank?}" }
1179 text.gsub!(%r{<(\/?([!\w]+)[^<>\n]*)(>?)}) {|m| ALLOWED_TAGS.include?($2) ? "<#{$1}#{$3}" : "&lt;#{$1}#{'&gt;' unless $3.blank?}" }
1180 end
1180 end
1181 end
1181 end
1182
1182
General Comments 0
You need to be logged in to leave comments. Login now