##// END OF EJS Templates
Stricter textile links parsing (#2417)....
Jean-Philippe Lang -
r2210:8b7fb7213f0e
parent child
Show More
@@ -1,1174 +1,1177
1 # vim:ts=4:sw=4:
1 # vim:ts=4:sw=4:
2 # = RedCloth - Textile and Markdown Hybrid for Ruby
2 # = RedCloth - Textile and Markdown Hybrid for Ruby
3 #
3 #
4 # Homepage:: http://whytheluckystiff.net/ruby/redcloth/
4 # Homepage:: http://whytheluckystiff.net/ruby/redcloth/
5 # Author:: why the lucky stiff (http://whytheluckystiff.net/)
5 # Author:: why the lucky stiff (http://whytheluckystiff.net/)
6 # Copyright:: (cc) 2004 why the lucky stiff (and his puppet organizations.)
6 # Copyright:: (cc) 2004 why the lucky stiff (and his puppet organizations.)
7 # License:: BSD
7 # License:: BSD
8 #
8 #
9 # (see http://hobix.com/textile/ for a Textile Reference.)
9 # (see http://hobix.com/textile/ for a Textile Reference.)
10 #
10 #
11 # Based on (and also inspired by) both:
11 # Based on (and also inspired by) both:
12 #
12 #
13 # PyTextile: http://diveintomark.org/projects/textile/textile.py.txt
13 # PyTextile: http://diveintomark.org/projects/textile/textile.py.txt
14 # Textism for PHP: http://www.textism.com/tools/textile/
14 # Textism for PHP: http://www.textism.com/tools/textile/
15 #
15 #
16 #
16 #
17
17
18 # = RedCloth
18 # = RedCloth
19 #
19 #
20 # RedCloth is a Ruby library for converting Textile and/or Markdown
20 # RedCloth is a Ruby library for converting Textile and/or Markdown
21 # into HTML. You can use either format, intermingled or separately.
21 # into HTML. You can use either format, intermingled or separately.
22 # You can also extend RedCloth to honor your own custom text stylings.
22 # You can also extend RedCloth to honor your own custom text stylings.
23 #
23 #
24 # RedCloth users are encouraged to use Textile if they are generating
24 # RedCloth users are encouraged to use Textile if they are generating
25 # HTML and to use Markdown if others will be viewing the plain text.
25 # HTML and to use Markdown if others will be viewing the plain text.
26 #
26 #
27 # == What is Textile?
27 # == What is Textile?
28 #
28 #
29 # Textile is a simple formatting style for text
29 # Textile is a simple formatting style for text
30 # documents, loosely based on some HTML conventions.
30 # documents, loosely based on some HTML conventions.
31 #
31 #
32 # == Sample Textile Text
32 # == Sample Textile Text
33 #
33 #
34 # h2. This is a title
34 # h2. This is a title
35 #
35 #
36 # h3. This is a subhead
36 # h3. This is a subhead
37 #
37 #
38 # This is a bit of paragraph.
38 # This is a bit of paragraph.
39 #
39 #
40 # bq. This is a blockquote.
40 # bq. This is a blockquote.
41 #
41 #
42 # = Writing Textile
42 # = Writing Textile
43 #
43 #
44 # A Textile document consists of paragraphs. Paragraphs
44 # A Textile document consists of paragraphs. Paragraphs
45 # can be specially formatted by adding a small instruction
45 # can be specially formatted by adding a small instruction
46 # to the beginning of the paragraph.
46 # to the beginning of the paragraph.
47 #
47 #
48 # h[n]. Header of size [n].
48 # h[n]. Header of size [n].
49 # bq. Blockquote.
49 # bq. Blockquote.
50 # # Numeric list.
50 # # Numeric list.
51 # * Bulleted list.
51 # * Bulleted list.
52 #
52 #
53 # == Quick Phrase Modifiers
53 # == Quick Phrase Modifiers
54 #
54 #
55 # Quick phrase modifiers are also included, to allow formatting
55 # Quick phrase modifiers are also included, to allow formatting
56 # of small portions of text within a paragraph.
56 # of small portions of text within a paragraph.
57 #
57 #
58 # \_emphasis\_
58 # \_emphasis\_
59 # \_\_italicized\_\_
59 # \_\_italicized\_\_
60 # \*strong\*
60 # \*strong\*
61 # \*\*bold\*\*
61 # \*\*bold\*\*
62 # ??citation??
62 # ??citation??
63 # -deleted text-
63 # -deleted text-
64 # +inserted text+
64 # +inserted text+
65 # ^superscript^
65 # ^superscript^
66 # ~subscript~
66 # ~subscript~
67 # @code@
67 # @code@
68 # %(classname)span%
68 # %(classname)span%
69 #
69 #
70 # ==notextile== (leave text alone)
70 # ==notextile== (leave text alone)
71 #
71 #
72 # == Links
72 # == Links
73 #
73 #
74 # To make a hypertext link, put the link text in "quotation
74 # To make a hypertext link, put the link text in "quotation
75 # marks" followed immediately by a colon and the URL of the link.
75 # marks" followed immediately by a colon and the URL of the link.
76 #
76 #
77 # Optional: text in (parentheses) following the link text,
77 # Optional: text in (parentheses) following the link text,
78 # but before the closing quotation mark, will become a Title
78 # but before the closing quotation mark, will become a Title
79 # attribute for the link, visible as a tool tip when a cursor is above it.
79 # attribute for the link, visible as a tool tip when a cursor is above it.
80 #
80 #
81 # Example:
81 # Example:
82 #
82 #
83 # "This is a link (This is a title) ":http://www.textism.com
83 # "This is a link (This is a title) ":http://www.textism.com
84 #
84 #
85 # Will become:
85 # Will become:
86 #
86 #
87 # <a href="http://www.textism.com" title="This is a title">This is a link</a>
87 # <a href="http://www.textism.com" title="This is a title">This is a link</a>
88 #
88 #
89 # == Images
89 # == Images
90 #
90 #
91 # To insert an image, put the URL for the image inside exclamation marks.
91 # To insert an image, put the URL for the image inside exclamation marks.
92 #
92 #
93 # Optional: text that immediately follows the URL in (parentheses) will
93 # Optional: text that immediately follows the URL in (parentheses) will
94 # be used as the Alt text for the image. Images on the web should always
94 # be used as the Alt text for the image. Images on the web should always
95 # have descriptive Alt text for the benefit of readers using non-graphical
95 # have descriptive Alt text for the benefit of readers using non-graphical
96 # browsers.
96 # browsers.
97 #
97 #
98 # Optional: place a colon followed by a URL immediately after the
98 # Optional: place a colon followed by a URL immediately after the
99 # closing ! to make the image into a link.
99 # closing ! to make the image into a link.
100 #
100 #
101 # Example:
101 # Example:
102 #
102 #
103 # !http://www.textism.com/common/textist.gif(Textist)!
103 # !http://www.textism.com/common/textist.gif(Textist)!
104 #
104 #
105 # Will become:
105 # Will become:
106 #
106 #
107 # <img src="http://www.textism.com/common/textist.gif" alt="Textist" />
107 # <img src="http://www.textism.com/common/textist.gif" alt="Textist" />
108 #
108 #
109 # With a link:
109 # With a link:
110 #
110 #
111 # !/common/textist.gif(Textist)!:http://textism.com
111 # !/common/textist.gif(Textist)!:http://textism.com
112 #
112 #
113 # Will become:
113 # Will become:
114 #
114 #
115 # <a href="http://textism.com"><img src="/common/textist.gif" alt="Textist" /></a>
115 # <a href="http://textism.com"><img src="/common/textist.gif" alt="Textist" /></a>
116 #
116 #
117 # == Defining Acronyms
117 # == Defining Acronyms
118 #
118 #
119 # HTML allows authors to define acronyms via the tag. The definition appears as a
119 # HTML allows authors to define acronyms via the tag. The definition appears as a
120 # tool tip when a cursor hovers over the acronym. A crucial aid to clear writing,
120 # tool tip when a cursor hovers over the acronym. A crucial aid to clear writing,
121 # this should be used at least once for each acronym in documents where they appear.
121 # this should be used at least once for each acronym in documents where they appear.
122 #
122 #
123 # To quickly define an acronym in Textile, place the full text in (parentheses)
123 # To quickly define an acronym in Textile, place the full text in (parentheses)
124 # immediately following the acronym.
124 # immediately following the acronym.
125 #
125 #
126 # Example:
126 # Example:
127 #
127 #
128 # ACLU(American Civil Liberties Union)
128 # ACLU(American Civil Liberties Union)
129 #
129 #
130 # Will become:
130 # Will become:
131 #
131 #
132 # <acronym title="American Civil Liberties Union">ACLU</acronym>
132 # <acronym title="American Civil Liberties Union">ACLU</acronym>
133 #
133 #
134 # == Adding Tables
134 # == Adding Tables
135 #
135 #
136 # In Textile, simple tables can be added by seperating each column by
136 # In Textile, simple tables can be added by seperating each column by
137 # a pipe.
137 # a pipe.
138 #
138 #
139 # |a|simple|table|row|
139 # |a|simple|table|row|
140 # |And|Another|table|row|
140 # |And|Another|table|row|
141 #
141 #
142 # Attributes are defined by style definitions in parentheses.
142 # Attributes are defined by style definitions in parentheses.
143 #
143 #
144 # table(border:1px solid black).
144 # table(border:1px solid black).
145 # (background:#ddd;color:red). |{}| | | |
145 # (background:#ddd;color:red). |{}| | | |
146 #
146 #
147 # == Using RedCloth
147 # == Using RedCloth
148 #
148 #
149 # RedCloth is simply an extension of the String class, which can handle
149 # RedCloth is simply an extension of the String class, which can handle
150 # Textile formatting. Use it like a String and output HTML with its
150 # Textile formatting. Use it like a String and output HTML with its
151 # RedCloth#to_html method.
151 # RedCloth#to_html method.
152 #
152 #
153 # doc = RedCloth.new "
153 # doc = RedCloth.new "
154 #
154 #
155 # h2. Test document
155 # h2. Test document
156 #
156 #
157 # Just a simple test."
157 # Just a simple test."
158 #
158 #
159 # puts doc.to_html
159 # puts doc.to_html
160 #
160 #
161 # By default, RedCloth uses both Textile and Markdown formatting, with
161 # By default, RedCloth uses both Textile and Markdown formatting, with
162 # Textile formatting taking precedence. If you want to turn off Markdown
162 # Textile formatting taking precedence. If you want to turn off Markdown
163 # formatting, to boost speed and limit the processor:
163 # formatting, to boost speed and limit the processor:
164 #
164 #
165 # class RedCloth::Textile.new( str )
165 # class RedCloth::Textile.new( str )
166
166
167 class RedCloth3 < String
167 class RedCloth3 < String
168
168
169 VERSION = '3.0.4'
169 VERSION = '3.0.4'
170 DEFAULT_RULES = [:textile, :markdown]
170 DEFAULT_RULES = [:textile, :markdown]
171
171
172 #
172 #
173 # Two accessor for setting security restrictions.
173 # Two accessor for setting security restrictions.
174 #
174 #
175 # This is a nice thing if you're using RedCloth for
175 # This is a nice thing if you're using RedCloth for
176 # formatting in public places (e.g. Wikis) where you
176 # formatting in public places (e.g. Wikis) where you
177 # don't want users to abuse HTML for bad things.
177 # don't want users to abuse HTML for bad things.
178 #
178 #
179 # If +:filter_html+ is set, HTML which wasn't
179 # If +:filter_html+ is set, HTML which wasn't
180 # created by the Textile processor will be escaped.
180 # created by the Textile processor will be escaped.
181 #
181 #
182 # If +:filter_styles+ is set, it will also disable
182 # If +:filter_styles+ is set, it will also disable
183 # the style markup specifier. ('{color: red}')
183 # the style markup specifier. ('{color: red}')
184 #
184 #
185 attr_accessor :filter_html, :filter_styles
185 attr_accessor :filter_html, :filter_styles
186
186
187 #
187 #
188 # Accessor for toggling hard breaks.
188 # Accessor for toggling hard breaks.
189 #
189 #
190 # If +:hard_breaks+ is set, single newlines will
190 # If +:hard_breaks+ is set, single newlines will
191 # be converted to HTML break tags. This is the
191 # be converted to HTML break tags. This is the
192 # default behavior for traditional RedCloth.
192 # default behavior for traditional RedCloth.
193 #
193 #
194 attr_accessor :hard_breaks
194 attr_accessor :hard_breaks
195
195
196 # Accessor for toggling lite mode.
196 # Accessor for toggling lite mode.
197 #
197 #
198 # In lite mode, block-level rules are ignored. This means
198 # In lite mode, block-level rules are ignored. This means
199 # that tables, paragraphs, lists, and such aren't available.
199 # that tables, paragraphs, lists, and such aren't available.
200 # Only the inline markup for bold, italics, entities and so on.
200 # Only the inline markup for bold, italics, entities and so on.
201 #
201 #
202 # r = RedCloth.new( "And then? She *fell*!", [:lite_mode] )
202 # r = RedCloth.new( "And then? She *fell*!", [:lite_mode] )
203 # r.to_html
203 # r.to_html
204 # #=> "And then? She <strong>fell</strong>!"
204 # #=> "And then? She <strong>fell</strong>!"
205 #
205 #
206 attr_accessor :lite_mode
206 attr_accessor :lite_mode
207
207
208 #
208 #
209 # Accessor for toggling span caps.
209 # Accessor for toggling span caps.
210 #
210 #
211 # Textile places `span' tags around capitalized
211 # Textile places `span' tags around capitalized
212 # words by default, but this wreaks havoc on Wikis.
212 # words by default, but this wreaks havoc on Wikis.
213 # If +:no_span_caps+ is set, this will be
213 # If +:no_span_caps+ is set, this will be
214 # suppressed.
214 # suppressed.
215 #
215 #
216 attr_accessor :no_span_caps
216 attr_accessor :no_span_caps
217
217
218 #
218 #
219 # Establishes the markup predence. Available rules include:
219 # Establishes the markup predence. Available rules include:
220 #
220 #
221 # == Textile Rules
221 # == Textile Rules
222 #
222 #
223 # The following textile rules can be set individually. Or add the complete
223 # The following textile rules can be set individually. Or add the complete
224 # set of rules with the single :textile rule, which supplies the rule set in
224 # set of rules with the single :textile rule, which supplies the rule set in
225 # the following precedence:
225 # the following precedence:
226 #
226 #
227 # refs_textile:: Textile references (i.e. [hobix]http://hobix.com/)
227 # refs_textile:: Textile references (i.e. [hobix]http://hobix.com/)
228 # block_textile_table:: Textile table block structures
228 # block_textile_table:: Textile table block structures
229 # block_textile_lists:: Textile list structures
229 # block_textile_lists:: Textile list structures
230 # block_textile_prefix:: Textile blocks with prefixes (i.e. bq., h2., etc.)
230 # block_textile_prefix:: Textile blocks with prefixes (i.e. bq., h2., etc.)
231 # inline_textile_image:: Textile inline images
231 # inline_textile_image:: Textile inline images
232 # inline_textile_link:: Textile inline links
232 # inline_textile_link:: Textile inline links
233 # inline_textile_span:: Textile inline spans
233 # inline_textile_span:: Textile inline spans
234 # glyphs_textile:: Textile entities (such as em-dashes and smart quotes)
234 # glyphs_textile:: Textile entities (such as em-dashes and smart quotes)
235 #
235 #
236 # == Markdown
236 # == Markdown
237 #
237 #
238 # refs_markdown:: Markdown references (for example: [hobix]: http://hobix.com/)
238 # refs_markdown:: Markdown references (for example: [hobix]: http://hobix.com/)
239 # block_markdown_setext:: Markdown setext headers
239 # block_markdown_setext:: Markdown setext headers
240 # block_markdown_atx:: Markdown atx headers
240 # block_markdown_atx:: Markdown atx headers
241 # block_markdown_rule:: Markdown horizontal rules
241 # block_markdown_rule:: Markdown horizontal rules
242 # block_markdown_bq:: Markdown blockquotes
242 # block_markdown_bq:: Markdown blockquotes
243 # block_markdown_lists:: Markdown lists
243 # block_markdown_lists:: Markdown lists
244 # inline_markdown_link:: Markdown links
244 # inline_markdown_link:: Markdown links
245 attr_accessor :rules
245 attr_accessor :rules
246
246
247 # Returns a new RedCloth object, based on _string_ and
247 # Returns a new RedCloth object, based on _string_ and
248 # enforcing all the included _restrictions_.
248 # enforcing all the included _restrictions_.
249 #
249 #
250 # r = RedCloth.new( "h1. A <b>bold</b> man", [:filter_html] )
250 # r = RedCloth.new( "h1. A <b>bold</b> man", [:filter_html] )
251 # r.to_html
251 # r.to_html
252 # #=>"<h1>A &lt;b&gt;bold&lt;/b&gt; man</h1>"
252 # #=>"<h1>A &lt;b&gt;bold&lt;/b&gt; man</h1>"
253 #
253 #
254 def initialize( string, restrictions = [] )
254 def initialize( string, restrictions = [] )
255 restrictions.each { |r| method( "#{ r }=" ).call( true ) }
255 restrictions.each { |r| method( "#{ r }=" ).call( true ) }
256 super( string )
256 super( string )
257 end
257 end
258
258
259 #
259 #
260 # Generates HTML from the Textile contents.
260 # Generates HTML from the Textile contents.
261 #
261 #
262 # r = RedCloth.new( "And then? She *fell*!" )
262 # r = RedCloth.new( "And then? She *fell*!" )
263 # r.to_html( true )
263 # r.to_html( true )
264 # #=>"And then? She <strong>fell</strong>!"
264 # #=>"And then? She <strong>fell</strong>!"
265 #
265 #
266 def to_html( *rules )
266 def to_html( *rules )
267 rules = DEFAULT_RULES if rules.empty?
267 rules = DEFAULT_RULES if rules.empty?
268 # make our working copy
268 # make our working copy
269 text = self.dup
269 text = self.dup
270
270
271 @urlrefs = {}
271 @urlrefs = {}
272 @shelf = []
272 @shelf = []
273 textile_rules = [:refs_textile, :block_textile_table, :block_textile_lists,
273 textile_rules = [:refs_textile, :block_textile_table, :block_textile_lists,
274 :block_textile_prefix, :inline_textile_image, :inline_textile_link,
274 :block_textile_prefix, :inline_textile_image, :inline_textile_link,
275 :inline_textile_code, :inline_textile_span, :glyphs_textile]
275 :inline_textile_code, :inline_textile_span, :glyphs_textile]
276 markdown_rules = [:refs_markdown, :block_markdown_setext, :block_markdown_atx, :block_markdown_rule,
276 markdown_rules = [:refs_markdown, :block_markdown_setext, :block_markdown_atx, :block_markdown_rule,
277 :block_markdown_bq, :block_markdown_lists,
277 :block_markdown_bq, :block_markdown_lists,
278 :inline_markdown_reflink, :inline_markdown_link]
278 :inline_markdown_reflink, :inline_markdown_link]
279 @rules = rules.collect do |rule|
279 @rules = rules.collect do |rule|
280 case rule
280 case rule
281 when :markdown
281 when :markdown
282 markdown_rules
282 markdown_rules
283 when :textile
283 when :textile
284 textile_rules
284 textile_rules
285 else
285 else
286 rule
286 rule
287 end
287 end
288 end.flatten
288 end.flatten
289
289
290 # standard clean up
290 # standard clean up
291 incoming_entities text
291 incoming_entities text
292 clean_white_space text
292 clean_white_space text
293
293
294 # start processor
294 # start processor
295 @pre_list = []
295 @pre_list = []
296 rip_offtags text
296 rip_offtags text
297 no_textile text
297 no_textile text
298 escape_html_tags text
298 escape_html_tags text
299 hard_break text
299 hard_break text
300 unless @lite_mode
300 unless @lite_mode
301 refs text
301 refs text
302 # need to do this before text is split by #blocks
302 # need to do this before text is split by #blocks
303 block_textile_quotes text
303 block_textile_quotes text
304 blocks text
304 blocks text
305 end
305 end
306 inline text
306 inline text
307 smooth_offtags text
307 smooth_offtags text
308
308
309 retrieve text
309 retrieve text
310
310
311 text.gsub!( /<\/?notextile>/, '' )
311 text.gsub!( /<\/?notextile>/, '' )
312 text.gsub!( /x%x%/, '&#38;' )
312 text.gsub!( /x%x%/, '&#38;' )
313 clean_html text if filter_html
313 clean_html text if filter_html
314 text.strip!
314 text.strip!
315 text
315 text
316
316
317 end
317 end
318
318
319 #######
319 #######
320 private
320 private
321 #######
321 #######
322 #
322 #
323 # Mapping of 8-bit ASCII codes to HTML numerical entity equivalents.
323 # Mapping of 8-bit ASCII codes to HTML numerical entity equivalents.
324 # (from PyTextile)
324 # (from PyTextile)
325 #
325 #
326 TEXTILE_TAGS =
326 TEXTILE_TAGS =
327
327
328 [[128, 8364], [129, 0], [130, 8218], [131, 402], [132, 8222], [133, 8230],
328 [[128, 8364], [129, 0], [130, 8218], [131, 402], [132, 8222], [133, 8230],
329 [134, 8224], [135, 8225], [136, 710], [137, 8240], [138, 352], [139, 8249],
329 [134, 8224], [135, 8225], [136, 710], [137, 8240], [138, 352], [139, 8249],
330 [140, 338], [141, 0], [142, 0], [143, 0], [144, 0], [145, 8216], [146, 8217],
330 [140, 338], [141, 0], [142, 0], [143, 0], [144, 0], [145, 8216], [146, 8217],
331 [147, 8220], [148, 8221], [149, 8226], [150, 8211], [151, 8212], [152, 732],
331 [147, 8220], [148, 8221], [149, 8226], [150, 8211], [151, 8212], [152, 732],
332 [153, 8482], [154, 353], [155, 8250], [156, 339], [157, 0], [158, 0], [159, 376]].
332 [153, 8482], [154, 353], [155, 8250], [156, 339], [157, 0], [158, 0], [159, 376]].
333
333
334 collect! do |a, b|
334 collect! do |a, b|
335 [a.chr, ( b.zero? and "" or "&#{ b };" )]
335 [a.chr, ( b.zero? and "" or "&#{ b };" )]
336 end
336 end
337
337
338 #
338 #
339 # Regular expressions to convert to HTML.
339 # Regular expressions to convert to HTML.
340 #
340 #
341 A_HLGN = /(?:(?:<>|<|>|\=|[()]+)+)/
341 A_HLGN = /(?:(?:<>|<|>|\=|[()]+)+)/
342 A_VLGN = /[\-^~]/
342 A_VLGN = /[\-^~]/
343 C_CLAS = '(?:\([^)]+\))'
343 C_CLAS = '(?:\([^)]+\))'
344 C_LNGE = '(?:\[[^\[\]]+\])'
344 C_LNGE = '(?:\[[^\[\]]+\])'
345 C_STYL = '(?:\{[^}]+\})'
345 C_STYL = '(?:\{[^}]+\})'
346 S_CSPN = '(?:\\\\\d+)'
346 S_CSPN = '(?:\\\\\d+)'
347 S_RSPN = '(?:/\d+)'
347 S_RSPN = '(?:/\d+)'
348 A = "(?:#{A_HLGN}?#{A_VLGN}?|#{A_VLGN}?#{A_HLGN}?)"
348 A = "(?:#{A_HLGN}?#{A_VLGN}?|#{A_VLGN}?#{A_HLGN}?)"
349 S = "(?:#{S_CSPN}?#{S_RSPN}|#{S_RSPN}?#{S_CSPN}?)"
349 S = "(?:#{S_CSPN}?#{S_RSPN}|#{S_RSPN}?#{S_CSPN}?)"
350 C = "(?:#{C_CLAS}?#{C_STYL}?#{C_LNGE}?|#{C_STYL}?#{C_LNGE}?#{C_CLAS}?|#{C_LNGE}?#{C_STYL}?#{C_CLAS}?)"
350 C = "(?:#{C_CLAS}?#{C_STYL}?#{C_LNGE}?|#{C_STYL}?#{C_LNGE}?#{C_CLAS}?|#{C_LNGE}?#{C_STYL}?#{C_CLAS}?)"
351 # PUNCT = Regexp::quote( '!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~' )
351 # PUNCT = Regexp::quote( '!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~' )
352 PUNCT = Regexp::quote( '!"#$%&\'*+,-./:;=?@\\^_`|~' )
352 PUNCT = Regexp::quote( '!"#$%&\'*+,-./:;=?@\\^_`|~' )
353 PUNCT_NOQ = Regexp::quote( '!"#$&\',./:;=?@\\`|' )
353 PUNCT_NOQ = Regexp::quote( '!"#$&\',./:;=?@\\`|' )
354 PUNCT_Q = Regexp::quote( '*-_+^~%' )
354 PUNCT_Q = Regexp::quote( '*-_+^~%' )
355 HYPERLINK = '(\S+?)([^\w\s/;=\?]*?)(?=\s|<|$)'
355 HYPERLINK = '(\S+?)([^\w\s/;=\?]*?)(?=\s|<|$)'
356
356
357 # Text markup tags, don't conflict with block tags
357 # Text markup tags, don't conflict with block tags
358 SIMPLE_HTML_TAGS = [
358 SIMPLE_HTML_TAGS = [
359 'tt', 'b', 'i', 'big', 'small', 'em', 'strong', 'dfn', 'code',
359 'tt', 'b', 'i', 'big', 'small', 'em', 'strong', 'dfn', 'code',
360 'samp', 'kbd', 'var', 'cite', 'abbr', 'acronym', 'a', 'img', 'br',
360 'samp', 'kbd', 'var', 'cite', 'abbr', 'acronym', 'a', 'img', 'br',
361 'br', 'map', 'q', 'sub', 'sup', 'span', 'bdo'
361 'br', 'map', 'q', 'sub', 'sup', 'span', 'bdo'
362 ]
362 ]
363
363
364 QTAGS = [
364 QTAGS = [
365 ['**', 'b', :limit],
365 ['**', 'b', :limit],
366 ['*', 'strong', :limit],
366 ['*', 'strong', :limit],
367 ['??', 'cite', :limit],
367 ['??', 'cite', :limit],
368 ['-', 'del', :limit],
368 ['-', 'del', :limit],
369 ['__', 'i', :limit],
369 ['__', 'i', :limit],
370 ['_', 'em', :limit],
370 ['_', 'em', :limit],
371 ['%', 'span', :limit],
371 ['%', 'span', :limit],
372 ['+', 'ins', :limit],
372 ['+', 'ins', :limit],
373 ['^', 'sup', :limit],
373 ['^', 'sup', :limit],
374 ['~', 'sub', :limit]
374 ['~', 'sub', :limit]
375 ]
375 ]
376 QTAGS.collect! do |rc, ht, rtype|
376 QTAGS.collect! do |rc, ht, rtype|
377 rcq = Regexp::quote rc
377 rcq = Regexp::quote rc
378 re =
378 re =
379 case rtype
379 case rtype
380 when :limit
380 when :limit
381 /(^|[>\s\(])
381 /(^|[>\s\(])
382 (#{rcq})
382 (#{rcq})
383 (#{C})
383 (#{C})
384 (?::(\S+?))?
384 (?::(\S+?))?
385 (\w|[^\s\-].*?[^\s\-])
385 (\w|[^\s\-].*?[^\s\-])
386 #{rcq}
386 #{rcq}
387 (?=[[:punct:]]|\s|\)|$)/x
387 (?=[[:punct:]]|\s|\)|$)/x
388 else
388 else
389 /(#{rcq})
389 /(#{rcq})
390 (#{C})
390 (#{C})
391 (?::(\S+))?
391 (?::(\S+))?
392 (\w|[^\s\-].*?[^\s\-])
392 (\w|[^\s\-].*?[^\s\-])
393 #{rcq}/xm
393 #{rcq}/xm
394 end
394 end
395 [rc, ht, re, rtype]
395 [rc, ht, re, rtype]
396 end
396 end
397
397
398 # Elements to handle
398 # Elements to handle
399 GLYPHS = [
399 GLYPHS = [
400 # [ /([^\s\[{(>])?\'([dmst]\b|ll\b|ve\b|\s|:|$)/, '\1&#8217;\2' ], # single closing
400 # [ /([^\s\[{(>])?\'([dmst]\b|ll\b|ve\b|\s|:|$)/, '\1&#8217;\2' ], # single closing
401 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)\'/, '\1&#8217;' ], # single closing
401 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)\'/, '\1&#8217;' ], # single closing
402 # [ /\'(?=[#{PUNCT_Q}]*(s\b|[\s#{PUNCT_NOQ}]))/, '&#8217;' ], # single closing
402 # [ /\'(?=[#{PUNCT_Q}]*(s\b|[\s#{PUNCT_NOQ}]))/, '&#8217;' ], # single closing
403 # [ /\'/, '&#8216;' ], # single opening
403 # [ /\'/, '&#8216;' ], # single opening
404 # [ /</, '&lt;' ], # less-than
404 # [ /</, '&lt;' ], # less-than
405 # [ />/, '&gt;' ], # greater-than
405 # [ />/, '&gt;' ], # greater-than
406 # [ /([^\s\[{(])?"(\s|:|$)/, '\1&#8221;\2' ], # double closing
406 # [ /([^\s\[{(])?"(\s|:|$)/, '\1&#8221;\2' ], # double closing
407 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)"/, '\1&#8221;' ], # double closing
407 # [ /([^\s\[{(>#{PUNCT_Q}][#{PUNCT_Q}]*)"/, '\1&#8221;' ], # double closing
408 # [ /"(?=[#{PUNCT_Q}]*[\s#{PUNCT_NOQ}])/, '&#8221;' ], # double closing
408 # [ /"(?=[#{PUNCT_Q}]*[\s#{PUNCT_NOQ}])/, '&#8221;' ], # double closing
409 # [ /"/, '&#8220;' ], # double opening
409 # [ /"/, '&#8220;' ], # double opening
410 # [ /\b( )?\.{3}/, '\1&#8230;' ], # ellipsis
410 # [ /\b( )?\.{3}/, '\1&#8230;' ], # ellipsis
411 # [ /\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/, '<acronym title="\2">\1</acronym>' ], # 3+ uppercase acronym
411 # [ /\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/, '<acronym title="\2">\1</acronym>' ], # 3+ uppercase acronym
412 # [ /(^|[^"][>\s])([A-Z][A-Z0-9 ]+[A-Z0-9])([^<A-Za-z0-9]|$)/, '\1<span class="caps">\2</span>\3', :no_span_caps ], # 3+ uppercase caps
412 # [ /(^|[^"][>\s])([A-Z][A-Z0-9 ]+[A-Z0-9])([^<A-Za-z0-9]|$)/, '\1<span class="caps">\2</span>\3', :no_span_caps ], # 3+ uppercase caps
413 # [ /(\.\s)?\s?--\s?/, '\1&#8212;' ], # em dash
413 # [ /(\.\s)?\s?--\s?/, '\1&#8212;' ], # em dash
414 # [ /\s->\s/, ' &rarr; ' ], # right arrow
414 # [ /\s->\s/, ' &rarr; ' ], # right arrow
415 # [ /\s-\s/, ' &#8211; ' ], # en dash
415 # [ /\s-\s/, ' &#8211; ' ], # en dash
416 # [ /(\d+) ?x ?(\d+)/, '\1&#215;\2' ], # dimension sign
416 # [ /(\d+) ?x ?(\d+)/, '\1&#215;\2' ], # dimension sign
417 # [ /\b ?[(\[]TM[\])]/i, '&#8482;' ], # trademark
417 # [ /\b ?[(\[]TM[\])]/i, '&#8482;' ], # trademark
418 # [ /\b ?[(\[]R[\])]/i, '&#174;' ], # registered
418 # [ /\b ?[(\[]R[\])]/i, '&#174;' ], # registered
419 # [ /\b ?[(\[]C[\])]/i, '&#169;' ] # copyright
419 # [ /\b ?[(\[]C[\])]/i, '&#169;' ] # copyright
420 ]
420 ]
421
421
422 H_ALGN_VALS = {
422 H_ALGN_VALS = {
423 '<' => 'left',
423 '<' => 'left',
424 '=' => 'center',
424 '=' => 'center',
425 '>' => 'right',
425 '>' => 'right',
426 '<>' => 'justify'
426 '<>' => 'justify'
427 }
427 }
428
428
429 V_ALGN_VALS = {
429 V_ALGN_VALS = {
430 '^' => 'top',
430 '^' => 'top',
431 '-' => 'middle',
431 '-' => 'middle',
432 '~' => 'bottom'
432 '~' => 'bottom'
433 }
433 }
434
434
435 #
435 #
436 # Flexible HTML escaping
436 # Flexible HTML escaping
437 #
437 #
438 def htmlesc( str, mode=:Quotes )
438 def htmlesc( str, mode=:Quotes )
439 if str
439 if str
440 str.gsub!( '&', '&amp;' )
440 str.gsub!( '&', '&amp;' )
441 str.gsub!( '"', '&quot;' ) if mode != :NoQuotes
441 str.gsub!( '"', '&quot;' ) if mode != :NoQuotes
442 str.gsub!( "'", '&#039;' ) if mode == :Quotes
442 str.gsub!( "'", '&#039;' ) if mode == :Quotes
443 str.gsub!( '<', '&lt;')
443 str.gsub!( '<', '&lt;')
444 str.gsub!( '>', '&gt;')
444 str.gsub!( '>', '&gt;')
445 end
445 end
446 str
446 str
447 end
447 end
448
448
449 # Search and replace for Textile glyphs (quotes, dashes, other symbols)
449 # Search and replace for Textile glyphs (quotes, dashes, other symbols)
450 def pgl( text )
450 def pgl( text )
451 #GLYPHS.each do |re, resub, tog|
451 #GLYPHS.each do |re, resub, tog|
452 # next if tog and method( tog ).call
452 # next if tog and method( tog ).call
453 # text.gsub! re, resub
453 # text.gsub! re, resub
454 #end
454 #end
455 text.gsub!(/\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/) do |m|
455 text.gsub!(/\b([A-Z][A-Z0-9]{2,})\b(?:[(]([^)]*)[)])/) do |m|
456 "<acronym title=\"#{htmlesc $2}\">#{$1}</acronym>"
456 "<acronym title=\"#{htmlesc $2}\">#{$1}</acronym>"
457 end
457 end
458 end
458 end
459
459
460 # Parses Textile attribute lists and builds an HTML attribute string
460 # Parses Textile attribute lists and builds an HTML attribute string
461 def pba( text_in, element = "" )
461 def pba( text_in, element = "" )
462
462
463 return '' unless text_in
463 return '' unless text_in
464
464
465 style = []
465 style = []
466 text = text_in.dup
466 text = text_in.dup
467 if element == 'td'
467 if element == 'td'
468 colspan = $1 if text =~ /\\(\d+)/
468 colspan = $1 if text =~ /\\(\d+)/
469 rowspan = $1 if text =~ /\/(\d+)/
469 rowspan = $1 if text =~ /\/(\d+)/
470 style << "vertical-align:#{ v_align( $& ) };" if text =~ A_VLGN
470 style << "vertical-align:#{ v_align( $& ) };" if text =~ A_VLGN
471 end
471 end
472
472
473 style << "#{ htmlesc $1 };" if text.sub!( /\{([^}]*)\}/, '' ) && !filter_styles
473 style << "#{ htmlesc $1 };" if text.sub!( /\{([^}]*)\}/, '' ) && !filter_styles
474
474
475 lang = $1 if
475 lang = $1 if
476 text.sub!( /\[([^)]+?)\]/, '' )
476 text.sub!( /\[([^)]+?)\]/, '' )
477
477
478 cls = $1 if
478 cls = $1 if
479 text.sub!( /\(([^()]+?)\)/, '' )
479 text.sub!( /\(([^()]+?)\)/, '' )
480
480
481 style << "padding-left:#{ $1.length }em;" if
481 style << "padding-left:#{ $1.length }em;" if
482 text.sub!( /([(]+)/, '' )
482 text.sub!( /([(]+)/, '' )
483
483
484 style << "padding-right:#{ $1.length }em;" if text.sub!( /([)]+)/, '' )
484 style << "padding-right:#{ $1.length }em;" if text.sub!( /([)]+)/, '' )
485
485
486 style << "text-align:#{ h_align( $& ) };" if text =~ A_HLGN
486 style << "text-align:#{ h_align( $& ) };" if text =~ A_HLGN
487
487
488 cls, id = $1, $2 if cls =~ /^(.*?)#(.*)$/
488 cls, id = $1, $2 if cls =~ /^(.*?)#(.*)$/
489
489
490 atts = ''
490 atts = ''
491 atts << " style=\"#{ style.join }\"" unless style.empty?
491 atts << " style=\"#{ style.join }\"" unless style.empty?
492 atts << " class=\"#{ cls }\"" unless cls.to_s.empty?
492 atts << " class=\"#{ cls }\"" unless cls.to_s.empty?
493 atts << " lang=\"#{ lang }\"" if lang
493 atts << " lang=\"#{ lang }\"" if lang
494 atts << " id=\"#{ id }\"" if id
494 atts << " id=\"#{ id }\"" if id
495 atts << " colspan=\"#{ colspan }\"" if colspan
495 atts << " colspan=\"#{ colspan }\"" if colspan
496 atts << " rowspan=\"#{ rowspan }\"" if rowspan
496 atts << " rowspan=\"#{ rowspan }\"" if rowspan
497
497
498 atts
498 atts
499 end
499 end
500
500
501 TABLE_RE = /^(?:table(_?#{S}#{A}#{C})\. ?\n)?^(#{A}#{C}\.? ?\|.*?\|)(\n\n|\Z)/m
501 TABLE_RE = /^(?:table(_?#{S}#{A}#{C})\. ?\n)?^(#{A}#{C}\.? ?\|.*?\|)(\n\n|\Z)/m
502
502
503 # Parses a Textile table block, building HTML from the result.
503 # Parses a Textile table block, building HTML from the result.
504 def block_textile_table( text )
504 def block_textile_table( text )
505 text.gsub!( TABLE_RE ) do |matches|
505 text.gsub!( TABLE_RE ) do |matches|
506
506
507 tatts, fullrow = $~[1..2]
507 tatts, fullrow = $~[1..2]
508 tatts = pba( tatts, 'table' )
508 tatts = pba( tatts, 'table' )
509 tatts = shelve( tatts ) if tatts
509 tatts = shelve( tatts ) if tatts
510 rows = []
510 rows = []
511
511
512 fullrow.each_line do |row|
512 fullrow.each_line do |row|
513 ratts, row = pba( $1, 'tr' ), $2 if row =~ /^(#{A}#{C}\. )(.*)/m
513 ratts, row = pba( $1, 'tr' ), $2 if row =~ /^(#{A}#{C}\. )(.*)/m
514 cells = []
514 cells = []
515 row.split( /(\|)(?![^\[\|]*\]\])/ )[1..-2].each do |cell|
515 row.split( /(\|)(?![^\[\|]*\]\])/ )[1..-2].each do |cell|
516 next if cell == '|'
516 next if cell == '|'
517 ctyp = 'd'
517 ctyp = 'd'
518 ctyp = 'h' if cell =~ /^_/
518 ctyp = 'h' if cell =~ /^_/
519
519
520 catts = ''
520 catts = ''
521 catts, cell = pba( $1, 'td' ), $2 if cell =~ /^(_?#{S}#{A}#{C}\. ?)(.*)/
521 catts, cell = pba( $1, 'td' ), $2 if cell =~ /^(_?#{S}#{A}#{C}\. ?)(.*)/
522
522
523 catts = shelve( catts ) if catts
523 catts = shelve( catts ) if catts
524 cells << "\t\t\t<t#{ ctyp }#{ catts }>#{ cell }</t#{ ctyp }>"
524 cells << "\t\t\t<t#{ ctyp }#{ catts }>#{ cell }</t#{ ctyp }>"
525 end
525 end
526 ratts = shelve( ratts ) if ratts
526 ratts = shelve( ratts ) if ratts
527 rows << "\t\t<tr#{ ratts }>\n#{ cells.join( "\n" ) }\n\t\t</tr>"
527 rows << "\t\t<tr#{ ratts }>\n#{ cells.join( "\n" ) }\n\t\t</tr>"
528 end
528 end
529 "\t<table#{ tatts }>\n#{ rows.join( "\n" ) }\n\t</table>\n\n"
529 "\t<table#{ tatts }>\n#{ rows.join( "\n" ) }\n\t</table>\n\n"
530 end
530 end
531 end
531 end
532
532
533 LISTS_RE = /^([#*]+?#{C} .*?)$(?![^#*])/m
533 LISTS_RE = /^([#*]+?#{C} .*?)$(?![^#*])/m
534 LISTS_CONTENT_RE = /^([#*]+)(#{A}#{C}) (.*)$/m
534 LISTS_CONTENT_RE = /^([#*]+)(#{A}#{C}) (.*)$/m
535
535
536 # Parses Textile lists and generates HTML
536 # Parses Textile lists and generates HTML
537 def block_textile_lists( text )
537 def block_textile_lists( text )
538 text.gsub!( LISTS_RE ) do |match|
538 text.gsub!( LISTS_RE ) do |match|
539 lines = match.split( /\n/ )
539 lines = match.split( /\n/ )
540 last_line = -1
540 last_line = -1
541 depth = []
541 depth = []
542 lines.each_with_index do |line, line_id|
542 lines.each_with_index do |line, line_id|
543 if line =~ LISTS_CONTENT_RE
543 if line =~ LISTS_CONTENT_RE
544 tl,atts,content = $~[1..3]
544 tl,atts,content = $~[1..3]
545 if depth.last
545 if depth.last
546 if depth.last.length > tl.length
546 if depth.last.length > tl.length
547 (depth.length - 1).downto(0) do |i|
547 (depth.length - 1).downto(0) do |i|
548 break if depth[i].length == tl.length
548 break if depth[i].length == tl.length
549 lines[line_id - 1] << "</li>\n\t</#{ lT( depth[i] ) }l>\n\t"
549 lines[line_id - 1] << "</li>\n\t</#{ lT( depth[i] ) }l>\n\t"
550 depth.pop
550 depth.pop
551 end
551 end
552 end
552 end
553 if depth.last and depth.last.length == tl.length
553 if depth.last and depth.last.length == tl.length
554 lines[line_id - 1] << '</li>'
554 lines[line_id - 1] << '</li>'
555 end
555 end
556 end
556 end
557 unless depth.last == tl
557 unless depth.last == tl
558 depth << tl
558 depth << tl
559 atts = pba( atts )
559 atts = pba( atts )
560 atts = shelve( atts ) if atts
560 atts = shelve( atts ) if atts
561 lines[line_id] = "\t<#{ lT(tl) }l#{ atts }>\n\t<li>#{ content }"
561 lines[line_id] = "\t<#{ lT(tl) }l#{ atts }>\n\t<li>#{ content }"
562 else
562 else
563 lines[line_id] = "\t\t<li>#{ content }"
563 lines[line_id] = "\t\t<li>#{ content }"
564 end
564 end
565 last_line = line_id
565 last_line = line_id
566
566
567 else
567 else
568 last_line = line_id
568 last_line = line_id
569 end
569 end
570 if line_id - last_line > 1 or line_id == lines.length - 1
570 if line_id - last_line > 1 or line_id == lines.length - 1
571 depth.delete_if do |v|
571 depth.delete_if do |v|
572 lines[last_line] << "</li>\n\t</#{ lT( v ) }l>"
572 lines[last_line] << "</li>\n\t</#{ lT( v ) }l>"
573 end
573 end
574 end
574 end
575 end
575 end
576 lines.join( "\n" )
576 lines.join( "\n" )
577 end
577 end
578 end
578 end
579
579
580 QUOTES_RE = /(^>+([^\n]*?)\n?)+/m
580 QUOTES_RE = /(^>+([^\n]*?)\n?)+/m
581 QUOTES_CONTENT_RE = /^([> ]+)(.*)$/m
581 QUOTES_CONTENT_RE = /^([> ]+)(.*)$/m
582
582
583 def block_textile_quotes( text )
583 def block_textile_quotes( text )
584 text.gsub!( QUOTES_RE ) do |match|
584 text.gsub!( QUOTES_RE ) do |match|
585 lines = match.split( /\n/ )
585 lines = match.split( /\n/ )
586 quotes = ''
586 quotes = ''
587 indent = 0
587 indent = 0
588 lines.each do |line|
588 lines.each do |line|
589 line =~ QUOTES_CONTENT_RE
589 line =~ QUOTES_CONTENT_RE
590 bq,content = $1, $2
590 bq,content = $1, $2
591 l = bq.count('>')
591 l = bq.count('>')
592 if l != indent
592 if l != indent
593 quotes << ("\n\n" + (l>indent ? '<blockquote>' * (l-indent) : '</blockquote>' * (indent-l)) + "\n\n")
593 quotes << ("\n\n" + (l>indent ? '<blockquote>' * (l-indent) : '</blockquote>' * (indent-l)) + "\n\n")
594 indent = l
594 indent = l
595 end
595 end
596 quotes << (content + "\n")
596 quotes << (content + "\n")
597 end
597 end
598 quotes << ("\n" + '</blockquote>' * indent + "\n\n")
598 quotes << ("\n" + '</blockquote>' * indent + "\n\n")
599 quotes
599 quotes
600 end
600 end
601 end
601 end
602
602
603 CODE_RE = /(\W)
603 CODE_RE = /(\W)
604 @
604 @
605 (?:\|(\w+?)\|)?
605 (?:\|(\w+?)\|)?
606 (.+?)
606 (.+?)
607 @
607 @
608 (?=\W)/x
608 (?=\W)/x
609
609
610 def inline_textile_code( text )
610 def inline_textile_code( text )
611 text.gsub!( CODE_RE ) do |m|
611 text.gsub!( CODE_RE ) do |m|
612 before,lang,code,after = $~[1..4]
612 before,lang,code,after = $~[1..4]
613 lang = " lang=\"#{ lang }\"" if lang
613 lang = " lang=\"#{ lang }\"" if lang
614 rip_offtags( "#{ before }<code#{ lang }>#{ code }</code>#{ after }" )
614 rip_offtags( "#{ before }<code#{ lang }>#{ code }</code>#{ after }" )
615 end
615 end
616 end
616 end
617
617
618 def lT( text )
618 def lT( text )
619 text =~ /\#$/ ? 'o' : 'u'
619 text =~ /\#$/ ? 'o' : 'u'
620 end
620 end
621
621
622 def hard_break( text )
622 def hard_break( text )
623 text.gsub!( /(.)\n(?!\Z| *([#*=]+(\s|$)|[{|]))/, "\\1<br />" ) if hard_breaks
623 text.gsub!( /(.)\n(?!\Z| *([#*=]+(\s|$)|[{|]))/, "\\1<br />" ) if hard_breaks
624 end
624 end
625
625
626 BLOCKS_GROUP_RE = /\n{2,}(?! )/m
626 BLOCKS_GROUP_RE = /\n{2,}(?! )/m
627
627
628 def blocks( text, deep_code = false )
628 def blocks( text, deep_code = false )
629 text.replace( text.split( BLOCKS_GROUP_RE ).collect do |blk|
629 text.replace( text.split( BLOCKS_GROUP_RE ).collect do |blk|
630 plain = blk !~ /\A[#*> ]/
630 plain = blk !~ /\A[#*> ]/
631
631
632 # skip blocks that are complex HTML
632 # skip blocks that are complex HTML
633 if blk =~ /^<\/?(\w+).*>/ and not SIMPLE_HTML_TAGS.include? $1
633 if blk =~ /^<\/?(\w+).*>/ and not SIMPLE_HTML_TAGS.include? $1
634 blk
634 blk
635 else
635 else
636 # search for indentation levels
636 # search for indentation levels
637 blk.strip!
637 blk.strip!
638 if blk.empty?
638 if blk.empty?
639 blk
639 blk
640 else
640 else
641 code_blk = nil
641 code_blk = nil
642 blk.gsub!( /((?:\n(?:\n^ +[^\n]*)+)+)/m ) do |iblk|
642 blk.gsub!( /((?:\n(?:\n^ +[^\n]*)+)+)/m ) do |iblk|
643 flush_left iblk
643 flush_left iblk
644 blocks iblk, plain
644 blocks iblk, plain
645 iblk.gsub( /^(\S)/, "\t\\1" )
645 iblk.gsub( /^(\S)/, "\t\\1" )
646 if plain
646 if plain
647 code_blk = iblk; ""
647 code_blk = iblk; ""
648 else
648 else
649 iblk
649 iblk
650 end
650 end
651 end
651 end
652
652
653 block_applied = 0
653 block_applied = 0
654 @rules.each do |rule_name|
654 @rules.each do |rule_name|
655 block_applied += 1 if ( rule_name.to_s.match /^block_/ and method( rule_name ).call( blk ) )
655 block_applied += 1 if ( rule_name.to_s.match /^block_/ and method( rule_name ).call( blk ) )
656 end
656 end
657 if block_applied.zero?
657 if block_applied.zero?
658 if deep_code
658 if deep_code
659 blk = "\t<pre><code>#{ blk }</code></pre>"
659 blk = "\t<pre><code>#{ blk }</code></pre>"
660 else
660 else
661 blk = "\t<p>#{ blk }</p>"
661 blk = "\t<p>#{ blk }</p>"
662 end
662 end
663 end
663 end
664 # hard_break blk
664 # hard_break blk
665 blk + "\n#{ code_blk }"
665 blk + "\n#{ code_blk }"
666 end
666 end
667 end
667 end
668
668
669 end.join( "\n\n" ) )
669 end.join( "\n\n" ) )
670 end
670 end
671
671
672 def textile_bq( tag, atts, cite, content )
672 def textile_bq( tag, atts, cite, content )
673 cite, cite_title = check_refs( cite )
673 cite, cite_title = check_refs( cite )
674 cite = " cite=\"#{ cite }\"" if cite
674 cite = " cite=\"#{ cite }\"" if cite
675 atts = shelve( atts ) if atts
675 atts = shelve( atts ) if atts
676 "\t<blockquote#{ cite }>\n\t\t<p#{ atts }>#{ content }</p>\n\t</blockquote>"
676 "\t<blockquote#{ cite }>\n\t\t<p#{ atts }>#{ content }</p>\n\t</blockquote>"
677 end
677 end
678
678
679 def textile_p( tag, atts, cite, content )
679 def textile_p( tag, atts, cite, content )
680 atts = shelve( atts ) if atts
680 atts = shelve( atts ) if atts
681 "\t<#{ tag }#{ atts }>#{ content }</#{ tag }>"
681 "\t<#{ tag }#{ atts }>#{ content }</#{ tag }>"
682 end
682 end
683
683
684 alias textile_h1 textile_p
684 alias textile_h1 textile_p
685 alias textile_h2 textile_p
685 alias textile_h2 textile_p
686 alias textile_h3 textile_p
686 alias textile_h3 textile_p
687 alias textile_h4 textile_p
687 alias textile_h4 textile_p
688 alias textile_h5 textile_p
688 alias textile_h5 textile_p
689 alias textile_h6 textile_p
689 alias textile_h6 textile_p
690
690
691 def textile_fn_( tag, num, atts, cite, content )
691 def textile_fn_( tag, num, atts, cite, content )
692 atts << " id=\"fn#{ num }\" class=\"footnote\""
692 atts << " id=\"fn#{ num }\" class=\"footnote\""
693 content = "<sup>#{ num }</sup> #{ content }"
693 content = "<sup>#{ num }</sup> #{ content }"
694 atts = shelve( atts ) if atts
694 atts = shelve( atts ) if atts
695 "\t<p#{ atts }>#{ content }</p>"
695 "\t<p#{ atts }>#{ content }</p>"
696 end
696 end
697
697
698 BLOCK_RE = /^(([a-z]+)(\d*))(#{A}#{C})\.(?::(\S+))? (.*)$/m
698 BLOCK_RE = /^(([a-z]+)(\d*))(#{A}#{C})\.(?::(\S+))? (.*)$/m
699
699
700 def block_textile_prefix( text )
700 def block_textile_prefix( text )
701 if text =~ BLOCK_RE
701 if text =~ BLOCK_RE
702 tag,tagpre,num,atts,cite,content = $~[1..6]
702 tag,tagpre,num,atts,cite,content = $~[1..6]
703 atts = pba( atts )
703 atts = pba( atts )
704
704
705 # pass to prefix handler
705 # pass to prefix handler
706 if respond_to? "textile_#{ tag }", true
706 if respond_to? "textile_#{ tag }", true
707 text.gsub!( $&, method( "textile_#{ tag }" ).call( tag, atts, cite, content ) )
707 text.gsub!( $&, method( "textile_#{ tag }" ).call( tag, atts, cite, content ) )
708 elsif respond_to? "textile_#{ tagpre }_", true
708 elsif respond_to? "textile_#{ tagpre }_", true
709 text.gsub!( $&, method( "textile_#{ tagpre }_" ).call( tagpre, num, atts, cite, content ) )
709 text.gsub!( $&, method( "textile_#{ tagpre }_" ).call( tagpre, num, atts, cite, content ) )
710 end
710 end
711 end
711 end
712 end
712 end
713
713
714 SETEXT_RE = /\A(.+?)\n([=-])[=-]* *$/m
714 SETEXT_RE = /\A(.+?)\n([=-])[=-]* *$/m
715 def block_markdown_setext( text )
715 def block_markdown_setext( text )
716 if text =~ SETEXT_RE
716 if text =~ SETEXT_RE
717 tag = if $2 == "="; "h1"; else; "h2"; end
717 tag = if $2 == "="; "h1"; else; "h2"; end
718 blk, cont = "<#{ tag }>#{ $1 }</#{ tag }>", $'
718 blk, cont = "<#{ tag }>#{ $1 }</#{ tag }>", $'
719 blocks cont
719 blocks cont
720 text.replace( blk + cont )
720 text.replace( blk + cont )
721 end
721 end
722 end
722 end
723
723
724 ATX_RE = /\A(\#{1,6}) # $1 = string of #'s
724 ATX_RE = /\A(\#{1,6}) # $1 = string of #'s
725 [ ]*
725 [ ]*
726 (.+?) # $2 = Header text
726 (.+?) # $2 = Header text
727 [ ]*
727 [ ]*
728 \#* # optional closing #'s (not counted)
728 \#* # optional closing #'s (not counted)
729 $/x
729 $/x
730 def block_markdown_atx( text )
730 def block_markdown_atx( text )
731 if text =~ ATX_RE
731 if text =~ ATX_RE
732 tag = "h#{ $1.length }"
732 tag = "h#{ $1.length }"
733 blk, cont = "<#{ tag }>#{ $2 }</#{ tag }>\n\n", $'
733 blk, cont = "<#{ tag }>#{ $2 }</#{ tag }>\n\n", $'
734 blocks cont
734 blocks cont
735 text.replace( blk + cont )
735 text.replace( blk + cont )
736 end
736 end
737 end
737 end
738
738
739 MARKDOWN_BQ_RE = /\A(^ *> ?.+$(.+\n)*\n*)+/m
739 MARKDOWN_BQ_RE = /\A(^ *> ?.+$(.+\n)*\n*)+/m
740
740
741 def block_markdown_bq( text )
741 def block_markdown_bq( text )
742 text.gsub!( MARKDOWN_BQ_RE ) do |blk|
742 text.gsub!( MARKDOWN_BQ_RE ) do |blk|
743 blk.gsub!( /^ *> ?/, '' )
743 blk.gsub!( /^ *> ?/, '' )
744 flush_left blk
744 flush_left blk
745 blocks blk
745 blocks blk
746 blk.gsub!( /^(\S)/, "\t\\1" )
746 blk.gsub!( /^(\S)/, "\t\\1" )
747 "<blockquote>\n#{ blk }\n</blockquote>\n\n"
747 "<blockquote>\n#{ blk }\n</blockquote>\n\n"
748 end
748 end
749 end
749 end
750
750
751 MARKDOWN_RULE_RE = /^(#{
751 MARKDOWN_RULE_RE = /^(#{
752 ['*', '-', '_'].collect { |ch| ' ?(' + Regexp::quote( ch ) + ' ?){3,}' }.join( '|' )
752 ['*', '-', '_'].collect { |ch| ' ?(' + Regexp::quote( ch ) + ' ?){3,}' }.join( '|' )
753 })$/
753 })$/
754
754
755 def block_markdown_rule( text )
755 def block_markdown_rule( text )
756 text.gsub!( MARKDOWN_RULE_RE ) do |blk|
756 text.gsub!( MARKDOWN_RULE_RE ) do |blk|
757 "<hr />"
757 "<hr />"
758 end
758 end
759 end
759 end
760
760
761 # XXX TODO XXX
761 # XXX TODO XXX
762 def block_markdown_lists( text )
762 def block_markdown_lists( text )
763 end
763 end
764
764
765 def inline_textile_span( text )
765 def inline_textile_span( text )
766 QTAGS.each do |qtag_rc, ht, qtag_re, rtype|
766 QTAGS.each do |qtag_rc, ht, qtag_re, rtype|
767 text.gsub!( qtag_re ) do |m|
767 text.gsub!( qtag_re ) do |m|
768
768
769 case rtype
769 case rtype
770 when :limit
770 when :limit
771 sta,qtag,atts,cite,content = $~[1..5]
771 sta,qtag,atts,cite,content = $~[1..5]
772 else
772 else
773 qtag,atts,cite,content = $~[1..4]
773 qtag,atts,cite,content = $~[1..4]
774 sta = ''
774 sta = ''
775 end
775 end
776 atts = pba( atts )
776 atts = pba( atts )
777 atts << " cite=\"#{ cite }\"" if cite
777 atts << " cite=\"#{ cite }\"" if cite
778 atts = shelve( atts ) if atts
778 atts = shelve( atts ) if atts
779
779
780 "#{ sta }<#{ ht }#{ atts }>#{ content }</#{ ht }>"
780 "#{ sta }<#{ ht }#{ atts }>#{ content }</#{ ht }>"
781
781
782 end
782 end
783 end
783 end
784 end
784 end
785
785
786 LINK_RE = /
786 LINK_RE = /
787 ([\s\[{(]|[#{PUNCT}])? # $pre
787 ([\s\[{(]|[#{PUNCT}])? # $pre
788 " # start
788 " # start
789 (#{C}) # $atts
789 (#{C}) # $atts
790 ([^"\n]+?) # $text
790 ([^"\n]+?) # $text
791 \s?
791 \s?
792 (?:\(([^)]+?)\)(?="))? # $title
792 (?:\(([^)]+?)\)(?="))? # $title
793 ":
793 ":
794 ([\w\/]\S+?) # $url
794 ( # $url
795 (\/|https?:\/\/|s?ftps?:\/\/|www\.)
796 [\w\/]\S+?
797 )
795 (\/)? # $slash
798 (\/)? # $slash
796 ([^\w\=\/;\(\)]*?) # $post
799 ([^\w\=\/;\(\)]*?) # $post
797 (?=<|\s|$)
800 (?=<|\s|$)
798 /x
801 /x
799 #"
802 #"
800 def inline_textile_link( text )
803 def inline_textile_link( text )
801 text.gsub!( LINK_RE ) do |m|
804 text.gsub!( LINK_RE ) do |m|
802 pre,atts,text,title,url,slash,post = $~[1..7]
805 pre,atts,text,title,url,proto,slash,post = $~[1..8]
803
806
804 url, url_title = check_refs( url )
807 url, url_title = check_refs( url )
805 title ||= url_title
808 title ||= url_title
806
809
807 # Idea below : an URL with unbalanced parethesis and
810 # Idea below : an URL with unbalanced parethesis and
808 # ending by ')' is put into external parenthesis
811 # ending by ')' is put into external parenthesis
809 if ( url[-1]==?) and ((url.count("(") - url.count(")")) < 0 ) )
812 if ( url[-1]==?) and ((url.count("(") - url.count(")")) < 0 ) )
810 url=url[0..-2] # discard closing parenth from url
813 url=url[0..-2] # discard closing parenth from url
811 post = ")"+post # add closing parenth to post
814 post = ")"+post # add closing parenth to post
812 end
815 end
813 atts = pba( atts )
816 atts = pba( atts )
814 atts = " href=\"#{ url }#{ slash }\"#{ atts }"
817 atts = " href=\"#{ url }#{ slash }\"#{ atts }"
815 atts << " title=\"#{ htmlesc title }\"" if title
818 atts << " title=\"#{ htmlesc title }\"" if title
816 atts = shelve( atts ) if atts
819 atts = shelve( atts ) if atts
817
820
818 external = (url =~ /^https?:\/\//) ? ' class="external"' : ''
821 external = (url =~ /^https?:\/\//) ? ' class="external"' : ''
819
822
820 "#{ pre }<a#{ atts }#{ external }>#{ text }</a>#{ post }"
823 "#{ pre }<a#{ atts }#{ external }>#{ text }</a>#{ post }"
821 end
824 end
822 end
825 end
823
826
824 MARKDOWN_REFLINK_RE = /
827 MARKDOWN_REFLINK_RE = /
825 \[([^\[\]]+)\] # $text
828 \[([^\[\]]+)\] # $text
826 [ ]? # opt. space
829 [ ]? # opt. space
827 (?:\n[ ]*)? # one optional newline followed by spaces
830 (?:\n[ ]*)? # one optional newline followed by spaces
828 \[(.*?)\] # $id
831 \[(.*?)\] # $id
829 /x
832 /x
830
833
831 def inline_markdown_reflink( text )
834 def inline_markdown_reflink( text )
832 text.gsub!( MARKDOWN_REFLINK_RE ) do |m|
835 text.gsub!( MARKDOWN_REFLINK_RE ) do |m|
833 text, id = $~[1..2]
836 text, id = $~[1..2]
834
837
835 if id.empty?
838 if id.empty?
836 url, title = check_refs( text )
839 url, title = check_refs( text )
837 else
840 else
838 url, title = check_refs( id )
841 url, title = check_refs( id )
839 end
842 end
840
843
841 atts = " href=\"#{ url }\""
844 atts = " href=\"#{ url }\""
842 atts << " title=\"#{ title }\"" if title
845 atts << " title=\"#{ title }\"" if title
843 atts = shelve( atts )
846 atts = shelve( atts )
844
847
845 "<a#{ atts }>#{ text }</a>"
848 "<a#{ atts }>#{ text }</a>"
846 end
849 end
847 end
850 end
848
851
849 MARKDOWN_LINK_RE = /
852 MARKDOWN_LINK_RE = /
850 \[([^\[\]]+)\] # $text
853 \[([^\[\]]+)\] # $text
851 \( # open paren
854 \( # open paren
852 [ \t]* # opt space
855 [ \t]* # opt space
853 <?(.+?)>? # $href
856 <?(.+?)>? # $href
854 [ \t]* # opt space
857 [ \t]* # opt space
855 (?: # whole title
858 (?: # whole title
856 (['"]) # $quote
859 (['"]) # $quote
857 (.*?) # $title
860 (.*?) # $title
858 \3 # matching quote
861 \3 # matching quote
859 )? # title is optional
862 )? # title is optional
860 \)
863 \)
861 /x
864 /x
862
865
863 def inline_markdown_link( text )
866 def inline_markdown_link( text )
864 text.gsub!( MARKDOWN_LINK_RE ) do |m|
867 text.gsub!( MARKDOWN_LINK_RE ) do |m|
865 text, url, quote, title = $~[1..4]
868 text, url, quote, title = $~[1..4]
866
869
867 atts = " href=\"#{ url }\""
870 atts = " href=\"#{ url }\""
868 atts << " title=\"#{ title }\"" if title
871 atts << " title=\"#{ title }\"" if title
869 atts = shelve( atts )
872 atts = shelve( atts )
870
873
871 "<a#{ atts }>#{ text }</a>"
874 "<a#{ atts }>#{ text }</a>"
872 end
875 end
873 end
876 end
874
877
875 TEXTILE_REFS_RE = /(^ *)\[([^\[\n]+?)\](#{HYPERLINK})(?=\s|$)/
878 TEXTILE_REFS_RE = /(^ *)\[([^\[\n]+?)\](#{HYPERLINK})(?=\s|$)/
876 MARKDOWN_REFS_RE = /(^ *)\[([^\n]+?)\]:\s+<?(#{HYPERLINK})>?(?:\s+"((?:[^"]|\\")+)")?(?=\s|$)/m
879 MARKDOWN_REFS_RE = /(^ *)\[([^\n]+?)\]:\s+<?(#{HYPERLINK})>?(?:\s+"((?:[^"]|\\")+)")?(?=\s|$)/m
877
880
878 def refs( text )
881 def refs( text )
879 @rules.each do |rule_name|
882 @rules.each do |rule_name|
880 method( rule_name ).call( text ) if rule_name.to_s.match /^refs_/
883 method( rule_name ).call( text ) if rule_name.to_s.match /^refs_/
881 end
884 end
882 end
885 end
883
886
884 def refs_textile( text )
887 def refs_textile( text )
885 text.gsub!( TEXTILE_REFS_RE ) do |m|
888 text.gsub!( TEXTILE_REFS_RE ) do |m|
886 flag, url = $~[2..3]
889 flag, url = $~[2..3]
887 @urlrefs[flag.downcase] = [url, nil]
890 @urlrefs[flag.downcase] = [url, nil]
888 nil
891 nil
889 end
892 end
890 end
893 end
891
894
892 def refs_markdown( text )
895 def refs_markdown( text )
893 text.gsub!( MARKDOWN_REFS_RE ) do |m|
896 text.gsub!( MARKDOWN_REFS_RE ) do |m|
894 flag, url = $~[2..3]
897 flag, url = $~[2..3]
895 title = $~[6]
898 title = $~[6]
896 @urlrefs[flag.downcase] = [url, title]
899 @urlrefs[flag.downcase] = [url, title]
897 nil
900 nil
898 end
901 end
899 end
902 end
900
903
901 def check_refs( text )
904 def check_refs( text )
902 ret = @urlrefs[text.downcase] if text
905 ret = @urlrefs[text.downcase] if text
903 ret || [text, nil]
906 ret || [text, nil]
904 end
907 end
905
908
906 IMAGE_RE = /
909 IMAGE_RE = /
907 (<p>|.|^) # start of line?
910 (<p>|.|^) # start of line?
908 \! # opening
911 \! # opening
909 (\<|\=|\>)? # optional alignment atts
912 (\<|\=|\>)? # optional alignment atts
910 (#{C}) # optional style,class atts
913 (#{C}) # optional style,class atts
911 (?:\. )? # optional dot-space
914 (?:\. )? # optional dot-space
912 ([^\s(!]+?) # presume this is the src
915 ([^\s(!]+?) # presume this is the src
913 \s? # optional space
916 \s? # optional space
914 (?:\(((?:[^\(\)]|\([^\)]+\))+?)\))? # optional title
917 (?:\(((?:[^\(\)]|\([^\)]+\))+?)\))? # optional title
915 \! # closing
918 \! # closing
916 (?::#{ HYPERLINK })? # optional href
919 (?::#{ HYPERLINK })? # optional href
917 /x
920 /x
918
921
919 def inline_textile_image( text )
922 def inline_textile_image( text )
920 text.gsub!( IMAGE_RE ) do |m|
923 text.gsub!( IMAGE_RE ) do |m|
921 stln,algn,atts,url,title,href,href_a1,href_a2 = $~[1..8]
924 stln,algn,atts,url,title,href,href_a1,href_a2 = $~[1..8]
922 htmlesc title
925 htmlesc title
923 atts = pba( atts )
926 atts = pba( atts )
924 atts = " src=\"#{ url }\"#{ atts }"
927 atts = " src=\"#{ url }\"#{ atts }"
925 atts << " title=\"#{ title }\"" if title
928 atts << " title=\"#{ title }\"" if title
926 atts << " alt=\"#{ title }\""
929 atts << " alt=\"#{ title }\""
927 # size = @getimagesize($url);
930 # size = @getimagesize($url);
928 # if($size) $atts.= " $size[3]";
931 # if($size) $atts.= " $size[3]";
929
932
930 href, alt_title = check_refs( href ) if href
933 href, alt_title = check_refs( href ) if href
931 url, url_title = check_refs( url )
934 url, url_title = check_refs( url )
932
935
933 out = ''
936 out = ''
934 out << "<a#{ shelve( " href=\"#{ href }\"" ) }>" if href
937 out << "<a#{ shelve( " href=\"#{ href }\"" ) }>" if href
935 out << "<img#{ shelve( atts ) } />"
938 out << "<img#{ shelve( atts ) } />"
936 out << "</a>#{ href_a1 }#{ href_a2 }" if href
939 out << "</a>#{ href_a1 }#{ href_a2 }" if href
937
940
938 if algn
941 if algn
939 algn = h_align( algn )
942 algn = h_align( algn )
940 if stln == "<p>"
943 if stln == "<p>"
941 out = "<p style=\"float:#{ algn }\">#{ out }"
944 out = "<p style=\"float:#{ algn }\">#{ out }"
942 else
945 else
943 out = "#{ stln }<div style=\"float:#{ algn }\">#{ out }</div>"
946 out = "#{ stln }<div style=\"float:#{ algn }\">#{ out }</div>"
944 end
947 end
945 else
948 else
946 out = stln + out
949 out = stln + out
947 end
950 end
948
951
949 out
952 out
950 end
953 end
951 end
954 end
952
955
953 def shelve( val )
956 def shelve( val )
954 @shelf << val
957 @shelf << val
955 " :redsh##{ @shelf.length }:"
958 " :redsh##{ @shelf.length }:"
956 end
959 end
957
960
958 def retrieve( text )
961 def retrieve( text )
959 @shelf.each_with_index do |r, i|
962 @shelf.each_with_index do |r, i|
960 text.gsub!( " :redsh##{ i + 1 }:", r )
963 text.gsub!( " :redsh##{ i + 1 }:", r )
961 end
964 end
962 end
965 end
963
966
964 def incoming_entities( text )
967 def incoming_entities( text )
965 ## turn any incoming ampersands into a dummy character for now.
968 ## turn any incoming ampersands into a dummy character for now.
966 ## This uses a negative lookahead for alphanumerics followed by a semicolon,
969 ## This uses a negative lookahead for alphanumerics followed by a semicolon,
967 ## implying an incoming html entity, to be skipped
970 ## implying an incoming html entity, to be skipped
968
971
969 text.gsub!( /&(?![#a-z0-9]+;)/i, "x%x%" )
972 text.gsub!( /&(?![#a-z0-9]+;)/i, "x%x%" )
970 end
973 end
971
974
972 def no_textile( text )
975 def no_textile( text )
973 text.gsub!( /(^|\s)==([^=]+.*?)==(\s|$)?/,
976 text.gsub!( /(^|\s)==([^=]+.*?)==(\s|$)?/,
974 '\1<notextile>\2</notextile>\3' )
977 '\1<notextile>\2</notextile>\3' )
975 text.gsub!( /^ *==([^=]+.*?)==/m,
978 text.gsub!( /^ *==([^=]+.*?)==/m,
976 '\1<notextile>\2</notextile>\3' )
979 '\1<notextile>\2</notextile>\3' )
977 end
980 end
978
981
979 def clean_white_space( text )
982 def clean_white_space( text )
980 # normalize line breaks
983 # normalize line breaks
981 text.gsub!( /\r\n/, "\n" )
984 text.gsub!( /\r\n/, "\n" )
982 text.gsub!( /\r/, "\n" )
985 text.gsub!( /\r/, "\n" )
983 text.gsub!( /\t/, ' ' )
986 text.gsub!( /\t/, ' ' )
984 text.gsub!( /^ +$/, '' )
987 text.gsub!( /^ +$/, '' )
985 text.gsub!( /\n{3,}/, "\n\n" )
988 text.gsub!( /\n{3,}/, "\n\n" )
986 text.gsub!( /"$/, "\" " )
989 text.gsub!( /"$/, "\" " )
987
990
988 # if entire document is indented, flush
991 # if entire document is indented, flush
989 # to the left side
992 # to the left side
990 flush_left text
993 flush_left text
991 end
994 end
992
995
993 def flush_left( text )
996 def flush_left( text )
994 indt = 0
997 indt = 0
995 if text =~ /^ /
998 if text =~ /^ /
996 while text !~ /^ {#{indt}}\S/
999 while text !~ /^ {#{indt}}\S/
997 indt += 1
1000 indt += 1
998 end unless text.empty?
1001 end unless text.empty?
999 if indt.nonzero?
1002 if indt.nonzero?
1000 text.gsub!( /^ {#{indt}}/, '' )
1003 text.gsub!( /^ {#{indt}}/, '' )
1001 end
1004 end
1002 end
1005 end
1003 end
1006 end
1004
1007
1005 def footnote_ref( text )
1008 def footnote_ref( text )
1006 text.gsub!( /\b\[([0-9]+?)\](\s)?/,
1009 text.gsub!( /\b\[([0-9]+?)\](\s)?/,
1007 '<sup><a href="#fn\1">\1</a></sup>\2' )
1010 '<sup><a href="#fn\1">\1</a></sup>\2' )
1008 end
1011 end
1009
1012
1010 OFFTAGS = /(code|pre|kbd|notextile)/
1013 OFFTAGS = /(code|pre|kbd|notextile)/
1011 OFFTAG_MATCH = /(?:(<\/#{ OFFTAGS }>)|(<#{ OFFTAGS }[^>]*>))(.*?)(?=<\/?#{ OFFTAGS }|\Z)/mi
1014 OFFTAG_MATCH = /(?:(<\/#{ OFFTAGS }>)|(<#{ OFFTAGS }[^>]*>))(.*?)(?=<\/?#{ OFFTAGS }|\Z)/mi
1012 OFFTAG_OPEN = /<#{ OFFTAGS }/
1015 OFFTAG_OPEN = /<#{ OFFTAGS }/
1013 OFFTAG_CLOSE = /<\/?#{ OFFTAGS }/
1016 OFFTAG_CLOSE = /<\/?#{ OFFTAGS }/
1014 HASTAG_MATCH = /(<\/?\w[^\n]*?>)/m
1017 HASTAG_MATCH = /(<\/?\w[^\n]*?>)/m
1015 ALLTAG_MATCH = /(<\/?\w[^\n]*?>)|.*?(?=<\/?\w[^\n]*?>|$)/m
1018 ALLTAG_MATCH = /(<\/?\w[^\n]*?>)|.*?(?=<\/?\w[^\n]*?>|$)/m
1016
1019
1017 def glyphs_textile( text, level = 0 )
1020 def glyphs_textile( text, level = 0 )
1018 if text !~ HASTAG_MATCH
1021 if text !~ HASTAG_MATCH
1019 pgl text
1022 pgl text
1020 footnote_ref text
1023 footnote_ref text
1021 else
1024 else
1022 codepre = 0
1025 codepre = 0
1023 text.gsub!( ALLTAG_MATCH ) do |line|
1026 text.gsub!( ALLTAG_MATCH ) do |line|
1024 ## matches are off if we're between <code>, <pre> etc.
1027 ## matches are off if we're between <code>, <pre> etc.
1025 if $1
1028 if $1
1026 if line =~ OFFTAG_OPEN
1029 if line =~ OFFTAG_OPEN
1027 codepre += 1
1030 codepre += 1
1028 elsif line =~ OFFTAG_CLOSE
1031 elsif line =~ OFFTAG_CLOSE
1029 codepre -= 1
1032 codepre -= 1
1030 codepre = 0 if codepre < 0
1033 codepre = 0 if codepre < 0
1031 end
1034 end
1032 elsif codepre.zero?
1035 elsif codepre.zero?
1033 glyphs_textile( line, level + 1 )
1036 glyphs_textile( line, level + 1 )
1034 else
1037 else
1035 htmlesc( line, :NoQuotes )
1038 htmlesc( line, :NoQuotes )
1036 end
1039 end
1037 # p [level, codepre, line]
1040 # p [level, codepre, line]
1038
1041
1039 line
1042 line
1040 end
1043 end
1041 end
1044 end
1042 end
1045 end
1043
1046
1044 def rip_offtags( text )
1047 def rip_offtags( text )
1045 if text =~ /<.*>/
1048 if text =~ /<.*>/
1046 ## strip and encode <pre> content
1049 ## strip and encode <pre> content
1047 codepre, used_offtags = 0, {}
1050 codepre, used_offtags = 0, {}
1048 text.gsub!( OFFTAG_MATCH ) do |line|
1051 text.gsub!( OFFTAG_MATCH ) do |line|
1049 if $3
1052 if $3
1050 offtag, aftertag = $4, $5
1053 offtag, aftertag = $4, $5
1051 codepre += 1
1054 codepre += 1
1052 used_offtags[offtag] = true
1055 used_offtags[offtag] = true
1053 if codepre - used_offtags.length > 0
1056 if codepre - used_offtags.length > 0
1054 htmlesc( line, :NoQuotes )
1057 htmlesc( line, :NoQuotes )
1055 @pre_list.last << line
1058 @pre_list.last << line
1056 line = ""
1059 line = ""
1057 else
1060 else
1058 htmlesc( aftertag, :NoQuotes ) if aftertag
1061 htmlesc( aftertag, :NoQuotes ) if aftertag
1059 line = "<redpre##{ @pre_list.length }>"
1062 line = "<redpre##{ @pre_list.length }>"
1060 $3.match(/<#{ OFFTAGS }([^>]*)>/)
1063 $3.match(/<#{ OFFTAGS }([^>]*)>/)
1061 tag = $1
1064 tag = $1
1062 $2.to_s.match(/(class\=\S+)/i)
1065 $2.to_s.match(/(class\=\S+)/i)
1063 tag << " #{$1}" if $1
1066 tag << " #{$1}" if $1
1064 @pre_list << "<#{ tag }>#{ aftertag }"
1067 @pre_list << "<#{ tag }>#{ aftertag }"
1065 end
1068 end
1066 elsif $1 and codepre > 0
1069 elsif $1 and codepre > 0
1067 if codepre - used_offtags.length > 0
1070 if codepre - used_offtags.length > 0
1068 htmlesc( line, :NoQuotes )
1071 htmlesc( line, :NoQuotes )
1069 @pre_list.last << line
1072 @pre_list.last << line
1070 line = ""
1073 line = ""
1071 end
1074 end
1072 codepre -= 1 unless codepre.zero?
1075 codepre -= 1 unless codepre.zero?
1073 used_offtags = {} if codepre.zero?
1076 used_offtags = {} if codepre.zero?
1074 end
1077 end
1075 line
1078 line
1076 end
1079 end
1077 end
1080 end
1078 text
1081 text
1079 end
1082 end
1080
1083
1081 def smooth_offtags( text )
1084 def smooth_offtags( text )
1082 unless @pre_list.empty?
1085 unless @pre_list.empty?
1083 ## replace <pre> content
1086 ## replace <pre> content
1084 text.gsub!( /<redpre#(\d+)>/ ) { @pre_list[$1.to_i] }
1087 text.gsub!( /<redpre#(\d+)>/ ) { @pre_list[$1.to_i] }
1085 end
1088 end
1086 end
1089 end
1087
1090
1088 def inline( text )
1091 def inline( text )
1089 [/^inline_/, /^glyphs_/].each do |meth_re|
1092 [/^inline_/, /^glyphs_/].each do |meth_re|
1090 @rules.each do |rule_name|
1093 @rules.each do |rule_name|
1091 method( rule_name ).call( text ) if rule_name.to_s.match( meth_re )
1094 method( rule_name ).call( text ) if rule_name.to_s.match( meth_re )
1092 end
1095 end
1093 end
1096 end
1094 end
1097 end
1095
1098
1096 def h_align( text )
1099 def h_align( text )
1097 H_ALGN_VALS[text]
1100 H_ALGN_VALS[text]
1098 end
1101 end
1099
1102
1100 def v_align( text )
1103 def v_align( text )
1101 V_ALGN_VALS[text]
1104 V_ALGN_VALS[text]
1102 end
1105 end
1103
1106
1104 def textile_popup_help( name, windowW, windowH )
1107 def textile_popup_help( name, windowW, windowH )
1105 ' <a target="_blank" href="http://hobix.com/textile/#' + helpvar + '" onclick="window.open(this.href, \'popupwindow\', \'width=' + windowW + ',height=' + windowH + ',scrollbars,resizable\'); return false;">' + name + '</a><br />'
1108 ' <a target="_blank" href="http://hobix.com/textile/#' + helpvar + '" onclick="window.open(this.href, \'popupwindow\', \'width=' + windowW + ',height=' + windowH + ',scrollbars,resizable\'); return false;">' + name + '</a><br />'
1106 end
1109 end
1107
1110
1108 # HTML cleansing stuff
1111 # HTML cleansing stuff
1109 BASIC_TAGS = {
1112 BASIC_TAGS = {
1110 'a' => ['href', 'title'],
1113 'a' => ['href', 'title'],
1111 'img' => ['src', 'alt', 'title'],
1114 'img' => ['src', 'alt', 'title'],
1112 'br' => [],
1115 'br' => [],
1113 'i' => nil,
1116 'i' => nil,
1114 'u' => nil,
1117 'u' => nil,
1115 'b' => nil,
1118 'b' => nil,
1116 'pre' => nil,
1119 'pre' => nil,
1117 'kbd' => nil,
1120 'kbd' => nil,
1118 'code' => ['lang'],
1121 'code' => ['lang'],
1119 'cite' => nil,
1122 'cite' => nil,
1120 'strong' => nil,
1123 'strong' => nil,
1121 'em' => nil,
1124 'em' => nil,
1122 'ins' => nil,
1125 'ins' => nil,
1123 'sup' => nil,
1126 'sup' => nil,
1124 'sub' => nil,
1127 'sub' => nil,
1125 'del' => nil,
1128 'del' => nil,
1126 'table' => nil,
1129 'table' => nil,
1127 'tr' => nil,
1130 'tr' => nil,
1128 'td' => ['colspan', 'rowspan'],
1131 'td' => ['colspan', 'rowspan'],
1129 'th' => nil,
1132 'th' => nil,
1130 'ol' => nil,
1133 'ol' => nil,
1131 'ul' => nil,
1134 'ul' => nil,
1132 'li' => nil,
1135 'li' => nil,
1133 'p' => nil,
1136 'p' => nil,
1134 'h1' => nil,
1137 'h1' => nil,
1135 'h2' => nil,
1138 'h2' => nil,
1136 'h3' => nil,
1139 'h3' => nil,
1137 'h4' => nil,
1140 'h4' => nil,
1138 'h5' => nil,
1141 'h5' => nil,
1139 'h6' => nil,
1142 'h6' => nil,
1140 'blockquote' => ['cite']
1143 'blockquote' => ['cite']
1141 }
1144 }
1142
1145
1143 def clean_html( text, tags = BASIC_TAGS )
1146 def clean_html( text, tags = BASIC_TAGS )
1144 text.gsub!( /<!\[CDATA\[/, '' )
1147 text.gsub!( /<!\[CDATA\[/, '' )
1145 text.gsub!( /<(\/*)(\w+)([^>]*)>/ ) do
1148 text.gsub!( /<(\/*)(\w+)([^>]*)>/ ) do
1146 raw = $~
1149 raw = $~
1147 tag = raw[2].downcase
1150 tag = raw[2].downcase
1148 if tags.has_key? tag
1151 if tags.has_key? tag
1149 pcs = [tag]
1152 pcs = [tag]
1150 tags[tag].each do |prop|
1153 tags[tag].each do |prop|
1151 ['"', "'", ''].each do |q|
1154 ['"', "'", ''].each do |q|
1152 q2 = ( q != '' ? q : '\s' )
1155 q2 = ( q != '' ? q : '\s' )
1153 if raw[3] =~ /#{prop}\s*=\s*#{q}([^#{q2}]+)#{q}/i
1156 if raw[3] =~ /#{prop}\s*=\s*#{q}([^#{q2}]+)#{q}/i
1154 attrv = $1
1157 attrv = $1
1155 next if prop == 'src' and attrv =~ %r{^(?!http)\w+:}
1158 next if prop == 'src' and attrv =~ %r{^(?!http)\w+:}
1156 pcs << "#{prop}=\"#{$1.gsub('"', '\\"')}\""
1159 pcs << "#{prop}=\"#{$1.gsub('"', '\\"')}\""
1157 break
1160 break
1158 end
1161 end
1159 end
1162 end
1160 end if tags[tag]
1163 end if tags[tag]
1161 "<#{raw[1]}#{pcs.join " "}>"
1164 "<#{raw[1]}#{pcs.join " "}>"
1162 else
1165 else
1163 " "
1166 " "
1164 end
1167 end
1165 end
1168 end
1166 end
1169 end
1167
1170
1168 ALLOWED_TAGS = %w(redpre pre code notextile)
1171 ALLOWED_TAGS = %w(redpre pre code notextile)
1169
1172
1170 def escape_html_tags(text)
1173 def escape_html_tags(text)
1171 text.gsub!(%r{<(\/?([!\w]+)[^<>\n]*)(>?)}) {|m| ALLOWED_TAGS.include?($2) ? "<#{$1}#{$3}" : "&lt;#{$1}#{'&gt;' unless $3.blank?}" }
1174 text.gsub!(%r{<(\/?([!\w]+)[^<>\n]*)(>?)}) {|m| ALLOWED_TAGS.include?($2) ? "<#{$1}#{$3}" : "&lt;#{$1}#{'&gt;' unless $3.blank?}" }
1172 end
1175 end
1173 end
1176 end
1174
1177
General Comments 0
You need to be logged in to leave comments. Login now