diff --git a/Gemfile b/Gemfile index a47ffec3b..9a77f1c58 100644 --- a/Gemfile +++ b/Gemfile @@ -62,7 +62,7 @@ gem 'rails-i18n' # parsing gem 'nokogiri' -gem 'redcarpet', :git => 'git://github.com/tanoku/redcarpet' +gem 'redcarpet', "2.0.0b5" gem 'roxml', :git => 'git://github.com/Empact/roxml.git', :ref => '7ea9a9ffd2338aaef5b0' # queue diff --git a/Gemfile.lock b/Gemfile.lock index 546eaf952..64d5104f5 100644 --- a/Gemfile.lock +++ b/Gemfile.lock @@ -56,12 +56,6 @@ GIT addressable (>= 2.1.1) eventmachine (>= 0.12.9) -GIT - remote: git://github.com/tanoku/redcarpet - revision: 3c6b5807e8a5be51d769149e555b09bae8ae3228 - specs: - redcarpet (2.0.0b3) - GEM remote: http://rubygems.org/ specs: @@ -363,6 +357,7 @@ GEM rash (0.3.0) hashie (~> 1.0.0) rdoc (3.9.4) + redcarpet (2.0.0b5) redis (2.2.2) redis-namespace (0.8.0) redis (< 3.0.0) @@ -518,7 +513,7 @@ DEPENDENCIES omniauth (= 0.2.6) rails (= 3.0.10) rails-i18n - redcarpet! + redcarpet (= 2.0.0b5) resque (= 1.10.0) resque-ensure-connected resque-timeout (= 1.0.0) diff --git a/app/helpers/markdownify_helper.rb b/app/helpers/markdownify_helper.rb index 13cb7c5cb..e6c66dc98 100644 --- a/app/helpers/markdownify_helper.rb +++ b/app/helpers/markdownify_helper.rb @@ -31,6 +31,7 @@ module MarkdownifyHelper return '' if message.blank? + #renderer = Redcarpet::Render::HTML.new(render_options) renderer = Diaspora::Markdownify::HTML.new(render_options) markdown = Redcarpet::Markdown.new(renderer, markdown_options) diff --git a/lib/diaspora/markdownify.rb b/lib/diaspora/markdownify.rb index c21fdaa68..a937afbb2 100644 --- a/lib/diaspora/markdownify.rb +++ b/lib/diaspora/markdownify.rb @@ -3,186 +3,13 @@ require 'erb' module Diaspora module Markdownify class HTML < Redcarpet::Render::HTML - attr_accessor :newlines, :specialchars, :youtube_maps, :vimeo_maps - def initialize(options={}) - super - - @newlines = options.fetch(:newlines, true) - @specialchars = options.fetch(:specialchars, true) - @youtube_maps = options[:youtube_maps]||{} - @vimeo_maps = options[:vimeo_maps] || {} - end + include ActionView::Helpers::TextHelper + include ActionView::Helpers::TagHelper def autolink(link, type) - return link if type == :email - autolink_youtube(link) || autolink_vimeo(link) || autolink_simple(link) + auto_link(link, :link => :urls ) end - - def autolink_simple(link) - - # If there isn't *some* protocol, assume http - if link !~ %r{^\w+://} - link = "http://#{link}" - end - - content = link.gsub(%r{^\w+://}, '') - - %Q{#{content}} - end - - def autolink_vimeo(link) - regex = %r{https?://(?:w{3}\.)?vimeo.com/(\d{6,})/?} - if link =~ regex - video_id = $1 - if @vimeo_maps[video_id] - title = ERB::Util.h(CGI::unescape(@vimeo_maps[video_id])) - else - title = I18n.t 'application.helper.video_title.unknown' - end - return ' Vimeo: ' + title + '' - end - return - end - - def autolink_youtube(link) - if link =~ YoutubeTitles::YOUTUBE_ID_REGEX - video_id = $1 - anchor = $2 || '' - - if @youtube_maps[video_id] - title = ERB::Util.h(CGI::unescape(@youtube_maps[video_id])) - else - title = I18n.t 'application.helper.video_title.unknown' - end - return ' Youtube: ' + title + '' - end - return - end - - def block_code(text, language) - "
\n#{text}"
- end
-
- def double_emphasis(text)
- "#{text}"
- end
-
- def linebreak()
- "#{text}
" - end - - def preprocess(full_document) - entities = [ - ['&', '&'], - ['>', '>'], - ['<', '<'] - ] - entities.each do |original, replacement| - full_document = full_document.gsub(original, replacement) - end - - if @specialchars - full_document = specialchars(full_document) - end - - our_unsafe_chars = '()' - full_document = full_document.gsub(%r{ - \[ \s*? ( [^ \] ]+ ) \s*? \] - (?: - \( \s*? (\S+) \s*? (?: "([^"]+)" )? \) \s*? - ) - }xm) do |m| - content = $1 - link = URI.escape($2, our_unsafe_chars) - title = $3 - - title_chunk = if title - %W{" #{title}"} - else - '' - end - %Q{[#{content}](#{link}#{title_chunk})} - end - - return full_document - end - - - - def single_emphasis(text) - "#{text}" - end - - def specialchars(text) - if @specialchars - map = [ - ["<3", "♥"], - ["<->", "↔"], - ["->", "→"], - ["<-", "←"], - ["\.\.\.", "…"], - ["(tm)", "™"], - ["(r)", "®"], - ["(c)", "©"] - ] - end - - map.each do |mapping| - text = text.gsub(mapping[0], mapping[1]) - end - - return text - end - - - def triple_emphasis(text) - single_emphasis(double_emphasis(text)) - end - end end end diff --git a/spec/helpers/markdownify_helper_spec.rb b/spec/helpers/markdownify_helper_spec.rb index 08ba42f90..95c960d64 100644 --- a/spec/helpers/markdownify_helper_spec.rb +++ b/spec/helpers/markdownify_helper_spec.rb @@ -7,302 +7,27 @@ require 'spec_helper' describe MarkdownifyHelper do describe "#markdownify" do - it 'does not error if youtube_maps in the hash is explicitly set to nil' do - expect{ - markdownify("http://www.youtube.com/watch?v=pZROlhHOvuo", :youtube_maps => nil) - }.should_not raise_error - end - - it 'does not error if youtube_maps in the hash is explicitly set to nil' do - expect{ - markdownify("http://vimeo.com/18589934", :vimeo_maps => nil) - }.should_not raise_error - end - - describe "autolinks" do - it "should not allow basic XSS/HTML" do - markdownify("").should == "<script>alert('XSS is evil')</script>
" + describe "not doing something dumb" do + it "strips out script tags" do + markdownify("").should == + "alert('XSS is evil')
\n" end - it "should recognize basic http links (1/3)" do - proto="http" - url="bugs.joindiaspora.com/issues/332" - full_url = "#{proto}://#{url}" - markdownify(full_url).should == %Q{} - end - - it "should recognize basic http links (2/3)" do - proto="http" - url="webmail.example.com?~()!*/" - full_url = "#{proto}://#{url}" - markdownify(full_url).should == %Q{} - end - - it "should recognize basic http links (3/3)" do - proto="http" - url="127.0.0.1:3000/users/sign_in" - full_url = "#{proto}://#{url}" - markdownify(full_url).should == %Q{} - end - - it "should recognize secure https links" do - proto="https" - url="127.0.0.1:3000/users/sign_in" - full_url = "#{proto}://#{url}" - markdownify(full_url).should == %Q{} - end - - it "doesn't muck up code text" do - message = %{`puts "Hello"`} - markdownify(message).should =~ %r{puts "Hello"}
- message = %Q{~~~\nA\nB\n~~~\n}
- markdownify(message).should =~ %r{\nA\nB\n}
- end
-
- it "doesn't double parse video links" do
- message = "http://www.vimeo.com/17449557
- http://www.youtube.com/watch?v=0x__dDWdf23&a=GxdCwVVULXdvEBKmx_f5ywvZ0zZHHHDU&list=ML&playnext=1
- http://youtu.be/x_CzD0GBD-4"
- res = markdownify(message)
- res.should =~ /href.+href.+href/m
- res.should_not =~ /href.+href.+href.+href/m
- end
-
- describe "video links" do
- it "recognizes vimeo links" do
- video_id = "17449557"
- url = "http://www.vimeo.com/#{video_id}"
- res = markdownify(url)
- res.should =~ /data-host="vimeo.com"/
- res.should =~ /data-video-id="#{video_id}"/
- end
-
- it "matches a trailing slash in a vimeo link" do
- video_id = "17449557"
- url = "http://www.vimeo.com/#{video_id}/"
- res = markdownify(url)
- res.should =~ /data-host="vimeo.com"/
- res.should =~ /data-video-id="#{video_id}"/
- res.should_not =~ />\//
- end
-
- it "recognizes youtube links" do
- video_id = "0x__dDWdf23"
- url = "http://www.youtube.com/watch?v=" + video_id + "&a=GxdCwVVULXdvEBKmx_f5ywvZ0zZHHHDU&list=ML&playnext=1"
- res = markdownify(url)
- res.should =~ /Youtube:/
- res.should =~ /data-host="youtube.com"/
- res.should =~ /data-video-id="#{video_id}"/
-
- url = "www.youtube.com/watch?foo=bar&v=BARFOO-----&whatever=related"
- res = markdownify(url)
- res.should =~ /Youtube:/
- res.should =~ /data-host="youtube.com"/
- res.should =~ /data-video-id="BARFOO-----"/
- end
-
- it "recognizes youtu.be links" do
- video_id = "x_CzD0GBD-4"
- url = "http://youtu.be/#{video_id}"
- res = markdownify(url)
- res.should =~ /Youtube:/
- res.should =~ /data-host="youtube.com"/
- res.should =~ /data-video-id="#{video_id}"/
- end
-
- it "recognizes youtube links with hyphens" do
- video_id = "ABYnqp-bxvg"
- url = "http://www.youtube.com/watch?v=" + video_id + "&a=GxdCwVVULXdvEBKmx_f5ywvZ0zZHHHDU&list=ML&playnext=1"
- res = markdownify(url)
- res.should =~ /Youtube:/
- res.should =~ /data-host="youtube.com"/
- res.should =~ /data-video-id="#{video_id}"/
- end
-
- it "keeps anchors" do
- anchor = "#t=11m34"
- video_id = "DHRoHuv3I8E"
- url = "http://www.youtube.com/watch?v=" + video_id + anchor
- res = markdownify(url)
- res.should =~ /Youtube:/
- res.should =~ /data-host="youtube.com"/
- res.should =~ /data-video-id="#{video_id}"/
- res.should =~ /data-anchor="#{anchor}"/
- end
-
- it "has an empty data-anchor attribute if there is no anchor" do
- video_id = "DHRoHuv3I8E"
- url = "http://www.youtube.com/watch?v=" + video_id
- res = markdownify(url)
- res.should =~ /Youtube:/
- res.should =~ /data-host="youtube.com"/
- res.should =~ /data-video-id="#{video_id}"/
- res.should =~ /data-anchor=""/
- end
-
- it "leaves the links in the href of the #a tag" do
- video_id = "ABYnqp-bxvg"
- start_url ="http://www.youtube.com/watch?v=" + video_id
- url = start_url + "&a=GxdCwVVULXdvEBKmx_f5ywvZ0zZHHHDU&list=ML&playnext=1"
- res = markdownify(url)
- res.should =~ /href=[\S]+v=#{video_id}/
- end
-
- it 'does not autolink inside the link' do
- video_id = "ABYnqp-bxvg"
- start_url ="http://www.youtube.com/watch?v=" + video_id
- url = start_url + "&a=GxdCwVVULXdvEBKmx_f5ywvZ0zZHHHDU&list=ML&playnext=1"
- res = markdownify(url)
- res.match(/href=""+url+""
- end
-
- it "should recognize www links" do
- url="www.joindiaspora.com"
- markdownify(url).should == %Q{}
+ it 'strips onClick handlers from links' do
+ omghax = '[XSS](http://joindiaspora.com/" onClick="$\(\'a\'\).remove\(\))'
+ markdownify(omghax).should_not match(/ onClick/i)
end
end
- describe "specialchars" do
- it "replaces <3 with ♥" do
- message = "i <3 you"
- markdownify(message).should == "i ♥ you
" - end - - it "replaces various things with (their) HTML entities" do - message = "... <-> -> <- (tm) (r) (c)" - markdownify(message).should == "… ↔ → ← ™ ® ©
" - end - - it "skips doing it if you say so" do - message = "... -> <-" - markdownify(message, :specialchars => false).should == "... -> <-
" - end - end - - describe "weak emphasis" do - it "should be recognized (1/2)" do - message = "*some text* some text *some text* some text" - markdownify(message).should == "some text some text some text some text
" - end - - it "should be recognized (2/2)" do - message = "_some text_ some text _some text_ some text" - markdownify(message).should == "some text some text some text some text
" - end - end - - describe "strong emphasis" do - it "should be recognized (1/2)" do - message = "**some text** some text **some text** some text" - markdownify(message).should == "some text some text some text some text
" - end - - it "should be recognized (2/2)" do - message = "__some text__ some text __some text__ some text" - markdownify(message).should == "some text some text some text some text
" - end - end - - describe "nested weak and strong emphasis" do - it "should be rendered correctly" do - message = "__this is _some_ text__" - markdownify(message).should == "this is some text
" - message = "*this is **some** text*" - markdownify(message).should == "this is some text
" - message = "___some text___" - markdownify(message).should == "some text
" - end - end - - describe "links" do - it "should be recognized without title attribute" do - message = "[link text](http://someurl.com) [link text](http://someurl.com)" - markdownify(message).should == '' - end - - it "should be recognized with title attribute" do - message = '[link text](http://someurl.com "some title") [link text](http://someurl.com "some title")' - markdownify(message).should == '' - end - - it "should have a robust link parsing" do - message = "[wikipedia](http://en.wikipedia.org/wiki/Text_(literary_theory))" - link = markdownify(message) - link.should =~ %r{href="http://en.wikipedia.org/wiki/Text_%28literary_theory%29"} - - message = "[ links]( google.com)" - markdownify(message).should == %Q{} - - message = "[_http_](http://google.com/search?q=with_multiple__underscores*and**asterisks )" - markdownify(message).should == %Q{} - message = %{[___FTP___]( ftp://ftp.uni-kl.de/CCC/26C3/mp4/26c3-3540-en-a_hackers_utopia.mp4 'File Transfer Protocol')} - markdownify(message).should == %{} - - message = %{[**any protocol**](foo://bar.example.org/yes_it*makes*no_sense)} - markdownify(message).should == %{} - - message = "This [ *text* ]( http://en.wikipedia.org/wiki/Text_(literary_theory) ) with many [ links]( google.com) tests [_http_](http://google.com/search?q=with_multiple__underscores*and**asterisks ), [___FTP___]( ftp://ftp.uni-kl.de/CCC/26C3/mp4/26c3-3540-en-a_hackers_utopia.mp4 'File Transfer Protocol'), [**any protocol**](foo://bar.example.org/yes_it*makes*no_sense)" - markdownify(message).should == 'This text with many links tests http, FTP, any protocol
' - end - - end - - describe "nested emphasis and links tags" do - it "should be rendered correctly" do - message = '[**some *link* text**](someurl.com "some title")' - markdownify(message).should == '' - end - end - - it "should allow escaping" do - message = '*some text* \*some text* \**some text* _some text_ \_some text_ \__some text_' - markdownify(message).should == "some text *some text* *some text some text _some text_ _some text
" - end - - describe "newlines" do - it 'skips inserting newlines if you pass the newlines option' do - message = "These\nare\n\some\nnew\lines" - res = markdownify(message, :newlines => false) - res.should == "#{message}
" - end - - it 'generates breaklines' do - message = "These\nare\nsome\nnew\nlines" - res = markdownify(message) - res.should == "These
are
some
new
lines
Some text, then a line break and a link
joindiaspora.com
some more text