* Decouple Status#local? from uri being nil * Replace on-the-fly URI generation with stored URIs - Generate URI in after_save hook for local statuses - Use static value in TagManager when available, fallback to tag format - Make TagManager use ActivityPub::TagManager to understand new format - Adjust tests * Use other heuristic for locality of old statuses, do not perform long query * Exclude tombstone stream entries from Atom feed * Prevent nil statuses from landing in Pubsubhubbub::DistributionWorker * Fix URI not being saved (#4818) * Add more specs for Status * Save generated uri immediately and also fix method order to minimize diff. * Fix alternate HTML URL in Atom * Fix tests * Remove not-null constraint from statuses migration to speed it up
		
			
				
	
	
		
			294 lines
		
	
	
		
			8.5 KiB
		
	
	
	
		
			Ruby
		
	
	
	
	
	
			
		
		
	
	
			294 lines
		
	
	
		
			8.5 KiB
		
	
	
	
		
			Ruby
		
	
	
	
	
	
| require 'rails_helper'
 | |
| 
 | |
| RSpec.describe Formatter do
 | |
|   let(:local_account)  { Fabricate(:account, domain: nil, username: 'alice') }
 | |
|   let(:remote_account) { Fabricate(:account, domain: 'remote', username: 'bob', url: 'https://remote/') }
 | |
| 
 | |
|   shared_examples 'encode and link URLs' do
 | |
|     context 'matches a stand-alone medium URL' do
 | |
|       let(:text) { 'https://hackernoon.com/the-power-to-build-communities-a-response-to-mark-zuckerberg-3f2cac9148a4' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="https://hackernoon.com/the-power-to-build-communities-a-response-to-mark-zuckerberg-3f2cac9148a4"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a stand-alone google URL' do
 | |
|       let(:text) { 'http://google.com' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="http://google.com/"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a stand-alone IDN URL' do
 | |
|       let(:text) { 'https://nic.みんな/' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="https://nic.xn--q9jyb4c/"'
 | |
|       end
 | |
| 
 | |
|       it 'has display URL' do
 | |
|         is_expected.to include '<span class="">nic.みんな/</span>'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a URL without trailing period' do
 | |
|       let(:text) { 'http://www.mcmansionhell.com/post/156408871451/50-states-of-mcmansion-hell-scottsdale-arizona. ' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="http://www.mcmansionhell.com/post/156408871451/50-states-of-mcmansion-hell-scottsdale-arizona"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a URL without closing paranthesis' do
 | |
|       let(:text) { '(http://google.com/)' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="http://google.com/"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a URL without exclamation point' do
 | |
|       let(:text) { 'http://www.google.com!' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="http://www.google.com/"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a URL without single quote' do
 | |
|       let(:text) { "http://www.google.com'" }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="http://www.google.com/"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a URL without angle brackets' do
 | |
|       let(:text) { 'http://www.google.com>' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="http://www.google.com/"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a URL with a query string' do
 | |
|       let(:text) { 'https://www.ruby-toolbox.com/search?utf8=%E2%9C%93&q=autolink' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="https://www.ruby-toolbox.com/search?utf8=%E2%9C%93&q=autolink"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'matches a URL with parenthesis in it' do
 | |
|       let(:text) { 'https://en.wikipedia.org/wiki/Diaspora_(software)' }
 | |
| 
 | |
|       it 'has valid URL' do
 | |
|         is_expected.to include 'href="https://en.wikipedia.org/wiki/Diaspora_(software)"'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'contains HTML (script tag)' do
 | |
|       let(:text) { '<script>alert("Hello")</script>' }
 | |
| 
 | |
|       it 'has escaped HTML' do
 | |
|         is_expected.to include '<p><script>alert("Hello")</script></p>'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'contains HTML (XSS attack)' do
 | |
|       let(:text) { %q{<img src="javascript:alert('XSS');">} }
 | |
| 
 | |
|       it 'has escaped HTML' do
 | |
|         is_expected.to include '<p><img src="javascript:alert('XSS');"></p>'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'contains invalid URL' do
 | |
|       let(:text) { 'http://www\.google\.com' }
 | |
| 
 | |
|       it 'has raw URL' do
 | |
|         is_expected.to eq '<p>http://www\.google\.com</p>'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'contains a hashtag' do
 | |
|       let(:text)  { '#hashtag' }
 | |
| 
 | |
|       it 'has a link' do
 | |
|         is_expected.to include '/tags/hashtag" class="mention hashtag" rel="tag">#<span>hashtag</span></a>'
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   describe '#format' do
 | |
|     subject { Formatter.instance.format(status) }
 | |
| 
 | |
|     context 'with local status' do
 | |
|       context 'with reblog' do
 | |
|         let(:reblog) { Fabricate(:status, account: local_account, text: 'Hello world', uri: nil) }
 | |
|         let(:status) { Fabricate(:status, reblog: reblog) }
 | |
| 
 | |
|         it 'returns original status with credit to its author' do
 | |
|           is_expected.to include 'RT <span class="h-card"><a href="https://cb6e6126.ngrok.io/@alice" class="u-url mention">@<span>alice</span></a></span> Hello world'
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       context 'contains plain text' do
 | |
|         let(:status)  { Fabricate(:status, text: 'text', uri: nil) }
 | |
| 
 | |
|         it 'paragraphizes' do
 | |
|           is_expected.to eq '<p>text</p>'
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       context 'contains line feeds' do
 | |
|         let(:status)  { Fabricate(:status, text: "line\nfeed", uri: nil) }
 | |
| 
 | |
|         it 'removes line feeds' do
 | |
|           is_expected.not_to include "\n"
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       context 'contains linkable mentions' do
 | |
|         let(:status) { Fabricate(:status, mentions: [ Fabricate(:mention, account: local_account) ], text: '@alice') }
 | |
| 
 | |
|         it 'links' do
 | |
|           is_expected.to include '<a href="https://cb6e6126.ngrok.io/@alice" class="u-url mention">@<span>alice</span></a></span>'
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       context 'contains unlinkable mentions' do
 | |
|         let(:status) { Fabricate(:status, text: '@alice', uri: nil) }
 | |
| 
 | |
|         it 'does not link' do
 | |
|           is_expected.to include '@alice'
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       context do
 | |
|         subject do
 | |
|           status = Fabricate(:status, text: text, uri: nil)
 | |
|           Formatter.instance.format(status)
 | |
|         end
 | |
| 
 | |
|         include_examples 'encode and link URLs'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'with remote status' do
 | |
|       let(:status) { Fabricate(:status, account: remote_account, text: 'Beep boop') }
 | |
| 
 | |
|       it 'reformats' do
 | |
|         is_expected.to eq 'Beep boop'
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   describe '#reformat' do
 | |
|     subject { Formatter.instance.reformat(text) }
 | |
| 
 | |
|     context 'contains plain text' do
 | |
|       let(:text) { 'Beep boop' }
 | |
| 
 | |
|       it 'contains plain text' do
 | |
|         is_expected.to include 'Beep boop'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'contains scripts' do
 | |
|       let(:text) { '<script>alert("Hello")</script>' }
 | |
| 
 | |
|       it 'strips scripts' do
 | |
|         is_expected.to_not include '<script>alert("Hello")</script>'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'contains malicious classes' do
 | |
|       let(:text) { '<span class="status__content__spoiler-link">Show more</span>' }
 | |
| 
 | |
|       it 'strips malicious classes' do
 | |
|         is_expected.to_not include 'status__content__spoiler-link'
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   describe '#plaintext' do
 | |
|     subject { Formatter.instance.plaintext(status) }
 | |
| 
 | |
|     context 'with local status' do
 | |
|       let(:status)  { Fabricate(:status, text: '<p>a text by a nerd who uses an HTML tag in text</p>', uri: nil) }
 | |
| 
 | |
|       it 'returns raw text' do
 | |
|         is_expected.to eq '<p>a text by a nerd who uses an HTML tag in text</p>'
 | |
|       end
 | |
|     end
 | |
| 
 | |
|     context 'with remote status' do
 | |
|       let(:status)  { Fabricate(:status, account: remote_account, text: '<script>alert("Hello")</script>') }
 | |
| 
 | |
|       it 'returns tag-stripped text' do
 | |
|         is_expected.to eq ''
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   describe '#simplified_format' do
 | |
|     subject { Formatter.instance.simplified_format(account) }
 | |
| 
 | |
|     context 'with local status' do
 | |
|       let(:account) { Fabricate(:account, domain: nil, note: text) }
 | |
| 
 | |
|       context 'contains linkable mentions for local accounts' do
 | |
|         let(:text) { '@alice' }
 | |
| 
 | |
|         before { local_account }
 | |
| 
 | |
|         it 'links' do
 | |
|           is_expected.to eq '<p><span class="h-card"><a href="https://cb6e6126.ngrok.io/@alice" class="u-url mention">@<span>alice</span></a></span></p>'
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       context 'contains linkable mentions for remote accounts' do
 | |
|         let(:text) { '@bob@remote' }
 | |
| 
 | |
|         before { remote_account }
 | |
| 
 | |
|         it 'links' do
 | |
|           is_expected.to eq '<p><span class="h-card"><a href="https://remote/" class="u-url mention">@<span>bob</span></a></span></p>'
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       context 'contains unlinkable mentions' do
 | |
|         let(:text) { '@alice' }
 | |
| 
 | |
|         it 'returns raw mention texts' do
 | |
|           is_expected.to eq '<p>@alice</p>'
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       include_examples 'encode and link URLs'
 | |
|     end
 | |
| 
 | |
|     context 'with remote status' do
 | |
|       let(:text) { '<script>alert("Hello")</script>' }
 | |
|       let(:account) { Fabricate(:account, domain: 'remote', note: text) }
 | |
| 
 | |
|       it 'reformats' do
 | |
|         is_expected.to_not include '<script>alert("Hello")</script>'
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   describe '#sanitize' do
 | |
|     let(:html) { '<script>alert("Hello")</script>' }
 | |
| 
 | |
|     subject { Formatter.instance.sanitize(html, Sanitize::Config::MASTODON_STRICT) }
 | |
| 
 | |
|     it 'sanitizes' do
 | |
|       is_expected.to eq 'alert("Hello")'
 | |
|     end
 | |
|   end
 | |
| end
 |