2017-04-25 02:47:31 +02:00
require 'rails_helper'
2018-05-02 18:58:48 +02:00
RSpec . describe FetchLinkCardService , type : :service do
2021-11-05 23:23:05 +01:00
subject { described_class . new }
2017-05-17 00:41:15 +02:00
2017-04-25 02:47:31 +02:00
before do
stub_request ( :get , 'http://example.xn--fiqs8s/' ) . to_return ( request_fixture ( 'idn.txt' ) )
2017-07-05 21:54:21 +09:00
stub_request ( :get , 'http://example.com/sjis' ) . to_return ( request_fixture ( 'sjis.txt' ) )
2017-07-09 05:44:31 +09:00
stub_request ( :get , 'http://example.com/sjis_with_wrong_charset' ) . to_return ( request_fixture ( 'sjis_with_wrong_charset.txt' ) )
stub_request ( :get , 'http://example.com/koi8-r' ) . to_return ( request_fixture ( 'koi8-r.txt' ) )
2017-09-15 01:03:20 +09:00
stub_request ( :get , 'http://example.com/日本語' ) . to_return ( request_fixture ( 'sjis.txt' ) )
2019-10-01 04:54:10 +02:00
stub_request ( :get , 'https://github.com/qbi/WannaCry' ) . to_return ( status : 404 )
2023-06-01 12:14:49 +02:00
stub_request ( :get , 'http://example.com/test?data=file.gpx%5E1' ) . to_return ( status : 200 )
2018-02-11 22:49:18 +00:00
stub_request ( :get , 'http://example.com/test-' ) . to_return ( request_fixture ( 'idn.txt' ) )
2018-12-17 19:19:45 +01:00
stub_request ( :get , 'http://example.com/windows-1251' ) . to_return ( request_fixture ( 'windows-1251.txt' ) )
2024-06-21 14:51:10 +02:00
stub_request ( :get , 'http://example.com/low_confidence_latin1' ) . to_return ( request_fixture ( 'low_confidence_latin1.txt' ) )
2017-05-17 00:41:15 +02:00
subject . call ( status )
end
context 'in a local status' do
context do
let ( :status ) { Fabricate ( :status , text : 'Check out http://example.中国' ) }
it 'works with IDN URLs' do
expect ( a_request ( :get , 'http://example.xn--fiqs8s/' ) ) . to have_been_made . at_least_once
end
end
2017-07-05 21:54:21 +09:00
context do
let ( :status ) { Fabricate ( :status , text : 'Check out http://example.com/sjis' ) }
it 'works with SJIS' do
expect ( a_request ( :get , 'http://example.com/sjis' ) ) . to have_been_made . at_least_once
2017-09-01 16:20:16 +02:00
expect ( status . preview_cards . first . title ) . to eq ( " SJISのページ " )
2017-07-09 05:44:31 +09:00
end
end
context do
let ( :status ) { Fabricate ( :status , text : 'Check out http://example.com/sjis_with_wrong_charset' ) }
it 'works with SJIS even with wrong charset header' do
expect ( a_request ( :get , 'http://example.com/sjis_with_wrong_charset' ) ) . to have_been_made . at_least_once
2017-09-01 16:20:16 +02:00
expect ( status . preview_cards . first . title ) . to eq ( " SJISのページ " )
2017-07-09 05:44:31 +09:00
end
end
context do
let ( :status ) { Fabricate ( :status , text : 'Check out http://example.com/koi8-r' ) }
it 'works with koi8-r' do
expect ( a_request ( :get , 'http://example.com/koi8-r' ) ) . to have_been_made . at_least_once
2017-09-01 16:20:16 +02:00
expect ( status . preview_cards . first . title ) . to eq ( " Московя начинаетъ только въ XVI ст. привлекать внимане иностранцевъ. " )
2017-07-05 21:54:21 +09:00
end
end
2017-09-15 01:03:20 +09:00
2018-12-17 19:19:45 +01:00
context do
let ( :status ) { Fabricate ( :status , text : 'Check out http://example.com/windows-1251' ) }
it 'works with windows-1251' do
expect ( a_request ( :get , 'http://example.com/windows-1251' ) ) . to have_been_made . at_least_once
expect ( status . preview_cards . first . title ) . to eq ( 'сэмпл текст' )
end
end
2024-06-21 14:51:10 +02:00
context 'with a URL of a page in ISO-8859-1 encoding, that charlock_holmes cannot detect' do
let ( :status ) { Fabricate ( :status , text : 'Check out http://example.com/low_confidence_latin1' ) }
it 'decodes the HTML' do
expect ( status . preview_card . title ) . to eq ( " Tofu á l'orange " )
end
end
context 'with a Japanese path URL' do
2017-09-15 01:03:20 +09:00
let ( :status ) { Fabricate ( :status , text : 'テストhttp://example.com/日本語' ) }
it 'works with Japanese path string' do
expect ( a_request ( :get , 'http://example.com/日本語' ) ) . to have_been_made . at_least_once
expect ( status . preview_cards . first . title ) . to eq ( " SJISのページ " )
end
end
2018-02-11 22:49:18 +00:00
context do
let ( :status ) { Fabricate ( :status , text : 'test http://example.com/test-' ) }
it 'works with a URL ending with a hyphen' do
expect ( a_request ( :get , 'http://example.com/test-' ) ) . to have_been_made . at_least_once
end
end
2021-03-04 00:12:26 +01:00
context do
let ( :status ) { Fabricate ( :status , text : 'testhttp://example.com/sjis' ) }
it 'does not fetch URLs with not isolated from their surroundings' do
expect ( a_request ( :get , 'http://example.com/sjis' ) ) . to_not have_been_made
end
end
2023-06-01 12:14:49 +02:00
context do
let ( :status ) { Fabricate ( :status , text : 'test http://example.com/test?data=file.gpx^1' ) }
it 'does fetch URLs with a caret in search params' do
expect ( a_request ( :get , 'http://example.com/test?data=file.gpx' ) ) . to_not have_been_made
expect ( a_request ( :get , 'http://example.com/test?data=file.gpx%5E1' ) ) . to have_been_made . once
end
end
2024-06-27 16:40:19 +02:00
context 'with an URL too long for PostgreSQL unique indexes' do
let ( :url ) { " http://example.com/ #{ 'a' * 2674 } " }
let ( :status ) { Fabricate ( :status , text : url ) }
it 'does not fetch the URL' do
expect ( a_request ( :get , url ) ) . to_not have_been_made
end
it 'does not create a preview card' do
expect ( status . preview_card ) . to be_nil
end
end
2017-04-25 02:47:31 +02:00
end
2017-05-17 00:41:15 +02:00
context 'in a remote status' do
2019-11-21 16:04:52 +01:00
let ( :status ) { Fabricate ( :status , account : Fabricate ( :account , domain : 'example.com' ) , text : 'Habt ihr ein paar gute Links zu <a>foo</a> #<span class="tag"><a href="https://quitter.se/tag/wannacry" target="_blank" rel="tag noopener noreferrer" title="https://quitter.se/tag/wannacry">Wannacry</a></span> herumfliegen? Ich will mal unter <br> <a href="https://github.com/qbi/WannaCry" target="_blank" rel="noopener noreferrer" title="https://github.com/qbi/WannaCry">https://github.com/qbi/WannaCry</a> was sammeln. !<a href="http://sn.jonkman.ca/group/416/id" target="_blank" rel="noopener noreferrer" title="http://sn.jonkman.ca/group/416/id">security</a> ' ) }
2017-05-17 00:41:15 +02:00
it 'parses out URLs' do
2019-10-01 04:54:10 +02:00
expect ( a_request ( :get , 'https://github.com/qbi/WannaCry' ) ) . to have_been_made . at_least_once
2017-05-17 00:41:15 +02:00
end
2017-04-25 02:47:31 +02:00
2017-05-17 00:41:15 +02:00
it 'ignores URLs to hashtags' do
2019-10-01 04:54:10 +02:00
expect ( a_request ( :get , 'https://quitter.se/tag/wannacry' ) ) . to_not have_been_made
2017-05-17 00:41:15 +02:00
end
2017-04-25 02:47:31 +02:00
end
end