# frozen_string_literal: true require 'rails_helper' describe LanguageDetector do describe 'prepare_text' do it 'returns unmodified string without special cases' do string = 'just a regular string' result = described_class.instance.send(:prepare_text, string) expect(result).to eq string end it 'collapses spacing in strings' do string = 'The formatting in this is very odd' result = described_class.instance.send(:prepare_text, string) expect(result).to eq 'The formatting in this is very odd' end it 'strips usernames from strings before detection' do string = '@username Yeah, very surreal...! also @friend' result = described_class.instance.send(:prepare_text, string) expect(result).to eq 'Yeah, very surreal...! also' end it 'strips URLs from strings before detection' do string = 'Our website is https://example.com and also http://localhost.dev' result = described_class.instance.send(:prepare_text, string) expect(result).to eq 'Our website is and also' end it 'converts #hashtags back to normal text before detection' do string = 'Hey look at all the #animals and #FishAndChips' result = described_class.instance.send(:prepare_text, string) expect(result).to eq 'Hey look at all the animals and fish and chips' end end describe 'detect' do let(:account_without_user_locale) { Fabricate(:user, locale: nil).account } let(:account_remote) { Fabricate(:account, domain: 'joinmastodon.org') } it 'detects english language for basic strings' do strings = [ "Hello and welcome to mastodon how are you today?", "I'd rather not!", "a lot of people just want to feel righteous all the time and that's all that matters", ] strings.each do |string| result = described_class.instance.detect(string, account_without_user_locale) expect(result).to eq(:en), string end end it 'detects spanish language' do string = 'Obtener un Hola y bienvenidos a Mastodon. Obtener un Hola y bienvenidos a Mastodon. Obtener un Hola y bienvenidos a Mastodon. Obtener un Hola y bienvenidos a Mastodon' result = described_class.instance.detect(string, account_without_user_locale) expect(result).to eq :es end describe 'when language can\'t be detected' do it 'uses nil when sent an empty document' do result = described_class.instance.detect('', account_without_user_locale) expect(result).to eq nil end describe 'because of a URL' do it 'uses nil when sent just a URL' do string = 'http://example.com/media/2kFTgOJLXhQf0g2nKB4' cld_result = CLD3::NNetLanguageIdentifier.new(0, 2048).find_language(string) expect(cld_result).not_to eq :en result = described_class.instance.detect(string, account_without_user_locale) expect(result).to eq nil end end describe 'with an account' do it 'uses the account locale when present' do account = double(user_locale: 'fr') result = described_class.instance.detect('', account) expect(result).to eq nil end it 'uses nil when account is present but has no locale' do result = described_class.instance.detect('', account_without_user_locale) expect(result).to eq nil end end describe 'with an `en` default locale' do it 'uses nil for undetectable string' do result = described_class.instance.detect('', account_without_user_locale) expect(result).to eq nil end end describe 'remote user' do it 'detects Korean language' do string = '안녕하세요' result = described_class.instance.detect(string, account_remote) expect(result).to eq :ko end end describe 'with a non-`en` default locale' do around(:each) do |example| before = I18n.default_locale I18n.default_locale = :ja example.run I18n.default_locale = before end it 'uses nil for undetectable string' do string = '' result = described_class.instance.detect(string, account_without_user_locale) expect(result).to eq nil end end end end end