Remove language detection through cld3 (#17478)
* Remove language detection through cld3

* Update app/helpers/languages_helper.rb

Co-authored-by: Yamagishi Kazutoshi <ykzts@desire.sh>

Co-authored-by: Yamagishi Kazutoshi <ykzts@desire.sh>
This commit is contained in:
		| @@ -3,9 +3,9 @@ | ||||
| require 'rails_helper' | ||||
|  | ||||
| describe LanguagesHelper do | ||||
|   describe 'the HUMAN_LOCALES constant' do | ||||
|     it 'includes all I18n locales' do | ||||
|       expect(described_class::HUMAN_LOCALES.keys).to include(*I18n.available_locales) | ||||
|   describe 'the SUPPORTED_LOCALES constant' do | ||||
|     it 'includes all i18n locales' do | ||||
|       expect(Set.new(described_class::SUPPORTED_LOCALES.keys + described_class::REGIONAL_LOCALE_NAMES.keys)).to include(*I18n.available_locales) | ||||
|     end | ||||
|   end | ||||
|  | ||||
|   | ||||
| @@ -1,134 +0,0 @@ | ||||
| # frozen_string_literal: true | ||||
|  | ||||
| require 'rails_helper' | ||||
|  | ||||
| describe LanguageDetector do | ||||
|   describe 'prepare_text' do | ||||
|     it 'returns unmodified string without special cases' do | ||||
|       string = 'just a regular string' | ||||
|       result = described_class.instance.send(:prepare_text, string) | ||||
|  | ||||
|       expect(result).to eq string | ||||
|     end | ||||
|  | ||||
|     it 'collapses spacing in strings' do | ||||
|       string = 'The formatting   in    this is very        odd' | ||||
|  | ||||
|       result = described_class.instance.send(:prepare_text, string) | ||||
|       expect(result).to eq 'The formatting in this is very odd' | ||||
|     end | ||||
|  | ||||
|     it 'strips usernames from strings before detection' do | ||||
|       string = '@username Yeah, very surreal...! also @friend' | ||||
|  | ||||
|       result = described_class.instance.send(:prepare_text, string) | ||||
|       expect(result).to eq 'Yeah, very surreal...! also' | ||||
|     end | ||||
|  | ||||
|     it 'strips URLs from strings before detection' do | ||||
|       string = 'Our website is https://example.com and also http://localhost.dev' | ||||
|  | ||||
|       result = described_class.instance.send(:prepare_text, string) | ||||
|       expect(result).to eq 'Our website is and also' | ||||
|     end | ||||
|  | ||||
|     it 'converts #hashtags back to normal text before detection' do | ||||
|       string = 'Hey look at all the #animals and #FishAndChips' | ||||
|  | ||||
|       result = described_class.instance.send(:prepare_text, string) | ||||
|       expect(result).to eq 'Hey look at all the animals and fish and chips' | ||||
|     end | ||||
|   end | ||||
|  | ||||
|   describe 'detect' do | ||||
|     let(:account_without_user_locale) { Fabricate(:user, locale: nil).account } | ||||
|     let(:account_remote) { Fabricate(:account, domain: 'joinmastodon.org') } | ||||
|  | ||||
|     it 'detects english language for basic strings' do | ||||
|       strings = [ | ||||
|         "Hello and welcome to mastodon how are you today?", | ||||
|         "I'd rather not!", | ||||
|         "a lot of people just want to feel righteous all the time and that's all that matters", | ||||
|       ] | ||||
|       strings.each do |string| | ||||
|         result = described_class.instance.detect(string, account_without_user_locale) | ||||
|  | ||||
|         expect(result).to eq(:en), string | ||||
|       end | ||||
|     end | ||||
|  | ||||
|     it 'detects spanish language' do | ||||
|       string = 'Obtener un Hola y bienvenidos a Mastodon. Obtener un Hola y bienvenidos a Mastodon. Obtener un Hola y bienvenidos a Mastodon. Obtener un Hola y bienvenidos a Mastodon' | ||||
|       result = described_class.instance.detect(string, account_without_user_locale) | ||||
|  | ||||
|       expect(result).to eq :es | ||||
|     end | ||||
|  | ||||
|     describe 'when language can\'t be detected' do | ||||
|       it 'uses nil when sent an empty document' do | ||||
|         result = described_class.instance.detect('', account_without_user_locale) | ||||
|         expect(result).to eq nil | ||||
|       end | ||||
|  | ||||
|       describe 'because of a URL' do | ||||
|         it 'uses nil when sent just a URL' do | ||||
|           string = 'http://example.com/media/2kFTgOJLXhQf0g2nKB4' | ||||
|           cld_result = CLD3::NNetLanguageIdentifier.new(0, 2048).find_language(string) | ||||
|           expect(cld_result).not_to eq :en | ||||
|  | ||||
|           result = described_class.instance.detect(string, account_without_user_locale) | ||||
|  | ||||
|           expect(result).to eq nil | ||||
|         end | ||||
|       end | ||||
|  | ||||
|       describe 'with an account' do | ||||
|         it 'uses the account locale when present' do | ||||
|           account = double(user_locale: 'fr') | ||||
|           result  = described_class.instance.detect('', account) | ||||
|  | ||||
|           expect(result).to eq nil | ||||
|         end | ||||
|  | ||||
|         it 'uses nil when account is present but has no locale' do | ||||
|           result = described_class.instance.detect('', account_without_user_locale) | ||||
|  | ||||
|           expect(result).to eq nil | ||||
|         end | ||||
|       end | ||||
|  | ||||
|       describe 'with an `en` default locale' do | ||||
|         it 'uses nil for undetectable string' do | ||||
|           result = described_class.instance.detect('', account_without_user_locale) | ||||
|  | ||||
|           expect(result).to eq nil | ||||
|         end | ||||
|       end | ||||
|  | ||||
|       describe 'remote user' do | ||||
|         it 'detects Korean language' do | ||||
|           string = '안녕하세요' | ||||
|           result = described_class.instance.detect(string, account_remote) | ||||
|  | ||||
|           expect(result).to eq :ko | ||||
|         end | ||||
|       end | ||||
|  | ||||
|       describe 'with a non-`en` default locale' do | ||||
|         around(:each) do |example| | ||||
|           before = I18n.default_locale | ||||
|           I18n.default_locale = :ja | ||||
|           example.run | ||||
|           I18n.default_locale = before | ||||
|         end | ||||
|  | ||||
|         it 'uses nil for undetectable string' do | ||||
|           string = '' | ||||
|           result = described_class.instance.detect(string, account_without_user_locale) | ||||
|  | ||||
|           expect(result).to eq nil | ||||
|         end | ||||
|       end | ||||
|     end | ||||
|   end | ||||
| end | ||||
		Reference in New Issue
	
	Block a user