Fix filterable_languages method of SettingsHelper (#4966)
This commit is contained in:
		
							parent
							
								
									efec507230
								
							
						
					
					
						commit
						48d77ea1eb
					
				
					 7 changed files with 43 additions and 53 deletions
				
			
		
							
								
								
									
										2
									
								
								Gemfile
									
										
									
									
									
								
							
							
						
						
									
										2
									
								
								Gemfile
									
										
									
									
									
								
							|  | @ -25,7 +25,7 @@ gem 'bootsnap' | ||||||
| gem 'browser' | gem 'browser' | ||||||
| gem 'charlock_holmes', '~> 0.7.5' | gem 'charlock_holmes', '~> 0.7.5' | ||||||
| gem 'iso-639' | gem 'iso-639' | ||||||
| gem 'cld3', '~> 3.1' | gem 'cld3', '~> 3.2.0' | ||||||
| gem 'devise', '~> 4.2' | gem 'devise', '~> 4.2' | ||||||
| gem 'devise-two-factor', '~> 3.0' | gem 'devise-two-factor', '~> 3.0' | ||||||
| gem 'doorkeeper', '~> 4.2' | gem 'doorkeeper', '~> 4.2' | ||||||
|  |  | ||||||
|  | @ -110,7 +110,7 @@ GEM | ||||||
|       activesupport |       activesupport | ||||||
|     charlock_holmes (0.7.5) |     charlock_holmes (0.7.5) | ||||||
|     chunky_png (1.3.8) |     chunky_png (1.3.8) | ||||||
|     cld3 (3.1.3) |     cld3 (3.2.0) | ||||||
|       ffi (>= 1.1.0, < 1.10.0) |       ffi (>= 1.1.0, < 1.10.0) | ||||||
|     climate_control (0.2.0) |     climate_control (0.2.0) | ||||||
|     cocaine (0.5.8) |     cocaine (0.5.8) | ||||||
|  | @ -541,7 +541,7 @@ DEPENDENCIES | ||||||
|   capistrano-yarn (~> 2.0) |   capistrano-yarn (~> 2.0) | ||||||
|   capybara (~> 2.14) |   capybara (~> 2.14) | ||||||
|   charlock_holmes (~> 0.7.5) |   charlock_holmes (~> 0.7.5) | ||||||
|   cld3 (~> 3.1) |   cld3 (~> 3.2.0) | ||||||
|   climate_control (~> 0.2) |   climate_control (~> 0.2) | ||||||
|   devise (~> 4.2) |   devise (~> 4.2) | ||||||
|   devise-two-factor (~> 3.0) |   devise-two-factor (~> 3.0) | ||||||
|  |  | ||||||
|  | @ -41,7 +41,7 @@ module SettingsHelper | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def filterable_languages |   def filterable_languages | ||||||
|     I18n.available_locales.map { |locale| locale.to_s.split('-').first.to_sym }.uniq |     LanguageDetector.instance.language_names.select(&HUMAN_LOCALES.method(:key?)) | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def hash_to_object(hash) |   def hash_to_object(hash) | ||||||
|  |  | ||||||
|  | @ -1,26 +1,31 @@ | ||||||
| # frozen_string_literal: true | # frozen_string_literal: true | ||||||
| 
 | 
 | ||||||
| class LanguageDetector | class LanguageDetector | ||||||
|   attr_reader :text, :account |   include Singleton | ||||||
| 
 | 
 | ||||||
|   def initialize(text, account = nil) |   def initialize | ||||||
|     @text = text |  | ||||||
|     @account = account |  | ||||||
|     @identifier = CLD3::NNetLanguageIdentifier.new(1, 2048) |     @identifier = CLD3::NNetLanguageIdentifier.new(1, 2048) | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def to_iso_s |   def detect(text, account) | ||||||
|     detected_language_code || default_locale |     detect_language_code(text) || default_locale(account) | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def prepared_text |   def language_names | ||||||
|     simplified_text.strip |     @language_names = | ||||||
|  |       CLD3::TaskContextParams::LANGUAGE_NAMES.map { |name| iso6391(name.to_s).to_sym } | ||||||
|  |                                              .uniq | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   private |   private | ||||||
| 
 | 
 | ||||||
|   def detected_language_code |   def prepare_text(text) | ||||||
|     iso6391(result.language).to_sym if detected_language_reliable? |     simplify_text(text).strip | ||||||
|  |   end | ||||||
|  | 
 | ||||||
|  |   def detect_language_code(text) | ||||||
|  |     result = @identifier.find_language(prepare_text(text)) | ||||||
|  |     iso6391(result.language.to_s).to_sym if result.reliable? | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def iso6391(bcp47) |   def iso6391(bcp47) | ||||||
|  | @ -32,15 +37,7 @@ class LanguageDetector | ||||||
|     ISO_639.find(iso639).alpha2 |     ISO_639.find(iso639).alpha2 | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def result |   def simplify_text(text) | ||||||
|     @result ||= @identifier.find_language(prepared_text) |  | ||||||
|   end |  | ||||||
| 
 |  | ||||||
|   def detected_language_reliable? |  | ||||||
|     result.reliable? |  | ||||||
|   end |  | ||||||
| 
 |  | ||||||
|   def simplified_text |  | ||||||
|     text.dup.tap do |new_text| |     text.dup.tap do |new_text| | ||||||
|       new_text.gsub!(FetchLinkCardService::URL_PATTERN, '') |       new_text.gsub!(FetchLinkCardService::URL_PATTERN, '') | ||||||
|       new_text.gsub!(Account::MENTION_RE, '') |       new_text.gsub!(Account::MENTION_RE, '') | ||||||
|  | @ -49,7 +46,7 @@ class LanguageDetector | ||||||
|     end |     end | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def default_locale |   def default_locale(account) | ||||||
|     account&.user_locale&.to_sym || nil |     account.user_locale&.to_sym | ||||||
|   end |   end | ||||||
| end | end | ||||||
|  |  | ||||||
|  | @ -28,7 +28,7 @@ class PostStatusService < BaseService | ||||||
|                                         sensitive: options[:sensitive], |                                         sensitive: options[:sensitive], | ||||||
|                                         spoiler_text: options[:spoiler_text] || '', |                                         spoiler_text: options[:spoiler_text] || '', | ||||||
|                                         visibility: options[:visibility] || account.user&.setting_default_privacy, |                                         visibility: options[:visibility] || account.user&.setting_default_privacy, | ||||||
|                                         language: detect_language_for(text, account), |                                         language: LanguageDetector.instance.detect(text, account), | ||||||
|                                         application: options[:application]) |                                         application: options[:application]) | ||||||
| 
 | 
 | ||||||
|       attach_media(status, media) |       attach_media(status, media) | ||||||
|  | @ -69,10 +69,6 @@ class PostStatusService < BaseService | ||||||
|     media.update(status_id: status.id) |     media.update(status_id: status.id) | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   def detect_language_for(text, account) |  | ||||||
|     LanguageDetector.new(text, account).to_iso_s |  | ||||||
|   end |  | ||||||
| 
 |  | ||||||
|   def process_mentions_service |   def process_mentions_service | ||||||
|     @process_mentions_service ||= ProcessMentionsService.new |     @process_mentions_service ||= ProcessMentionsService.new | ||||||
|   end |   end | ||||||
|  |  | ||||||
|  | @ -3,10 +3,10 @@ | ||||||
| require 'rails_helper' | require 'rails_helper' | ||||||
| 
 | 
 | ||||||
| describe LanguageDetector do | describe LanguageDetector do | ||||||
|   describe 'prepared_text' do |   describe 'prepare_text' do | ||||||
|     it 'returns unmodified string without special cases' do |     it 'returns unmodified string without special cases' do | ||||||
|       string = 'just a regular string' |       string = 'just a regular string' | ||||||
|       result = described_class.new(string).prepared_text |       result = described_class.instance.send(:prepare_text, string) | ||||||
| 
 | 
 | ||||||
|       expect(result).to eq string |       expect(result).to eq string | ||||||
|     end |     end | ||||||
|  | @ -14,33 +14,35 @@ describe LanguageDetector do | ||||||
|     it 'collapses spacing in strings' do |     it 'collapses spacing in strings' do | ||||||
|       string = 'The formatting   in    this is very        odd' |       string = 'The formatting   in    this is very        odd' | ||||||
| 
 | 
 | ||||||
|       result = described_class.new(string).prepared_text |       result = described_class.instance.send(:prepare_text, string) | ||||||
|       expect(result).to eq 'The formatting in this is very odd' |       expect(result).to eq 'The formatting in this is very odd' | ||||||
|     end |     end | ||||||
| 
 | 
 | ||||||
|     it 'strips usernames from strings before detection' do |     it 'strips usernames from strings before detection' do | ||||||
|       string = '@username Yeah, very surreal...! also @friend' |       string = '@username Yeah, very surreal...! also @friend' | ||||||
| 
 | 
 | ||||||
|       result = described_class.new(string).prepared_text |       result = described_class.instance.send(:prepare_text, string) | ||||||
|       expect(result).to eq 'Yeah, very surreal...! also' |       expect(result).to eq 'Yeah, very surreal...! also' | ||||||
|     end |     end | ||||||
| 
 | 
 | ||||||
|     it 'strips URLs from strings before detection' do |     it 'strips URLs from strings before detection' do | ||||||
|       string = 'Our website is https://example.com and also http://localhost.dev' |       string = 'Our website is https://example.com and also http://localhost.dev' | ||||||
| 
 | 
 | ||||||
|       result = described_class.new(string).prepared_text |       result = described_class.instance.send(:prepare_text, string) | ||||||
|       expect(result).to eq 'Our website is and also' |       expect(result).to eq 'Our website is and also' | ||||||
|     end |     end | ||||||
| 
 | 
 | ||||||
|     it 'strips #hashtags from strings before detection' do |     it 'strips #hashtags from strings before detection' do | ||||||
|       string = 'Hey look at all the #animals and #fish' |       string = 'Hey look at all the #animals and #fish' | ||||||
| 
 | 
 | ||||||
|       result = described_class.new(string).prepared_text |       result = described_class.instance.send(:prepare_text, string) | ||||||
|       expect(result).to eq 'Hey look at all the and' |       expect(result).to eq 'Hey look at all the and' | ||||||
|     end |     end | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   describe 'to_iso_s' do |   describe 'detect' do | ||||||
|  |     let(:account_without_user_locale) { Fabricate(:user, locale: nil).account } | ||||||
|  | 
 | ||||||
|     it 'detects english language for basic strings' do |     it 'detects english language for basic strings' do | ||||||
|       strings = [ |       strings = [ | ||||||
|         "Hello and welcome to mastodon how are you today?", |         "Hello and welcome to mastodon how are you today?", | ||||||
|  | @ -48,7 +50,7 @@ describe LanguageDetector do | ||||||
|         "a lot of people just want to feel righteous all the time and that's all that matters", |         "a lot of people just want to feel righteous all the time and that's all that matters", | ||||||
|       ] |       ] | ||||||
|       strings.each do |string| |       strings.each do |string| | ||||||
|         result = described_class.new(string).to_iso_s |         result = described_class.instance.detect(string, account_without_user_locale) | ||||||
| 
 | 
 | ||||||
|         expect(result).to eq(:en), string |         expect(result).to eq(:en), string | ||||||
|       end |       end | ||||||
|  | @ -56,14 +58,14 @@ describe LanguageDetector do | ||||||
| 
 | 
 | ||||||
|     it 'detects spanish language' do |     it 'detects spanish language' do | ||||||
|       string = 'Obtener un Hola y bienvenidos a Mastodon' |       string = 'Obtener un Hola y bienvenidos a Mastodon' | ||||||
|       result = described_class.new(string).to_iso_s |       result = described_class.instance.detect(string, account_without_user_locale) | ||||||
| 
 | 
 | ||||||
|       expect(result).to eq :es |       expect(result).to eq :es | ||||||
|     end |     end | ||||||
| 
 | 
 | ||||||
|     describe 'when language can\'t be detected' do |     describe 'when language can\'t be detected' do | ||||||
|       it 'uses nil when sent an empty document' do |       it 'uses nil when sent an empty document' do | ||||||
|         result = described_class.new('').to_iso_s |         result = described_class.instance.detect('', account_without_user_locale) | ||||||
|         expect(result).to eq nil |         expect(result).to eq nil | ||||||
|       end |       end | ||||||
| 
 | 
 | ||||||
|  | @ -73,7 +75,7 @@ describe LanguageDetector do | ||||||
|           cld_result = CLD3::NNetLanguageIdentifier.new(0, 2048).find_language(string) |           cld_result = CLD3::NNetLanguageIdentifier.new(0, 2048).find_language(string) | ||||||
|           expect(cld_result).not_to eq :en |           expect(cld_result).not_to eq :en | ||||||
| 
 | 
 | ||||||
|           result = described_class.new(string).to_iso_s |           result = described_class.instance.detect(string, account_without_user_locale) | ||||||
| 
 | 
 | ||||||
|           expect(result).to eq nil |           expect(result).to eq nil | ||||||
|         end |         end | ||||||
|  | @ -82,14 +84,13 @@ describe LanguageDetector do | ||||||
|       describe 'with an account' do |       describe 'with an account' do | ||||||
|         it 'uses the account locale when present' do |         it 'uses the account locale when present' do | ||||||
|           account = double(user_locale: 'fr') |           account = double(user_locale: 'fr') | ||||||
|           result  = described_class.new('', account).to_iso_s |           result  = described_class.instance.detect('', account) | ||||||
| 
 | 
 | ||||||
|           expect(result).to eq :fr |           expect(result).to eq :fr | ||||||
|         end |         end | ||||||
| 
 | 
 | ||||||
|         it 'uses nil when account is present but has no locale' do |         it 'uses nil when account is present but has no locale' do | ||||||
|           account = double(user_locale: nil) |           result  = described_class.instance.detect('', account_without_user_locale) | ||||||
|           result  = described_class.new('', account).to_iso_s |  | ||||||
| 
 | 
 | ||||||
|           expect(result).to eq nil |           expect(result).to eq nil | ||||||
|         end |         end | ||||||
|  | @ -97,8 +98,7 @@ describe LanguageDetector do | ||||||
| 
 | 
 | ||||||
|       describe 'with an `en` default locale' do |       describe 'with an `en` default locale' do | ||||||
|         it 'uses nil for undetectable string' do |         it 'uses nil for undetectable string' do | ||||||
|           string = '' |           result = described_class.instance.detect('', account_without_user_locale) | ||||||
|           result = described_class.new(string).to_iso_s |  | ||||||
| 
 | 
 | ||||||
|           expect(result).to eq nil |           expect(result).to eq nil | ||||||
|         end |         end | ||||||
|  | @ -114,7 +114,7 @@ describe LanguageDetector do | ||||||
| 
 | 
 | ||||||
|         it 'uses nil for undetectable string' do |         it 'uses nil for undetectable string' do | ||||||
|           string = '' |           string = '' | ||||||
|           result = described_class.new(string).to_iso_s |           result = described_class.instance.detect(string, account_without_user_locale) | ||||||
| 
 | 
 | ||||||
|           expect(result).to eq nil |           expect(result).to eq nil | ||||||
|         end |         end | ||||||
|  |  | ||||||
|  | @ -65,15 +65,12 @@ RSpec.describe PostStatusService do | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   it 'creates a status with a language set' do |   it 'creates a status with a language set' do | ||||||
|     detector = double(to_iso_s: :en) |  | ||||||
|     allow(LanguageDetector).to receive(:new).and_return(detector) |  | ||||||
| 
 |  | ||||||
|     account = Fabricate(:account) |     account = Fabricate(:account) | ||||||
|     text = 'test status text' |     text = 'This is an English text.' | ||||||
| 
 | 
 | ||||||
|     subject.call(account, text) |     status = subject.call(account, text) | ||||||
| 
 | 
 | ||||||
|     expect(LanguageDetector).to have_received(:new).with(text, account) |     expect(status.language).to eq 'en' | ||||||
|   end |   end | ||||||
| 
 | 
 | ||||||
|   it 'processes mentions' do |   it 'processes mentions' do | ||||||
|  |  | ||||||
		Loading…
	
	Add table
		
		Reference in a new issue