| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  | # frozen_string_literal: true | 
					
						
							| 
									
										
										
										
											2011-04-16 06:43:49 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-11-26 14:07:17 +00:00
										 |  |  | # Redmine - project management software | 
					
						
							| 
									
										
										
										
											2024-02-26 22:55:54 +00:00
										 |  |  | # Copyright (C) 2006-  Jean-Philippe Lang | 
					
						
							| 
									
										
										
										
											2023-11-26 14:07:17 +00:00
										 |  |  | # | 
					
						
							|  |  |  | # This program is free software; you can redistribute it and/or | 
					
						
							|  |  |  | # modify it under the terms of the GNU General Public License | 
					
						
							|  |  |  | # as published by the Free Software Foundation; either version 2 | 
					
						
							|  |  |  | # of the License, or (at your option) any later version. | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # This program is distributed in the hope that it will be useful, | 
					
						
							|  |  |  | # but WITHOUT ANY WARRANTY; without even the implied warranty of | 
					
						
							|  |  |  | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
					
						
							|  |  |  | # GNU General Public License for more details. | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # You should have received a copy of the GNU General Public License | 
					
						
							|  |  |  | # along with this program; if not, write to the Free Software | 
					
						
							|  |  |  | # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA. | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-04-16 06:43:49 +00:00
										 |  |  | module Redmine | 
					
						
							|  |  |  |   module CodesetUtil | 
					
						
							|  |  |  |     def self.replace_invalid_utf8(str) | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       return nil if str.nil? | 
					
						
							| 
									
										
										
										
											2020-09-17 15:48:58 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       str = str.dup | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |       str.force_encoding('UTF-8') | 
					
						
							| 
									
										
										
										
											2024-08-25 08:44:33 +00:00
										 |  |  |       unless str.valid_encoding? | 
					
						
							| 
									
										
										
										
											2017-01-28 06:24:51 +00:00
										 |  |  |         str = str.encode("UTF-16LE", :invalid => :replace, | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |               :undef => :replace, :replace => '?').encode("UTF-8") | 
					
						
							| 
									
										
										
										
											2011-04-16 06:43:49 +00:00
										 |  |  |       end | 
					
						
							|  |  |  |       str | 
					
						
							|  |  |  |     end | 
					
						
							| 
									
										
										
										
											2011-11-14 23:04:45 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def self.to_utf8(str, encoding) | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       return if str.nil? | 
					
						
							| 
									
										
										
										
											2020-09-17 15:48:58 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-03-20 01:36:44 +00:00
										 |  |  |       str = str.b | 
					
						
							| 
									
										
										
										
											2011-11-14 23:04:45 +00:00
										 |  |  |       if str.empty? | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |         str.force_encoding("UTF-8") | 
					
						
							| 
									
										
										
										
											2011-11-14 23:04:45 +00:00
										 |  |  |         return str | 
					
						
							|  |  |  |       end | 
					
						
							|  |  |  |       enc = encoding.blank? ? "UTF-8" : encoding | 
					
						
							| 
									
										
										
										
											2019-09-21 15:54:25 +00:00
										 |  |  |       if enc.casecmp("UTF-8") != 0
 | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |         str.force_encoding(enc) | 
					
						
							|  |  |  |         str = str.encode("UTF-8", :invalid => :replace, | 
					
						
							|  |  |  |               :undef => :replace, :replace => '?') | 
					
						
							| 
									
										
										
										
											2011-11-14 23:04:45 +00:00
										 |  |  |       else | 
					
						
							| 
									
										
										
										
											2017-01-28 05:43:33 +00:00
										 |  |  |         str = replace_invalid_utf8(str) | 
					
						
							| 
									
										
										
										
											2011-11-14 23:04:45 +00:00
										 |  |  |       end | 
					
						
							|  |  |  |       str | 
					
						
							|  |  |  |     end | 
					
						
							| 
									
										
										
										
											2011-11-16 05:07:16 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-11-17 11:53:15 +00:00
										 |  |  |     def self.to_utf8_by_setting(str) | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       return if str.nil? | 
					
						
							| 
									
										
										
										
											2020-09-17 15:48:58 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       str = str.dup | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |       self.to_utf8_by_setting_internal(str).force_encoding('UTF-8') | 
					
						
							| 
									
										
										
										
											2011-11-17 11:53:15 +00:00
										 |  |  |     end | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def self.to_utf8_by_setting_internal(str) | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       return if str.nil? | 
					
						
							| 
									
										
										
										
											2020-09-17 15:48:58 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-03-20 01:36:44 +00:00
										 |  |  |       str = str.b | 
					
						
							| 
									
										
										
										
											2011-11-17 11:53:15 +00:00
										 |  |  |       return str if str.empty? | 
					
						
							| 
									
										
										
										
											2019-03-27 02:15:24 +00:00
										 |  |  |       return str if /\A[\r\n\t\x20-\x7e]*\Z/n.match?(str) # for us-ascii | 
					
						
							| 
									
										
										
										
											2020-09-17 15:48:58 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |       str.force_encoding('UTF-8') | 
					
						
							| 
									
										
										
										
											2011-11-17 11:53:15 +00:00
										 |  |  |       encodings = Setting.repositories_encodings.split(',').collect(&:strip) | 
					
						
							|  |  |  |       encodings.each do |encoding| | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |         begin | 
					
						
							|  |  |  |           str.force_encoding(encoding) | 
					
						
							|  |  |  |           utf8 = str.encode('UTF-8') | 
					
						
							|  |  |  |           return utf8 if utf8.valid_encoding? | 
					
						
							|  |  |  |         rescue | 
					
						
							|  |  |  |           # do nothing here and try the next encoding | 
					
						
							| 
									
										
										
										
											2011-11-17 11:53:15 +00:00
										 |  |  |         end | 
					
						
							|  |  |  |       end | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |       self.replace_invalid_utf8(str).force_encoding('UTF-8') | 
					
						
							| 
									
										
										
										
											2011-11-17 11:53:15 +00:00
										 |  |  |     end | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-11-16 05:07:16 +00:00
										 |  |  |     def self.from_utf8(str, encoding) | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       return if str.nil? | 
					
						
							| 
									
										
										
										
											2020-09-17 15:48:58 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-03-16 02:20:00 +00:00
										 |  |  |       str = str.dup | 
					
						
							| 
									
										
										
										
											2011-11-16 05:07:16 +00:00
										 |  |  |       str ||= '' | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |       str.force_encoding('UTF-8') | 
					
						
							| 
									
										
										
										
											2019-09-21 15:54:25 +00:00
										 |  |  |       if encoding.casecmp('UTF-8') != 0
 | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |         str = str.encode(encoding, :invalid => :replace, | 
					
						
							|  |  |  |                          :undef => :replace, :replace => '?') | 
					
						
							| 
									
										
										
										
											2011-11-16 05:07:16 +00:00
										 |  |  |       else | 
					
						
							| 
									
										
										
										
											2014-10-22 17:37:16 +00:00
										 |  |  |         str = self.replace_invalid_utf8(str) | 
					
						
							| 
									
										
										
										
											2011-11-16 05:07:16 +00:00
										 |  |  |       end | 
					
						
							|  |  |  |     end | 
					
						
							| 
									
										
										
										
											2022-01-07 01:29:55 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def self.guess_encoding(str) | 
					
						
							|  |  |  |       return if str.nil? | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |       str = str.dup | 
					
						
							|  |  |  |       encodings = Setting.repositories_encodings.split(',').collect(&:strip) | 
					
						
							|  |  |  |       encodings = encodings.presence || ['UTF-8'] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |       encodings.each do |encoding| | 
					
						
							|  |  |  |         begin | 
					
						
							|  |  |  |           str.force_encoding(encoding) | 
					
						
							|  |  |  |         rescue Encoding::ConverterNotFoundError | 
					
						
							|  |  |  |           # ignore if the encoding name is invalid | 
					
						
							|  |  |  |         end | 
					
						
							|  |  |  |         return encoding if str.valid_encoding? | 
					
						
							|  |  |  |       end | 
					
						
							|  |  |  |       nil | 
					
						
							|  |  |  |     end | 
					
						
							| 
									
										
										
										
											2011-04-16 06:43:49 +00:00
										 |  |  |   end | 
					
						
							|  |  |  | end |