######################## BEGIN LICENSE BLOCK ######################## # The Original Code is Mozilla Universal charset detector code. # # The Initial Developer of the Original Code is # Netscape Communications Corporation. # Portions created by the Initial Developer are Copyright (C) 2001 # the Initial Developer. All Rights Reserved. # # Contributor(s): # Mark Pilgrim - port to Python # Shy Shalom - original C code # Proofpoint, Inc. # # This library is free software; you can redistribute it and/or # modify it under the terms of the GNU Lesser General Public # License as published by the Free Software Foundation; either # version 2.1 of the License, or (at your option) any later version. # # This library is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU # Lesser General Public License for more details. # # You should have received a copy of the GNU Lesser General Public # License along with this library; if not, write to the Free Software # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA # 02110-1301 USA ######################### END LICENSE BLOCK ######################### from .charsetgroupprober import CharSetGroupProber from .utf8prober import UTF8Prober from .sjisprober import SJISProber from .eucjpprober import EUCJPProber from .gb2312prober import GB2312Prober from .euckrprober import EUCKRProber from .cp949prober import CP949Prober from .big5prober import Big5Prober from .euctwprober import EUCTWProber class MBCSGroupProber(CharSetGroupProber): # 初始化MBCSGroupProber类,继承自CharSetGroupProber类 def __init__(self, lang_filter=None): # 调用父类CharSetGroupProber的初始化方法 super(MBCSGroupProber, self).__init__(lang_filter=lang_filter) # 定义一个包含多种字符集探测器的列表 self.probers = [ UTF8Prober(), # UTF-8字符集探测器 SJISProber(), # Shift_JIS字符集探测器 EUCJPProber(), # EUC-JP字符集探测器 GB2312Prober(), # GB2312字符集探测器 EUCKRProber(), # EUCKR字符集探测器 CP949Prober(), # CP949字符集探测器 Big5Prober(), # Big5字符集探测器 EUCTWProber() # EUCTW字符集探测器 ] # 重置探测器 self.reset()