iOS 获取文件字符编码

      NSString *fileString=nil;
      if (fileString==nil||[fileString length]==0) {
        NSArray *codeArray=@[
            /*  kCFStringEncodingMacRoman = 0L, defined in CoreFoundation/CFString.h */
            @(kCFStringEncodingMacJapanese),
            @(kCFStringEncodingMacChineseTrad),
            @(kCFStringEncodingMacKorean),
            @(kCFStringEncodingMacArabic),
            @(kCFStringEncodingMacHebrew),
            @(kCFStringEncodingMacGreek),
            @(kCFStringEncodingMacCyrillic),
            @(kCFStringEncodingMacDevanagari),
            @(kCFStringEncodingMacGurmukhi),
            @(kCFStringEncodingMacGujarati),
           @(kCFStringEncodingMacOriya),
            @(kCFStringEncodingMacBengali),
            @(kCFStringEncodingMacTamil),
            @(kCFStringEncodingMacTelugu),
            @(kCFStringEncodingMacKannada),
            @(kCFStringEncodingMacMalayalam),
            @(kCFStringEncodingMacSinhalese),
            @(kCFStringEncodingMacBurmese),
            @(kCFStringEncodingMacKhmer),
            @(kCFStringEncodingMacThai ),
            @(kCFStringEncodingMacLaotian),
            @(kCFStringEncodingMacGeorgian),
            @(kCFStringEncodingMacArmenian),
            @(kCFStringEncodingMacChineseSimp),
            @(kCFStringEncodingMacTibetan ),
            @(kCFStringEncodingMacMongolian ),
            @(kCFStringEncodingMacEthiopic ) ,
            @(kCFStringEncodingMacCentralEurRoman),
            @(kCFStringEncodingMacVietnamese),
            @(kCFStringEncodingMacExtArabic ),
            /* The following use script code 0, smRoman */
            @(kCFStringEncodingMacSymbol ),
            @(kCFStringEncodingMacDingbats),
            @(kCFStringEncodingMacTurkish),
            @(kCFStringEncodingMacCroatian),
            @(kCFStringEncodingMacIcelandic),
            @(kCFStringEncodingMacRomanian),
            @(kCFStringEncodingMacCeltic),
            @(kCFStringEncodingMacGaelic),
            /* The following use script code 4, smArabic */
            @(kCFStringEncodingMacFarsi), /* Like MacArabic but uses Farsi digits */
            /* The following use script code 7, smCyrillic */
            @(kCFStringEncodingMacUkrainian),
            /* The following use script code 32, smUnimplemented */
            @(kCFStringEncodingMacInuit),
            @(kCFStringEncodingMacVT100), /* VT100/102 font from Comm Toolbox: Latin-1 repertoire + box drawing etc */
            /* Special Mac OS encodings*/
            @(kCFStringEncodingMacHFS), /* Meta-value, should never appear in a table */
            
            /* Unicode & ISO UCS encodings begin at 0x100 */
            /* We don't use Unicode variations defined in TextEncoding; use the ones in CFString.h, instead. */
            
            /* ISO 8-bit and 7-bit encodings begin at 0x200 */
            /*  kCFStringEncodingISOLatin1)0x0201, defined in CoreFoundation/CFString.h */
            @(kCFStringEncodingISOLatin2), /* ISO 8859-2 */
            @(kCFStringEncodingISOLatin3), /* ISO 8859-3 */
            @(kCFStringEncodingISOLatin4), /* ISO 8859-4 */
            @(kCFStringEncodingISOLatinCyrillic), /* ISO 8859-5 */
            @(kCFStringEncodingISOLatinArabic), /* ISO 8859-6, =ASMO 708, =DOS CP 708 */
            @(kCFStringEncodingISOLatinGreek), /* ISO 8859-7 */
            @(kCFStringEncodingISOLatinHebrew), /* ISO 8859-8 */
            @(kCFStringEncodingISOLatin5), /* ISO 8859-9 */
            @(kCFStringEncodingISOLatin6), /* ISO 8859-10 */
            @(kCFStringEncodingISOLatinThai), /* ISO 8859-11 */
            @(kCFStringEncodingISOLatin7), /* ISO 8859-13 */
            @(kCFStringEncodingISOLatin8), /* ISO 8859-14 */
            @(kCFStringEncodingISOLatin9), /* ISO 8859-15 */
            @(kCFStringEncodingISOLatin10), /* ISO 8859-16 */
            
            /* MS-DOS & Windows encodings begin at 0x400 */
            @(kCFStringEncodingDOSLatinUS), /* code page 437 */
            @(kCFStringEncodingDOSGreek),  /* code page 737 (formerly code page 437G) */
            @(kCFStringEncodingDOSBalticRim), /* code page 775 */
            @(kCFStringEncodingDOSLatin1), /* code page 850, "Multilingual" */
            @(kCFStringEncodingDOSGreek1), /* code page 851 */
            @(kCFStringEncodingDOSLatin2), /* code page 852, Slavic */
            @(kCFStringEncodingDOSCyrillic), /* code page 855, IBM Cyrillic */
            @(kCFStringEncodingDOSTurkish), /* code page 857, IBM Turkish */
            @(kCFStringEncodingDOSPortuguese), /* code page 860 */
            @(kCFStringEncodingDOSIcelandic), /* code page 861 */
            @(kCFStringEncodingDOSHebrew), /* code page 862 */
            @(kCFStringEncodingDOSCanadianFrench), /* code page 863 */
            @(kCFStringEncodingDOSArabic), /* code page 864 */
            @(kCFStringEncodingDOSNordic), /* code page 865 */
            @(kCFStringEncodingDOSRussian), /* code page 866 */
            @(kCFStringEncodingDOSGreek2), /* code page 869, IBM Modern Greek */
            @(kCFStringEncodingDOSThai),  /* code page 874, also for Windows */
            @(kCFStringEncodingDOSJapanese), /* code page 932, also for Windows */
            @(kCFStringEncodingDOSChineseSimplif), /* code page 936, also for Windows */
            @(kCFStringEncodingDOSKorean), /* code page 949, also for Windows; Unified Hangul Code */
            @(kCFStringEncodingDOSChineseTrad), /* code page 950, also for Windows */
            /*  kCFStringEncodingWindowsLatin1)0x0500, defined in CoreFoundation/CFString.h */
            @(kCFStringEncodingWindowsLatin2), /* code page 1250, Central Europe */
            @(kCFStringEncodingWindowsCyrillic), /* code page 1251, Slavic Cyrillic */
            @(kCFStringEncodingWindowsGreek), /* code page 1253 */
            @(kCFStringEncodingWindowsLatin5), /* code page 1254, Turkish */
            @(kCFStringEncodingWindowsHebrew), /* code page 1255 */
            @(kCFStringEncodingWindowsArabic), /* code page 1256 */
            @(kCFStringEncodingWindowsBalticRim), /* code page 1257 */
            @(kCFStringEncodingWindowsVietnamese), /* code page 1258 */
            @(kCFStringEncodingWindowsKoreanJohab), /* code page 1361, for Windows NT */
            
            /* Various national standards begin at 0x600 */
            /*  kCFStringEncodingASCII)0x0600, defined in CoreFoundation/CFString.h */
            @(kCFStringEncodingANSEL), /* ANSEL (ANSI Z39.47) */
            @(kCFStringEncodingJIS_X0201_76),
            @(kCFStringEncodingJIS_X0208_83),
            @(kCFStringEncodingJIS_X0208_90),
            @(kCFStringEncodingJIS_X0212_90),
            @(kCFStringEncodingJIS_C6226_78),
            @(kCFStringEncodingShiftJIS_X0213), /* Shift-JIS format encoding of JIS X0213 planes 1 and 2*/
            @(kCFStringEncodingShiftJIS_X0213_MenKuTen), /* JIS X0213 in plane-row-column notation */
            @(kCFStringEncodingGB_2312_80),
            @(kCFStringEncodingGBK_95),  /* annex to GB 13000-93; for Windows 95 */
            @(kCFStringEncodingGB_18030_2000),
            @(kCFStringEncodingKSC_5601_87), /* same as KSC 5601-92 without Johab annex */
            @(kCFStringEncodingKSC_5601_92_Johab), /* KSC 5601-92 Johab annex */
            @(kCFStringEncodingCNS_11643_92_P1), /* CNS 11643-1992 plane 1 */
            @(kCFStringEncodingCNS_11643_92_P2), /* CNS 11643-1992 plane 2 */
            @(kCFStringEncodingCNS_11643_92_P3), /* CNS 11643-1992 plane 3 (was plane 14 in 1986 version) */
            
            /* ISO 2022 collections begin at 0x800 */
            @(kCFStringEncodingISO_2022_JP),
            @(kCFStringEncodingISO_2022_JP_2),
            @(kCFStringEncodingISO_2022_JP_1), /* RFC 2237*/
            @(kCFStringEncodingISO_2022_JP_3), /* JIS X0213*/
            @(kCFStringEncodingISO_2022_CN),
            @(kCFStringEncodingISO_2022_CN_EXT),
            @(kCFStringEncodingISO_2022_KR),
            
            /* EUC collections begin at 0x900 */
            @(kCFStringEncodingEUC_JP),  /* ISO 646, 1-byte katakana, JIS 208, JIS 212 */
            @(kCFStringEncodingEUC_CN),  /* ISO 646, GB 2312-80 */
            @(kCFStringEncodingEUC_TW),  /* ISO 646, CNS 11643-1992 Planes 1-16 */
            @(kCFStringEncodingEUC_KR),  /* ISO 646, KS C 5601-1987 */
            
            /* Misc standards begin at 0xA00 */
            @(kCFStringEncodingShiftJIS),  /* plain Shift-JIS */
            @(kCFStringEncodingKOI8_R),  /* Russian internet standard */
            @(kCFStringEncodingBig5),  /* Big-5 (has variants) */
            @(kCFStringEncodingMacRomanLatin1), /* Mac OS Roman permuted to align with ISO Latin-1 */
            @(kCFStringEncodingHZ_GB_2312), /* HZ (RFC 1842, for Chinese mail & news) */
            @(kCFStringEncodingBig5_HKSCS_1999), /* Big-5 with Hong Kong special char set supplement*/
            @(kCFStringEncodingVISCII), /* RFC 1456, Vietnamese */
            @(kCFStringEncodingKOI8_U), /* RFC 2319, Ukrainian */
            @(kCFStringEncodingBig5_E), /* Taiwan Big-5E standard */
            
            /* Other platform encodings*/
            /*  kCFStringEncodingNextStepLatin)0x0B01, defined in CoreFoundation/CFString.h */
            @(kCFStringEncodingNextStepJapanese), /* NextStep Japanese encoding */
            
            /* EBCDIC & IBM host encodings begin at 0xC00 */
            @(kCFStringEncodingEBCDIC_US), /* basic EBCDIC-US */
            @(kCFStringEncodingEBCDIC_CP037), /* code page 037, extended EBCDIC (Latin-1 set) for US,Canada... */
            
            @(kCFStringEncodingUTF7), /* kTextEncodingUnicodeDefault + kUnicodeUTF7Format RFC2152 */
            @(kCFStringEncodingUTF7_IMAP), /* UTF-7 (IMAP folder variant) RFC3501 */
            
            /* Deprecated constants */
            @(kCFStringEncodingShiftJIS_X0213_00) /* Shift-JIS format encoding of JIS X0213 planes 1 and 2 (DEPRECATED) */
            ];
        
        for (NSNumber *number in codeArray) {
            unsigned int encodingCode = [number unsignedIntValue];
            NSStringEncoding enc = CFStringConvertEncodingToNSStringEncoding(encodingCode);
            
            NSError *error = nil;
            fileString = [NSString stringWithContentsOfFile:path encoding:enc  error:&error];
            NSLog(@"Error:%@", [error localizedDescription]);
            NSLog(@"%@", fileString);
            NSLog(@"NSStringEncoding=%@",fileString);
        }

    }
    
    
    
    if (fileString==nil||[fileString length]==0) {
        
        NSArray *arrEncoding = @[@(NSASCIIStringEncoding),
                                 @(NSNEXTSTEPStringEncoding),
                                 @(NSJapaneseEUCStringEncoding),
                                 @(NSUTF8StringEncoding),
                                 @(NSISOLatin1StringEncoding),
                                 @(NSSymbolStringEncoding),
                                 @(NSNonLossyASCIIStringEncoding),
                                 @(NSShiftJISStringEncoding),
                                 @(NSISOLatin2StringEncoding),
                                 @(NSUnicodeStringEncoding),
                                 @(NSWindowsCP1251StringEncoding),
                                 @(NSWindowsCP1252StringEncoding),
                                 @(NSWindowsCP1253StringEncoding),
                                 @(NSWindowsCP1254StringEncoding),
                                 @(NSWindowsCP1250StringEncoding),
                                 @(NSISO2022JPStringEncoding),
                                 @(NSMacOSRomanStringEncoding),
                                 @(NSUTF16StringEncoding),
                                 @(NSUTF16BigEndianStringEncoding),
                                 @(NSUTF16LittleEndianStringEncoding),
                                 @(NSUTF32StringEncoding),
                                 @(NSUTF32BigEndianStringEncoding),
                                 @(NSUTF32LittleEndianStringEncoding)
                                 ];
        
        NSArray *arrEncodingName = @[@"NSASCIIStringEncoding",
                                     @"NSNEXTSTEPStringEncoding",
                                     @"NSJapaneseEUCStringEncoding",
                                     @"NSUTF8StringEncoding",
                                     @"NSISOLatin1StringEncoding",
                                     @"NSSymbolStringEncoding",
                                     @"NSNonLossyASCIIStringEncoding",
                                     @"NSShiftJISStringEncoding",
                                     @"NSISOLatin2StringEncoding",
                                     @"NSUnicodeStringEncoding",
                                     @"NSWindowsCP1251StringEncoding",
                                     @"NSWindowsCP1252StringEncoding",
                                     @"NSWindowsCP1253StringEncoding",
                                     @"NSWindowsCP1254StringEncoding",
                                     @"NSWindowsCP1250StringEncoding",
                                     @"NSISO2022JPStringEncoding",
                                     @"NSMacOSRomanStringEncoding",
                                     @"NSUTF16StringEncoding",
                                     @"NSUTF16BigEndianStringEncoding",
                                     @"NSUTF16LittleEndianStringEncoding",
                                     @"NSUTF32StringEncoding",
                                     @"NSUTF32BigEndianStringEncoding",
                                     @"NSUTF32LittleEndianStringEncoding"
                                     ];
        
        for (int i = 0 ; i < [arrEncoding count]; i++) {
            unsigned long encodingCode = [arrEncoding[i] unsignedLongValue];
            NSLog(@"(%@)", arrEncodingName[i]);
            NSError *error = nil;
            fileString = [NSString stringWithContentsOfFile:path encoding:encodingCode  error:&error];
            NSLog(@"Error:%@", [error localizedDescription]);
            NSLog(@"%@", fileString);
        }
    }
最后编辑于
©著作权归作者所有,转载或内容合作请联系作者
  • 序言:七十年代末,一起剥皮案震惊了整个滨河市,随后出现的几起案子,更是在滨河造成了极大的恐慌,老刑警刘岩,带你破解...
    沈念sama阅读 213,558评论 6 492
  • 序言:滨河连续发生了三起死亡事件,死亡现场离奇诡异,居然都是意外死亡,警方通过查阅死者的电脑和手机,发现死者居然都...
    沈念sama阅读 91,002评论 3 387
  • 文/潘晓璐 我一进店门,熙熙楼的掌柜王于贵愁眉苦脸地迎上来,“玉大人,你说我怎么就摊上这事。” “怎么了?”我有些...
    开封第一讲书人阅读 159,036评论 0 349
  • 文/不坏的土叔 我叫张陵,是天一观的道长。 经常有香客问我,道长,这世上最难降的妖魔是什么? 我笑而不...
    开封第一讲书人阅读 57,024评论 1 285
  • 正文 为了忘掉前任,我火速办了婚礼,结果婚礼上,老公的妹妹穿的比我还像新娘。我一直安慰自己,他们只是感情好,可当我...
    茶点故事阅读 66,144评论 6 385
  • 文/花漫 我一把揭开白布。 她就那样静静地躺着,像睡着了一般。 火红的嫁衣衬着肌肤如雪。 梳的纹丝不乱的头发上,一...
    开封第一讲书人阅读 50,255评论 1 292
  • 那天,我揣着相机与录音,去河边找鬼。 笑死,一个胖子当着我的面吹牛,可吹牛的内容都是我干的。 我是一名探鬼主播,决...
    沈念sama阅读 39,295评论 3 412
  • 文/苍兰香墨 我猛地睁开眼,长吁一口气:“原来是场噩梦啊……” “哼!你这毒妇竟也来了?” 一声冷哼从身侧响起,我...
    开封第一讲书人阅读 38,068评论 0 268
  • 序言:老挝万荣一对情侣失踪,失踪者是张志新(化名)和其女友刘颖,没想到半个月后,有当地人在树林里发现了一具尸体,经...
    沈念sama阅读 44,478评论 1 305
  • 正文 独居荒郊野岭守林人离奇死亡,尸身上长有42处带血的脓包…… 初始之章·张勋 以下内容为张勋视角 年9月15日...
    茶点故事阅读 36,789评论 2 327
  • 正文 我和宋清朗相恋三年,在试婚纱的时候发现自己被绿了。 大学时的朋友给我发了我未婚夫和他白月光在一起吃饭的照片。...
    茶点故事阅读 38,965评论 1 341
  • 序言:一个原本活蹦乱跳的男人离奇死亡,死状恐怖,灵堂内的尸体忽然破棺而出,到底是诈尸还是另有隐情,我是刑警宁泽,带...
    沈念sama阅读 34,649评论 4 336
  • 正文 年R本政府宣布,位于F岛的核电站,受9级特大地震影响,放射性物质发生泄漏。R本人自食恶果不足惜,却给世界环境...
    茶点故事阅读 40,267评论 3 318
  • 文/蒙蒙 一、第九天 我趴在偏房一处隐蔽的房顶上张望。 院中可真热闹,春花似锦、人声如沸。这庄子的主人今日做“春日...
    开封第一讲书人阅读 30,982评论 0 21
  • 文/苍兰香墨 我抬头看了看天上的太阳。三九已至,却和暖如春,着一层夹袄步出监牢的瞬间,已是汗流浃背。 一阵脚步声响...
    开封第一讲书人阅读 32,223评论 1 267
  • 我被黑心中介骗来泰国打工, 没想到刚下飞机就差点儿被人妖公主榨干…… 1. 我叫王不留,地道东北人。 一个月前我还...
    沈念sama阅读 46,800评论 2 365
  • 正文 我出身青楼,却偏偏与公主长得像,于是被迫代替她去往敌国和亲。 传闻我的和亲对象是个残疾皇子,可洞房花烛夜当晚...
    茶点故事阅读 43,847评论 2 351

推荐阅读更多精彩内容