Guess Text File Encoding : UTF8 UTF16 « File Stream « C# / C Sharp

Home
C# / C Sharp
1.2D Graphics
2.Class Interface
3.Collections Data Structure
4.Components
5.Data Types
6.Database ADO.net
7.Date Time
8.Design Patterns
9.Development Class
10.Event
11.File Stream
12.Generics
13.GUI Windows Form
14.Internationalization I18N
15.Language Basics
16.LINQ
17.Network
18.Office
19.Reflection
20.Regular Expressions
21.Security
22.Services Event
23.Thread
24.Web Services
25.Windows
26.Windows Presentation Foundation
27.XML
28.XML LINQ
C# Book
C# / C Sharp by API
C# / CSharp Tutorial
C# / CSharp Open Source
C# / C Sharp » File Stream » UTF8 UTF16Screenshots 
Guess Text File Encoding
     
//----------------------------------------------------------------------------------------
// Copyright (C) 2008  ???? ?????
//
// ?????      
// ? ? ??      TxtFileEncoding.cs
// ???????   ???????????????(Encoding)
//
// ?????      ???    2008-3-22 13:01:03
//
// ?????
// ?????
// 
// ?????
// ?????
//----------------------------------------------------------------------------------------

using System;
using System.Text;
using System.IO;
namespace MaoCaiJun.DataBase.Sys.Common
{
    /// <summary>
    /// ???????????????(Encoding)?
    /// </summary>
     class TxtFileEncoding
    {
        //public TxtFileEncoding()
        //{
        //    //
        //    // TODO: ???????????
        //    //
        //}
        /// <summary>
        /// ????????????????????????????????Encoding.Default?????
        /// </summary>
        /// <param name="fileName">????</param>
        /// <returns></returns>
        public static Encoding GetEncoding(string fileName)
        {
            return GetEncoding(fileName, Encoding.Default);
        }
        /// <summary>
        /// ???????????????
        /// </summary>
        /// <param name="stream">??????</param>
        /// <returns></returns>
        public static Encoding GetEncoding(FileStream stream)
        {
            return GetEncoding(stream, Encoding.Default);
        }
        /// <summary>
        /// ??????????????
        /// </summary>
        /// <param name="fileName">????</param>
        /// <param name="defaultEncoding">??????????????????????????????????????</param>
        /// <returns></returns>
        public static Encoding GetEncoding(string fileName, Encoding defaultEncoding)
        {
            FileStream fs = new FileStream(fileName, FileMode.Open);
            Encoding targetEncoding = GetEncoding(fs, defaultEncoding);
            fs.Close();
            return targetEncoding;
        }
        /// <summary>
        /// ???????????????
        /// </summary>
        /// <param name="stream">??????</param>
        /// <param name="defaultEncoding">??????????????????????????????????????</param>
        /// <returns></returns>
        public static Encoding GetEncoding(FileStream stream, Encoding defaultEncoding)
        {
            Encoding targetEncoding = defaultEncoding;
            if (stream != null && stream.Length >= 2)
            {
                //???????4???
                byte byte1 = 0;
                byte byte2 = 0;
                byte byte3 = 0;
                byte byte4 = 0;
                //????Seek??
                long origPos = stream.Seek(0, SeekOrigin.Begin);
                stream.Seek(0, SeekOrigin.Begin);

                int nByte = stream.ReadByte();
                byte1 = Convert.ToByte(nByte);
                byte2 = Convert.ToByte(stream.ReadByte());
                if (stream.Length >= 3)
                {
                    byte3 = Convert.ToByte(stream.ReadByte());
                }
                if (stream.Length >= 4)
                {
                    byte4 = Convert.ToByte(stream.ReadByte());
                }
                //???????4?????Encoding
                //Unicode {0xFF, 0xFE};
                //BE-Unicode {0xFE, 0xFF};
                //UTF8 = {0xEF, 0xBB, 0xBF};
                if (byte1 == 0xFE && byte2 == 0xFF)//UnicodeBe
                {
                    targetEncoding = Encoding.BigEndianUnicode;
                }
                if (byte1 == 0xFF && byte2 == 0xFE && byte3 != 0xFF)//Unicode
                {
                    targetEncoding = Encoding.Unicode;
                }
                if (byte1 == 0xEF && byte2 == 0xBB && byte3 == 0xBF)//UTF8
                {
                    targetEncoding = Encoding.UTF8;
                }
                //??Seek??       
                stream.Seek(origPos, SeekOrigin.Begin);
            }
            return targetEncoding;
        }
    }
}

   
    
    
    
    
  
Related examples in the same category
1.Convert UTF-8 and ASCII encoded bytes back to UTF-16 encoded stringConvert UTF-8 and ASCII encoded bytes back to UTF-16 encoded string
2.UTF8 decoder
3.String to ASCII
4.Byte Endian
java2s.com  |  | Contact Us | Privacy Policy
Copyright 2009 - 12 Demo Source and Support. All rights reserved.
All other trademarks are property of their respective owners.