U++ forum: Welcome to the forum

// BOM-aware load/save API. One declaration per line so that the trailing
// comment on LoadBOM() no longer hides the declarations that follow it.
// NOTE(review): the definitions later in this text take a non-const Stream&
// and SaveBOMUtf8() returns bool there; confirm which signatures are intended.

// WString variants
WString LoadBOMW(const Stream& s);
WString LoadFileBOMW(const char *path);
void SaveBOMUtf8(const Stream& s, const WString& data);
bool SaveFileBOMUtf8(const char *path, const WString& data);

// String variants
String LoadBOM(const Stream& s);	// Default encoding, usually utf-8
String LoadFileBOM(const char *path);
void SaveBOMUtf8(const Stream& s, const String& data);
bool SaveFileBOMUtf8(const char *path, const String& data);

// Loads the file at `path` and returns its text, honouring a leading byte order mark:
//   FF FE     UTF-16 little endian; the payload is converted to UTF-8
//   EF BB BF  UTF-8; the mark is stripped
// With no recognised mark the result of LoadFile() is returned unchanged.
String LoadFileBOM(const char *path)
{
	String s = LoadFile(path);
	const int len = s.GetCount();
	if (len >= 2 && ((s[0]&0xFF) == 0xFF) && ((s[1]&0xFF) == 0xFE)) {	// UTF16 Little Endian
		// Build the 16-bit units from byte pairs (low byte first). Calling
		// ToWString() on the raw bytes does not decode UTF-16; it treats them
		// as 8-bit text. A trailing unpaired byte is ignored.
		WString units;
		for (int i = 2; i + 1 < len; i += 2)
			units.Cat((s[i]&0xFF) | ((s[i+1]&0xFF) << 8));
		s = ToUtf8(units);
	}
	else if (len >= 3 && ((s[0]&0xFF) == 0xEF) && ((s[1]&0xFF) == 0xBB) && ((s[2]&0xFF) == 0xBF))	// UTF8
		s = s.Mid(3);
	return s;
}

String s = LoadFileBOM("demo_u_16le.txt"); String ss; for (int i = 0; i < s.GetCount(); ++i) ss.Cat(Format("%d: %0x;\n", i, s[i]&0xFF)); ss.Cat(s); TestLineEdit.SetData(ss); TestEditString.SetData(ss); TestDocEdit.SetData(ss);

String LoadFileBOM(const char *path) { String s = LoadFile(path); if (((s[0]&0xFF) == 0xFF) && ((s[1]&0xFF) == 0xFE)) { // UTF16 Little Endian StringBuffer ws = s.Mid(2); s = ToUtf8((wchar *)ws.Begin(), ws.GetCount()*sizeof(char)/sizeof(wchar)); } else if (((s[0]&0xFF) == 0xEF) && ((s[1]&0xFF) == 0xBB) && ((s[2]&0xFF) == 0xBF)) // UTF8 s = s.Mid(3); else // May be ISO8859-1 s = ToUtf8(ToUnicode(s, CHARSET_ISO8859_1)); return s; } bool SaveBOMUtf8(Stream& out, const String& data) { if(!out.IsOpen() || out.IsError()) return false; unsigned char bom[] = {0xEF, 0xBB, 0xBF}; out.Put(bom, 3); out.Put((const char *)data, data.GetLength()); out.Close(); return out.IsOK(); } bool SaveFileBOMUtf8(const char *path, const String& data) { FileOut out(path); return SaveBOMUtf8(out, data); }

// Converts `bytes` bytes of UTF-16 text at `p` to UTF-8.
// Each 16-bit unit is assembled from a byte pair in the requested order, so the
// result does not depend on the host byte order, on sizeof(wchar) or on the
// alignment of `p`. A trailing unpaired byte is ignored.
static String sUtf16BytesToUtf8(const char *p, int bytes, bool bigEndian)
{
	WString units;
	for (int i = 0; i + 1 < bytes; i += 2) {
		int first = (unsigned char)p[i];
		int second = (unsigned char)p[i + 1];
		units.Cat(bigEndian ? ((first << 8) | second) : ((second << 8) | first));
	}
	return ToUtf8(units);
}

// Reads everything left in `in` and returns it as UTF-8, choosing the source
// encoding from a leading byte order mark:
//   FF FE     UTF-16 little endian
//   FE FF     UTF-16 big endian
//   EF BB BF  UTF-8 (mark stripped, no conversion)
//   none      treated as ISO8859-1 and converted
// Returns String::GetVoid() when the stream is not open, its remaining size is
// negative, or the data cannot be read completely. A stream with nothing left
// yields an empty (non-void) String.
String LoadStreamBOM(Stream& in)
{
	if (!in.IsOpen())
		return String::GetVoid();
	in.ClearError();
	int size = (int)in.GetLeft();
	if (size < 0)											// Also covers the former 0xffffffff check
		return String::GetVoid();
	if (size == 0)
		return String();

	// Read the whole remainder first; streams shorter than a 3 byte header are
	// then handled like any other instead of being reported as a failure.
	StringBuffer raw(size);
	if (!in.GetAll(raw.Begin(), size))
		return String::GetVoid();

	const unsigned char *head = (const unsigned char *)raw.Begin();
	if (size >= 2 && head[0] == 0xFF && head[1] == 0xFE)		// UTF16 Little Endian
		return sUtf16BytesToUtf8(raw.Begin() + 2, size - 2, false);
	if (size >= 2 && head[0] == 0xFE && head[1] == 0xFF)		// UTF16 Big Endian
		return sUtf16BytesToUtf8(raw.Begin() + 2, size - 2, true);
	if (size >= 3 && head[0] == 0xEF && head[1] == 0xBB && head[2] == 0xBF)
		return String(raw.Begin() + 3, size - 3);			// UTF8. No conversion required
	return ToUtf8(ToUnicode(raw.Begin(), size, CHARSET_ISO8859_1));	// Maybe ISO8859-1
}
// Creates a FileIn for `filename` and returns what LoadStreamBOM() produces for it.
String LoadFileBOM(const char *filename)
{
	FileIn source(filename);
	return LoadStreamBOM(source);
}
// Writes the three-byte UTF-8 byte order mark followed by the bytes of `data`
// to `out`, then closes `out`.
// Returns false without writing when `out` is not open or is already in error;
// otherwise returns out.IsOK() as seen after the close.
bool SaveBOMUtf8(Stream& out, const String& data)
{
	const bool writable = out.IsOpen() && !out.IsError();
	if(writable) {
		unsigned char utf8Mark[] = {0xEF, 0xBB, 0xBF};
		out.Put(utf8Mark, 3);
		out.Put((const char *)data, data.GetLength());
		out.Close();
		return out.IsOK();
	}
	return false;
}
bool SaveFileBOMUtf8(const char *path, const String& data)
{
	FileOut out(path);
	return SaveBOMUtf8(out, data);
}