Skip to content

Commit 3d90678

Browse files
committed
Fix encoding detection when reading text file. Win32 API could mistakenly report UTF16 when the file is actually UTF8.
1 parent ba396cc commit 3d90678

File tree

1 file changed

+11
-13
lines changed

1 file changed

+11
-13
lines changed

source/core/text-io.cpp

+11-13
Original file line numberDiff line numberDiff line change
@@ -194,6 +194,14 @@ namespace Slang
194194
this->encoding = determinedEncoding;
195195
}
196196

197+
bool HasNullBytes(char * str, int len)
198+
{
199+
for (int i = 0; i < len; i++)
200+
if (str[len] == 0)
201+
return true;
202+
return false;
203+
}
204+
197205
Encoding * StreamReader::DetermineEncoding()
198206
{
199207
if (buffer.Count() >= 3 && (unsigned char)(buffer[0]) == 0xEF && (unsigned char)(buffer[1]) == 0xBB && (unsigned char)(buffer[2]) == 0xBF)
@@ -213,19 +221,9 @@ namespace Slang
213221
}
214222
else
215223
{
216-
#ifdef _WIN32
217-
int flag = IS_TEXT_UNICODE_SIGNATURE | IS_TEXT_UNICODE_REVERSE_SIGNATURE | IS_TEXT_UNICODE_STATISTICS | IS_TEXT_UNICODE_ASCII16;
218-
int rs = IsTextUnicode(buffer.Buffer(), (int) buffer.Count(), &flag);
219-
if (rs)
220-
{
221-
if (flag & (IS_TEXT_UNICODE_SIGNATURE | IS_TEXT_UNICODE_STATISTICS))
222-
return Encoding::UTF16;
223-
else if (flag & (IS_TEXT_UNICODE_SIGNATURE | IS_TEXT_UNICODE_STATISTICS))
224-
return Encoding::UTF16Reversed;
225-
else if (flag & IS_TEXT_UNICODE_ASCII16)
226-
return Encoding::UTF8;
227-
}
228-
#endif
224+
// find null bytes
225+
if (HasNullBytes(buffer.Buffer(), (int)buffer.Count()))
226+
return Encoding::UTF16;
229227
return Encoding::UTF8;
230228
}
231229
}

0 commit comments

Comments
 (0)