mirror of
https://github.com/notepad-plus-plus/notepad-plus-plus.git
synced 2025-07-29 00:34:24 +02:00
Fix file content detection for xml/html/php/bash
Add the ability of take into account Unicode BOM for file content detection (xml/html/php/bash).
This commit is contained in:
parent
2cbc6a7a99
commit
2c80fc3018
@ -1261,8 +1261,19 @@ LangType FileManager::detectLanguageFromTextBegining(const unsigned char *data,
|
||||
std::string htmlHeader2 = "<html>"; // length : 6
|
||||
std::string htmlHeader1 = "<!DOCTYPE html>"; // length : 15
|
||||
|
||||
const size_t longestLength = htmlHeader1.length(); // longest length - html header Length
|
||||
const size_t longestLength = htmlHeader1.length(); // longest length : html header Length
|
||||
const size_t shortestLength = xmlHeader.length();
|
||||
|
||||
size_t i = 0;
|
||||
|
||||
if (dataLen <= shortestLength)
|
||||
return L_TEXT;
|
||||
|
||||
// Eliminate BOM if present
|
||||
if ((data[0] == 0xEF && data[1] == 0xBB && data[2] == 0xBF) || // UTF8 BOM
|
||||
(data[0] == 0xFE && data[1] == 0xFF && data[2] == 0x00) || // UTF16 BE BOM
|
||||
(data[0] == 0xFF && data[1] == 0xFE && data[2] == 0x00)) // UTF16 LE BOM
|
||||
i += 3;
|
||||
|
||||
for (; i < dataLen; ++i)
|
||||
{
|
||||
|
Loading…
x
Reference in New Issue
Block a user