<?php
function documentNotUTF8($content)
{
$exprs = array(
'#<\?xml[^>]+encoding=([\'"])[Uu][Tt][Ff]-8\1#U',
'#<meta\s+(?:(?:http-equiv\s*=\s*([\'"])content-type\1\s*)|(?:content\s*=\s*([\'"])text/html\s*;.*charset\s*=\s*utf-?8.*\2\s*)){2}#Ui',
'#<meta\s+charset\s*=\s*([\'"])utf-?8\1#Ui',
);
foreach ($exprs as $expr) {
if ( $match = preg_match($expr, $content) ) {
break;
}
}
return (bool) $match;
}
$content = array(
<<<HTML
<?xml version="1.0" encoding="utf-8"?>
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<META HTTP-EQUIV="Content-Type" CONTENT="text/html; charset=UTF8">
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<?xml version="1.0" encoding="utf-8" bar="baz"?>
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<META CONTENT="text/html; charset=UTF-8" HTTP-EQUIV="Content-Type">
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<META HTTP-EQUIV="Content-Type" CONTENT="text/html; charset=UTF-8">
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<META HTTP-EQUIV="Content-Type" CONTENT="text/html; stuff=things, charset=UTF-8, otherparam=foo">
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<META charset="UTF-8">
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<META charset="UTF8">
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
,
<<<HTML
<HTML>
<HEAD>
<TITLE>PHP Manual</TITLE>
<LINK REL="STYLESHEET" HREF="style.css">
</HEAD>
HTML
);
foreach ($content as $str) {
var_dump(documentNotUTF8($str));
}
- Output for 4.3.0 - 4.3.11, 4.4.0 - 4.4.9, 5.0.0 - 5.0.5, 5.1.0 - 5.1.6, 5.2.0 - 5.2.17, 5.3.0 - 5.3.29, 5.4.0 - 5.4.45, 5.5.24 - 5.5.35, 5.6.8 - 5.6.28, 7.0.0 - 7.0.20, 7.1.0 - 7.1.33, 7.2.0 - 7.2.33, 7.3.0 - 7.3.33, 7.4.0 - 7.4.33, 8.0.0 - 8.0.30, 8.1.0 - 8.1.28, 8.2.0 - 8.2.18, 8.3.0 - 8.3.6
- bool(true)
bool(true)
bool(true)
bool(true)
bool(true)
bool(true)
bool(true)
bool(true)
bool(false)
preferences:
239.97 ms | 405 KiB | 357 Q