- preg_replace: documentation (source)
<?php
// Sample XHTML page used as the input document. A nowdoc (quoted EOT marker) keeps
// the markup strictly literal, so a "$" added to the fixture later can never be
// interpreted as a PHP variable. Note the XML declaration embedded inside the
// <span>: it is what the clean-up step below removes.
$html = <<<'EOT'
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<title>KvK NL - Uittreksel inzien</title>
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
<link rel="stylesheet" type="text/css" href="../css/style.css"/>
<link rel="stylesheet" type="text/css" href="../css/uittreksel.css"/>
<link rel="stylesheet" type="text/css" href="../css/printUittreksel.css" media="print"/>
<script type="text/javascript" src="../resources/nl.kvk.hp.web.pages.InzienPage/google-analytics.js"></script>
</head>
<body class="hrfixed">
<div>
</div>
<div id="uittrekselWrapper">
<span><?xml version="1.0" encoding="UTF-8"?>
<div id="uittreksel"></div></span>
</div>
<div id="footer">
</div>
</body>
</html>
EOT;

// Remove every XML declaration found in the markup and prepend exactly one at the
// very start (presumably so libxml picks up the UTF-8 encoding from it).
// preg_replace() returns null when the regex engine fails; concatenating that null
// would silently reduce the document to the bare declaration, so fail loudly instead.
$withoutDeclarations = preg_replace('/(<\?xml[^!\?>]+\?>)/msi', '', $html);
if ($withoutDeclarations === null) {
    throw new Exception('Document could not be generated, no html found');
}
$html = '<?xml version="1.0" encoding="UTF-8"?>' . $withoutDeclarations;

// DOMDocument::loadHTML() reports failure by returning false and raising libxml
// warnings; it does not throw DOMException, so a try/catch around it never fires.
// Collect libxml errors internally while parsing, check the return value, and put
// the previous libxml error mode back so code running after this is unaffected.
$xml = new DOMDocument('1.0', 'UTF-8');
$previousLibxmlMode = libxml_use_internal_errors(true);
$loaded = $xml->loadHTML($html);
libxml_clear_errors();
libxml_use_internal_errors($previousLibxmlMode);
if ($loaded === false) {
    throw new Exception('Document could not be generated, no html found');
}

// get the part of the document we need
$xpath = new DOMXPath($xml);