<?php
header('Content-Type: text/html; charset=UTF-8');

/**
 * Returns $text as UTF-8.
 *
 * Input that is not a valid UTF-8 byte sequence is assumed to be ISO-8859-1
 * (the same assumption utf8_encode() makes) and is converted.
 */
function ensureUtf8(string $text): string
{
    // mb_check_encoding() validates the bytes; mb_detect_encoding() only
    // guesses, and reports "ASCII" rather than "UTF-8" for plain 7-bit text.
    if (mb_check_encoding($text, 'UTF-8')) {
        return $text;
    }

    return mb_convert_encoding($text, 'UTF-8', 'ISO-8859-1');
}

/**
 * Removes every byte outside the 7-bit ASCII range (0x00-0x7F).
 */
function stripNonAscii(string $text): string
{
    // Hex escapes are used on purpose: inside a character class PCRE reads
    // "\128" as octal \12 (LF) followed by a literal "8", not as code 128.
    return preg_replace('/[^\x00-\x7F]+/', '', $text);
}

/**
 * Reduces $text to tag-free ASCII without control characters.
 *
 * Control bytes (< 0x20) and non-ASCII bytes (> 0x7F) are dropped first and
 * markup is stripped afterwards; quotes and ampersands are left untouched.
 * NOTE: strip_tags() keeps a "<" that is directly followed by whitespace.
 */
function sanitizeToPlainAscii(string $text): string
{
    $withoutControls = preg_replace('/[\x00-\x1F]+/', '', $text);

    return strip_tags(stripNonAscii($withoutControls));
}

$str = "<h1>He'llü & Wor'ldÆØÅÅÅ!</h1>" . "\tcafé\n";
$str = ensureUtf8($str);
var_dump($str);

// Decode entities exactly once; a second pass would also unescape text that
// was deliberately double-encoded (e.g. "&amp;lt;" would become "<").
$str = html_entity_decode($str, ENT_QUOTES | ENT_XML1, 'UTF-8');
var_dump($str);

$str = sanitizeToPlainAscii($str);
var_dump($str);

// Optional slug-style clean-ups, currently disabled:
#$newstr = preg_replace('/\s[\s]+/', ' ', $str); // Strip off multiple spaces
$newstr = stripNonAscii($str); // Strip off non-ASCII bytes
#$newstr = preg_replace('/[\s\W]+/', '-', $newstr); // Strip off spaces and non-alpha-numeric
#$newstr = preg_replace('/[^A-Za-z0-9_-]+/', '', $newstr);
var_dump($newstr);
// preferences:
// 55.44 ms | 402 KiB | 5 Q