@ -0,0 +1,135 @@
Plugin Name: Visitors contributions
Plugin URI:
Description: A WordPress plugin that gives your visitors the possibility to develop your website content by submitting new versions of your articles.
Version: 1.07
Author: Leavy
Author URI:
class visitors_edits{
/**
 * Hooks the plugin into WordPress.
 *
 * Registers the activation routine, the admin menu and admin head/init
 * callbacks, the front-end content filter, the custom query var and
 * request handler, and the two TinyMCE filters.
 */
public function __construct()
{
    register_activation_hook(__FILE__, [$this, 'install']);

    // Hooks are attached in the same order as they were originally declared.
    add_action('admin_menu', [$this, 'admin_pages']);
    add_filter('the_content', [$this, 'contentFilter']);
    add_filter('query_vars', [$this, 'query_vars']);
    add_action('init', [$this, 'init']);
    add_action('parse_request', [$this, 'parse_request']);
    add_filter('mce_buttons', [$this, 'tinymce_btns']);
    add_filter('mce_external_plugins', [$this, 'tinymce_scripts']);
    add_action('admin_head', [$this, 'admin_head']);
    add_action('admin_init', [$this, 'admin_init']);
}
/**
 * Registers the plugin's admin screens: the pending-reviews list, the
 * hidden "review a contribution" page and the settings page.
 *
 * The screens were previously registered with the `read` capability,
 * which every logged-in user (including subscribers) has. The review
 * screens can delete contributions and report "The post was updated",
 * so they now require `edit_others_posts`; the settings screen requires
 * `manage_options`.
 */
public function admin_pages()
{
    $review_capability = 'edit_others_posts';
    $settings_capability = 'manage_options';

    add_menu_page(
        'Visitors Contributions | Pending reviews',
        'Visitors contributions',
        $review_capability,
        'visitors_edits_main',
        array($this, 'main'),
        plugins_url("img/contribute.png", __FILE__),
        87
    );

    // Null parent: the page is reachable by URL but not listed in the menu.
    add_submenu_page(
        null,
        "Visitors Contributions | Review",
        "Review a contribution",
        $review_capability,
        'visitors_edits_approve',
        array($this, 'approve')
    );

    add_submenu_page(
        "visitors_edits_main",
        "Visitors Contributions | Settings",
        "Settings",
        $settings_capability,
        'visitors_edits_settings',
        array($this, 'settings')
    );
}
/**
 * Prints the plugin stylesheet in the admin <head>, but only on the
 * plugin's own screens (identified by the `page` query argument).
 */
public function admin_head()
{
    $plugin_pages = array('visitors_edits_approve', 'visitors_edits_main', 'visitors_edits_settings');

    // Strict comparison keeps the original `===` semantics.
    if (!isset($_GET["page"]) || !in_array($_GET["page"], $plugin_pages, true)) {
        return;
    }
    ?>
<link rel="stylesheet" type="text/css" href="<?php echo esc_url(plugins_url('/css/app.css', __FILE__)); ?>">
    <?php
}
/**
 * `admin_init` callback: registers the plugin's TinyMCE stylesheet as an
 * editor style.
 */
public function admin_init()
{
    $editor_stylesheet = plugins_url('./css/tinymce.css', __FILE__);
    add_editor_style($editor_stylesheet);
}
/**
 * Renders the pending-reviews admin page.
 *
 * The template is resolved from the plugin directory rather than through
 * PHP's include_path, so an unrelated `inc/main.php` can never be picked up.
 */
public function main()
{
    require plugin_dir_path(__FILE__) . 'inc/main.php';
}
/**
 * Renders the "review a contribution" admin page.
 *
 * The template is resolved from the plugin directory rather than through
 * PHP's include_path.
 */
public function approve()
{
    require plugin_dir_path(__FILE__) . 'inc/approve.php';
}
/**
 * Renders the plugin settings admin page.
 *
 * The template is resolved from the plugin directory rather than through
 * PHP's include_path.
 */
public function settings()
{
    require plugin_dir_path(__FILE__) . 'inc/settings.php';
}
/**
 * `the_content` filter: appends the "propose an edit" link to single views.
 *
 * The link markup comes from the `propose_edit_link` plugin option; its
 * `#post_link#` placeholder is replaced by `<site url>/<post slug>/suggestions`.
 *
 * @param string $content Post content being filtered.
 * @return string The content, with the link appended on single views.
 */
public function contentFilter($content)
{
    if (!is_single()) {
        return $content;
    }

    $post = get_post();
    if (!$post) {
        // Nothing to link to; leave the content untouched.
        return $content;
    }

    // get_option()'s default only applies when the option does not exist at
    // all, so merge the default in to cover a saved option missing this key.
    $defaults = [
        "propose_edit_link" => "<p><a href='#post_link#'>Propose an edit</a></p>"
    ];
    $options = wp_parse_args(get_option("visitors_edits_options", []), $defaults);

    $suggestions_url = get_site_url() . '/' . $post->post_name . '/suggestions';
    $link_markup = str_replace("#post_link#", $suggestions_url, stripcslashes($options["propose_edit_link"]));

    return $content . $link_markup;
}
/**
 * Activation hook: creates (or upgrades) the `{prefix}visitors_edits`
 * table that stores pending visitor contributions.
 */
public function install()
{
    //Database Settings
    global $wpdb;

    $charset_collate = $wpdb->get_charset_collate();
    $table_name = $wpdb->prefix . 'visitors_edits';

    // dbDelta() parses this statement itself and is strict about its shape:
    // one column per line, and keys must be either named or written as
    // "PRIMARY KEY" followed by two spaces. The previous unnamed
    // "UNIQUE KEY (edit_id)" did not follow that format.
    $sql = "CREATE TABLE $table_name (
        edit_id bigint(20) NOT NULL AUTO_INCREMENT,
        edit_time datetime DEFAULT '0000-00-00 00:00:00' NOT NULL,
        visitor_name text DEFAULT '',
        visitor_email text DEFAULT '',
        visitor_comment longtext DEFAULT '',
        edit_content longtext DEFAULT '',
        post_id bigint(20),
        post_content longtext DEFAULT '',
        PRIMARY KEY  (edit_id)
    ) $charset_collate;";

    require_once(ABSPATH . 'wp-admin/includes/upgrade.php');
    dbDelta($sql);
}
/**
 * `query_vars` filter: whitelists the plugin's custom query variable.
 *
 * @param array $query_vars Query variable names known to WordPress.
 * @return array The same list with `visitors_edits_post_name` appended.
 */
public function query_vars($query_vars)
{
    $query_vars[] = 'visitors_edits_post_name';

    return $query_vars;
}
// Callback attached to the `init` action by the constructor.
public function init(){
/**
 * `parse_request` action callback.
 *
 * When the parsed request carries the `visitors_edits_post_name` query
 * var, the plugin's own inc/editor.php script is included.
 *
 * @param object $request Request object exposing a `query_vars` array.
 * @return object The request object that was passed in.
 */
public function parse_request($request){
if( isset( $request->query_vars['visitors_edits_post_name'] ) ):
include( plugin_dir_path(__FILE__) . "/inc/editor.php" );
return $request;
/**
 * `mce_buttons` filter callback.
 *
 * Checks whether the current admin page is the review screen
 * (`page=visitors_edits_approve`) and returns the button list.
 *
 * @param array $buttons TinyMCE button identifiers.
 * @return array The button list.
 */
public function tinymce_btns($buttons){
if(isset($_GET["page"]) && $_GET["page"]==="visitors_edits_approve"){
return $buttons;
/**
 * `mce_external_plugins` filter: registers the plugin's TinyMCE script
 * (js/approve.js) under the `visitors_edits` key.
 *
 * @param array $plugin_array Map of TinyMCE plugin name => script URL.
 * @return array The map including the `visitors_edits` entry.
 */
public function tinymce_scripts($plugin_array)
{
    $script_url = plugins_url('js/approve.js', __FILE__);
    $plugin_array['visitors_edits'] = $script_url;

    return $plugin_array;
}
/**
 * Builds the public URL of one of the plugin's bundled scripts.
 *
 * @param string $script Script name without the `js/` directory or `.js` extension.
 * @return string URL of `js/<script>.js` inside the plugin directory.
 */
public static function scriptUrl($script)
{
    $relative_path = 'js/' . $script . '.js';

    return plugins_url($relative_path, __FILE__);
}
new visitors_edits();
use Caxy\HtmlDiff\HtmlDiff;
use PHPHtmlParser\Dom;
/**
 * Computes an HTML diff between two versions of a document.
 *
 * @param string $oldHtml Original markup.
 * @param string $newHtml Modified markup.
 * @return mixed Whatever HtmlDiff::build() returns for the two inputs.
 */
function visitors_editsDIFF($oldHtml, $newHtml)
{
    // Load the bundled Composer autoloader once, from this file's own
    // directory, instead of resolving a relative path on every call.
    require_once __DIR__ . "/vendor/autoload.php";

    $htmlDiff = new HtmlDiff($oldHtml, $newHtml);

    return $htmlDiff->build();
}
/**
 * Creates a new HTML parser instance.
 *
 * @return Dom A fresh parser object.
 */
function visitors_editsDOM()
{
    // The Dom class is provided by Composer; make sure its autoloader is
    // registered even when this is the first helper to be called.
    require_once __DIR__ . "/vendor/autoload.php";

    return new Dom;
}

@ -0,0 +1,178 @@
@import url(",400,700");
/* line 3, ../sass/app.scss */
.visitors_edits_no_data {
text-align: center;
font-weight: bold;
font-size: 50px;
margin-top: 250px;
opacity: 0.3;
text-transform: uppercase;
display: none;
/* line 12, ../sass/app.scss */
.visitors_edits_pending {
padding: 15px;
/* line 14, ../sass/app.scss */
.visitors_edits_pending h1 {
font-weight: 100;
font-size: 20px;
/* line 22, ../sass/app.scss */
.visitors_flashMessage {
margin: 15px;
background: #fff;
padding: 10px 15px;
border-left: 6px solid #089D08;
color: #089D08;
font-size: 14px;
font-weight: 100;
/* line 30, ../sass/app.scss */
.visitors_flashMessage.danger {
color: #F6214E;
border-color: #F6214E;
/* line 36, ../sass/app.scss */
.visitors_edits_review_editor {
padding: 15px;
/* line 38, ../sass/app.scss */
.visitors_edits_review_editor h1 {
font-weight: 100;
font-size: 25px;
display: inline-block;
margin-right: 15px;
margin-bottom: 10px;
/* line 45, ../sass/app.scss */
.visitors_edits_review_editor .delete_edit {
  transition-duration: 0.3s;
  color: #F6214E;
  /* A preceding `text-decoration: none` was dropped: this declaration overrode it. */
  text-decoration: underline;
  font-style: italic;
  /* Was `font-style: 12px`, which is invalid and was ignored by browsers. */
  font-size: 12px;
  opacity: 0.6;
}
/* line 53, ../sass/app.scss */
.visitors_edits_review_editor .delete_edit:hover {
opacity: 1;
/* line 57, ../sass/app.scss */
.visitors_edits_review_editor .edit_info, .visitors_edits_review_editor .edit_notify {
padding-left: 15px;
font-style: italic;
opacity: 0.8;
font-size: 14px;
/* line 62, ../sass/app.scss */
.visitors_edits_review_editor .edit_info .mail, .visitors_edits_review_editor .edit_notify .mail {
opacity: 0.6;
font-size: 12px;
/* line 67, ../sass/app.scss */
.visitors_edits_review_editor .edit_notify {
margin: 10px 0;
padding: 0;
/* line 70, ../sass/app.scss */
.visitors_edits_review_editor .edit_notify label {
display: block;
margin-bottom: 10px;
/* line 74, ../sass/app.scss */
.visitors_edits_review_editor .edit_notify #edit_notify_message {
font-family: "Roboto",sans-serif;
max-height: 100px;
min-height: 100px;
max-width: 100%;
min-width: 100%;
line-height: normal;
border: none;
border-bottom: 1px solid #DFDFDF;
font-size: 18px;
padding: 10px;
display: none;
/* line 85, ../sass/app.scss */
.visitors_edits_review_editor .edit_notify #edit_notify_message:focus {
outline: none;
border-bottom-width: 2px;
border-color: rgba(3, 133, 244, 0.7);
/* line 93, ../sass/app.scss */
.visitors_edits_review_editor .controls {
margin-top: 20px;
/* line 96, ../sass/app.scss */
.visitors_edits_review_editor .comment {
font-size: 14px;
margin: 0;
padding: 10px;
background: #fff;
border: 1px solid #999;
font-style: normal;
opacity: 1;
color: #000;
/* line 107, ../sass/app.scss */
.visitors_edits_admin {
font-family: "Roboto",sans-serif;
width: 70%;
margin: 50px auto;
background: #fff;
border: 1px solid #E2E2E2;
padding: 20px;
/* line 114, ../sass/app.scss */
.visitors_edits_admin h2 {
font-size: 25px;
font-weight: 100;
/* line 120, ../sass/app.scss */
.visitors_edits_admin .control label {
display: block;
font-weight: bold;
margin: 15px 0 0;
opacity: 0.9;
font-size: 13px;
/* line 127, ../sass/app.scss */
.visitors_edits_admin .control input[type="text"], .visitors_edits_admin .control .notif_message {
background: #F3F3F3;
outline: none;
padding: 0 10px;
height: 40px;
line-height: normal;
border: none;
border-bottom: 1px solid #DFDFDF;
width: 100%;
/* line 136, ../sass/app.scss */
.visitors_edits_admin .control input[type="text"]:focus, .visitors_edits_admin .control .notif_message:focus {
outline: none;
border-bottom-width: 2px;
border-color: rgba(3, 133, 244, 0.7);
/* line 142, ../sass/app.scss */
.visitors_edits_admin .control .notif_message {
min-height: 120px;
max-height: 120px;
padding: 10px;
min-width: 100%;
max-width: 100%;
line-height: normal;
/* line 150, ../sass/app.scss */
.visitors_edits_admin .control input[type="checkbox"] {
margin-right: 10px;
/* line 153, ../sass/app.scss */
.visitors_edits_admin .control .save_btn {
margin-top: 20px;

@ -0,0 +1,156 @@
@import url(",400,700");
/* line 7, ../sass/editor.scss */
body {
font-family: "Roboto",sans-serif;
font-size: 18px;
color: #545454;
padding: 0;
margin: 0;
/* line 14, ../sass/editor.scss */
a {
text-decoration: none;
color: inherit;
/* line 18, ../sass/editor.scss */
* {
transition-duration: 0.3s;
-moz-box-sizing: border-box;
-webkit-box-sizing: border-box;
box-sizing: border-box;
/* line 22, ../sass/editor.scss */
.header {
padding: 20px 60px;
background: #0385F4;
/* line 25, ../sass/editor.scss */
.header .header-title {
font-size: 50px;
font-weight: 100;
color: #fff;
opacity: 0.5;
/* line 31, ../sass/editor.scss */
.header .header-content {
font-weight: 100;
color: #fff;
text-align: right;
font-size: 14px;
opacity: 0.7;
/* line 37, ../sass/editor.scss */
.header .header-content:hover {
opacity: 0.9;
/* line 42, ../sass/editor.scss */
.editor_form {
padding: 20px 40px;
overflow: hidden;
width: 100%;
/* line 46, ../sass/editor.scss */
.editor_form .editor_field {
background: #f5f5f5;
padding: 15px;
/* line 50, ../sass/editor.scss */
.editor_form .submit_fields {
padding: 0 20px;
/* line 55, ../sass/editor.scss */
label {
display: block;
margin: 30px 0 10px;
/* line 59, ../sass/editor.scss */
.text_field, .area_field {
height: 40px;
line-height: 40px;
border: none;
border-bottom: 1px solid #DFDFDF;
width: 100%;
font-size: 18px;
/* line 66, ../sass/editor.scss */
.text_field:focus, .area_field:focus {
outline: none;
border-bottom-width: 2px;
border-color: rgba(3, 133, 244, 0.7);
/* line 72, ../sass/editor.scss */
.area_field {
font-family: "Roboto",sans-serif;
max-height: 100px;
min-height: 100px;
max-width: 100%;
min-width: 100%;
line-height: normal;
/* line 80, ../sass/editor.scss */
.submit_fields_error {
line-height: 20px;
font-style: italic;
font-size: 12px;
opacity: 0.8;
color: #e74c3c;
/* line 87, ../sass/editor.scss */
.btn {
height: 40px;
color: #fff;
line-height: 40px;
padding: 0 20px;
text-transform: uppercase;
background: #0385F4;
border: 1px solid #0385F4;
cursor: pointer;
margin: 20px 0;
/* line 97, ../sass/editor.scss */
.btn:hover {
color: #0385F4;
background: #fff;
/* line 102, ../sass/editor.scss */
.cb {
clear: both;
/* line 105, ../sass/editor.scss */
.grey {
background: #f5f5f5;
/* line 108, ../sass/editor.scss */
.submit_success {
margin-top: 200px;
background: #0385F4;
padding: 30px;
color: #fff;
/* line 113, ../sass/editor.scss */
.submit_success .alert_title {
font-size: 40px;
opacity: 0.4;
/* line 117, ../sass/editor.scss */
.submit_success .alert_content {
font-weight: 100;
/* line 120, ../sass/editor.scss */
.submit_success .alert_footer {
opacity: 0.7;
font-size: 12px;
font-style: italic;

@ -0,0 +1,230 @@
/* line 2, style.scss */
* {
-webkit-box-sizing: border-box;
-moz-box-sizing: border-box;
box-sizing: border-box;
/* line 3, style.scss */
body {
margin: 0;
padding: 0;
font-family: sans-serif;
/* line 6, _grid.scss */
.col-1, .col-m-1, .col-l-1, .col-2, .col-m-2, .col-l-2, .col-3, .col-m-3, .col-l-3, .col-4, .col-m-4, .col-l-4, .col-5, .col-m-5, .col-l-5, .col-6, .col-m-6, .col-l-6, .col-7, .col-m-7, .col-l-7, .col-8, .col-m-8, .col-l-8, .col-9, .col-m-9, .col-l-9, .col-10, .col-m-10, .col-l-10, .col-11, .col-m-11, .col-l-11, .col-12, .col-m-12, .col-l-12 {
float: right;
position: relative;
min-height: 1px;
padding: 0 10px;
/*border: 1px solid rgba(255, 0, 0, 0.5);*/
/* line 16, _grid.scss */
.col-1 {
width: 8.33333%;
/* line 16, _grid.scss */
.col-2 {
width: 16.66667%;
/* line 16, _grid.scss */
.col-3 {
width: 25%;
/* line 16, _grid.scss */
.col-4 {
width: 33.33333%;
/* line 16, _grid.scss */
.col-5 {
width: 41.66667%;
/* line 16, _grid.scss */
.col-6 {
width: 50%;
/* line 16, _grid.scss */
.col-7 {
width: 58.33333%;
/* line 16, _grid.scss */
.col-8 {
width: 66.66667%;
/* line 16, _grid.scss */
.col-9 {
width: 75%;
/* line 16, _grid.scss */
.col-10 {
width: 83.33333%;
/* line 16, _grid.scss */
.col-11 {
width: 91.66667%;
/* line 16, _grid.scss */
.col-12 {
width: 100%;
/* line 23, _grid.scss */
.row {
margin: 0 -10px;
overflow: hidden;
*zoom: 1;
/* line 27, _grid.scss */
.col-center {
margin: 0 auto;
float: none;
@media only screen and (min-width: 640px) {
/* line 30, _grid.scss */
.col-m-center {
margin: 0 auto;
float: none;
/* line 32, _grid.scss */
.col-m-1 {
width: 8.33333%;
/* line 32, _grid.scss */
.col-m-2 {
width: 16.66667%;
/* line 32, _grid.scss */
.col-m-3 {
width: 25%;
/* line 32, _grid.scss */
.col-m-4 {
width: 33.33333%;
/* line 32, _grid.scss */
.col-m-5 {
width: 41.66667%;
/* line 32, _grid.scss */
.col-m-6 {
width: 50%;
/* line 32, _grid.scss */
.col-m-7 {
width: 58.33333%;
/* line 32, _grid.scss */
.col-m-8 {
width: 66.66667%;
/* line 32, _grid.scss */
.col-m-9 {
width: 75%;
/* line 32, _grid.scss */
.col-m-10 {
width: 83.33333%;
/* line 32, _grid.scss */
.col-m-11 {
width: 91.66667%;
/* line 32, _grid.scss */
.col-m-12 {
width: 100%;
@media only screen and (min-width: 1024px) {
/* line 39, _grid.scss */
.col-l-center {
margin: 0 auto;
float: none;
/* line 41, _grid.scss */
.col-l-1 {
width: 8.33333%;
/* line 41, _grid.scss */
.col-l-2 {
width: 16.66667%;
/* line 41, _grid.scss */
.col-l-3 {
width: 25%;
/* line 41, _grid.scss */
.col-l-4 {
width: 33.33333%;
/* line 41, _grid.scss */
.col-l-5 {
width: 41.66667%;
/* line 41, _grid.scss */
.col-l-6 {
width: 50%;
/* line 41, _grid.scss */
.col-l-7 {
width: 58.33333%;
/* line 41, _grid.scss */
.col-l-8 {
width: 66.66667%;
/* line 41, _grid.scss */
.col-l-9 {
width: 75%;
/* line 41, _grid.scss */
.col-l-10 {
width: 83.33333%;
/* line 41, _grid.scss */
.col-l-11 {
width: 91.66667%;
/* line 41, _grid.scss */
.col-l-12 {
width: 100%;

@ -0,0 +1,10 @@
background: transparent !important;
color: inherit !important;
background:#4DB1FB !important;
background:#4DFB74 !important;

@ -0,0 +1,204 @@
global $wpdb;
$table_name = $wpdb->prefix . 'visitors_edits';
// The edit id comes straight from the query string. Force it to an integer
// and bind it through prepare() instead of concatenating it into the SQL.
$edit_id = isset($_GET["edit"]) ? absint($_GET["edit"]) : 0;
$edit = $wpdb->get_row($wpdb->prepare("SELECT * FROM {$table_name} WHERE edit_id = %d", $edit_id));
$options=get_option( "visitors_edits_options", [
//Fix nl
//$edit->post->post_content=str_replace(["\r\n", "\r", "\n"], "<br/>",$edit->post->post_content);
//$edit->post_content=str_replace(["\r\n", "\r", "\n"], "<br/>",$edit->post_content);
//$edit->edit_content=str_replace(["\r\n", "\r", "\n"], "<br/>",$edit->edit_content);
echo '<div style="display:none" id="visitors_edits_diff">'.$diff.'</div>';
noData("Select a visitor contribution");
<script type="text/javascript">
window.location="<?php echo menu_page_url('visitors_edits_main',false);?>";
/**
 * Renders the review screen for one pending contribution: contribution
 * details, the editor area and the approval form posted back to the
 * pending-reviews page.
 *
 * Visitor-supplied fields (name, e-mail, comment) and option values are
 * escaped for their output context, since they originate from the public
 * submission form.
 *
 * @param object $edit           Contribution row; reads edit_id, post_id,
 *                               visitor_name, visitor_email, visitor_comment
 *                               and $edit->post->ID.
 * @param string $editor_content Content for the editor (TODO confirm: its use
 *                               is not visible in this part of the file).
 */
function showEditor($edit,$editor_content=""){
$options=get_option( "visitors_edits_options", [
"edit_notify_message"=>"Thanks for your contribution to our blog, your contribution was reviewed and approved."
<div class="visitors_edits_review_editor">
<h1>Review a contribution</h1><a class="delete_edit" href="<?php echo menu_page_url('visitors_edits_main',false);?>&delete=<?php echo (int) $edit->edit_id;?>">Delete this contribution</a>
<ul class="edit_info">
<li><a target="_blank" href="<?php echo esc_url(get_permalink($edit->post->ID));?>">View original post</a></li>
<li>Author : <?php echo esc_html($edit->visitor_name); ?> <span class="mail"><?php echo esc_html($edit->visitor_email); ?></span></li>
<li>Submitted on :
echo date_format($creationDate,"m/d/Y")." at ".date_format($creationDate,"h:i a");
<li>Author comment :</li>
<p class="comment">
<?php echo esc_html(stripcslashes($edit->visitor_comment)); ?>
<div class="cb"></div>
<form action="<?php echo menu_page_url('visitors_edits_main',false);?>" method="POST" onsubmit="return editSubmit()">
<div class="editor">
"mode" => "textareas",
"theme" => "modern"
.diff_editor ins{
background: #44B3FD !important;
<div class="controls">
<input type="hidden" value="<?php echo esc_attr($edit->visitor_name); ?>" name="visitor_name">
<input type="hidden" value="<?php echo esc_attr($edit->visitor_email); ?>" name="visitor_email">
<input type="hidden" value="<?php echo (int) $edit->edit_id; ?>" name="edit_id">
<input type="hidden" value="<?php echo (int) $edit->post_id; ?>" name="ID">
<div class="edit_notify">
<label><input type="checkbox" name="notify_visitor" id="edit_notify_activate"> Notify the author.</label>
<textarea name="admin_message" id="edit_notify_message"><?php echo esc_textarea($options["edit_notify_message"]); ?></textarea>
<button class="button-primary" type="submit">Save changes</button>
<script src="<?php echo visitors_edits::scriptUrl('admin');?>"></script>
/**
 * Prints the large "no data" placeholder heading.
 *
 * @param string $msg Plain-text message to display; HTML-escaped on output.
 */
function noData($msg)
{
    ?>
<h1 class="visitors_edits_no_data" style="display:block">
<?php echo esc_html($msg); ?>
</h1>
    <?php
}
/**
 * Removes every `<tag ...>...</tag>` element, including its content.
 *
 * Matching is case-insensitive. The tag name must be followed by
 * whitespace, `/` or `>`, so asking for `b` no longer swallows `<br>` or
 * `<blockquote>`, and the element content may span several lines.
 *
 * @param string $tag     Tag name (inserted into the pattern as-is).
 * @param string $content Markup to clean.
 * @return string|null Cleaned markup, or null if the regex engine fails.
 */
function clearTag($tag, $content)
{
    // (?=[\s/>]) : the name must end here, not merely be a prefix.
    // s modifier : let "." cross newlines inside the element.
    $pattern = '#<' . $tag . '(?=[\s/>]).*?>.*?</' . $tag . '>#is';

    return preg_replace($pattern, '', $content);
}
/**
 * Adds `attr='1'` as the first attribute of every opening `<tag>`.
 *
 * Matching is case-insensitive. The tag name must be followed by
 * whitespace, `/` or `>`, so `p` no longer rewrites `<pre>` into
 * `<p attr='1're>`.
 *
 * @param string $tag     Tag name (inserted into the pattern as-is).
 * @param string $attr    Attribute name to add.
 * @param string $content Markup to process.
 * @return string|null Processed markup, or null if the regex engine fails.
 */
function addAttrTag($tag, $attr, $content)
{
    $pattern = '#<' . $tag . '(?=[\s/>])(.*?)>#i';
    // $1 re-emits the tag's existing attributes after the new one.
    $replacement = '<' . $tag . ' ' . $attr . "='1'" . '$1>';

    return preg_replace($pattern, $replacement, $content);
}
/**
 * Strips the opening and closing tags of the given name while keeping
 * the content between them.
 *
 * Matching is case-insensitive. The tag name must be followed by
 * whitespace, `/` or `>`, so `p` no longer strips `<pre>` tags as well.
 *
 * @param string $tag     Tag name (inserted into the pattern as-is).
 * @param string $content Markup to process.
 * @return string|null Processed markup, or null if the regex engine fails.
 */
function clearTagName($tag, $content)
{
    $pattern = '#</*' . $tag . '(?=[\s/>]).*?>#i';

    return preg_replace($pattern, '', $content);
}
/**
 * Rewrites `<origin ...>` / `</origin>` tags as bracket pseudo-tags
 * `[replace ...]` / `[/replace]`, keeping the attribute text.
 *
 * `$origin` is placed inside a regex group, so an alternation such as
 * `ins|del` is accepted. The name must be followed by whitespace, `/` or
 * `>`, so `p` no longer rewrites `<pre>`.
 *
 * @param string $origin  Tag name(s) to match (regex fragment).
 * @param string $replace Name to emit inside the brackets.
 * @param string $content Markup to process.
 * @return string|null Processed markup, or null if the regex engine fails.
 */
function replaceTag($origin, $replace, $content)
{
    $pattern = '#(<(/*)(' . $origin . ')(?=[\s/>])(.*?)>)#i';
    // ${2} / ${4} rather than $2 / $4, so a replacement name starting with a
    // digit cannot be read as part of the group number.
    $replacement = '[${2}' . $replace . '${4}]';

    return preg_replace($pattern, $replacement, $content);
}
/**
 * Encodes a diff: loads parser.php, walks the `ins` and `del` elements
 * found in the parsed markup and returns `$encoded`.
 *
 * NOTE(review): presumably swaps each ins/del element for a %INSn% / %DELn%
 * placeholder (see decodeDiff) — confirm against the full loop bodies.
 */
function encodeDiff($diff){
//composer require paquettg/php-html-parser
require_once "parser.php";
foreach($html->find('ins') as $ins){
foreach($html->find('del') as $del){
return $encoded;
/**
 * Cleans parsed markup: loads parser.php, visits every `br` element
 * nested inside `ul` and `ol` lists, and returns `$html`.
 *
 * NOTE(review): what happens to each `br` is not visible here — confirm.
 */
function cleanDiff($content){
require_once "parser.php";
foreach($html->find('ul') as $ul){
foreach($ul->find("br") as $br){
foreach($html->find('ol') as $ol){
foreach($ol->find("br") as $br){
return $html;
/**
 * Post-processes an encoded diff: iterates over all `ins` and `del`
 * elements, tests each one's inner text for a %INSn% / %DELn% placeholder,
 * and returns `$html`.
 */
function cleanEncodedDiff($content){
$diffs = $html->find('ins, del');
for ($i=0; $i < count($diffs); $i++) {
// True when the element's text contains an encoded placeholder.
$isSpecial=preg_match("#%(INS|DEL)\d*?%#", $diff->innertext);
if ($isSpecial){
//is important
return $html;
/**
 * Expands %INSn% and %DELn% placeholders back into their stored markup.
 *
 * @param string $content Text containing placeholders.
 * @param array  $codes   Map with "INS" and "DEL" entries, each an
 *                        id => replacement-markup array.
 * @return string The content with every known placeholder substituted.
 */
function decodeDiff($content, $codes)
{
    // INS placeholders are expanded first, then DEL, as before.
    foreach (["INS", "DEL"] as $kind) {
        foreach ($codes[$kind] as $id => $markup) {
            $placeholder = "%" . $kind . $id . "%";
            $content = str_replace($placeholder, $markup, $content);
        }
    }

    return $content;
}

@ -0,0 +1,152 @@
global $wpdb;
$table_name = $wpdb->prefix . 'visitors_edits';
$post = get_post($post_id);
//Check if changed
"edit_time"=>date('Y-m-d H:i:s'),
require "mail.php";
$options=get_option( "visitors_edits_options", [
"visitor_notif_message"=>"Your suggestion was submitted.",
"admin_notif_message"=>"A new suggestion was submitted."
$mail = [
"edit_time"=>date('H:i')." - ".date('d/m/y'),
"blog_title" => get_bloginfo("name"),
$visitor_submitionMail=new visitors_edits_EMAIL($mail,"visitor_submition");
$admin_submitionMail=new visitors_edits_EMAIL($mail,"admin_submition");
global $wp;
global $post;
$post = get_posts([
"name"=> $wp->query_vars['visitors_edits_post_name'],
'post_type' => 'post',
'post_status' => 'publish',
'numberposts' => 1
<!DOCTYPE html>
<html xmlns="" xml:lang="en" lang="en">
<meta http-equiv="Content-Type" content="text/html; charset=utf-8">
<link rel="stylesheet" type="text/css" href="<?php echo plugins_url( '/../css/grid.css',__FILE__ );?>">
<link rel="stylesheet" type="text/css" href="<?php echo plugins_url( '/../css/editor.css',__FILE__ );?>">
<script src="<?php echo visitors_edits::scriptUrl('jquery');?>"></script>
<title>Submit an edit</title>
<body <?php if(!empty($_POST)){echo 'class="grey"';} ?>>
confirmSubmit("Edit Submitted!","Thanks for your contribution you will be notified once the edit reviewed.");
/**
 * Renders the public "submit a contribution" form for the global $post:
 * header with a link back to the original post, the visitor's name /
 * e-mail / description fields and the editor area.
 *
 * The post title and URLs are escaped for their output context.
 */
function showForm(){
global $post;
<div class="header">
<div class="header-title">Submit a contribution</div>
<p class="header-content">
<a href="<?php echo esc_url(get_permalink($post->ID)) ?>">Original post : <?php echo esc_html($post->post_title); ?>.</a>
<form action="" method="POST" class="editor_form row" id="editor_form" onsubmit="return">
<div class="submit_fields col-12 col-l-4">
<ul class="submit_fields_error" id="submit_fields_error">
<label for="name">Name</label>
<input class="text_field" type="text" name="visitor_name" placeholder="Name" id="name">
<label for="email">Email</label>
<input class="text_field" type="email" name="visitor_email" placeholder="Email" id="email">
<label for="comment">Description</label>
<textarea class="area_field" type="text" name="visitor_comment" value=" " id="comment">
<input type="hidden" name="post_id" value="<?php echo (int) $post->ID;?>">
<input type="hidden" name="post_url" value="<?php echo esc_url(get_permalink($post->ID));?>">
<input type="submit" class="btn" value="Submit for review">
<div class="editor_field col-12 col-l-8">
"mode" => "textareas",
"theme" => "modern"
<div class="cb"></div>
<script src="<?php echo visitors_edits::scriptUrl('editor');?>"></script>
/**
 * Renders the confirmation panel shown after a contribution is submitted.
 *
 * The "continue" link target is read from the submitted `post_url` field,
 * which is attacker-controllable, so it is passed through esc_url() before
 * being printed; title and message are HTML-escaped.
 *
 * @param string $title   Panel heading (plain text).
 * @param string $message Panel body (plain text).
 */
function confirmSubmit($title,$message){
<div class="submit_success col-10 col-l-6 col-center">
<strong class="alert_title">
<?php echo esc_html($title);?>
<p class="alert_content">
<?php echo esc_html($message);?>
<p class="alert_footer">
<a href="<?php echo esc_url(isset($_POST['post_url']) ? wp_unslash($_POST['post_url']) : '')?>">Click here to continue back to the post</a>

@ -0,0 +1,48 @@
/**
 * An e-mail with a subject and a body, constructed from a set of values
 * and a template name, and delivered through wp_mail() as UTF-8 HTML.
 *
 * NOTE(review): presumably the constructor loads the named template and
 * substitutes #key# placeholders via inject() — confirm against the full
 * method bodies.
 */
class visitors_edits_EMAIL{
// Subject line of the message.
var $subject;
// HTML body of the message.
var $body;
public function __construct($cpts,$template){
public function send($destination){
$options=get_option( "visitors_edits_options", [
// Send as HTML rather than plain text.
$headers= "MIME-Version: 1.0\r\n";
$headers .= "Content-Type: text/html; charset=UTF-8\r\n";
wp_mail($destination, $this->subject, $this->body,$headers);
subject : $this->subject
body : $this->body
private function loadTemplate($template){
return [
private function inject($str,$body){
foreach ($body as $key => $value) {
return $str;
public function preview(){
echo $this->subject;
echo $this->body;

@ -0,0 +1,89 @@
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
<html xmlns:v="urn:schemas-microsoft-com:vml">
<subject>[#blog_title# | Visitors Contributions] - Contribution submitted</subject>
<meta http-equiv="content-type" content="text/html, charset=utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0, maximum-scale=1.0">
<link href='' rel='stylesheet' type='text/css'>
<body leftmargin="0" rightmargin="0" marginwidth="0" marginheight="0">
<table bgcolor="#0385F4" width="100%" border="0" cellpadding="0" cellspacing="0">
<table align="center" width="600" border="0" cellpadding="0" cellspacing="0">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;font-size:50px;color:#fff;mso-line-height-rule:exactly;line-height:28px">#blog_title#</td>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;font-size:20px;color:#fff;mso-line-height-rule:exactly;line-height:28px">Contribution submitted</td>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<table bgcolor="#E3E3E3" width="100%" border="0" cellpadding="0" cellspacing="0">
<table align="center" width="600" border="0" cellpadding="0" cellspacing="0">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
Submission details
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<a href="#post_url#" style="color:#262626">#post_title#</a>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
Submitted on : #edit_time#
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
Author : #visitor_name# (#visitor_email#)
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<table align="center" bgcolor="#0385F4" width="100" border="0" cellpadding="0" cellspacing="0">
<tbody><tr><td height="4" style="font-size:4px; line-height:4px">&nbsp;</td></tr></tbody>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
Visitors Contributions
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>

@ -0,0 +1,84 @@
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
<html xmlns:v="urn:schemas-microsoft-com:vml">
<subject>[#blog_title#] - Contribution reviewed</subject>
<meta http-equiv="content-type" content="text/html, charset=utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0, maximum-scale=1.0">
<link href='' rel='stylesheet' type='text/css'>
<body leftmargin="0" rightmargin="0" marginwidth="0" marginheight="0">
<table bgcolor="#0385F4" width="100%" border="0" cellpadding="0" cellspacing="0">
<table align="center" width="600" border="0" cellpadding="0" cellspacing="0">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;font-size:50px;color:#fff;mso-line-height-rule:exactly;line-height:28px">#blog_title#</td>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;font-size:20px;color:#fff;mso-line-height-rule:exactly;line-height:28px">Contribution approved</td>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<table bgcolor="#E3E3E3" width="100%" border="0" cellpadding="0" cellspacing="0">
<table align="center" width="600" border="0" cellpadding="0" cellspacing="0">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<strong>Dear #visitor_name#</strong>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<a href="#post_url#" style="color:#262626">#post_title#</a>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<table align="center" bgcolor="#0385F4" width="100" border="0" cellpadding="0" cellspacing="0">
<tbody><tr><td height="4" style="font-size:4px; line-height:4px">&nbsp;</td></tr></tbody>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
#blog_title# team
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>

@ -0,0 +1,95 @@
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
<html xmlns:v="urn:schemas-microsoft-com:vml">
<subject>[#blog_title#] - Contribution submitted</subject>
<meta http-equiv="content-type" content="text/html, charset=utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0, maximum-scale=1.0">
<link href='' rel='stylesheet' type='text/css'>
<body leftmargin="0" rightmargin="0" marginwidth="0" marginheight="0">
<table bgcolor="#0385F4" width="100%" border="0" cellpadding="0" cellspacing="0">
<table align="center" width="600" border="0" cellpadding="0" cellspacing="0">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;font-size:50px;color:#fff;mso-line-height-rule:exactly;line-height:28px">#blog_title#</td>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;font-size:20px;color:#fff;mso-line-height-rule:exactly;line-height:28px">Contribution submitted</td>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<table bgcolor="#E3E3E3" width="100%" border="0" cellpadding="0" cellspacing="0">
<table align="center" width="600" border="0" cellpadding="0" cellspacing="0">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<strong>Dear #visitor_name#</strong>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
Submission details
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<a href="#post_url#" style="color:#262626">#post_title#</a>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
Submitted on : #edit_time#
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<table align="center" bgcolor="#0385F4" width="100" border="0" cellpadding="0" cellspacing="0">
<tbody><tr><td height="4" style="font-size:4px; line-height:4px">&nbsp;</td></tr></tbody>
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
#blog_title# team
<td align="center "style="font-family:'Questrial',Helvetica,sans-serif; text-align:center;color:#262626;mso-line-height-rule:exactly;line-height:28px">
<tr><td height="30" style="font-size:30px; line-height:30px">&nbsp;</td></tr>

@ -0,0 +1,86 @@
// Pending-reviews admin page: handles the "delete" and "approve" actions,
// then lists every stored contribution.
// Request ids are cast to non-negative integers before they reach the
// database layer, and visitor-supplied text is HTML-escaped on output.
// NOTE(review): the delete (GET) and approve (POST) actions carry no nonce,
// so they can be triggered cross-site. Adding wp_nonce_url()/wp_nonce_field()
// plus check_admin_referer() needs coordinated changes to the links and forms
// that target this page.
global $wpdb;
$table_name = $wpdb->prefix . 'visitors_edits';
$wpdb->delete($table_name, array( 'edit_id' => absint($_GET["delete"]) ), array( '%d' ) );
flashMessage("The review was deleted","danger");
$wpdb->delete($table_name, array( 'edit_id' => absint($_POST["edit_id"]) ), array( '%d' ) );
flashMessage("The post was updated successfully","");
//Notify visitor
require 'mail.php';
$post = get_post(absint($_POST["ID"]));
$mail = [
"blog_title" => get_bloginfo("name"),
$visitor_submitionMail=new visitors_edits_EMAIL($mail,"visitor_approval");
$edits = $wpdb->get_results("SELECT * FROM ".$table_name);
for ($r=0; $r <count($edits); $r++) {
<h1 class="visitors_edits_no_data" <?php if(count($edits)==0){echo 'style="display:block"';}?>>
Empty pending list
<div class="visitors_edits_pending" <?php if(count($edits)==0){echo 'style="display:none"';}?>>
<h1>Pending reviews (<?php echo count($edits);?>)</h1>
<table class="widefat pending">
<th>Author comment</th>
for ($i=0; $i < count($edits); $i++) {
<td><?php echo esc_html($edit->post->post_title); ?></td>
<td><?php echo esc_html($edit->visitor_name)?></td>
<?php echo esc_html(stripslashes($edit->visitor_comment)); ?>
echo date_format($creationDate,"m/d/Y")." at ".date_format($creationDate,"h:i a")
<a class="button-primary" href="<?php echo menu_page_url('visitors_edits_approve',false);?>&edit=<?php echo (int) $edit->edit_id;?>">Review</a>
<a class="button-secondary" href="<?php echo menu_page_url('visitors_edits_main',false);?>&delete=<?php echo (int) $edit->edit_id;?>">Delete</a>
/**
 * Prints a flash-message box.
 *
 * @param string $msg  Text echoed inside the box; it is output as-is, without escaping.
 * @param string $type Extra CSS class printed after "visitors_flashMessage"
 *                     (the visible callers pass "danger" or "").
 */
function flashMessage($msg,$type){
<div class="visitors_flashMessage <?php echo $type ?>">
<?php echo $msg ;?>

@ -0,0 +1,71 @@
// Persist the settings array under the "visitors_edits_options" option.
update_option( "visitors_edits_options", $options );
flashMessage("Settings saved.","");
// Read the stored settings; the array literal is the fallback get_option() returns
// when the option is not stored.
$options=get_option( "visitors_edits_options", [
"visitor_notif_message"=>"Your suggestion was submitted.",
"admin_notif_message"=>"A new suggestion was submitted.",
"edit_notify_message"=>"Thanks for your contribution to our blog, your contribution was reviewed and approved.",
// "#post_link#" is a placeholder token inside the link markup.
"propose_edit_link"=>"<p><a href='#post_link#'>Propose an edit</a></p>"
<?php /* Settings form. Stored option values are escaped for the HTML context they are printed in (esc_attr for attribute values, esc_textarea for textarea bodies) so quotes or markup in a saved value cannot break out of the field. */ ?>
<div class="visitors_edits_admin">
<form action="" method="post">
<div class="control">
<label>Propose an edit link</label>
<input type="text" name="propose_edit_link" value="<?php echo esc_attr(stripcslashes($options['propose_edit_link'])) ?>">
<div class="control">
<label>Admin notification message</label>
<textarea name="admin_notif_message" class="notif_message" value=""><?php echo esc_textarea($options['admin_notif_message']) ?></textarea>
<div class="control">
<label>Visitor notification message (On Submit)</label>
<textarea name="visitor_notif_message" class="notif_message" value=""><?php echo esc_textarea($options['visitor_notif_message']) ?></textarea>
<div class="control">
<label>Visitor notification message (On Review)</label>
<textarea name="edit_notify_message" class="notif_message" value=""><?php echo esc_textarea($options['edit_notify_message']) ?></textarea>
<div class="control">
<label>Admin email</label>
<input type="text" placeholder="Email" name="admin_email" value="<?php echo esc_attr($options['admin_email']) ?>">
<div class="control">
<label><input type="checkbox" name="notify_admin" <?php echo (($options['notify_admin']==null) ? "" : "checked")?>>Notify me on new submits.</label>
<div class="control">
<label><input type="checkbox" name="advanced_merge" <?php echo (($options['advanced_merge']==null) ? "" : "checked")?>>Use deep merging.</label>
<div class="control">
<input type="submit" class="save_btn button-primary" value="Save settings" name="save_settings">
/**
 * Prints a flash-message box.
 *
 * @param string $msg  Text echoed inside the box; it is output as-is, without escaping.
 * @param string $type Extra CSS class printed after "visitors_flashMessage"
 *                     (the visible caller passes "").
 */
function flashMessage($msg,$type){
<div class="visitors_flashMessage <?php echo $type ?>">
<?php echo $msg ;?>

@ -0,0 +1,8 @@
// Look up the element whose id is "edit_notify_message" (null when the page has none).
var $notification=document.querySelector("#edit_notify_message");

@ -0,0 +1,121 @@
// Build a global, case-insensitive pattern matching "<tag>...</tag>" with a non-greedy body.
// NOTE(review): this only matches an opener without attributes, "." does not cross line
// breaks, and `tag` is not regex-escaped — confirm these limits are intended.
var regexp=RegExp("<"+tag+">.*?<\/"+tag+">", "gi");
// Remove every match from the content and return what is left.
var editedContent=content.replace(regexp,"");
return editedContent;
// Load the HTML string into a detached <div> wrapped by jQuery.
var $contentDiv=jQuery("<div/>").html(content);
// Serialize the div's children back into an HTML string.
return $contentDiv.html();
// Load the HTML string into a detached <div> wrapped by jQuery.
var $contentDiv=jQuery("<div/>").html(content);
// Serialize the div's children back into an HTML string.
return $contentDiv.html();
// Load the HTML string into a detached <div> wrapped by jQuery.
var $contentDiv=jQuery("<div/>").html(content);
// Serialize the div's children back into an HTML string.
return $contentDiv.html();
// Node returned by the editor for the current selection.
var elt=ed.selection.getNode();
var elt=ed.selection.getNode();
// Markup of that node including its own tag.
var eltContent=elt.outerHTML;
// Insert that markup through the editor's mceInsertContent command.
ed.execCommand('mceInsertContent', 0, eltContent);
//Create plugin
tinymce.create('tinymce.plugins.visitors_edits', {
// init(ed, url): `ed` is the editor the buttons and commands are attached to;
// `url` is used below as the base path for the button images.
init : function(ed, url) {
//Add buttons
// Each button names a command through `cmd`; the approve and reject commands are registered further down.
ed.addButton('visitors_edits_approve', {
title : 'Approve',
cmd : 'visitors_edits_approve',
image : url + '/../img/approve.png'
ed.addButton('visitors_edits_reject', {
title : 'Reject',
cmd : 'visitors_edits_reject',
image : url + '/../img/reject.png',
ed.addButton('visitors_edits_clean', {
title : 'Clean All',
cmd : 'visitors_edits_clean',
image : url + '/../img/clean.png'
//Add Commands
ed.addCommand('visitors_edits_approve', function() {
// Node returned by the editor for the current selection.
var elt=ed.selection.getNode();
ed.addCommand('visitors_edits_reject', function() {
// Node returned by the editor for the current selection.
var elt=ed.selection.getNode();
// Current editor content as returned by getContent().
var content=ed.getContent();
//Load content
//Procedce diff Html
var diffDiv=document.querySelector("#visitors_edits_diff");
var $diffDiv=jQuery(diffDiv);
var $ins=$(this);
if([""," "].indexOf($ins.html())>-1){
//Clean content
var $diffDiv=jQuery("<div/>").html(ed.getContent());
var $p=$(this);
// Register plugin
tinymce.PluginManager.add( 'visitors_edits', tinymce.plugins.visitors_edits );
// Returns true unconditionally in the visible code.
// NOTE(review): presumably used as a form submit hook — confirm against the markup.
function editSubmit(){
return true;

@ -0,0 +1,41 @@
// Validation helper object; the messages below are the texts attached to its rules.
var validateEdit={
msg:"Name field required"
msg:"Email field required"
msg:"Please describe your edit to speed up the approval"
// Collected validation failures.
var errors=[];
// Walk every rule; each rule's key is used as the id of the element to check.
jQuery.each(this.validateRules, function(id, rule) {
var element=jQuery("#"+id);
// A required field fails when its value is exactly the empty string.
if(rule.required && element.val()===""){
for (var i = 0; i < errors.length; i++) {
return false;
return true;
// Second pass over the same rules, again resolving each element by id.
jQuery.each(this.validateRules, function(id, rule) {
var element=jQuery("#"+id);

js/jquery.js vendored

File diff suppressed because one or more lines are too long

js/jquery.validate.js vendored

File diff suppressed because it is too large Load Diff

@ -0,0 +1,145 @@
# Change Log
## [v0.1.1]( (2016-03-16)
[Full Changelog](
**Features and Enhancements:**
- Update TableDiff HTMLPurifier Initialization [\#35]( ([dbergunder](
- Update the README and add additional documentation [\#34]( ([jschroed91](
## [0.1.0]( (2016-03-10)
[Full Changelog](
**Features and Enhancements:**
- Allow caching of the calculated diffs using a doctrine cache provider [\#33]( ([jschroed91](
- Create configuration class for HtmlDiff config options [\#32]( ([jschroed91](
- New Feature: Table Diffing [\#31]( ([jschroed91](
- Detect link changes to resolve [\#28]( [\#30]( ([jschroed91](
- Setup PHPUnit testsuite with basic functional test and a few test cases [\#26]( ([jschroed91](
## [0.1.0-beta.1]( (2016-02-26)
[Full Changelog](
**Features and Enhancements:**
- New Feature: Table Diffing [\#31]( ([jschroed91](
- Detect link changes to resolve [\#28]( [\#30]( ([jschroed91](
- Setup PHPUnit testsuite with basic functional test and a few test cases [\#26]( ([jschroed91](
## [0.0.14]( (2016-02-03)
[Full Changelog](
**Fixed bugs:**
- Fix HtmlDiff matching logic skipping over single word matches [\#25]( ([jschroed91](
## [0.0.13]( (2016-01-12)
[Full Changelog](
**Fixed bugs:**
- Misc. list diffing updates and fixes [\#24]( ([jschroed91](
- Updated list diff class to maintain the tags on lists. [\#23]( ([adamCaxy](
## [0.0.12]( (2015-11-11)
[Full Changelog](
**Fixed bugs:**
- feature-list\_diffing-new [\#20]( ([adamCaxy](
## [0.0.11]( (2015-11-06)
[Full Changelog](
**Features and Enhancements:**
- Feature list diffing new [\#19]( ([adamCaxy](
## [0.0.10]( (2015-10-21)
[Full Changelog](
**Fixed bugs:**
- Fix: Updated code so that null is not given in list formatting. [\#17]( ([adamCaxy](
## [0.0.9]( (2015-10-20)
[Full Changelog](
**Fixed bugs:**
- Missed an array\_column in ListDiff. Updated to use ArrayColumn function. [\#16]( ([jschroed91](
## [0.0.8]( (2015-10-20)
[Full Changelog](
**Fixed bugs:**
- Added update for php versions that do not have array\_column as a function. [\#15]( ([jschroed91](
## [0.0.7]( (2015-10-20)
[Full Changelog](
**Features and Enhancements:**
- Created ListDiff class to handle diffing of lists. [\#14]( ([adamCaxy](
## [0.0.6]( (2015-09-11)
[Full Changelog](
**Features and Enhancements:**
- Feature - html tag isolation [\#12]( ([jschroed91](
- ICC-4313 | ICC-4314 | Replace Special HTML Elements with placeholder tokens and update diffing logic [\#11]( ([usaqlain01](
## [0.0.5]( (2015-03-03)
[Full Changelog](
**Features and Enhancements:**
- Support derived classes [\#10]( ([mkalkbrenner](
## [0.0.4]( (2015-01-09)
[Full Changelog](
**Fixed bugs:**
- Check for empty oldText or newText before processing del or ins in processReplaceOperation [\#9]( ([jschroed91](
## [0.0.3]( (2015-01-08)
[Full Changelog](
**Features and Enhancements:**
- Add option to insert a space between del and ins tags [\#8]( ([jschroed91](
- Updated demo to accept input and diff on the fly [\#5]( ([jschroed91](
## [0.0.2]( (2014-08-12)
[Full Changelog](
**Features and Enhancements:**
- Break out HTML content to individual HTML, CSS, JS files [\#6]( ([mgersten-caxy](
**Fixed bugs:**
- Fix error caused when passing empty array into setSpecialCaseTags [\#7]( ([jschroed91](
## [0.0.1]( (2014-07-31)
**Features and Enhancements:**
- Added static properties for the default config variables [\#4]( ([jschroed91](
- Feature nonpartial word diffing [\#3]( ([jschroed91](
- Added option to group together diffed words in output [\#2]( ([jschroed91](
\* *This Change Log was automatically generated by [github_changelog_generator](*
\* *This Change Log was automatically generated by [github_changelog_generator](*

@ -0,0 +1,74 @@
# Contributor Covenant Code of Conduct
## Our Pledge
In the interest of fostering an open and welcoming environment, we as
contributors and maintainers pledge to making participation in our project and
our community a harassment-free experience for everyone, regardless of age, body
size, disability, ethnicity, gender identity and expression, level of experience,
nationality, personal appearance, race, religion, or sexual identity and
orientation.
## Our Standards
Examples of behavior that contributes to creating a positive environment
include:
* Using welcoming and inclusive language
* Being respectful of differing viewpoints and experiences
* Gracefully accepting constructive criticism
* Focusing on what is best for the community
* Showing empathy towards other community members
Examples of unacceptable behavior by participants include:
* The use of sexualized language or imagery and unwelcome sexual attention or
advances
* Trolling, insulting/derogatory comments, and personal or political attacks
* Public or private harassment
* Publishing others' private information, such as a physical or electronic
address, without explicit permission
* Other conduct which could reasonably be considered inappropriate in a
professional setting
## Our Responsibilities
Project maintainers are responsible for clarifying the standards of acceptable
behavior and are expected to take appropriate and fair corrective action in
response to any instances of unacceptable behavior.
Project maintainers have the right and responsibility to remove, edit, or
reject comments, commits, code, wiki edits, issues, and other contributions
that are not aligned to this Code of Conduct, or to ban temporarily or
permanently any contributor for other behaviors that they deem inappropriate,
threatening, offensive, or harmful.
## Scope
This Code of Conduct applies both within project spaces and in public spaces
when an individual is representing the project or its community. Examples of
representing a project or community include using an official project e-mail
address, posting via an official social media account, or acting as an appointed
representative at an online or offline event. Representation of a project may be
further defined and clarified by project maintainers.
## Enforcement
Instances of abusive, harassing, or otherwise unacceptable behavior may be
reported by contacting the project team. All
complaints will be reviewed and investigated and will result in a response that
is deemed necessary and appropriate to the circumstances. The project team is
obligated to maintain confidentiality with regard to the reporter of an incident.
Further details of specific enforcement policies may be posted separately.
Project maintainers who do not follow or enforce the Code of Conduct in good
faith may face temporary or permanent repercussions as determined by other
members of the project's leadership.
## Attribution
This Code of Conduct is adapted from the [Contributor Covenant][homepage], version 1.4,
available at [http://contributor-covenant.org/version/1/4][version]

@ -0,0 +1,33 @@
First of all, **thank you** for contributing, **you are awesome**!
Here are a few rules to follow in order to ease code reviews, and discussions before
maintainers accept and merge your work.
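You MUST follow the [PSR-1](https://www.php-fig.org/psr/psr-1/) and
[PSR-2](https://www.php-fig.org/psr/psr-2/). If you don't know about any of them, you
should really read the recommendations. Can't wait? Use the [PHP-CS-Fixer
tool](https://github.com/PHP-CS-Fixer/PHP-CS-Fixer).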
You MUST run the test suite.
You MUST write (or update) unit tests.
You SHOULD write documentation.
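Please, write [commit messages that make
sense](http://tbaggery.com/2008/04/19/a-note-about-git-commit-messages.html),
and [rebase your branch](https://git-scm.com/book/en/v2/Git-Branching-Rebasing)
before submitting your Pull Request.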
One may ask you to [squash your
commits](http://gitready.com/advanced/2009/02/10/squashing-commits-with-rebase.html)
too. This is used to "clean" your Pull Request before merging it (we don't want
commits such as `fix tests`, `fix 2`, `fix 3`, etc.).
Also, while creating your Pull Request on GitHub, you MUST write a description
which gives the context and/or explains why you are creating it.
Thank you!

@ -0,0 +1,130 @@
Version 2, June 1991
Copyright (C) 1989, 1991 Free Software Foundation, Inc.
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
Everyone is permitted to copy and distribute verbatim copies
of this license document, but changing it is not allowed.
The licenses for most software are designed to take away your freedom to share and change it. By contrast, the GNU General Public License is intended to guarantee your freedom to share and change free software--to make sure the software is free for all its users. This General Public License applies to most of the Free Software Foundation's software and to any other program whose authors commit to using it. (Some other Free Software Foundation software is covered by the GNU Lesser General Public License instead.) You can apply it to your programs, too.
When we speak of free software, we are referring to freedom, not price. Our General Public Licenses are designed to make sure that you have the freedom to distribute copies of free software (and charge for this service if you wish), that you receive source code or can get it if you want it, that you can change the software or use pieces of it in new free programs; and that you know you can do these things.
To protect your rights, we need to make restrictions that forbid anyone to deny you these rights or to ask you to surrender the rights. These restrictions translate to certain responsibilities for you if you distribute copies of the software, or if you modify it.
For example, if you distribute copies of such a program, whether gratis or for a fee, you must give the recipients all the rights that you have. You must make sure that they, too, receive or can get the source code. And you must show them these terms so they know their rights.
We protect your rights with two steps: (1) copyright the software, and (2) offer you this license which gives you legal permission to copy, distribute and/or modify the software.
Also, for each author's protection and ours, we want to make certain that everyone understands that there is no warranty for this free software. If the software is modified by someone else and passed on, we want its recipients to know that what they have is not the original, so that any problems introduced by others will not reflect on the original authors' reputations.
Finally, any free program is threatened constantly by software patents. We wish to avoid the danger that redistributors of a free program will individually obtain patent licenses, in effect making the program proprietary. To prevent this, we have made it clear that any patent must be licensed for everyone's free use or not licensed at all.
The precise terms and conditions for copying, distribution and modification follow.
0. This License applies to any program or other work which contains a notice placed by the copyright holder saying it may be distributed under the terms of this General Public License. The "Program", below, refers to any such program or work, and a "work based on the Program" means either the Program or any derivative work under copyright law: that is to say, a work containing the Program or a portion of it, either verbatim or with modifications and/or translated into another language. (Hereinafter, translation is included without limitation in the term "modification".) Each licensee is addressed as "you".
Activities other than copying, distribution and modification are not covered by this License; they are outside its scope. The act of running the Program is not restricted, and the output from the Program is covered only if its contents constitute a work based on the Program (independent of having been made by running the Program). Whether that is true depends on what the Program does.
1. You may copy and distribute verbatim copies of the Program's source code as you receive it, in any medium, provided that you conspicuously and appropriately publish on each copy an appropriate copyright notice and disclaimer of warranty; keep intact all the notices that refer to this License and to the absence of any warranty; and give any other recipients of the Program a copy of this License along with the Program.
You may charge a fee for the physical act of transferring a copy, and you may at your option offer warranty protection in exchange for a fee.
2. You may modify your copy or copies of the Program or any portion of it, thus forming a work based on the Program, and copy and distribute such modifications or work under the terms of Section 1 above, provided that you also meet all of these conditions:
a) You must cause the modified files to carry prominent notices stating that you changed the files and the date of any change.
b) You must cause any work that you distribute or publish, that in whole or in part contains or is derived from the Program or any part thereof, to be licensed as a whole at no charge to all third parties under the terms of this License.
c) If the modified program normally reads commands interactively when run, you must cause it, when started running for such interactive use in the most ordinary way, to print or display an announcement including an appropriate copyright notice and a notice that there is no warranty (or else, saying that you provide a warranty) and that users may redistribute the program under these conditions, and telling the user how to view a copy of this License. (Exception: if the Program itself is interactive but does not normally print such an announcement, your work based on the Program is not required to print an announcement.)
These requirements apply to the modified work as a whole. If identifiable sections of that work are not derived from the Program, and can be reasonably considered independent and separate works in themselves, then this License, and its terms, do not apply to those sections when you distribute them as separate works. But when you distribute the same sections as part of a whole which is a work based on the Program, the distribution of the whole must be on the terms of this License, whose permissions for other licensees extend to the entire whole, and thus to each and every part regardless of who wrote it.
Thus, it is not the intent of this section to claim rights or contest your rights to work written entirely by you; rather, the intent is to exercise the right to control the distribution of derivative or collective works based on the Program.
In addition, mere aggregation of another work not based on the Program with the Program (or with a work based on the Program) on a volume of a storage or distribution medium does not bring the other work under the scope of this License.
3. You may copy and distribute the Program (or a work based on it, under Section 2) in object code or executable form under the terms of Sections 1 and 2 above provided that you also do one of the following:
a) Accompany it with the complete corresponding machine-readable source code, which must be distributed under the terms of Sections 1 and 2 above on a medium customarily used for software interchange; or,
b) Accompany it with a written offer, valid for at least three years, to give any third party, for a charge no more than your cost of physically performing source distribution, a complete machine-readable copy of the corresponding source code, to be distributed under the terms of Sections 1 and 2 above on a medium customarily used for software interchange; or,
c) Accompany it with the information you received as to the offer to distribute corresponding source code. (This alternative is allowed only for noncommercial distribution and only if you received the program in object code or executable form with such an offer, in accord with Subsection b above.)
The source code for a work means the preferred form of the work for making modifications to it. For an executable work, complete source code means all the source code for all modules it contains, plus any associated interface definition files, plus the scripts used to control compilation and installation of the executable. However, as a special exception, the source code distributed need not include anything that is normally distributed (in either source or binary form) with the major components (compiler, kernel, and so on) of the operating system on which the executable runs, unless that component itself accompanies the executable.
If distribution of executable or object code is made by offering access to copy from a designated place, then offering equivalent access to copy the source code from the same place counts as distribution of the source code, even though third parties are not compelled to copy the source along with the object code.
4. You may not copy, modify, sublicense, or distribute the Program except as expressly provided under this License. Any attempt otherwise to copy, modify, sublicense or distribute the Program is void, and will automatically terminate your rights under this License. However, parties who have received copies, or rights, from you under this License will not have their licenses terminated so long as such parties remain in full compliance.
5. You are not required to accept this License, since you have not signed it. However, nothing else grants you permission to modify or distribute the Program or its derivative works. These actions are prohibited by law if you do not accept this License. Therefore, by modifying or distributing the Program (or any work based on the Program), you indicate your acceptance of this License to do so, and all its terms and conditions for copying, distributing or modifying the Program or works based on it.
6. Each time you redistribute the Program (or any work based on the Program), the recipient automatically receives a license from the original licensor to copy, distribute or modify the Program subject to these terms and conditions. You may not impose any further restrictions on the recipients' exercise of the rights granted herein. You are not responsible for enforcing compliance by third parties to this License.
7. If, as a consequence of a court judgment or allegation of patent infringement or for any other reason (not limited to patent issues), conditions are imposed on you (whether by court order, agreement or otherwise) that contradict the conditions of this License, they do not excuse you from the conditions of this License. If you cannot distribute so as to satisfy simultaneously your obligations under this License and any other pertinent obligations, then as a consequence you may not distribute the Program at all. For example, if a patent license would not permit royalty-free redistribution of the Program by all those who receive copies directly or indirectly through you, then the only way you could satisfy both it and this License would be to refrain entirely from distribution of the Program.
If any portion of this section is held invalid or unenforceable under any particular circumstance, the balance of the section is intended to apply and the section as a whole is intended to apply in other circumstances.
It is not the purpose of this section to induce you to infringe any patents or other property right claims or to contest validity of any such claims; this section has the sole purpose of protecting the integrity of the free software distribution system, which is implemented by public license practices. Many people have made generous contributions to the wide range of software distributed through that system in reliance on consistent application of that system; it is up to the author/donor to decide if he or she is willing to distribute software through any other system and a licensee cannot impose that choice.
This section is intended to make thoroughly clear what is believed to be a consequence of the rest of this License.
8. If the distribution and/or use of the Program is restricted in certain countries either by patents or by copyrighted interfaces, the original copyright holder who places the Program under this License may add an explicit geographical distribution limitation excluding those countries, so that distribution is permitted only in or among countries not thus excluded. In such case, this License incorporates the limitation as if written in the body of this License.
9. The Free Software Foundation may publish revised and/or new versions of the General Public License from time to time. Such new versions will be similar in spirit to the present version, but may differ in detail to address new problems or concerns.
Each version is given a distinguishing version number. If the Program specifies a version number of this License which applies to it and "any later version", you have the option of following the terms and conditions either of that version or of any later version published by the Free Software Foundation. If the Program does not specify a version number of this License, you may choose any version ever published by the Free Software Foundation.
10. If you wish to incorporate parts of the Program into other free programs whose distribution conditions are different, write to the author to ask for permission. For software which is copyrighted by the Free Software Foundation, write to the Free Software Foundation; we sometimes make exceptions for this. Our decision will be guided by the two goals of preserving the free status of all derivatives of our free software and of promoting the sharing and reuse of software generally.
How to Apply These Terms to Your New Programs
If you develop a new program, and you want it to be of the greatest possible use to the public, the best way to achieve this is to make it free software which everyone can redistribute and change under these terms.
To do so, attach the following notices to the program. It is safest to attach them to the start of each source file to most effectively convey the exclusion of warranty; and each file should have at least the "copyright" line and a pointer to where the full notice is found.
one line to give the program's name and an idea of what it does.
Copyright (C) yyyy name of author
This program is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License
as published by the Free Software Foundation; either version 2
of the License, or (at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
Also add information on how to contact you by electronic and paper mail.
If the program is interactive, make it output a short notice like this when it starts in an interactive mode:
Gnomovision version 69, Copyright (C) year name of author
Gnomovision comes with ABSOLUTELY NO WARRANTY; for details
type `show w'. This is free software, and you are welcome
to redistribute it under certain conditions; type `show c'
for details.
The hypothetical commands `show w' and `show c' should show the appropriate parts of the General Public License. Of course, the commands you use may be called something other than `show w' and `show c'; they could even be mouse-clicks or menu items--whatever suits your program.
You should also get your employer (if you work as a programmer) or your school, if any, to sign a "copyright disclaimer" for the program, if necessary. Here is a sample; alter the names:
Yoyodyne, Inc., hereby disclaims all copyright
interest in the program `Gnomovision'
(which makes passes at compilers) written
by James Hacker.
signature of Ty Coon, 1 April 1989
Ty Coon, President of Vice
This General Public License does not permit incorporating your program into proprietary programs. If your program is a subroutine library, you may consider it more useful to permit linking proprietary applications with the library. If this is what you want to do, use the GNU Lesser General Public License instead of this License.

@ -0,0 +1,201 @@
[![Scrutinizer Code Quality](][badge_score]
[![Build Status](][badge_status]
[![Code Coverage](][badge_coverage]
[![Average time to resolve an issue](][badge_resolve]
[![Percentage of issues still open](][badge_issues]
php-htmldiff is a library for comparing two HTML files/snippets and highlighting the differences using simple HTML.
This HTML Diff implementation was forked from [rashid2538/php-htmldiff][upstream] and has been modified with new features,
bug fixes, and enhancements to the original code.
For more information on these modifications, read the [differences from rashid2538/php-htmldiff][differences] or view the [CHANGELOG][changelog].
## Installation
The recommended way to install php-htmldiff is through [Composer][composer].
Require the [caxy/php-htmldiff][badge_packagist] package by running the following command:
composer require caxy/php-htmldiff
This will resolve the latest stable version.
Otherwise, install the library and setup the autoloader yourself.
### Working with Symfony
If you are using Symfony, you can use the [caxy/HtmlDiffBundle][htmldiffbundle] to make life easy!
## Usage
use Caxy\HtmlDiff\HtmlDiff;
$htmlDiff = new HtmlDiff($oldHtml, $newHtml);
$content = $htmlDiff->build();
## Configuration
The configuration for HtmlDiff is contained in the `Caxy\HtmlDiff\HtmlDiffConfig` class.
There are two ways to set the configuration:
1. [Configure an Existing HtmlDiff Object](#configure-an-existing-htmldiff-object)
2. [Create and Use a HtmlDiffConfig Object](#create-and-use-a-htmldiffconfig-object)
#### Configure an Existing HtmlDiff Object
When a new `HtmlDiff` object is created, it creates a `HtmlDiffConfig` object with the default configuration.
You can change the configuration using setters on the object:
use Caxy\HtmlDiff\HtmlDiff;
// ...
$htmlDiff = new HtmlDiff($oldHtml, $newHtml);
// Set some of the configuration options.
// Calculate the differences using the configuration and get the html diff.
$content = $htmlDiff->build();
// ...
#### Create and Use a HtmlDiffConfig Object
You can also set the configuration by creating an instance of
`Caxy\HtmlDiff\HtmlDiffConfig` and using it when creating a new `HtmlDiff`
object using `HtmlDiff::create`.
This is useful when creating more than one instance of `HtmlDiff`:
use Caxy\HtmlDiff\HtmlDiff;
use Caxy\HtmlDiff\HtmlDiffConfig;
// ...
$config = new HtmlDiffConfig();
// Create an HtmlDiff object with the custom configuration.
$firstHtmlDiff = HtmlDiff::create($oldHtml, $newHtml, $config);
$firstContent = $firstHtmlDiff->build();
$secondHtmlDiff = HtmlDiff::create($oldHtml2, $newHtml2, $config);
$secondContent = $secondHtmlDiff->build();
// ...
#### Full Configuration with Defaults:
$config = new HtmlDiffConfig();
// Percentage required for list items to be considered a match.
// Set the encoding of the text to be diffed.
// If true, a space will be added between the <del> and <ins> tags of text that was replaced.
// Option to disable the new Table Diffing feature and treat tables as regular text.
// Pass an instance of \Doctrine\Common\Cache\Cache to cache the calculated diffs.
// Set the cache directory that HTMLPurifier should use.
// Group consecutive deletions and insertions instead of showing a deletion and insertion for each word individually.
// List of characters to consider part of a single word when in the middle of text.
->setSpecialCaseChars(array('.', ',', '(', ')', '\''))
// List of tags to treat as special case tags.
->setSpecialCaseTags(array('strong', 'b', 'i', 'big', 'small', 'u', 'sub', 'sup', 'strike', 's', 'p'))
// List of tags (and their replacement strings) to be diffed in isolation.
'sub' => '[[REPLACE_SUB_SCRIPT]]',
'sup' => '[[REPLACE_SUPER_SCRIPT]]',
'table' => '[[REPLACE_TABLE]]',
'strong' => '[[REPLACE_STRONG]]',
'b' => '[[REPLACE_B]]',
'em' => '[[REPLACE_EM]]',
'i' => '[[REPLACE_I]]',
'a' => '[[REPLACE_A]]',
## Contributing
See [CONTRIBUTING][contributing] file.
## Contributor Code of Conduct
Please note that this project is released with a [Contributor Code of
Conduct][contributor_covenant]. By participating in this project
you agree to abide by its terms. See [CODE_OF_CONDUCT][code_of_conduct] file.
## Credits
* [rashid2538][] for the port to PHP and the base for our project: [rashid2538/php-htmldiff][upstream]
* [willdurand][] for an excellent post on [open sourcing libraries][].
Much of this documentation is based off of the examples in the post.
Did we miss anyone? If we did, let us know or put in a pull request!
## License
php-htmldiff is available under [GNU General Public License, version 2][gnu]. See the [LICENSE][license] file for details.
[badge_resolve]: "Average time to resolve an issue"
[badge_issues]: "Percentage of issues still open"
[open sourcing libraries]:

@ -0,0 +1,43 @@
"name": "caxy/php-htmldiff",
"type": "library",
"description": "A library for comparing two HTML files/snippets and highlighting the differences using simple HTML.",
"keywords": [
"homepage": "",
"license": "GPL-2.0",
"authors": [
"name": "Josh Schroeder",
"email": "",
"homepage": ""
"support": {
"issues": ""
"require": {
"php": ">=5.3.3",
"ezyang/htmlpurifier": "^4.7"
"require-dev": {
"phpunit/phpunit": "~4.8",
"doctrine/cache": "~1.0"
"suggest": {
"doctrine/cache": "Used for caching the calculated diffs using a Doctrine Cache Provider"
"autoload": {
"psr-0": { "Caxy\\HtmlDiff": "lib/" }
"autoload-dev": {
"psr-4": { "Caxy\\Tests\\": "tests/Caxy/Tests" }
"extra": {
"branch-alias": {
"dev-master": "0.1.x-dev"

@ -0,0 +1 @@
Just write the code as shown in the PHP file and enjoy.

@ -0,0 +1,16 @@
"name": "php-htmldiff-demo",
"dependencies": {
"bootstrap": "v4.0.0-alpha.2",
"angular": "1.5.0",
"clipboard": "^1.5.8",
"font-awesome": "^4.5.0",
"angular-sanitize": "^1.5.0",
"tether": "^1.2.0",
"ng-ckeditor": "^0.2.1",
"ckeditor": "^4.5.7",
"angular-ui": "^0.4.0",
"AngularJS-Toaster": "angularjs-toaster#^1.2.0",
"angular-bootstrap": "^1.1.2"

@ -0,0 +1,276 @@
Document : codes
Created on : Sep 23, 2013, 4:41:58 PM
Author : mgersten
Description: CSS related to I-code specific display
.diff-list > li.normal,
.diff-list > li.removed,
.diff-list > li.replacement{
display: table-row;
.diff-list > li.normal:before,
.diff-list > li.removed:before,
.diff-list > li.replacement:before{
width: 15px;
overflow: hidden;
content: counters(section,".") ". ";
display: table-cell;
text-indent: -1em;
padding-left: 1em;
/* overwrite width of :before on ballot pages */
.ballot-monograph .diff-list > li.normal:before,
.ballot-monograph .diff-list > li.removed:before,
.ballot-monograph .diff-list > li.replacement:before {
width: 30px;
.diff-list > li.normal:before,
li.replacement + li.replacement:before,
.diff-list > li.replacement:first-child:before{
counter-increment: section;
.diff-list > li.removed:before{
counter-increment: section;
text-decoration: line-through;
ol.diff-list li.removed + li.replacement {
counter-increment: none;
ol.diff-list li.removed + li.removed + li.replacement {
counter-increment: section -1;
ol.diff-list li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -2;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -3;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -4;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -5;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -6;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -7;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -8;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -9;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement{
counter-increment: section -10;
ol.diff-list li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.removed + li.replacement {
counter-increment: section -11;
.diff-list > li.replacement:before,
.diff-list >{
text-decoration: underline;
.diff-list > li > div{
display: inline;
list-style: none;
counter-reset: section;
display: table;
.sectionContent ol,
.revision-container ol{
list-style: none;
counter-reset: section;
.sectionContent ol li,
.revision-container ol li{
position: relative;
padding: 0 0 0 30px;
color: #000000;
text-indent: 0px;
.sectionContent ol ol li,
.revision-container ol ol li{
padding: 0 0 0 45px;
.sectionContent ol ol ol li,
.revision-container ol ol ol li{
padding: 0 0 0 60px;
.sectionContent ol ol ol ol li,
.revision-container ol ol ol ol li{
padding: 0 0 0 75px;
.sectionContent ol ol ol ol ol li,
.revision-container ol ol ol ol ol li{
padding: 0 0 0 90px;
.sectionContent ol ol ol ol ol ol li,
.revision-container ol ol ol ol ol ol li{
padding: 0 0 0 105px;
.sectionContent ol ol ol ol ol ol ol li,
.revision-container ol ol ol ol ol ol ol li{
padding: 0 0 0 120px;
.sectionContent ol ol ol ol ol ol ol ol li,
.revision-container ol ol ol ol ol ol ol ol li{
padding: 0 0 0 135px;
.sectionContent ol ol ol ol ol ol ol ol ol li,
.revision-container ol ol ol ol ol ol ol ol ol li{
padding: 0 0 0 160px;
.sectionContent ol ol ol ol ol ol ol ol ol ol li,
.revision-container ol ol ol ol ol ol ol ol ol ol li{
padding: 0 0 0 175px;
.sectionContent ol li:before,
.revision-container ol li:before{
counter-increment: section;
content:counters(section, ".") ".";
position: absolute;
left: 0px;
li.italic {
font-style: italic;
.sectionTitle {
text-align: center;
margin: 23px 0 15px;
.precontent-title {
margin-bottom: 10px;
display: block;
.secondParagraph {
text-indent: 1em;
.indentedParagraph {
margin-left: 1em;
.outdentOneLevel {
margin-left: -75px;
ol.list-alpha-upper > li:before {
content: counter(section, upper-alpha) ".";
ol.list-alpha-lower > li:before {
content: counter(section, lower-alpha) ".";
ol.list-roman-upper > li:before {
content: counter(section, upper-roman) ".";
ol.list-roman-lower > li:before {
content: counter(section, lower-roman) ".";
ol.list-roman-lower-parentheses > li:before {
content: "(" counter(section, lower-roman) ")";
ol.list-alpha-lower-parentheses > li:before {
content: "(" counter(section, lower-alpha) ")";
ol.list-numeric-right-parenthesis > li:before {
content: counter(section) ")";
.revision-content p,
.revision-content ol,
.revision-content ul,
.revision-content li,
.revision-content td,
.sectionContent p,
.sectionContent ol,
.sectionContent ul,
.sectionContent li,
.sectionContent td,
.revision-notes {
font-family: "Helvetica Neue",Helvetica,Arial,sans-serif !important;
font-size: 14px !important;
font-weight: normal !important;
line-height: 18px !important;
color:#404040 !important;
.revision-content .footnotes p,
.revision-content .footnotes ol,
.revision-content .footnotes ul,
.revision-content .footnotes li,
.revision-content .footnotes td,
.sectionContent .footnotes p,
.sectionContent .footnotes ol,
.sectionContent .footnotes ul,
.sectionContent .footnotes li,
.sectionContent .footnotes td {
font-size: 12px !important;
.diff-list ul.exception ol ,
.sectionContent ul.exception ol ,
.revision-container ul.exception ol{
list-style: none;
counter-reset: exception-section;
/* Creates a new instance of the section counter with each ol element */
ul.exception li:before {
list-style: none;
content: none;
.diff-list ul.exception ol > li:before,
.sectionContent ul.exception ol > li:before,
.revision-container ul.exception ol > li:before {
counter-increment: exception-section;
content:counters(exception-section, ".") ".";
.sectionContent i > sub,
.revision-container i > sub {
font-style: italic;
div.print-section a {
text-align: center;
color: #818181;
display: block;
text-decoration: none;
font-size: 0.8em;
div.print-section a.disabled {
display: none;
.print-link {
color: #818181;
.print-link.disabled {
cursor: text;
text-decoration: none;
/* Hack for generic styles that shouldn't exist in the database */
.content_bold {
font-weight: bold;
.content_italics {
font-style: italic;

@ -0,0 +1,212 @@
(function() {
'use strict';
.controller('DemoController', DemoController);
DemoController.$inject = ['$q', '$http', '$sce', '$timeout'];
function DemoController($q, $http, $sce, $timeout) {
var vm = this;
vm.demos = [];
vm.updateDelay = 800;
vm.currentTimeout = null;
vm.loading = false;
vm.waiting = false;
vm.diffName = '';
vm.currentDemo = null;
vm.debugOutput = {};
vm.matchThreshold = 80;
vm.overrides = [];
vm.legislativeOverride = null;
vm.tableDiffNumber = 1;
vm.tableDiffing = true;
vm.editorOptions = {};
vm.ckEditorEnabled = true;
vm.trustHtml = trustHtml;
vm.reset = reset;
vm.update = update;
vm.swapText = swapText;
vm.diffDemo = diffDemo;
vm.diffOverride = diffOverride;
vm.diffTableDemo = diffTableDemo;
vm.updateDemo = updateDemo;
vm.saveNewDemo = saveNewDemo;
vm.toggleCkEditor = toggleCkEditor;
function activate() {
var promises = [loadDemos(), loadOverrides()];
return $q.all(promises).then(function() {
/**
 * Marks markup as trusted so it can be rendered through ng-bind-html.
 *
 * @param {*} text Markup to trust; may be undefined.
 * @returns {*} '' when text is undefined, otherwise the result of $sce.trustAsHtml(text).
 */
function trustHtml(text) {
    if (typeof text === 'undefined') {
        return '';
    }

    return $sce.trustAsHtml(text);
}
/**
 * Inverts the vm.ckEditorEnabled flag.
 */
function toggleCkEditor() {
    var wasEnabled = vm.ckEditorEnabled;

    vm.ckEditorEnabled = !wasEnabled;
}
function reset() {
vm.oldText = '';
vm.newText = '';
vm.diff = '';
vm.loading = false;
vm.waiting = false;
vm.currentDemo = null;
vm.legislativeOverride = null;
if (vm.currentTimeout) {
function update() {
if (vm.currentTimeout) {
vm.currentTimeout = $timeout(function () {
}, vm.updateDelay);
vm.diff = null;
vm.waiting = true;
function swapText() {
var oldText = vm.oldText;
vm.oldText = vm.newText;
vm.newText = oldText;
function diffDemo(index) {
if (typeof index === 'undefined') {
index = 0;
vm.oldText = vm.demos[index]['old'];
vm.newText = vm.demos[index]['new'];
vm.currentDemo = vm.demos[index];
vm.legislativeOverride = vm.demos[index].hasOwnProperty('legislativeOverride') ? vm.demos[index]['legislativeOverride'] : null;
function diffOverride(override, index) {
vm.oldText = override.old;
vm.newText =;
vm.legislativeOverride = override.override;
vm.currentDemo = override;
if (! { = 'Override Demo ' + (index + 1);
vm.currentDemo.isOverride = true;
function diffTableDemo(index) {
.then(function(response) {
vm.oldText =;
vm.newText =;
vm.legislativeOverride = null;
vm.currentDemo = null;
.catch(function(e) {
function updateDemo() {
vm.currentDemo.old = vm.oldText; = vm.newText;
return $'save_demo.php', vm.currentDemo)
.then(function (response) {
return response;
function saveNewDemo() {
var newIndex = vm.demos.length + 1;
if (vm.diffName.length === 0) {
vm.diffName = 'DEMO ' + newIndex;
var newDemo = {'old': vm.oldText, 'new': vm.newText, 'name': vm.diffName, 'legislativeOverride': vm.legislativeOverride};
return $'save_demo.php', newDemo)
.then(function (response) {
vm.currentDemo = newDemo;
return vm.currentDemo;
/**
 * Requests one stored table-diff sample from load_table_diff.php.
 *
 * @param {number} index Key of the sample to load; sent as the `index` field of the JSON body.
 * @returns {*} Whatever $http returns for the request.
 */
function loadTableDiff(index) {
    return $http({
        url: 'load_table_diff.php',
        method: 'POST',
        data: {index: index},
        // $http reads request headers from `headers`; the previous `header` key was ignored.
        headers: {'Content-Type': 'application/json; charset=UTF-8'}
    });
}
function getDiff() {
vm.waiting = false;
vm.loading = true;
vm.diff = null;
$'index.php', {
oldText: vm.oldText,
newText: vm.newText,
matchThreshold: vm.matchThreshold,
tableDiffing: vm.tableDiffing
.then(function (response) {
vm.diff ='diff') ? :;
vm.loading = false;
.catch(function (response) {
console.error('Gists error', response.status,;
function loadDemos() {
.success(function (data) {
vm.demos = data;
function loadOverrides() {
return $http.get('diff.json')
.then(function (response) {
vm.overrides =;
return vm.overrides;
/**
 * Wraps every entry of the debug payload for display and publishes it on the view model.
 *
 * Each value in `data` is replaced in place by `{messages: <value>, isCollapsed: true}`;
 * the mutated object is then assigned to vm.debugOutput.
 *
 * @param {Object} data Debug messages keyed by category.
 */
function addDebugOutput(data) {
    var wrapCategory = function (messages, category) {
        data[category] = {
            messages: messages,
            isCollapsed: true
        };
    };

    angular.forEach(data, wrapCategory);
    vm.debugOutput = data;
}

@ -0,0 +1,246 @@
<!DOCTYPE html>
<html lang="en" ng-app="demo">
<meta charset="utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<meta http-equiv="x-ua-compatible" content="ie=edge">
<link rel="stylesheet" href="bower_components/tether/dist/css/tether.min.css">
<link rel="stylesheet" href="bower_components/bootstrap/dist/css/bootstrap.min.css">
<link rel="stylesheet" href="bower_components/font-awesome/css/font-awesome.min.css">
<link rel="stylesheet" href="bower_components/ng-ckeditor/ng-ckeditor.css">
<link rel="stylesheet" href="bower_components/angular-ui/build/angular-ui.min.css">
<link rel="stylesheet" href="bower_components/AngularJS-Toaster/toaster.min.css">
<link rel="stylesheet" href="bower_components/angular-bootstrap/ui-bootstrap-csp.css">
<link type="text/css" href="codes.css" rel="stylesheet">
<body ng-controller="DemoController as vm">
<!-- Main Navigation -->
<nav class="navbar navbar-light bg-faded">
<a class="navbar-brand" href="#">caxy/php-htmldiff</a>
<ul class="nav navbar-nav">
<li class="nav-item active">
<a class="nav-link" href="#">Demo <span class="sr-only">(current)</span></a>
<!-- Main Content -->
<div class="container-fluid">
<!-- diff controls and input -->
<div class="card">
<div class="card-header">
<button class="btn btn-secondary btn-sm" type="button" data-toggle="collapse" data-target="#diffControls">
<i class="fa fa-compress"></i>
Diff Controls
<div class="pull-right">
<div ng-if="vm.currentDemo">
Current Demo: {{ }}
<button ng-if="!vm.currentDemo.isOverride" type="button" class="btn btn-primary btn-sm" ng-click="vm.updateDemo()">
Update Demo
<div class="card-block collapse in" id="diffControls">
<!-- Diff controls -->
<div class="form-inline row">
<!-- Reset button -->
<div class="btn-group" role="group">
<button type="button" class="btn btn-sm btn-danger-outline" ng-click="vm.reset()">RESET</button>
<!-- Load demo buttons w/ dropdowns -->
<div class="btn-group" role="group">
<div class="btn-group btn-group-sm">
<button type="button" class="btn btn-secondary dropdown-toggle" data-toggle="dropdown" aria-haspopup="true" aria-expanded="false">
Load Custom Demo
<div class="dropdown-menu">
<a href ng-repeat="demo in vm.demos" type="button" class="dropdown-item" ng-class="{active: demo == vm.currentDemo}" ng-click="vm.diffDemo($index)">
{{ }}
<div class="btn-group btn-group-sm" role="group">
<button type="button" class="btn btn-secondary dropdown-toggle" data-toggle="dropdown" aria-haspopup="true" aria-expanded="false">
Load Diff Override Demo
<div class="dropdown-menu">
<a href class="dropdown-item" ng-repeat="override in vm.overrides" ng-class="{active: vm.currentDemo == override}" ng-click="vm.diffOverride(override, $index)">
Override Demo {{ $index + 1 }}
<!-- Load table diff button and input -->
<div class="form-group">
<div class="input-group input-group-sm" role="group">
<span class="input-group-btn">
<button ng-click="vm.diffTableDemo(vm.tableDiffNumber)" type="button" class="btn btn-secondary">Load Table Diff</button>
<input type="number" class="form-control" ng-model="vm.tableDiffNumber" />
<!-- Match Threshold -->
<div class="form-group">
<label for="matchThreshold">Match Threshold</label>
<input type="number" class="form-control form-control-sm" ng-model="vm.matchThreshold" id="matchThreshold" ng-change="vm.update()">
<!-- Table Diffing Checkbox -->
<div class="form-group">
<label class="checkbox-inline" for="tableDiffing">
<input type="checkbox" ng-model="vm.tableDiffing" id="tableDiffing" ng-change="vm.update()"> Use Table Diffing
<!-- Swap Text Button -->
<button type="button" class="btn btn-secondary btn-sm" ng-click="vm.swapText()">Swap Text</button>
<!-- Save as New Demo -->
<div class="form-group">
<div class="input-group input-group-sm">
<input type="text" class="form-control" placeholder="Demo Name" ng-model="vm.diffName" />
<span class="input-group-btn">
<button class="btn btn-secondary" type="button" ng-click="vm.saveNewDemo()">Save as New Demo</button>
</div><!-- end of diff controls -->
<!-- Diff Inputs (Old Text / New Text) -->
<div class="form-group row m-t-2">
<div class="col-sm-6">
<label class="form-control-label" for="oldText">
Old Text
<button type="button" class="btn btn-sm btn-secondary clipboard" data-clipboard-target="#oldText">
<i class="fa fa-clipboard"></i>
<a ng-click="vm.toggleCkEditor()">Toggle CK</a>
<div ng-if="vm.ckEditorEnabled">
<textarea ckeditor="vm.editorOptions" ng-model="vm.oldText" id="oldText" ng-change="vm.update()"></textarea>
<textarea ng-if="!vm.ckEditorEnabled" class="form-control" ng-model="vm.oldText" name="old_text" ng-change="vm.update()" rows="15"></textarea>
<div class="col-sm-6">
<label class="form-control-label" for="newText">
New Text
<button type="button" class="btn btn-sm btn-secondary clipboard" data-clipboard-target="#newText">
<i class="fa fa-clipboard"></i>
<a ng-click="vm.toggleCkEditor()">Toggle CK</a>
<div ng-if="vm.ckEditorEnabled">
<textarea ckeditor="vm.editorOptions" ng-model="vm.newText" id="newText" ng-change="vm.update()"></textarea>
<textarea ng-if="!vm.ckEditorEnabled" class="form-control" ng-model="vm.newText" name="new_text" ng-change="vm.update()" rows="15"></textarea>
</div><!-- end of diff inputs -->
</div><!-- end of diff controls card-block -->
</div><!-- end of diff controls card -->
<!-- Diff Output -->
<div class="card">
<div class="card-header">
<div class="btn-group">
<button class="btn btn-secondary btn-sm" type="button" data-toggle="collapse" data-target="#diffBlock">
<i class="fa fa-compress"></i>
<button type="button" class="btn btn-sm btn-secondary clipboard" data-clipboard-target="#diffPreview">
<i class="fa fa-clipboard"></i>
<button type="button" class="btn btn-sm btn-secondary" ng-click="vm.update()">
<i class="fa fa-refresh"></i>
Diff Output
<span ng-show="vm.loading || vm.waiting">- {{ vm.loading ? 'Loading' : 'Waiting' }}...</span>
<div class="card-block collapse in" id="diffBlock">
<div class="form-group row">
<div class="col-sm-12">
<div id="diffPreview" class="html-preview" ng-bind-html="vm.trustHtml(vm.diff)"></div>
</div><!-- end of diff output -->
<!-- Diff Output (HTML) -->
<div class="card">
<div class="card-header">
<button class="btn btn-secondary btn-sm" type="button" data-toggle="collapse" data-target="#rawDiffBlock">
<i class="fa fa-compress"></i>
<label class="form-control-label" for="rawDiff">
Diff Output (HTML)
<button type="button" class="btn btn-sm btn-secondary clipboard" data-clipboard-target="#rawDiff">
<i class="fa fa-clipboard"></i>
<span ng-show="vm.loading || vm.waiting">- {{ vm.loading ? 'Loading' : 'Waiting' }}...</span>
<div class="card-block collapse" id="rawDiffBlock">
<div class="form-group row">
<div class="col-sm-12">
<textarea id="rawDiff" class="form-control" ng-model="vm.diff" name="diff" readonly ng-change="vm.update()" rows="15"></textarea>
</div><!-- end of diff output (html) -->
<!-- Debug Output -->
<div class="row">
<div class="col-sm-6">
<h3>Debug Output</h3>
<div class="card" ng-repeat="(category, categoryMessages) in vm.debugOutput track by category">
<div class="card-header">
<a ng-click="categoryMessages.isCollapsed = !categoryMessages.isCollapsed">
{{ category }}
<div class="card-block" uib-collapse="categoryMessages.isCollapsed">
<pre ng-repeat="message in categoryMessages.messages track by $index">
{{ message }}
<div class="col-sm-6" ng-show="vm.legislativeOverride">
<h3>Legislative Override</h3>
<div class="html-preview" ng-bind-html="vm.trustHtml(vm.legislativeOverride)"></div>
</div><!-- end of debug output -->
</div><!-- end of outer container div -->
<script src="bower_components/jquery/dist/jquery.min.js"></script>
<script src="bower_components/tether/dist/js/tether.min.js"></script>
<script src="bower_components/bootstrap/dist/js/bootstrap.min.js"></script>
<script src="bower_components/angular/angular.min.js"></script>
<script src="bower_components/angular-sanitize/angular-sanitize.min.js"></script>
<script src="bower_components/clipboard/dist/clipboard.min.js"></script>
<script src="bower_components/ckeditor/ckeditor.js"></script>
<script src="bower_components/ng-ckeditor/ng-ckeditor.min.js"></script>
<script src="bower_components/angular-ui/build/angular-ui.min.js"></script>
<script src="bower_components/angular-animate/angular-animate.min.js"></script>
<script src="bower_components/AngularJS-Toaster/toaster.min.js"></script>
<script src="bower_components/angular-bootstrap/ui-bootstrap-tpls.min.js"></script>
<script type="text/javascript" src="demo.module.js"></script>
<script type="text/javascript" src="demo.controller.js"></script>
new Clipboard('.clipboard');

@ -0,0 +1,9 @@
(function() {
'use strict';
angular.module('demo', [

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long

@ -0,0 +1,56 @@
use Caxy\HtmlDiff\HtmlDiff;
ini_set('display_errors', 1);
require __DIR__.'/../vendor/autoload.php';
$debugOutput = array();
/**
 * Appends a message to the global $debugOutput log, grouped by category.
 *
 * @param mixed  $value Message to record; anything that is not a string is rendered with var_export().
 * @param string $key   Category the message is filed under.
 */
function addDebugOutput($value, $key = 'general')
{
    global $debugOutput;

    $message = is_string($value) ? $value : var_export($value, true);

    // Start a new category the first time its key is seen.
    if (!array_key_exists($key, $debugOutput)) {
        $debugOutput[$key] = array();
    }

    $debugOutput[$key][] = $message;
}
$input = file_get_contents('php://input');
if ($input) {
header('Content-Type: application/json');
$data = json_decode($input, true);
$oldText = $data['oldText'];
$newText = $data['newText'];
$useTableDiffing = isset($data['tableDiffing']) ? $data['tableDiffing'] : true;
$diff = new HtmlDiff($oldText, $newText, 'UTF-8', array());
if (array_key_exists('matchThreshold', $data)) {
$diffOutput = $diff->build();
$diffOutput = mb_convert_encoding($diffOutput, 'UTF-8');
$jsonOutput = json_encode(array('diff' => $diffOutput, 'debug' => $debugOutput));
if (false === $jsonOutput) {
throw new \Exception('Failed to encode JSON: '.json_last_error_msg());
echo $jsonOutput;
} else {
header('Content-Type: text/html');
echo file_get_contents('demo.html');

@ -0,0 +1,22 @@
// Demo endpoint: returns one entry of tablediffs.json, selected by the "index"
// field of the JSON request body.
$requestBody = file_get_contents('php://input');
$requestJson = json_decode($requestBody, true);

$index = isset($requestJson['index']) ? $requestJson['index'] : null;

// empty() alone treats 0 and "0" as missing, which made an entry stored under
// key 0 unreachable; numeric values are therefore accepted explicitly.
if (empty($index) && !is_numeric($index)) {
    throw new \Exception('index is required.');
}

$jsonFile = __DIR__.'/tablediffs.json';
$demoStorage = json_decode(file_get_contents($jsonFile), true);

// A missing or malformed storage file decodes to a non-array; report that
// instead of handing it to array_key_exists().
if (!is_array($demoStorage)) {
    throw new \Exception("Unable to read table diffs from file: $jsonFile");
}

if (!array_key_exists($index, $demoStorage)) {
    throw new \Exception('index not found.');
}

$targetDemo = $demoStorage[$index];

header('Content-Type: application/json');
echo json_encode($targetDemo);

@ -0,0 +1,46 @@
// Demo endpoint: stores the posted old/new text pair in demos.json. An entry
// with the same name has its texts overwritten; otherwise a new entry is appended.
$requestBody = file_get_contents('php://input');
$requestJson = json_decode($requestBody, true);

if (empty($requestJson['old']) && empty($requestJson['new'])) {
    throw new \Exception('Old text or new text is required.');
}

$jsonFile = __DIR__.'/demos.json';

// A missing or blank storage file means "no demos saved yet". A file that
// exists but cannot be read or decoded is an error, so it is never overwritten
// with an empty list.
$demoStorage = array();
if (is_file($jsonFile)) {
    $storedJson = file_get_contents($jsonFile);
    if ($storedJson === false) {
        throw new \Exception("Unable to read demos from file: $jsonFile");
    }

    if (trim($storedJson) !== '') {
        $demoStorage = json_decode($storedJson, true);
        if (!is_array($demoStorage)) {
            throw new \Exception("Unable to read demos from file: $jsonFile");
        }
    }
}

if (empty($requestJson['name'])) {
    $requestJson['name'] = 'DEMO '.count($demoStorage);
}

// Only one of the two texts is required, so the other key may be absent.
$oldText = isset($requestJson['old']) ? $requestJson['old'] : null;
$newText = isset($requestJson['new']) ? $requestJson['new'] : null;
$name = $requestJson['name'];
$legislativeOverride = !empty($requestJson['legislativeOverride']) ? $requestJson['legislativeOverride'] : null;

// Find the entry with the same name; when several share it, the last one wins.
$existingDemoIndex = null;
foreach ($demoStorage as $index => $demo) {
    if (isset($demo['name']) && $demo['name'] === $name) {
        $existingDemoIndex = $index;
    }
}

if ($existingDemoIndex !== null) {
    // NOTE(review): the stored legislativeOverride is left untouched on update — confirm this is intended.
    $demoStorage[$existingDemoIndex]['old'] = $oldText;
    $demoStorage[$existingDemoIndex]['new'] = $newText;
} else {
    $demoStorage[] = array(
        'name' => $name,
        'old' => $oldText,
        'new' => $newText,
        'legislativeOverride' => $legislativeOverride,
    );
}

if (false === file_put_contents($jsonFile, json_encode($demoStorage))) {
    throw new \Exception("Unable to save to file: $jsonFile");
}

File diff suppressed because one or more lines are too long

@ -0,0 +1,116 @@
Differences from rashid2538/php-htmldiff
.. contents:: Table of Contents
Code Styling and Clean-up
* Added namespaces, split up classes to their own files, some code styling changes
* Allow the specialCaseOpeningTags and specialCaseClosingTags properties to be modified by passing an array into the constructor or using set/add/remove functions
* Updated the demo to accept input and diff via AJAX
* Added static properties for the default config variables
Bug Fixes
* Fixed an index out of range bug (may have been fixed on the original repo since): c9ba1fa_
* Check for empty oldText or newText before processing del or ins in processReplaceOperation function
New Features
Isolated Diffing of certain HTML elements
This is one of the largest changes from the original repository.
For more information, see the release notes for tag `0.0.6`_
List Diffing
Similar to the Isolated Diffing feature, but specifically for HTML lists.
More information is to come on this, and there will definitely be some tweaks and configuration options added for this
feature. Currently there is no easy way to enable/disable the feature, so if you're having issues with it I suggest
using the `0.0.6`_ or earlier release.
Table Diffing
Similar to the Isolated Diffing and List Diffing features, but specifically for HTML tables.
More information to come on this soon.
New option to group together diffed words by not matching on whitespace-only. Option is enabled by default.
This was a specific requirement for an application we use this library for. The original library would replace
single words at a time, but enabling this feature will group replacements instead. See example below.
Old Text::
testing some text here and there
New Text::
testing other words here and there
With $groupDiffs = false (original functionality)::
testing <del>some</del><ins>other</ins> <del>text</del><ins>words</ins> here and there
With $groupDiffs = true (new feature)::
testing <del>some text</del><ins>other words</ins> here and there
Change diffing to strike through entire words/numbers if they contain periods or commas within the word
This change introduced a new property ``$specialCaseChars``, which defaults to the following characters: ``.`` ``,`` ``(`` ``)`` ``'``
This feature can be "disabled" by simply setting the $specialCaseChars to an empty array i.e. ``$diff->setSpecialCaseChars(array())``
In the original library, special characters are treated as their own "words" even if they are in the middle of a word.
This causes weird things to happen when diffing numbers that have a comma or a period in the middle of the number.
For example, diffing ``10,000.50`` against ``11,100.75`` gives you:
Original Functionality::
<del class="diffmod">10</del><ins class="diffmod">11</ins>,<del class="diffmod">000</del><ins class="diffmod">100</ins>.<del class="diffmod">50</del><ins class="diffmod">75</ins>
This is very difficult to read, so the new feature allows you to add ``.`` and ``,`` to the ``$specialCaseChars`` array in order
to get output that looks like::
<del class="diffmod">10,000.50</del><ins class="diffmod">11,100.75</ins>
Note: It will *not* treat the specialCaseChars as part of the word if it is at the beginning or end of the word,
so normal periods or commas at the end of words will still be diffed like the original.
Added option to insert a space between ``<del>`` and ``<ins>`` tags. Disabled by default.
This was a requirement for one of our applications that uses this library.
New property ``$insertSpaceInReplace`` was added, and setting it to true will simply add a space between
the ``<del>`` and ``<ins>`` tags in replace operations, which was requested for easier reading.
Enable it by calling ``$diff->setInsertSpaceInReplace(true);``
Original Functionality::
New Functionality::
<del>Old</del> <ins>New</ins>
.. _c9ba1fa:
.. _0.0.6:

@ -0,0 +1,490 @@
namespace Caxy\HtmlDiff;
* Class AbstractDiff
* @package Caxy\HtmlDiff
abstract class AbstractDiff
* @var array
* @deprecated since 0.1.0
public static $defaultSpecialCaseTags = array('strong', 'b', 'i', 'big', 'small', 'u', 'sub', 'sup', 'strike', 's', 'p');
* @var array
* @deprecated since 0.1.0
public static $defaultSpecialCaseChars = array('.', ',', '(', ')', '\'');
* @var bool
* @deprecated since 0.1.0
public static $defaultGroupDiffs = true;
* @var HtmlDiffConfig
protected $config;
* @var string
protected $content;
* @var string
protected $oldText;
* @var string
protected $newText;
* @var array
protected $oldWords = array();
* @var array
protected $newWords = array();
* @var DiffCache[]
private $diffCaches = array();
* AbstractDiff constructor.
* @param string $oldText
* @param string $newText
* @param string $encoding
* @param null|array $specialCaseTags
* @param null|bool $groupDiffs
public function __construct($oldText, $newText, $encoding = 'UTF-8', $specialCaseTags = null, $groupDiffs = null)
$this->config = HtmlDiffConfig::create()->setEncoding($encoding);
if ($specialCaseTags !== null) {
if ($groupDiffs !== null) {
$this->oldText = $this->purifyHtml(trim($oldText));
$this->newText = $this->purifyHtml(trim($newText));
$this->content = '';
* @return bool|string
abstract public function build();
/**
 * Returns the DiffCache that wraps the configured cache provider, creating it on first use.
 *
 * Instances are kept in $this->diffCaches, keyed by the provider's spl_object_hash().
 *
 * @return DiffCache|null Null when hasDiffCache() reports that no provider is configured.
 */
protected function getDiffCache()
{
    if (!$this->hasDiffCache()) {
        return null;
    }

    $provider = $this->getConfig()->getCacheProvider();
    $cacheKey = spl_object_hash($provider);

    if (!array_key_exists($cacheKey, $this->diffCaches)) {
        $this->diffCaches[$cacheKey] = new DiffCache($provider);
    }

    return $this->diffCaches[$cacheKey];
}
* @return bool
protected function hasDiffCache()
return null !== $this->getConfig()->getCacheProvider();
* @return HtmlDiffConfig
public function getConfig()
return $this->config;
* @param HtmlDiffConfig $config
* @return AbstractDiff
public function setConfig(HtmlDiffConfig $config)
$this->config = $config;
return $this;
* @return int
* @deprecated since 0.1.0
public function getMatchThreshold()
return $this->config->getMatchThreshold();
* @param int $matchThreshold
* @return AbstractDiff
* @deprecated since 0.1.0
public function setMatchThreshold($matchThreshold)
return $this;
* @param array $chars
* @deprecated since 0.1.0
public function setSpecialCaseChars(array $chars)
* @return array|null
* @deprecated since 0.1.0
public function getSpecialCaseChars()
return $this->config->getSpecialCaseChars();
* @param string $char
* @deprecated since 0.1.0
public function addSpecialCaseChar($char)
* @param string $char
* @deprecated since 0.1.0
public function removeSpecialCaseChar($char)
* @param array $tags
* @deprecated since 0.1.0
public function setSpecialCaseTags(array $tags = array())
* @param string $tag
* @deprecated since 0.1.0
public function addSpecialCaseTag($tag)
* @param string $tag
* @deprecated since 0.1.0
public function removeSpecialCaseTag($tag)
* @return array|null
* @deprecated since 0.1.0
public function getSpecialCaseTags()
return $this->config->getSpecialCaseTags();
* @return string
public function getOldHtml()
return $this->oldText;
* @return string
public function getNewHtml()
return $this->newText;
* @return string
public function getDifference()
return $this->content;
* @param bool $boolean
* @return $this
* @deprecated since 0.1.0
public function setGroupDiffs($boolean)
return $this;
* @return bool
* @deprecated since 0.1.0
public function isGroupDiffs()
return $this->config->isGroupDiffs();
/**
 * Builds a case-insensitive regular expression matching the start of an opening tag.
 *
 * The pattern covers "<", the tag name and any following characters up to, but not
 * including, the closing ">". $tag is inserted verbatim (it is not preg_quote()d).
 *
 * @param string $tag Tag name, e.g. "strong".
 *
 * @return string Regular expression including delimiters and the "i" modifier.
 */
protected function getOpeningTag($tag)
{
    return sprintf('/<%s[^>]*/i', $tag);
}
/**
 * Builds the literal closing tag for a tag name.
 *
 * @param string $tag Tag name, e.g. "strong".
 *
 * @return string The closing tag, e.g. "</strong>".
 */
protected function getClosingTag($tag)
{
    return sprintf('</%s>', $tag);
}
/**
 * Returns the text located after the first occurrence of $start and before
 * the last occurrence of $end that follows it.
 *
 * @param string $str   Text to search.
 * @param string $start Opening delimiter.
 * @param string $end   Closing delimiter.
 *
 * @return string The enclosed text, or an empty string when either
 *                delimiter is not found.
 */
protected function getStringBetween($str, $start, $end)
{
    $afterStart = explode($start, $str, 2);
    if (count($afterStart) < 2) {
        return '';
    }

    $segments = explode($end, $afterStart[1]);
    if (count($segments) < 2) {
        return '';
    }

    // Everything after the last $end is discarded; earlier occurrences of
    // $end stay part of the result.
    return implode($end, array_slice($segments, 0, -1));
}
/**
 * Returns the markup to be diffed.
 *
 * The former Tidy-based clean-up was guarded by a condition ending in
 * "&& false", so it could never run, and it called getStringBetween() with
 * two arguments although that method requires three. The unreachable branch
 * has been removed; the observable behaviour (input returned unchanged) is
 * the same.
 *
 * @param string $html Markup to prepare.
 *
 * @return string The markup, unchanged.
 */
protected function purifyHtml($html)
{
    return $html;
}
/**
 * Tokenises both inputs: each text is split into characters with explode()
 * and then grouped into words by convertHtmlToListOfWords(). The results are
 * stored in the oldWords and newWords properties.
 */
protected function splitInputsToWords()
{
    $oldCharacters = $this->explode($this->oldText);
    $this->oldWords = $this->convertHtmlToListOfWords($oldCharacters);

    $newCharacters = $this->explode($this->newText);
    $this->newWords = $this->convertHtmlToListOfWords($newCharacters);
}
/**
 * Checks whether the text is alphanumeric once every configured special-case
 * character has been removed from it.
 *
 * @param string $text Text to inspect.
 *
 * @return bool
 */
protected function isPartOfWord($text)
{
    $specialChars = $this->config->getSpecialCaseChars();
    $stripped = str_replace($specialChars, '', $text);

    return ctype_alnum($stripped);
}
/**
 * Groups a list of single characters into "words": complete tags, runs of
 * whitespace (collapsed to one space) and runs of word characters.
 *
 * The scanner is a three-state machine ('character', 'tag', 'whitespace').
 * Every case ends with an explicit break; without them a character handled
 * in one state fell through and was processed again by the states below.
 *
 * @param array $characterString List of single characters, as produced by explode().
 *
 * @return array List of words in input order.
 */
protected function convertHtmlToListOfWords($characterString)
{
    $mode = 'character';
    $current_word = '';
    $words = array();

    foreach ($characterString as $i => $character) {
        switch ($mode) {
            case 'character':
                if ($this->isStartOfTag($character)) {
                    if ($current_word != '') {
                        $words[] = $current_word;
                    }
                    $current_word = "<";
                    $mode = 'tag';
                } elseif (preg_match("/\s/", $character)) {
                    if ($current_word !== '') {
                        $words[] = $current_word;
                    }
                    $current_word = preg_replace('/\s+/S', ' ', $character);
                    $mode = 'whitespace';
                } else {
                    if (
                        (ctype_alnum($character) && (strlen($current_word) == 0 || $this->isPartOfWord($current_word))) ||
                        (in_array($character, $this->config->getSpecialCaseChars()) && isset($characterString[$i+1]) && $this->isPartOfWord($characterString[$i+1]))
                    ) {
                        $current_word .= $character;
                    } else {
                        // Same guard as the other branches: never emit an
                        // empty word (it used to happen when punctuation
                        // was the first character of the input).
                        if ($current_word !== '') {
                            $words[] = $current_word;
                        }
                        $current_word = $character;
                    }
                }
                break;

            case 'tag':
                if ($this->isEndOfTag($character)) {
                    $current_word .= ">";
                    $words[] = $current_word;
                    $current_word = "";
                    // The original tested !preg_match('[^\s]', $character).
                    // PCRE reads the brackets as delimiters, so the pattern
                    // is "^\s"; $character is ">" here, hence the test was
                    // always true and the scanner always resumed in
                    // whitespace mode. That behaviour is kept explicitly.
                    $mode = 'whitespace';
                } else {
                    $current_word .= $character;
                }
                break;

            case 'whitespace':
                if ($this->isStartOfTag($character)) {
                    if ($current_word !== '') {
                        $words[] = $current_word;
                    }
                    $current_word = "<";
                    $mode = 'tag';
                } elseif (preg_match("/\s/", $character)) {
                    $current_word .= $character;
                    $current_word = preg_replace('/\s+/S', ' ', $current_word);
                } else {
                    if ($current_word != '') {
                        $words[] = $current_word;
                    }
                    $current_word = $character;
                    $mode = 'character';
                }
                break;
        }
    }

    // Flush whatever is still being accumulated.
    if ($current_word != '') {
        $words[] = $current_word;
    }

    return $words;
}
/**
 * Tells whether the given character opens a tag.
 *
 * @param string $val Character to test.
 *
 * @return bool True when $val loosely equals "<".
 */
protected function isStartOfTag($val)
{
    $opener = "<";

    return $opener == $val;
}
/**
 * Tells whether the given character closes a tag.
 *
 * @param string $val Character to test.
 *
 * @return bool True when $val loosely equals ">".
 */
protected function isEndOfTag($val)
{
    $closer = ">";

    return $closer == $val;
}
/**
 * Tells whether the value consists solely of whitespace.
 *
 * The previous pattern, '[^\s]', carried no explicit delimiters, so PCRE
 * used the square brackets as delimiters and the effective pattern was
 * "^\s". Combined with the negation the method returned true for text that
 * did NOT start with whitespace, i.e. the opposite of its name.
 *
 * @param string $value Text to test.
 *
 * @return bool True when $value contains no non-whitespace character
 *              (an empty string therefore also yields true).
 */
protected function isWhiteSpace($value)
{
    return !preg_match('/\S/', $value);
}
/**
 * Splits a UTF-8 string into a list of single characters.
 *
 * PREG_SPLIT_NO_EMPTY drops the empty strings that an empty pattern
 * otherwise yields before the first and after the last character. When the
 * input is not valid UTF-8, preg_split() returns false; the text is then
 * split byte-wise so callers always receive an array.
 *
 * @param string $value Text to split.
 *
 * @return array List of characters (empty for an empty string).
 */
protected function explode($value)
{
    // as suggested by @onassar
    $characters = preg_split('//u', $value, -1, PREG_SPLIT_NO_EMPTY);

    if ($characters === false) {
        $value = (string) $value;

        return $value === '' ? array() : str_split($value);
    }

    return $characters;
}

@ -0,0 +1,112 @@
namespace Caxy\HtmlDiff;
use Doctrine\Common\Cache\Cache;
/**
 * Class DiffCache
 *
 * Wraps a Doctrine cache provider and addresses entries by a key derived
 * from the pair of texts being compared.
 *
 * @package Caxy\HtmlDiff
 */
class DiffCache
{
    /**
     * Cache backend every operation is delegated to.
     *
     * @var Cache
     */
    protected $cacheProvider;

    /**
     * DiffCache constructor.
     *
     * @param Cache $cacheProvider Cache backend to use.
     */
    public function __construct(Cache $cacheProvider)
    {
        $this->cacheProvider = $cacheProvider;
    }

    /**
     * Returns the cache backend in use.
     *
     * @return Cache
     */
    public function getCacheProvider()
    {
        return $this->cacheProvider;
    }

    /**
     * Replaces the cache backend.
     *
     * @param Cache $cacheProvider New cache backend.
     *
     * @return DiffCache The current instance, for chaining.
     */
    public function setCacheProvider($cacheProvider)
    {
        $this->cacheProvider = $cacheProvider;

        return $this;
    }

    /**
     * Asks the backend whether an entry exists for the given pair of texts.
     *
     * @param string $oldText
     * @param string $newText
     *
     * @return bool
     */
    public function contains($oldText, $newText)
    {
        $key = $this->getHashKey($oldText, $newText);

        return $this->cacheProvider->contains($key);
    }

    /**
     * Fetches the entry stored for the given pair of texts.
     *
     * @param string $oldText
     * @param string $newText
     *
     * @return string Whatever the backend returns for the key.
     */
    public function fetch($oldText, $newText)
    {
        $key = $this->getHashKey($oldText, $newText);

        return $this->cacheProvider->fetch($key);
    }

    /**
     * Stores data for the given pair of texts.
     *
     * @param string $oldText
     * @param string $newText
     * @param string $data     Value to store.
     * @param int    $lifeTime Lifetime handed to the backend (default 0).
     *
     * @return bool Result reported by the backend.
     */
    public function save($oldText, $newText, $data, $lifeTime = 0)
    {
        $key = $this->getHashKey($oldText, $newText);

        return $this->cacheProvider->save($key, $data, $lifeTime);
    }

    /**
     * Deletes the entry stored for the given pair of texts.
     *
     * @param string $oldText
     * @param string $newText
     *
     * @return bool Result reported by the backend.
     */
    public function delete($oldText, $newText)
    {
        $key = $this->getHashKey($oldText, $newText);

        return $this->cacheProvider->delete($key);
    }

    /**
     * Returns the statistics reported by the backend.
     *
     * @return array|null
     */
    public function getStats()
    {
        return $this->cacheProvider->getStats();
    }

    /**
     * Builds the cache key: the MD5 of each text, joined by an underscore.
     *
     * @param string $oldText
     * @param string $newText
     *
     * @return string
     */
    protected function getHashKey($oldText, $newText)
    {
        return md5($oldText) . '_' . md5($newText);
    }
}

@ -0,0 +1,795 @@
namespace Caxy\HtmlDiff;
use Caxy\HtmlDiff\Table\TableDiff;
* Class HtmlDiff
* @package Caxy\HtmlDiff
class HtmlDiff extends AbstractDiff
* @var array
protected $wordIndices;
* @var array
protected $oldTables;
* @var array
protected $newTables;
* @var array
protected $newIsolatedDiffTags;
* @var array
protected $oldIsolatedDiffTags;
/**
 * Factory that builds a diff instance for two HTML strings.
 *
 * @param string              $oldText Original markup.
 * @param string              $newText Revised markup.
 * @param HtmlDiffConfig|null $config  Configuration to apply; when null the
 *                                     new instance's configuration is left
 *                                     untouched.
 *
 * @return self
 */
public static function create($oldText, $newText, HtmlDiffConfig $config = null)
{
    $diff = new self($oldText, $newText);

    if (null !== $config) {
        // The supplied configuration has to be attached here; otherwise it
        // is silently discarded and nested diffs lose the caller's settings.
        $diff->setConfig($config);
    }

    return $diff;
}
/**
 * Stores the table-diffing flag on the configuration object.
 *
 * @param bool $bool Whether tables should be diffed with the table differ.
 *
 * @return $this
 *
 * @deprecated since 0.1.0
 */
public function setUseTableDiffing($bool)
{
    // diffIsolatedPlaceholder() reads this flag from the configuration, so
    // the value has to be forwarded there to have any effect.
    $this->config->setUseTableDiffing($bool);

    return $this;
}
/**
 * Stores the insert-space-in-replace flag on the configuration object.
 *
 * @param boolean $boolean New value of the flag.
 *
 * @return HtmlDiff The current instance, for chaining.
 *
 * @deprecated since 0.1.0
 */
public function setInsertSpaceInReplace($boolean)
{
    // getInsertSpaceInReplace() reads from the configuration, so the value
    // has to be written there.
    $this->config->setInsertSpaceInReplace($boolean);

    return $this;
}
/**
 * Reads the insert-space-in-replace flag from the configuration object.
 *
 * @return boolean
 *
 * @deprecated since 0.1.0
 */
public function getInsertSpaceInReplace()
{
    $flag = $this->config->isInsertSpaceInReplace();

    return $flag;
}
/**
 * Computes the diff between the old and the new text and returns it.
 *
 * A cached result is returned when a diff cache is configured and already
 * holds an entry for this pair of texts. Otherwise the inputs are tokenised,
 * isolated tags are swapped for placeholders, the new words are indexed, and
 * every resulting operation is rendered into the content buffer. The result
 * is saved to the cache when one is configured.
 *
 * @return string The diff output.
 */
public function build()
{
    if ($this->hasDiffCache() && $this->getDiffCache()->contains($this->oldText, $this->newText)) {
        $this->content = $this->getDiffCache()->fetch($this->oldText, $this->newText);

        return $this->content;
    }

    // These three steps populate oldWords/newWords, the isolated-tag maps
    // and wordIndices. operations() and findMatch() read all of them, so
    // skipping the preparation leaves nothing to compare.
    $this->splitInputsToWords();
    $this->replaceIsolatedDiffTags();
    $this->indexNewWords();

    foreach ($this->operations() as $item) {
        $this->performOperation($item);
    }

    if ($this->hasDiffCache()) {
        $this->getDiffCache()->save($this->oldText, $this->newText, $this->content);
    }

    return $this->content;
}
/**
 * Rebuilds wordIndices: a map from each word of the new text to the list of
 * positions at which it occurs. Tags are indexed without their attributes.
 */
protected function indexNewWords()
{
    $this->wordIndices = array();

    foreach ($this->newWords as $position => $token) {
        $key = $this->isTag($token) ? $this->stripTagAttributes($token) : $token;

        if (!isset($this->wordIndices[$key])) {
            $this->wordIndices[$key] = array();
        }

        $this->wordIndices[$key][] = $position;
    }
}
/**
 * Replaces isolated tag runs in both word lists with placeholders and keeps
 * the extracted words in oldIsolatedDiffTags / newIsolatedDiffTags.
 * The word lists are passed by reference and modified in place.
 */
protected function replaceIsolatedDiffTags()
{
    $extracted = $this->createIsolatedDiffTagPlaceholders($this->oldWords);
    $this->oldIsolatedDiffTags = $extracted;

    $extracted = $this->createIsolatedDiffTagPlaceholders($this->newWords);
    $this->newIsolatedDiffTags = $extracted;
}
/**
 * Finds every outermost isolated-diff element in the word list, replaces the
 * whole run (opening tag to matching closing tag) with the placeholder
 * configured for that tag, and returns the words that were removed.
 *
 * The nesting counter is now incremented on each opening tag and decremented
 * on each closing tag. It previously never changed, so the closing branch
 * was unreachable and no element was ever isolated.
 *
 * @param array $words Word list, modified in place.
 *
 * @return array Map of placeholder position (in the modified list) to the
 *               list of original words the placeholder stands for.
 */
protected function createIsolatedDiffTagPlaceholders(&$words)
{
    $openIsolatedDiffTags = 0;
    $isolatedDiffTagIndicies = array();
    $isolatedDiffTagStart = 0;
    $currentIsolatedDiffTag = null;

    foreach ($words as $index => $word) {
        $openIsolatedDiffTag = $this->isOpeningIsolatedDiffTag($word, $currentIsolatedDiffTag);
        if ($openIsolatedDiffTag) {
            if ($openIsolatedDiffTags === 0) {
                $isolatedDiffTagStart = $index;
            }
            // Track nesting of the same tag type so only the outermost
            // element closes the run.
            $openIsolatedDiffTags++;
            $currentIsolatedDiffTag = $openIsolatedDiffTag;
        } elseif ($openIsolatedDiffTags > 0 && $this->isClosingIsolatedDiffTag($word, $currentIsolatedDiffTag)) {
            $openIsolatedDiffTags--;
            if ($openIsolatedDiffTags == 0) {
                $isolatedDiffTagIndicies[] = array(
                    'start'   => $isolatedDiffTagStart,
                    'length'  => $index - $isolatedDiffTagStart + 1,
                    'tagType' => $currentIsolatedDiffTag,
                );
                $currentIsolatedDiffTag = null;
            }
        }
    }

    $isolatedDiffTagScript = array();
    // Each replacement shrinks the list by (length - 1) words; $offset maps
    // the recorded start positions onto the already shortened list.
    $offset = 0;
    foreach ($isolatedDiffTagIndicies as $isolatedDiffTagIndex) {
        $start = $isolatedDiffTagIndex['start'] - $offset;
        $placeholderString = $this->config->getIsolatedDiffTagPlaceholder($isolatedDiffTagIndex['tagType']);
        $isolatedDiffTagScript[$start] = array_splice($words, $start, $isolatedDiffTagIndex['length'], $placeholderString);
        $offset += $isolatedDiffTagIndex['length'] - 1;
    }

    return $isolatedDiffTagScript;
}
/**
 * Determines whether the word is the opening tag of an isolated-diff element.
 *
 * When $currentIsolatedDiffTag is given only that tag type is considered;
 * otherwise every tag configured as isolated is tried.
 *
 * The tag name must now be followed by something that cannot belong to a
 * name. Previously "<i" also matched "<img>" and "<a" matched "<abbr>",
 * because the name was only matched as a prefix.
 *
 * @param string      $item                   Word to inspect.
 * @param null|string $currentIsolatedDiffTag Tag type currently open, if any.
 *
 * @return false|string The matching tag name, or false when none matches.
 */
protected function isOpeningIsolatedDiffTag($item, $currentIsolatedDiffTag = null)
{
    $tagsToMatch = $currentIsolatedDiffTag !== null
        ? array($currentIsolatedDiffTag => $this->config->getIsolatedDiffTagPlaceholder($currentIsolatedDiffTag))
        : $this->config->getIsolatedDiffTags();

    foreach (array_keys($tagsToMatch) as $key) {
        $pattern = '#<' . preg_quote($key, '#') . '(?![\w:-])[^>]*>#i';
        if (preg_match($pattern, $item)) {
            return $key;
        }
    }

    return false;
}
/**
 * Determines whether the word is the closing tag of an isolated-diff element.
 *
 * When $currentIsolatedDiffTag is given only that tag type is considered;
 * otherwise every tag configured as isolated is tried.
 *
 * The tag name must now be followed by something that cannot belong to a
 * name. Previously "</b" also matched "</blockquote>" because the name was
 * only matched as a prefix.
 *
 * @param string      $item                   Word to inspect.
 * @param null|string $currentIsolatedDiffTag Tag type currently open, if any.
 *
 * @return false|string The matching tag name, or false when none matches.
 */
protected function isClosingIsolatedDiffTag($item, $currentIsolatedDiffTag = null)
{
    $tagsToMatch = $currentIsolatedDiffTag !== null
        ? array($currentIsolatedDiffTag => $this->config->getIsolatedDiffTagPlaceholder($currentIsolatedDiffTag))
        : $this->config->getIsolatedDiffTags();

    foreach (array_keys($tagsToMatch) as $key) {
        $pattern = '#</' . preg_quote($key, '#') . '(?![\w:-])[^>]*>#i';
        if (preg_match($pattern, $item)) {
            return $key;
        }
    }

    return false;
}
/**
 * Renders one diff operation by dispatching on its action.
 *
 * Each case ends with a break. Without them an 'equal' operation fell
 * through and was additionally rendered as a deletion, an insertion and a
 * replacement. Unknown actions are ignored.
 *
 * @param Operation $operation Operation to render.
 */
protected function performOperation($operation)
{
    switch ($operation->action) {
        case 'equal':
            $this->processEqualOperation($operation);
            break;
        case 'delete':
            $this->processDeleteOperation($operation, "diffdel");
            break;
        case 'insert':
            $this->processInsertOperation($operation, "diffins");
            break;
        case 'replace':
            $this->processReplaceOperation($operation);
            break;
        default:
            break;
    }
}
/**
 * Renders a replacement as a deletion followed by an insertion, both marked
 * with the "diffmod" CSS class.
 *
 * @param Operation $operation Operation to render.
 */
protected function processReplaceOperation($operation)
{
    $cssClass = "diffmod";

    $this->processDeleteOperation($operation, $cssClass);
    $this->processInsertOperation($operation, $cssClass);
}
/**
 * Collects the new-text words covered by the operation, expanding
 * placeholders back into the words they stand for, and emits them wrapped
 * in "ins" markup.
 *
 * @param Operation $operation Operation whose startInNew/endInNew bound the range.
 * @param string    $cssClass  CSS class for the inserted markup.
 */
protected function processInsertOperation($operation, $cssClass)
{
    $collected = array();

    foreach ($this->newWords as $pos => $s) {
        if ($pos < $operation->startInNew || $pos >= $operation->endInNew) {
            continue;
        }

        $isPlaceholder = $this->config->isIsolatedDiffTagPlaceholder($s)
            && isset($this->newIsolatedDiffTags[$pos]);

        if (!$isPlaceholder) {
            $collected[] = $s;
            continue;
        }

        foreach ($this->newIsolatedDiffTags[$pos] as $word) {
            $collected[] = $word;
        }
    }

    $this->insertTag("ins", $cssClass, $collected);
}
/**
 * Collects the old-text words covered by the operation, expanding
 * placeholders back into the words they stand for, and emits them wrapped
 * in "del" markup.
 *
 * @param Operation $operation Operation whose startInOld/endInOld bound the range.
 * @param string    $cssClass  CSS class for the deleted markup.
 */
protected function processDeleteOperation($operation, $cssClass)
{
    $collected = array();

    foreach ($this->oldWords as $pos => $s) {
        if ($pos < $operation->startInOld || $pos >= $operation->endInOld) {
            continue;
        }

        $isPlaceholder = $this->config->isIsolatedDiffTagPlaceholder($s)
            && isset($this->oldIsolatedDiffTags[$pos]);

        if (!$isPlaceholder) {
            $collected[] = $s;
            continue;
        }

        foreach ($this->oldIsolatedDiffTags[$pos] as $word) {
            $collected[] = $word;
        }
    }

    $this->insertTag("del", $cssClass, $collected);
}
/**
 * Diffs the element behind a placeholder that appears in an 'equal'
 * operation, choosing the differ by placeholder type: lists, tables (only
 * when table diffing is enabled), links, and a generic element diff for
 * everything else.
 *
 * @param Operation $operation         Operation containing the placeholder.
 * @param int       $pos               Position of the placeholder in the new words.
 * @param string    $placeholder       Placeholder text.
 * @param bool      $stripWrappingTags Passed on to diffElements() in the generic case.
 *
 * @return string Diff markup for the element.
 */
protected function diffIsolatedPlaceholder($operation, $pos, $placeholder, $stripWrappingTags = true)
{
    $oldText = implode("", $this->findIsolatedDiffTagsInOld($operation, $pos));
    $newText = implode("", $this->newIsolatedDiffTags[$pos]);

    if ($this->isListPlaceholder($placeholder)) {
        return $this->diffList($oldText, $newText);
    }

    if ($this->config->isUseTableDiffing() && $this->isTablePlaceholder($placeholder)) {
        return $this->diffTables($oldText, $newText);
    }

    if ($this->isLinkPlaceholder($placeholder)) {
        return $this->diffLinks($oldText, $newText);
    }

    return $this->diffElements($oldText, $newText, $stripWrappingTags);
}
/**
 * Diffs the contents of two elements with a nested HtmlDiff that shares
 * this instance's configuration.
 *
 * When $stripWrappingTags is true, a leading tag and a trailing closing tag
 * are removed from both texts before diffing, and the ones found on the new
 * text are put back around the result.
 *
 * @param string $oldText           Old element markup.
 * @param string $newText           New element markup.
 * @param bool   $stripWrappingTags Whether to diff only the inner content.
 *
 * @return string Diff markup.
 */
protected function diffElements($oldText, $newText, $stripWrappingTags = true)
{
    $prefix = '';
    $suffix = '';

    if ($stripWrappingTags) {
        $pattern = '/(^<[^>]+>)|(<\/[^>]+>$)/i';
        $found = array();

        if (preg_match_all($pattern, $newText, $found)) {
            // Full matches, in order of appearance: first is kept as the
            // prefix, second (if any) as the suffix.
            if (isset($found[0][0])) {
                $prefix = $found[0][0];
            }
            if (isset($found[0][1])) {
                $suffix = $found[0][1];
            }
        }

        $oldText = preg_replace($pattern, '', $oldText);
        $newText = preg_replace($pattern, '', $newText);
    }

    $inner = HtmlDiff::create($oldText, $newText, $this->config);

    return $prefix . $inner->build() . $suffix;
}
/**
 * Diffs two lists with ListDiffNew, using this instance's configuration.
 *
 * @param string $oldText Old list markup.
 * @param string $newText New list markup.
 *
 * @return string Diff markup.
 */
protected function diffList($oldText, $newText)
{
    return ListDiffNew::create($oldText, $newText, $this->config)->build();
}
/**
 * Diffs two tables with TableDiff, using this instance's configuration.
 *
 * @param string $oldText Old table markup.
 * @param string $newText New table markup.
 *
 * @return string Diff markup.
 */
protected function diffTables($oldText, $newText)
{
    return TableDiff::create($oldText, $newText, $this->config)->build();
}
/**
 * Diffs two links. When their href values differ, the whole old link is
 * shown as deleted followed by the whole new link as inserted; otherwise
 * the link contents are diffed as ordinary elements.
 *
 * @param string $oldText Old link markup.
 * @param string $newText New link markup.
 *
 * @return string Diff markup.
 */
protected function diffLinks($oldText, $newText)
{
    $oldHref = $this->getAttributeFromTag($oldText, 'href');
    $newHref = $this->getAttributeFromTag($newText, 'href');

    if ($oldHref != $newHref) {
        // An explicit format string is required: without it the wrapped old
        // link was used as the format, so any "%" in it was interpreted and
        // the new link never appeared in the output.
        return sprintf(
            '%s%s',
            $this->wrapText($oldText, 'del', 'diffmod diff-href'),
            $this->wrapText($newText, 'ins', 'diffmod diff-href')
        );
    }

    return $this->diffElements($oldText, $newText);
}
/**
 * Appends the unchanged words covered by the operation to the output.
 * Placeholders are replaced by a nested diff of the elements they stand for.
 *
 * @param Operation $operation Operation whose startInNew/endInNew bound the range.
 */
protected function processEqualOperation($operation)
{
    $pieces = array();

    foreach ($this->newWords as $pos => $s) {
        if ($pos < $operation->startInNew || $pos >= $operation->endInNew) {
            continue;
        }

        $isPlaceholder = $this->config->isIsolatedDiffTagPlaceholder($s)
            && isset($this->newIsolatedDiffTags[$pos]);

        $pieces[] = $isPlaceholder
            ? $this->diffIsolatedPlaceholder($operation, $pos, $s)
            : $s;
    }

    $this->content .= implode("", $pieces);
}
/**
 * Extracts the value of a quoted attribute from an anchor tag.
 *
 * Changes from the previous pattern:
 *  - the value is matched lazily, so it stops at the first closing quote
 *    instead of swallowing the attributes that follow;
 *  - the attribute name must start right after whitespace, so "href" no
 *    longer matches inside "data-href";
 *  - the attribute name is escaped before being placed in the pattern.
 *
 * @param string $text      Markup containing the anchor tag.
 * @param string $attribute Attribute name.
 *
 * @return null|string The attribute value, or null when it is not found.
 */
protected function getAttributeFromTag($text, $attribute)
{
    $pattern = sprintf(
        '/<a\s(?:[^>]*\s)?%s=([\'"])(.*?)\1[^>]*>/i',
        preg_quote($attribute, '/')
    );

    $matches = array();
    if (preg_match($pattern, $text, $matches)) {
        return $matches[2];
    }

    return null;
}
/**
 * Tells whether the text is the placeholder of a list element (ol, dl or ul).
 *
 * @param string $text Text to test.
 *
 * @return bool
 */
protected function isListPlaceholder($text)
{
    $listTags = array('ol', 'dl', 'ul');

    return $this->isPlaceholderType($text, $listTags);
}
/**
 * Tells whether the text is the placeholder of a link ("a") element.
 *
 * @param string $text Text to test.
 *
 * @return bool
 */
public function isLinkPlaceholder($text)
{
    $linkTag = 'a';

    return $this->isPlaceholderType($text, $linkTag);
}
/**
 * Tells whether the text equals the placeholder of any of the given tag types.
 *
 * For a type configured as an isolated diff tag the comparison is made
 * against its placeholder; for any other type it is made against the type
 * name itself.
 *
 * @param string       $text   Text to test.
 * @param array|string $types  One tag name or a list of tag names.
 * @param bool         $strict Whether in_array() compares strictly.
 *
 * @return bool
 */
protected function isPlaceholderType($text, $types, $strict = true)
{
    $typeList = is_array($types) ? $types : array($types);

    $candidates = array();
    foreach ($typeList as $type) {
        $candidates[] = $this->config->isIsolatedDiffTag($type)
            ? $this->config->getIsolatedDiffTagPlaceholder($type)
            : $type;
    }

    return in_array($text, $candidates, $strict);
}
/**
 * Tells whether the text is the placeholder of a table element.
 *
 * @param string $text Text to test.
 *
 * @return bool
 */
protected function isTablePlaceholder($text)
{
    $tableTag = 'table';

    return $this->isPlaceholderType($text, $tableTag);
}
/**
 * Returns the old-text words stored for the placeholder that sits at the
 * same relative position inside the operation as $posInNew does in the new
 * text.
 *
 * @param Operation $operation Operation containing the placeholder.
 * @param int       $posInNew  Position of the placeholder in the new words.
 *
 * @return array Words the old placeholder stands for.
 */
protected function findIsolatedDiffTagsInOld($operation, $posInNew)
{
    $relative = $posInNew - $operation->startInNew;
    $posInOld = $operation->startInOld + $relative;

    return $this->oldIsolatedDiffTags[$posInOld];
}
/**
 * Emits the given words wrapped in ins/del markup.
 *
 * Runs of plain words are wrapped with wrapText(). Runs of tags are emitted
 * as they are, with "diffmod" added to the class of the first opening tag.
 * Special-case tags from the configuration additionally get an
 * <ins class="mod"> opened after them or an </ins> closed before them.
 *
 * Fixes compared with the previous version:
 *  - the loop ends once the word list is exhausted (it had no exit);
 *  - the search for a special-case opening tag stops at the first hit;
 *  - the injection string is tested with a string comparison instead of
 *    count(), which raises a TypeError on PHP 8;
 *  - a single-quoted class attribute keeps its single quote when "diffmod"
 *    is prepended (it used to get a mismatched double quote).
 *
 * @param string $tag      "ins" or "del".
 * @param string $cssClass CSS class for the wrapping element.
 * @param array  $words    Words to emit; consumed in place.
 */
protected function insertTag($tag, $cssClass, &$words)
{
    while (true) {
        if (count($words) == 0) {
            break;
        }

        $nonTags = $this->extractConsecutiveWords($words, 'noTag');

        $specialCaseTagInjection = '';
        $specialCaseTagInjectionIsBefore = false;

        if (count($nonTags) != 0) {
            $text = $this->wrapText(implode("", $nonTags), $tag, $cssClass);
            $this->content .= $text;
        } else {
            $firstOrDefault = false;
            foreach ($this->config->getSpecialCaseOpeningTags() as $x) {
                if (preg_match($x, $words[0])) {
                    $firstOrDefault = $x;
                    break;
                }
            }
            if ($firstOrDefault) {
                $specialCaseTagInjection = '<ins class="mod">';
                if ($tag == "del") {
                    unset($words[0]);
                }
            } elseif (array_search($words[0], $this->config->getSpecialCaseClosingTags()) !== false) {
                $specialCaseTagInjection = "</ins>";
                $specialCaseTagInjectionIsBefore = true;
                if ($tag == "del") {
                    unset($words[0]);
                }
            }
        }

        // Nothing left to emit and nothing to inject: done.
        if (count($words) == 0 && $specialCaseTagInjection === '') {
            break;
        }

        if ($specialCaseTagInjectionIsBefore) {
            $this->content .= $specialCaseTagInjection . implode("", $this->extractConsecutiveWords($words, 'tag'));
        } else {
            $workTag = $this->extractConsecutiveWords($words, 'tag');
            if (isset($workTag[0]) && $this->isOpeningTag($workTag[0]) && !$this->isClosingTag($workTag[0])) {
                if (strpos($workTag[0], 'class=')) {
                    $workTag[0] = str_replace('class="', 'class="diffmod ', $workTag[0]);
                    $workTag[0] = str_replace("class='", "class='diffmod ", $workTag[0]);
                } else {
                    $workTag[0] = str_replace(">", ' class="diffmod">', $workTag[0]);
                }
            }
            $this->content .= implode("", $workTag) . $specialCaseTagInjection;
        }
    }
}
/**
 * Tests a word against a condition name: 'tag' requires the word to be a
 * tag, any other value requires it not to be one.
 *
 * @param string $word      Word to test.
 * @param string $condition Condition name.
 *
 * @return bool
 */
protected function checkCondition($word, $condition)
{
    $wordIsTag = $this->isTag($word);

    if ($condition == 'tag') {
        return $wordIsTag;
    }

    return !$wordIsTag;
}
/**
 * Wraps text in an element carrying the given CSS class.
 *
 * @param string $text     Content to wrap.
 * @param string $tagName  Element name, e.g. "ins".
 * @param string $cssClass Value of the class attribute.
 *
 * @return string The wrapped markup.
 */
protected function wrapText($text, $tagName, $cssClass)
{
    $open = '<' . $tagName . ' class="' . $cssClass . '">';
    $close = '</' . $tagName . '>';

    return $open . $text . $close;
}
/**
 * Removes and returns the leading run of words that satisfy the condition.
 *
 * The scan now stops at the FIRST word that fails the condition. Previously
 * it kept going and split at the last failing word, so words that did not
 * satisfy the condition could end up inside the returned run.
 *
 * @param array  $words     Word list; re-indexed and shortened in place.
 * @param string $condition Condition name understood by checkCondition().
 *
 * @return array The extracted words (possibly empty).
 */
protected function extractConsecutiveWords(&$words, $condition)
{
    // Callers may have unset() entries; normalise keys before slicing.
    $words = array_values($words);

    $boundary = null;
    foreach ($words as $i => $word) {
        if (!$this->checkCondition($word, $condition)) {
            $boundary = $i;
            break;
        }
    }

    if ($boundary === null) {
        // Every word satisfies the condition: take them all.
        $items = $words;
        $words = array();

        return $items;
    }

    // A boundary of 0 removes nothing and returns an empty array.
    return array_splice($words, 0, $boundary);
}
/**
 * Tells whether the word is a tag, opening or closing.
 *
 * @param string $item Word to test.
 *
 * @return bool
 */
protected function isTag($item)
{
    if ($this->isOpeningTag($item)) {
        return true;
    }

    return (bool) $this->isClosingTag($item);
}
/**
 * Tests the word against a pattern for anything of the form "<...>".
 * Closing tags match this pattern as well; callers that need a pure opening
 * tag combine this with isClosingTag().
 *
 * @param string $item Word to test.
 *
 * @return bool The preg_match() result (1 on match, 0 otherwise).
 */
protected function isOpeningTag($item)
{
    $pattern = "#<[^>]+>\\s*#iU";

    return preg_match($pattern, $item);
}
/**
 * Tests the word against a pattern for anything of the form "</...>".
 *
 * @param string $item Word to test.
 *
 * @return bool The preg_match() result (1 on match, 0 otherwise).
 */
protected function isClosingTag($item)
{
    $pattern = "#</[^>]+>\\s*#iU";

    return preg_match($pattern, $item);
}
/**
 * Turns the list of matching blocks into an ordered list of operations.
 *
 * The gap before each block becomes a replace, insert or delete operation,
 * depending on which side(s) have unmatched words; the block itself becomes
 * an 'equal' operation. A zero-size sentinel block placed at the end of both
 * word lists makes the trailing gap go through the same logic.
 *
 * NOTE(review): "match" is a reserved word from PHP 8.0 on, so the Match
 * class name used here will not parse there — confirm the target version.
 *
 * @return Operation[]
 */
protected function operations()
{
    $cursorOld = 0;
    $cursorNew = 0;
    $result = array();

    $blocks = $this->matchingBlocks();
    $blocks[] = new Match(count($this->oldWords), count($this->newWords), 0);

    foreach ($blocks as $block) {
        $oldAligned = ($cursorOld == $block->startInOld);
        $newAligned = ($cursorNew == $block->startInNew);

        if ($oldAligned && $newAligned) {
            // No gap on either side: nothing to emit before the block.
            $action = 'none';
        } elseif ($oldAligned) {
            $action = 'insert';
        } elseif ($newAligned) {
            $action = 'delete';
        } else {
            $action = 'replace';
        }

        if ($action != 'none') {
            $result[] = new Operation($action, $cursorOld, $block->startInOld, $cursorNew, $block->startInNew);
        }

        if (count($block) != 0) {
            $result[] = new Operation('equal', $block->startInOld, $block->endInOld(), $block->startInNew, $block->endInNew());
        }

        $cursorOld = $block->endInOld();
        $cursorNew = $block->endInNew();
    }

    return $result;
}
/**
 * Collects the matching blocks between the complete old and new word lists.
 *
 * @return Match[]
 */
protected function matchingBlocks()
{
    $blocks = array();
    $oldCount = count($this->oldWords);
    $newCount = count($this->newWords);

    $this->findMatchingBlocks(0, $oldCount, 0, $newCount, $blocks);

    return $blocks;
}
/**
 * Recursively collects matching blocks inside the given ranges: the best
 * match is located, then the ranges to its left and to its right are
 * searched, so blocks are appended in ascending position order.
 *
 * @param int   $startInOld     First old index (inclusive).
 * @param int   $endInOld       Last old index (exclusive).
 * @param int   $startInNew     First new index (inclusive).
 * @param int   $endInNew       Last new index (exclusive).
 * @param array $matchingBlocks Accumulator, appended to in place.
 */
protected function findMatchingBlocks($startInOld, $endInOld, $startInNew, $endInNew, &$matchingBlocks)
{
    $match = $this->findMatch($startInOld, $endInOld, $startInNew, $endInNew);
    if ($match === null) {
        return;
    }

    $hasLeftRange = $startInOld < $match->startInOld && $startInNew < $match->startInNew;
    if ($hasLeftRange) {
        $this->findMatchingBlocks($startInOld, $match->startInOld, $startInNew, $match->startInNew, $matchingBlocks);
    }

    $matchingBlocks[] = $match;

    $hasRightRange = $match->endInOld() < $endInOld && $match->endInNew() < $endInNew;
    if ($hasRightRange) {
        $this->findMatchingBlocks($match->endInOld(), $endInOld, $match->endInNew(), $endInNew, $matchingBlocks);
    }
}
/**
 * Reduces a tag to its bare name: angle brackets are trimmed, everything
 * from the first space on is dropped, and the name is wrapped in "<" ">".
 *
 * @param string $word Tag text, e.g. '<a href="x">'.
 *
 * @return string Bare tag, e.g. '<a>'.
 */
protected function stripTagAttributes($word)
{
    $inner = trim($word, '<>');
    $parts = explode(' ', $inner);

    return sprintf('<%s>', $parts[0]);
}
/**
 * Finds the longest run of consecutive words shared by the given ranges of
 * the old and new word lists.
 *
 * $matchLengthAt[j] holds the length of the common run ending at new index j
 * for the previous old index, so each run length is extended incrementally.
 *
 * Fixes compared with the previous version:
 *  - words missing from the index are skipped instead of being looked up
 *    (which read an undefined index);
 *  - new positions before the range are skipped and the scan stops at the
 *    first position past the range (positions are stored in ascending order
 *    by indexNewWords());
 *  - the final test is parenthesised so that "no match" really yields null;
 *    with the unparenthesised "&& ... ||" a zero-length match was returned,
 *    which makes findMatchingBlocks() recurse on the same range forever;
 *  - when grouping diffs, a whitespace-only best match is replaced by the
 *    next candidate using the same whitespace test as the final check,
 *    instead of testing the joined string for truthiness.
 *
 * @param int $startInOld First old index (inclusive).
 * @param int $endInOld   Last old index (exclusive).
 * @param int $startInNew First new index (inclusive).
 * @param int $endInNew   Last new index (exclusive).
 *
 * @return Match|null The best match, or null when there is none.
 */
protected function findMatch($startInOld, $endInOld, $startInNew, $endInNew)
{
    $bestMatchInOld = $startInOld;
    $bestMatchInNew = $startInNew;
    $bestMatchSize = 0;
    $matchLengthAt = array();
    $groupDiffs = $this->isGroupDiffs();

    for ($indexInOld = $startInOld; $indexInOld < $endInOld; $indexInOld++) {
        $newMatchLengthAt = array();

        $index = $this->oldWords[$indexInOld];
        if ($this->isTag($index)) {
            $index = $this->stripTagAttributes($index);
        }

        if (!isset($this->wordIndices[$index])) {
            // Word absent from the new text: every running match ends here.
            $matchLengthAt = $newMatchLengthAt;
            continue;
        }

        foreach ($this->wordIndices[$index] as $indexInNew) {
            if ($indexInNew < $startInNew) {
                continue;
            }
            if ($indexInNew >= $endInNew) {
                break;
            }

            $newMatchLength = (isset($matchLengthAt[$indexInNew - 1]) ? $matchLengthAt[$indexInNew - 1] : 0) + 1;
            $newMatchLengthAt[$indexInNew] = $newMatchLength;

            $bestIsOnlyWhitespace = $groupDiffs
                && $bestMatchSize > 0
                && preg_match('/^\s+$/', implode('', array_slice($this->oldWords, $bestMatchInOld, $bestMatchSize)));

            if ($newMatchLength > $bestMatchSize || $bestIsOnlyWhitespace) {
                $bestMatchInOld = $indexInOld - $newMatchLength + 1;
                $bestMatchInNew = $indexInNew - $newMatchLength + 1;
                $bestMatchSize = $newMatchLength;
            }
        }

        $matchLengthAt = $newMatchLengthAt;
    }

    // Skip match if none found or match consists only of whitespace
    if ($bestMatchSize != 0 &&
        (
            !$groupDiffs ||
            !preg_match('/^\s+$/', implode('', array_slice($this->oldWords, $bestMatchInOld, $bestMatchSize)))
        )
    ) {
        return new Match($bestMatchInOld, $bestMatchInNew, $bestMatchSize);
    }

    return null;
}

@ -0,0 +1,488 @@
namespace Caxy\HtmlDiff;
/**
 * Class HtmlDiffConfig
 *
 * Holds the options shared by the diff classes: special-case tags and
 * characters, isolated diff tags and their placeholders, grouping and
 * table-diffing flags, encoding, match threshold and cache settings.
 *
 * Fixes compared with the previous version:
 *  - the constructor builds the opening/closing tag lists for the default
 *    special-case tags (they used to stay empty until a setter was called);
 *  - setSpecialCaseTags() registers each tag (its loop body was empty);
 *  - removeSpecialCaseChar(), removeSpecialCaseTag() and
 *    removeIsolatedDiffTag() actually remove the entry;
 *  - the opening-tag pattern no longer matches a tag name as a mere prefix;
 *  - membership tests use strict comparison;
 *  - the placeholder-conflict message names the tag that owns the placeholder.
 *
 * @package Caxy\HtmlDiff
 */
class HtmlDiffConfig
{
    /**
     * Tag names that get special handling when wrapped in ins/del markup.
     *
     * @var array
     */
    protected $specialCaseTags = array('strong', 'b', 'i', 'big', 'small', 'u', 'sub', 'sup', 'strike', 's', 'p');

    /**
     * Characters that may be treated as part of a word.
     *
     * @var array
     */
    protected $specialCaseChars = array('.', ',', '(', ')', '\'');

    /**
     * @var bool
     */
    protected $groupDiffs = true;

    /**
     * @var bool
     */
    protected $insertSpaceInReplace = false;

    /**
     * @var string
     */
    protected $encoding = 'UTF-8';

    /**
     * Map of tag name to the placeholder that replaces the whole element
     * while the surrounding text is diffed.
     *
     * @var array
     */
    protected $isolatedDiffTags = array(
        'sub' => '[[REPLACE_SUB_SCRIPT]]',
        'sup' => '[[REPLACE_SUPER_SCRIPT]]',
        'table' => '[[REPLACE_TABLE]]',
        'strong' => '[[REPLACE_STRONG]]',
        'b' => '[[REPLACE_B]]',
        'em' => '[[REPLACE_EM]]',
        'i' => '[[REPLACE_I]]',
        'a' => '[[REPLACE_A]]',
    );

    /**
     * @var int
     */
    protected $matchThreshold = 80;

    /**
     * Regular expressions matching the opening tag of each special-case tag.
     *
     * @var array
     */
    protected $specialCaseOpeningTags = array();

    /**
     * Literal closing tags of each special-case tag.
     *
     * @var array
     */
    protected $specialCaseClosingTags = array();

    /**
     * @var bool
     */
    protected $useTableDiffing = true;

    /**
     * @var null|\Doctrine\Common\Cache\Cache
     */
    protected $cacheProvider;

    /**
     * @var null|string
     */
    protected $purifierCacheLocation = null;

    /**
     * @return HtmlDiffConfig
     */
    public static function create()
    {
        return new self();
    }

    /**
     * HtmlDiffConfig constructor.
     *
     * Derives the opening/closing tag lists from the default special-case
     * tags so that they are usable without calling a setter first.
     */
    public function __construct()
    {
        $this->setSpecialCaseTags($this->specialCaseTags);
    }

    /**
     * @return int
     */
    public function getMatchThreshold()
    {
        return $this->matchThreshold;
    }

    /**
     * @param int $matchThreshold
     *
     * @return $this
     */
    public function setMatchThreshold($matchThreshold)
    {
        $this->matchThreshold = $matchThreshold;

        return $this;
    }

    /**
     * @param array $chars
     */
    public function setSpecialCaseChars(array $chars)
    {
        $this->specialCaseChars = $chars;
    }

    /**
     * @return array|null
     */
    public function getSpecialCaseChars()
    {
        return $this->specialCaseChars;
    }

    /**
     * Adds a special-case character unless it is already present.
     *
     * @param string $char
     *
     * @return $this
     */
    public function addSpecialCaseChar($char)
    {
        if (!in_array($char, $this->specialCaseChars, true)) {
            $this->specialCaseChars[] = $char;
        }

        return $this;
    }

    /**
     * Removes a special-case character; unknown characters are ignored.
     *
     * @param string $char
     *
     * @return $this
     */
    public function removeSpecialCaseChar($char)
    {
        $key = array_search($char, $this->specialCaseChars, true);
        if ($key !== false) {
            unset($this->specialCaseChars[$key]);
        }

        return $this;
    }

    /**
     * Replaces the special-case tags and rebuilds the derived opening and
     * closing tag lists from scratch.
     *
     * @param array $tags Tag names without angle brackets.
     *
     * @return $this
     */
    public function setSpecialCaseTags(array $tags = array())
    {
        $this->specialCaseTags = $tags;
        $this->specialCaseOpeningTags = array();
        $this->specialCaseClosingTags = array();

        foreach ($this->specialCaseTags as $tag) {
            // The tag is already in the list; this call only adds the
            // matching opening pattern and closing tag.
            $this->addSpecialCaseTag($tag);
        }

        return $this;
    }

    /**
     * Registers a special-case tag together with its opening pattern and
     * closing tag; entries that already exist are not duplicated.
     *
     * @param string $tag Tag name without angle brackets.
     *
     * @return $this
     */
    public function addSpecialCaseTag($tag)
    {
        if (!in_array($tag, $this->specialCaseTags, true)) {
            $this->specialCaseTags[] = $tag;
        }

        $opening = $this->getOpeningTag($tag);
        $closing = $this->getClosingTag($tag);

        if (!in_array($opening, $this->specialCaseOpeningTags, true)) {
            $this->specialCaseOpeningTags[] = $opening;
        }
        if (!in_array($closing, $this->specialCaseClosingTags, true)) {
            $this->specialCaseClosingTags[] = $closing;
        }

        return $this;
    }

    /**
     * Removes a special-case tag together with its opening pattern and
     * closing tag; unknown tags are ignored.
     *
     * @param string $tag Tag name without angle brackets.
     *
     * @return $this
     */
    public function removeSpecialCaseTag($tag)
    {
        if (($key = array_search($tag, $this->specialCaseTags, true)) !== false) {
            unset($this->specialCaseTags[$key]);

            $opening = $this->getOpeningTag($tag);
            $closing = $this->getClosingTag($tag);

            if (($key = array_search($opening, $this->specialCaseOpeningTags, true)) !== false) {
                unset($this->specialCaseOpeningTags[$key]);
            }
            if (($key = array_search($closing, $this->specialCaseClosingTags, true)) !== false) {
                unset($this->specialCaseClosingTags[$key]);
            }
        }

        return $this;
    }

    /**
     * @return array|null
     */
    public function getSpecialCaseTags()
    {
        return $this->specialCaseTags;
    }

    /**
     * @return boolean
     */
    public function isGroupDiffs()
    {
        return $this->groupDiffs;
    }

    /**
     * @param boolean $groupDiffs
     *
     * @return HtmlDiffConfig
     */
    public function setGroupDiffs($groupDiffs)
    {
        $this->groupDiffs = $groupDiffs;

        return $this;
    }

    /**
     * @return string
     */
    public function getEncoding()
    {
        return $this->encoding;
    }

    /**
     * @param string $encoding
     *
     * @return HtmlDiffConfig
     */
    public function setEncoding($encoding)
    {
        $this->encoding = $encoding;

        return $this;
    }

    /**
     * @return boolean
     */
    public function isInsertSpaceInReplace()
    {
        return $this->insertSpaceInReplace;
    }

    /**
     * @param boolean $insertSpaceInReplace
     *
     * @return HtmlDiffConfig
     */
    public function setInsertSpaceInReplace($insertSpaceInReplace)
    {
        $this->insertSpaceInReplace = $insertSpaceInReplace;

        return $this;
    }

    /**
     * @return array
     */
    public function getIsolatedDiffTags()
    {
        return $this->isolatedDiffTags;
    }

    /**
     * @param array $isolatedDiffTags Map of tag name to placeholder.
     *
     * @return HtmlDiffConfig
     */
    public function setIsolatedDiffTags($isolatedDiffTags)
    {
        $this->isolatedDiffTags = $isolatedDiffTags;

        return $this;
    }

    /**
     * Registers an isolated diff tag.
     *
     * @param string      $tag         Tag name without angle brackets.
     * @param null|string $placeholder Placeholder to use; defaults to
     *                                 "[[REPLACE_<TAG>]]" with the tag name
     *                                 upper-cased.
     *
     * @return $this
     *
     * @throws \InvalidArgumentException When the tag is already registered
     *                                   with another placeholder, or the
     *                                   placeholder belongs to another tag.
     */
    public function addIsolatedDiffTag($tag, $placeholder = null)
    {
        if (null === $placeholder) {
            $placeholder = sprintf('[[REPLACE_%s]]', strtoupper($tag));
        }

        if ($this->isIsolatedDiffTag($tag) && $this->isolatedDiffTags[$tag] !== $placeholder) {
            throw new \InvalidArgumentException(
                sprintf('Isolated diff tag "%s" already exists using a different placeholder', $tag)
            );
        }

        $matchingKey = array_search($placeholder, $this->isolatedDiffTags, true);
        if (false !== $matchingKey && $matchingKey !== $tag) {
            // Name the tag that already owns the placeholder, not the one
            // being added.
            throw new \InvalidArgumentException(
                sprintf('Placeholder already being used for a different tag "%s"', $matchingKey)
            );
        }

        if (!array_key_exists($tag, $this->isolatedDiffTags)) {
            $this->isolatedDiffTags[$tag] = $placeholder;
        }

        return $this;
    }

    /**
     * Unregisters an isolated diff tag; unknown tags are ignored.
     *
     * @param string $tag
     *
     * @return $this
     */
    public function removeIsolatedDiffTag($tag)
    {
        if ($this->isIsolatedDiffTag($tag)) {
            unset($this->isolatedDiffTags[$tag]);
        }

        return $this;
    }

    /**
     * @param string $tag
     *
     * @return bool
     */
    public function isIsolatedDiffTag($tag)
    {
        return array_key_exists($tag, $this->isolatedDiffTags);
    }

    /**
     * @param string $text
     *
     * @return bool
     */
    public function isIsolatedDiffTagPlaceholder($text)
    {
        return in_array($text, $this->isolatedDiffTags, true);
    }

    /**
     * @param string $tag
     *
     * @return null|string The placeholder, or null for an unregistered tag.
     */
    public function getIsolatedDiffTagPlaceholder($tag)
    {
        return $this->isIsolatedDiffTag($tag) ? $this->isolatedDiffTags[$tag] : null;
    }

    /**
     * @return array
     */
    public function getSpecialCaseOpeningTags()
    {
        return $this->specialCaseOpeningTags;
    }

    /**
     * @return array
     */
    public function getSpecialCaseClosingTags()
    {
        return $this->specialCaseClosingTags;
    }

    /**
     * @return boolean
     */
    public function isUseTableDiffing()
    {
        return $this->useTableDiffing;
    }

    /**
     * @param boolean $useTableDiffing
     *
     * @return HtmlDiffConfig
     */
    public function setUseTableDiffing($useTableDiffing)
    {
        $this->useTableDiffing = $useTableDiffing;

        return $this;
    }

    /**
     * @param null|\Doctrine\Common\Cache\Cache $cacheProvider
     *
     * @return $this
     */
    public function setCacheProvider(\Doctrine\Common\Cache\Cache $cacheProvider = null)
    {
        $this->cacheProvider = $cacheProvider;

        return $this;
    }

    /**
     * @return null|\Doctrine\Common\Cache\Cache
     */
    public function getCacheProvider()
    {
        return $this->cacheProvider;
    }

    /**
     * @param null|string $purifierCacheLocation
     *
     * @return $this
     */
    public function setPurifierCacheLocation($purifierCacheLocation = null)
    {
        $this->purifierCacheLocation = $purifierCacheLocation;

        return $this;
    }

    /**
     * @return null|string
     */
    public function getPurifierCacheLocation()
    {
        return $this->purifierCacheLocation;
    }

    /**
     * Builds a case-insensitive pattern matching the opening tag of $tag.
     * The look-ahead keeps "b" from matching "<br>" or "<body>".
     *
     * @param string $tag
     *
     * @return string
     */
    protected function getOpeningTag($tag)
    {
        return '/<' . preg_quote($tag, '/') . '(?![\w:-])[^>]*/i';
    }

    /**
     * @param string $tag
     *
     * @return string
     */
    protected function getClosingTag($tag)
    {
        return "</".$tag.">";
    }
}

@ -0,0 +1,944 @@
namespace Caxy\HtmlDiff;
class ListDiff extends HtmlDiff
* This is the minimum percentage a list item can match its counterpart in order to be considered a match.
* @var integer
protected static $listMatchThreshold = 35;
/** @var array */
protected $listWords = array();
/** @var array */
protected $listTags = array();
/** @var array */
protected $listIsolatedDiffTags = array();
/** @var array */
protected $isolatedDiffTags = array (
* List (li) placeholder.
* @var string
protected static $listPlaceHolder = "[[REPLACE_LIST_ITEM]]";
* Holds the type of list this is ol, ul, dl.
* @var string
protected $listType;
* Used to hold what type of list the old list is.
* @var string
protected $oldListType;
* Used to hold what type of list the new list is.
* @var string
protected $newListType;
* Hold the old/new content of the content of the list.
* @var array
protected $list;
* Contains the old/new child lists content within this list.
* @var array
protected $childLists;
* Contains the old/new text strings that match
* @var array
protected $textMatches;
* Contains the indexed start positions of each list within word string.
* @var array
protected $listsIndex;
* Array that holds the index of all content outside of the array. Format is array(index => content).
* @var array
protected $contentIndex = array();
* Holds the order and data on each list/content block within this list.
* @var array
protected $diffOrderIndex = array();
* This is the opening ol, ul, dl list tag.
* @var string
protected $oldParentTag;
* This is the opening ol, ul, dl list tag.
* @var string
protected $newParentTag;
/**
 * We're using the same functions as the parent in build() to get us to the point of
 * manipulating the data within this class.
 *
 * The preparation steps and the list-specific diff are now actually invoked.
 * Previously the method returned the content buffer without running any of
 * the steps described by its own comments.
 *
 * @return string The diff output accumulated in the content buffer.
 */
public function build()
{
    // Use the parent functions to get the data we need organized.
    $this->splitInputsToWords();
    $this->replaceIsolatedDiffTags();
    $this->indexNewWords();

    // Now use the custom functions in this class to use the data and generate our diff.
    $this->diffListContent();

    return $this->content;
}
* Calls to the actual custom functions of this class, to diff list content.
// NOTE(review): in this view only the step descriptions below are present; no
// statements appear between them. Each comment presumably introduces one call
// to a helper of this class — confirm against the complete file.
protected function diffListContent()
/* Format the list we're focusing on.
* There will always be one list, though passed as an array with one item.
* Format this to only have the list contents, outside of the array.
/* Build an index of content outside of list tags.
/* In cases where we're dealing with nested lists,
* make sure we use placeholders to replace the nested lists
/* Build a list of matches we can reference when we diff the contents of the lists.
* This is needed so that each NEW list node is matched against the best possible OLD list node.
* It helps us determine whether the list was added, removed, or changed.
/* Go through the list of matches, content, and diff each.
* Any nested lists would be sent to parent's diffList function, which creates a new listDiff class.
* This function is used to populate both contentIndex and diffOrderIndex arrays for use in the diff function.
protected function indexContent()
// Rebuilds $this->contentIndex and $this->diffOrderIndex from scratch for every entry of $this->list.
$this->contentIndex = array();
$this->diffOrderIndex = array('new' => array(), 'old' => array());
foreach ($this->list as $type => $list) {
$this->contentIndex[$type] = array();
// Per-side walk state.
// NOTE(review): the statements that update $depth, $parentList, $listCount and $contentCount
// are not visible in this excerpt.
$depth = 0;
$parentList = 0;
$position = 0;
$newBlock = true;
$listCount = 0;
$contentCount = 0;
foreach ($list as $key => $word) {
// An opening list tag seen while $parentList is falsy is recorded as a 'list' entry.
if (!$parentList && $this->isOpeningListTag($word)) {
$this->diffOrderIndex[$type][] = array('type' => 'list', 'position' => $listCount, 'index' => $key);
if (!$parentList && $this->isClosingListTag($word)) {
if ($depth == 0) {
// The next depth-0 word starts a fresh content block.
$newBlock = true;
if ($this->isOpeningIsolatedDiffTag($word)) {
if ($this->isClosingIsolatedDiffTag($word)) {
if ($depth == 0) {
// Register a new 'content' entry once per block, then append words to it.
if ($newBlock && !array_key_exists($contentCount, $this->contentIndex[$type])) {
$this->diffOrderIndex[$type][] = array('type' => 'content', 'position' => $contentCount, 'index' => $key);
$position = $contentCount;
$this->contentIndex[$type][$position] = '';
$this->contentIndex[$type][$position] .= $word;
$newBlock = false;
* This function is used to remove the wrapped ul, ol, or dl characters from this list
* and sets the listType as ul, ol, or dl, so that we can use it later.
* $list is being set here as well, as an array with the old and new version of this list content.
protected function formatThisListContent()
{
    // Sides are handled in a fixed order: 'old' first, then 'new'.
    $sources = array(
        'old' => $this->oldIsolatedDiffTags,
        'new' => $this->newIsolatedDiffTags,
    );

    foreach ($sources as $side => $isolatedTags) {
        // Re-index so the first entry can be addressed as [0] whatever its original key was.
        $entries = array_values($isolatedTags);

        if (count($entries)) {
            $this->list[$side] = $this->formatList($entries[0], $side);
        } else {
            $this->list[$side] = array();
        }
    }

    // The new list's type wins; fall back to the old one when the new type is empty.
    $this->listType = $this->newListType ?: $this->oldListType;
}
* @param array $arrayData
* @param string $index
* @return array
protected function formatList(array $arrayData, $index = 'old')
// Inspects the first and last entries of $arrayData; when both name a registered isolated diff tag,
// records the parent tag and list type for the requested side ('new' or 'old').
$openingTag = $this->getAndStripTag($arrayData[0]);
$closingTag = $this->getAndStripTag($arrayData[count($arrayData) - 1]);
if (array_key_exists($openingTag, $this->isolatedDiffTags) &&
array_key_exists($closingTag, $this->isolatedDiffTags)
) {
if ($index == 'new' && $this->isOpeningTag($arrayData[0])) {
$this->newParentTag = $arrayData[0];
$this->newListType = $this->getAndStripTag($arrayData[0]);
if ($index == 'old' && $this->isOpeningTag($arrayData[0])) {
$this->oldParentTag = $arrayData[0];
$this->oldListType = $this->getAndStripTag($arrayData[0]);
// NOTE(review): the caller's description says the wrapping list tags are removed, but no statement
// visible here modifies $arrayData before it is returned — confirm against the full source.
return $arrayData;
* @param string $tag
* @return string
protected function getAndStripTag($tag)
{
    // Drop everything except ASCII letters, digits and spaces, then keep the first
    // space-separated token (for "<ul class=x>" that is "ul").
    $alphanumericOnly = preg_replace("/[^A-Za-z0-9 ]/", '', $tag);
    $tokens = explode(' ', $alphanumericOnly);

    return $tokens[0];
}
protected function matchAndCompareLists()
// Runs three preparation steps, each described by one comment block below.
// NOTE(review): the calls that implement the steps are not visible in this excerpt.
* Build the an array (childLists) to hold the contents of the list nodes within this list.
* This only holds the content of each list node.
* Index the list, starting positions, so that we can refer back to it later.
* This is used to see where one list node starts and another ends.
* Compare the lists and build $textMatches array with the matches.
* Each match is an array of "new" and "old" keys, with the id of the list it matches to.
* Whenever there is no match (in cases where a new list item was added or removed), null is used instead of the id.
* Creates matches for lists.
protected function compareChildLists()
{
    // Match child list nodes on their 'content' column; the result is written to
    // $this->textMatches through the by-reference second argument.
    $this->createNewOldMatches(
        $this->childLists,
        $this->textMatches,
        'content'
    );
}
* Abstracted function used to match items in an array.
* This is used primarily for populating lists matches.
* @param array $listArray
* @param array $resultArray
* @param string|null $column
protected function createNewOldMatches(&$listArray, &$resultArray, $column = null)
// Pairs every entry of $listArray['new'] with at most one entry of $listArray['old'] and stores the
// resulting list of array('new' => id|null, 'old' => id|null) pairs in $resultArray.
// When $column is given, that key of each entry is what gets compared; otherwise the entry itself.
// Always compare the new against the old.
// Compare each new string against each old string.
$bestMatchPercentages = array();
foreach ($listArray['new'] as $thisKey => $thisList) {
$bestMatchPercentages[$thisKey] = array();
foreach ($listArray['old'] as $thatKey => $thatList) {
// Save the percent amount each new list content compares against the old list content.
// NOTE(review): the call that computes $percentage from the two operands below is not visible here.
$column ? $thisList[$column] : $thisList,
$column ? $thatList[$column] : $thatList,
$bestMatchPercentages[$thisKey][] = $percentage;
// Sort each array by value, highest percent to lowest percent.
// NOTE(review): iterating by reference leaves $thisMatch bound to the last element after the loop.
foreach ($bestMatchPercentages as &$thisMatch) {
// Build matches.
$matches = array();
// $taken collects old keys already paired; $takenItems collects the new items that were paired.
$taken = array();
$takenItems = array();
$absoluteMatch = 100;
foreach ($bestMatchPercentages as $item => $percentages) {
$highestMatch = -1;
$highestMatchKey = -1;
// NOTE(review): this initialises $takeItemKey, while every later read and write uses $takenItemKey.
$takeItemKey = -1;
foreach ($percentages as $key => $percent) {
// Check that the key for the percentage is not already taken and the new percentage is higher.
if (!in_array($key, $taken) && $percent > $highestMatch) {
// If an absolute match, choose this one.
if ($percent == $absoluteMatch) {
$highestMatch = $percent;
$highestMatchKey = $key;
$takenItemKey = $item;
} else {
// Get all the other matces for the same $key
$columns = $this->getArrayColumn($bestMatchPercentages, $key);
// Keep only the competing percentages that beat the current one.
$thisBestMatches = array_filter(
function ($v) use ($percent) {
return $v > $percent;
* If the list item does not meet the threshold, it will not be considered a match.
if ($percent >= self::$listMatchThreshold) {
// If no greater amounts, use this one.
if (!count($thisBestMatches)) {
$highestMatch = $percent;
$highestMatchKey = $key;
$takenItemKey = $item;
// Loop through, comparing only the items that have not already been added.
foreach ($thisBestMatches as $k => $v) {
if (in_array($k, $takenItems)) {
$highestMatch = $percent;
$highestMatchKey = $key;
$takenItemKey = $item;
// A new item that found no partner is recorded with 'old' => null.
$matches[] = array('new' => $item, 'old' => $highestMatchKey > -1 ? $highestMatchKey : null);
if ($highestMatchKey > -1) {
$taken[] = $highestMatchKey;
$takenItems[] = $takenItemKey;
/* Checking for removed items. Basically, if a list item from the old lists is removed
* it will not be accounted for, and will disappear in the results altogether.
* Loop through all the old lists, any that has not been added, will be added as:
* array( new => null, old => oldItemId )
$matchColumns = $this->getArrayColumn($matches, 'old');
foreach ($listArray['old'] as $thisKey => $thisList) {
if (!in_array($thisKey, $matchColumns)) {
$matches[] = array('new' => null, 'old' => $thisKey);
// Save the matches.
$resultArray = $matches;
* This function behaves like array_column. It is provided for PHP versions that do not support array_column.
* @param array $targetArray
* @param mixed $key
* @return array
protected function getArrayColumn(array $targetArray, $key)
{
    // Collect $row[$key] from every row that has that key; rows without it are skipped
    // and the result is re-indexed from 0.
    $column = array();

    foreach ($targetArray as $row) {
        if (!array_key_exists($key, $row)) {
            continue;
        }

        $column[] = $row[$key];
    }

    return $column;
}
* Build multidimensional array holding the contents of each list node, old and new.
protected function buildChildLists()
{
    // Extract the per-node content of both sides, old first and then new.
    foreach (array('old', 'new') as $side) {
        $this->childLists[$side] = $this->getListsContent($this->list[$side]);
    }
}
* Diff the actual contents of the lists against their matched counterpart.
* Build the content of the class.
protected function diff()
// Assembles $this->content: opening list tag, one fragment per entry of the 'new' order index
// (plus trailing 'old' entries), then the closing list tag.
// Add the opening parent node from listType. So if ol, <ol>, etc.
$this->content = $this->addListTypeWrapper();
// NOTE(review): no statement visible in this excerpt changes $oldIndexCount after this point.
$oldIndexCount = 0;
$diffOrderNewKeys = array_keys($this->diffOrderIndex['new']);
foreach ($this->diffOrderIndex['new'] as $key => $index) {
if ($index['type'] == "list") {
// Check to see if an old list was deleted.
$oldMatch = $this->getArrayByColumnValue($this->textMatches, 'old', $index['position']);
if ($oldMatch && $oldMatch['new'] === null) {
// Deleted list node: diff it against an empty new list.
$newList = '';
$oldList = $this->getListByMatch($oldMatch, 'old');
$this->content .= $this->addListElementToContent($newList, $oldList, $oldMatch, $index, 'old');
// Emit the new list node together with whichever old node it was matched to.
$match = $this->getArrayByColumnValue($this->textMatches, 'new', $index['position']);
$newList = $this->childLists['new'][$match['new']];
$oldList = $this->getListByMatch($match, 'old');
$this->content .= $this->addListElementToContent($newList, $oldList, $match, $index, 'new');
if ($index['type'] == 'content') {
$this->content .= $this->addContentElementsToContent($oldIndexCount, $index['position']);
// On the last 'new' entry, flush every 'old' entry whose key lies beyond it.
if ($key == $diffOrderNewKeys[count($diffOrderNewKeys) - 1]) {
foreach ($this->diffOrderIndex['old'] as $oldKey => $oldIndex) {
if ($oldKey > $key) {
if ($oldIndex['type'] == 'list') {
$oldMatch = $this->getArrayByColumnValue($this->textMatches, 'old', $oldIndex['position']);
if ($oldMatch && $oldMatch['new'] === null) {
$newList = '';
$oldList = $this->getListByMatch($oldMatch, 'old');
$this->content .= $this->addListElementToContent($newList, $oldList, $oldMatch, $oldIndex, 'old');
} else {
$this->content .= $this->addContentElementsToContent($oldKey);
// Add the closing parent node from listType. So if ol, </ol>, etc.
$this->content .= $this->addListTypeWrapper(false);
* @param string $newList
* @param string $oldList
* @param array $match
* @param array $index
* @return string
protected function addListElementToContent($newList, $oldList, array $match, array $index, $type)
// Builds the markup for one list node: the word stored at $index['index'] on side $type,
// followed by the processed node body and a closing "</li>".
$content = $this->list[$type][$index['index']];
// NOTE(review): the arguments passed to processPlaceholders() are not visible in this excerpt.
$content .= $this->processPlaceholders(
$content .= "</li>";
return $content;
* @param integer $oldIndexCount
* @param null|integer $newPosition
* @return string
protected function addContentElementsToContent($oldIndexCount, $newPosition = null)
{
    // New-side content: only looked up for a truthy position, so null and 0 both yield ''.
    $newContent = '';
    if ($newPosition && array_key_exists($newPosition, $this->contentIndex['new'])) {
        $newContent = $this->contentIndex['new'][$newPosition];
    }

    // Old-side order entry at $oldIndexCount, or '' when there is none.
    $oldOrderEntry = '';
    if (array_key_exists($oldIndexCount, $this->diffOrderIndex['old'])) {
        $oldOrderEntry = $this->diffOrderIndex['old'][$oldIndexCount];
    }

    // Old-side content is resolved through the order entry's 'position'.
    $oldContent = '';
    if ($oldOrderEntry && array_key_exists($oldOrderEntry['position'], $this->contentIndex['old'])) {
        $oldContent = $this->contentIndex['old'][$oldOrderEntry['position']];
    }

    // Diff the two content fragments with a fresh HtmlDiff instance.
    $differ = new HtmlDiff($oldContent, $newContent);

    return $differ->build();
}
* @param array $match
* @param string $type
* @return array|string
protected function getListByMatch(array $match, $type = 'new')
{
    // Resolve the child list referenced by the match on the requested side;
    // an unknown id yields an empty string.
    $listsForSide = $this->childLists[$type];

    if (array_key_exists($match[$type], $listsForSide)) {
        return $listsForSide[$match[$type]];
    }

    return '';
}
* This function replaces array_column function in PHP for older versions of php.
* @param array $parentArray
* @param string $column
* @param mixed $value
* @param boolean $allMatches
* @return array|boolean
protected function getArrayByColumnValue($parentArray, $column, $value, $allMatches = false)
{
    // Returns the row(s) of $parentArray whose $column equals $value.
    //
    // $parentArray  array of associative rows
    // $column       key to inspect in every row
    // $value        value to look for (compared loosely, except for null — see below)
    // $allMatches   true: return every matching row; false: return the first one
    //
    // Returns the first matching row, or false when none matches; with $allMatches
    // it returns a (possibly empty) array of rows.
    $found = array();

    foreach ($parentArray as $row) {
        if (!array_key_exists($column, $row)) {
            continue;
        }

        $cell = $row[$column];

        // null only ever matches null. With a plain loose comparison null == 0 is true,
        // so a lookup for position 0 would return rows whose column is null
        // ("no counterpart") instead of the row that really refers to item 0.
        if (($cell === null) !== ($value === null)) {
            continue;
        }

        if ($cell != $value) {
            continue;
        }

        if (!$allMatches) {
            return $row;
        }

        $found[] = $row;
    }

    return $allMatches ? $found : false;
}
* Converts the list (li) content arrays to string.
* @param array $listContentArray
* @return string
protected function convertListContentArrayToString($listContentArray)
// Flattens a list-content structure (keys 'content' and 'kids') into one string;
// anything that is not an array is returned as is.
if (!is_array($listContentArray)) {
return $listContentArray;
$content = array();
$words = explode(" ", $listContentArray['content']);
$nestedListCount = 0;
foreach ($words as $word) {
// A placeholder word stands for a nested list: expand the corresponding kid recursively.
$match = $word == self::$listPlaceHolder;
$content[] = $match
? "<li>" . $this->convertListContentArrayToString($listContentArray['kids'][$nestedListCount]) . "</li>"
: $word;
// NOTE(review): the body of this branch is not visible in this excerpt.
if ($match) {
return implode(" ", $content);
* Return the contents of each list node.
* Process any placeholders for nested lists.
* @param string $text
* @param array $matches
* @return string
protected function processPlaceholders($text, array $matches)
// Walks $text word by word and rebuilds it, replacing qualifying words with the result of
// diffList() on the matching old/new nested-list content.
// Prepare return
$returnText = array();
// Save the contents of all list nodes, new and old.
$contentVault = array(
'old' => $this->getListContent('old', $matches),
'new' => $this->getListContent('new', $matches)
// NOTE(review): no statement visible in this excerpt changes $count after this point.
$count = 0;
// Loop through the text checking for placeholders. If a nested list is found, create a new ListDiff object for it.
foreach (explode(' ', $text) as $word) {
// $preContent is either the word itself or a 3-part array (see checkWordForDiffTag()).
$preContent = $this->checkWordForDiffTag($this->stripNewLine($word));
// NOTE(review): the haystack argument of in_array() is not visible in this excerpt.
if (in_array(
is_array($preContent) ? $preContent[1] : $preContent,
) {
$oldText = array_key_exists($count, $contentVault['old']) ? implode('', $contentVault['old'][$count]) : '';
$newText = array_key_exists($count, $contentVault['new']) ? implode('', $contentVault['new'][$count]) : '';
$content = $this->diffList($oldText, $newText);
} else {
$content = $preContent;
// Re-attach whatever surrounded the tag inside the original word.
$returnText[] = is_array($preContent) ? $preContent[0] . $content . $preContent[2] : $content;
// Return the result.
return implode(' ', $returnText);
* Checks to see if a diff tag is in string.
* @param string $word
* @return string
protected function checkWordForDiffTag($word)
// Looks for the first entry of $this->isolatedDiffTags contained in $word. On a hit the word is
// split around the tag and returned as an array; otherwise $word is returned unchanged.
foreach ($this->isolatedDiffTags as $diffTag) {
if (strpos($word, $diffTag) > -1) {
$position = strpos($word, $diffTag);
$length = strlen($diffTag);
// NOTE(review): callers read indexes 0, 1 and 2 of this array, but only two elements
// (text before and text after the tag) are visible in this excerpt.
$result = array(
substr($word, 0, $position),
substr($word, ($position + $length))
return $result;
return $word;
* Used to remove new lines.
* @param string $text
* @return string
protected function stripNewLine($text)
{
    // Collapse every run of two or more whitespace characters into one space,
    // then trim both ends.
    $collapsed = preg_replace('/\s\s+/', ' ', $text);

    return trim($collapsed);
}
* Grab the list content using the listsIndex array.
* @param string $indexKey
* @param array $matches
* @return array
protected function getListContent($indexKey, array $matches)
{
    // Collects the isolated-diff-tag contents found inside one matched list node.
    //
    // $indexKey  side to read from: 'new' or 'old'
    // $matches   match pair array('new' => id|null, 'old' => id|null)
    //
    // Returns the list of $this->listIsolatedDiffTags entries for that node, or an empty
    // array when the match has no counterpart on the requested side.
    //
    // The former "$indexKey = 'new'" default sat in front of a required parameter, so it
    // could never be used and is reported as deprecated by PHP 8; it has been dropped.
    $bucket = array();

    // isset() is already false for a null id, so no separate null check is needed.
    if (!isset($matches[$indexKey])) {
        return $bucket;
    }

    $words = $this->list[$indexKey];
    $start = $this->listsIndex[$indexKey][$matches[$indexKey]];
    $stop = $this->findEndForIndex($words, $start);

    for ($x = $start; $x <= $stop; $x++) {
        // findEndForIndex() can answer with the index one past the last word when no
        // closing tag is found; skip positions that do not exist.
        if (!isset($words[$x])) {
            continue;
        }

        if (in_array($words[$x], $this->isolatedDiffTags)) {
            $bucket[] = $this->listIsolatedDiffTags[$indexKey][$x];
        }
    }

    return $bucket;
}
* Finds the end of list within its index.
* @param array $index
* @param integer $start
* @return integer
protected function findEndForIndex(array $index, $start)
// Scans the words from position $start onwards and returns the absolute position at which the
// list node ends; falls back to $start plus the number of scanned words.
// array_splice() works on the local copy of $index and returns the tail beginning at $start.
$array = array_splice($index, $start);
// NOTE(review): the statements that change $count inside the two tag branches are not
// visible in this excerpt.
$count = 0;
foreach ($array as $key => $item) {
if ($this->isOpeningListTag($item)) {
if ($this->isClosingListTag($item)) {
if ($count === 0) {
return $start + $key;
return $start + count($array);
* indexLists
* Index the list, starting positions, so that we can refer back to it later.
* This is used to see where one list node starts and another ends.
protected function indexLists()
// Rebuilds $this->listsIndex: for each side of $this->list, the word positions recorded for
// opening list tags while $count equals 1.
$this->listsIndex = array();
// NOTE(review): the statements that change $count are not visible in this excerpt.
$count = 0;
foreach ($this->list as $type => $list) {
$this->listsIndex[$type] = array();
foreach ($list as $key => $listItem) {
if ($this->isOpeningListTag($listItem)) {
if ($count === 1) {
$this->listsIndex[$type][] = $key;
if ($this->isClosingListTag($listItem)) {
* Adds the opening or closing list html element, based on listType.
* @param boolean $opening
* @return string
protected function addListTypeWrapper($opening = true)
{
    // Closing wrapper: built from the list type, e.g. "</ul>".
    if (!$opening) {
        return "<" . "/" . $this->listType . ">";
    }

    // Opening wrapper: reuse the original parent tag, preferring the new list's tag.
    return $this->newParentTag ?: $this->oldParentTag;
}
* Replace nested list with placeholders.
public function replaceListIsolatedDiffTags()
{
    // Build the placeholder map for each side, old first and then new.
    foreach (array('old', 'new') as $side) {
        $this->listIsolatedDiffTags[$side] = $this->createIsolatedDiffTagPlaceholders($this->list[$side]);
    }
}
* Grab the contents of a list node.
* @param array $contentArray
* @param boolean $stripTags
* @return array
protected function getListsContent(array $contentArray, $stripTags = true)
// Walks the words of a list and builds $lematches, the nested content structure produced by
// addStringToArrayByDepth().
// NOTE(review): $stripTags is not read by any statement visible in this excerpt, and the
// statements that change $arrayDepth and $nestedCount are not visible either.
$lematches = array();
$arrayDepth = 0;
$nestedCount = array();
foreach ($contentArray as $index => $word) {
if ($this->isOpeningListTag($word)) {
// First list node seen at this depth starts the per-depth counter at 1.
if (!array_key_exists($arrayDepth, $nestedCount)) {
$nestedCount[$arrayDepth] = 1;
} else {
if ($this->isClosingListTag($word)) {
// Only words inside at least one list node are added to the structure.
if ($arrayDepth > 0) {
$this->addStringToArrayByDepth($word, $lematches, $arrayDepth, 1, $nestedCount);
return $lematches;
* This function helps build the list content array of a list.
* If a list has another list within it, the inner list is replaced with the list placeholder and the inner list
* content becomes a child of the parent list.
* This goes recursively down.
* @param string $word
* @param array $array
* @param integer $targetDepth
* @param integer $thisDepth
* @param array $nestedCount
protected function addStringToArrayByDepth($word, array &$array, $targetDepth, $thisDepth, array $nestedCount)
// Appends $word to the node of $array that sits at $targetDepth. $array is modified in place;
// nodes have the shape array('content' => string, 'kids' => array).
// determine what depth we're at
if ($targetDepth == $thisDepth) {
// decide on what to do at this level
// A node (has 'content') takes the word directly; a plain list of nodes takes it on its last node.
if (array_key_exists('content', $array)) {
$array['content'] .= $word;
} else {
// if we're on depth 1, add content
if ($nestedCount[$targetDepth] > count($array)) {
$array[] = array('content' => '', 'kids' => array());
$array[count($array) - 1]['content'] .= $word;
} else {
// create first kid if not exist
$newArray = array('content' => '', 'kids' => array());
if (array_key_exists('kids', $array)) {
// A new kid is announced in the parent's content by the list placeholder.
if ($nestedCount[$targetDepth] > count($array['kids'])) {
$array['kids'][] = $newArray;
$array['content'] .= self::$listPlaceHolder;
// continue to the next depth
// get last kid and send to next depth
// NOTE(review): the recursive call that receives the argument below is not visible in this excerpt.
$array['kids'][count($array['kids']) - 1],
} else {
if ($nestedCount[$targetDepth] > count($array[count($array) - 1]['kids'])) {
$array[count($array) - 1]['kids'][] = $newArray;
$array[count($array) - 1]['content'] .= self::$listPlaceHolder;
// continue to the next depth
// get last kid and send to next depth
$array[count($array) - 1]['kids'][count($array[count($array) - 1]['kids']) - 1],
* Checks if text is opening list tag.
* @param string $item
* @return boolean
protected function isOpeningListTag($item)
{
    // True when $item contains an opening <li ...> tag (case-insensitive).
    return (bool) preg_match("#<li[^>]*>\\s*#iU", $item);
}
* Check if text is closing list tag.
* @param string $item
* @return boolean
protected function isClosingListTag($item)
{
    // True when $item contains a closing </li> tag (case-insensitive).
    return (bool) preg_match("#</li[^>]*>\\s*#iU", $item);
}

@ -0,0 +1,102 @@
namespace Caxy\HtmlDiff\ListDiff;
/**
 * Value holder for one parsed list: its type, its start/end tags, its items and attributes.
 */
class DiffList
{
    /** @var mixed List type as supplied by the creator. */
    protected $listType;

    /** @var mixed Items of the list, in document order. */
    protected $listItems = array();

    /** @var mixed Attributes supplied by the creator. */
    protected $attributes = array();

    /** @var mixed Opening tag of the list. */
    protected $startTag;

    /** @var mixed Closing tag of the list. */
    protected $endTag;

    /**
     * @param mixed $listType
     * @param mixed $startTag
     * @param mixed $endTag
     * @param mixed $listItems
     * @param mixed $attributes
     */
    public function __construct($listType, $startTag, $endTag, $listItems = array(), $attributes = array())
    {
        $this->attributes = $attributes;
        $this->listItems = $listItems;
        $this->endTag = $endTag;
        $this->startTag = $startTag;
        $this->listType = $listType;
    }

    /**
     * @return mixed
     */
    public function getListType()
    {
        return $this->listType;
    }

    /**
     * @param mixed $listType
     *
     * @return DiffList
     */
    public function setListType($listType)
    {
        $this->listType = $listType;

        return $this;
    }

    /**
     * @return mixed
     */
    public function getStartTag()
    {
        return $this->startTag;
    }

    /**
     * Returns the start tag with a class attribute inserted in front of every ">" it contains.
     *
     * @param string $class
     *
     * @return mixed
     */
    public function getStartTagWithDiffClass($class = 'diff-list')
    {
        $classAttribute = ' class="' . $class . '">';

        return str_replace('>', $classAttribute, $this->startTag);
    }

    /**
     * @param mixed $startTag
     */
    public function setStartTag($startTag)
    {
        $this->startTag = $startTag;
    }

    /**
     * @return mixed
     */
    public function getEndTag()
    {
        return $this->endTag;
    }

    /**
     * @param mixed $endTag
     */
    public function setEndTag($endTag)
    {
        $this->endTag = $endTag;
    }

    /**
     * @return mixed
     */
    public function getListItems()
    {
        return $this->listItems;
    }

    /**
     * @param mixed $listItems
     *
     * @return DiffList
     */
    public function setListItems($listItems)
    {
        $this->listItems = $listItems;

        return $this;
    }
}

@ -0,0 +1,124 @@
namespace Caxy\HtmlDiff\ListDiff;
/**
 * One item of a parsed list: its words, its attributes and its start/end tags.
 */
class DiffListItem
{
    /** @var array Attributes supplied by the creator. */
    protected $attributes = array();

    /** @var mixed Words of the item; normally an array of strings. */
    protected $text;

    /** @var mixed Opening tag of the item. */
    protected $startTag;

    /** @var mixed Closing tag of the item. */
    protected $endTag;

    /**
     * All four arguments are required. The former "= array()" default on $attributes sat in
     * front of required parameters, so it could never be used and is reported as deprecated
     * by PHP 8; it has been removed without changing how the constructor is called.
     *
     * @param mixed $text
     * @param array $attributes
     * @param mixed $startTag
     * @param mixed $endTag
     */
    public function __construct($text, $attributes, $startTag, $endTag)
    {
        $this->text = $text;
        $this->attributes = $attributes;
        $this->startTag = $startTag;
        $this->endTag = $endTag;
    }

    /**
     * @return array
     */
    public function getAttributes()
    {
        return $this->attributes;
    }

    /**
     * @param array $attributes
     *
     * @return DiffListItem
     */
    public function setAttributes($attributes)
    {
        $this->attributes = $attributes;

        return $this;
    }

    /**
     * @return mixed
     */
    public function getText()
    {
        return $this->text;
    }

    /**
     * @param mixed $text
     *
     * @return DiffListItem
     */
    public function setText($text)
    {
        $this->text = $text;

        return $this;
    }

    /**
     * @return mixed
     */
    public function getStartTag()
    {
        return $this->startTag;
    }

    /**
     * Returns the start tag with a class attribute inserted in front of every ">" it contains.
     *
     * @param string $class
     *
     * @return mixed
     */
    public function getStartTagWithDiffClass($class = 'normal')
    {
        return str_replace('>', ' class="'.$class.'">', $this->startTag);
    }

    /**
     * @param mixed $startTag
     *
     * @return DiffListItem
     */
    public function setStartTag($startTag)
    {
        $this->startTag = $startTag;

        return $this;
    }

    /**
     * @return mixed
     */
    public function getEndTag()
    {
        return $this->endTag;
    }

    /**
     * @param mixed $endTag
     *
     * @return DiffListItem
     */
    public function setEndTag($endTag)
    {
        $this->endTag = $endTag;

        return $this;
    }

    /**
     * Renders the item: classed start tag, optional wrapper element, inner HTML, end tag.
     *
     * @param string      $class   CSS class placed on the start tag
     * @param string|null $wrapTag element name wrapped around the inner HTML, if any
     *
     * @return string
     */
    public function getHtml($class = 'normal', $wrapTag = null)
    {
        $startWrap = $wrapTag ? sprintf('<%s>', $wrapTag) : '';
        $endWrap = $wrapTag ? sprintf('</%s>', $wrapTag) : '';

        return sprintf('%s%s%s%s%s', $this->getStartTagWithDiffClass($class), $startWrap, $this->getInnerHtml(), $endWrap, $this->endTag);
    }

    /**
     * Concatenates the item's words. Text that is not an array (setText() accepts anything)
     * is cast to string instead of being handed to implode(), which would fail on it.
     *
     * @return string
     */
    public function getInnerHtml()
    {
        if (!is_array($this->text)) {
            return (string) $this->text;
        }

        return implode('', $this->text);
    }

    /**
     * @return string
     */
    public function __toString()
    {
        return $this->getHtml();
    }
}

@ -0,0 +1,280 @@
namespace Caxy\HtmlDiff;
use Caxy\HtmlDiff\ListDiff\DiffList;
use Caxy\HtmlDiff\ListDiff\DiffListItem;
class ListDiffNew extends AbstractDiff
protected static $listTypes = array('ul', 'ol', 'dl');
* @param string $oldText
* @param string $newText
* @param HtmlDiffConfig|null $config
* @return self
public static function create($oldText, $newText, HtmlDiffConfig $config = null)
// Named constructor: builds an instance of this class for the two texts and returns it.
$diff = new self($oldText, $newText);
// NOTE(review): the statement executed when a config is supplied is not visible in this excerpt.
if (null !== $config) {
return $diff;
public function build()
// Returns the list diff for the two texts, consulting the diff cache first when one is set.
if ($this->hasDiffCache() && $this->getDiffCache()->contains($this->oldText, $this->newText)) {
// Cache hit: reuse the stored result.
$this->content = $this->getDiffCache()->fetch($this->oldText, $this->newText);
return $this->content;
// NOTE(review): the arguments passed to diffLists() are not visible in this excerpt.
$this->content = $this->diffLists(
// Store the fresh result for later calls.
if ($this->hasDiffCache()) {
$this->getDiffCache()->save($this->oldText, $this->newText, $this->content);
return $this->content;
protected function diffLists(DiffList $oldList, DiffList $newList)
// Diffs two parsed lists item by item and returns the new list's markup with inserted, removed,
// replaced and changed items marked up.
$oldMatchData = array();
$newMatchData = array();
$oldListIndices = array();
$newListIndices = array();
$oldListItems = array();
$newListItems = array();
// Pass 1: similarity matrix. $oldMatchData[old][new] and $newMatchData[new][old] both hold
// the similar_text() percentage for that pair of items.
foreach ($oldList->getListItems() as $oldIndex => $oldListItem) {
if ($oldListItem instanceof DiffListItem) {
$oldListItems[$oldIndex] = $oldListItem;
$oldListIndices[] = $oldIndex;
$oldMatchData[$oldIndex] = array();
// Get match percentages
foreach ($newList->getListItems() as $newIndex => $newListItem) {
if ($newListItem instanceof DiffListItem) {
if (!in_array($newListItem, $newListItems)) {
$newListItems[$newIndex] = $newListItem;
if (!in_array($newIndex, $newListIndices)) {
$newListIndices[] = $newIndex;
if (!array_key_exists($newIndex, $newMatchData)) {
$newMatchData[$newIndex] = array();
$oldText = implode('', $oldListItem->getText());
$newText = implode('', $newListItem->getText());
// similar_text
$percentage = null;
similar_text($oldText, $newText, $percentage);
$oldMatchData[$oldIndex][$newIndex] = $percentage;
$newMatchData[$newIndex][$oldIndex] = $percentage;
// Pass 2: walk the new list and pair each item with the current old item.
// NOTE(review): the statements that advance $currentIndexInOld / $currentIndexInNew are not
// visible in this excerpt.
$currentIndexInOld = 0;
$currentIndexInNew = 0;
$oldCount = count($oldListIndices);
$newCount = count($newListIndices);
$difference = max($oldCount, $newCount) - min($oldCount, $newCount);
$diffOutput = '';
foreach ($newList->getListItems() as $newIndex => $newListItem) {
if ($newListItem instanceof DiffListItem) {
$operation = null;
$oldListIndex = array_key_exists($currentIndexInOld, $oldListIndices) ? $oldListIndices[$currentIndexInOld] : null;
$class = 'normal';
if (null !== $oldListIndex && array_key_exists($oldListIndex, $oldMatchData)) {
// Check percentage matches of upcoming list items in old.
$matchPercentage = $oldMatchData[$oldListIndex][$newIndex];
// does the old list item match better?
$otherMatchBetter = false;
foreach ($oldMatchData[$oldListIndex] as $index => $percentage) {
if ($index > $newIndex && $percentage > $matchPercentage) {
$otherMatchBetter = $index;
// A later new item fits this old item better and the new list is longer: treat as insertion.
if (false !== $otherMatchBetter && $newCount > $oldCount && $difference > 0) {
$diffOutput .= sprintf('%s', $newListItem->getHtml('normal new', 'ins'));
$nextOldListIndex = array_key_exists($currentIndexInOld + 1, $oldListIndices) ? $oldListIndices[$currentIndexInOld + 1] : null;
$replacement = false;
if ($nextOldListIndex !== null && $oldMatchData[$nextOldListIndex][$newIndex] > $matchPercentage && $oldMatchData[$nextOldListIndex][$newIndex] > $this->config->getMatchThreshold()) {
// Following list item in old is better match, use that.
$diffOutput .= sprintf('%s', $oldListItems[$oldListIndex]->getHtml('removed', 'del'));
$oldListIndex = $nextOldListIndex;
// NOTE(review): this assigns the whole row (an array) rather than the percentage for
// $newIndex, so the threshold comparison below compares an array with a number — confirm
// whether $oldMatchData[$oldListIndex][$newIndex] was intended.
$matchPercentage = $oldMatchData[$oldListIndex];
$replacement = true;
if ($matchPercentage > $this->config->getMatchThreshold() || $currentIndexInNew === $currentIndexInOld) {
// Diff the two lists.
// NOTE(review): the arguments passed to HtmlDiff::create() are not visible in this excerpt.
$htmlDiff = HtmlDiff::create(
$diffContent = $htmlDiff->build();
$diffOutput .= sprintf('%s%s%s', $newListItem->getStartTagWithDiffClass($replacement ? 'replacement' : 'normal'), $diffContent, $newListItem->getEndTag());
} else {
$diffOutput .= sprintf('%s', $oldListItems[$oldListIndex]->getHtml('removed', 'del'));
$diffOutput .= sprintf('%s', $newListItem->getHtml('replacement', 'ins'));
} else {
$diffOutput .= sprintf('%s', $newListItem->getHtml('normal new', 'ins'));
// Output any additional list items
while (array_key_exists($currentIndexInOld, $oldListIndices)) {
$oldListIndex = $oldListIndices[$currentIndexInOld];
$diffOutput .= sprintf('%s', $oldListItems[$oldListIndex]->getHtml('removed', 'del'));
return sprintf('%s%s%s', $newList->getStartTagWithDiffClass(), $diffOutput, $newList->getEndTag());
protected function buildDiffList($words)
// Parses a flat word list into a DiffList: top-level list items become DiffListItem objects,
// everything else at list level is kept as plain words.
// NOTE(review): the statements that change $openLists and $openListItems are not visible in
// this excerpt.
$listType = null;
$listStartTag = null;
$listEndTag = null;
$attributes = array();
$openLists = 0;
$openListItems = 0;
$list = array();
$currentListItem = null;
$listItemType = null;
$listItemStart = null;
$listItemEnd = null;
foreach ($words as $i => $word) {
if ($this->isOpeningListTag($word, $listType)) {
// Nested list opening: keep the tag as a word of the current item (or of the list).
if ($openLists > 0) {
if ($openListItems > 0) {
$currentListItem[] = $word;
} else {
$list[] = $word;
} else {
// Outermost list opening: characters 1-2 of the tag give the list type.
$listType = substr($word, 1, 2);
$listStartTag = $word;
} elseif ($this->isClosingListTag($word, $listType)) {
if ($openLists > 1) {
if ($openListItems > 0) {
$currentListItem[] = $word;
} else {
$list[] = $word;
} else {
$listEndTag = $word;
} elseif ($this->isOpeningListItemTag($word, $listItemType)) {
if ($openListItems === 0) {
// New top-level list item
$currentListItem = array();
$listItemType = substr($word, 1, 2);
$listItemStart = $word;
} else {
$currentListItem[] = $word;
} elseif ($this->isClosingListItemTag($word, $listItemType)) {
// Closing the top-level item turns the collected words into a DiffListItem.
if ($openListItems === 1) {
$listItemEnd = $word;
$listItem = new DiffListItem($currentListItem, array(), $listItemStart, $listItemEnd);
$list[] = $listItem;
$currentListItem = null;
} else {
$currentListItem[] = $word;
} else {
// Any other word goes to the open item, or to the list when no item is open.
if ($openListItems > 0) {
$currentListItem[] = $word;
} else {
$list[] = $word;
$diffList = new DiffList($listType, $listStartTag, $listEndTag, $list, $attributes);
return $diffList;
protected function isOpeningListTag($word, $type = null)
{
    // Compare the first three characters of the word with the accepted opening prefixes:
    // the given type only, or any of ul/ol/dl when no type is given.
    if ($type !== null) {
        $accepted = array('<' . $type);
    } else {
        $accepted = array('<ul', '<ol', '<dl');
    }

    $prefix = substr($word, 0, 3);

    return in_array($prefix, $accepted);
}
protected function isClosingListTag($word, $type = null)
{
    // Compare the first four characters of the word with the accepted closing prefixes:
    // the given type only, or any of ul/ol/dl when no type is given.
    if ($type !== null) {
        $accepted = array('</' . $type);
    } else {
        $accepted = array('</ul', '</ol', '</dl');
    }

    $prefix = substr($word, 0, 4);

    return in_array($prefix, $accepted);
}
protected function isOpeningListItemTag($word, $type = null)
{
    // Compare the first three characters of the word with the accepted item-opening prefixes:
    // the given type only, or any of li/dd/dt when no type is given.
    if ($type !== null) {
        $accepted = array('<' . $type);
    } else {
        $accepted = array('<li', '<dd', '<dt');
    }

    $prefix = substr($word, 0, 3);

    return in_array($prefix, $accepted);
}
protected function isClosingListItemTag($word, $type = null)
{
    // Compare the first four characters of the word with the accepted item-closing prefixes:
    // the given type only, or any of li/dd/dt when no type is given.
    if ($type !== null) {
        $accepted = array('</' . $type);
    } else {
        $accepted = array('</li', '</dd', '</dt');
    }

    $prefix = substr($word, 0, 4);

    return in_array($prefix, $accepted);
}

@ -0,0 +1,27 @@
namespace Caxy\HtmlDiff;
/**
 * A run of $size matching words that starts at $startInOld in the old sequence and at
 * $startInNew in the new one.
 *
 * NOTE(review): "match" is a reserved keyword as of PHP 8.0, so a class with this name cannot
 * be declared there. Renaming it means updating every caller, which is outside this block.
 */
class Match
{
    /** @var mixed Start position in the old sequence. */
    public $startInOld;

    /** @var mixed Start position in the new sequence. */
    public $startInNew;

    /** @var mixed Number of matching words. */
    public $size;

    /**
     * @param mixed $startInOld
     * @param mixed $startInNew
     * @param mixed $size
     */
    public function __construct($startInOld, $startInNew, $size)
    {
        $this->size = $size;
        $this->startInNew = $startInNew;
        $this->startInOld = $startInOld;
    }

    /**
     * Position just past the match in the old sequence.
     *
     * @return mixed
     */
    public function endInOld()
    {
        $start = $this->startInOld;

        return $start + $this->size;
    }

    /**
     * Position just past the match in the new sequence.
     *
     * @return mixed
     */
    public function endInNew()
    {
        $start = $this->startInNew;

        return $start + $this->size;
    }
}

@ -0,0 +1,21 @@
namespace Caxy\HtmlDiff;
/**
 * One diff operation: an action plus the word ranges it covers in the old and new sequences.
 */
class Operation
{
    /** @var mixed Action identifier as supplied by the creator. */
    public $action;

    /** @var mixed Range start in the old sequence. */
    public $startInOld;

    /** @var mixed Range end in the old sequence. */
    public $endInOld;

    /** @var mixed Range start in the new sequence. */
    public $startInNew;

    /** @var mixed Range end in the new sequence. */
    public $endInNew;

    /**
     * @param mixed $action
     * @param mixed $startInOld
     * @param mixed $endInOld
     * @param mixed $startInNew
     * @param mixed $endInNew
     */
    public function __construct($action, $startInOld, $endInOld, $startInNew, $endInNew)
    {
        $this->action = $action;

        // Old-sequence range.
        $this->startInOld = $startInOld;
        $this->endInOld = $endInOld;

        // New-sequence range.
        $this->startInNew = $startInNew;
        $this->endInNew = $endInNew;
    }
}

@ -0,0 +1,94 @@
namespace Caxy\HtmlDiff\Table;
* Class AbstractTableElement
* @package Caxy\HtmlDiff\Table
/**
 * Class AbstractTableElement
 *
 * Base class for table parts that wrap a DOM element.
 *
 * @package Caxy\HtmlDiff\Table
 */
abstract class AbstractTableElement
{
    /**
     * @var \DOMElement|null
     */
    protected $domNode;

    /**
     * AbstractTableElement constructor.
     *
     * @param \DOMElement|null $domNode
     */
    public function __construct(\DOMElement $domNode = null)
    {
        $this->domNode = $domNode;
    }

    /**
     * @return \DOMElement|null
     */
    public function getDomNode()
    {
        return $this->domNode;
    }

    /**
     * @param \DOMElement $domNode
     *
     * @return $this
     */
    public function setDomNode(\DOMElement $domNode)
    {
        $this->domNode = $domNode;

        return $this;
    }

    /**
     * Serialises the children of the wrapped node; empty string when no node is set.
     *
     * @return string
     */
    public function getInnerHtml()
    {
        $innerHtml = '';

        if ($this->domNode) {
            foreach ($this->domNode->childNodes as $child) {
                $innerHtml .= static::htmlFromNode($child);
            }
        }

        return $innerHtml;
    }

    /**
     * Reads an attribute of the wrapped node. Without a node this returns an empty string,
     * the same value DOMElement::getAttribute() gives for a missing attribute, instead of
     * failing on a null object.
     *
     * @param string $name
     *
     * @return string
     */
    public function getAttribute($name)
    {
        if (!$this->domNode) {
            return '';
        }

        return $this->domNode->getAttribute($name);
    }

    /**
     * Shallow-copies the wrapped node (without children) into the given document.
     *
     * @param \DOMDocument $domDocument
     *
     * @return \DOMElement
     */
    public function cloneNode(\DOMDocument $domDocument)
    {
        return $domDocument->importNode($this->getDomNode()->cloneNode(false), false);
    }

    /**
     * Serialises a single node, including its descendants, to HTML.
     *
     * @param \DOMNode $node
     *
     * @return string
     */
    public static function htmlFromNode($node)
    {
        $domDocument = new \DOMDocument();
        $newNode = $domDocument->importNode($node, true);

        // importNode() only creates a copy owned by the document; the copy has to be
        // appended before saveHTML() will output it.
        $domDocument->appendChild($newNode);

        return trim($domDocument->saveHTML());
    }
}

@ -0,0 +1,268 @@
namespace Caxy\HtmlDiff\Table;
* Class DiffRowPosition
* @package Caxy\HtmlDiff\Table
class DiffRowPosition
* @var int
protected $indexInOld;
* @var int
protected $indexInNew;
* @var int
protected $columnInOld;
* @var int
protected $columnInNew;
* DiffRowPosition constructor.
* @param int $indexInOld
* @param int $indexInNew
* @param int $columnInOld
* @param int $columnInNew
public function __construct($indexInOld = 0, $indexInNew = 0, $columnInOld = 0, $columnInNew = 0)
$this->indexInOld = $indexInOld;
$this->indexInNew = $indexInNew;
$this->columnInOld = $columnInOld;
$this->columnInNew = $columnInNew;
* @return int
public function getIndexInOld()
return $this->indexInOld;
* @param int $indexInOld
* @return DiffRowPosition
public function setIndexInOld($indexInOld)
$this->indexInOld = $indexInOld;
return $this;
* @return int
public function getIndexInNew()
return $this->indexInNew;
* @param int $indexInNew
* @return DiffRowPosition
public function setIndexInNew($indexInNew)
$this->indexInNew = $indexInNew;
return $this;
* @return int
public function getColumnInOld()
return $this->columnInOld;
* @param int $columnInOld
* @return DiffRowPosition
public function setColumnInOld($columnInOld)
$this->columnInOld = $columnInOld;
return $this;
* @return int
public function getColumnInNew()
return $this->columnInNew;
* @param int $columnInNew
* @return DiffRowPosition
public function setColumnInNew($columnInNew)
$this->columnInNew = $columnInNew;
return $this;
* @param int $increment
* @return int
public function incrementColumnInNew($increment = 1)
$this->columnInNew += $increment;
return $this->columnInNew;
* @param int $increment
* @return int
public function incrementColumnInOld($increment = 1)
$this->columnInOld += $increment;
return $this->columnInOld;
* @param int $increment
* @return int
public function incrementIndexInNew($increment = 1)
$this->indexInNew += $increment;
return $this->indexInNew;
* @param int $increment
* @return int
public function incrementIndexInOld($increment = 1)
$this->indexInOld += $increment;
return $this->indexInOld;
* @param string $type
* @param int $increment
* @return int
public function incrementIndex($type, $increment = 1)
if ($type === 'new') {
return $this->incrementIndexInNew($increment);
return $this->incrementIndexInOld($increment);
* @param string $type
* @param int $increment
* @return int
public function incrementColumn($type, $increment = 1)
if ($type === 'new') {
return $this->incrementColumnInNew($increment);
return $this->incrementColumnInOld($increment);
* @param string $type
* @return bool
public function isColumnLessThanOther($type)
if ($type === 'new') {
return $this->getColumnInNew() < $this->getColumnInOld();
return $this->getColumnInOld() < $this->getColumnInNew();
/**
 * Returns the column counter of the side selected by $type.
 *
 * @param string $type 'new' selects the new row; any other value selects the old row.
 *
 * @return int
 */
public function getColumn($type)
{
    return $type === 'new' ? $this->getColumnInNew() : $this->getColumnInOld();
}
/**
 * Returns the cell cursor of the side selected by $type.
 *
 * @param string $type 'new' selects the new row; any other value selects the old row.
 *
 * @return int
 */
public function getIndex($type)
{
    return $type === 'new' ? $this->getIndexInNew() : $this->getIndexInOld();
}
/**
 * Tells whether both sides currently report the identical column value
 * (strict comparison, so type must match too).
 *
 * @return bool
 */
public function areColumnsEqual()
{
    $oldColumn = $this->getColumnInOld();
    $newColumn = $this->getColumnInNew();

    return $oldColumn === $newColumn;
}
/**
 * Names the side whose column counter is behind the other.
 *
 * @return null|string 'new' or 'old', or null when neither side is behind.
 */
public function getLesserColumnType()
{
    // The new side is checked first, exactly like the if/elseif it replaces.
    foreach (array('new', 'old') as $candidate) {
        if ($this->isColumnLessThanOther($candidate)) {
            return $candidate;
        }
    }

    return null;
}

@ -0,0 +1,133 @@
namespace Caxy\HtmlDiff\Table;
/**
 * Value holder describing a matched row range: start/end offsets in the new
 * and old row lists plus an optional match score.
 *
 * @package Caxy\HtmlDiff\Table
 */
class RowMatch
{
    /** @var int Start offset in the new rows. */
    protected $startInNew;

    /** @var int Start offset in the old rows. */
    protected $startInOld;

    /** @var int End offset in the new rows. */
    protected $endInNew;

    /** @var int End offset in the old rows. */
    protected $endInOld;

    /** @var float|null Score supplied at construction; stored only. */
    protected $percentage;

    /**
     * Note the argument order: each "new" offset precedes its "old" counterpart.
     *
     * @param int        $startInNew
     * @param int        $startInOld
     * @param int        $endInNew
     * @param int        $endInOld
     * @param float|null $percentage
     */
    public function __construct($startInNew = 0, $startInOld = 0, $endInNew = 0, $endInOld = 0, $percentage = null)
    {
        $this->startInNew = $startInNew;
        $this->startInOld = $startInOld;
        $this->endInNew = $endInNew;
        $this->endInOld = $endInOld;
        $this->percentage = $percentage;
    }

    /**
     * @return int
     */
    public function getStartInNew()
    {
        return $this->startInNew;
    }

    /**
     * @param int $startInNew
     *
     * @return RowMatch This instance, for chaining.
     */
    public function setStartInNew($startInNew)
    {
        $this->startInNew = $startInNew;

        return $this;
    }

    /**
     * @return int
     */
    public function getStartInOld()
    {
        return $this->startInOld;
    }

    /**
     * @param int $startInOld
     *
     * @return RowMatch This instance, for chaining.
     */
    public function setStartInOld($startInOld)
    {
        $this->startInOld = $startInOld;

        return $this;
    }

    /**
     * @return int
     */
    public function getEndInNew()
    {
        return $this->endInNew;
    }

    /**
     * @param int $endInNew
     *
     * @return RowMatch This instance, for chaining.
     */
    public function setEndInNew($endInNew)
    {
        $this->endInNew = $endInNew;

        return $this;
    }

    /**
     * @return int
     */
    public function getEndInOld()
    {
        return $this->endInOld;
    }

    /**
     * @param int $endInOld
     *
     * @return RowMatch This instance, for chaining.
     */
    public function setEndInOld($endInOld)
    {
        $this->endInOld = $endInOld;

        return $this;
    }
}

@ -0,0 +1,161 @@
namespace Caxy\HtmlDiff\Table;
* Class Table
* @package Caxy\HtmlDiff\Table
class Table extends AbstractTableElement
* @var TableRow[]
protected $rows = array();
/**
 * Returns the rows currently held by this table.
 *
 * @return TableRow[]
 */
public function getRows()
{
    return $this->rows;
}
* @param TableRow $row
// Appends $row to the end of this table's row list.
public function addRow(TableRow $row)
$this->rows[] = $row;
// Entered only for rows that do not yet report an owning table.
// NOTE(review): the branch body is not visible in this view; presumably it links the row back to this table - confirm.
if (!$row->getTable()) {
* @param TableRow $row
// Locates $row in the row list by identity (array_search in strict mode).
public function removeRow(TableRow $row)
$key = array_search($row, $this->rows, true);
// array_search() yields false on a miss; key 0 is a valid hit, hence the strict comparison.
if ($key !== false) {
// NOTE(review): the statements guarded by these two conditions are not visible in this view.
if ($row->getTable()) {
/**
 * Looks up a row by its key in the row list.
 *
 * @param int $index
 *
 * @return null|TableRow The row, or null when nothing is set at $index.
 */
public function getRow($index)
{
    if (isset($this->rows[$index])) {
        return $this->rows[$index];
    }

    return null;
}
/**
 * Adds several rows at once.
 *
 * @param TableRow[] $rows     Rows to add.
 * @param null|int   $position Offset to splice the rows in at; null appends them.
 */
public function insertRows($rows, $position = null)
{
    if (null !== $position) {
        // Zero-length splice: nothing is removed, $rows is inserted at the offset.
        array_splice($this->rows, $position, 0, $rows);

        return;
    }

    $this->rows = array_merge($this->rows, $rows);
}
/**
 * Resolves a row/cell position to the cell stored there.
 *
 * @param TablePosition $position
 *
 * @return null|TableCell Null when the row lookup fails; otherwise whatever the row's getCell() returns.
 */
public function getCellByPosition(TablePosition $position)
{
    $row = $this->getRow($position->getRow());
    if (!$row) {
        return null;
    }

    return $row->getCell($position->getCell());
}
/**
 * Finds the position $offset cells before $position, walking backwards in
 * row-major order and wrapping onto the last cell of the preceding row.
 *
 * The remaining-step counter is consumed exactly once per cell. The former
 * in-row branch subtracted the already-updated cell index from the counter,
 * which could leave steps outstanding and walk past the intended cell.
 *
 * @param TablePosition $position Starting position.
 * @param int           $offset   Number of cells to step back.
 *
 * @return TablePosition|null The resulting position, or null when the walk
 *                            runs past the first cell of the table.
 */
public function getPositionBefore(TablePosition $position, $offset = 1)
{
    $newRow = $position->getRow();
    $newCell = $position->getCell();
    $cellsToMove = $offset;

    // While the target lies before index 0 of the current row, spend the
    // steps needed to leave this row ($newCell + 1) and hop to the last cell
    // of the previous row. Empty rows cost nothing and are skipped.
    while ($cellsToMove > $newCell) {
        $cellsToMove -= $newCell + 1;
        --$newRow;
        if ($newRow < 0) {
            return null;
        }

        $row = $this->getRow($newRow);
        if (null === $row) {
            return null;
        }

        $newCell = count($row->getCells()) - 1;
    }

    // The target is inside the current row: finish the move in one step.
    $newCell -= $cellsToMove;

    if ($newRow >= 0 && $newCell >= 0) {
        return new TablePosition($newRow, $newCell);
    }

    return null;
}
/**
 * Finds the position $offset cells after $position, walking forwards in
 * row-major order and wrapping onto the first cell of the following row.
 *
 * Wrapping to the next row costs the cells left in the current row plus one
 * (the former code subtracted one instead of adding it), and an in-row move
 * finishes the walk immediately.
 *
 * @param TablePosition $position Starting position.
 * @param int           $offset   Number of cells to step forward.
 *
 * @return TablePosition|null The resulting position, or null when the walk
 *                            runs past the last row of the table.
 */
public function getPositionAfter(TablePosition $position, $offset = 1)
{
    $newRow = $position->getRow();
    $newCell = $position->getCell();
    $cellsToMove = $offset;

    // Nothing to walk: keep the historical result of echoing the position back.
    if ($cellsToMove <= 0) {
        return ($newRow >= 0 && $newCell >= 0) ? new TablePosition($newRow, $newCell) : null;
    }

    $rowCount = count($this->rows);
    while ($newRow < $rowCount) {
        $row = $this->getRow($newRow);
        $cellCount = $row ? count($row->getCells()) : 0;
        $cellsLeft = $cellCount - $newCell - 1;

        if ($cellsToMove <= $cellsLeft) {
            // Target is inside this row.
            $newCell += $cellsToMove;

            return ($newRow >= 0 && $newCell >= 0) ? new TablePosition($newRow, $newCell) : null;
        }

        // Leave this row: the remaining cells plus the hop onto cell 0 of the next row.
        $cellsToMove -= $cellsLeft + 1;
        ++$newRow;
        $newCell = 0;
    }

    // Ran off the end of the table.
    return null;
}

@ -0,0 +1,55 @@
namespace Caxy\HtmlDiff\Table;
* Class TableCell
* @package Caxy\HtmlDiff\Table
// Table cell element that remembers its owning row and exposes its colspan/rowspan as integers.
class TableCell extends AbstractTableElement
* @var TableRow
protected $row;
* @return TableRow
public function getRow()
return $this->row;
* @param TableRow|null $row
* @return $this
public function setRow(TableRow $row = null)
$this->row = $row;
// NOTE(review): in_array() is called without its strict flag, so cells are compared loosely rather than by identity - confirm whether a strict comparison was intended.
// NOTE(review): the body of this branch is not visible in this view.
if (null !== $row && !in_array($this, $row->getCells())) {
return $this;
* @return int
public function getColspan()
// The cast binds tighter than ?:, so any attribute value that casts to 0 falls back to 1.
return (int)$this->getAttribute('colspan') ?: 1;
* @return int
public function getRowspan()
// Same fallback as getColspan(): a value that casts to 0 becomes 1.
return (int)$this->getAttribute('rowspan') ?: 1;

@ -0,0 +1,921 @@
namespace Caxy\HtmlDiff\Table;
use Caxy\HtmlDiff\AbstractDiff;
use Caxy\HtmlDiff\HtmlDiff;
use Caxy\HtmlDiff\HtmlDiffConfig;
use Caxy\HtmlDiff\Operation;
* Class TableDiff
* @package Caxy\HtmlDiff\Table
class TableDiff extends AbstractDiff
* @var null|Table
protected $oldTable = null;
* @var null|Table
protected $newTable = null;
* @var null|\DOMElement
protected $diffTable = null;
* @var null|\DOMDocument
protected $diffDom = null;
* @var int
protected $newRowOffsets = 0;
* @var int
protected $oldRowOffsets = 0;
* @var array
protected $cellValues = array();
* @var \HTMLPurifier
protected $purifier;
* @param string $oldText
* @param string $newText
* @param HtmlDiffConfig|null $config
* @return self
// Static factory: builds a TableDiff from the old and new HTML strings.
public static function create($oldText, $newText, HtmlDiffConfig $config = null)
$diff = new self($oldText, $newText);
// NOTE(review): the body of this branch is not visible in this view; presumably it applies $config to $diff - confirm.
if (null !== $config) {
return $diff;
* TableDiff constructor.
* @param string $oldText
* @param string $newText
* @param string $encoding
* @param array|null $specialCaseTags
* @param bool|null $groupDiffs
// Forwards every argument to the parent constructor; no state is initialised here.
public function __construct(
// NOTE(review): $oldText and $newText are passed to parent::__construct() below, but their parameter declarations are not visible in this view.
$encoding = 'UTF-8',
$specialCaseTags = null,
$groupDiffs = null
parent::__construct($oldText, $newText, $encoding, $specialCaseTags, $groupDiffs);
/**
 * Creates the HTMLPurifier instance stored in $this->purifier.
 *
 * @param null|string $defaultPurifierSerializerCache Directory for the purifier's
 *                                                    serializer cache; null keeps
 *                                                    the library default.
 *
 * @return void
 */
protected function initPurifier($defaultPurifierSerializerCache = null)
{
    $purifierConfig = \HTMLPurifier_Config::createDefault();

    // Cache.SerializerPath defaults to Null, which places the cache inside the
    // vendor HTMLPurifier library under DefinitionCache/Serializer.
    if (null !== $defaultPurifierSerializerCache) {
        $purifierConfig->set('Cache.SerializerPath', $defaultPurifierSerializerCache);
    }

    $this->purifier = new \HTMLPurifier($purifierConfig);
}
* @return string
// Returns the diff markup, consulting the diff cache first when one is configured.
public function build()
// Cache hit: reuse the stored result for this exact old/new text pair.
if ($this->hasDiffCache() && $this->getDiffCache()->contains($this->oldText, $this->newText)) {
$this->content = $this->getDiffCache()->fetch($this->oldText, $this->newText);
return $this->content;
// No cached result was returned: start from a fresh DOM document for the diff output.
// NOTE(review): the calls that populate $this->content are not visible in this view.
$this->diffDom = new \DOMDocument();
// Store the content under the same old/new text key that the lookup above uses.
if ($this->hasDiffCache()) {
$this->getDiffCache()->save($this->oldText, $this->newText, $this->content);
return $this->content;
// Scores every old row against every new row, derives row matches from the scores,
// renders the diff rows and stores the serialised diff table in $this->content.
protected function diffTableContent()
$this->diffDom = new \DOMDocument();
// The output table starts as a clone of the new table created for the diff document.
$this->diffTable = $this->newTable->cloneNode($this->diffDom);
$oldRows = $this->oldTable->getRows();
$newRows = $this->newTable->getRows();
// Score matrices: $oldMatchData[old][new] and $newMatchData[new][old] receive the same value.
$oldMatchData = array();
$newMatchData = array();
/* @var $oldRow TableRow */
foreach ($oldRows as $oldIndex => $oldRow) {
$oldMatchData[$oldIndex] = array();
// Get match percentages
/* @var $newRow TableRow */
foreach ($newRows as $newIndex => $newRow) {
// Lazily create the per-new-row bucket the first time this new index is seen.
if (!array_key_exists($newIndex, $newMatchData)) {
$newMatchData[$newIndex] = array();
// similar_text
$percentage = $this->getMatchPercentage($oldRow, $newRow, $oldIndex, $newIndex);
$oldMatchData[$oldIndex][$newIndex] = $percentage;
$newMatchData[$newIndex][$oldIndex] = $percentage;
$matches = $this->getRowMatches($oldMatchData, $newMatchData);
$this->diffTableRowsWithMatches($oldRows, $newRows, $matches);
$this->content = $this->htmlFromNode($this->diffTable);
* @param TableRow[] $oldRows
* @param TableRow[] $newRows
* @param RowMatch[] $matches
// Converts the row matches into a list of Operation objects, then dispatches each
// operation to the matching process*Operation() handler.
protected function diffTableRowsWithMatches($oldRows, $newRows, $matches)
$operations = array();
// Cursors marking how far each row list has been consumed so far.
$indexInOld = 0;
$indexInNew = 0;
$oldRowCount = count($oldRows);
$newRowCount = count($newRows);
// Append a zero-length match that starts and ends at the row counts, so rows after the last real match are classified too.
$matches[] = new RowMatch($newRowCount, $oldRowCount, $newRowCount, $oldRowCount);
// build operations
foreach ($matches as $match) {
// Compare the cursors with the start of this match to classify what lies before it.
$matchAtIndexInOld = $indexInOld === $match->getStartInOld();
$matchAtIndexInNew = $indexInNew === $match->getStartInNew();
$action = 'equal';
if (!$matchAtIndexInOld && !$matchAtIndexInNew) {
$action = 'replace';
} elseif ($matchAtIndexInOld && !$matchAtIndexInNew) {
$action = 'insert';
} elseif (!$matchAtIndexInOld && $matchAtIndexInNew) {
$action = 'delete';
if ($action !== 'equal') {
// NOTE(review): the Operation constructor arguments are not visible in this view.
$operations[] = new Operation(
$operations[] = new Operation(
// Move both cursors to the end of the current match.
$indexInOld = $match->getEndInOld();
$indexInNew = $match->getEndInNew();
// Passed to every handler below, so cells spanning several rows are tracked across rows.
$appliedRowSpans = array();
// process operations
foreach ($operations as $operation) {
// NOTE(review): no break statements are visible between the cases below - confirm that each case ends with one.
switch ($operation->action) {
case 'equal':
$this->processEqualOperation($operation, $oldRows, $newRows, $appliedRowSpans);
case 'delete':
$this->processDeleteOperation($operation, $oldRows, $appliedRowSpans);
case 'insert':
$this->processInsertOperation($operation, $newRows, $appliedRowSpans);
case 'replace':
$this->processReplaceOperation($operation, $oldRows, $newRows, $appliedRowSpans);
* @param Operation $operation
* @param array $newRows
* @param array $appliedRowSpans
* @param bool $forceExpansion
// Emits one diff row for each new row covered by the operation, with no old counterpart.
protected function processInsertOperation(
Operation $operation,
// NOTE(review): the $newRows and $appliedRowSpans parameters used below are not visible in this view of the signature.
$forceExpansion = false
) {
// Slice [startInNew, endInNew) out of the new rows.
$targetRows = array_slice($newRows, $operation->startInNew, $operation->endInNew - $operation->startInNew);
foreach ($targetRows as $row) {
// null as the old row tells diffAndAppendRows() there is nothing to compare against.
$this->diffAndAppendRows(null, $row, $appliedRowSpans, $forceExpansion);
* @param Operation $operation
* @param array $oldRows
* @param array $appliedRowSpans
* @param bool $forceExpansion
// Emits one diff row for each old row covered by the operation, with no new counterpart.
protected function processDeleteOperation(
Operation $operation,
// NOTE(review): the $oldRows and $appliedRowSpans parameters used below are not visible in this view of the signature.
$forceExpansion = false
) {
// Slice [startInOld, endInOld) out of the old rows.
$targetRows = array_slice($oldRows, $operation->startInOld, $operation->endInOld - $operation->startInOld);
foreach ($targetRows as $row) {
// null as the new row tells diffAndAppendRows() there is nothing to compare against.
$this->diffAndAppendRows($row, null, $appliedRowSpans, $forceExpansion);
* @param Operation $operation
* @param array $oldRows
* @param array $newRows
* @param array $appliedRowSpans
// Diffs the old and new rows covered by the operation pairwise, by their offset within the range.
protected function processEqualOperation(Operation $operation, $oldRows, $newRows, &$appliedRowSpans)
// array_values() renumbers each slice from 0 so both slices share the same offsets.
$targetOldRows = array_values(
array_slice($oldRows, $operation->startInOld, $operation->endInOld - $operation->startInOld)
$targetNewRows = array_values(
array_slice($newRows, $operation->startInNew, $operation->endInNew - $operation->startInNew)
foreach ($targetNewRows as $index => $newRow) {
// NOTE(review): the body of this guard is not visible in this view; presumably it skips new rows with no old partner - confirm.
if (!isset($targetOldRows[$index])) {
$this->diffAndAppendRows($targetOldRows[$index], $newRow, $appliedRowSpans);
/**
 * Handles a replace as a delete of the old rows followed by an insert of the
 * new rows, with expansion forced for both halves.
 *
 * @param Operation $operation
 * @param array     $oldRows
 * @param array     $newRows
 * @param array     $appliedRowSpans Passed by reference to both handlers.
 */
protected function processReplaceOperation(Operation $operation, $oldRows, $newRows, &$appliedRowSpans)
{
    $forceExpansion = true;

    $this->processDeleteOperation($operation, $oldRows, $appliedRowSpans, $forceExpansion);
    $this->processInsertOperation($operation, $newRows, $appliedRowSpans, $forceExpansion);
}
/**
 * Collects the row matches for the complete old and new row ranges.
 *
 * @param array $oldMatchData Only its element count is used, as the old-side upper bound.
 * @param array $newMatchData Score matrix handed to findRowMatches().
 *
 * @return array Matches appended by findRowMatches().
 */
protected function getRowMatches($oldMatchData, $newMatchData)
{
    $matches = array();

    // Search window: [0, count) on both sides.
    $this->findRowMatches($newMatchData, 0, count($oldMatchData), 0, count($newMatchData), $matches);

    return $matches;
}
* @param array $newMatchData
* @param int $startInOld
* @param int $endInOld
* @param int $startInNew
* @param int $endInNew
* @param array $matches
// Finds the best match inside the given window and appends it to $matches (passed by reference).
protected function findRowMatches($newMatchData, $startInOld, $endInOld, $startInNew, $endInNew, &$matches)
$match = $this->findRowMatch($newMatchData, $startInOld, $endInOld, $startInNew, $endInNew);
if ($match !== null) {
// True when rows remain before the match on both sides.
// NOTE(review): the body of this branch is not visible in this view; presumably it searches the region before the match - confirm.
if ($startInOld < $match->getStartInOld() &&
$startInNew < $match->getStartInNew()
) {
$matches[] = $match;
// True when rows remain after the match on both sides.
// NOTE(review): the body of this branch is not visible in this view; presumably it searches the region after the match - confirm.
if ($match->getEndInOld() < $endInOld &&
$match->getEndInNew() < $endInNew
) {
* @param array $newMatchData
* @param int $startInOld
* @param int $endInOld
* @param int $startInNew
* @param int $endInNew
* @return RowMatch|null
// Scans the score matrix for the highest-scoring old/new pair and wraps it in a RowMatch.
protected function findRowMatch($newMatchData, $startInOld, $endInOld, $startInNew, $endInNew)
$bestMatch = null;
// Starting at 0 means only strictly positive scores can be selected.
$bestPercentage = 0;
foreach ($newMatchData as $newIndex => $oldMatches) {
// NOTE(review): the bodies of the four range checks below are not visible in this view; presumably they skip indexes outside [start, end) - confirm.
if ($newIndex < $startInNew) {
if ($newIndex >= $endInNew) {
foreach ($oldMatches as $oldIndex => $percentage) {
if ($oldIndex < $startInOld) {
if ($oldIndex >= $endInOld) {
// Strict > keeps the first pair encountered when several pairs tie.
if ($percentage > $bestPercentage) {
$bestPercentage = $percentage;
$bestMatch = array(
'oldIndex' => $oldIndex,
'newIndex' => $newIndex,
'percentage' => $percentage,
if ($bestMatch !== null) {
// NOTE(review): only two of the RowMatch constructor arguments are visible in this view.
return new RowMatch(
$bestMatch['newIndex'] + 1,
$bestMatch['oldIndex'] + 1,
return null;
* @param TableRow|null $oldRow
* @param TableRow|null $newRow
* @param array $appliedRowSpans
* @param bool $forceExpansion
* @return array
// Builds the diff <tr> for a pair of rows (either side may be null) and, when the
// colspans of paired cells differ, an additional row. Returns array($diffRow, $extraRow).
protected function diffRows($oldRow, $newRow, array &$appliedRowSpans, $forceExpansion = false)
// create tr dom element
$rowToClone = $newRow ?: $oldRow;
/* @var $diffRow \DOMElement */
// Shallow clone: only the <tr> element itself is imported, not its cells.
$diffRow = $this->diffDom->importNode($rowToClone->getDomNode()->cloneNode(false), false);
$oldCells = $oldRow ? $oldRow->getCells() : array();
$newCells = $newRow ? $newRow->getCells() : array();
// Tracks the cell index and column counter for both rows.
$position = new DiffRowPosition();
$extraRow = null;
/* @var $expandCells \DOMElement[] */
$expandCells = array();
/* @var $cellsWithMultipleRows \DOMElement[] */
$cellsWithMultipleRows = array();
$newCellCount = count($newCells);
while ($position->getIndexInNew() < $newCellCount) {
// The two sides are at different columns: let the side that is behind catch up.
if (!$position->areColumnsEqual()) {
$type = $position->getLesserColumnType();
if ($type === 'new') {
$row = $newRow;
$targetRow = $extraRow;
} else {
$row = $oldRow;
$targetRow = $diffRow;
// NOTE(review): `!$type === 'old'` negates $type before comparing, so it evaluates `false === 'old'` and is always false; `$type !== 'old'` was probably intended - confirm.
// NOTE(review): whatever follows the syncVirtualColumns() call inside this branch is not visible in this view.
if ($row && $targetRow && (!$type === 'old' || isset($oldCells[$position->getIndexInOld()]))) {
$this->syncVirtualColumns($row, $position, $cellsWithMultipleRows, $targetRow, $type, true);
/* @var $newCell TableCell */
$newCell = $newCells[$position->getIndexInNew()];
/* @var $oldCell TableCell */
$oldCell = isset($oldCells[$position->getIndexInOld()]) ? $oldCells[$position->getIndexInOld()] : null;
// Paired cells with different colspans need the extra row, created on first use.
if ($oldCell && $newCell->getColspan() != $oldCell->getColspan()) {
if (null === $extraRow) {
/* @var $extraRow \DOMElement */
$extraRow = $this->diffDom->importNode($rowToClone->getDomNode()->cloneNode(false), false);
// NOTE(review): any statements preceding the syncVirtualColumns() calls in these two branches are not visible in this view.
if ($oldCell->getColspan() > $newCell->getColspan()) {
$this->syncVirtualColumns($newRow, $position, $cellsWithMultipleRows, $extraRow, 'new', true);
} else {
$this->syncVirtualColumns($oldRow, $position, $cellsWithMultipleRows, $diffRow, 'old', true);
} else {
// NOTE(review): the arguments of this call are not visible in this view.
$diffCell = $this->diffCellsAndIncrementCounters(
$expandCells[] = $diffCell;
// Handle old cells left over once every new cell has been consumed.
$oldCellCount = count($oldCells);
while ($position->getIndexInOld() < $oldCellCount) {
// NOTE(review): the arguments of this call are not visible in this view.
$diffCell = $this->diffCellsAndIncrementCounters(
$expandCells[] = $diffCell;
// When an extra row exists, the collected cells grow by one rowspan.
if ($extraRow) {
foreach ($expandCells as $expandCell) {
$rowspan = $expandCell->getAttribute('rowspan') ?: 1;
$expandCell->setAttribute('rowspan', 1 + $rowspan);
// Cells recorded in $appliedRowSpans by earlier calls are also extended by one row.
if ($extraRow || $forceExpansion) {
foreach ($appliedRowSpans as $rowSpanCells) {
/* @var $rowSpanCells \DOMElement[] */
foreach ($rowSpanCells as $extendCell) {
$rowspan = $extendCell->getAttribute('rowspan') ?: 1;
$extendCell->setAttribute('rowspan', 1 + $rowspan);
if (!$forceExpansion) {
// NOTE(review): statements between this guard and the array_values() call may be missing from this view.
$appliedRowSpans = array_values($appliedRowSpans);
// Record this row's multi-row cell groups for the rows that follow.
$appliedRowSpans = array_merge($appliedRowSpans, array_values($cellsWithMultipleRows));
return array($diffRow, $extraRow);
/**
 * Creates the empty cell element that will carry the diff of the two cells.
 *
 * With both cells present, the new cell's element is shallow-cloned and given
 * the larger rowspan and the larger colspan of the pair. With only one cell
 * present, that cell's element is shallow-cloned as is.
 *
 * @param TableCell|null $oldCell
 * @param TableCell|null $newCell
 *
 * @return \DOMElement The clone, imported into the diff document.
 */
protected function getNewCellNode(TableCell $oldCell = null, TableCell $newCell = null)
{
    if ($oldCell && $newCell) {
        $oldNode = $oldCell->getDomNode();
        $newNode = $newCell->getDomNode();

        /* @var $clone \DOMElement */
        $clone = $newNode->cloneNode(false);

        foreach (array('rowspan', 'colspan') as $spanAttribute) {
            // An empty attribute value counts as a span of 1.
            $oldSpan = $oldNode->getAttribute($spanAttribute) ?: 1;
            $newSpan = $newNode->getAttribute($spanAttribute) ?: 1;
            $clone->setAttribute($spanAttribute, max($oldSpan, $newSpan));
        }
    } else {
        // If only one cell exists, use it
        $onlyCell = $newCell ? $newCell : $oldCell;
        $clone = $onlyCell->getDomNode()->cloneNode(false);
    }

    return $this->diffDom->importNode($clone);
}
* @param TableCell|null $oldCell
* @param TableCell|null $newCell
* @param bool $usingExtraRow
* @return \DOMElement
// Builds the diff cell element for a pair of cells: diffs their inner HTML and tags the cell with CSS classes.
protected function diffCells($oldCell, $newCell, $usingExtraRow = false)
$diffCell = $this->getNewCellNode($oldCell, $newCell);
// A missing cell contributes empty content.
$oldContent = $oldCell ? $this->getInnerHtml($oldCell->getDomNode()) : '';
$newContent = $newCell ? $this->getInnerHtml($newCell->getDomNode()) : '';
// NOTE(review): any arguments after these two are not visible in this view.
$htmlDiff = HtmlDiff::create(
mb_convert_encoding($oldContent, 'UTF-8', 'HTML-ENTITIES'),
mb_convert_encoding($newContent, 'UTF-8', 'HTML-ENTITIES'),
$diff = $htmlDiff->build();
$this->setInnerHtml($diffCell, $diff);
// Append "del" when there is no new cell; trim() removes the leading space when the class was empty.
if (null === $newCell) {
$diffCell->setAttribute('class', trim($diffCell->getAttribute('class').' del'));
// Append "ins" when there is no old cell.
if (null === $oldCell) {
$diffCell->setAttribute('class', trim($diffCell->getAttribute('class').' ins'));
// Append "extra-row" when the caller says the cell belongs to the extra row.
if ($usingExtraRow) {
$diffCell->setAttribute('class', trim($diffCell->getAttribute('class').' extra-row'));
return $diffCell;
/**
 * Parses the old and the new HTML text into Table structures and stores them
 * in $this->oldTable and $this->newTable (old first, then new).
 */
protected function buildTableDoms()
{
    $parsedOld = $this->parseTableStructure($this->oldText);
    $this->oldTable = $parsedOld;

    $parsedNew = $this->parseTableStructure($this->newText);
    $this->newTable = $parsedNew;
}
* @param string $text
* @return \DOMDocument
// Creates a DOMDocument for the given HTML text.
protected function createDocumentWithHtml($text)
$dom = new \DOMDocument();
// The text is converted from its detected encoding to the configured one and then purified.
// NOTE(review): the call that receives this expression (and its remaining arguments) is not visible in this view.
$this->purifier->purify(mb_convert_encoding($text, $this->config->getEncoding(), mb_detect_encoding($text))),
return $dom;
* @param string $text
* @return Table
// Wraps the first <table> element found in $text in a Table object.
protected function parseTableStructure($text)
$dom = $this->createDocumentWithHtml($text);
// item(0) selects the first <table>; it is null when the text contains none.
$tableNode = $dom->getElementsByTagName('table')->item(0);
$table = new Table($tableNode);
// NOTE(review): any step that fills the table with rows is not visible in this view.
return $table;
* @param Table $table
* @param \DOMNode|null $node
// Walks the DOM below $node (the table's own node by default) looking for <tr> elements.
protected function parseTable(Table $table, \DOMNode $node = null)
if ($node === null) {
$node = $table->getDomNode();
// NOTE(review): the body of this guard is not visible in this view; presumably it returns early - confirm.
if (!$node->childNodes) {
foreach ($node->childNodes as $child) {
if ($child->nodeName === 'tr') {
// NOTE(review): what happens to $row after construction is not visible in this view.
$row = new TableRow($child);
} else {
// Any other child is searched recursively for rows.
$this->parseTable($table, $child);
* @param TableRow $row
// Creates a TableCell for every direct <td>/<th> child of the row's DOM node.
protected function parseTableRow(TableRow $row)
$node = $row->getDomNode();
foreach ($node->childNodes as $child) {
if (in_array($child->nodeName, array('td', 'th'))) {
// NOTE(review): what happens to $cell after construction is not visible in this view; presumably it is added to $row - confirm.
$cell = new TableCell($child);
/**
 * Serialises the children of $node, in document order, into one HTML string.
 *
 * @param \DOMNode $node
 *
 * @return string Empty string when the node has no children.
 */
protected function getInnerHtml($node)
{
    $fragments = array();

    foreach ($node->childNodes as $childNode) {
        $fragments[] = $this->htmlFromNode($childNode);
    }

    return implode('', $fragments);
}
* @param \DOMNode $node
* @return string
// Serialises $node by deep-importing it into a scratch DOMDocument.
protected function htmlFromNode($node)
$domDocument = new \DOMDocument();
// importNode() with true copies the node together with its whole subtree.
// NOTE(review): attaching $newNode to $domDocument is not visible in this view; importNode() alone does not insert the node - confirm.
$newNode = $domDocument->importNode($node, true);
return $domDocument->saveHTML();
* @param \DOMNode $node
* @param string $html
// Parses $html and copies the resulting <body> children into a fragment owned by $node's document.
protected function setInnerHtml($node, $html)
// DOMDocument::loadHTML does not allow empty strings.
if (strlen($html) === 0) {
$html = '<span class="empty"></span>';
$doc = $this->createDocumentWithHtml($html);
$fragment = $node->ownerDocument->createDocumentFragment();
$root = $doc->getElementsByTagName('body')->item(0);
foreach ($root->childNodes as $child) {
// Nodes from $doc must be imported before they can be placed in another document.
$fragment->appendChild($node->ownerDocument->importNode($child, true));
// NOTE(review): attaching $fragment to $node is not visible in this view.
/**
 * Records, for every cell of $table, its position under the cell's trimmed
 * text content in $this->cellValues.
 *
 * @param Table $table
 */
protected function indexCellValues(Table $table)
{
    foreach ($table->getRows() as $rowIndex => $row) {
        foreach ($row->getCells() as $cellIndex => $cell) {
            $text = trim($cell->getDomNode()->textContent);
            $cellPosition = new TablePosition($rowIndex, $cellIndex);

            if (isset($this->cellValues[$text])) {
                $this->cellValues[$text][] = $cellPosition;
            } else {
                // First occurrence of this text: start its position list.
                $this->cellValues[$text] = array($cellPosition);
            }
        }
    }
}
* @param TableRow $tableRow
* @param DiffRowPosition $position
* @param array $cellsWithMultipleRows
* @param \DOMNode $diffRow
* @param string $diffType
* @param bool $usingExtraRow
// Emits one-sided diff cells for $diffType until that side's column counter is no longer behind the other side's, or its row has no more cells.
protected function syncVirtualColumns(
// NOTE(review): the $tableRow, $cellsWithMultipleRows, $diffRow and $diffType parameters used below are not visible in this view of the signature.
DiffRowPosition $position,
$usingExtraRow = false
) {
$currentCell = $tableRow->getCell($position->getIndex($diffType));
while ($position->isColumnLessThanOther($diffType) && $currentCell) {
// For 'new' the cell is diffed with no old counterpart.
// NOTE(review): the arguments of the alternative call are not visible in this view.
$diffCell = $diffType === 'new' ? $this->diffCells(null, $currentCell, $usingExtraRow) : $this->diffCells(
// Store cell in appliedRowSpans if spans multiple rows
if ($diffCell->getAttribute('rowspan') > 1) {
// Cells are grouped under their rowspan value.
$cellsWithMultipleRows[$diffCell->getAttribute('rowspan')][] = $diffCell;
// The column counter advances by the cell's colspan, the cell index by one.
$position->incrementColumn($diffType, $currentCell->getColspan());
$currentCell = $tableRow->getCell($position->incrementIndex($diffType));
* @param null|TableCell $oldCell
* @param null|TableCell $newCell
* @param array $cellsWithMultipleRows
* @param \DOMElement $diffRow
* @param DiffRowPosition $position
* @param bool $usingExtraRow
* @return \DOMElement
// Diffs one pair of cells and returns the resulting diff cell.
protected function diffCellsAndIncrementCounters(
// NOTE(review): the $oldCell, $newCell, $cellsWithMultipleRows and $diffRow parameters are not visible in this view of the signature.
DiffRowPosition $position,
$usingExtraRow = false
) {
$diffCell = $this->diffCells($oldCell, $newCell, $usingExtraRow);
// Store cell in appliedRowSpans if spans multiple rows
if ($diffCell->getAttribute('rowspan') > 1) {
// Cells are grouped under their rowspan value.
$cellsWithMultipleRows[$diffCell->getAttribute('rowspan')][] = $diffCell;
// NOTE(review): the bodies of the two guards below are not visible in this view; presumably they advance $position for the side that supplied a cell - confirm.
if ($newCell !== null) {
if ($oldCell !== null) {
return $diffCell;
* @param TableRow|null $oldRow
* @param TableRow|null $newRow
* @param array $appliedRowSpans
* @param bool $forceExpansion
// Diffs one pair of rows via diffRows(), which returns the diff row and an optional extra row.
protected function diffAndAppendRows($oldRow, $newRow, &$appliedRowSpans, $forceExpansion = false)
// NOTE(review): the diffRows() arguments and the statements that use $rowDom and $extraRow are not visible in this view.
list($rowDom, $extraRow) = $this->diffRows(
if ($extraRow) {
/**
 * Scores how closely two rows match.
 *
 * Cell similarities above half the configured match threshold are summed
 * (a first cell above 95% is weighted 1.5x) and divided by a maximum that
 * grows with the distance between the two row indexes.
 *
 * @param TableRow $oldRow
 * @param TableRow $newRow
 * @param int      $oldIndex Index of $oldRow among the old rows.
 * @param int      $newIndex Index of $newRow among the new rows.
 *
 * @return float|int Summed score divided by the maximum; 0 when the maximum is not positive.
 */
protected function getMatchPercentage(TableRow $oldRow, TableRow $newRow, $oldIndex, $newIndex)
{
    $firstCellWeight = 1.5;
    $rowDistancePenalty = 0.25 * (abs($oldIndex - $newIndex));
    $sharedCellCount = min(count($newRow->getCells()), count($oldRow->getCells()));
    $maximumScore = ($sharedCellCount + $firstCellWeight + $rowDistancePenalty) * 100;

    $score = 0;
    foreach ($newRow->getCells() as $cellIndex => $newCell) {
        $oldCell = $oldRow->getCell($cellIndex);
        if (!$oldCell) {
            continue;
        }

        $similarity = null;
        similar_text($oldCell->getInnerHtml(), $newCell->getInnerHtml(), $similarity);

        // Cells at or below half the configured threshold contribute nothing.
        if (!($similarity > ($this->config->getMatchThreshold() * 0.50))) {
            continue;
        }

        $isNearIdenticalFirstCell = $cellIndex === 0 && $similarity > 95;
        $score += $isNearIdenticalFirstCell ? $similarity * $firstCellWeight : $similarity;
    }

    return ($maximumScore > 0) ? ($score / $maximumScore) : 0;
}

@ -0,0 +1,75 @@
namespace Caxy\HtmlDiff\Table;
/**
 * Plain holder for a matched range: start and end offsets in the old and in
 * the new sequence. The properties are public and also exposed via getters.
 *
 * @package Caxy\HtmlDiff\Table
 */
class TableMatch
{
    /** @var int */
    public $startInOld;

    /** @var int */
    public $startInNew;

    /** @var int */
    public $endInOld;

    /** @var int */
    public $endInNew;

    /**
     * Note the argument order: each "old" offset precedes its "new" counterpart.
     *
     * @param int $startInOld
     * @param int $startInNew
     * @param int $endInOld
     * @param int $endInNew
     */
    public function __construct($startInOld, $startInNew, $endInOld, $endInNew)
    {
        $this->startInOld = $startInOld;
        $this->startInNew = $startInNew;
        $this->endInOld = $endInOld;
        $this->endInNew = $endInNew;
    }

    /**
     * @return int
     */
    public function getStartInOld()
    {
        return $this->startInOld;
    }

    /**
     * @return int
     */
    public function getStartInNew()
    {
        return $this->startInNew;
    }

    /**
     * @return int
     */
    public function getEndInOld()
    {
        return $this->endInOld;
    }

    /**
     * @return int
     */
    public function getEndInNew()
    {
        return $this->endInNew;
    }
}

@ -0,0 +1,70 @@
namespace Caxy\HtmlDiff\Table;
/**
 * Row/cell coordinate inside a table.
 *
 * @package Caxy\HtmlDiff\Table
 */
class TablePosition
{
    /** @var int */
    public $row;

    /** @var int */
    public $cell;

    /**
     * @param int $row
     * @param int $cell
     */
    public function __construct($row, $cell)
    {
        $this->row = $row;
        $this->cell = $cell;
    }

    /**
     * @return int
     */
    public function getRow()
    {
        return $this->row;
    }

    /**
     * @return int
     */
    public function getCell()
    {
        return $this->cell;
    }

    /**
     * Renders the position as "row:cell".
     *
     * @return string
     */
    public function __toString()
    {
        return implode(':', array($this->row, $this->cell));
    }

    /**
     * Orders positions by row first, then by cell.
     *
     * @param TablePosition $a
     * @param TablePosition $b
     *
     * @return int Negative, zero or positive: the cell difference when the
     *             rows are equal, the row difference otherwise.
     */
    public static function compare($a, $b)
    {
        $onSameRow = $a->getRow() == $b->getRow();

        return $onSameRow
            ? $a->getCell() - $b->getCell()
            : $a->getRow() - $b->getRow();
    }
}

@ -0,0 +1,106 @@
namespace Caxy\HtmlDiff\Table;
* Class TableRow
* @package Caxy\HtmlDiff\Table
// Table row element: keeps a reference to its owning table and an ordered list of its cells.
class TableRow extends AbstractTableElement
* @var Table
protected $table;
* @var TableCell[]
protected $cells = array();
* @return Table
public function getTable()
return $this->table;
* @param Table|null $table
* @return $this
public function setTable(Table $table = null)
$this->table = $table;
// NOTE(review): in_array() is called without its strict flag, so rows are compared loosely rather than by identity - confirm whether a strict comparison was intended.
// NOTE(review): the body of this branch is not visible in this view.
if ($table && !in_array($this, $table->getRows())) {
return $this;
* @return TableCell[]
public function getCells()
return $this->cells;
* @param TableCell $cell
* @return $this
public function addCell(TableCell $cell)
// Appends the cell to the end of the cell list.
$this->cells[] = $cell;
// NOTE(review): the branch body is not visible in this view; presumably it links the cell back to this row - confirm.
if (!$cell->getRow()) {
return $this;
* @param TableCell $cell
public function removeCell(TableCell $cell)
// Strict search: the cell is located by identity.
$key = array_search($cell, $this->cells, true);
// array_search() yields false on a miss; key 0 is a valid hit, hence the strict comparison.
if ($key !== false) {
// NOTE(review): the statements guarded by these two conditions are not visible in this view.
if ($cell->getRow()) {
* @param int $index
* @return TableCell|null
public function getCell($index)
// Null when nothing is set at $index.
return isset($this->cells[$index]) ? $this->cells[$index] : null;
* @param TableCell[] $cells
* @param null|int $position
public function insertCells($cells, $position = null)
// A null position appends the cells; otherwise they are spliced in at the offset and nothing is removed.
if ($position === null) {
$this->cells = array_merge($this->cells, $cells);
} else {
array_splice($this->cells, $position, 0, $cells);

@ -0,0 +1,26 @@
<?xml version="1.0" encoding="utf-8"?>
<phpunit backupGlobals="false"
<testsuite name="php-htmldiff Test Suite">
<whitelist processUncoveredFilesFromWhitelist="true">
<directory suffix=".php">./lib</directory>

@ -0,0 +1,40 @@
namespace Caxy\Tests\HtmlDiff\Functional;
use Caxy\HtmlDiff\HtmlDiff;
use Caxy\Tests\HtmlDiff\HtmlFileIterator;
// Functional test: runs HtmlDiff over every data set supplied by diffContentProvider().
class HtmlDiffFunctionalTest extends \PHPUnit_Framework_TestCase
* @dataProvider diffContentProvider
* @param $oldText
* @param $newText
* @param $expected
public function testHtmlDiff($oldText, $newText, $expected)
// Both inputs are trimmed before diffing; the fourth constructor argument is an empty array.
$diff = new HtmlDiff(trim($oldText), trim($newText), 'UTF-8', array());
$output = $diff->build();
// Expected and actual output go through the same whitespace normalisation before comparison.
static::assertEquals($this->stripExtraWhitespaceAndNewLines($expected), $this->stripExtraWhitespaceAndNewLines($output));
public function diffContentProvider()
// The iterator is built over the HtmlDiff fixture directory, resolved relative to this file.
return new HtmlFileIterator(__DIR__.'/../../../../fixtures/HtmlDiff');
protected function stripExtraWhitespaceAndNewLines($text)
return trim(
// Inner call deletes CR/LF characters; outer call collapses each whitespace run into a single space.
// NOTE(review): the enclosing call structure is only partly visible in this view.
preg_replace('/\s+/S', " ", preg_replace("/[\n\r]/", '', $text))

@ -0,0 +1,103 @@
namespace Caxy\Tests\HtmlDiff;
// Iterator over the *.html fixture files of a directory; each element is array(oldText, newText, expected).
class HtmlFileIterator implements \Iterator
// Paths returned by glob() for the directory.
protected $files = array();
// Index of the current entry in $files.
protected $key = 0;
// Parsed fixtures, cached by file name.
protected $loadedDiffs = array();
public function __construct($directory)
// NOTE(review): glob() returns false on error, which would replace the array default - confirm callers tolerate that.
$this->files = glob($directory.DIRECTORY_SEPARATOR."*.html");
* Return the current element
* @link
* @return mixed Can return any type.
* @since 5.0.0
public function current()
return $this->loadHtmlFile($this->key);
* Move forward to next element
* @link
* @return void Any returned value is ignored.
* @since 5.0.0
// NOTE(review): the body of next() is not visible in this view; presumably it advances $this->key - confirm.
public function next()
* Return the key of the current element
* @link
* @return mixed scalar on success, or null on failure.
* @since 5.0.0
public function key()
// The iteration key is the fixture's file name without its directory.
return basename($this->files[$this->key]);
* Checks if current position is valid
* @link
* @return boolean The return value will be casted to boolean and then evaluated.
* Returns true on success or false on failure.
* @since 5.0.0
public function valid()
return isset($this->files[$this->key]);
* Rewind the Iterator to the first element
* @link
* @return void Any returned value is ignored.
* @since 5.0.0
public function rewind()
$this->key = 0;
protected function loadHtmlFile($key)
$filename = $this->files[$key];
// Parse each file once; later requests are served from $loadedDiffs.
if (!isset($this->loadedDiffs[$filename])) {
$html = file_get_contents($filename);
$oldText = $this->parseTagContent('oldText', $html);
$newText = $this->parseTagContent('newText', $html);
$expected = $this->parseTagContent('expected', $html);
// Only the <expected> tag is checked here; $oldText and $newText may be null.
if (null === $expected) {
throw new \Exception('HTML fixture content should have an <expected> tag.');
$this->loadedDiffs[$filename] = array($oldText, $newText, $expected);
return $this->loadedDiffs[$filename];
protected function parseTagContent($tagName, $html)
$matches = array();
// Case-insensitive, dot-matches-newline; the greedy (.*) extends to the last closing tag of that name.
if (preg_match(sprintf('/<%s\s*[^>]*>(.*)<\/%s\s*>/is', $tagName, $tagName), $html, $matches)) {
return $matches[1];
return null;

@ -0,0 +1,14 @@
* This file bootstraps the test environment.
namespace Caxy\Tests;
// Report every error level while the tests run.
error_reporting(E_ALL | E_STRICT);

// Composer's autoloader is mandatory: load it when present, otherwise abort
// with a hint on how to install the dependencies.
if (file_exists(__DIR__ . '/../../../vendor/autoload.php')) {
    require __DIR__ . '/../../../vendor/autoload.php';
} else {
    throw new \Exception('Can\'t find autoload.php. Did you install dependencies via composer?');
}

@ -0,0 +1,13 @@
Compliance with this section requires that the provisions identified in Sections R401 through R404 labeled as "mandatory" and Section R403.5.3 be met. The building thermal envelope shall be greater than or equal to levels of efficiency and Solar Heat Gain Coefficient in Table 402.1.1 or 402.1.3 of the 2009 <em>International Energy Conservation Code</em>.<ul class="exception"><li><strong>Exception:</strong> Supply and return ducts not completely inside the building thermal envelope shall be insulated to a minimum of R-6.</li></ul>
<p>Compliance with this section requires that the provisions identified in Sections R401 through R404 labeled as "mandatory" and Section R403.5.3 shall be met. Fenestration U-factor and SHGC shall not exceed the maximum values for the climate zone set forth in Table R402.1.2. The remaining components of the building thermal envelope shall comply with either the minimum R-values or maximum U-factors for the climate zones specified in Table R402.1.2 and R402.1.4.</p>
<ul class="exception"><li><strong>Exception:</strong> Supply and return ducts not completely inside the building thermal envelope shall be insulated to a minimum of R-6.</li>
<p class="diffmod">Compliance with this section requires that the provisions identified in Sections R401 through R404 labeled as "mandatory" and Section R403.5.3 <ins class="diffins">shall </ins>be met. <ins class="diffins">Fenestration U-factor and SHGC shall not exceed the maximum values for the climate zone set forth in Table R402.1.2. </ins>The<ins class="diffins"> remaining components of the</ins> building thermal envelope shall <del class="diffmod">be greater than</del><ins class="diffmod">comply with either the minimum R-values</ins> or <del class="diffmod">equal to levels of efficiency and Solar Heat Gain Coefficient</del><ins class="diffmod">maximum U-factors for the climate zones specified</ins> in Table <del class="diffmod">402.1.1 or 402.1.3 of the 2009 </del><em class="diffmod"><del class="diffmod">International Energy Conservation Code</del></em><ins class="diffmod">R402.1.2 and R402.1.4</ins>.</p><ins class="diffins"> </ins><ul class="exception" class="diff-list"><li class="normal"><strong>Exception:</strong> Supply and return ducts not completely inside the building thermal envelope shall be insulated to a minimum of R-6.</li></ul>

@ -0,0 +1,39 @@
Etiam feugiat lorem non metus. Nullam accumsan lorem in dui.
Praesent ac sem eget est egestas volutpat. Nulla neque dolor, sagittis eget, iaculis quis, molestie non, velit. Maecenas tempus, tellus eget condimentum rhoncus, sem quam semper libero, sit amet adipiscing sem neque sed ipsum. Integer ante arcu, accumsan a, consectetuer eget, posuere ut, mauris. Aenean massa.
Vestibulum suscipit nulla quis orci. Integer ante arcu, accumsan a, consectetuer eget, posuere ut, mauris. Class aptent taciti sociosqu ad litora torquent per conubia nostra, per inceptos hymenaeos.
Suspendisse non nisl sit amet velit hendrerit rutrum. Aenean massa. Curabitur ullamcorper ultricies nisi. Praesent vestibulum dapibus nibh. In dui magna, posuere eget, vestibulum et, tempor auctor, justo.
Suspendisse non nisl sit amet velit hendrerit rutrum. Aenean massa. Curabitur ullamcorper ultricies nisi. Praesent vestibulum dapibus nibh. In dui magna, posuere eget, vestibulum et, tempor auctor, justo.
Donec pede justo, fringilla vel, aliquet nec, vulputate eget, arcu.
Duis lobortis massa imperdiet quam. Donec sodales sagittis magna. Nam ipsum risus, rutrum vitae, vestibulum eu, molestie vel, lacus. Suspendisse eu ligula. Morbi nec metus.
<ol class="diff-list"><li class="normal"><del class="diffmod">Etiam feugiat lorem</del><ins class="diffmod">Suspendisse</ins> non <del class="diffmod">metus</del><ins class="diffmod">nisl sit amet velit hendrerit rutrum</ins>. <del class="diffmod">Nullam accumsan lorem in</del><ins class="diffmod">Aenean massa. Curabitur ullamcorper ultricies nisi. Praesent vestibulum dapibus nibh. In</ins> dui<ins class="diffins"> magna, posuere eget, vestibulum et, tempor auctor, justo</ins>.</li><li class="normal"><del class="diffmod">Praesent ac sem eget est egestas volutpat. Nulla neque dolor</del><ins class="diffmod">Donec pede justo</ins>, <del class="diffmod">sagittis</del><ins class="diffmod">fringilla vel, aliquet nec, vulputate</ins> eget, <del class="diffmod">iaculis quis, molestie non, velit</del><ins class="diffmod">arcu</ins>.<del class="diffdel"> Maecenas tempus, tellus eget condimentum rhoncus, sem quam semper libero, sit amet adipiscing sem neque sed ipsum. Integer ante arcu, accumsan a, consectetuer eget, posuere ut, mauris. Aenean massa.</del></li><li class="normal"><del class="diffmod">Vestibulum suscipit nulla quis orci</del><ins class="diffmod">Duis lobortis massa imperdiet quam</ins>. <del class="diffmod">Integer ante arcu</del><ins class="diffmod">Donec sodales sagittis magna. Nam ipsum risus</ins>, <del class="diffmod">accumsan a</del><ins class="diffmod">rutrum vitae</ins>, <del class="diffmod">consectetuer eget</del><ins class="diffmod">vestibulum eu</ins>, <del class="diffmod">posuere ut</del><ins class="diffmod">molestie vel</ins>, <del class="diffmod">mauris</del><ins class="diffmod">lacus</ins>. <del class="diffmod">Class aptent taciti sociosqu ad litora torquent per conubia nostra, per inceptos hymenaeos</del><ins class="diffmod">Suspendisse eu ligula</ins>.<ins class="diffins"> Morbi nec metus.</ins></li><li class="removed"><del> Suspendisse non nisl sit amet velit hendrerit rutrum. Aenean massa. Curabitur ullamcorper ultricies nisi. 
Praesent vestibulum dapibus nibh. In dui magna, posuere eget, vestibulum et, tempor auctor, justo. </del></li></ol>

@ -0,0 +1,15 @@
Testing <a href="">Link Changes</a>
And when the link <a href="">stays the same</a>
Testing <a href="">Link Changes</a>
And when the link <a href="">stays the same</a>
Testing <del class="diffmod diff-href"><a href="">Link Changes</a></del><ins class="diffmod diff-href"><a href="">Link Changes</a></ins>
And when the link <a href="">stays the same</a>

File diff suppressed because one or more lines are too long

@ -0,0 +1,18 @@
<p>Air handling equipment and HVAC equipment shall be designed and installed to limit the amount of airflow that bypasses the air filters and shall comply with the following: </p>
<ol><li>Channels, racks and other filter retaining constructions that do not seal tightly to the filter frame by means of a friction fit shall be provided with a means to seal the filter frame to the filter retaining construction.</li>
<li>Where standard size filters are installed in banks of multiple filters, gaskets shall seal the gap between the frames of adjacent filters. As an alternative to gaskets, the frames of adjacent filters shall be compressed by means of spring elements that are built into the filter retaining construction.</li>
<li>Channels, racks and other filter retaining constructions shall be sealed to the duct or housing of the HVAC equipment served by the filters.</li>
<li>Filter access doors in ducts and HVAC equipment shall be designed to limit the amount of airflow that bypasses the filters.</li>
<li>Field or shop fabricated spacers shall not be installed for the purpose of replacing the intended size filter with a smaller size filter.</li>
<li>Gaskets and seals shall be provided with access for repair, maintenance and replacement.</li>
<p>Air handling equipment and HVAC equipment shall be designed and installed to limit the amount of airflow that bypasses the air filters. Filter access doors in ducts and HVAC equipment shall be designed to limit the amount of airflow that bypasses the filters. Channels, racks and other filter retaining constructions shall be sealed to the duct or housing of the HVAC equipment served by the filters. Field or shop fabricated spacers shall not be installed for the purpose of replacing the intended size filter with a smaller size filter.</p>
<p>Air handling equipment and HVAC equipment shall be designed and installed to limit the amount of airflow that bypasses the air filters<ins class="diffins">. Filter access doors in ducts</ins> and <ins class="diffins">HVAC equipment </ins>shall <del class="diffmod">comply</del><ins class="diffmod">be designed to limit the amount of airflow that bypasses the filters. Channels, racks and other filter retaining constructions shall be sealed to the duct or housing of the HVAC equipment served by the filters. Field or shop fabricated spacers shall not be installed for the purpose of replacing the intended size filter</ins> with <del class="diffmod">the following: </del><ins class="diffmod">a smaller size filter.</ins></p><del class="diffdel"> </del><ol class="diffmod"><li><del class="diffdel">Channels, racks and other filter retaining constructions that do not seal tightly to the filter frame by means of a friction fit shall be provided with a means to seal the filter frame to the filter retaining construction.</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Where standard size filters are installed in banks of multiple filters, gaskets shall seal the gap between the frames of adjacent filters. 
As an alternative to gaskets, the frames of adjacent filters shall be compressed by means of spring elements that are built into the filter retaining construction.</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Channels, racks and other filter retaining constructions shall be sealed to the duct or housing of the HVAC equipment served by the filters.</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Filter access doors in ducts and HVAC equipment shall be designed to limit the amount of airflow that bypasses the filters.</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Field or shop fabricated spacers shall not be installed for the purpose of replacing the intended size filter with a smaller size filter.</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Gaskets and seals shall be provided with access for repair, maintenance and replacement.</del></li><del class="diffdel"> </del></ol>

@ -0,0 +1,29 @@
<div>The path of egress travel to an exit shall not pass through more than one adjacent story.</div>
<div> </div>
<div style="padding-left:30px;"><strong>Exception:</strong> The path of egress travel to an exit shall be permitted to pass through more than one adjacent story in any of the following:</div>
<ol><li>In Group R-1, R-2 or R-3 occupancies, exit access stairways and ramps connecting four stories or less serving and contained within an individual dwelling unit or sleeping unit or live/work unit.</li>
<li>Exit access stairways serving and contained within a Group R-3 congregate residence or a Group R-4 facility.</li>
<li>Exit access stairways and ramps in open parking garages that serve only the parking garage.</li>
<li>Exit access stairways and ramps serving open-air assembly seating complying with the exit access travel distance requirements of Section 1029.7.</li>
<li>Exit access stairways and ramps between the balcony, gallery or press box and the main assembly floor in occupancies such as theaters, places of religious worship, auditoriums and sports facilities.</li>
</ol><div> </div>
<div>The path of egress travel to an exit shall not pass through more than one adjacent story.</div>
<div> </div>
<div style="padding-left:30px;"><strong>Exception:</strong> The path of egress travel to an exit shall be permitted to pass through more than one adjacent story in any of the following:</div>
<ol><li>In Group R-1, R-2 or R-3 occupancies, exit access stairways and ramps connecting four stories or less serving and contained within an individual dwelling unit or sleeping unit or live/work unit.</li>
<li>Exit access stairways serving and contained within a Group R-3 congregate residence or a Group R-4 facility.</li>
<li>Exit access stairways and ramps in open parking garages that serve only the parking garage.</li>
<li>Exit access stairways and ramps in buildings equipped throughout with an automatic sprinkler system in accordance with Section 903.3.1.1, where the area of the vertical opening between stories does not exceed twice the horizontal projected area of the stairway or ramp and the opening is protected by a draft curtain and closely spaced sprinklers in accordance with NFPA 13. In other than Group B and M occupancies, this provision is limited to openings that do not connect more than four stories.</li>
<li>Exit access stairways and ramps within an atrium complying with the provisions of Section 404.</li>
<li>Exit access stairways and ramps serving open-air assembly seating complying with the exit access travel distance requirements of Section 1029.7.</li>
<li>Exit access stairways and ramps between the balcony, gallery or press box and the main assembly floor in occupancies such as theaters, places of religious worship, auditoriums and sports facilities.</li>
</ol><div> </div>
<div>The path of egress travel to an exit shall not pass through more than one adjacent story.</div> <div> </div> <div style="padding-left:30px;"><strong>Exception:</strong> The path of egress travel to an exit shall be permitted to pass through more than one adjacent story in any of the following:</div> <ol class="diff-list"><li class="normal">In Group R-1, R-2 or R-3 occupancies, exit access stairways and ramps connecting four stories or less serving and contained within an individual dwelling unit or sleeping unit or live/work unit.</li><li class="normal">Exit access stairways serving and contained within a Group R-3 congregate residence or a Group R-4 facility.</li><li class="normal">Exit access stairways and ramps in open parking garages that serve only the parking garage.</li><li class="normal new"><ins>Exit access stairways and ramps in buildings equipped throughout with an automatic sprinkler system in accordance with Section 903.3.1.1, where the area of the vertical opening between stories does not exceed twice the horizontal projected area of the stairway or ramp and the opening is protected by a draft curtain and closely spaced sprinklers in accordance with NFPA 13. In other than Group B and M occupancies, this provision is limited to openings that do not connect more than four stories.</ins></li><li class="normal new"><ins>Exit access stairways and ramps within an atrium complying with the provisions of Section 404.</ins></li><li class="normal">Exit access stairways and ramps serving open-air assembly seating complying with the exit access travel distance requirements of Section 1029.7.</li><li class="normal">Exit access stairways and ramps between the balcony, gallery or press box and the main assembly floor in occupancies such as theaters, places of religious worship, auditoriums and sports facilities.</li></ol><div> </div>

@ -0,0 +1,28 @@
<em>Corridors</em> shall be fire-resistance rated in accordance with Table 1020.1. The <em>corridor</em> walls required to be fire-resistance rated shall comply with Section 708 for <em>fire partitions</em>.<br /><br />In addition, corridors in buildings of Types IIB, IIIB, and VB construction and assigned Risk Categories III and IV in Table 1604.5, other than Group I, shall have a fire resistance rating of not less than 1 hour where such buildings are any of the following:<br /><br /><ol><li>Assigned a Seismic Design Category C or D in Table 1613.3.5(1).</li>
<li>Located in a flood hazard area established in accordance with Section 1612.3.</li>
<li>Located in a <em>hurricane-prone regions</em>.</li>
</ol><ul class="exception"><li><strong>Exceptions:</strong><ol><li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in an occupancy in Group E where each room that is used for instruction has not less than one door opening directly to the exterior and rooms for assembly purposes have not less than one-half of the required <em>means of egress</em> doors opening directly to the exterior. Exterior doors specified in this exception are required to be at ground level.</li>
<li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> contained within a <em>dwelling unit</em> or <em>sleeping unit</em> in an occupancy in Groups I-1 and R.</li>
<li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in <em>open parking garages</em>.</li>
<li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in an occupancy in Group B that is a space requiring only a single <em>means of egress</em> complying with Section 1006.2.</li>
<li><em>Corridors</em> adjacent to the <em>exterior walls</em> of buildings shall be permitted to have unprotected openings on unrated <em>exterior walls</em> where unrated walls are permitted by Table 602 and unprotected openings are permitted by Table 705.8.</li>
<em>Corridors</em> shall be fire-resistance rated in accordance with Table 1020.1 and where applicable in Section 1020.1.1. The <em>corridor</em> walls required to be fire-resistance rated shall comply with Section 708 for <em>fire partitions</em>.<br /><ul class="exception"><li><strong>Exceptions:</strong></li>
<ol><li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in an occupancy in Group E where each room that is used for instruction has not less than one door opening directly to the exterior and rooms for assembly purposes have not less than one-half of the required <em>means of egress</em> doors opening directly to the exterior. Exterior doors specified in this exception are required to be at ground level.</li>
<li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> contained within a <em>dwelling unit</em> or <em>sleeping unit</em> in an occupancy in Groups I-1 and R.</li>
<li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in <em>open parking garages</em>.</li>
<li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in an occupancy in Group B that is a space requiring only a single <em>means of egress</em> complying with Section 1006.2.</li>
<li><em>Corridors</em> adjacent to the <em>exterior walls</em> of buildings shall be permitted to have unprotected openings on unrated <em>exterior walls</em> where unrated walls are permitted by Table 602 and unprotected openings are permitted by Table 705.8.</li>
<em>Corridors</em> shall be fire-resistance rated in accordance with Table 1020.1<ins class="diffins"> and where applicable in Section 1020.1.1</ins>. The <em>corridor</em> walls required to be fire-resistance rated shall comply with Section 708 for <em>fire partitions</em>.<br /><br / class="diffmod"><del class="diffdel">In addition, corridors in buildings of Types IIB, IIIB, and VB construction and assigned Risk Categories III and IV in Table 1604.5, other than Group I, shall have a fire resistance rating of not less than 1 hour where such buildings are any of the following:</del><br / class="diffmod"><br /><ol><li><del class="diffdel">Assigned a Seismic Design Category C or D in Table 1613.3.5(1).</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Located in a flood hazard area established in accordance with Section 1612.3.</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Located in a </del><em class="diffmod"><del class="diffdel">hurricane-prone regions</del></em><del class="diffdel">.</del></li><del class="diffdel"> </del></ol><ul class="exception"><li><strong>Exceptions:</strong></li><ins class="diffins"> </ins><li class="diffmod"><ins class="diffins"> </ins><ol><li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in an occupancy in Group E where each room that is used for instruction has not less than one door opening directly to the exterior and rooms for assembly purposes have not less than one-half of the required <em>means of egress</em> doors opening directly to the exterior. 
Exterior doors specified in this exception are required to be at ground level.</li> <li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> contained within a <em>dwelling unit</em> or <em>sleeping unit</em> in an occupancy in Groups I-1 and R.</li> <li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in <em>open parking garages</em>.</li> <li>A <em>fire-resistance rating</em> is not required for <em>corridors</em> in an occupancy in Group B that is a space requiring only a single <em>means of egress</em> complying with Section 1006.2.</li> <li><em>Corridors</em> adjacent to the <em>exterior walls</em> of buildings shall be permitted to have unprotected openings on unrated <em>exterior walls</em> where unrated walls are permitted by Table 602 and unprotected openings are permitted by Table 705.8.</li> </ol></li> </ul>

File diff suppressed because one or more lines are too long

@ -0,0 +1,42 @@
<p>Return air openings for heating, ventilation and air-conditioning systems shall comply with all of the following:</p>
<ol><li>Openings shall not be located less than 10 feet (3048 mm) measured in any direction from an open combustion chamber or draft hood of another appliance located in the same room or space.</li>
<li>Return air shall not be taken from a hazardous or insanitary location or a refrigeration room as defined in this code.</li>
<li>The amount of return air taken from any room or space shall be not greater than the flow rate of supply air delivered to such room or space.</li>
<li>Return and transfer openings shall be sized in accordance with the appliance or equipment manufacturer's installation instructions, ACCA Manual D or the design of the registered design professional.</li>
<li>Return air taken from one dwelling unit shall not be discharged into another dwelling unit.</li>
<li>Taking return air from a crawl space shall not be accomplished through a direct connection to the return side of a forced air furnace. Transfer openings in the crawl space enclosure shall not be prohibited.</li>
<li>Return air shall not be taken from a closet, bathroom, toilet room, kitchen, garage, boiler room, furnace room or unconditioned attic.
<ul class="exception"><li><strong>Exceptions:</strong>
<ol><li>Taking return air from a kitchen is not prohibited where such return air openings serve the kitchen and are located not less than 10 feet (3048 mm) from the cooking appliances.</li>
<li>Dedicated forced air systems serving only the garage shall not be prohibited from obtaining return air from the garage</li>
<li>Return air shall not be taken from indoor swimming pool enclosures and associated deck areas.
<ul class="exception"><li><strong>Exceptions:</strong>
<ol><li>Where the air from such spaces is dehumidified in accordance with Sections 403.2.1 Item #2.</li>
<li>Dedicated HVAC systems serving only such spaces.</li>
<p>Return air openings for heating, ventilation and air-conditioning systems shall comply with all of the following:</p>
<ol><li>Openings shall not be located less than 10 feet (3048 mm) measured in any direction from an open combustion chamber or draft hood of another appliance located in the same room or space.</li>
<li>Return air shall not be taken from a hazardous or insanitary location or a refrigeration room as defined in this code.</li>
<li>The amount of return air taken from any room or space shall be not greater than the flow rate of supply air delivered to such room or space.</li>
<li>Return and transfer openings shall be sized in accordance with the appliance or equipment manufacturer's installation instructions, ACCA Manual D or the design of the registered design professional.</li>
<li>Return air taken from one dwelling unit shall not be discharged into another dwelling unit.</li>
<li>Taking return air from a crawl space shall not be accomplished through a direct connection to the return side of a forced air furnace. Transfer openings in the crawl space enclosure shall not be prohibited.</li>
<li>Return air shall not be taken from a closet, bathroom, toilet room, kitchen, garage, boiler room, furnace room, indoor swimming pool enclosure and associated deck area, or unconditioned attic.</li>
</ol><ul class="exception"><li><strong>Exceptions:</strong></li>
</ul><ol><li>Taking return air from a kitchen is not prohibited where such return air openings serve the kitchen and are located not less than 10 feet (3048 mm) from the cooking appliances.</li>
<li>Dedicated forced air systems serving only the garage shall not be prohibited from obtaining return air from the garage</li>
<li>Dedicated HVAC systems serving indoor swimming pool enclosures and associated deck areas shall not be prohibited from obtaining return air from such swimming pool enclosures and associated deck areas</li>
<p>Return air openings for heating, ventilation and air-conditioning systems shall comply with all of the following:</p> <ol class="diff-list"><li class="normal">Openings shall not be located less than 10 feet (3048 mm) measured in any direction from an open combustion chamber or draft hood of another appliance located in the same room or space.</li><li class="normal">Return air shall not be taken from a hazardous or insanitary location or a refrigeration room as defined in this code.</li><li class="normal">The amount of return air taken from any room or space shall be not greater than the flow rate of supply air delivered to such room or space.</li><li class="normal">Return and transfer openings shall be sized in accordance with the appliance or equipment manufacturer's installation instructions, ACCA Manual D or the design of the registered design professional.</li><li class="normal">Return air taken from one dwelling unit shall not be discharged into another dwelling unit.</li><li class="normal">Taking return air from a crawl space shall not be accomplished through a direct connection to the return side of a forced air furnace. 
Transfer openings in the crawl space enclosure shall not be prohibited.</li><li class="normal">Return air shall not be taken from a closet, bathroom, toilet room, kitchen, garage, boiler room, furnace room<ins class="diffins">, indoor swimming pool enclosure and associated deck area,</ins> or unconditioned attic.<del class="diffdel"> </del><ul class="diffmod exception"><li><strong><del class="diffdel">Exceptions:</del></strong><del class="diffdel"> </del><ol class="diffmod"><li><del class="diffdel">Taking return air from a kitchen is not prohibited where such return air openings serve the kitchen and are located not less than 10 feet (3048 mm) from the cooking appliances.</del></li><del class="diffdel"> </del><li class="diffmod"><del class="diffdel">Dedicated forced air systems serving only the garage shall not be prohibited from obtaining return air from the garage</del></li><del class="diffdel"> </del></ol></li><del class="diffdel"> </del></ul></li><li class="removed"><del>Return air shall not be taken from indoor swimming pool enclosures and associated deck areas. 
<ul class="exception"><li><strong>Exceptions:</strong> <ol><li>Where the air from such spaces is dehumidified in accordance with Sections 403.2.1 Item #2.</li> <li>Dedicated HVAC systems serving only such spaces.</li> </ol></li> </ul></del></li></ol><ul class="diffmod exception"><li><strong><ins class="diffins">Exceptions:</ins></strong></li><ins class="diffins"> </ins></ul><ol><li><ins class="diffins">Taking return air from a kitchen is not prohibited where such return air openings serve the kitchen and are located not less than 10 feet (3048 mm) from the cooking appliances.</ins></li><ins class="diffins"> </ins><li class="diffmod"><ins class="diffins">Dedicated forced air systems serving only the garage shall not be prohibited from obtaining return air from the garage</ins></li><ins class="diffins"> </ins><li class="diffmod"><ins class="diffins">Dedicated HVAC systems serving indoor swimming pool enclosures and associated deck areas shall not be prohibited from obtaining return air from such swimming pool enclosures and associated deck areas</ins></li><ins class="diffins"> </ins></ol>

@ -0,0 +1,11 @@
<p>The manufacturer of PEX tubing shall have marked the outside of the tubing with the thermoplastic material designation code in accordance with ASTM F876. The designation code shall consist of the abbreviation "PEX" followed by four digits. The first digit shall represent a chlorine resistance rating as established by testing in accordance with ASTM F876.</p>
<p>For PEX tubing complying with ASTM F876, the first digit folllowing "PEX" as marked on the tubing exterior shall be an indicator of the maximum service temperatures for which the PEX tubing can be used. The maximum service temperatures shall be as follows:<br /><br />1. Digit “0”: 73⁰F (23⁰C). <br /><br />2. Digit “1”: For not more that 25% of the time, greater than 73⁰F (23⁰C) and not exceeding140⁰F (60⁰C). For the remainder of the time, not greater than 73⁰F (23⁰C). <br /><br />3. Digit “3”: For not more that 50% of the time, greater than 73⁰F (23⁰C) and not exceeding 140⁰F (60⁰C). For the remainder of the time, not greater than 73⁰F (23⁰C). <br /><br />4. Digit “5”: 140⁰F (60⁰C). <br /><br /><br /></p>
<p><del class="diffmod">The manufacturer of</del><ins class="diffmod">For</ins> PEX tubing <del class="diffmod">shall have marked the outside of the tubing with the thermoplastic material designation code in accordance</del><ins class="diffmod">complying</ins> with ASTM F876<del class="diffmod">. The designation code</del><ins class="diffmod">, the first digit folllowing "PEX" as marked on the tubing exterior</ins> shall <del class="diffmod">consist</del><ins class="diffmod">be an indicator</ins> of the <del class="diffmod">abbreviation "</del><ins class="diffmod">maximum service temperatures for which the </ins>PEX<del class="diffmod">" followed by four digits</del><ins class="diffmod"> tubing can be used</ins>. The <del class="diffmod">first digit</del><ins class="diffmod">maximum service temperatures</ins> shall <del class="diffmod">represent a chlorine resistance rating</del><ins class="diffmod">be</ins> as <del class="diffmod">established by testing in accordance with ASTM F876</del><ins class="diffmod">follows:</ins><br / class="diffmod"><br /><ins class="diffmod">1</ins>.<ins class="diffins"> Digit “0”: 73⁰F (23⁰C). </ins><br / class="diffmod"><br /><ins class="diffins">2. Digit “1”: For not more that 25% of the time, greater than 73⁰F (23⁰C) and not exceeding140⁰F (60⁰C). For the remainder of the time, not greater than 73⁰F (23⁰C). </ins><br / class="diffmod"><br /><ins class="diffins">3. Digit “3”: For not more that 50% of the time, greater than 73⁰F (23⁰C) and not exceeding 140⁰F (60⁰C). For the remainder of the time, not greater than 73⁰F (23⁰C). </ins><br / class="diffmod"><br /><ins class="diffins">4. Digit “5”: 140⁰F (60⁰C). </ins><br / class="diffmod"><br /><br /></p>

@ -0,0 +1,11 @@
<i>Existing buildings </i>that undergo a change of group or occupancy shall comply with this section.<ul class="exception"><li><b>Exception: </b>Type B dwelling or sleeping units required by Section 1107 of the <i>International Building Code </i>are not required to be provided in <i>existing buildings </i>and facilities undergoing a <i>change of occupancy </i>in conjunction with <i>alterations </i>where the <i>work area </i>is 50 percent or less of the aggregate area of the building.</li></ul>
<em>Where existing buildings </em>undergo a change of group or occupancy any alterations shall comply with Sections 410.6, 410.7 and 410.8 as applicable.
<i class="diffmod"><del class="diffmod">Existing buildings </del></i><del class="diffmod">that </del><em class="diffmod"><ins class="diffmod">Where existing buildings </ins></em>undergo a change of group or occupancy <ins class="diffins">any alterations </ins>shall comply with <del class="diffmod">this section</del><ins class="diffmod">Sections 410.6, 410.7 and 410.8 as applicable</ins>.<ul class="diffmod exception"><li><b><del class="diffdel">Exception: </del></b><del class="diffdel">Type B dwelling or sleeping units required by Section 1107 of the </del><i class="diffmod"><del class="diffdel">International Building Code </del></i><del class="diffdel">are not required to be provided in </del><i class="diffmod"><del class="diffdel">existing buildings </del></i><del class="diffdel">and facilities undergoing a </del><i class="diffmod"><del class="diffdel">change of occupancy </del></i><del class="diffdel">in conjunction with </del><i class="diffmod"><del class="diffdel">alterations </del></i><del class="diffdel">where the </del><i class="diffmod"><del class="diffdel">work area </del></i><del class="diffdel">is 50 percent or less of the aggregate area of the building.</del></li></ul>

@ -0,0 +1,413 @@
* This file is part of Composer.
* (c) Nils Adermann <>
* Jordi Boggiano <>
* For the full copyright and license information, please view the LICENSE
* file that was distributed with this source code.
namespace Composer\Autoload;
* ClassLoader implements a PSR-0, PSR-4 and classmap class loader.
* $loader = new \Composer\Autoload\ClassLoader();
* // register classes with namespaces
* $loader->add('Symfony\Component', __DIR__.'/component');
* $loader->add('Symfony', __DIR__.'/framework');
* // activate the autoloader
* $loader->register();
* // to enable searching the include path (e.g. for PEAR packages)
* $loader->setUseIncludePath(true);
* In this example, if you try to use a class in the Symfony\Component
* namespace or one of its children (Symfony\Component\Console for instance),
* the autoloader will first look for the class under the component/
* directory, and it will then fall back to the framework/ directory if not
* found before giving up.
* This class is loosely based on the Symfony UniversalClassLoader.
* @author Fabien Potencier <>
* @author Jordi Boggiano <>
* @see
* @see
class ClassLoader
// PSR-4
// NOTE(review): no reader or writer of this property is visible in this chunk
// (presumably maintained by addPsr4()) — confirm its key/value layout there.
private $prefixLengthsPsr4 = array();
// Returned unchanged by getPrefixesPsr4().
private $prefixDirsPsr4 = array();
// Directories registered through addPsr4() with an empty prefix (root namespace);
// returned unchanged by getFallbackDirsPsr4().
private $fallbackDirsPsr4 = array();
// PSR-0
// Two-level map maintained by add(): first character of the prefix => prefix =>
// list of root directories.
private $prefixesPsr0 = array();
// Directories registered through add() with an empty prefix; returned unchanged
// by getFallbackDirs().
private $fallbackDirsPsr0 = array();
// NOTE(review): presumably toggled by setUseIncludePath(), which the class usage
// notes mention; the setter itself is not visible in this chunk.
private $useIncludePath = false;
// Class name => file name map, extended by addClassMap().
private $classMap = array();
// NOTE(review): no reader or writer of this flag is visible in this chunk.
private $classMapAuthoritative = false;
public function getPrefixes()
if (!empty($this->prefixesPsr0)) {
return call_user_func_array('array_merge', $this->prefixesPsr0);
return array();
public function getPrefixesPsr4()
return $this->prefixDirsPsr4;
public function getFallbackDirs()
return $this->fallbackDirsPsr0;
public function getFallbackDirsPsr4()
return $this->fallbackDirsPsr4;
public function getClassMap()
return $this->classMap;
* @param array $classMap Class to filename map
public function addClassMap(array $classMap)
if ($this->classMap) {
$this->classMap = array_merge($this->classMap, $classMap);
} else {
$this->classMap = $classMap;
* Registers a set of PSR-0 directories for a given prefix, either
* appending or prepending to the ones previously set for this prefix.
* @param string $prefix The prefix
* @param array|string $paths The PSR-0 root directories
* @param bool $prepend Whether to prepend the directories
public function add($prefix, $paths, $prepend = false)
if (!$prefix) {
if ($prepend) {
$this->fallbackDirsPsr0 = array_merge(
(array) $paths,
} else {
$this->fallbackDirsPsr0 = array_merge(
(array) $paths
$first = $prefix[0];
if (!isset($this->prefixesPsr0[$first][$prefix])) {
$this->prefixesPsr0[$first][$prefix] = (array) $paths;
if ($prepend) {
$this->prefixesPsr0[$first][$prefix] = array_merge(
(array) $paths,
} else {
$this->prefixesPsr0[$first][$prefix] = array_merge(
(array) $paths
* Registers a set of PSR-4 directories for a given namespace, either
* appending or prepending to the ones previously set for this namespace.
* @param string $prefix The prefix/namespace, with trailing '\\'
* @param array|string $paths The PSR-4 base directories
* @param bool $prepend Whether to prepend the directories
* @throws \InvalidArgumentException
public function addPsr4($prefix, $paths, $prepend = false)
if (!$prefix) {
// Register directories for the root namespace.
if ($prepend) {
$this->fallbackDirsPsr4 = array_merge(
(array) $paths,
} else {
$this->fallbackDirsPsr4 = array_merge(
(array) $paths
} elseif (!isset($this->prefixDirsPsr4[$prefix])) {
// Register directories for a new namespace.
$length = strlen($prefix);
if ('\\' !== $prefix[$length - 1]) {
throw new \InvalidArgumentException("A non-empty PSR-4 prefix must end with a namespace separator.");
$this->prefixLengthsPsr4[$prefix[0]][$prefix] = $length;
$this->prefixDirsPsr4[$prefix] = (array) $paths;
} elseif ($prepend) {
// Prepend directories for an already registered namespace.
$this->prefixDirsPsr4[$prefix] = array_merge(
(array) $paths,
} else {
// Append directories for an already registered namespace.
$this->prefixDirsPsr4[$prefix] = array_merge(
(array) $paths
* Registers a set of PSR-0 directories for a given prefix,
* replacing any others previously set for this prefix.
* @param string $prefix The prefix
* @param array|string $paths The PSR-0 base directories
public function set($prefix, $paths)
if (!$prefix) {
$this->fallbackDirsPsr0 = (array) $paths;
} else {
$this->prefixesPsr0[$prefix[0]][$prefix] = (array) $paths;
* Registers a set of PSR-4 directories for a given namespace,
* replacing any others previously set for this namespace.
* @param string $prefix The prefix/namespace, with trailing '\\'
* @param array|string $paths The PSR-4 base directories
* @throws \InvalidArgumentException
public function setPsr4($prefix, $paths)
if (!$prefix) {
$this->fallbackDirsPsr4 = (array) $paths;
} else {
$length = strlen($prefix);
if ('\\' !== $prefix[$length - 1]) {
throw new \InvalidArgumentException("A non-empty PSR-4 prefix must end with a namespace separator.");
$this->prefixLengthsPsr4[$prefix[0]][$prefix] = $length;
$this->prefixDirsPsr4[$prefix] = (array) $paths;
* Turns on searching the include path for class files.
* @param bool $useIncludePath
public function setUseIncludePath($useIncludePath)
$this->useIncludePath = $useIncludePath;
* Can be used to check if the autoloader uses the include path to check
* for classes.
* @return bool
public function getUseIncludePath()
return $this->useIncludePath;
* Turns off searching the prefix and fallback directories for classes
* that have not been registered with the class map.
* @param bool $classMapAuthoritative
public function setClassMapAuthoritative($classMapAuthoritative)
$this->classMapAuthoritative = $classMapAuthoritative;
* Should class lookup fail if not found in the current class map?
* @return bool
public function isClassMapAuthoritative()
return $this->classMapAuthoritative;
* Registers this instance as an autoloader.
* @param bool $prepend Whether to prepend the autoloader or not
public function register($prepend = false)
spl_autoload_register(array($this, 'loadClass'), true, $prepend);
* Unregisters this instance as an autoloader.
public function unregister()
spl_autoload_unregister(array($this, 'loadClass'));
* Loads the given class or interface.
* @param string $class The name of the class
* @return bool|null True if loaded, null otherwise
public function loadClass($class)
if ($file = $this->findFile($class)) {
return true;
* Finds the path to the file where the class is defined.
* @param string $class The name of the class
* @return string|false The path if found, false otherwise
public function findFile($class)
// work around for PHP 5.3.0 - 5.3.2
if ('\\' == $class[0]) {
$class = substr($class, 1);
// class map lookup
if (isset($this->classMap[$class])) {
return $this->classMap[$class];
if ($this->classMapAuthoritative) {
return false;
$file = $this->findFileWithExtension($class, '.php');
// Search for Hack files if we are running on HHVM
if ($file === null && defined('HHVM_VERSION')) {
$file = $this->findFileWithExtension($class, '.hh');
if ($file === null) {
// Remember that this class does not exist.
return $this->classMap[$class] = false;
return $file;
private function findFileWithExtension($class, $ext)
// PSR-4 lookup
$logicalPathPsr4 = strtr($class, '\\', DIRECTORY_SEPARATOR) . $ext;
$first = $class[0];
if (isset($this->prefixLengthsPsr4[$first])) {
foreach ($this->prefixLengthsPsr4[$first] as $prefix => $length) {
if (0 === strpos($class, $prefix)) {
foreach ($this->prefixDirsPsr4[$prefix] as $dir) {
if (file_exists($file = $dir . DIRECTORY_SEPARATOR . substr($logicalPathPsr4, $length))) {
return $file;
// PSR-4 fallback dirs
foreach ($this->fallbackDirsPsr4 as $dir) {
if (file_exists($file = $dir . DIRECTORY_SEPARATOR . $logicalPathPsr4)) {
return $file;
// PSR-0 lookup
if (false !== $pos = strrpos($class, '\\')) {
// namespaced class name
$logicalPathPsr0 = substr($logicalPathPsr4, 0, $pos + 1)
. strtr(substr($logicalPathPsr4, $pos + 1), '_', DIRECTORY_SEPARATOR);
} else {
// PEAR-like class name
$logicalPathPsr0 = strtr($class, '_', DIRECTORY_SEPARATOR) . $ext;
if (isset($this->prefixesPsr0[$first])) {
foreach ($this->prefixesPsr0[$first] as $prefix => $dirs) {
if (0 === strpos($class, $prefix)) {
foreach ($dirs as $dir) {
if (file_exists($file = $dir . DIRECTORY_SEPARATOR . $logicalPathPsr0)) {
return $file;
// PSR-0 fallback dirs
foreach ($this->fallbackDirsPsr0 as $dir) {
if (file_exists($file = $dir . DIRECTORY_SEPARATOR . $logicalPathPsr0)) {
return $file;
// PSR-0 include paths.
if ($this->useIncludePath && $file = stream_resolve_include_path($logicalPathPsr0)) {
return $file;
/**
 * Includes a file from function scope.
 *
 * Because the include runs inside a plain function rather than a method,
 * the included file has no $this or self available to it.
 *
 * @param string $file Path of the file to include
 */
function includeFile($file)
{
    include $file;
}

@ -0,0 +1,21 @@
Copyright (c) 2016 Nils Adermann, Jordi Boggiano
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is furnished
to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

@ -0,0 +1,9 @@
// autoload_classmap.php @generated by Composer
// Returns the class map that autoload_real.php loads with `require`.
// No entries are visible in this view of the file.
// Directory two levels above this file.
$vendorDir = dirname(dirname(__FILE__));
// Parent directory of $vendorDir.
$baseDir = dirname($vendorDir);
return array(

@ -0,0 +1,10 @@
// autoload_files.php @generated by Composer
// Returns a map of file identifier => file path; autoload_real.php passes
// each pair to its composerRequire helper.
// Directory two levels above this file.
$vendorDir = dirname(dirname(__FILE__));
// Parent directory of $vendorDir.
$baseDir = dirname($vendorDir);
return array(
'2cffec82183ee1cea088009cef9a6fc3' => $vendorDir . '/ezyang/htmlpurifier/library/HTMLPurifier.composer.php',

@ -0,0 +1,11 @@
// autoload_namespaces.php @generated by Composer
// Returns a map of prefix => directories; autoload_real.php feeds each
// pair to ClassLoader::set(), i.e. the PSR-0 registrations.
// Directory two levels above this file.
$vendorDir = dirname(dirname(__FILE__));
// Parent directory of $vendorDir.
$baseDir = dirname($vendorDir);
return array(
'HTMLPurifier' => array($vendorDir . '/ezyang/htmlpurifier/library'),
'Caxy\\HtmlDiff' => array($vendorDir . '/caxy/php-htmldiff/lib'),

@ -0,0 +1,9 @@
// autoload_psr4.php @generated by Composer
// Returns a map of namespace => directories; autoload_real.php feeds each
// pair to ClassLoader::setPsr4(). No entries are visible in this view.
// Directory two levels above this file.
$vendorDir = dirname(dirname(__FILE__));
// Parent directory of $vendorDir.
$baseDir = dirname($vendorDir);
return array(

@ -0,0 +1,59 @@
// autoload_real.php @generated by Composer
/**
 * Bootstraps the Composer class loader for this vendor directory.
 */
class ComposerAutoloaderInit8a728e750e2d17f1173f31bda205adec
{
    // Loader built by the first getLoader() call; null until then.
    private static $loader;

    /**
     * Temporary autoloader that only knows how to load the ClassLoader class.
     *
     * @param string $class Class name being autoloaded
     */
    public static function loadClassLoader($class)
    {
        if ('Composer\Autoload\ClassLoader' === $class) {
            require __DIR__ . '/ClassLoader.php';
        }
    }

    /**
     * Builds, configures and registers the class loader on first call and
     * returns the same instance on every later call.
     *
     * @return \Composer\Autoload\ClassLoader
     */
    public static function getLoader()
    {
        if (null !== self::$loader) {
            return self::$loader;
        }

        // The bootstrap autoloader is only needed while ClassLoader itself
        // is instantiated, so it is removed again right afterwards.
        spl_autoload_register(array('ComposerAutoloaderInit8a728e750e2d17f1173f31bda205adec', 'loadClassLoader'), true, true);
        self::$loader = $loader = new \Composer\Autoload\ClassLoader();
        spl_autoload_unregister(array('ComposerAutoloaderInit8a728e750e2d17f1173f31bda205adec', 'loadClassLoader'));

        $map = require __DIR__ . '/autoload_namespaces.php';
        foreach ($map as $namespace => $path) {
            $loader->set($namespace, $path);
        }

        $map = require __DIR__ . '/autoload_psr4.php';
        foreach ($map as $namespace => $path) {
            $loader->setPsr4($namespace, $path);
        }

        $classMap = require __DIR__ . '/autoload_classmap.php';
        if ($classMap) {
            // Hand the loaded map to the loader; otherwise it is never used.
            $loader->addClassMap($classMap);
        }

        // Register before requiring the "files" entries so that those files
        // can already rely on autoloading.
        $loader->register(true);

        $includeFiles = require __DIR__ . '/autoload_files.php';
        foreach ($includeFiles as $fileIdentifier => $file) {
            composerRequire8a728e750e2d17f1173f31bda205adec($fileIdentifier, $file);
        }

        return $loader;
    }
}
/**
 * Requires a file unless the same identifier was already loaded.
 *
 * Loaded identifiers are tracked in $GLOBALS['__composer_autoload_files'].
 *
 * @param string $fileIdentifier Key identifying the file in the global registry
 * @param string $file           Path of the file to require
 */
function composerRequire8a728e750e2d17f1173f31bda205adec($fileIdentifier, $file)
{
    // Guard clause: nothing to do when this identifier is already marked.
    if (!empty($GLOBALS['__composer_autoload_files'][$fileIdentifier])) {
        return;
    }

    require $file;

    $GLOBALS['__composer_autoload_files'][$fileIdentifier] = true;
}

@ -0,0 +1,105 @@
"name": "ezyang/htmlpurifier",
"version": "v4.7.0",
"version_normalized": "",
"source": {
"type": "git",
"url": "",
"reference": "ae1828d955112356f7677c465f94f7deb7d27a40"
"dist": {
"type": "zip",
"url": "",
"reference": "ae1828d955112356f7677c465f94f7deb7d27a40",
"shasum": ""
"require": {
"php": ">=5.2"
"time": "2015-08-05 01:03:42",
"type": "library",
"installation-source": "dist",
"autoload": {
"psr-0": {
"HTMLPurifier": "library/"
"files": [
"notification-url": "",
"license": [
"authors": [
"name": "Edward Z. Yang",
"email": "",
"homepage": ""
"description": "Standards compliant HTML filter written in PHP",
"homepage": "",
"keywords": [
"name": "caxy/php-htmldiff",
"version": "v0.1.1",
"version_normalized": "",
"source": {
"type": "git",
"url": "",
"reference": "65b1794a9a7ce790712a2ab3419f3d5600c70bb8"
"dist": {
"type": "zip",
"url": "",
"reference": "65b1794a9a7ce790712a2ab3419f3d5600c70bb8",
"shasum": ""
"require": {
"ezyang/htmlpurifier": "^4.7",
"php": ">=5.3.3"
"require-dev": {
"doctrine/cache": "~1.0",
"phpunit/phpunit": "~4.8"
"suggest": {
"doctrine/cache": "Used for caching the calculated diffs using a Doctrine Cache Provider"
"time": "2016-03-16 15:51:25",
"type": "library",
"extra": {
"branch-alias": {
"dev-master": "0.1.x-dev"
"installation-source": "dist",
"autoload": {
"psr-0": {
"Caxy\\HtmlDiff": "lib/"
"notification-url": "",
"license": [
"authors": [
"name": "Josh Schroeder",
"email": "",
"homepage": ""
"description": "A library for comparing two HTML files/snippets and highlighting the differences using simple HTML.",
"homepage": "",
"keywords": [

@ -0,0 +1,9 @@
Almost everything written by Edward Z. Yang (Ambush Commander). Lots of thanks
to the DevNetwork Community for their help (see docs/ref-devnetwork.html for
more details), Feyd especially (namely IPv6 and optimization). Thanks to RSnake
for letting me package his fantastic XSS cheatsheet for a smoketest.
vim: et sw=4 sts=4

@ -0,0 +1,374 @@
How to install HTML Purifier
HTML Purifier is designed to run out of the box, so actually using the
library is extremely easy. (Although... if you were looking for a
step-by-step installation GUI, you've downloaded the wrong software!)
While the impatient can get going immediately with some of the sample
code at the bottom of this library, it's well worth reading this entire
document--most of the other documentation assumes that you are familiar
with these contents.
1. Compatibility
HTML Purifier is PHP 5 only, and is actively tested from PHP 5.0.5 and
up. It has no core dependencies with other libraries. PHP
4 support was deprecated on December 31, 2007 with HTML Purifier 3.0.0.
HTML Purifier is not compatible with zend.ze1_compatibility_mode.
These optional extensions can enhance the capabilities of HTML Purifier:
* iconv : Converts text to and from non-UTF-8 encodings
* bcmath : Used for unit conversion and imagecrash protection
* tidy : Used for pretty-printing HTML
These optional libraries can enhance the capabilities of HTML Purifier:
* CSSTidy : Clean CSS stylesheets using %Core.ExtractStyleBlocks
* Net_IDNA2 (PEAR) : IRI support using %Core.EnableIDNA
2. Reconnaissance
A big plus of HTML Purifier is its inerrant support of standards, so
your web-pages should be standards-compliant. (They should also use
semantic markup, but that's another issue altogether, one HTML Purifier
cannot fix without reading your mind.)
HTML Purifier can process these doctypes:
* XHTML 1.0 Transitional (default)
* XHTML 1.0 Strict
* HTML 4.01 Transitional
* HTML 4.01 Strict
* XHTML 1.1
...and these character encodings:
* UTF-8 (default)
* Any encoding iconv supports (with crippled internationalization support)
These defaults reflect what my choices would be if I were authoring an
HTML document, however, what you choose depends on the nature of your
codebase. If you don't know what doctype you are using, you can determine
the doctype from this identifier at the top of your source code:
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
...and the character encoding from this code:
<meta http-equiv="Content-type" content="text/html;charset=ENCODING">
If the character encoding declaration is missing, STOP NOW, and
read 'docs/enduser-utf8.html' (web accessible at
http://htmlpurifier.org/docs/enduser-utf8.html). In fact, even if it is
present, read this document anyway, as many websites specify their
document's character encoding incorrectly.
3. Including the library
The procedure is quite simple:
require_once '/path/to/library/HTMLPurifier.auto.php';
This will setup an autoloader, so the library's files are only included
when you use them.
Only the contents in the library/ folder are necessary, so you can remove
everything else when using HTML Purifier in a production environment.
If you installed HTML Purifier via PEAR, all you need to do is:
require_once 'HTMLPurifier.auto.php';
Please note that the usual PEAR practice of including just the classes you
want will not work with HTML Purifier's autoloading scheme.
Advanced users, read on; other users can skip to section 4.
Autoload compatibility
HTML Purifier attempts to be as smart as possible when registering an
autoloader, but there are some cases where you will need to change
your own code to accommodate HTML Purifier. These are those cases:
Because spl_autoload_register() doesn't exist in early versions
of PHP 5, HTML Purifier has no way of adding itself to the autoload
stack. Modify your __autoload function to test
HTMLPurifier_Bootstrap::autoload($class) first.
For example, suppose your autoload function looks like this:
function __autoload($class) {
require str_replace('_', '/', $class) . '.php';
return true;
A modified version with HTML Purifier would look like this:
function __autoload($class) {
if (HTMLPurifier_Bootstrap::autoload($class)) return true;
require str_replace('_', '/', $class) . '.php';
return true;
Note that there *is* some custom behavior in our autoloader; the
original autoloader in our example would work for 99% of the time,
but would fail when including language files.
spl_autoload_register() has the curious behavior of disabling
the existing __autoload() handler. Users need to explicitly
spl_autoload_register('__autoload'). Because we use SPL when it
is available, __autoload() will ALWAYS be disabled. If __autoload()
is declared before HTML Purifier is loaded, this is not a problem:
HTML Purifier will register the function for you. But if it is
declared afterwards, it will mysteriously not work. This
snippet of code (after your autoloader is defined) will fix it:
spl_autoload_register('__autoload');
Users should also be on guard if they use a version of PHP previous
to 5.1.2 without an autoloader--HTML Purifier will define __autoload()
for you, which can collide with an autoloader that was added by *you*
later.
For better performance
Opcode caches, which greatly speed up PHP initialization for scripts
with large amounts of code (HTML Purifier included), don't like
autoloaders. We offer an include file that includes all of HTML Purifier's
files in one go in an opcode cache friendly manner:
// If /path/to/library isn't already in your include path, uncomment
// the below line:
// require '/path/to/library/HTMLPurifier.path.php';
require 'HTMLPurifier.includes.php';
Optional components still need to be included--you'll know if you try to
use a feature and you get a "class doesn't exist" error! The autoloader
can be used in conjunction with this approach to catch classes that are
missing. Simply add this afterwards:
require 'HTMLPurifier.autoload.php';
Standalone version
HTML Purifier has a standalone distribution; you can also generate
a standalone file from the full version by running the script
maintenance/generate-standalone.php . The standalone version has the
benefit of having most of its code in one file, so parsing is much
faster and the library is easier to manage.
If HTMLPurifier.standalone.php exists in the library directory, you
can use it like this:
require '/path/to/HTMLPurifier.standalone.php';
This is equivalent to including HTMLPurifier.includes.php, except that
the contents of standalone/ will be added to your path. To override this
behavior, specify a new HTMLPURIFIER_PREFIX where standalone files can
be found (usually, this will be one directory up, the "true" library
directory in full distributions). Don't forget to set your path too!
The autoloader can be added to the end to ensure the classes are
loaded when necessary; otherwise you can manually include them.
To use the autoloader, use this:
require 'HTMLPurifier.autoload.php';
For advanced users
------------------
HTMLPurifier.auto.php performs a number of operations that can be done
individually. These are:
HTMLPurifier.path.php
Puts /path/to/library in the include path. For high performance,
this should be done in php.ini.
HTMLPurifier.autoload.php
Registers our autoload handler HTMLPurifier_Bootstrap::autoload($class).
You can do these operations by yourself--in fact, you must modify your own
autoload handler if you are using a version of PHP earlier than PHP 5.1.2
(See "Autoload compatibility" above).
4. Configuration
HTML Purifier is designed to run out-of-the-box, but occasionally HTML
Purifier needs to be told what to do. If you answer no to any of these
questions, read on; otherwise, you can skip to the next section (or, if you're
into configuring things just for the heck of it, skip to 4.3).
* Am I using UTF-8?
* Am I using XHTML 1.0 Transitional?
If you answered no to any of these questions, instantiate a configuration
object and read on:
$config = HTMLPurifier_Config::createDefault();
4.1. Setting a different character encoding
You really shouldn't use any other encoding except UTF-8, especially if you
plan to support multilingual websites (read section three for more details).
However, switching to UTF-8 is not always immediately feasible, so we can
adapt.
HTML Purifier uses iconv to support other character encodings, as such,
any encoding that iconv supports <http://www.gnu.org/software/libiconv/>
HTML Purifier supports with this code:
$config->set('Core.Encoding', /* put your encoding here */);
An example usage for Latin-1 websites (the most common encoding for English
websites):
$config->set('Core.Encoding', 'ISO-8859-1');
Note that HTML Purifier's support for non-Unicode encodings is crippled by the
fact that any character not supported by that encoding will be silently
dropped, EVEN if it is ampersand escaped. If you want to work around
this, you are welcome to read docs/enduser-utf8.html for a fix,
but please be cognizant of the issues the "solution" creates (for this
reason, I do not include the solution in this document).
4.2. Setting a different doctype
For those of you using HTML 4.01 Transitional, you can disable
XHTML output like this:
$config->set('HTML.Doctype', 'HTML 4.01 Transitional');
Other supported doctypes include:
* HTML 4.01 Strict
* HTML 4.01 Transitional
* XHTML 1.0 Strict
* XHTML 1.0 Transitional
* XHTML 1.1
4.3. Other settings
There are more configuration directives which can be read about
here: <http://htmlpurifier.org/live/configdoc/plain.html> They're a bit boring,
but they can help out for those of you who like to exert maximum control over
your code. Some of the more interesting ones are configurable at the
demo <http://htmlpurifier.org/demo.php> and are well worth looking into
for your own system.
For example, you can fine tune allowed elements and attributes, convert
relative URLs to absolute ones, and even autoparagraph input text! These
are, respectively, %HTML.Allowed, %URI.MakeAbsolute and %URI.Base, and
%AutoFormat.AutoParagraph. The %Namespace.Directive naming convention
translates to:
$config->set('Namespace.Directive', $value);
$config->set('HTML.Allowed', 'p,b,a[href],i');
$config->set('URI.Base', 'http://www.example.com');
$config->set('URI.MakeAbsolute', true);
$config->set('AutoFormat.AutoParagraph', true);
5. Caching
HTML Purifier generates some cache files (generally one or two) to speed up
its execution. For maximum performance, make sure that
library/HTMLPurifier/DefinitionCache/Serializer is writeable by the webserver.
If you are in the library/ folder of HTML Purifier, you can set the
appropriate permissions using:
chmod -R 0755 HTMLPurifier/DefinitionCache/Serializer
If the above command doesn't work, you may need to assign write permissions
to all. This may be necessary if your webserver runs as nobody, but is
not recommended since it means any other user can write files in the
directory. Use:
chmod -R 0777 HTMLPurifier/DefinitionCache/Serializer
You can also chmod files via your FTP client; this option
is usually accessible by right clicking the corresponding directory and
then selecting "chmod" or "file permissions".
Starting with 2.0.1, HTML Purifier will generate friendly error messages
that will tell you exactly what you have to chmod the directory to, if in doubt,
follow its advice.
If you are unable or unwilling to give write permissions to the cache
directory, you can either disable the cache (and suffer a performance
hit):
$config->set('Core.DefinitionCache', null);
Or move the cache directory somewhere else (no trailing slash):
$config->set('Cache.SerializerPath', '/home/user/absolute/path');
6. Using the code
The interface is mind-numbingly simple:
$purifier = new HTMLPurifier($config);
$clean_html = $purifier->purify( $dirty_html );
That's it! For more examples, check out docs/examples/ (they aren't very
different though). Also, docs/enduser-slow.html gives advice on what to
do if HTML Purifier is slowing down your application.
7. Quick install
First, make sure library/HTMLPurifier/DefinitionCache/Serializer is
writable by the webserver (see Section 5: Caching above for details).
If your website is in UTF-8 and XHTML Transitional, use this code:
require_once '/path/to/htmlpurifier/library/HTMLPurifier.auto.php';
$config = HTMLPurifier_Config::createDefault();
$purifier = new HTMLPurifier($config);
$clean_html = $purifier->purify($dirty_html);
If your website is in a different encoding or doctype, use this code:
require_once '/path/to/htmlpurifier/library/HTMLPurifier.auto.php';
$config = HTMLPurifier_Config::createDefault();
$config->set('Core.Encoding', 'ISO-8859-1'); // replace with your encoding
$config->set('HTML.Doctype', 'HTML 4.01 Transitional'); // replace with your doctype
$purifier = new HTMLPurifier($config);
$clean_html = $purifier->purify($dirty_html);
vim: et sw=4 sts=4

@ -0,0 +1,60 @@

Comment installer HTML Purifier
Attention : Ce document est encodé en UTF-8, si les lettres avec des accents
ne s'affichent pas, prenez un meilleur éditeur de texte.
L'installation de HTML Purifier est très simple, parce qu'il n'a pas besoin
de configuration. Pour les utilisateurs impatients, le code se trouve dans le
pied de page, mais je recommande de lire le document.
1. Compatibilité
HTML Purifier fonctionne avec PHP 5. PHP 5.0.5 est la dernière version testée.
Il ne dépend pas d'autres librairies.
Les extensions optionnelles sont iconv (généralement déjà installée) et tidy
(répandue aussi). Si vous utilisez UTF-8 et que vous ne voulez pas l'indentation,
vous pouvez utiliser HTML Purifier sans ces extensions.
2. Inclure la librairie
Quand vous devez l'utiliser, incluez-le :
require_once('/path/to/library/HTMLPurifier.auto.php');
Ne pas l'inclure si ce n'est pas nécessaire, car HTML Purifier est lourd.
HTML Purifier utilise "autoload". Si vous avez défini la fonction __autoload,
vous devez ajouter cette fonction :
Plus d'informations dans le document "INSTALL".
3. Installation rapide
Si votre site Web est en UTF-8 et XHTML Transitional, utilisez :
$purificateur = new HTMLPurifier();
$html_propre = $purificateur->purify($html_a_purifier);
Sinon, utilisez :
$config = HTMLPurifier_Config::createDefault();
$config->set('Core.Encoding', 'ISO-8859-1'); //Remplacez par votre encodage
$config->set('Core', 'XHTML', true); //Remplacer par false si HTML 4.01
$purificateur = new HTMLPurifier($config);
$html_propre = $purificateur->purify($html_a_purifier);
vim: et sw=4 sts=4

@ -0,0 +1,504 @@
Version 2.1, February 1999
Copyright (C) 1991, 1999 Free Software Foundation, Inc.
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Everyone is permitted to copy and distribute verbatim copies
of this license document, but changing it is not allowed.
[This is the first released version of the Lesser GPL. It also counts
as the successor of the GNU Library Public License, version 2, hence
the version number 2.1.]
The licenses for most software are designed to take away your
freedom to share and change it. By contrast, the GNU General Public
Licenses are intended to guarantee your freedom to share and change
free software--to make sure the software is free for all its users.
This license, the Lesser General Public License, applies to some
specially designated software packages--typically libraries--of the
Free Software Foundation and other authors who decide to use it. You
can use it too, but we suggest you first think carefully about whether
this license or the ordinary General Public License is the better
strategy to use in any particular case, based on the explanations below.
When we speak of free software, we are referring to freedom of use,
not price. Our General Public Licenses are designed to make sure that
you have the freedom to distribute copies of free software (and charge
for this service if you wish); that you receive source code or can get
it if you want it; that you can change the software and use pieces of
it in new free programs; and that you are informed that you can do
these things.
To protect your rights, we need to make restrictions that forbid
distributors to deny you these rights or to ask you to surrender these
rights. These restrictions translate to certain responsibilities for
you if you distribute copies of the library or if you modify it.
For example, if you distribute copies of the library, whether gratis
or for a fee, you must give the recipients all the rights that we gave
you. You must make sure that they, too, receive or can get the source
code. If you link other code with the library, you must provide
complete object files to the recipients, so that they can relink them
with the library after making changes to the library and recompiling
it. And you must show them these terms so they know their rights.
We protect your rights with a two-step method: (1) we copyright the
library, and (2) we offer you this license, which gives you legal
permission to copy, distribute and/or modify the library.
To protect each distributor, we want to make it very clear that
there is no warranty for the free library. Also, if the library is
modified by someone else and passed on, the recipients should know
that what they have is not the original version, so that the original
author's reputation will not be affected by problems that might be
introduced by others.
Finally, software patents pose a constant threat to the existence of
any free program. We wish to make sure that a company cannot
effectively restrict the users of a free program by obtaining a
restrictive license from a patent holder. Therefore, we insist that
any patent license obtained for a version of the library must be
consistent with the full freedom of use specified in this license.
Most GNU software, including some libraries, is covered by the
ordinary GNU General Public License. This license, the GNU Lesser
General Public License, applies to certain designated libraries, and
is quite different from the ordinary General Public License. We use
this license for certain libraries in order to permit linking those
libraries into non-free programs.
When a program is linked with a library, whether statically or using
a shared library, the combination of the two is legally speaking a
combined work, a derivative of the original library. The ordinary
General Public License therefore permits such linking only if the
entire combination fits its criteria of freedom. The Lesser General
Public License permits more lax criteria for linking other code with
the library.
We call this license the "Lesser" General Public License because it
does Less to protect the user's freedom than the ordinary General
Public License. It also provides other free software developers Less
of an advantage over competing non-free programs. These disadvantages
are the reason we use the ordinary General Public License for many
libraries. However, the Lesser license provides advantages in certain
special circumstances.
For example, on rare occasions, there may be a special need to
encourage the widest possible use of a certain library, so that it becomes
a de-facto standard. To achieve this, non-free programs must be
allowed to use the library. A more frequent case is that a free
library does the same job as widely used non-free libraries. In this
case, there is little to gain by limiting the free library to free
software only, so we use the Lesser General Public License.
In other cases, permission to use a particular library in non-free
programs enables a greater number of people to use a large body of
free software. For example, permission to use the GNU C Library in
non-free programs enables many more people to use the whole GNU
operating system, as well as its variant, the GNU/Linux operating
Although the Lesser General Public License is Less protective of the
users' freedom, it does ensure that the user of a program that is
linked with the Library has the freedom and the wherewithal to run
that program using a modified version of the Library.
The precise terms and conditions for copying, distribution and
modification follow. Pay close attention to the difference between a
"work based on the library" and a "work that uses the library". The
former contains code derived from the library, whereas the latter must
be combined with the library in order to run.
0. This License Agreement applies to any software library or other
program which contains a notice placed by the copyright holder or
other authorized party saying it may be distributed under the terms of
this Lesser General Public License (also called "this License").
Each licensee is addressed as "you".
A "library" means a collection of software functions and/or data
prepared so as to be conveniently linked with application programs
(which use some of those functions and data) to form executables.
The "Library", below, refers to any such software library or work
which has been distributed under these terms. A "work based on the
Library" means either the Library or any derivative work under
copyright law: that is to say, a work containing the Library or a
portion of it, either verbatim or with modifications and/or translated
straightforwardly into another language. (Hereinafter, translation is
included without limitation in the term "modification".)
"Source code" for a work means the preferred form of the work for
making modifications to it. For a library, complete source code means
all the source code for all modules it contains, plus any associated
interface definition files, plus the scripts used to control compilation
and installation of the library.
Activities other than copying, distribution and modification are not
covered by this License; they are outside its scope. The act of
running a program using the Library is not restricted, and output from
such a program is covered only if its contents constitute a work based
on the Library (independent of the use of the Library in a tool for
writing it). Whether that is true depends on what the Library does
and what the program that uses the Library does.
1. You may copy and distribute verbatim copies of the Library's
complete source code as you receive it, in any medium, provided that
you conspicuously and appropriately publish on each copy an
appropriate copyright notice and disclaimer of warranty; keep intact
all the notices that refer to this License and to the absence of any
warranty; and distribute a copy of this License along with the
You may charge a fee for the physical act of transferring a copy,
and you may at your option offer warranty protection in exchange for a
2. You may modify your copy or copies of the Library or any portion
of it, thus forming a work based on the Library, and copy and
distribute such modifications or work under the terms of Section 1
above, provided that you also meet all of these conditions:
a) The modified work must itself be a software library.
b) You must cause the files modified to carry prominent notices
stating that you changed the files and the date of any change.
c) You must cause the whole of the work to be licensed at no
charge to all third parties under the terms of this License.
d) If a facility in the modified Library refers to a function or a
table of data to be supplied by an application program that uses
the facility, other than as an argument passed when the facility
is invoked, then you must make a good faith effort to ensure that,
in the event an application does not supply such function or
table, the facility still operates, and performs whatever part of
its purpose remains meaningful.
(For example, a function in a library to compute square roots has
a purpose that is entirely well-defined independent of the
application. Therefore, Subsection 2d requires that any
application-supplied function or table used by this function must
be optional: if the application does not supply it, the square
root function must still compute square roots.)
These requirements apply to the modified work as a whole. If
identifiable sections of that work are not derived from the Library,
and can be reasonably considered independent and separate works in
themselves, then this License, and its terms, do not apply to those
sections when you distribute them as separate works. But when you
distribute the same sections as part of a whole which is a work based
on the Library, the distribution of the whole must be on the terms of
this License, whose permissions for other licensees extend to the
entire whole, and thus to each and every part regardless of who wrote
Thus, it is not the intent of this section to claim rights or contest
your rights to work written entirely by you; rather, the intent is to
exercise the right to control the distribution of derivative or
collective works based on the Library.
In addition, mere aggregation of another work not based on the Library
with the Library (or with a work based on the Library) on a volume of
a storage or distribution medium does not bring the other work under
the scope of this License.
3. You may opt to apply the terms of the ordinary GNU General Public
License instead of this License to a given copy of the Library. To do
this, you must alter all the notices that refer to this License, so
that they refer to the ordinary GNU General Public License, version 2,
instead of to this License. (If a newer version than version 2 of the
ordinary GNU General Public License has appeared, then you can specify
that version instead if you wish.) Do not make any other change in
these notices.
Once this change is made in a given copy, it is irreversible for
that copy, so the ordinary GNU General Public License applies to all
subsequent copies and derivative works made from that copy.
This option is useful when you wish to copy part of the code of
the Library into a program that is not a library.
4. You may copy and distribute the Library (or a portion or
derivative of it, under Section 2) in object code or executable form
under the terms of Sections 1 and 2 above provided that you accompany
it with the complete corresponding machine-readable source code, which
must be distributed under the terms of Sections 1 and 2 above on a
medium customarily used for software interchange.
If distribution of object code is made by offering access to copy
from a designated place, then offering equivalent access to copy the
source code from the same place satisfies the requirement to
distribute the source code, even though third parties are not
compelled to copy the source along with the object code.
5. A program that contains no derivative of any portion of the
Library, but is designed to work with the Library by being compiled or
linked with it, is called a "work that uses the Library". Such a
work, in isolation, is not a derivative work of the Library, and
therefore falls outside the scope of this License.
However, linking a "work that uses the Library" with the Library
creates an executable that is a derivative of the Library (because it
contains portions of the Library), rather than a "work that uses the
library". The executable is therefore covered by this License.
Section 6 states terms for distribution of such executables.
When a "work that uses the Library" uses material from a header file
that is part of the Library, the object code for the work may be a
derivative work of the Library even though the source code is not.
Whether this is true is especially significant if the work can be
linked without the Library, or if the work is itself a library. The
threshold for this to be true is not precisely defined by law.
If such an object file uses only numerical parameters, data
structure layouts and accessors, and small macros and small inline
functions (ten lines or less in length), then the use of the object
file is unrestricted, regardless of whether it is legally a derivative
work. (Executables containing this object code plus portions of the
Library will still fall under Section 6.)
Otherwise, if the work is a derivative of the Library, you may
distribute the object code for the work under the terms of Section 6.
Any executables containing that work also fall under Section 6,
whether or not they are linked directly with the Library itself.
6. As an exception to the Sections above, you may also combine or
link a "work that uses the Library" with the Library to produce a
work containing portions of the Library, and distribute that work
under terms of your choice, provided that the terms permit
modification of the work for the customer's own use and reverse
engineering for debugging such modifications.
You must give prominent notice with each copy of the work that the
Library is used in it and that the Library and its use are covered by
this License. You must supply a copy of this License. If the work
during execution displays copyright notices, you must include the
copyright notice for the Library among them, as well as a reference
directing the user to the copy of this License. Also, you must do one
of these things:
a) Accompany the work with the complete corresponding
machine-readable source code for the Library including whatever
changes were used in the work (which must be distributed under
Sections 1 and 2 above); and, if the work is an executable linked
with the Library, with the complete machine-readable "work that
uses the Library", as object code and/or source code, so that the
user can modify the Library and then relink to produce a modified
executable containing the modified Library. (It is understood
that the user who changes the contents of definitions files in the
Library will not necessarily be able to recompile the application
to use the modified definitions.)
b) Use a suitable shared library mechanism for linking with the
Library. A suitable mechanism is one that (1) uses at run time a
copy of the library already present on the user's computer system,
rather than copying library functions into the executable, and (2)
will operate properly with a modified version of the library, if
the user installs one, as long as the modified version is
interface-compatible with the version that the work was made with.
c) Accompany the work with a written offer, valid for at
least three years, to give the same user the materials
specified in Subsection 6a, above, for a charge no more
than the cost of performing this distribution.
d) If distribution of the work is made by offering access to copy
from a designated place, offer equivalent access to copy the above
specified materials from the same place.
e) Verify that the user has already received a copy of these
materials or that you have already sent this user a copy.
For an executable, the required form of the "work that uses the
Library" must include any data and utility programs needed for
reproducing the executable from it. However, as a special exception,
the materials to be distributed need not include anything that is
normally distributed (in either source or binary form) with the major
components (compiler, kernel, and so on) of the operating system on
which the executable runs, unless that component itself accompanies
the executable.
It may happen that this requirement contradicts the license
restrictions of other proprietary libraries that do not normally
accompany the operating system. Such a contradiction means you cannot
use both them and the Library together in an executable that you
7. You may place library facilities that are a work based on the
Library side-by-side in a single library together with other library
facilities not covered by this License, and distribute such a combined
library, provided that the separate distribution of the work based on
the Library and of the other library facilities is otherwise
permitted, and provided that you do these two things:
a) Accompany the combined library with a copy of the same work
based on the Library, uncombined with any other library
facilities. This must be distributed under the terms of the
Sections above.
b) Give prominent notice with the combined library of the fact
that part of it is a work based on the Library, and explaining
where to find the accompanying uncombined form of the same work.
8. You may not copy, modify, sublicense, link with, or distribute
the Library except as expressly provided under this License. Any
attempt otherwise to copy, modify, sublicense, link with, or
distribute the Library is void, and will automatically terminate your
rights under this License. However, parties who have received copies,
or rights, from you under this License will not have their licenses
terminated so long as such parties remain in full compliance.
9. You are not required to accept this License, since you have not
signed it. However, nothing else grants you permission to modify or
distribute the Library or its derivative works. These actions are
prohibited by law if you do not accept this License. Therefore, by
modifying or distributing the Library (or any work based on the
Library), you indicate your acceptance of this License to do so, and
all its terms and conditions for copying, distributing or modifying
the Library or works based on it.
10. Each time you redistribute the Library (or any work based on the
Library), the recipient automatically receives a license from the
original licensor to copy, distribute, link with or modify the Library
subject to these terms and conditions. You may not impose any further
restrictions on the recipients' exercise of the rights granted herein.
You are not responsible for enforcing compliance by third parties with
this License.
11. If, as a consequence of a court judgment or allegation of patent
infringement or for any other reason (not limited to patent issues),
conditions are imposed on you (whether by court order, agreement or
otherwise) that contradict the conditions of this License, they do not
excuse you from the conditions of this License. If you cannot
distribute so as to satisfy simultaneously your obligations under this
License and any other pertinent obligations, then as a consequence you
may not distribute the Library at all. For example, if a patent
license would not permit royalty-free redistribution of the Library by
all those who receive copies directly or indirectly through you, then
the only way you could satisfy both it and this License would be to
refrain entirely from distribution of the Library.
If any portion of this section is held invalid or unenforceable under any
particular circumstance, the balance of the section is intended to apply,
and the section as a whole is intended to apply in other circumstances.
It is not the purpose of this section to induce you to infringe any
patents or other property right claims or to contest validity of any
such claims; this section has the sole purpose of protecting the
integrity of the free software distribution system which is
implemented by public license practices. Many people have made
generous contributions to the wide range of software distributed
through that system in reliance on consistent application of that
system; it is up to the author/donor to decide if he or she is willing
to distribute software through any other system and a licensee cannot
impose that choice.
This section is intended to make thoroughly clear what is believed to
be a consequence of the rest of this License.
12. If the distribution and/or use of the Library is restricted in
certain countries either by patents or by copyrighted interfaces, the
original copyright holder who places the Library under this License may add
an explicit geographical distribution limitation excluding those countries,
so that distribution is permitted only in or among countries not thus
excluded. In such case, this License incorporates the limitation as if
written in the body of this License.
13. The Free Software Foundation may publish revised and/or new
versions of the Lesser General Public License from time to time.
Such new versions will be similar in spirit to the present version,
but may differ in detail to address new problems or concerns.
Each version is given a distinguishing version number. If the Library
specifies a version number of this License which applies to it and
"any later version", you have the option of following the terms and
conditions either of that version or of any later version published by
the Free Software Foundation. If the Library does not specify a
license version number, you may choose any version ever published by
the Free Software Foundation.
14. If you wish to incorporate parts of the Library into other free
programs whose distribution conditions are incompatible with these,
write to the author to ask for permission. For software which is
copyrighted by the Free Software Foundation, write to the Free
Software Foundation; we sometimes make exceptions for this. Our
decision will be guided by the two goals of preserving the free status
of all derivatives of our free software and of promoting the sharing
and reuse of software generally.
How to Apply These Terms to Your New Libraries
If you develop a new library, and you want it to be of the greatest
possible use to the public, we recommend making it free software that
everyone can redistribute and change. You can do so by permitting
redistribution under these terms (or, alternatively, under the terms of the
ordinary General Public License).
To apply these terms, attach the following notices to the library. It is
safest to attach them to the start of each source file to most effectively
convey the exclusion of warranty; and each file should have at least the
"copyright" line and a pointer to where the full notice is found.
<one line to give the library's name and a brief idea of what it does.>
Copyright (C) <year> <name of author>
This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with this library; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Also add information on how to contact you by electronic and paper mail.
You should also get your employer (if you work as a programmer) or your
school, if any, to sign a "copyright disclaimer" for the library, if
necessary. Here is a sample; alter the names:
Yoyodyne, Inc., hereby disclaims all copyright interest in the
library `Frob' (a library for tweaking knobs) written by James Random Hacker.
<signature of Ty Coon>, 1 April 1990
Ty Coon, President of Vice
That's all there is to it!
vim: et sw=4 sts=4

File diff suppressed because it is too large Load Diff

@ -0,0 +1,24 @@
All about HTML Purifier
HTML Purifier is an HTML filtering solution that uses a unique combination
of robust whitelists and aggressive parsing to ensure that not only are
XSS attacks thwarted, but the resulting HTML is standards compliant.
HTML Purifier is oriented towards richly formatted documents from
untrusted sources that require CSS and a full tag-set. This library can
be configured to accept a more restrictive set of tags, but it won't be
as efficient as more bare-bones parsers. It will, however, do the job
right, which may be more important.
Places to go:
* See INSTALL for a quick installation guide
* See docs/ for developer-oriented documentation, code examples and
an in-depth installation guide.
* See WYSIWYG for information on editors like TinyMCE and FCKeditor
HTML Purifier can be found on the web at:
vim: et sw=4 sts=4

@ -0,0 +1,150 @@
= KEY ====================
# Flagship
- Regular
? Maybe I'll Do It
If no interest is expressed for a feature that may require a considerable
amount of effort to implement, it may get endlessly delayed. Do not be
afraid to cast your vote for the next feature to be implemented!
Things to do as soon as possible:
- Think about allowing explicit order of operations hooks for transforms
- Fix "<.<" bug (trailing < is removed if not EOD)
- Build in better internal state dumps and debugging tools for remote
- Allowed/Allowed* have strange interactions when both set
? Transform lone embeds into object tags
- Deprecated config options that emit warnings when you set them (with
a way of muting the warning if you really want to)
- Make HTML.Trusted work with Output.FlashCompat
- HTML.Trusted and HTML.SafeObject have funny interaction; general
problem is what to do when a module "supersedes" another
(see also tables and basic tables.) This is a little dicier
because HTML.SafeObject has some extra functionality that
trusted might find useful. See,5762,6100
4.8 release [OMG CONFIG PONIES]
! Fix Printer. It's from the old days when we didn't have decent XML classes
! Factor demo.php into a set of Printer classes, and then create a stub
file for users here (inside the actual HTML Purifier library)
- Fix error handling with form construction
- Do encoding validation in Printers, or at least, where user data comes in
- Config: Add examples to everything (make built-in which also automatically
gives output)
- Add "register" field to config schemas to eliminate dependence on
naming conventions (try to remember why we ultimately decided on this)
5.0 release [HTML 5]
# Swap out code to use html5lib tokenizer and tree-builder
! Allow turning off of FixNesting and required attribute insertion
5.1 release [It's All About Trust] (floating)
# Implement untrusted, dangerous elements/attributes
# Implement IDREF support (harder than it seems, since you cannot have
IDREFs to non-existent IDs)
- Implement <area> (client and server side image maps are blocking
on IDREF support)
# Frameset XHTML 1.0 and HTML 4.01 doctypes
- Figure out how to simultaneously set %CSS.Trusted and %HTML.Trusted (?)
5.2 release [Error'ed]
# Error logging for filtering/cleanup procedures
# Additional support for poorly written HTML
- Microsoft Word HTML cleaning (i.e. MsoNormal, but research essential!)
- Friendly strict handling of <address> (block -> <br>)
- XSS-attempt detection--certain errors are flagged XSS-like
- Append something to duplicate IDs so they're still usable (impl. note: the
dupe detector would also need to detect the suffix as well)
6.0 release [Beyond HTML]
# Legit token based CSS parsing (will require revamping almost every
AttrDef class). Probably will use CSSTidy
# More control over allowed CSS properties using a modularization
# IRI support (this includes IDN)
- Standardize token armor for all areas of processing
7.0 release [To XML and Beyond]
- Extended HTML capabilities based on namespacing and tag transforms (COMPLEX)
- Hooks for adding custom processors to custom namespaced tags and
attributes, offer default implementation
- Lots of documentation and samples
- More refactoring to take advantage of PHP5's facilities
- Refactor unit tests into lots of test methods
- Plugins for major CMSes (COMPLEX)
- phpBB
- Also, a FAQ for extension writers with HTML Purifier
- Smileys
- Syntax highlighting (with GeSHi) with <pre> and possibly <?php
- Look at for ideas
Neat feature related
! Support exporting configuration, so users can easily tweak settings
in the demo, and then copy-paste into their own setup
- Advanced URI filtering schemes (see docs/proposal-new-directives.txt)
- Allow scoped="scoped" attribute in <style> tags; may be troublesome
because regular CSS has no way of uniquely identifying nodes, so we'd
have to generate IDs
- Explain how to use HTML Purifier in non-PHP languages / create
a simple command line stub (or complicated?)
- Fixes for Firefox's inability to handle COL alignment props (Bug 915)
- Automatically add non-breaking spaces to empty table cells when
empty-cells:show is applied to have compatibility with Internet Explorer
- Table of Contents generation (XHTML Compiler might be reusable). May also
be out-of-band information.
- Full set of color keywords. Also, a way to add onto them without
finalizing the configuration object.
- Write a var_export and memcached DefinitionCache - Denis
- Built-in support for target="_blank" on all external links
- Convert RTL/LTR override characters to <bdo> tags, or vice versa on demand.
Also, enable disabling of directionality
? Externalize inline CSS to promote clean HTML, proposed by Sander Tekelenburg
? Remove redundant tags, ex. <u><u>Underlined</u></u>. Implementation notes:
1. Analyzing which tags to remove as duplicates
2. Ensure attributes are merged into the parent tag
3. Extend the tag exclusion system to specify whether or not the
contents should be dropped or not (currently, there's code that could do
something like this if it didn't drop the inner text too.)
? Make AutoParagraph also support paragraph-izing double <br> tags, and not
just double newlines. This is kind of tough to do in the current framework,
though, and might be reasonably approximated by search replacing double <br>s
with newlines before running it through HTML Purifier.
Maintenance related (slightly boring)
# CHMOD install script for PEAR installs
! Factor out command line parser into its own class, and unit test it
- Reduce size of internal data-structures (esp. HTMLDefinition)
- Allow merging configurations. Thus,
a -> b -> default
c -> d -> default
a -> b -> c -> d -> default
Maybe allow more fine-grained tuning of this behavior. Alternatively,
encourage people to use short plist depths before building them up.
- Time PHPT tests
ChildDef related (very boring)
- Abstract ChildDef_BlockQuote to work with all elements that only
allow blocks in them, required or optional
- Implement lenient <ruby> child validation
- Non-lossy smart alternate character encoding transformations (unless
patch provided)
- Pretty-printing HTML: users can use Tidy on the output on entire page
- Native content compression, whitespace stripping: use gzip if this is
really important
vim: et sw=4 sts=4

@ -0,0 +1,4 @@
HTML Purifier 4.7.0 is a bugfix release, collecting two years'
worth of accumulated bug fixes. Highlighted bugfixes are updated
YouTube filter code, corrected rgb() CSS parsing, and one new
configuration option, %AutoFormat.RemoveEmpty.Predicate.

@ -0,0 +1,20 @@
WYSIWYG - What You See Is What You Get
HTML Purifier: A Pretty Good Fit for TinyMCE and FCKeditor
Javascript-based WYSIWYG editors, simply stated, are quite amazing. But I've
always been wary about using them due to security issues: they handle the
client-side magic, but once you've been served a piping hot load of unfiltered
HTML, what should be done then? In some situations, you can serve it uncleaned,
since you only offer these facilities to trusted(?) authors.
Unfortunately, for blog comments and anonymous input, BBCode, Textile and
other markup languages still reign supreme. Put simply: filtering HTML is
hard work, and these WYSIWYG authors don't offer anything to alleviate that
trouble. Therein lies the solution:
HTML Purifier is perfect for filtering pure-HTML input from WYSIWYG editors.
Enough said.
vim: et sw=4 sts=4

@ -0,0 +1,22 @@
"name": "ezyang/htmlpurifier",
"description": "Standards compliant HTML filter written in PHP",
"type": "library",
"keywords": ["html"],
"homepage": "",
"license": "LGPL",
"authors": [
"name": "Edward Z. Yang",
"email": "",
"homepage": ""
"require": {
"php": ">=5.2"
"autoload": {
"psr-0": { "HTMLPurifier": "library/" },
"files": ["library/HTMLPurifier.composer.php"]

@ -0,0 +1,91 @@
* Decorator/extender XSLT processor specifically for HTML documents.
class ConfigDoc_HTMLXSLTProcessor
* Instance of XSLTProcessor
protected $xsltProcessor;
/**
 * Stores the XSLT processor this object decorates.
 * @param mixed $proc Processor to wrap; when exactly false (the default)
 *        a new XSLTProcessor is created instead.
 */
public function __construct($proc = false)
{
    $this->xsltProcessor = ($proc === false) ? new XSLTProcessor() : $proc;
}
* @note Allows a string $xsl filename to be passed
public function importStylesheet($xsl)
if (is_string($xsl)) {
$xsl_file = $xsl;
$xsl = new DOMDocument();
return $this->xsltProcessor->importStylesheet($xsl);
* Transforms an XML file into compatible XHTML based on the stylesheet
* @param $xml XML DOM tree, or string filename
* @return string HTML output
* @todo Rename to transformToXHTML, as transformToHTML is misleading
public function transformToHTML($xml)
if (is_string($xml)) {
$dom = new DOMDocument();
} else {
$dom = $xml;
$out = $this->xsltProcessor->transformToXML($dom);
// fudges for HTML backwards compatibility
// assumes that document is XHTML
$out = str_replace('/>', ' />', $out); // <br /> not <br/>
$out = str_replace(' xmlns=""', '', $out); // rm unnecessary xmlns
if (class_exists('Tidy')) {
// cleanup output
$config = array(
'indent' => true,
'output-xhtml' => true,
'wrap' => 80
$tidy = new Tidy;
$tidy->parseString($out, $config, 'utf8');
$out = (string) $tidy;
return $out;
/**
 * Sets several XSL stylesheet parameters in one call.
 * Each entry is handed to the wrapped processor's setParameter() with an
 * empty namespace.
 * @param array $options Associative array of parameter name => value
 */
public function setParameters($options)
{
    foreach ($options as $paramName => $paramValue) {
        $this->xsltProcessor->setParameter('', $paramName, $paramValue);
    }
}
/**
 * Forward any other calls to the XSLT processor
 * @param string $name Name of the method invoked on this object
 * @param array $arguments Arguments the method was invoked with
 * @return mixed Whatever the wrapped processor's method returns
 */
public function __call($name, $arguments)
{
    // The result must be handed back; without the return every proxied
    // method appeared to return null to the caller.
    return call_user_func_array(array($this->xsltProcessor, $name), $arguments);
}
// vim: et sw=4 sts=4

@ -0,0 +1,164 @@
* Filesystem tools not provided by default; can recursively create, copy
* and delete folders. Some template methods are provided for extensibility.
* @note This class must be instantiated to be used, although it does
* not maintain state.
class FSTools
private static $singleton;
/**
 * Returns the shared FSTools instance, creating it on first use.
 */
public static function singleton()
{
    if (empty(self::$singleton)) {
        self::$singleton = new FSTools();
    }
    return self::$singleton;
}
/**
 * Replaces the shared instance returned by singleton(); useful for
 * overloading functions.
 * @param mixed $singleton Object to hand out from singleton() from now on
 */
public static function setSingleton($singleton)
{
    self::$singleton = $singleton;
}
* Recursively creates a directory
* @param string $folder Name of folder to create
* @note Adapted from the PHP manual comment 76612
public function mkdirr($folder)
$folders = preg_split("#[\\\\/]#", $folder);
$base = '';
for($i = 0, $c = count($folders); $i < $c; $i++) {
if(empty($folders[$i])) {
if (!$i) {
// special case for root level
$base .= $folders[$i];
* Copy a file, or recursively copy a folder and its contents; modified
* so that copied files, if PHP, have includes removed
* @note Adapted from
public function copyr($source, $dest)
// Simple copy for a file
if (is_file($source)) {
return $this->copy($source, $dest);
// Make destination directory
if (!is_dir($dest)) {
// Loop through the folder
$dir = $this->dir($source);
while ( false !== ($entry = $dir->read()) ) {
// Skip pointers
if ($entry == '.' || $entry == '..') {
if (!$this->copyable($entry)) {
// Deep copy directories
if ($dest !== "$source/$entry") {
$this->copyr("$source/$entry", "$dest/$entry");
// Clean up
return true;
/**
 * Overloadable hook that decides whether copyr() should copy an entry.
 * This base implementation accepts everything; override it to ignore
 * hidden files, unreadable files, etc.
 * @param string $file Name of the entry being considered
 * @return bool Always true in this implementation
 */
public function copyable($file)
{
    return true;
}
* Delete a file, or a folder and its contents
* @note Adapted from
public function rmdirr($dirname)
// Sanity check
if (!$this->file_exists($dirname)) {
return false;
// Simple delete for a file
if ($this->is_file($dirname) || $this->is_link($dirname)) {
return $this->unlink($dirname);
// Loop through the folder
$dir = $this->dir($dirname);
while (false !== $entry = $dir->read()) {
// Skip pointers
if ($entry == '.' || $entry == '..') {
// Recurse
$this->rmdirr($dirname . DIRECTORY_SEPARATOR . $entry);
// Clean up
return $this->rmdir($dirname);
/**
 * Recursively globs a directory.
 * @param string $dir Directory to search
 * @param string $pattern Glob pattern applied in $dir and in every
 *        subdirectory found beneath it
 * @param int|null $flags Flags forwarded to glob(); null (the default)
 *        is treated as 0
 * @return array Matches from $dir followed by matches from subdirectories
 */
public function globr($dir, $pattern, $flags = NULL)
{
    // glob() declares $flags as int; handing it null is deprecated on
    // PHP 8.1+, so normalise once before the first call and the recursion.
    $flags = (int) $flags;
    $files = $this->glob("$dir/$pattern", $flags);
    if ($files === false) $files = array();
    $sub_dirs = $this->glob("$dir/*", GLOB_ONLYDIR);
    if ($sub_dirs === false) $sub_dirs = array();
    foreach ($sub_dirs as $sub_dir) {
        $sub_files = $this->globr($sub_dir, $pattern, $flags);
        $files = array_merge($files, $sub_files);
    }
    return $files;
}
/**
 * Routes any undefined method to the PHP function of the same name, so
 * that filesystem functions can be called on this object and stubbed.
 * @warning This function will not work for functions that need
 *          to pass references; manually define a stub function for those.
 * @param string $name Name of the function to invoke
 * @param array $args Arguments to pass to it
 * @return mixed Result of the invoked function
 */
public function __call($name, $args)
{
    $result = call_user_func_array($name, $args);
    return $result;
}
// vim: et sw=4 sts=4

@ -0,0 +1,141 @@
/**
 * Represents a file in the filesystem
 *
 * @warning Be sure to distinguish between get() and write() versus
 *      read() and put(), the former operates on the entire file, while
 *      the latter operates on a handle.
 */
class FSTools_File
{

    /** Filename of file this object represents */
    protected $name;

    /** Handle for the file, or false while no handle is open */
    protected $handle = false;

    /** Instance of FSTools for interfacing with filesystem */
    protected $fs;

    /**
     * @param string $name Filename of file you wish to instantiate.
     * @param mixed $fs Object used for all filesystem calls; when falsy
     *        (the default) FSTools::singleton() is used.
     * @note This file need not exist
     */
    public function __construct($name, $fs = false)
    {
        $this->name = $name;
        $this->fs = $fs ? $fs : FSTools::singleton();
    }

    /** Returns the filename of the file. */
    public function getName() {return $this->name;}

    /** Returns directory of the file without trailing slash */
    public function getDirectory() {return $this->fs->dirname($this->name);}

    /**
     * Retrieves the contents of a file
     * @todo Throw an exception if file doesn't exist
     */
    public function get()
    {
        return $this->fs->file_get_contents($this->name);
    }

    /** Writes contents to a file, creates new file if necessary */
    public function write($contents)
    {
        return $this->fs->file_put_contents($this->name, $contents);
    }

    /** Deletes the file */
    public function delete()
    {
        return $this->fs->unlink($this->name);
    }

    /** Returns true if file exists and is a file. */
    public function exists()
    {
        return $this->fs->is_file($this->name);
    }

    /** Returns last file modification time */
    public function getMTime()
    {
        return $this->fs->filemtime($this->name);
    }

    /**
     * Chmod a file
     * @note We ignore errors because of some weird owner trickery due
     *       to SVN duality
     */
    public function chmod($octal_code)
    {
        return @$this->fs->chmod($this->name, $octal_code);
    }

    /**
     * Opens file's handle, closing any handle that is already open.
     * @param string $mode Mode string passed to fopen
     * @return bool True when a handle was obtained, false when the
     *         underlying fopen failed
     */
    public function open($mode)
    {
        if ($this->handle) $this->close();
        $handle = $this->fs->fopen($this->name, $mode);
        // Keep the "no handle" state canonical so later truthiness checks
        // and close() behave the same whatever falsy value fopen produced.
        $this->handle = $handle ? $handle : false;
        return $this->handle !== false;
    }

    /**
     * Closes file's handle
     * @return bool False when no handle was open, otherwise fclose's status
     */
    public function close()
    {
        if (!$this->handle) return false;
        $status = $this->fs->fclose($this->handle);
        $this->handle = false;
        return $status;
    }

    /**
     * Retrieves a line from the file, opening it for reading if needed,
     * with optional max length $length
     * @return string|false The line, or false on failure / unopenable file
     */
    public function getLine($length = null)
    {
        if (!$this->ensureOpen('r')) return false;
        if ($length === null) return $this->fs->fgets($this->handle);
        else return $this->fs->fgets($this->handle, $length);
    }

    /**
     * Retrieves a character from the file, opening it for reading if needed
     * @return string|false The character, or false on failure / unopenable file
     */
    public function getChar()
    {
        if (!$this->ensureOpen('r')) return false;
        return $this->fs->fgetc($this->handle);
    }

    /**
     * Retrieves $length bytes of data from the file, opening it for
     * reading if needed
     * @return string|false The data, or false on failure / unopenable file
     */
    public function read($length)
    {
        if (!$this->ensureOpen('r')) return false;
        return $this->fs->fread($this->handle, $length);
    }

    /**
     * Writes to the file through its handle, opening it in append mode
     * if no handle is open yet
     * @return int|false Result of fwrite, or false when the file cannot be opened
     */
    public function put($string)
    {
        if (!$this->ensureOpen('a')) return false;
        return $this->fs->fwrite($this->handle, $string);
    }

    /** Returns TRUE if the end of the file has been reached or no handle is open */
    public function eof()
    {
        if (!$this->handle) return true;
        return $this->fs->feof($this->handle);
    }

    /** Releases the handle, if one is still open, when the object is destroyed */
    public function __destruct()
    {
        if ($this->handle) $this->close();
    }

    /**
     * Makes sure a handle is available, opening the file in $mode when
     * none is open yet.
     * @return bool False when the file could not be opened
     */
    private function ensureOpen($mode)
    {
        return $this->handle ? true : $this->open($mode);
    }

}
// vim: et sw=4 sts=4

Some files were not shown because too many files have changed in this diff Show More