summaryrefslogtreecommitdiff
path: root/includes/tidy/Html5Depurate.php
blob: 23e445fa6b8e6f5b86c8878bd4895b2c27b1a4d6 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
<?php

namespace MediaWiki\Tidy;
use MWHttpRequest;
use Exception;

class Html5Depurate extends TidyDriverBase {
	public function __construct( array $config ) {
		parent::__construct( $config + array(
			'url' => 'http://localhost:4339/document',
			'timeout' => 10,
			'connectTimeout' => 0.5,
		) );
	}

	public function tidy( $text ) {
		$wrappedtext = '<!DOCTYPE html><html>' .
			'<body>' . $text . '</body></html>';

		$req = MWHttpRequest::factory( $this->config['url'],
			array(
				'method' => 'POST',
				'timeout' => $this->config['timeout'],
				'connectTimeout' => $this->config['connectTimeout'],
				'postData' => array(
					'text' => $wrappedtext
				)
			) );
		$status = $req->execute();
		if ( !$status->isOK() ) {
			throw new Exception( "Error contacting depurate service: " . $status->getWikiText() );
		} elseif ( $req->getStatus() !== 200 ) {
			throw new Exception( "Depurate returned error: " . $status->getWikiText() );
		}
		$result = $req->getContent();
		$startBody = strpos( $result, "<body>" );
		$endBody = strrpos( $result, "</body>" );
		if ( $startBody !== false && $endBody !== false && $endBody > $startBody ) {
			$startBody += strlen( "<body>" );
			return substr( $result, $startBody, $endBody - $startBody );
		} else {
			return $text . "\n<!-- Html5Depurate returned an invalid result -->";
		}
	}
}