123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120 |
- <?php
- namespace IXR;
- use Typecho\Common;
- use Typecho\Http\Client as HttpClient;
- use Typecho\Http\Client\Exception as HttpException;
- /**
- * fetch pingback
- */
- class Pingback
- {
- /**
- * @var string
- */
- private $html;
- /**
- * @var string
- */
- private $target;
- /**
- * @param string $url
- * @param string $target
- * @throws Exception
- */
- public function __construct(string $url, string $target)
- {
- $client = HttpClient::get();
- $this->target = $target;
- if (!isset($client)) {
- throw new Exception('No available http client', 50);
- }
- try {
- $client->setTimeout(5)
- ->send($url);
- } catch (HttpException $e) {
- throw new Exception('Pingback http error', 50);
- }
- if ($client->getResponseStatus() != 200) {
- throw new Exception('Pingback wrong http status', 50);
- }
- $response = $client->getResponseBody();
- $encoding = 'UTF-8';
- $contentType = $client->getResponseHeader('Content-Type');
- if (!empty($contentType) && preg_match("/charset=([_a-z0-9-]+)/i", $contentType, $matches)) {
- $encoding = strtoupper($matches[1]);
- } elseif (preg_match("/<meta\s+charset=\"([_a-z0-9-]+)\"/i", $response, $matches)) {
- $encoding = strtoupper($matches[1]);
- }
- $this->html = $encoding == 'UTF-8' ? $response : mb_convert_encoding($response, 'UTF-8', $encoding);
- if (
- !$client->getResponseHeader('X-Pingback') &&
- !preg_match_all("/<link[^>]*rel=[\"']pingback[\"'][^>]+href=[\"']([^\"']*)[\"'][^>]*>/i", $this->html)
- ) {
- throw new Exception("Source server doesn't support pingback", 50);
- }
- }
- /**
- * get title
- *
- * @return string
- */
- public function getTitle(): string
- {
- if (preg_match("/\<title\>([^<]*?)\<\/title\\>/is", $this->html, $matchTitle)) {
- return Common::subStr(Common::removeXSS(trim(strip_tags($matchTitle[1]))), 0, 150, '...');
- }
- return parse_url($this->target, PHP_URL_HOST);
- }
- /**
- * get content
- *
- * @return string
- * @throws Exception
- */
- public function getContent(): string
- {
- /** 干掉html tag,只留下<a>*/
- $text = Common::stripTags($this->html, '<a href="">');
- /** 此处将$target quote,留着后面用*/
- $pregLink = preg_quote($this->target);
- /** 找出含有target链接的最长的一行作为$finalText*/
- $finalText = null;
- $lines = explode("\n", $text);
- foreach ($lines as $line) {
- $line = trim($line);
- if (null != $line) {
- if (preg_match("|<a[^>]*href=[\"']{$pregLink}[\"'][^>]*>(.*?)</a>|", $line)) {
- if (strlen($line) > strlen($finalText)) {
- /** <a>也要干掉,*/
- $finalText = Common::stripTags($line);
- break;
- }
- }
- }
- }
- if (!isset($finalText)) {
- throw new Exception("Source page doesn't have target url", 50);
- }
- return '[...]' . Common::subStr($finalText, 0, 200, '') . '[...]';
- }
- }
|