From 1d35149191224cbffd68306117cd08c20096ec6e Mon Sep 17 00:00:00 2001 From: Ruslan Date: Tue, 30 Jan 2018 20:57:07 +0400 Subject: [PATCH] Update VkBridge (#625) --- bridges/VkBridge.php | 85 +++++++++++++++++++++++++++++++++++--------- 1 file changed, 68 insertions(+), 17 deletions(-) diff --git a/bridges/VkBridge.php b/bridges/VkBridge.php index 9981da12..85bf60c5 100644 --- a/bridges/VkBridge.php +++ b/bridges/VkBridge.php @@ -1,9 +1,11 @@ getInput('u'))) { + public function getURI() + { + if (!is_null($this->getInput('u'))) { return static::URI . urlencode($this->getInput('u')); } return parent::getURI(); } - public function collectData(){ + public function collectData() + { - ini_set('user-agent', 'Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:53.0) Gecko/20100101 Firefox/53.0'); - - $text_html = getContents($this->getURI()) - or returnServerError('No results for group or user name "' . $this->getInput('u') . '".'); + $text_html = $this->getContents() + or returnServerError('No results for group or user name "' . $this->getInput('u') . '".'); $text_html = iconv('windows-1251', 'utf-8', $text_html); $html = str_get_html($text_html); + $pageName = $html->find('.page_name', 0)->plaintext; - foreach($html->find('.post') as $post) { + foreach ($html->find('.post') as $post) { - if(is_object($post->find('a.wall_post_more', 0))) { + if (is_object($post->find('a.wall_post_more', 0))) { //delete link "show full" in content $post->find('a.wall_post_more', 0)->outertext = ''; } $item = array(); $item['content'] = strip_tags(backgroundToImg($post->find('div.wall_text', 0)->innertext), '
'); - if(is_object($post->find('a.page_media_link_title', 0))) { - $link = $post->find('a.page_media_link_title', 0)->getAttribute('href'); + if (is_object($post->find('a.page_media_link_title', 0))) { + $link = $post->find('a.page_media_link_title', 0)->getAttribute('href'); //external link in the post $item['content'] .= "\n\rExternal link: " - . str_replace('/away.php?to=', '', urldecode($link)); + . str_replace('/away.php?to=', '', urldecode($link)); } //get video on post - if(is_object($post->find('span.post_video_title_content', 0))) { + if (is_object($post->find('span.post_video_title_content', 0))) { $titleVideo = $post->find('span.post_video_title_content', 0)->plaintext; $linkToVideo = self::URI . $post->find('a.page_post_thumb_video', 0)->getAttribute('href'); $item['content'] .= "\n\r {$titleVideo}: {$linkToVideo}"; @@ -58,9 +61,57 @@ class VkBridge extends BridgeAbstract { // get post link $item['uri'] = self::URI . $post->find('a.post_link', 0)->getAttribute('href'); - $item['date'] = $post->find('span.rel_date', 0)->plaintext; + $item['timestamp'] = $this->getTime($post); + $item['author'] = $pageName; $this->items[] = $item; - // var_dump($item['date']); + } } + + private function getTime($post) + { + if ($time = $post->find('span.rel_date', 0)->getAttribute('time')) { + return $time; + } else { + $strdate = $post->find('span.rel_date', 0)->plaintext; + + $date = date_parse($strdate); + if (!$date['year']) { + if (strstr($strdate, 'today') !== false) { + $strdate = date('d-m-Y') . ' ' . $strdate; + } elseif (strstr($strdate, 'yesterday ') !== false) { + $time = time() - 60 * 60 * 24; + $strdate = date('d-m-Y', $time) . ' ' . $strdate; + } else { + $strdate = $strdate . ' ' . date('Y'); + } + + $date = date_parse($strdate); + } + return strtotime($date['day'] . '-' . $date['month'] . '-' . $date['year'] . ' ' . + $date['hour'] . ':' . $date['minute']); + } + + } + + public function getContents() + { + ini_set('user-agent', 'Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:53.0) Gecko/20100101 Firefox/53.0'); + + $opts = array( + 'http' => array( + 'method' => "GET", + 'user_agent' => ini_get('user_agent'), + 'accept_encoding' => 'gzip', + 'header' => "Accept-language: en\r\n + Cookie: remixlang=3\r\n" + ) + ); + + $context = stream_context_create($opts); + + return getContents($this->getURI(), false, $context); + } + + }