array( 'name' => 'Profile URL', 'type' => 'text', 'required' => true, 'title' => 'Profile URL. Example: https://www.scribd.com/user/489040929/number10leaks-com', 'exampleValue' => 'https://www.scribd.com/user/' ), )); const CACHE_TIMEOUT = 3600; private $profileUrlRegex = '/scribd\.com\/(user\/[0-9]+\/[\w-]+)\/?/'; private $feedName = ''; public function collectData() { $html = getSimpleHTMLDOM($this->getURI()) or returnServerError('Could not request: ' . $this->getURI()); $header = $html->find('div.header', 0); $this->feedName = $header->find('a', 0)->plaintext; foreach($html->find('div.content ul li') as $index => $li) { $item = array(); $item['title'] = $li->find('div.under_title', 0)->plaintext; $item['uri'] = $li->find('a', 0)->href; $item['author'] = $li->find('span.uploader', 0)->plaintext; //$item['timestamp'] = $item['uid'] = $li->find('a', 0)->href; $pageHtml = getSimpleHTMLDOMCached($item['uri'], 3600) or returnServerError('Could not request: ' . $item['uri']); $image = $pageHtml->find('meta[property="og:image"]', 0)->content; $description = $pageHtml->find('meta[property="og:description"]', 0)->content; foreach ($pageHtml->find('ul.interest_pills li') as $pills) { $item['categories'][] = $pills->plaintext; } $item['content'] = <<{$description}

EOD; $item['enclosures'][] = $image; $this->items[] = $item; if (count($this->items) >= 15) { break; } } } public function getName() { if ($this->feedName) { return $this->feedName . ' - Scribd'; } return parent::getName(); } public function getURI() { if (!is_null($this->getInput('profile'))) { preg_match($this->profileUrlRegex, $this->getInput('profile'), $user) or returnServerError('Could not extract user ID and name from given profile URL.'); return self::URI . '/' . $user[1] . '/uploads'; } return parent::getURI(); } }