find('div.inner > a') as $index => $a) {
            $item = array();

            // Load the linked article page via the cached getter; returnServerError()
            // is invoked when that call yields a falsy result.
            $articlePath = $a->href;
            $articlePageHtml = getSimpleHTMLDOMCached($articlePath, self::CACHE_TIMEOUT)
                or returnServerError('Could not request: ' . $articlePath);

            // NOTE(review): defaultLinkTo() presumably rewrites relative links against
            // self::URI — confirm against the helper's definition.
            $articlePageHtml = defaultLinkTo($articlePageHtml, self::URI);

            // NOTE(review): the first div.Contents is used without a null check —
            // presumably every article page has one; confirm.
            $contents = $articlePageHtml->find('div.Contents', 0);

            $item['uri'] = $articlePath;

            // The first <h5> supplies the title; its outertext is then blanked before
            // the container's innertext is read as the item content.
            $item['title'] = $contents->find('h5', 0)->innertext;
            $contents->find('h5', 0)->outertext = '';
            $item['content'] = $contents->innertext;

            // The timestamp is the leading date found in the anchor's plain text.
            $item['timestamp'] = $this->extractDate($a->plaintext);

            // NOTE(review): the first <img> inside the anchor is dereferenced without
            // a null check — presumably every anchor wraps an image; confirm.
            $item['enclosures'][] = $a->find('img', 0)->src;

            $this->items[] = $item;

            // Stop once ten items have been collected.
            if (count($this->items) >= 10) {
                break;
            }
        }
    }

    /**
     * Pull the leading slash-separated date (four-digit year, then one- or
     * two-digit month and day) out of a piece of text.
     *
     * The text is trimmed first, and the date must sit at the very start of
     * the trimmed text.
     *
     * @param string $text Text expected to begin with a date such as 2020/1/31.
     * @return string The matched date exactly as written, or an empty string
     *                when the trimmed text does not start with one.
     */
    private function extractDate($text)
    {
        $captured = array();
        $found = preg_match('/^([0-9]{4}\/[0-9]{1,2}\/[0-9]{1,2})/', trim($text), $captured);

        return $found ? $captured[1] : '';
    }
}