| @ -0,0 +1,84 @@ | |||
| <?php | |||
| namespace p3k\XRay\Formats; | |||
| use DateTime, DateTimeZone; | |||
| use Config; | |||
| use cebe\markdown\GithubMarkdown; | |||
| class Hackernews extends Format { | |||
| public static function matches_host($url) { | |||
| $host = parse_url($url, PHP_URL_HOST); | |||
| return $host == 'news.ycombinator.com'; | |||
| } | |||
| public static function matches($url) { | |||
| if(preg_match('~https?://news\.ycombinator\.com/item\?id=(\d+)$~', $url, $match)) | |||
| return $match; | |||
| else | |||
| return false; | |||
| } | |||
| public static function fetch($http, $url, $opts) { | |||
| $match = self::matches($url); | |||
| $response = $http->get('https://hacker-news.firebaseio.com/v0/item/'.$match[1].'.json'); | |||
| if($response['code'] != 200) { | |||
| return [ | |||
| 'error' => 'hackernews_error', | |||
| 'error_description' => $response['body'], | |||
| 'code' => $response['code'], | |||
| ]; | |||
| } | |||
| return [ | |||
| 'url' => $url, | |||
| 'body' => $response['body'], | |||
| 'code' => $response['code'], | |||
| ]; | |||
| } | |||
| public static function parse($json, $url) { | |||
| $data = @json_decode($json, true); | |||
| if(!$data) | |||
| return self::_unknown(); | |||
| $match = self::matches($url); | |||
| $date = DateTime::createFromFormat('U', $data['time']); | |||
| // Start building the h-entry | |||
| $entry = array( | |||
| 'type' => 'entry', | |||
| 'url' => $url, | |||
| 'author' => [ | |||
| 'type' => 'card', | |||
| 'name' => $data['by'], | |||
| 'photo' => null, | |||
| 'url' => 'https://news.ycombinator.com/user?id='.$data['by'] | |||
| ], | |||
| 'published' => $date->format('c') | |||
| ); | |||
| if(isset($data['title'])) { | |||
| $entry['name'] = $data['title']; | |||
| } | |||
| if(isset($data['text'])) { | |||
| $htmlContent = trim(self::sanitizeHTML($data['text'])); | |||
| $textContent = str_replace('</p><p>', "</p>\n<p>", $htmlContent); | |||
| $textContent = strip_tags($textContent); | |||
| $entry['content'] = [ | |||
| 'html' => $htmlContent, | |||
| 'text' => $textContent | |||
| ]; | |||
| } | |||
| return [ | |||
| 'data' => $entry, | |||
| 'original' => $json | |||
| ]; | |||
| } | |||
| } | |||
| @ -0,0 +1,42 @@ | |||
| <?php | |||
| use Symfony\Component\HttpFoundation\Request; | |||
| use Symfony\Component\HttpFoundation\Response; | |||
| class HackernewsTest extends PHPUnit_Framework_TestCase { | |||
| private $http; | |||
| public function setUp() { | |||
| $this->client = new Parse(); | |||
| $this->client->http = new p3k\HTTP\Test(dirname(__FILE__).'/data/'); | |||
| $this->client->mc = null; | |||
| } | |||
| private function parse($params) { | |||
| $request = new Request($params); | |||
| $response = new Response(); | |||
| return $this->client->parse($request, $response); | |||
| } | |||
| public function testSubmission() { | |||
| $url = 'https://news.ycombinator.com/item?id=14516538'; | |||
| $response = $this->parse(['url' => $url]); | |||
| $body = $response->getContent(); | |||
| $this->assertEquals(200, $response->getStatusCode()); | |||
| $data = json_decode($body, true); | |||
| $this->assertEquals('entry', $data['data']['type']); | |||
| $this->assertEquals('2017-06-08T19:32:12+00:00', $data['data']['published']); | |||
| $this->assertEquals('vkb', $data['data']['author']['name']); | |||
| $this->assertEquals('https://news.ycombinator.com/user?id=vkb', $data['data']['author']['url']); | |||
| $this->assertEquals('What are we doing about Facebook, Google, and the closed internet?', $data['data']['name']); | |||
| $this->assertEquals('There have been many, many posts about how toxic advertising and Facebook are (I\'ve written many myself[1][2][3]) for our internet ecosystem today.<p>What projects or companies are you working on to combat filter bubbles, walled gardens, emotional manipulation, and the like, and how can the HN community help you in your goals?</p><p>[1]http://veekaybee.github.io/facebook-is-collecting-this/ | |||
| [2]http://veekaybee.github.io/content-is-dead/ | |||
| [3] http://veekaybee.github.io/who-is-doing-this-to-my-internet/</p>', $data['data']['content']['html']); | |||
| } | |||
| } | |||
| @ -0,0 +1,11 @@ | |||
| HTTP/1.1 200 OK | |||
| Server: nginx | |||
| Date: Thu, 08 Jun 2017 21:28:24 GMT | |||
| Content-Type: application/json; charset=utf-8 | |||
| Content-Length: 949 | |||
| Connection: keep-alive | |||
| Access-Control-Allow-Origin: * | |||
| Cache-Control: no-cache | |||
| Strict-Transport-Security: max-age=31556926; includeSubDomains; preload | |||
| {"by":"vkb","descendants":51,"id":14516538,"kids":[14516923,14517320,14517322,14517224,14516999,14516850,14517290,14516926,14516808,14517088,14517137,14516981,14516706,14517080,14517055,14516805,14516785,14516890,14517104,14516723,14516853,14517094],"score":84,"text":"There have been many, many posts about how toxic advertising and Facebook are (I've written many myself[1][2][3]) for our internet ecosystem today.<p>What projects or companies are you working on to combat filter bubbles, walled gardens, emotional manipulation, and the like, and how can the HN community help you in your goals?<p>[1]http://veekaybee.github.io/facebook-is-collecting-this/\n[2]http://veekaybee.github.io/content-is-dead/\n[3] http://veekaybee.github.io/who-is-doing-this-to-my-internet/","time":1496950332,"title":"What are we doing about Facebook, Google, and the closed internet?","type":"story"} | |||