Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								a50cd6284b 
								
									
								
							
								 
							
						 
						
							
							
								
								fix whitespace handling for br tags in html  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								c27f228314 
								
									
								
							
								 
							
						 
						
							
							
								
								include in-reply-to URL for tweets  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								c68c7661c8 
								
									
								
							
								 
							
						 
						
							
							
								
								inspect content to determine if a page is atom or rss  
							
							closes  #62  
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								cb1e32278d 
								
									
								
							
								 
							
						 
						
							
							
								
								convert newlines to <br> for html in tweets  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								bf4bc3a668 
								
									
								
							
								 
							
						 
						
							
							
								
								extract photos and videos from streaming tweets when truncated  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								fb2fcec9c6 
								
									
								
							
								 
							
						 
						
							
							
								
								include HTML for tweets with links or user mentions  
							
							also expands parsing to be able to handle twitter JSON from the streaming API which is subtly different from the HTTP API.
closes  #61  
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								584f34e1ed 
								
									
								
							
								 
							
						 
						
							
							
								
								add test from ascraeus.org which was causing an INTL error  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								2cc215d370 
								
									
								
							
								 
							
						 
						
							
							
								
								add .editorconfig to data folder  
							
							tells the editor to save data files with crlf needed for parsing the test http responses 
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								aba067234c 
								
									
								
							
								 
							
						 
						
							
							
								
								add h-x-app vocabulary  
							
							closes  #13  
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								fe65def90f 
								
									
								
							
								 
							
						 
						
							
							
								
								comment out two tests until open mf2 parser issues are resolved  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								2515f618c7 
								
									
								
							
								 
							
						 
						
							
							
								
								include featured image for h-entry  
							
							closes  #51  
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								4d65b1ca1e 
								
									
								
							
								 
							
						 
						
							
							
								
								if removing the img results in empty content, put the name value back  
							
							closes  #57  
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								3ac38f9dbf 
								
									
								
							
								 
							
						 
						
							
							
								
								add simple case of Known markup  
							
							for #57  
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								85c2b9b15f 
								
									
								
							
								 
							
						 
						
							
							
								
								add failing test for `p-content` containing an `u-photo`  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								44770396f9 
								
									
								
							
								 
							
						 
						
							
							
								
								add test to ensure a content property is not returned unless it is defined  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								bdedef6e1e 
								
									
								
							
								 
							
						 
						
							
							
								
								adds a bunch of broken tests for  #52  
							
							
								
							
							
						 
						7 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								a9b1001e62 
								
									
								
							
								 
							
						 
						
							
							
								
								switch to fork of picofeed with authorUrl support  
							
							* adds test of instagram-atom feed with individual authors per item
* dedupes atom/rss title if it's a prefix of the content 
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								7872429f0c 
								
									
								
							
								 
							
						 
						
							
							
								
								prioritize url on the same domain  
							
							if an item has multiple URL values, return the one that is on the same domain 
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								206e27ea25 
								
									
								
							
								 
							
						 
						
							
							
								
								add feed discovery API  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								85b8a35212 
								
									
								
							
								 
							
						 
						
							
							
								
								normalize URLs when comparing  
							
							Treats `https://example.com ` and `https://example.com/ ` as equivalent when comparing URLs. Closes  #33  
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								15743d411d 
								
									
								
							
								 
							
						 
						
							
							
								
								Find author when author is a property of the h-feed  
							
							closes  #32  
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								05f7d9c86c 
								
									
								
							
								 
							
						 
						
							
							
								
								implement h-feed and other microformats feed parsing  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								7b16371418 
								
									
								
							
								 
							
						 
						
							
							
								
								add basic support for JSONFeed  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								e8e63caba6 
								
									
								
							
								 
							
						 
						
							
							
								
								implements parsing Atom and RSS feeds  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								a37ed3bbae 
								
									
								
							
								 
							
						 
						
							
							
								
								update to support multiple photos  
							
							uses the video's poster frame as the photo if any of the multi-post images are videos 
							
						 
						8 years ago  
				
					
						
							
							
								 
						
							
							
							
								
							
								6b286157e3 
								
							
								 
							
						 
						
							
							
								
								based tests on TwitterTest.php  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								 
						
							
							
							
								
							
								67c159ec29 
								
							
								 
							
						 
						
							
							
								
								added tests  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								d50231142a 
								
									
								
							
								 
							
						 
						
							
							
								
								adds support for parsing checkins  
							
							checkin data is returned embedded like author data rather than in the `refs` object
closes  #35  
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								4fab3e9e0a 
								
									
								
							
								 
							
						 
						
							
							
								
								add test for HN comment  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								d0de523746 
								
									
								
							
								 
							
						 
						
							
							
								
								add hackernews support  
							
							closes  #40  
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								330bc9024d 
								
									
								
							
								 
							
						 
						
							
							
								
								fix parsing for hReview  
							
							thanks to the new backcompat in php-mf2 0.3.2 
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								b76d72a77b 
								
									
								
							
								 
							
						 
						
							
							
								
								return issue labels as category  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								f8e9a87667 
								
									
								
							
								 
							
						 
						
							
							
								
								parse github issues and comments  
							
							closes  #20  
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								5f63ed7944 
								
									
								
							
								 
							
						 
						
							
							
								
								updates for instagram scraping  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								63ab3031a3 
								
									
								
							
								 
							
						 
						
							
							
								
								parse XKCD comics  
							
							skip image alt text for now
closes  #34  
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								5f5392a7b8 
								
									
								
							
								 
							
						 
						
							
							
								
								deduplicate categories, and strip leading hashtags  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								a1234f61e3 
								
									
								
							
								 
							
						 
						
							
							
								
								recognize h-card if it's the only object  
							
							closes  #36  
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								4a4bc73f5e 
								
									
								
							
								 
							
						 
						
							
							
								
								don't include the RT'd photo or video in the main entry  
							
							they are part of the reposted object instead.
closes  #27  
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								5e60e13b5a 
								
									
								
							
								 
							
						 
						
							
							
								
								add h-recipe  
							
							closes  #24  
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								5d8fb4e13c 
								
									
								
							
								 
							
						 
						
							
							
								
								support h-review and h-product vocab  
							
							* closes  #23 
* major refactor of the methods for extracting properties to consolidate the logic
* hReview parsing is incomplete due to issues with the php-mf2 backcompat parsing. see https://github.com/indieweb/php-mf2/issues/107  
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								88a2c7f5bf 
								
									
								
							
								 
							
						 
						
							
							
								
								add test for syndication property  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								7d781c3129 
								
									
								
							
								 
							
						 
						
							
							
								
								match `http-equiv=Status` in addition to `status`  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								227311faa9 
								
									
								
							
								 
							
						 
						
							
							
								
								check for meta-equiv HTTP deleted  
							
							closes  #16  
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								bc74919ade 
								
									
								
							
								 
							
						 
						
							
							
								
								return status code and final URL in response  
							
							* closes  #14 
* updated readme with details of the response
* includes `url` and `code` in the response with the final URL after following redirects and the HTTP status code returned 
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
							
								
							
								876d4696fb 
								
							
								 
							
						 
						
							
							
								
								catch non-expanded profile URLs  
							
							apparently some people's profile URLs don't get t.co'd 
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
							
								
							
								041cc92a8b 
								
							
								 
							
						 
						
							
							
								
								add test file  
							
							:headdesk: 
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
							
								
							
								0beac036b9 
								
							
								 
							
						 
						
							
							
								
								add twitter support  
							
							closes  #18  
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
							
								
							
								773252559d 
								
							
								 
							
						 
						
							
							
								
								parse instagram photos and videos  
							
							
								
							
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								3bdafad98e 
								
									
								
							
								 
							
						 
						
							
							
								
								parse URLs with fragment IDs  
							
							If the input URL contains a fragment, finds the DOM tree at that ID and runs the subtree through the mf2 parser.
closes  #15  
							
						 
						8 years ago  
				
					
						
							
							
								
									
								
								Aaron Parecki 
							
						 
						
							
							
								
								
							
							
								
							
								c59ab9a2d6 
								
									
								
							
								 
							
						 
						
							
							
								
								also check img/video/audio for target URL  
							
							
								
							
							
						 
						9 years ago