mirror of
https://github.com/not-kennethreitz/convore.json.git
synced 2026-06-21 15:40:58 +00:00
1 line
3.2 KiB
JSON
1 line
3.2 KiB
JSON
[{"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802384.94859, "message": "What's acceptable and unacceptable in your methods", "group_id": 11162, "id": 1914281}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802474.5716021, "message": "APIs are useful", "group_id": 11162, "id": 1914292}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802607.663029, "message": "Remember that there is probably a dude with a pager on the other end of the website who will get woken up if you break the site", "group_id": 11162, "id": 1914303}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802356.686084, "message": "Issue: Need to get info from a website", "group_id": 11162, "id": 1914280}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802736.358422, "message": "wget useful options: -m, -nc, -wX, -np", "group_id": 11162, "id": 1914310}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802883.2530191, "message": "Also, Perl, Python, and Ruby all have very friendly libs for scraping", "group_id": 11162, "id": 1914319}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313803286.0044341, "message": "Use NoSQL if your data doesn't fit nicely into tables", "group_id": 11162, "id": 1914340}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313803079.8727679, "message": "Beautiful Soup handles dirty data very very gracefully", "group_id": 11162, "id": 1914330}, {"user_id": 39099, "stars": [{"date_created": 1313814103.184592, "user_id": 39817}], "topic_id": 44144, "date_created": 1313803225.7008021, "message": "Nate O. says that \"SQL should be taught in 3rd grade\"", "group_id": 11162, "id": 1914337}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802709.417645, "message": "wget - your data hoover", "group_id": 11162, "id": 1914308}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802448.3758171, "message": "HTML is often really ugly for scraping purposes", "group_id": 11162, "id": 1914287}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802540.625757, "message": "Be nice - use a one hit per second slow crawl, off peak hours", "group_id": 11162, "id": 1914297}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802550.7016611, "message": "May need to get permission", "group_id": 11162, "id": 1914299}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313802459.098186, "message": "Look for alternatives to scraping", "group_id": 11162, "id": 1914290}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313803017.1356771, "message": "Although very powerful, regex isn't always the best solution", "group_id": 11162, "id": 1914327}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313803107.395292, "message": "http://www.crummy.com/software/BeautifulSoup/", "group_id": 11162, "id": 1914333}, {"user_id": 39099, "stars": [], "topic_id": 44144, "date_created": 1313803451.6055191, "message": "Hurdles: Logging into site, https, javascript data fetcthing, inconsistent data, truncations, spam, lots of sources", "group_id": 11162, "id": 1914347}]