mirror of
https://github.com/not-kennethreitz/convore.json.git
synced 2026-06-05 23:20:19 +00:00
1 line
11 KiB
JSON
1 line
11 KiB
JSON
[{"user_id": 41191, "stars": [], "topic_id": 45475, "date_created": 1316367456.0966251, "message": "hey ultra: what's the rest of the curl url?", "group_id": 2328, "id": 2157614}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367703.560771, "message": "K-Nearest Neighbors -- good for image data", "group_id": 2328, "id": 2157648}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364189.8670051, "message": "66.246.75.131\n", "group_id": 2328, "id": 2157249}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364426.9487021, "message": "\u201cHow can we build computer systems that automatically improve with experience, and what are the fundamental laws that govern all learning processes?\u201d -- Tom Mitchell, CMU", "group_id": 2328, "id": 2157299}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364880.578048, "message": "Google Prediction API: http://code.google.com/apis/predict/", "group_id": 2328, "id": 2157352}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316363525.8462601, "message": "This topic is for the Machine Learning workshop and hack session at the conference.", "group_id": 2328, "id": 2157193}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365400.3846691, "message": "supervised and unsupervised learning aren't in opposition, they are often used together", "group_id": 2328, "id": 2157427}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364211.3363211, "message": "strangeloop1 / strangeloop1r0x -- only 5 accts, pls only use if you need it", "group_id": 2328, "id": 2157255}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364421.5720739, "message": "Definition of machine learning as algorithms that improve with data", "group_id": 2328, "id": 2157298}, {"user_id": 41182, "stars": [{"date_created": 1316435333.092849, "user_id": 41102}], "topic_id": 45475, "date_created": 1316365195.638684, "message": "You\u2019ll need a machine with:\n\nPython (2.5, 2.6 or 2.7)\nNLTK\nnumpy\nPycluster\nhcluster\nmatplotlib\nJSONView (Chrome extension)*\n", "group_id": 2328, "id": 2157405}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364180.871218, "message": "for folks in the workshop who need it", "group_id": 2328, "id": 2157248}, {"user_id": 41102, "stars": [], "topic_id": 45475, "date_created": 1316364260.3119199, "message": "Do you Telnet in or.... ? Thx", "group_id": 2328, "id": 2157262}, {"user_id": 41182, "stars": [{"date_created": 1316435353.7870531, "user_id": 41102}], "topic_id": 45475, "date_created": 1316364248.1941259, "message": "code for the workshop is here: http://bit.ly/pkn6W9", "group_id": 2328, "id": 2157261}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364278.7322719, "message": "I think ssh...", "group_id": 2328, "id": 2157264}, {"user_id": 41188, "stars": [], "topic_id": 45475, "date_created": 1316365241.9252779, "message": "Thank you @ultrasaurus", "group_id": 2328, "id": 2157410}, {"user_id": 41188, "stars": [], "topic_id": 45475, "date_created": 1316364937.9467781, "message": "Where can I download the presentation?", "group_id": 2328, "id": 2157361}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365615.6506801, "message": "Data Source Handbook by Pete Warden", "group_id": 2328, "id": 2157452}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316364978.822233, "message": "it's not posted. During the break, we can ask Hilary if she's is open to publishing it", "group_id": 2328, "id": 2157368}, {"user_id": 41182, "stars": [{"date_created": 1316435467.0648079, "user_id": 41102}], "topic_id": 45475, "date_created": 1316366150.962903, "message": "probability of B given A: p( B | A ) = p( A | B ) * p(B) / p(A)", "group_id": 2328, "id": 2157503}, {"user_id": 41182, "stars": [{"date_created": 1316435374.0613959, "user_id": 41102}], "topic_id": 45475, "date_created": 1316365151.635705, "message": "Taxonomy of Data Science http://bit.ly/9RYQEF -- article is slightly outdated, but model is still valid", "group_id": 2328, "id": 2157397}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365154.4596679, "message": "OSEMN (pronounced \"awesome!\") Obtain, Scrub, Explore, Model, iNterpret", "group_id": 2328, "id": 2157398}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365156.848026, "message": "here are some notes on the stuff you need installed: https://github.com/ultrasaurus/ml_class/blob/master/README.md", "group_id": 2328, "id": 2157399}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365867.3766861, "message": "curl \"http://api.nytimes.com/svc/search/v1/article?query=jazz&api-key= ... \"", "group_id": 2328, "id": 2157470}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365315.4816239, "message": "\"Classification is the assignment of a label to an unlabeled input based on previously seen data.\"", "group_id": 2328, "id": 2157420}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365561.006284, "message": "fun datasets to play with... \nhttp://www.delicious.com/pskomoroch/dataset", "group_id": 2328, "id": 2157443}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365562.566617, "message": "http://bit.ly/f2cX4h", "group_id": 2328, "id": 2157444}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316365659.2417459, "message": "Register for an API key at http://developer.nytimes.com/apps/register and select \"Article Search API\"", "group_id": 2328, "id": 2157458}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367119.8065319, "message": "python nytimes_pull.py -> creates two files \"arts\" and \"sports\"", "group_id": 2328, "id": 2157584}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367120.9245901, "message": "python classify.py -> prints probabilities", "group_id": 2328, "id": 2157586}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367125.70259, "message": "nltk has a really nice sentence tokenizer (seems like it would be an easy problem for English, but becomes tough when the sentence has Dr. or Mrs. or 3.5)", "group_id": 2328, "id": 2157587}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367519.5551021, "message": "Porter Stemming Algorithm: M.F. Porter, 1980, http://tartarus.org/~martin/PorterStemmer/def.txt", "group_id": 2328, "id": 2157622}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367582.2411959, "message": "WordNet has synonyms which helps expand your set of \"features\" for a data set", "group_id": 2328, "id": 2157633}, {"user_id": 29799, "stars": [], "topic_id": 45475, "date_created": 1316367616.5727961, "message": ">>> word_tokenize(\"Hello there. Nice to meet you.\")\n['Hello', 'there.', 'Nice', 'to', 'meet', 'you', '.']", "group_id": 2328, "id": 2157638}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367781.85888, "message": "uses a metaphor for distance", "group_id": 2328, "id": 2157659}, {"user_id": 29799, "stars": [], "topic_id": 45475, "date_created": 1316367639.8155279, "message": "anybody know nltk? why would periods not get split out (first period in example above).", "group_id": 2328, "id": 2157642}, {"user_id": 41182, "stars": [{"date_created": 1316435435.4428041, "user_id": 41102}], "topic_id": 45475, "date_created": 1316367546.6743619, "message": "WordNet models how words are related to each other in sentences: http://wordnet.princeton.edu/", "group_id": 2328, "id": 2157627}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316367621.1925571, "message": "hack for getting clean text of a webpage: lynx \u2013dump [url]", "group_id": 2328, "id": 2157641}, {"user_id": 41182, "stars": [{"date_created": 1316435423.540252, "user_id": 41102}], "topic_id": 45475, "date_created": 1316367914.838084, "message": "SciPy: http://docs.scipy.org/doc/scipy/reference/spatial.html", "group_id": 2328, "id": 2157674}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316370953.2960801, "message": "using pycluster and numpy", "group_id": 2328, "id": 2158071}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316370917.365181, "message": "K-means\n1. Decide on number of clusters\n2. Randomly place centroids\n3. Iterate until clusters are formed\n4. Iterate until convergence", "group_id": 2328, "id": 2158068}, {"user_id": 29799, "stars": [], "topic_id": 45475, "date_created": 1316369847.33266, "message": "answer to my own question above from the nltk docs: \"This tokenizer should be fed a single sentence at a time\"", "group_id": 2328, "id": 2157932}, {"user_id": 41182, "stars": [], "topic_id": 45475, "date_created": 1316370964.443418, "message": "download pycluster from here: http://bonsai.hgc.jp/~mdehoon/software/cluster/software.htm#pycluster", "group_id": 2328, "id": 2158072}, {"user_id": 41182, "stars": [{"date_created": 1316435389.4486179, "user_id": 41102}], "topic_id": 45475, "date_created": 1316372767.0915489, "message": "hcluster: http://code.google.com/p/scipy-cluster/", "group_id": 2328, "id": 2158259}, {"user_id": 41186, "stars": [{"date_created": 1316435384.2278531, "user_id": 41102}], "topic_id": 45475, "date_created": 1316374327.9824259, "message": "Stanford\u2019s Free Classes on AI, Machine Learning, and Databases.... http://active.tutsplus.com/articles/news/stanford%E2%80%99s-free-classes-on-ai-machine-learning-and-databases/", "group_id": 2328, "id": 2158381}, {"user_id": 1247, "stars": [{"date_created": 1316435393.1493499, "user_id": 41102}], "topic_id": 45475, "date_created": 1316373606.453017, "message": "Global Arrays: http://www.emsl.pnl.gov/docs/global/", "group_id": 2328, "id": 2158335}, {"user_id": 40528, "stars": [{"date_created": 1316435386.2097471, "user_id": 41102}], "topic_id": 45475, "date_created": 1316374161.7652309, "message": "http://ml-class.com/ - standford machine learning class", "group_id": 2328, "id": 2158367}, {"user_id": 3531, "stars": [{"date_created": 1316435319.695925, "user_id": 41102}], "topic_id": 45475, "date_created": 1316404237.6933081, "message": "Here are some other resources she mentioned:\n\n* Book: Programming Collective Intelligence by Toby Segaran (O'Reilly)\n* Book: Pattern Recognition and Machine Learning by Christopher Bishop\n* Book: Machine Learning by Tom Mitchell\n* Blog: Dataists: http://dataists.com/", "group_id": 2328, "id": 2161294}, {"user_id": 3531, "stars": [{"date_created": 1316435323.9517801, "user_id": 41102}], "topic_id": 45475, "date_created": 1316404835.053328, "message": "Also found earlier in my notes, some places for data:\n\n* Book: Data Source Handbook by Pete Warden (O'Reilly, http://oreilly.com/catalog/0636920018254)\n* Hilary's bundle of research-quality data sets: http://bit.ly/f2cX4h", "group_id": 2328, "id": 2161349}] |