DEVELOPMENT... { "data_id": "43507", "name": "The-Tweets-of-Wisdom", "exact_name": "The-Tweets-of-Wisdom", "version": 1, "version_label": "v1.0", "description": "Context\nIn the last few years, Twitter became one of the most popular social media platforms. From celebrity status to government policies, Twitter can accommodate a diverse range of people and thoughts. In these diverse set of thoughts, there are many Twitter accounts who tweet \"self-help\" thoughts often. These so-called \"wise\" thoughts are often related to improving one's life and how to excel at what you're doing. So I went down to the rabbit-hole to search these sorts of tweets. I find many common themes between them. Therefore, I decided to scrap the tweets so that you can explore the words of these \"self-help\" tweets and understand them much better. \nContent\nI scraped the data using Tweepy API. I have scraped all the tweets, retweets and retweets with a comment of 40 authors. The data contains more than 40 authors because every retweet from any of the 40 authors is stored as a tweet from the original author. Also, every retweet with a comment contains and tags. The author's comment is followed by tag and then the content of the retweet comes which is followed by . The script I used for scrapping can be found here.\nAcknowledgements\nI would like to thanks Stack Overflow which helped me at literally every stage of this project from scrapping to data analysis. Also kudos to the Tweepy API which made it far more easier to fetch tweets. \nInspiration\nI downloaded this dataset for many reasons. The most important one is that I want to know how similar these tweets are. Also, I like to know what makes some tweets viral and what factors affect a viral tweet. I explore these and many more questions in my kernel which you can find in the kernel section. \nContact Me", "format": "arff", "uploader": " Lowe", "uploader_id": 30126, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 13:31:21", "update_comment": null, "last_update": "2022-03-23 13:31:21", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102332\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": "\"handle\"", "runs": 0, "suggest": { "input": [ "The-Tweets-of-Wisdom", "Context In the last few years, Twitter became one of the most popular social media platforms. From celebrity status to government policies, Twitter can accommodate a diverse range of people and thoughts. In these diverse set of thoughts, there are many Twitter accounts who tweet \"self-help\" thoughts often. These so-called \"wise\" thoughts are often related to improving one's life and how to excel at what you're doing. So I went down to the rabbit-hole to search these sorts of tweets. I find many " ], "weight": 5 }, "qualities": { "NumberOfInstances": 31115, "NumberOfFeatures": 5, "NumberOfClasses": null, "NumberOfMissingValues": 456, "NumberOfInstancesWithMissingValues": 456, "NumberOfNumericFeatures": 2, "NumberOfSymbolicFeatures": 0, "PercentageOfSymbolicFeatures": 0, "AutoCorrelation": null, "PercentageOfNumericFeatures": 40, "PercentageOfMissingValues": 0.293106218865499, "PercentageOfInstancesWithMissingValues": 1.4655310943274946, "PercentageOfBinaryFeatures": 0, "NumberOfBinaryFeatures": 0, "MinorityClassSize": null, "MinorityClassPercentage": null, "MajorityClassSize": null, "MajorityClassPercentage": null, "Dimensionality": 0.0001606941989394183 }, "tags": [], "features": [ { "name": "author_name", "index": "0", "type": "string", "distinct": "2733", "missing": "92" }, { "name": "created_at", "index": "1", "type": "string", "distinct": "30997", "missing": "0" }, { "name": "handle", "index": "2", "type": "string", "distinct": "2804", "missing": "0", "ignore": "1" }, { "name": "likes", "index": "3", "type": "numeric", "distinct": "3554", "missing": "0", "min": "0", "max": "1352225", "mean": "1045", "stdev": "12215" }, { "name": "retweets", "index": "4", "type": "numeric", "distinct": "2216", "missing": "0", "min": "0", "max": "424270", "mean": "342", "stdev": "3887" }, { "name": "tweet_content", "index": "5", "type": "string", "distinct": "29488", "missing": "364" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }