The data herein was collected and processed using Stweeler (https://github.com/zafargilani/stcs). The data is the property of Twitter, but since it has been processed and aggregated, it can be used for further research.

The data format of the files is as follows:
./bots or ./humans -> screen_name, user_tweeted, user_retweeted, user_favourited, user_replied, likes_per_tweet, retweets_per_tweet, lists_per_user, follower_friend_ratio, tweet_frequency, favourite_tweet_ratio, age_of_account_in_days, sources_count, urls_count, cdn_content_in_kb, source_identity

-- // --

Please cite the following if you use these datasets:

Stweeler framework paper (WWW '16 Companion), describing the tool used to collect and process this data:

@inproceedings{Gilani:2016:SFT:2872518.2889360,
 author = {Gilani, Zafar and Wang, Liang and Crowcroft, Jon and Almeida, Mario and Farahbakhsh, Reza},
 title = {{Stweeler}: A Framework for {Twitter} Bot Analysis},
 booktitle = {Proceedings of the 25th International Conference Companion on World Wide Web},
 series = {WWW '16 Companion},
 year = {2016},
 isbn = {978-1-4503-4144-8},
 location = {Montr{\'e}al, Qu{\'e}bec, Canada},
 pages = {37--38},
 numpages = {2},
 url = {https://doi.org/10.1145/2872518.2889360},
 doi = {10.1145/2872518.2889360},
 acmid = {2889360},
 publisher = {International World Wide Web Conferences Steering Committee},
 address = {Republic and Canton of Geneva, Switzerland},
 keywords = {bot analyser, content analysis, information dissemination},
}

Account classification paper (ASONAM '17):

@inproceedings{Gilani:2017:CTA:3110025.3110091,
 author = {Gilani, Zafar and Kochmar, Ekaterina and Crowcroft, Jon},
 title = {Classification of {Twitter} Accounts into Automated Agents and Human Users},
 booktitle = {Proceedings of the 2017 {IEEE/ACM} International Conference on Advances in Social Networks Analysis and Mining 2017},
 series = {ASONAM '17},
 year = {2017},
 isbn = {978-1-4503-4993-2},
 location = {Sydney, Australia},
 pages = {489--496},
 numpages = {8},
 url = {https://doi.org/10.1145/3110025.3110091},
 doi = {10.1145/3110025.3110091},
 acmid = {3110091},
 publisher = {ACM},
 address = {New York, NY, USA},
 keywords = {account classification, automated agents, bot detection, social network analysis},
}

