Python Fundamentos Para Análise de Dados - Data Science Academy

Victor Hugo Negrisoli

Manipulando Bancos de Dados NoSQL MongoDB com Python

In [2]:
from pymongo import MongoClient
In [3]:
# Open a client for the MongoDB server on localhost, port 27017.
conn = MongoClient(host='localhost', port=27017)
In [4]:
# Select the "cadastrodb" database on the open connection.
db = conn["cadastrodb"]
In [6]:
type(conn)
Out[6]:
pymongo.mongo_client.MongoClient
In [9]:
# Handle to a collection that shares the database's name ("cadastrodb");
# the bare name on the last line displays its repr.
collection = db["cadastrodb"]
collection
Out[9]:
Collection(Database(MongoClient(host=['localhost:27017'], document_class=dict, tz_aware=False, connect=True), 'cadastrodb'), 'cadastrodb')
In [10]:
import datetime
In [11]:
# First product document. The registration timestamp is a timezone-aware UTC
# datetime: datetime.utcnow() is deprecated and returns a naive value.
post1 = {
    "codigo": "19818",
    "prod_nome": "Livro",
    "marcas": ["Panini", "DC", "Marvel"],
    "data_cadastro": datetime.datetime.now(datetime.timezone.utc),
}
In [13]:
type(post1)
Out[13]:
dict
In [14]:
# Rebind `collection` to the "posts" collection used by the cells below.
collection = db["posts"]
In [15]:
# Despite its name, post_id holds the InsertOneResult returned by insert_one,
# not the id itself; the generated id is available as post_id.inserted_id.
post_id = collection.insert_one(post1)
In [16]:
post_id
Out[16]:
<pymongo.results.InsertOneResult at 0x1ba6820f388>
In [17]:
collection.find_one({"prod_nome": "Livro"})
Out[17]:
{'_id': ObjectId('5e1ceddb6be78d8673599d03'),
 'codigo': '19818',
 'prod_nome': 'Livro',
 'marcas': ['Panini', 'DC', 'Marvel'],
 'data_cadastro': datetime.datetime(2020, 1, 13, 22, 22, 45, 707000)}
In [19]:
# Second product document, stamped with a timezone-aware UTC datetime
# (datetime.utcnow() is deprecated and returns a naive value), then stored.
post2 = {
    "codigo": "196516",
    "prod_nome": "Quadrinhos",
    "marcas": ["Vertigo", "Marvel"],
    "data_cadastro": datetime.datetime.now(datetime.timezone.utc),
}
collection.insert_one(post2)
Out[19]:
<pymongo.results.InsertOneResult at 0x1ba6a54e4c8>
In [20]:
# Print every document currently stored in the collection.
for documento in collection.find():
    print(documento)
{'_id': ObjectId('5e1ceddb6be78d8673599d03'), 'codigo': '19818', 'prod_nome': 'Livro', 'marcas': ['Panini', 'DC', 'Marvel'], 'data_cadastro': datetime.datetime(2020, 1, 13, 22, 22, 45, 707000)}
{'_id': ObjectId('5e1ceeb66be78d8673599d04'), 'codigo': '196516', 'prod_nome': 'Quadrinhos', 'marcas': ['Vertigo', 'Marvel'], 'data_cadastro': datetime.datetime(2020, 1, 13, 22, 27, 2, 950000)}
In [22]:
db.name
Out[22]:
'cadastrodb'
In [25]:
db.list_collection_names()
Out[25]:
['posts']
In [26]:
import pymongo
In [27]:
client_con = pymongo.MongoClient()
In [29]:
client_con.list_database_names()
Out[29]:
['admin', 'cadastrodb', 'config', 'local']
In [30]:
# Create the collection only when it is missing so this cell can be re-run:
# create_collection raises CollectionInvalid if the name already exists.
if "mycollection" not in db.list_collection_names():
    db.create_collection("mycollection")
In [36]:
# NOTE: every run of this cell inserts another copy of the same document; the
# listing printed further down shows two identical entries that differ only
# in their _id.
db.mycollection.insert_one({"titulo":"Superman O Legado das Estrelas", 
                            "descricao":"Clássico", 
                            "editora": ["Panini", "DC Comics"]})
Out[36]:
<pymongo.results.InsertOneResult at 0x1ba6c530748>
In [37]:
db.mycollection.find_one()
Out[37]:
{'_id': ObjectId('5e1cf0026be78d8673599d06'),
 'titulo': 'Superman O Legado das Estrelas',
 'descricao': 'Clássico',
 'editora': ['Panini', 'DC Comics']}
In [38]:
# Walk the whole "mycollection" collection and print each stored document.
dados = db["mycollection"]
for documento in dados.find():
    print(documento)
{'_id': ObjectId('5e1cf0026be78d8673599d06'), 'titulo': 'Superman O Legado das Estrelas', 'descricao': 'Clássico', 'editora': ['Panini', 'DC Comics']}
{'_id': ObjectId('5e1cf0556be78d8673599d07'), 'titulo': 'Superman O Legado das Estrelas', 'descricao': 'Clássico', 'editora': ['Panini', 'DC Comics']}
In [40]:
# Reach the same collection through attribute access and display its
# estimated document count.
colecao = db.mycollection
colecao.estimated_document_count()
Out[40]:
2

Projeto - Extração / Stream de Dados com API do Twitter

01 - Criando conexão de autenticação OAuth com a API do Twitter

In [234]:
from tweepy.streaming import StreamListener
from tweepy import OAuthHandler
from tweepy import Stream
from datetime import datetime
import json
In [235]:
import os
import warnings

# SECURITY: these credentials used to be hardcoded in this cell. Secrets that
# were committed to a notebook must be treated as leaked: revoke them and
# supply the replacements through environment variables instead.
consumer_key = os.environ.get("TWITTER_CONSUMER_KEY", "")
consumer_secret = os.environ.get("TWITTER_CONSUMER_SECRET", "")
access_token = os.environ.get("TWITTER_ACCESS_TOKEN", "")
access_secret = os.environ.get("TWITTER_ACCESS_SECRET", "")

# Surface unset variables here rather than as an authentication failure later.
_missing_credentials = [
    env_name
    for env_name, value in (
        ("TWITTER_CONSUMER_KEY", consumer_key),
        ("TWITTER_CONSUMER_SECRET", consumer_secret),
        ("TWITTER_ACCESS_TOKEN", access_token),
        ("TWITTER_ACCESS_SECRET", access_secret),
    )
    if not value
]
if _missing_credentials:
    warnings.warn(
        "Twitter credentials not set in the environment: "
        + ", ".join(_missing_credentials)
    )
In [249]:
auth = OAuthHandler(consumer_key, consumer_secret)
In [250]:
auth.set_access_token(access_token, access_secret)
In [251]:
class MyListener(StreamListener):
    """Stream listener that stores a trimmed copy of each tweet in MongoDB."""

    def on_data(self, dados):
        """Persist one raw stream message and echo what was stored.

        Args:
            dados: JSON text of a single message delivered by the stream.

        Returns:
            True in every case, so a skipped message never stops the stream.
        """
        tweet = json.loads(dados)
        campos = ("created_at", "id_str", "text")
        # Messages that are not tweets (e.g. limit or delete notices) lack
        # these fields; skip them instead of raising KeyError mid-stream.
        if not isinstance(tweet, dict) or any(campo not in tweet for campo in campos):
            return True
        obj = {campo: tweet[campo] for campo in campos}
        # insert_one adds the generated "_id" to obj in place, which is why
        # the printed dict also shows it. `colecao` is the module-level
        # collection, looked up when the message arrives.
        colecao.insert_one(obj)
        print(obj)
        return True
In [252]:
mylistener = MyListener()
In [260]:
# Bind the authenticated session to the listener that handles each message.
mystream = Stream(auth=auth, listener=mylistener)

02 - Definindo o banco de dados com o MongoDB para armazenar os Tweets

In [241]:
from pymongo import MongoClient
In [242]:
# Client created with no arguments, so pymongo's default host and port apply.
client = MongoClient()
In [243]:
# NOTE: rebinds `db`, which earlier in the notebook pointed at "cadastrodb".
db = client["twitterdb"]
In [244]:
# Collection that MyListener.on_data writes to; rebinds the earlier `colecao`.
colecao = db["tweets"]
In [261]:
# Keywords passed to the stream filter as the `track` list.
palavras_chave = [
    "Data Science",
    "Java",
    "Javascript",
    "Spring Boot",
    "Nodejs",
    "Node.js",
    "ReactJs",
    "Programming",
    "Data Analysis",
    "Análise de Dados",
    "Big Data",
    "Business Intelligence",
]

03 - Criando a stream com o Twitter usando como track a lista de palavras-chave

In [262]:
# Start streaming tweets that match the keyword list; each stored tweet is
# printed by MyListener.on_data.
# NOTE(review): this call appears to keep running until it is interrupted;
# confirm, and stop it with a kernel interrupt once enough tweets are stored.
mystream.filter(track=palavras_chave)
{'created_at': 'Tue Jan 14 00:16:33 +0000 2020', 'id_str': '1216876719631556608', 'text': 'RT @CatalogueBack: We interrupt our regular programming of pop culture and anime discussion posts to bring you @Cancelathon something fun I…', '_id': ObjectId('5e1d08656be78d8673599e23')}
{'created_at': 'Tue Jan 14 00:16:35 +0000 2020', 'id_str': '1216876728389292032', 'text': 'RT @NomadXrp: ⏰  PRICE UPDATE  🚀 \n\n⭐️ $XRP $ 0.2132\n24h -0.56% 📉\n\n⭐️ $BTC $ 8128.82\n24h -0.60% 📉\n\n⭐️ $ETH $ 143.88\n24h -1.67% 📉\n\n$xrp #thes…', '_id': ObjectId('5e1d08676be78d8673599e24')}
{'created_at': 'Tue Jan 14 00:16:36 +0000 2020', 'id_str': '1216876733929938944', 'text': 'BIG KETS ARE STILL KETS 😻😻😻😻', '_id': ObjectId('5e1d08686be78d8673599e25')}
{'created_at': 'Tue Jan 14 00:16:38 +0000 2020', 'id_str': '1216876741496582144', 'text': '[Cheat Sheet] Python Basics For Data Science https://t.co/LuZxXxs1dK', '_id': ObjectId('5e1d086a6be78d8673599e26')}
{'created_at': 'Tue Jan 14 00:16:39 +0000 2020', 'id_str': '1216876745992871936', 'text': 'RT @Justin_Stolpe: Happy Monday! Learning about the Instagram Graph API this week! What are you learning about?\n.\n.\n#instagram #instagramap…', '_id': ObjectId('5e1d086b6be78d8673599e27')}
{'created_at': 'Tue Jan 14 00:16:39 +0000 2020', 'id_str': '1216876748182257664', 'text': 'RT @davarcar1: @Jhonitrejos @JorgeIvanOspina @lunadavid @kevingomezpaz @SergioMZamoraB @lftroyano Para que sea ciudad inteligente de pasar…', '_id': ObjectId('5e1d086c6be78d8673599e28')}
{'created_at': 'Tue Jan 14 00:16:47 +0000 2020', 'id_str': '1216876781480878080', 'text': '"They are typically very experienced, having worked on many different projects under a wide variety of circumstance… https://t.co/mWRTfNnRmX', '_id': ObjectId('5e1d08746be78d8673599e29')}
{'created_at': 'Tue Jan 14 00:16:51 +0000 2020', 'id_str': '1216876795745751041', 'text': '@iceagereentry @rcsteeb Don’t worry, all is well. 😉 https://t.co/5jxh8gXtTk', '_id': ObjectId('5e1d08776be78d8673599e2a')}
{'created_at': 'Tue Jan 14 00:16:51 +0000 2020', 'id_str': '1216876798199451648', 'text': 'It "amazes" ME how an "influencer"  like @MarkDice hasn\'t TOUCHED UPON the "blatant" SYMBOLISM being shown on… https://t.co/WhB32QifGF', '_id': ObjectId('5e1d08786be78d8673599e2b')}
{'created_at': 'Tue Jan 14 00:16:54 +0000 2020', 'id_str': '1216876808173432832', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…', '_id': ObjectId('5e1d087a6be78d8673599e2c')}
{'created_at': 'Tue Jan 14 00:16:55 +0000 2020', 'id_str': '1216876811906207745', 'text': 'RT @HawkinsTammy: Know #javascript and looking for a new gig in #California? #Blizzard Entertainment is looking for an Associate Software W…', '_id': ObjectId('5e1d087b6be78d8673599e2d')}
{'created_at': 'Tue Jan 14 00:16:55 +0000 2020', 'id_str': '1216876814187909124', 'text': 'Coffee and code. NodeJs tutorial. Then I will do some ReactJs tutorials.\n\nChristmas cat mug FTW! https://t.co/8ATWXMVAqV', '_id': ObjectId('5e1d087c6be78d8673599e2e')}
{'created_at': 'Tue Jan 14 00:17:00 +0000 2020', 'id_str': '1216876836195618817', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…', '_id': ObjectId('5e1d08816be78d8673599e2f')}
{'created_at': 'Tue Jan 14 00:17:01 +0000 2020', 'id_str': '1216876837185511424', 'text': "📚 Wiley's Professional JavaScript for Web Developers is an essential guide to next-level ES6 and ES7 JavaScript dev… https://t.co/uyZB7AJ0en", '_id': ObjectId('5e1d08816be78d8673599e30')}
{'created_at': 'Tue Jan 14 00:17:05 +0000 2020', 'id_str': '1216876855405490176', 'text': 'With a few commands I can upgrade: sysinternals notepadplusplus googlechrome 7zip firefox SQLSentryPlanExplorer  vi… https://t.co/JkfFZEZPyB', '_id': ObjectId('5e1d08856be78d8673599e31')}
{'created_at': 'Tue Jan 14 00:17:07 +0000 2020', 'id_str': '1216876864192569345', 'text': 'New #job: Senior Fullstack Dev - JAVA and API Location: Wellington Central .. https://t.co/R8zY2oD9w6 #jobs #hiring', '_id': ObjectId('5e1d08876be78d8673599e32')}
{'created_at': 'Tue Jan 14 00:17:08 +0000 2020', 'id_str': '1216876866948255745', 'text': 'Feature request: add `base16` default themes, the next evolution of `Tomorrow` themes https://t.co/e99xcYh1aL… https://t.co/ShFLk4a0mj', '_id': ObjectId('5e1d08886be78d8673599e33')}
{'created_at': 'Tue Jan 14 00:17:11 +0000 2020', 'id_str': '1216876880080637953', 'text': 'insert baby yoda picture with caption \n\n“big kitties”', '_id': ObjectId('5e1d088b6be78d8673599e34')}
{'created_at': 'Tue Jan 14 00:17:14 +0000 2020', 'id_str': '1216876894664232961', 'text': 'RT @IsTheArchitect: Why #Python is better than #R for #DataScience careers.\n\nhttps://t.co/cyTiSBpV4P\n#dataengineering #bigdata', '_id': ObjectId('5e1d088f6be78d8673599e35')}
{'created_at': 'Tue Jan 14 00:17:17 +0000 2020', 'id_str': '1216876905573634054', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…', '_id': ObjectId('5e1d08916be78d8673599e36')}
{'created_at': 'Tue Jan 14 00:17:20 +0000 2020', 'id_str': '1216876917439238144', 'text': 'RT @Brilliance100: We handle:\n\nStatistics online classes\nPrecalculus\nAlgebra\nTrigonometry\nLinear programming\nMeasurements\nData analysis\nSPS…', '_id': ObjectId('5e1d08946be78d8673599e37')}
{'created_at': 'Tue Jan 14 00:17:21 +0000 2020', 'id_str': '1216876924657717248', 'text': 'RT @AlRokerEnt: "We are proud to debut this African American focused channel, created by and for the members of the black community." - Jam…', '_id': ObjectId('5e1d08966be78d8673599e38')}
{'created_at': 'Tue Jan 14 00:17:22 +0000 2020', 'id_str': '1216876926750613505', 'text': 'RT @nep_developer: Day: 08 of #100DaysOfCode \n-Pause the Tracker App(for a week)\n-Started a new project Planner that used firebase,\n\n------…', '_id': ObjectId('5e1d08966be78d8673599e39')}
{'created_at': 'Tue Jan 14 00:17:23 +0000 2020', 'id_str': '1216876930668036097', 'text': "RT @shog9: Well... I suddenly find myself in need of work. \nIf anyone's hiring: C++, JavaScript, C#, SQL + solid background in social softw…", '_id': ObjectId('5e1d08976be78d8673599e3a')}
{'created_at': 'Tue Jan 14 00:17:25 +0000 2020', 'id_str': '1216876940537126912', 'text': 'RT @brunoborges: For all maintainers of #Java frameworks and libraries, ping @ashleymcnamara and share your story.\n\n// @jtgreene @phillip_w…', '_id': ObjectId('5e1d089a6be78d8673599e3b')}
{'created_at': 'Tue Jan 14 00:17:28 +0000 2020', 'id_str': '1216876949949308928', 'text': '¡El último Cience, Technology &amp; Programming  Daily! https://t.co/LTH701EPUt Gracias a @CTcard44 @schoolprobIems… https://t.co/CVFHa0My36', '_id': ObjectId('5e1d089c6be78d8673599e3c')}
{'created_at': 'Tue Jan 14 00:17:29 +0000 2020', 'id_str': '1216876954869256195', 'text': 'New #job: Business Intelligence Analyst Location: Las Vegas .. https://t.co/jXAS0kPEL6 #jobs #hiring', '_id': ObjectId('5e1d089d6be78d8673599e3d')}
{'created_at': 'Tue Jan 14 00:17:32 +0000 2020', 'id_str': '1216876967628353536', 'text': 'RT @DD_FaFa_: Data Science from Scratch: Comprehensive guide with essential principles of Data Science https://t.co/xgdtkXevAm #DataScience', '_id': ObjectId('5e1d08a06be78d8673599e3e')}
{'created_at': 'Tue Jan 14 00:17:34 +0000 2020', 'id_str': '1216876976943828993', 'text': 'RT @motherofnodejs: I am not lazy, I just save energy 😑 #programming #coding #programmer #javascript #coder #php #java #programminglife #de…', '_id': ObjectId('5e1d08a26be78d8673599e3f')}
{'created_at': 'Tue Jan 14 00:17:34 +0000 2020', 'id_str': '1216876979254956033', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5', '_id': ObjectId('5e1d08a36be78d8673599e40')}
{'created_at': 'Tue Jan 14 00:17:35 +0000 2020', 'id_str': '1216876980294967296', 'text': 'FREE Webinar: Tuesday, 21 January 2020, 9 am EST for a review of #compositional #analysis by Handheld #XRF, along w… https://t.co/FvRX3YQDeB', '_id': ObjectId('5e1d08a36be78d8673599e41')}
{'created_at': 'Tue Jan 14 00:17:35 +0000 2020', 'id_str': '1216876982564278272', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…', '_id': ObjectId('5e1d08a46be78d8673599e42')}
{'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876984887906304', 'text': 'RT @susanhash: Leverage #CustomerData to identify opportunities for #proactive #custserv - Jon Christiansen of data science firm Ins &amp; Outs…', '_id': ObjectId('5e1d08a46be78d8673599e43')}
{'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876985009373184', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…', '_id': ObjectId('5e1d08a46be78d8673599e44')}
{'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876985126776832', 'text': "RT @h_ingo: TIL there's a Java version for one of the greatest performance diagnostics tools ever, PoorMansProfiler.", '_id': ObjectId('5e1d08a46be78d8673599e45')}
{'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876985487523840', 'text': 'RT @lakwatsarah: BIG KETS ARE STILL KETS 😻😻😻😻', '_id': ObjectId('5e1d08a46be78d8673599e46')}
{'created_at': 'Tue Jan 14 00:17:38 +0000 2020', 'id_str': '1216876994060619776', 'text': 'RT @PriscillaWT: The grandson of House Democratic Whip James Clyburn, D-S.C., has cut a radio ad invoking his grandfather’s legacy and call…', '_id': ObjectId('5e1d08a66be78d8673599e47')}
{'created_at': 'Tue Jan 14 00:17:40 +0000 2020', 'id_str': '1216877002256539649', 'text': 'RT @ActionableInsi3: [Cheat Sheet] Python Basics For Data Science https://t.co/LuZxXxs1dK', '_id': ObjectId('5e1d08a86be78d8673599e48')}
{'created_at': 'Tue Jan 14 00:17:40 +0000 2020', 'id_str': '1216877003585884160', 'text': "RT @chey_cobb: Soooo... \nWhat's scarier?\n* Foreign intelligence agencies listening in on you?\n* Domestic intelligence agencies listening in…", '_id': ObjectId('5e1d08a96be78d8673599e49')}
{'created_at': 'Tue Jan 14 00:17:41 +0000 2020', 'id_str': '1216877008199856130', 'text': 'I want nothing more than to hug a mf lion. Look at how cute and cuddly this big fluffs are!!!! I can’t handle it 😍😍', '_id': ObjectId('5e1d08aa6be78d8673599e4a')}
{'created_at': 'Tue Jan 14 00:17:42 +0000 2020', 'id_str': '1216877009193906178', 'text': '☀ Hiring: #Big Data Engineer\n#AI #Analyst #BigData #Developer #Plano #techjobs #devjobs\nApply Now &gt;&gt;… https://t.co/f67B6uP1sU', '_id': ObjectId('5e1d08aa6be78d8673599e4b')}
{'created_at': 'Tue Jan 14 00:17:42 +0000 2020', 'id_str': '1216877012012486659', 'text': 'RT @pdakean: Original study that found relation was retracted for data manipulation. The relation was never there but now epidemics are com…', '_id': ObjectId('5e1d08ab6be78d8673599e4c')}
{'created_at': 'Tue Jan 14 00:17:46 +0000 2020', 'id_str': '1216877026864484353', 'text': '@PoetWalker We need an independent revival, like French New Wave, maybe. Films not involving enormous corporations… https://t.co/9PUgw6EdsE', '_id': ObjectId('5e1d08ae6be78d8673599e4d')}
{'created_at': 'Tue Jan 14 00:17:48 +0000 2020', 'id_str': '1216877036414914561', 'text': '@EFL_law @KingMeren You are right - in theory this should not be that big of a deal. But you are giving the team mo… https://t.co/Cwn6ojUhX4', '_id': ObjectId('5e1d08b06be78d8673599e4e')}
{'created_at': 'Tue Jan 14 00:17:49 +0000 2020', 'id_str': '1216877038528868353', 'text': 'Practical Data Science with Hadoop and Spark: Designing and Building Effective Analytics at Scale (Addison-wesley D… https://t.co/zDsJpGTSoI', '_id': ObjectId('5e1d08b16be78d8673599e4f')}
{'created_at': 'Tue Jan 14 00:17:50 +0000 2020', 'id_str': '1216877044623081477', 'text': 'RT @MikelJoachim: Starting a “methods journal club” with grad students &amp; post-docs in @UWBadgerAP to discuss data organization, study desig…', '_id': ObjectId('5e1d08b26be78d8673599e50')}
{'created_at': 'Tue Jan 14 00:17:50 +0000 2020', 'id_str': '1216877046351220736', 'text': 'RT @nep_developer: Day: 08 of #100DaysOfCode \n-Pause the Tracker App(for a week)\n-Started a new project Planner that used firebase,\n\n------…', '_id': ObjectId('5e1d08b36be78d8673599e51')}
{'created_at': 'Tue Jan 14 00:17:54 +0000 2020', 'id_str': '1216877059789742080', 'text': 'RT @NoContextVinny: And we return to your regular programming. https://t.co/N9bbwoYtkp', '_id': ObjectId('5e1d08b66be78d8673599e52')}
{'created_at': 'Tue Jan 14 00:17:54 +0000 2020', 'id_str': '1216877061152878598', 'text': 'Current standard of discourse on the net: "I know nothing I write here will change your mind, because you are alrea… https://t.co/OMa09Z0Gz6', '_id': ObjectId('5e1d08b66be78d8673599e53')}
{'created_at': 'Tue Jan 14 00:17:55 +0000 2020', 'id_str': '1216877065481252867', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5', '_id': ObjectId('5e1d08b76be78d8673599e54')}
{'created_at': 'Tue Jan 14 00:17:56 +0000 2020', 'id_str': '1216877070594211840', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…', '_id': ObjectId('5e1d08b96be78d8673599e55')}
{'created_at': 'Tue Jan 14 00:17:56 +0000 2020', 'id_str': '1216877071177342979', 'text': 'actual footage of me because i have to TA  programming classes tomorrow for a total of 4 hours', '_id': ObjectId('5e1d08b96be78d8673599e56')}
{'created_at': 'Tue Jan 14 00:18:01 +0000 2020', 'id_str': '1216877088730439680', 'text': 'Take part in the #SPIE Career Summit, our professional development programming at #PhotonicsWest 2020! \n\nCheck out… https://t.co/L1ej80GLtq', '_id': ObjectId('5e1d08bd6be78d8673599e57')}
{'created_at': 'Tue Jan 14 00:17:58 +0000 2020', 'id_str': '1216877076021534720', 'text': '@Mandoline_Blue Those energies, hard coded into our genetic programming, can (not always) find a twisted way out if… https://t.co/TLAJEnJc6h', '_id': ObjectId('5e1d08be6be78d8673599e58')}
{'created_at': 'Tue Jan 14 00:18:02 +0000 2020', 'id_str': '1216877095667716096', 'text': 'もう火曜日。\nImperative  programming vs. Declarative :\n命令型プログラミング vs. 宣言型プログラミング', '_id': ObjectId('5e1d08be6be78d8673599e59')}
{'created_at': 'Tue Jan 14 00:18:02 +0000 2020', 'id_str': '1216877096472940544', 'text': 'Itu csy kalo suatu saat nongol di Java Jazz, gue ga heran', '_id': ObjectId('5e1d08bf6be78d8673599e5a')}
{'created_at': 'Tue Jan 14 00:18:03 +0000 2020', 'id_str': '1216877099937603584', 'text': 'Medical identity theft can leave you with big bills for procedures, treatment and equipment you never asked for or… https://t.co/hikhwEFoPo', '_id': ObjectId('5e1d08c06be78d8673599e5b')}
{'created_at': 'Tue Jan 14 00:18:06 +0000 2020', 'id_str': '1216877109865537537', 'text': '[Feature] Babel plugin: Add import URL version tag https://t.co/uObz0wNfua #github #JavaScript #TypeScript #CSS #HTML', '_id': ObjectId('5e1d08c26be78d8673599e5c')}
{'created_at': 'Tue Jan 14 00:18:03 +0000 2020', 'id_str': '1216877097899130880', 'text': 'There are many ways to profit off your health data, which leaves you with a big and sometimes life-threatening mess… https://t.co/nMhkQ793oe', '_id': ObjectId('5e1d08c26be78d8673599e5d')}
{'created_at': 'Tue Jan 14 00:18:07 +0000 2020', 'id_str': '1216877114709946369', 'text': 'RT @javascriptflx: 30 Free Resources To Help You Learn JavaScript Fundamentals https://t.co/W1C5eXVUkp  #Javascript', '_id': ObjectId('5e1d08c36be78d8673599e5e')}
{'created_at': 'Tue Jan 14 00:18:07 +0000 2020', 'id_str': '1216877116308033536', 'text': "Sr DevOps Developer - perm/downtown Toronto - Java/Python/Ruby or C req'd - build software to improve build/release… https://t.co/3qmpVgWt9Q", '_id': ObjectId('5e1d08c36be78d8673599e5f')}
{'created_at': 'Tue Jan 14 00:18:17 +0000 2020', 'id_str': '1216877157114437632', 'text': 'Malicious JavaScript package was only active on the npm repository for two weeks. Microsoft spots malicious npm pac… https://t.co/hZHWiiadOh', '_id': ObjectId('5e1d08cd6be78d8673599e60')}
{'created_at': 'Tue Jan 14 00:18:19 +0000 2020', 'id_str': '1216877166555627520', 'text': 'RT @SevenHillsUlti: We are submitting bids for YCC this summer! For more details or answers to some questions, check out our website: https…', '_id': ObjectId('5e1d08cf6be78d8673599e61')}
{'created_at': 'Tue Jan 14 00:18:21 +0000 2020', 'id_str': '1216877175460200448', 'text': "RT @juddy_96: Let me put Japan's situation in smash terms. Smash 4 Shulk. Hey he has all this great stuff. Let's give him shit frame data.…", '_id': ObjectId('5e1d08d26be78d8673599e62')}
{'created_at': 'Tue Jan 14 00:18:22 +0000 2020', 'id_str': '1216877177062481920', 'text': 'RT @BenjySarlin: A realistic scenario right now:\n\n-Trump WH asks courts to end protections for pre-existing conditions\n\n-Trump re-elected w…', '_id': ObjectId('5e1d08d26be78d8673599e63')}
{'created_at': 'Tue Jan 14 00:18:22 +0000 2020', 'id_str': '1216877178580803584', 'text': "RT @Brilliance100: We'll give you A's in your classes. Pay us for\n#essay\n#homework\n#assignment\n#discussion\n#code Java PHP C#\n#Programming p…", '_id': ObjectId('5e1d08d26be78d8673599e64')}
{'created_at': 'Tue Jan 14 00:18:22 +0000 2020', 'id_str': '1216877179658698752', 'text': 'RT @sicsuper: ¡Proteger tus datos personales es muy importante!\nEncuentra las recomendaciones que Big Data y la #SICSuper te dejamos aquí 👉…', '_id': ObjectId('5e1d08d36be78d8673599e65')}
{'created_at': 'Tue Jan 14 00:18:25 +0000 2020', 'id_str': '1216877192744849408', 'text': 'We back to regular programming boiiiis', '_id': ObjectId('5e1d08d66be78d8673599e66')}
{'created_at': 'Tue Jan 14 00:18:27 +0000 2020', 'id_str': '1216877200940683265', 'text': "RT @Cawfree: Here's the Boston Housing dataset for training #regression networks in #tensorflow #NeuralNetworks in #javascript.\n\nhttps://t.…", '_id': ObjectId('5e1d08d86be78d8673599e67')}
{'created_at': 'Tue Jan 14 00:18:28 +0000 2020', 'id_str': '1216877205730426881', 'text': 'RT @nytimesworld: “There aren’t that many things that are quintessentially Canadian, but skating is one of them,” said a university profess…', '_id': ObjectId('5e1d08d96be78d8673599e68')}
{'created_at': 'Tue Jan 14 00:18:34 +0000 2020', 'id_str': '1216877226819489792', 'text': 'What to Pay #JavaScript #Developers in 2020 via https://t.co/prqxSCAEJ8 https://t.co/3nNlRg8PQK', '_id': ObjectId('5e1d08de6be78d8673599e69')}
{'created_at': 'Tue Jan 14 00:18:35 +0000 2020', 'id_str': '1216877233584865281', 'text': '@msRachel9 As soon as we have programming news we’ll announce it here 😘', '_id': ObjectId('5e1d08df6be78d8673599e6a')}
{'created_at': 'Tue Jan 14 00:18:39 +0000 2020', 'id_str': '1216877249686855680', 'text': "My father just discovered that Steven Seagal was a real cop. Well he discovered Steven Seagal Law Man.\n\nThat's what… https://t.co/B1BMeIi25n", '_id': ObjectId('5e1d08e36be78d8673599e6b')}
{'created_at': 'Tue Jan 14 00:18:42 +0000 2020', 'id_str': '1216877261749735424', 'text': 'RT @RiverVanRain: What to Pay #JavaScript #Developers in 2020 via https://t.co/prqxSCAEJ8 https://t.co/3nNlRg8PQK', '_id': ObjectId('5e1d08e66be78d8673599e6c')}
{'created_at': 'Tue Jan 14 00:18:42 +0000 2020', 'id_str': '1216877262848581632', 'text': 'RT @MauraAlwyen: Science has just as many false prophets as religion and American politics does. Data, the Scriptures, and the Constitution…', '_id': ObjectId('5e1d08e66be78d8673599e6d')}
{'created_at': 'Tue Jan 14 00:18:49 +0000 2020', 'id_str': '1216877293773238272', 'text': 'RT @MattKresslein: Join us for the SOKY Robot Royale on Feb. 26th @GRRECKY!  EV3 &amp; Sphero Competitions, Drone Programming/Flying, @Scribit_…', '_id': ObjectId('5e1d08ee6be78d8673599e6e')}
{'created_at': 'Tue Jan 14 00:18:50 +0000 2020', 'id_str': '1216877295765311489', 'text': 'RT @WjgotINrU14Z1fB: Javaで3年くらいやると、他言語の実業務に参加可能になるやつが増えてくる。\n\nなんでJavaだとそうなのかはわからないが、お堅い言語であるが故、信用されてる部分があるっぽい。\n\n実際のところ、言語転換の際に現場で困った話も聞かない。…', '_id': ObjectId('5e1d08ee6be78d8673599e6f')}
{'created_at': 'Tue Jan 14 00:18:50 +0000 2020', 'id_str': '1216877296461795329', 'text': 'RT @Gurgling_MrD: Malicious JavaScript package was only active on the npm repository for two weeks. Microsoft spots malicious npm package s…', '_id': ObjectId('5e1d08ee6be78d8673599e70')}
{'created_at': 'Tue Jan 14 00:18:52 +0000 2020', 'id_str': '1216877302845304832', 'text': "RT @JamesFourM: @dark_wisdom_ @b_ofrights @TrickFreee @dcpoll @ninaandtito @3L3V3NTH @CORLEBRA777 Hey bruh. Let's not forget Bob Dole ➡️ Ma…", '_id': ObjectId('5e1d08f06be78d8673599e71')}
{'created_at': 'Tue Jan 14 00:18:53 +0000 2020', 'id_str': '1216877308386185216', 'text': 'RT @platzi: 📚 Seis Libros para mejorar tu conocimiento de Data Science 👇\n#NuncaParesDeAprender\nhttps://t.co/569j3rREx0 https://t.co/69KqUNy…', '_id': ObjectId('5e1d08f16be78d8673599e72')}
{'created_at': 'Tue Jan 14 00:18:53 +0000 2020', 'id_str': '1216877308491051009', 'text': 'Applied for college and university today, mainly computer programming for Colledge and a English major for universi… https://t.co/WhrU7gq7Q9', '_id': ObjectId('5e1d08f16be78d8673599e73')}
{'created_at': 'Tue Jan 14 00:18:58 +0000 2020', 'id_str': '1216877328266981376', 'text': 'RT @JamesFourM: @CORLEBRA777\n@ninaandtito\n\nFounder &amp; pres of Grassroots Targeting worked for Bob &amp; Elizabeth Dole &amp; as  adviser to Reince P…', '_id': ObjectId('5e1d08f66be78d8673599e74')}
{'created_at': 'Tue Jan 14 00:19:00 +0000 2020', 'id_str': '1216877337070850048', 'text': "RT @sarah_edo: 🎉 If you're interested in learning how to animate on the web with JavaScript, I wrote up a post on how to animate with @gree…", '_id': ObjectId('5e1d08f86be78d8673599e75')}
{'created_at': 'Tue Jan 14 00:19:02 +0000 2020', 'id_str': '1216877347292532736', 'text': 'RT @RobotMakerGirl: The first part of the “thing” is officially built and tested. Now on to the programming stage! Then the woodworking sta…', '_id': ObjectId('5e1d08fb6be78d8673599e76')}
{'created_at': 'Tue Jan 14 00:19:02 +0000 2020', 'id_str': '1216877347535826946', 'text': 'Moderated a data science panel yesterday\n当我准备总结一个数据科学研讨环节时,问三位嘉宾:假如,您公司现在就开始没有数据,您的业务将会怎样?他们那惊讶的神情,告诉了我们数据对业务发展的重要性… https://t.co/JXnU7igBRD', '_id': ObjectId('5e1d08fb6be78d8673599e77')}
{'created_at': 'Tue Jan 14 00:19:06 +0000 2020', 'id_str': '1216877361842544641', 'text': 'Hi, I can do the class for you\nDM or Email✉ EssayNerd7@gmail.com \n\nGuarantees:\n✴an A+ Grade√√\n✴Timely Completion ⏱… https://t.co/UBs4lIMgBG', '_id': ObjectId('5e1d08fe6be78d8673599e78')}
{'created_at': 'Tue Jan 14 00:19:08 +0000 2020', 'id_str': '1216877373045473280', 'text': 'For some reason remembering languages/tools I’ve developed in I haven’t heard much about in years.\n#Powerbuilder,… https://t.co/CcYD8Ux1pX', '_id': ObjectId('5e1d09016be78d8673599e79')}
{'created_at': 'Tue Jan 14 00:19:09 +0000 2020', 'id_str': '1216877373586624514', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…', '_id': ObjectId('5e1d09016be78d8673599e7a')}
{'created_at': 'Tue Jan 14 00:19:09 +0000 2020', 'id_str': '1216877375968989184', 'text': 'Gina Carano in a suit.....thats is all, we will now go back to your regularly scheduled programming #thisistheway https://t.co/QIC4xdsuhv', '_id': ObjectId('5e1d09016be78d8673599e7b')}
{'created_at': 'Tue Jan 14 00:19:10 +0000 2020', 'id_str': '1216877378330218496', 'text': 'RT @spring_io: First milestone of Spring Boot 2.3 will be released this Thursday and will GA two weeks before Spring I/O.\n\nDon’t miss out a…', '_id': ObjectId('5e1d09026be78d8673599e7c')}
{'created_at': 'Tue Jan 14 00:19:11 +0000 2020', 'id_str': '1216877385930432512', 'text': 'RT @genentech: Heading to #JPM20? Download S3E05 of our #podcast and find out more about the role of big data in #PersonalizedMedicine from…', '_id': ObjectId('5e1d09046be78d8673599e7d')}
{'created_at': 'Tue Jan 14 00:19:12 +0000 2020', 'id_str': '1216877387318616064', 'text': 'おはようございます☀\n\n#今日の積み上げ  予定\n✅#30DAYSトライアル 2nd Day3\n\n引き続きJavaScriptの学習です🏃\u200d♂️\n\n通勤往復中にProgateアプリ版→帰宅後パソコン版の流れ最強だったので本日も同じスタイルでいきます💪\n\n#駆け出しエンジニア', '_id': ObjectId('5e1d09046be78d8673599e7e')}
{'created_at': 'Tue Jan 14 00:19:12 +0000 2020', 'id_str': '1216877388753264641', 'text': 'RT @PVNCCDSB: As a result of a planned one-day full withdrawal of service by our teachers on Tuesday, Jan. 21, 2020, the Board will be clos…', '_id': ObjectId('5e1d09046be78d8673599e7f')}
{'created_at': 'Tue Jan 14 00:19:15 +0000 2020', 'id_str': '1216877401822466048', 'text': 'Tapos na event so wala na akong ipopost na annoucements and shiz I am back to regular programming welcome to my kal… https://t.co/NGsR2RSEtm', '_id': ObjectId('5e1d09086be78d8673599e80')}
{'created_at': 'Tue Jan 14 00:19:16 +0000 2020', 'id_str': '1216877404041379847', 'text': 'RT @platzi: 📚 Seis Libros para mejorar tu conocimiento de Data Science 👇\n#NuncaParesDeAprender\nhttps://t.co/569j3rREx0 https://t.co/69KqUNy…', '_id': ObjectId('5e1d09086be78d8673599e81')}
{'created_at': 'Tue Jan 14 00:19:17 +0000 2020', 'id_str': '1216877408147533824', 'text': 'RT @strnr: Eleven tips for working with big data https://t.co/KrdaN4gxSh\nKeep raw data raw\nViz\nRecord workflow\nUse version ctrl\nRecord meta…', '_id': ObjectId('5e1d09096be78d8673599e82')}
{'created_at': 'Tue Jan 14 00:19:17 +0000 2020', 'id_str': '1216877408718028800', 'text': '@AnimalDefenceBZ @DataCassette Please enforce the law against dog and wild boar fighting! Plz sign: https://t.co/n3pdX3hOP8', '_id': ObjectId('5e1d09096be78d8673599e83')}
{'created_at': 'Tue Jan 14 00:19:20 +0000 2020', 'id_str': '1216877423142297600', 'text': 'Rock it: A Cradle Story — An Arduino-powered Baby Crib Rocker\n\n☞ https://t.co/jrrPvUwrGv\n\n#arduino #programming https://t.co/niOfINyVkE', '_id': ObjectId('5e1d090d6be78d8673599e84')}
{'created_at': 'Tue Jan 14 00:19:22 +0000 2020', 'id_str': '1216877428603117568', 'text': 'RT @xximbecile: Bullshit. I was born in Madiun, live most of my youth without internet because my family is poor. And I know I read a lot.…', '_id': ObjectId('5e1d090e6be78d8673599e85')}
{'created_at': 'Tue Jan 14 00:19:24 +0000 2020', 'id_str': '1216877436916379652', 'text': 'RT @sethrosen: Just converted to @webflow after years of preaching squarespace. Wow - just wow. \n\nI truly see why *this* is called no-code.…', '_id': ObjectId('5e1d09106be78d8673599e86')}
{'created_at': 'Tue Jan 14 00:19:24 +0000 2020', 'id_str': '1216877437570543618', 'text': "@SimonJo37129961 @Rectitude20 On the contrary, you're not appealing to the science &amp; data because epidemiological s… https://t.co/sqR3pkPIeR", '_id': ObjectId('5e1d09106be78d8673599e87')}
{'created_at': 'Tue Jan 14 00:19:26 +0000 2020', 'id_str': '1216877445447438336', 'text': "Always the best bang for your buck of any pod out there, thank you guys. Y'all gotta check them out… https://t.co/gwg4EZKx58", '_id': ObjectId('5e1d09126be78d8673599e88')}
{'created_at': 'Tue Jan 14 00:19:29 +0000 2020', 'id_str': '1216877458613587976', 'text': 'RT @bass_analytics: An Effective Python Environment: Making Yourself at Home\n@realpython #Python #programming #coding\nhttps://t.co/jMkY3xyU…', '_id': ObjectId('5e1d09156be78d8673599e89')}
{'created_at': 'Tue Jan 14 00:19:30 +0000 2020', 'id_str': '1216877463633969152', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…', '_id': ObjectId('5e1d09166be78d8673599e8a')}
{'created_at': 'Tue Jan 14 00:19:31 +0000 2020', 'id_str': '1216877469652914176', 'text': 'Acquista il libro "Big Data, WebFare e Reddito per tutti. Quaderni per il Reddito n°9". Sostieni il BIN Italia - BI… https://t.co/R55bbOsxa3', '_id': ObjectId('5e1d09186be78d8673599e8b')}
{'created_at': 'Tue Jan 14 00:19:33 +0000 2020', 'id_str': '1216877475239616513', 'text': 'RT @MajoLedes: ✨Dejo esto por aquí.. \n\nHice un apunte de 24 páginas sobre conceptos principales de ReactJS🙈\n\nPueden ver el apunte completo…', '_id': ObjectId('5e1d09196be78d8673599e8c')}
{'created_at': 'Tue Jan 14 00:19:33 +0000 2020', 'id_str': '1216877477403840512', 'text': 'RT @iowahawkblog: fun fact: this advanced state-of-the are artificial intelligence powered big data pizza thinkbot system was invented by T…', '_id': ObjectId('5e1d091a6be78d8673599e8d')}
{'created_at': 'Tue Jan 14 00:19:35 +0000 2020', 'id_str': '1216877483796107267', 'text': 'RT @javascriptflx: Hermes: A new open source JavaScript engine optimized for mobile apps https://t.co/Zn7Zed8SkV  #Javascript', '_id': ObjectId('5e1d091b6be78d8673599e8e')}
{'created_at': 'Tue Jan 14 00:19:40 +0000 2020', 'id_str': '1216877507754020866', 'text': "RT @parscale: Big data from Toledo:\n\n✅ 22,927 Voters Identified\n\n✅ 18,210 Voters From Ohio\n\n✅ 5,216 Registrants Didn't Vote in 2016\n\n✅ 21.9…", '_id': ObjectId('5e1d09216be78d8673599e8f')}
{'created_at': 'Tue Jan 14 00:19:41 +0000 2020', 'id_str': '1216877508559343625', 'text': 'Big 5 Sporting Goods $BGFV Anticipates Fiscal 2019 Fourth Quarter EPS to Exceed High End of Prior Guidance Range… https://t.co/fCTX0sWhon', '_id': ObjectId('5e1d09216be78d8673599e90')}
{'created_at': 'Tue Jan 14 00:19:42 +0000 2020', 'id_str': '1216877514049695752', 'text': 'RT @Arthur81288011: @A_Chapman101 @Jack62084141 Clear @HMRCgovuk must NOT be given new powers to automate processes that could cause distre…', '_id': ObjectId('5e1d09226be78d8673599e91')}
{'created_at': 'Tue Jan 14 00:19:46 +0000 2020', 'id_str': '1216877530222743553', 'text': '@RandallKopchak @OptimistPanda The problem (if you can call it that) was that DS9 was way ahead of its time in term… https://t.co/y2UI7XQjYm', '_id': ObjectId('5e1d09266be78d8673599e92')}
{'created_at': 'Tue Jan 14 00:19:51 +0000 2020', 'id_str': '1216877549860663296', 'text': 'This thing is only growing. Excited to see what Gatsby will be like even 5 years from now.', '_id': ObjectId('5e1d092b6be78d8673599e93')}
{'created_at': 'Tue Jan 14 00:19:52 +0000 2020', 'id_str': '1216877555946414081', 'text': "2.  but oh well, it's cool data science!", '_id': ObjectId('5e1d092c6be78d8673599e94')}
{'created_at': 'Tue Jan 14 00:19:53 +0000 2020', 'id_str': '1216877561839484929', 'text': 'RT @KinarmLab: Kinarm Camp registration is now open!  Come join us June 8-12th in beautiful #ygk for a week of intensive #kinarm programmin…', '_id': ObjectId('5e1d092e6be78d8673599e95')}
{'created_at': 'Tue Jan 14 00:19:56 +0000 2020', 'id_str': '1216877570819600389', 'text': 'RT @ElemTeachersTO: The #TDSB has cut $13 million dollars of French programming and is planning to eliminate Extended French starting next…', '_id': ObjectId('5e1d09306be78d8673599e96')}
{'created_at': 'Tue Jan 14 00:19:56 +0000 2020', 'id_str': '1216877570978803712', 'text': 'RT @byLilyV: FEATURED #COURSES\n\nThe #Data #Science #Course 2019: Complete Data Science Bootcamp\n\nBest Seller 144,730 students enrolled\n\nCom…', '_id': ObjectId('5e1d09306be78d8673599e97')}
{'created_at': 'Tue Jan 14 00:20:00 +0000 2020', 'id_str': '1216877588385271808', 'text': 'How to pack #Angular 8 applications on regular war files https://t.co/t1AXyA1wD1 #javascript #typescript #frontend #webdev', '_id': ObjectId('5e1d09346be78d8673599e98')}
{'created_at': 'Tue Jan 14 00:20:00 +0000 2020', 'id_str': '1216877589110951936', 'text': 'CoStar Group (@TheCoStarGroup) is hiring https://t.co/cWm6u5KE5o #reactjs #angularjs', '_id': ObjectId('5e1d09346be78d8673599e99')}
{'created_at': 'Tue Jan 14 00:20:02 +0000 2020', 'id_str': '1216877599143665669', 'text': 'RT @NexWebSites: #Programming\n👇\nVisual Studio @code Keyboard Board Shortcuts for:\n \n👉Windows : PDF🔗: https://t.co/xxPqHUMjS3\n 👉#Linux : PDF…', '_id': ObjectId('5e1d09376be78d8673599e9a')}
{'created_at': 'Tue Jan 14 00:20:03 +0000 2020', 'id_str': '1216877600955621377', 'text': 'Everyone has his or her own way of analyzing data to find the right answers. This is why self-service in a business… https://t.co/264klNDvA1', '_id': ObjectId('5e1d09376be78d8673599e9b')}
{'created_at': 'Tue Jan 14 00:20:09 +0000 2020', 'id_str': '1216877627937579011', 'text': 'RT @Payara_Fish: JavaFX Strikes Back - Latest #Airhacks podcast from @AdamBien\nCatching up with Gluons @johanvos, talking about advantages…', '_id': ObjectId('5e1d093d6be78d8673599e9c')}
{'created_at': 'Tue Jan 14 00:20:13 +0000 2020', 'id_str': '1216877645977325569', 'text': '32 Tips For Every #WebDeveloper In 2020 #BetterProgramming via https://t.co/Q6JBQhnTTy https://t.co/3hwgAJhmSs', '_id': ObjectId('5e1d09426be78d8673599e9d')}
---------------------------------------------------------------------------
KeyboardInterrupt                         Traceback (most recent call last)
<ipython-input-262-c100010f28dc> in <module>
----> 1 mystream.filter(track=palavras_chave)

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\site-packages\tweepy\streaming.py in filter(self, follow, track, is_async, locations, stall_warnings, languages, encoding, filter_level)
    472             self.body['filter_level'] = filter_level.encode(encoding)
    473         self.session.params = {'delimited': 'length'}
--> 474         self._start(is_async)
    475 
    476     def sitestream(self, follow, stall_warnings=False,

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\site-packages\tweepy\streaming.py in _start(self, is_async)
    387             self._thread.start()
    388         else:
--> 389             self._run()
    390 
    391     def on_closed(self, resp):

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\site-packages\tweepy\streaming.py in _run(self)
    287                     self.snooze_time = self.snooze_time_step
    288                     self.listener.on_connect()
--> 289                     self._read_loop(resp)
    290             except (Timeout, ssl.SSLError) as exc:
    291                 # This is still necessary, as a SSLError can actually be

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\site-packages\tweepy\streaming.py in _read_loop(self, resp)
    337             length = 0
    338             while not resp.raw.closed:
--> 339                 line = buf.read_line()
    340                 stripped_line = line.strip() if line else line # line is sometimes None so we need to check here
    341                 if not stripped_line:

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\site-packages\tweepy\streaming.py in read_line(self, sep)
    198             else:
    199                 start = len(self._buffer)
--> 200             self._buffer += self._stream.read(self._chunk_size)
    201         return six.b('')
    202 

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\site-packages\urllib3\response.py in read(self, amt, decode_content, cache_content)
    505             else:
    506                 cache_content = False
--> 507                 data = self._fp.read(amt) if not fp_closed else b""
    508                 if (
    509                     amt != 0 and not data

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\http\client.py in read(self, amt)
    455             # Amount is given, implement using readinto
    456             b = bytearray(amt)
--> 457             n = self.readinto(b)
    458             return memoryview(b)[:n].tobytes()
    459         else:

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\http\client.py in readinto(self, b)
    489 
    490         if self.chunked:
--> 491             return self._readinto_chunked(b)
    492 
    493         if self.length is not None:

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\http\client.py in _readinto_chunked(self, b)
    584         try:
    585             while True:
--> 586                 chunk_left = self._get_chunk_left()
    587                 if chunk_left is None:
    588                     return total_bytes

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\http\client.py in _get_chunk_left(self)
    552                 self._safe_read(2)  # toss the CRLF at the end of the chunk
    553             try:
--> 554                 chunk_left = self._read_next_chunk_size()
    555             except ValueError:
    556                 raise IncompleteRead(b'')

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\http\client.py in _read_next_chunk_size(self)
    512     def _read_next_chunk_size(self):
    513         # Read the next chunk size from the file
--> 514         line = self.fp.readline(_MAXLINE + 1)
    515         if len(line) > _MAXLINE:
    516             raise LineTooLong("chunk size")

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\socket.py in readinto(self, b)
    587         while True:
    588             try:
--> 589                 return self._sock.recv_into(b)
    590             except timeout:
    591                 self._timeout_occurred = True

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\ssl.py in recv_into(self, buffer, nbytes, flags)
   1069                   "non-zero flags not allowed in calls to recv_into() on %s" %
   1070                   self.__class__)
-> 1071             return self.read(nbytes, buffer)
   1072         else:
   1073             return super().recv_into(buffer, nbytes, flags)

c:\users\lord_negrisoli\appdata\local\programs\python\python37\lib\ssl.py in read(self, len, buffer)
    927         try:
    928             if buffer is not None:
--> 929                 return self._sslobj.read(len, buffer)
    930             else:
    931                 return self._sslobj.read(len)

KeyboardInterrupt: 
In [263]:
# Close the tweepy stream connection: the blocking mystream.filter(...) call
# above was stopped by hand (see the KeyboardInterrupt traceback).
mystream.disconnect()
In [264]:
# Approximate number of documents currently held in `colecao`
# (presumably the tweets stored while the stream was running - confirm against the listener).
colecao.estimated_document_count()
Out[264]:
129
In [265]:
# Walk the whole collection and print each stored document as a raw dict.
for documento in colecao.find():
    print(documento)
{'_id': ObjectId('5e1d07f86be78d8673599e1d'), 'created_at': 'Tue Jan 14 00:14:44 +0000 2020', 'id_str': '1216876262846869504', 'text': 'RT @dcumoviepage: #ReleaseTheSnyderCut'}
{'_id': ObjectId('5e1d08316be78d8673599e1e'), 'created_at': 'Tue Jan 14 00:15:41 +0000 2020', 'id_str': '1216876503889326087', 'text': 'RT @InfluxDB: Discover how a new #fluxlang feature that supports months and years as intervals while windowing enables deeper analysis of #…'}
{'_id': ObjectId('5e1d083c6be78d8673599e1f'), 'created_at': 'Tue Jan 14 00:15:51 +0000 2020', 'id_str': '1216876547010809856', 'text': '@realDonaldTrump Trump thinks his voters are dumb.\n\nhttps://t.co/Av2038b7q3'}
{'_id': ObjectId('5e1d083e6be78d8673599e20'), 'created_at': 'Tue Jan 14 00:15:54 +0000 2020', 'id_str': '1216876557538451456', 'text': "RT @SethAbramson: 25/ Joel Zamel, a man close to the Israeli government—a key player in Flynn's Saudi Nuclear Deal—and a man recommended to…"}
{'_id': ObjectId('5e1d08496be78d8673599e21'), 'created_at': 'Tue Jan 14 00:16:05 +0000 2020', 'id_str': '1216876601830494208', 'text': '@Jhonitrejos @JorgeIvanOspina @lunadavid @kevingomezpaz @SergioMZamoraB @lftroyano Para que sea ciudad inteligente… https://t.co/WlSEnMOapV'}
{'_id': ObjectId('5e1d084c6be78d8673599e22'), 'created_at': 'Tue Jan 14 00:16:08 +0000 2020', 'id_str': '1216876616430821377', 'text': 'RT @sicsuper: ¡Proteger tus datos personales es muy importante!\nEncuentra las recomendaciones que Big Data y la #SICSuper te dejamos aquí 👉…'}
{'_id': ObjectId('5e1d08656be78d8673599e23'), 'created_at': 'Tue Jan 14 00:16:33 +0000 2020', 'id_str': '1216876719631556608', 'text': 'RT @CatalogueBack: We interrupt our regular programming of pop culture and anime discussion posts to bring you @Cancelathon something fun I…'}
{'_id': ObjectId('5e1d08676be78d8673599e24'), 'created_at': 'Tue Jan 14 00:16:35 +0000 2020', 'id_str': '1216876728389292032', 'text': 'RT @NomadXrp: ⏰  PRICE UPDATE  🚀 \n\n⭐️ $XRP $ 0.2132\n24h -0.56% 📉\n\n⭐️ $BTC $ 8128.82\n24h -0.60% 📉\n\n⭐️ $ETH $ 143.88\n24h -1.67% 📉\n\n$xrp #thes…'}
{'_id': ObjectId('5e1d08686be78d8673599e25'), 'created_at': 'Tue Jan 14 00:16:36 +0000 2020', 'id_str': '1216876733929938944', 'text': 'BIG KETS ARE STILL KETS 😻😻😻😻'}
{'_id': ObjectId('5e1d086a6be78d8673599e26'), 'created_at': 'Tue Jan 14 00:16:38 +0000 2020', 'id_str': '1216876741496582144', 'text': '[Cheat Sheet] Python Basics For Data Science https://t.co/LuZxXxs1dK'}
{'_id': ObjectId('5e1d086b6be78d8673599e27'), 'created_at': 'Tue Jan 14 00:16:39 +0000 2020', 'id_str': '1216876745992871936', 'text': 'RT @Justin_Stolpe: Happy Monday! Learning about the Instagram Graph API this week! What are you learning about?\n.\n.\n#instagram #instagramap…'}
{'_id': ObjectId('5e1d086c6be78d8673599e28'), 'created_at': 'Tue Jan 14 00:16:39 +0000 2020', 'id_str': '1216876748182257664', 'text': 'RT @davarcar1: @Jhonitrejos @JorgeIvanOspina @lunadavid @kevingomezpaz @SergioMZamoraB @lftroyano Para que sea ciudad inteligente de pasar…'}
{'_id': ObjectId('5e1d08746be78d8673599e29'), 'created_at': 'Tue Jan 14 00:16:47 +0000 2020', 'id_str': '1216876781480878080', 'text': '"They are typically very experienced, having worked on many different projects under a wide variety of circumstance… https://t.co/mWRTfNnRmX'}
{'_id': ObjectId('5e1d08776be78d8673599e2a'), 'created_at': 'Tue Jan 14 00:16:51 +0000 2020', 'id_str': '1216876795745751041', 'text': '@iceagereentry @rcsteeb Don’t worry, all is well. 😉 https://t.co/5jxh8gXtTk'}
{'_id': ObjectId('5e1d08786be78d8673599e2b'), 'created_at': 'Tue Jan 14 00:16:51 +0000 2020', 'id_str': '1216876798199451648', 'text': 'It "amazes" ME how an "influencer"  like @MarkDice hasn\'t TOUCHED UPON the "blatant" SYMBOLISM being shown on… https://t.co/WhB32QifGF'}
{'_id': ObjectId('5e1d087a6be78d8673599e2c'), 'created_at': 'Tue Jan 14 00:16:54 +0000 2020', 'id_str': '1216876808173432832', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'}
{'_id': ObjectId('5e1d087b6be78d8673599e2d'), 'created_at': 'Tue Jan 14 00:16:55 +0000 2020', 'id_str': '1216876811906207745', 'text': 'RT @HawkinsTammy: Know #javascript and looking for a new gig in #California? #Blizzard Entertainment is looking for an Associate Software W…'}
{'_id': ObjectId('5e1d087c6be78d8673599e2e'), 'created_at': 'Tue Jan 14 00:16:55 +0000 2020', 'id_str': '1216876814187909124', 'text': 'Coffee and code. NodeJs tutorial. Then I will do some ReactJs tutorials.\n\nChristmas cat mug FTW! https://t.co/8ATWXMVAqV'}
{'_id': ObjectId('5e1d08816be78d8673599e2f'), 'created_at': 'Tue Jan 14 00:17:00 +0000 2020', 'id_str': '1216876836195618817', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'}
{'_id': ObjectId('5e1d08816be78d8673599e30'), 'created_at': 'Tue Jan 14 00:17:01 +0000 2020', 'id_str': '1216876837185511424', 'text': "📚 Wiley's Professional JavaScript for Web Developers is an essential guide to next-level ES6 and ES7 JavaScript dev… https://t.co/uyZB7AJ0en"}
{'_id': ObjectId('5e1d08856be78d8673599e31'), 'created_at': 'Tue Jan 14 00:17:05 +0000 2020', 'id_str': '1216876855405490176', 'text': 'With a few commands I can upgrade: sysinternals notepadplusplus googlechrome 7zip firefox SQLSentryPlanExplorer  vi… https://t.co/JkfFZEZPyB'}
{'_id': ObjectId('5e1d08876be78d8673599e32'), 'created_at': 'Tue Jan 14 00:17:07 +0000 2020', 'id_str': '1216876864192569345', 'text': 'New #job: Senior Fullstack Dev - JAVA and API Location: Wellington Central .. https://t.co/R8zY2oD9w6 #jobs #hiring'}
{'_id': ObjectId('5e1d08886be78d8673599e33'), 'created_at': 'Tue Jan 14 00:17:08 +0000 2020', 'id_str': '1216876866948255745', 'text': 'Feature request: add `base16` default themes, the next evolution of `Tomorrow` themes https://t.co/e99xcYh1aL… https://t.co/ShFLk4a0mj'}
{'_id': ObjectId('5e1d088b6be78d8673599e34'), 'created_at': 'Tue Jan 14 00:17:11 +0000 2020', 'id_str': '1216876880080637953', 'text': 'insert baby yoda picture with caption \n\n“big kitties”'}
{'_id': ObjectId('5e1d088f6be78d8673599e35'), 'created_at': 'Tue Jan 14 00:17:14 +0000 2020', 'id_str': '1216876894664232961', 'text': 'RT @IsTheArchitect: Why #Python is better than #R for #DataScience careers.\n\nhttps://t.co/cyTiSBpV4P\n#dataengineering #bigdata'}
{'_id': ObjectId('5e1d08916be78d8673599e36'), 'created_at': 'Tue Jan 14 00:17:17 +0000 2020', 'id_str': '1216876905573634054', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'}
{'_id': ObjectId('5e1d08946be78d8673599e37'), 'created_at': 'Tue Jan 14 00:17:20 +0000 2020', 'id_str': '1216876917439238144', 'text': 'RT @Brilliance100: We handle:\n\nStatistics online classes\nPrecalculus\nAlgebra\nTrigonometry\nLinear programming\nMeasurements\nData analysis\nSPS…'}
{'_id': ObjectId('5e1d08966be78d8673599e38'), 'created_at': 'Tue Jan 14 00:17:21 +0000 2020', 'id_str': '1216876924657717248', 'text': 'RT @AlRokerEnt: "We are proud to debut this African American focused channel, created by and for the members of the black community." - Jam…'}
{'_id': ObjectId('5e1d08966be78d8673599e39'), 'created_at': 'Tue Jan 14 00:17:22 +0000 2020', 'id_str': '1216876926750613505', 'text': 'RT @nep_developer: Day: 08 of #100DaysOfCode \n-Pause the Tracker App(for a week)\n-Started a new project Planner that used firebase,\n\n------…'}
{'_id': ObjectId('5e1d08976be78d8673599e3a'), 'created_at': 'Tue Jan 14 00:17:23 +0000 2020', 'id_str': '1216876930668036097', 'text': "RT @shog9: Well... I suddenly find myself in need of work. \nIf anyone's hiring: C++, JavaScript, C#, SQL + solid background in social softw…"}
{'_id': ObjectId('5e1d089a6be78d8673599e3b'), 'created_at': 'Tue Jan 14 00:17:25 +0000 2020', 'id_str': '1216876940537126912', 'text': 'RT @brunoborges: For all maintainers of #Java frameworks and libraries, ping @ashleymcnamara and share your story.\n\n// @jtgreene @phillip_w…'}
{'_id': ObjectId('5e1d089c6be78d8673599e3c'), 'created_at': 'Tue Jan 14 00:17:28 +0000 2020', 'id_str': '1216876949949308928', 'text': '¡El último Cience, Technology &amp; Programming  Daily! https://t.co/LTH701EPUt Gracias a @CTcard44 @schoolprobIems… https://t.co/CVFHa0My36'}
{'_id': ObjectId('5e1d089d6be78d8673599e3d'), 'created_at': 'Tue Jan 14 00:17:29 +0000 2020', 'id_str': '1216876954869256195', 'text': 'New #job: Business Intelligence Analyst Location: Las Vegas .. https://t.co/jXAS0kPEL6 #jobs #hiring'}
{'_id': ObjectId('5e1d08a06be78d8673599e3e'), 'created_at': 'Tue Jan 14 00:17:32 +0000 2020', 'id_str': '1216876967628353536', 'text': 'RT @DD_FaFa_: Data Science from Scratch: Comprehensive guide with essential principles of Data Science https://t.co/xgdtkXevAm #DataScience'}
{'_id': ObjectId('5e1d08a26be78d8673599e3f'), 'created_at': 'Tue Jan 14 00:17:34 +0000 2020', 'id_str': '1216876976943828993', 'text': 'RT @motherofnodejs: I am not lazy, I just save energy 😑 #programming #coding #programmer #javascript #coder #php #java #programminglife #de…'}
{'_id': ObjectId('5e1d08a36be78d8673599e40'), 'created_at': 'Tue Jan 14 00:17:34 +0000 2020', 'id_str': '1216876979254956033', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5'}
{'_id': ObjectId('5e1d08a36be78d8673599e41'), 'created_at': 'Tue Jan 14 00:17:35 +0000 2020', 'id_str': '1216876980294967296', 'text': 'FREE Webinar: Tuesday, 21 January 2020, 9 am EST for a review of #compositional #analysis by Handheld #XRF, along w… https://t.co/FvRX3YQDeB'}
{'_id': ObjectId('5e1d08a46be78d8673599e42'), 'created_at': 'Tue Jan 14 00:17:35 +0000 2020', 'id_str': '1216876982564278272', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'}
{'_id': ObjectId('5e1d08a46be78d8673599e43'), 'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876984887906304', 'text': 'RT @susanhash: Leverage #CustomerData to identify opportunities for #proactive #custserv - Jon Christiansen of data science firm Ins &amp; Outs…'}
{'_id': ObjectId('5e1d08a46be78d8673599e44'), 'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876985009373184', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'}
{'_id': ObjectId('5e1d08a46be78d8673599e45'), 'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876985126776832', 'text': "RT @h_ingo: TIL there's a Java version for one of the greatest performance diagnostics tools ever, PoorMansProfiler."}
{'_id': ObjectId('5e1d08a46be78d8673599e46'), 'created_at': 'Tue Jan 14 00:17:36 +0000 2020', 'id_str': '1216876985487523840', 'text': 'RT @lakwatsarah: BIG KETS ARE STILL KETS 😻😻😻😻'}
{'_id': ObjectId('5e1d08a66be78d8673599e47'), 'created_at': 'Tue Jan 14 00:17:38 +0000 2020', 'id_str': '1216876994060619776', 'text': 'RT @PriscillaWT: The grandson of House Democratic Whip James Clyburn, D-S.C., has cut a radio ad invoking his grandfather’s legacy and call…'}
{'_id': ObjectId('5e1d08a86be78d8673599e48'), 'created_at': 'Tue Jan 14 00:17:40 +0000 2020', 'id_str': '1216877002256539649', 'text': 'RT @ActionableInsi3: [Cheat Sheet] Python Basics For Data Science https://t.co/LuZxXxs1dK'}
{'_id': ObjectId('5e1d08a96be78d8673599e49'), 'created_at': 'Tue Jan 14 00:17:40 +0000 2020', 'id_str': '1216877003585884160', 'text': "RT @chey_cobb: Soooo... \nWhat's scarier?\n* Foreign intelligence agencies listening in on you?\n* Domestic intelligence agencies listening in…"}
{'_id': ObjectId('5e1d08aa6be78d8673599e4a'), 'created_at': 'Tue Jan 14 00:17:41 +0000 2020', 'id_str': '1216877008199856130', 'text': 'I want nothing more than to hug a mf lion. Look at how cute and cuddly this big fluffs are!!!! I can’t handle it 😍😍'}
{'_id': ObjectId('5e1d08aa6be78d8673599e4b'), 'created_at': 'Tue Jan 14 00:17:42 +0000 2020', 'id_str': '1216877009193906178', 'text': '☀ Hiring: #Big Data Engineer\n#AI #Analyst #BigData #Developer #Plano #techjobs #devjobs\nApply Now &gt;&gt;… https://t.co/f67B6uP1sU'}
{'_id': ObjectId('5e1d08ab6be78d8673599e4c'), 'created_at': 'Tue Jan 14 00:17:42 +0000 2020', 'id_str': '1216877012012486659', 'text': 'RT @pdakean: Original study that found relation was retracted for data manipulation. The relation was never there but now epidemics are com…'}
{'_id': ObjectId('5e1d08ae6be78d8673599e4d'), 'created_at': 'Tue Jan 14 00:17:46 +0000 2020', 'id_str': '1216877026864484353', 'text': '@PoetWalker We need an independent revival, like French New Wave, maybe. Films not involving enormous corporations… https://t.co/9PUgw6EdsE'}
{'_id': ObjectId('5e1d08b06be78d8673599e4e'), 'created_at': 'Tue Jan 14 00:17:48 +0000 2020', 'id_str': '1216877036414914561', 'text': '@EFL_law @KingMeren You are right - in theory this should not be that big of a deal. But you are giving the team mo… https://t.co/Cwn6ojUhX4'}
{'_id': ObjectId('5e1d08b16be78d8673599e4f'), 'created_at': 'Tue Jan 14 00:17:49 +0000 2020', 'id_str': '1216877038528868353', 'text': 'Practical Data Science with Hadoop and Spark: Designing and Building Effective Analytics at Scale (Addison-wesley D… https://t.co/zDsJpGTSoI'}
{'_id': ObjectId('5e1d08b26be78d8673599e50'), 'created_at': 'Tue Jan 14 00:17:50 +0000 2020', 'id_str': '1216877044623081477', 'text': 'RT @MikelJoachim: Starting a “methods journal club” with grad students &amp; post-docs in @UWBadgerAP to discuss data organization, study desig…'}
{'_id': ObjectId('5e1d08b36be78d8673599e51'), 'created_at': 'Tue Jan 14 00:17:50 +0000 2020', 'id_str': '1216877046351220736', 'text': 'RT @nep_developer: Day: 08 of #100DaysOfCode \n-Pause the Tracker App(for a week)\n-Started a new project Planner that used firebase,\n\n------…'}
{'_id': ObjectId('5e1d08b66be78d8673599e52'), 'created_at': 'Tue Jan 14 00:17:54 +0000 2020', 'id_str': '1216877059789742080', 'text': 'RT @NoContextVinny: And we return to your regular programming. https://t.co/N9bbwoYtkp'}
{'_id': ObjectId('5e1d08b66be78d8673599e53'), 'created_at': 'Tue Jan 14 00:17:54 +0000 2020', 'id_str': '1216877061152878598', 'text': 'Current standard of discourse on the net: "I know nothing I write here will change your mind, because you are alrea… https://t.co/OMa09Z0Gz6'}
{'_id': ObjectId('5e1d08b76be78d8673599e54'), 'created_at': 'Tue Jan 14 00:17:55 +0000 2020', 'id_str': '1216877065481252867', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5'}
{'_id': ObjectId('5e1d08b96be78d8673599e55'), 'created_at': 'Tue Jan 14 00:17:56 +0000 2020', 'id_str': '1216877070594211840', 'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'}
{'_id': ObjectId('5e1d08b96be78d8673599e56'), 'created_at': 'Tue Jan 14 00:17:56 +0000 2020', 'id_str': '1216877071177342979', 'text': 'actual footage of me because i have to TA  programming classes tomorrow for a total of 4 hours'}
{'_id': ObjectId('5e1d08bd6be78d8673599e57'), 'created_at': 'Tue Jan 14 00:18:01 +0000 2020', 'id_str': '1216877088730439680', 'text': 'Take part in the #SPIE Career Summit, our professional development programming at #PhotonicsWest 2020! \n\nCheck out… https://t.co/L1ej80GLtq'}
{'_id': ObjectId('5e1d08be6be78d8673599e58'), 'created_at': 'Tue Jan 14 00:17:58 +0000 2020', 'id_str': '1216877076021534720', 'text': '@Mandoline_Blue Those energies, hard coded into our genetic programming, can (not always) find a twisted way out if… https://t.co/TLAJEnJc6h'}
{'_id': ObjectId('5e1d08be6be78d8673599e59'), 'created_at': 'Tue Jan 14 00:18:02 +0000 2020', 'id_str': '1216877095667716096', 'text': 'もう火曜日。\nImperative  programming vs. Declarative :\n命令型プログラミング vs. 宣言型プログラミング'}
{'_id': ObjectId('5e1d08bf6be78d8673599e5a'), 'created_at': 'Tue Jan 14 00:18:02 +0000 2020', 'id_str': '1216877096472940544', 'text': 'Itu csy kalo suatu saat nongol di Java Jazz, gue ga heran'}
{'_id': ObjectId('5e1d08c06be78d8673599e5b'), 'created_at': 'Tue Jan 14 00:18:03 +0000 2020', 'id_str': '1216877099937603584', 'text': 'Medical identity theft can leave you with big bills for procedures, treatment and equipment you never asked for or… https://t.co/hikhwEFoPo'}
{'_id': ObjectId('5e1d08c26be78d8673599e5c'), 'created_at': 'Tue Jan 14 00:18:06 +0000 2020', 'id_str': '1216877109865537537', 'text': '[Feature] Babel plugin: Add import URL version tag https://t.co/uObz0wNfua #github #JavaScript #TypeScript #CSS #HTML'}
{'_id': ObjectId('5e1d08c26be78d8673599e5d'), 'created_at': 'Tue Jan 14 00:18:03 +0000 2020', 'id_str': '1216877097899130880', 'text': 'There are many ways to profit off your health data, which leaves you with a big and sometimes life-threatening mess… https://t.co/nMhkQ793oe'}
{'_id': ObjectId('5e1d08c36be78d8673599e5e'), 'created_at': 'Tue Jan 14 00:18:07 +0000 2020', 'id_str': '1216877114709946369', 'text': 'RT @javascriptflx: 30 Free Resources To Help You Learn JavaScript Fundamentals https://t.co/W1C5eXVUkp  #Javascript'}
{'_id': ObjectId('5e1d08c36be78d8673599e5f'), 'created_at': 'Tue Jan 14 00:18:07 +0000 2020', 'id_str': '1216877116308033536', 'text': "Sr DevOps Developer - perm/downtown Toronto - Java/Python/Ruby or C req'd - build software to improve build/release… https://t.co/3qmpVgWt9Q"}
{'_id': ObjectId('5e1d08cd6be78d8673599e60'), 'created_at': 'Tue Jan 14 00:18:17 +0000 2020', 'id_str': '1216877157114437632', 'text': 'Malicious JavaScript package was only active on the npm repository for two weeks. Microsoft spots malicious npm pac… https://t.co/hZHWiiadOh'}
{'_id': ObjectId('5e1d08cf6be78d8673599e61'), 'created_at': 'Tue Jan 14 00:18:19 +0000 2020', 'id_str': '1216877166555627520', 'text': 'RT @SevenHillsUlti: We are submitting bids for YCC this summer! For more details or answers to some questions, check out our website: https…'}
{'_id': ObjectId('5e1d08d26be78d8673599e62'), 'created_at': 'Tue Jan 14 00:18:21 +0000 2020', 'id_str': '1216877175460200448', 'text': "RT @juddy_96: Let me put Japan's situation in smash terms. Smash 4 Shulk. Hey he has all this great stuff. Let's give him shit frame data.…"}
{'_id': ObjectId('5e1d08d26be78d8673599e63'), 'created_at': 'Tue Jan 14 00:18:22 +0000 2020', 'id_str': '1216877177062481920', 'text': 'RT @BenjySarlin: A realistic scenario right now:\n\n-Trump WH asks courts to end protections for pre-existing conditions\n\n-Trump re-elected w…'}
{'_id': ObjectId('5e1d08d26be78d8673599e64'), 'created_at': 'Tue Jan 14 00:18:22 +0000 2020', 'id_str': '1216877178580803584', 'text': "RT @Brilliance100: We'll give you A's in your classes. Pay us for\n#essay\n#homework\n#assignment\n#discussion\n#code Java PHP C#\n#Programming p…"}
{'_id': ObjectId('5e1d08d36be78d8673599e65'), 'created_at': 'Tue Jan 14 00:18:22 +0000 2020', 'id_str': '1216877179658698752', 'text': 'RT @sicsuper: ¡Proteger tus datos personales es muy importante!\nEncuentra las recomendaciones que Big Data y la #SICSuper te dejamos aquí 👉…'}
{'_id': ObjectId('5e1d08d66be78d8673599e66'), 'created_at': 'Tue Jan 14 00:18:25 +0000 2020', 'id_str': '1216877192744849408', 'text': 'We back to regular programming boiiiis'}
{'_id': ObjectId('5e1d08d86be78d8673599e67'), 'created_at': 'Tue Jan 14 00:18:27 +0000 2020', 'id_str': '1216877200940683265', 'text': "RT @Cawfree: Here's the Boston Housing dataset for training #regression networks in #tensorflow #NeuralNetworks in #javascript.\n\nhttps://t.…"}
{'_id': ObjectId('5e1d08d96be78d8673599e68'), 'created_at': 'Tue Jan 14 00:18:28 +0000 2020', 'id_str': '1216877205730426881', 'text': 'RT @nytimesworld: “There aren’t that many things that are quintessentially Canadian, but skating is one of them,” said a university profess…'}
{'_id': ObjectId('5e1d08de6be78d8673599e69'), 'created_at': 'Tue Jan 14 00:18:34 +0000 2020', 'id_str': '1216877226819489792', 'text': 'What to Pay #JavaScript #Developers in 2020 via https://t.co/prqxSCAEJ8 https://t.co/3nNlRg8PQK'}
{'_id': ObjectId('5e1d08df6be78d8673599e6a'), 'created_at': 'Tue Jan 14 00:18:35 +0000 2020', 'id_str': '1216877233584865281', 'text': '@msRachel9 As soon as we have programming news we’ll announce it here 😘'}
{'_id': ObjectId('5e1d08e36be78d8673599e6b'), 'created_at': 'Tue Jan 14 00:18:39 +0000 2020', 'id_str': '1216877249686855680', 'text': "My father just discovered that Steven Seagal was a real cop. Well he discovered Steven Seagal Law Man.\n\nThat's what… https://t.co/B1BMeIi25n"}
{'_id': ObjectId('5e1d08e66be78d8673599e6c'), 'created_at': 'Tue Jan 14 00:18:42 +0000 2020', 'id_str': '1216877261749735424', 'text': 'RT @RiverVanRain: What to Pay #JavaScript #Developers in 2020 via https://t.co/prqxSCAEJ8 https://t.co/3nNlRg8PQK'}
{'_id': ObjectId('5e1d08e66be78d8673599e6d'), 'created_at': 'Tue Jan 14 00:18:42 +0000 2020', 'id_str': '1216877262848581632', 'text': 'RT @MauraAlwyen: Science has just as many false prophets as religion and American politics does. Data, the Scriptures, and the Constitution…'}
{'_id': ObjectId('5e1d08ee6be78d8673599e6e'), 'created_at': 'Tue Jan 14 00:18:49 +0000 2020', 'id_str': '1216877293773238272', 'text': 'RT @MattKresslein: Join us for the SOKY Robot Royale on Feb. 26th @GRRECKY!  EV3 &amp; Sphero Competitions, Drone Programming/Flying, @Scribit_…'}
{'_id': ObjectId('5e1d08ee6be78d8673599e6f'), 'created_at': 'Tue Jan 14 00:18:50 +0000 2020', 'id_str': '1216877295765311489', 'text': 'RT @WjgotINrU14Z1fB: Javaで3年くらいやると、他言語の実業務に参加可能になるやつが増えてくる。\n\nなんでJavaだとそうなのかはわからないが、お堅い言語であるが故、信用されてる部分があるっぽい。\n\n実際のところ、言語転換の際に現場で困った話も聞かない。…'}
{'_id': ObjectId('5e1d08ee6be78d8673599e70'), 'created_at': 'Tue Jan 14 00:18:50 +0000 2020', 'id_str': '1216877296461795329', 'text': 'RT @Gurgling_MrD: Malicious JavaScript package was only active on the npm repository for two weeks. Microsoft spots malicious npm package s…'}
{'_id': ObjectId('5e1d08f06be78d8673599e71'), 'created_at': 'Tue Jan 14 00:18:52 +0000 2020', 'id_str': '1216877302845304832', 'text': "RT @JamesFourM: @dark_wisdom_ @b_ofrights @TrickFreee @dcpoll @ninaandtito @3L3V3NTH @CORLEBRA777 Hey bruh. Let's not forget Bob Dole ➡️ Ma…"}
{'_id': ObjectId('5e1d08f16be78d8673599e72'), 'created_at': 'Tue Jan 14 00:18:53 +0000 2020', 'id_str': '1216877308386185216', 'text': 'RT @platzi: 📚 Seis Libros para mejorar tu conocimiento de Data Science 👇\n#NuncaParesDeAprender\nhttps://t.co/569j3rREx0 https://t.co/69KqUNy…'}
{'_id': ObjectId('5e1d08f16be78d8673599e73'), 'created_at': 'Tue Jan 14 00:18:53 +0000 2020', 'id_str': '1216877308491051009', 'text': 'Applied for college and university today, mainly computer programming for Colledge and a English major for universi… https://t.co/WhrU7gq7Q9'}
{'_id': ObjectId('5e1d08f66be78d8673599e74'), 'created_at': 'Tue Jan 14 00:18:58 +0000 2020', 'id_str': '1216877328266981376', 'text': 'RT @JamesFourM: @CORLEBRA777\n@ninaandtito\n\nFounder &amp; pres of Grassroots Targeting worked for Bob &amp; Elizabeth Dole &amp; as  adviser to Reince P…'}
{'_id': ObjectId('5e1d08f86be78d8673599e75'), 'created_at': 'Tue Jan 14 00:19:00 +0000 2020', 'id_str': '1216877337070850048', 'text': "RT @sarah_edo: 🎉 If you're interested in learning how to animate on the web with JavaScript, I wrote up a post on how to animate with @gree…"}
{'_id': ObjectId('5e1d08fb6be78d8673599e76'), 'created_at': 'Tue Jan 14 00:19:02 +0000 2020', 'id_str': '1216877347292532736', 'text': 'RT @RobotMakerGirl: The first part of the “thing” is officially built and tested. Now on to the programming stage! Then the woodworking sta…'}
{'_id': ObjectId('5e1d08fb6be78d8673599e77'), 'created_at': 'Tue Jan 14 00:19:02 +0000 2020', 'id_str': '1216877347535826946', 'text': 'Moderated a data science panel yesterday\n当我准备总结一个数据科学研讨环节时,问三位嘉宾:假如,您公司现在就开始没有数据,您的业务将会怎样?他们那惊讶的神情,告诉了我们数据对业务发展的重要性… https://t.co/JXnU7igBRD'}
{'_id': ObjectId('5e1d08fe6be78d8673599e78'), 'created_at': 'Tue Jan 14 00:19:06 +0000 2020', 'id_str': '1216877361842544641', 'text': 'Hi, I can do the class for you\nDM or Email✉ EssayNerd7@gmail.com \n\nGuarantees:\n✴an A+ Grade√√\n✴Timely Completion ⏱… https://t.co/UBs4lIMgBG'}
{'_id': ObjectId('5e1d09016be78d8673599e79'), 'created_at': 'Tue Jan 14 00:19:08 +0000 2020', 'id_str': '1216877373045473280', 'text': 'For some reason remembering languages/tools I’ve developed in I haven’t heard much about in years.\n#Powerbuilder,… https://t.co/CcYD8Ux1pX'}
{'_id': ObjectId('5e1d09016be78d8673599e7a'), 'created_at': 'Tue Jan 14 00:19:09 +0000 2020', 'id_str': '1216877373586624514', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'}
{'_id': ObjectId('5e1d09016be78d8673599e7b'), 'created_at': 'Tue Jan 14 00:19:09 +0000 2020', 'id_str': '1216877375968989184', 'text': 'Gina Carano in a suit.....thats is all, we will now go back to your regularly scheduled programming #thisistheway https://t.co/QIC4xdsuhv'}
{'_id': ObjectId('5e1d09026be78d8673599e7c'), 'created_at': 'Tue Jan 14 00:19:10 +0000 2020', 'id_str': '1216877378330218496', 'text': 'RT @spring_io: First milestone of Spring Boot 2.3 will be released this Thursday and will GA two weeks before Spring I/O.\n\nDon’t miss out a…'}
{'_id': ObjectId('5e1d09046be78d8673599e7d'), 'created_at': 'Tue Jan 14 00:19:11 +0000 2020', 'id_str': '1216877385930432512', 'text': 'RT @genentech: Heading to #JPM20? Download S3E05 of our #podcast and find out more about the role of big data in #PersonalizedMedicine from…'}
{'_id': ObjectId('5e1d09046be78d8673599e7e'), 'created_at': 'Tue Jan 14 00:19:12 +0000 2020', 'id_str': '1216877387318616064', 'text': 'おはようございます☀\n\n#今日の積み上げ  予定\n✅#30DAYSトライアル 2nd Day3\n\n引き続きJavaScriptの学習です🏃\u200d♂️\n\n通勤往復中にProgateアプリ版→帰宅後パソコン版の流れ最強だったので本日も同じスタイルでいきます💪\n\n#駆け出しエンジニア'}
{'_id': ObjectId('5e1d09046be78d8673599e7f'), 'created_at': 'Tue Jan 14 00:19:12 +0000 2020', 'id_str': '1216877388753264641', 'text': 'RT @PVNCCDSB: As a result of a planned one-day full withdrawal of service by our teachers on Tuesday, Jan. 21, 2020, the Board will be clos…'}
{'_id': ObjectId('5e1d09086be78d8673599e80'), 'created_at': 'Tue Jan 14 00:19:15 +0000 2020', 'id_str': '1216877401822466048', 'text': 'Tapos na event so wala na akong ipopost na annoucements and shiz I am back to regular programming welcome to my kal… https://t.co/NGsR2RSEtm'}
{'_id': ObjectId('5e1d09086be78d8673599e81'), 'created_at': 'Tue Jan 14 00:19:16 +0000 2020', 'id_str': '1216877404041379847', 'text': 'RT @platzi: 📚 Seis Libros para mejorar tu conocimiento de Data Science 👇\n#NuncaParesDeAprender\nhttps://t.co/569j3rREx0 https://t.co/69KqUNy…'}
{'_id': ObjectId('5e1d09096be78d8673599e82'), 'created_at': 'Tue Jan 14 00:19:17 +0000 2020', 'id_str': '1216877408147533824', 'text': 'RT @strnr: Eleven tips for working with big data https://t.co/KrdaN4gxSh\nKeep raw data raw\nViz\nRecord workflow\nUse version ctrl\nRecord meta…'}
{'_id': ObjectId('5e1d09096be78d8673599e83'), 'created_at': 'Tue Jan 14 00:19:17 +0000 2020', 'id_str': '1216877408718028800', 'text': '@AnimalDefenceBZ @DataCassette Please enforce the law against dog and wild boar fighting! Plz sign: https://t.co/n3pdX3hOP8'}
{'_id': ObjectId('5e1d090d6be78d8673599e84'), 'created_at': 'Tue Jan 14 00:19:20 +0000 2020', 'id_str': '1216877423142297600', 'text': 'Rock it: A Cradle Story — An Arduino-powered Baby Crib Rocker\n\n☞ https://t.co/jrrPvUwrGv\n\n#arduino #programming https://t.co/niOfINyVkE'}
{'_id': ObjectId('5e1d090e6be78d8673599e85'), 'created_at': 'Tue Jan 14 00:19:22 +0000 2020', 'id_str': '1216877428603117568', 'text': 'RT @xximbecile: Bullshit. I was born in Madiun, live most of my youth without internet because my family is poor. And I know I read a lot.…'}
{'_id': ObjectId('5e1d09106be78d8673599e86'), 'created_at': 'Tue Jan 14 00:19:24 +0000 2020', 'id_str': '1216877436916379652', 'text': 'RT @sethrosen: Just converted to @webflow after years of preaching squarespace. Wow - just wow. \n\nI truly see why *this* is called no-code.…'}
{'_id': ObjectId('5e1d09106be78d8673599e87'), 'created_at': 'Tue Jan 14 00:19:24 +0000 2020', 'id_str': '1216877437570543618', 'text': "@SimonJo37129961 @Rectitude20 On the contrary, you're not appealing to the science &amp; data because epidemiological s… https://t.co/sqR3pkPIeR"}
{'_id': ObjectId('5e1d09126be78d8673599e88'), 'created_at': 'Tue Jan 14 00:19:26 +0000 2020', 'id_str': '1216877445447438336', 'text': "Always the best bang for your buck of any pod out there, thank you guys. Y'all gotta check them out… https://t.co/gwg4EZKx58"}
{'_id': ObjectId('5e1d09156be78d8673599e89'), 'created_at': 'Tue Jan 14 00:19:29 +0000 2020', 'id_str': '1216877458613587976', 'text': 'RT @bass_analytics: An Effective Python Environment: Making Yourself at Home\n@realpython #Python #programming #coding\nhttps://t.co/jMkY3xyU…'}
{'_id': ObjectId('5e1d09166be78d8673599e8a'), 'created_at': 'Tue Jan 14 00:19:30 +0000 2020', 'id_str': '1216877463633969152', 'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'}
{'_id': ObjectId('5e1d09186be78d8673599e8b'), 'created_at': 'Tue Jan 14 00:19:31 +0000 2020', 'id_str': '1216877469652914176', 'text': 'Acquista il libro "Big Data, WebFare e Reddito per tutti. Quaderni per il Reddito n°9". Sostieni il BIN Italia - BI… https://t.co/R55bbOsxa3'}
{'_id': ObjectId('5e1d09196be78d8673599e8c'), 'created_at': 'Tue Jan 14 00:19:33 +0000 2020', 'id_str': '1216877475239616513', 'text': 'RT @MajoLedes: ✨Dejo esto por aquí.. \n\nHice un apunte de 24 páginas sobre conceptos principales de ReactJS🙈\n\nPueden ver el apunte completo…'}
{'_id': ObjectId('5e1d091a6be78d8673599e8d'), 'created_at': 'Tue Jan 14 00:19:33 +0000 2020', 'id_str': '1216877477403840512', 'text': 'RT @iowahawkblog: fun fact: this advanced state-of-the are artificial intelligence powered big data pizza thinkbot system was invented by T…'}
{'_id': ObjectId('5e1d091b6be78d8673599e8e'), 'created_at': 'Tue Jan 14 00:19:35 +0000 2020', 'id_str': '1216877483796107267', 'text': 'RT @javascriptflx: Hermes: A new open source JavaScript engine optimized for mobile apps https://t.co/Zn7Zed8SkV  #Javascript'}
{'_id': ObjectId('5e1d09216be78d8673599e8f'), 'created_at': 'Tue Jan 14 00:19:40 +0000 2020', 'id_str': '1216877507754020866', 'text': "RT @parscale: Big data from Toledo:\n\n✅ 22,927 Voters Identified\n\n✅ 18,210 Voters From Ohio\n\n✅ 5,216 Registrants Didn't Vote in 2016\n\n✅ 21.9…"}
{'_id': ObjectId('5e1d09216be78d8673599e90'), 'created_at': 'Tue Jan 14 00:19:41 +0000 2020', 'id_str': '1216877508559343625', 'text': 'Big 5 Sporting Goods $BGFV Anticipates Fiscal 2019 Fourth Quarter EPS to Exceed High End of Prior Guidance Range… https://t.co/fCTX0sWhon'}
{'_id': ObjectId('5e1d09226be78d8673599e91'), 'created_at': 'Tue Jan 14 00:19:42 +0000 2020', 'id_str': '1216877514049695752', 'text': 'RT @Arthur81288011: @A_Chapman101 @Jack62084141 Clear @HMRCgovuk must NOT be given new powers to automate processes that could cause distre…'}
{'_id': ObjectId('5e1d09266be78d8673599e92'), 'created_at': 'Tue Jan 14 00:19:46 +0000 2020', 'id_str': '1216877530222743553', 'text': '@RandallKopchak @OptimistPanda The problem (if you can call it that) was that DS9 was way ahead of its time in term… https://t.co/y2UI7XQjYm'}
{'_id': ObjectId('5e1d092b6be78d8673599e93'), 'created_at': 'Tue Jan 14 00:19:51 +0000 2020', 'id_str': '1216877549860663296', 'text': 'This thing is only growing. Excited to see what Gatsby will be like even 5 years from now.'}
{'_id': ObjectId('5e1d092c6be78d8673599e94'), 'created_at': 'Tue Jan 14 00:19:52 +0000 2020', 'id_str': '1216877555946414081', 'text': "2.  but oh well, it's cool data science!"}
{'_id': ObjectId('5e1d092e6be78d8673599e95'), 'created_at': 'Tue Jan 14 00:19:53 +0000 2020', 'id_str': '1216877561839484929', 'text': 'RT @KinarmLab: Kinarm Camp registration is now open!  Come join us June 8-12th in beautiful #ygk for a week of intensive #kinarm programmin…'}
{'_id': ObjectId('5e1d09306be78d8673599e96'), 'created_at': 'Tue Jan 14 00:19:56 +0000 2020', 'id_str': '1216877570819600389', 'text': 'RT @ElemTeachersTO: The #TDSB has cut $13 million dollars of French programming and is planning to eliminate Extended French starting next…'}
{'_id': ObjectId('5e1d09306be78d8673599e97'), 'created_at': 'Tue Jan 14 00:19:56 +0000 2020', 'id_str': '1216877570978803712', 'text': 'RT @byLilyV: FEATURED #COURSES\n\nThe #Data #Science #Course 2019: Complete Data Science Bootcamp\n\nBest Seller 144,730 students enrolled\n\nCom…'}
{'_id': ObjectId('5e1d09346be78d8673599e98'), 'created_at': 'Tue Jan 14 00:20:00 +0000 2020', 'id_str': '1216877588385271808', 'text': 'How to pack #Angular 8 applications on regular war files https://t.co/t1AXyA1wD1 #javascript #typescript #frontend #webdev'}
{'_id': ObjectId('5e1d09346be78d8673599e99'), 'created_at': 'Tue Jan 14 00:20:00 +0000 2020', 'id_str': '1216877589110951936', 'text': 'CoStar Group (@TheCoStarGroup) is hiring https://t.co/cWm6u5KE5o #reactjs #angularjs'}
{'_id': ObjectId('5e1d09376be78d8673599e9a'), 'created_at': 'Tue Jan 14 00:20:02 +0000 2020', 'id_str': '1216877599143665669', 'text': 'RT @NexWebSites: #Programming\n👇\nVisual Studio @code Keyboard Board Shortcuts for:\n \n👉Windows : PDF🔗: https://t.co/xxPqHUMjS3\n 👉#Linux : PDF…'}
{'_id': ObjectId('5e1d09376be78d8673599e9b'), 'created_at': 'Tue Jan 14 00:20:03 +0000 2020', 'id_str': '1216877600955621377', 'text': 'Everyone has his or her own way of analyzing data to find the right answers. This is why self-service in a business… https://t.co/264klNDvA1'}
{'_id': ObjectId('5e1d093d6be78d8673599e9c'), 'created_at': 'Tue Jan 14 00:20:09 +0000 2020', 'id_str': '1216877627937579011', 'text': 'RT @Payara_Fish: JavaFX Strikes Back - Latest #Airhacks podcast from @AdamBien\nCatching up with Gluons @johanvos, talking about advantages…'}
{'_id': ObjectId('5e1d09426be78d8673599e9d'), 'created_at': 'Tue Jan 14 00:20:13 +0000 2020', 'id_str': '1216877645977325569', 'text': '32 Tips For Every #WebDeveloper In 2020 #BetterProgramming via https://t.co/Q6JBQhnTTy https://t.co/3hwgAJhmSs'}

03 - Importando e analisando dados com Pandas e Scikit-Learn

In [268]:
# Build a list of plain records holding only each tweet's timestamp and text.
# The projection asks MongoDB to return just the two fields used here (and to
# omit `_id`), so the rest of each document is never sent to the client.
# Each record is still built by explicit key lookup, so a document missing
# either field raises KeyError rather than yielding an incomplete record.
dataset = [
    {"created_at": tweet["created_at"], "text": tweet["text"]}
    for tweet in colecao.find({}, {"_id": 0, "created_at": 1, "text": 1})
]
dataset
Out[268]:
[{'created_at': 'Tue Jan 14 00:14:44 +0000 2020',
  'text': 'RT @dcumoviepage: #ReleaseTheSnyderCut'},
 {'created_at': 'Tue Jan 14 00:15:41 +0000 2020',
  'text': 'RT @InfluxDB: Discover how a new #fluxlang feature that supports months and years as intervals while windowing enables deeper analysis of #…'},
 {'created_at': 'Tue Jan 14 00:15:51 +0000 2020',
  'text': '@realDonaldTrump Trump thinks his voters are dumb.\n\nhttps://t.co/Av2038b7q3'},
 {'created_at': 'Tue Jan 14 00:15:54 +0000 2020',
  'text': "RT @SethAbramson: 25/ Joel Zamel, a man close to the Israeli government—a key player in Flynn's Saudi Nuclear Deal—and a man recommended to…"},
 {'created_at': 'Tue Jan 14 00:16:05 +0000 2020',
  'text': '@Jhonitrejos @JorgeIvanOspina @lunadavid @kevingomezpaz @SergioMZamoraB @lftroyano Para que sea ciudad inteligente… https://t.co/WlSEnMOapV'},
 {'created_at': 'Tue Jan 14 00:16:08 +0000 2020',
  'text': 'RT @sicsuper: ¡Proteger tus datos personales es muy importante!\nEncuentra las recomendaciones que Big Data y la #SICSuper te dejamos aquí 👉…'},
 {'created_at': 'Tue Jan 14 00:16:33 +0000 2020',
  'text': 'RT @CatalogueBack: We interrupt our regular programming of pop culture and anime discussion posts to bring you @Cancelathon something fun I…'},
 {'created_at': 'Tue Jan 14 00:16:35 +0000 2020',
  'text': 'RT @NomadXrp: ⏰  PRICE UPDATE  🚀 \n\n⭐️ $XRP $ 0.2132\n24h -0.56% 📉\n\n⭐️ $BTC $ 8128.82\n24h -0.60% 📉\n\n⭐️ $ETH $ 143.88\n24h -1.67% 📉\n\n$xrp #thes…'},
 {'created_at': 'Tue Jan 14 00:16:36 +0000 2020',
  'text': 'BIG KETS ARE STILL KETS 😻😻😻😻'},
 {'created_at': 'Tue Jan 14 00:16:38 +0000 2020',
  'text': '[Cheat Sheet] Python Basics For Data Science https://t.co/LuZxXxs1dK'},
 {'created_at': 'Tue Jan 14 00:16:39 +0000 2020',
  'text': 'RT @Justin_Stolpe: Happy Monday! Learning about the Instagram Graph API this week! What are you learning about?\n.\n.\n#instagram #instagramap…'},
 {'created_at': 'Tue Jan 14 00:16:39 +0000 2020',
  'text': 'RT @davarcar1: @Jhonitrejos @JorgeIvanOspina @lunadavid @kevingomezpaz @SergioMZamoraB @lftroyano Para que sea ciudad inteligente de pasar…'},
 {'created_at': 'Tue Jan 14 00:16:47 +0000 2020',
  'text': '"They are typically very experienced, having worked on many different projects under a wide variety of circumstance… https://t.co/mWRTfNnRmX'},
 {'created_at': 'Tue Jan 14 00:16:51 +0000 2020',
  'text': '@iceagereentry @rcsteeb Don’t worry, all is well. 😉 https://t.co/5jxh8gXtTk'},
 {'created_at': 'Tue Jan 14 00:16:51 +0000 2020',
  'text': 'It "amazes" ME how an "influencer"  like @MarkDice hasn\'t TOUCHED UPON the "blatant" SYMBOLISM being shown on… https://t.co/WhB32QifGF'},
 {'created_at': 'Tue Jan 14 00:16:54 +0000 2020',
  'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'},
 {'created_at': 'Tue Jan 14 00:16:55 +0000 2020',
  'text': 'RT @HawkinsTammy: Know #javascript and looking for a new gig in #California? #Blizzard Entertainment is looking for an Associate Software W…'},
 {'created_at': 'Tue Jan 14 00:16:55 +0000 2020',
  'text': 'Coffee and code. NodeJs tutorial. Then I will do some ReactJs tutorials.\n\nChristmas cat mug FTW! https://t.co/8ATWXMVAqV'},
 {'created_at': 'Tue Jan 14 00:17:00 +0000 2020',
  'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'},
 {'created_at': 'Tue Jan 14 00:17:01 +0000 2020',
  'text': "📚 Wiley's Professional JavaScript for Web Developers is an essential guide to next-level ES6 and ES7 JavaScript dev… https://t.co/uyZB7AJ0en"},
 {'created_at': 'Tue Jan 14 00:17:05 +0000 2020',
  'text': 'With a few commands I can upgrade: sysinternals notepadplusplus googlechrome 7zip firefox SQLSentryPlanExplorer  vi… https://t.co/JkfFZEZPyB'},
 {'created_at': 'Tue Jan 14 00:17:07 +0000 2020',
  'text': 'New #job: Senior Fullstack Dev - JAVA and API Location: Wellington Central .. https://t.co/R8zY2oD9w6 #jobs #hiring'},
 {'created_at': 'Tue Jan 14 00:17:08 +0000 2020',
  'text': 'Feature request: add `base16` default themes, the next evolution of `Tomorrow` themes https://t.co/e99xcYh1aL… https://t.co/ShFLk4a0mj'},
 {'created_at': 'Tue Jan 14 00:17:11 +0000 2020',
  'text': 'insert baby yoda picture with caption \n\n“big kitties”'},
 {'created_at': 'Tue Jan 14 00:17:14 +0000 2020',
  'text': 'RT @IsTheArchitect: Why #Python is better than #R for #DataScience careers.\n\nhttps://t.co/cyTiSBpV4P\n#dataengineering #bigdata'},
 {'created_at': 'Tue Jan 14 00:17:17 +0000 2020',
  'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'},
 {'created_at': 'Tue Jan 14 00:17:20 +0000 2020',
  'text': 'RT @Brilliance100: We handle:\n\nStatistics online classes\nPrecalculus\nAlgebra\nTrigonometry\nLinear programming\nMeasurements\nData analysis\nSPS…'},
 {'created_at': 'Tue Jan 14 00:17:21 +0000 2020',
  'text': 'RT @AlRokerEnt: "We are proud to debut this African American focused channel, created by and for the members of the black community." - Jam…'},
 {'created_at': 'Tue Jan 14 00:17:22 +0000 2020',
  'text': 'RT @nep_developer: Day: 08 of #100DaysOfCode \n-Pause the Tracker App(for a week)\n-Started a new project Planner that used firebase,\n\n------…'},
 {'created_at': 'Tue Jan 14 00:17:23 +0000 2020',
  'text': "RT @shog9: Well... I suddenly find myself in need of work. \nIf anyone's hiring: C++, JavaScript, C#, SQL + solid background in social softw…"},
 {'created_at': 'Tue Jan 14 00:17:25 +0000 2020',
  'text': 'RT @brunoborges: For all maintainers of #Java frameworks and libraries, ping @ashleymcnamara and share your story.\n\n// @jtgreene @phillip_w…'},
 {'created_at': 'Tue Jan 14 00:17:28 +0000 2020',
  'text': '¡El último Cience, Technology &amp; Programming  Daily! https://t.co/LTH701EPUt Gracias a @CTcard44 @schoolprobIems… https://t.co/CVFHa0My36'},
 {'created_at': 'Tue Jan 14 00:17:29 +0000 2020',
  'text': 'New #job: Business Intelligence Analyst Location: Las Vegas .. https://t.co/jXAS0kPEL6 #jobs #hiring'},
 {'created_at': 'Tue Jan 14 00:17:32 +0000 2020',
  'text': 'RT @DD_FaFa_: Data Science from Scratch: Comprehensive guide with essential principles of Data Science https://t.co/xgdtkXevAm #DataScience'},
 {'created_at': 'Tue Jan 14 00:17:34 +0000 2020',
  'text': 'RT @motherofnodejs: I am not lazy, I just save energy 😑 #programming #coding #programmer #javascript #coder #php #java #programminglife #de…'},
 {'created_at': 'Tue Jan 14 00:17:34 +0000 2020',
  'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5'},
 {'created_at': 'Tue Jan 14 00:17:35 +0000 2020',
  'text': 'FREE Webinar: Tuesday, 21 January 2020, 9 am EST for a review of #compositional #analysis by Handheld #XRF, along w… https://t.co/FvRX3YQDeB'},
 {'created_at': 'Tue Jan 14 00:17:35 +0000 2020',
  'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'},
 {'created_at': 'Tue Jan 14 00:17:36 +0000 2020',
  'text': 'RT @susanhash: Leverage #CustomerData to identify opportunities for #proactive #custserv - Jon Christiansen of data science firm Ins &amp; Outs…'},
 {'created_at': 'Tue Jan 14 00:17:36 +0000 2020',
  'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'},
 {'created_at': 'Tue Jan 14 00:17:36 +0000 2020',
  'text': "RT @h_ingo: TIL there's a Java version for one of the greatest performance diagnostics tools ever, PoorMansProfiler."},
 {'created_at': 'Tue Jan 14 00:17:36 +0000 2020',
  'text': 'RT @lakwatsarah: BIG KETS ARE STILL KETS 😻😻😻😻'},
 {'created_at': 'Tue Jan 14 00:17:38 +0000 2020',
  'text': 'RT @PriscillaWT: The grandson of House Democratic Whip James Clyburn, D-S.C., has cut a radio ad invoking his grandfather’s legacy and call…'},
 {'created_at': 'Tue Jan 14 00:17:40 +0000 2020',
  'text': 'RT @ActionableInsi3: [Cheat Sheet] Python Basics For Data Science https://t.co/LuZxXxs1dK'},
 {'created_at': 'Tue Jan 14 00:17:40 +0000 2020',
  'text': "RT @chey_cobb: Soooo... \nWhat's scarier?\n* Foreign intelligence agencies listening in on you?\n* Domestic intelligence agencies listening in…"},
 {'created_at': 'Tue Jan 14 00:17:41 +0000 2020',
  'text': 'I want nothing more than to hug a mf lion. Look at how cute and cuddly this big fluffs are!!!! I can’t handle it 😍😍'},
 {'created_at': 'Tue Jan 14 00:17:42 +0000 2020',
  'text': '☀ Hiring: #Big Data Engineer\n#AI #Analyst #BigData #Developer #Plano #techjobs #devjobs\nApply Now &gt;&gt;… https://t.co/f67B6uP1sU'},
 {'created_at': 'Tue Jan 14 00:17:42 +0000 2020',
  'text': 'RT @pdakean: Original study that found relation was retracted for data manipulation. The relation was never there but now epidemics are com…'},
 {'created_at': 'Tue Jan 14 00:17:46 +0000 2020',
  'text': '@PoetWalker We need an independent revival, like French New Wave, maybe. Films not involving enormous corporations… https://t.co/9PUgw6EdsE'},
 {'created_at': 'Tue Jan 14 00:17:48 +0000 2020',
  'text': '@EFL_law @KingMeren You are right - in theory this should not be that big of a deal. But you are giving the team mo… https://t.co/Cwn6ojUhX4'},
 {'created_at': 'Tue Jan 14 00:17:49 +0000 2020',
  'text': 'Practical Data Science with Hadoop and Spark: Designing and Building Effective Analytics at Scale (Addison-wesley D… https://t.co/zDsJpGTSoI'},
 {'created_at': 'Tue Jan 14 00:17:50 +0000 2020',
  'text': 'RT @MikelJoachim: Starting a “methods journal club” with grad students &amp; post-docs in @UWBadgerAP to discuss data organization, study desig…'},
 {'created_at': 'Tue Jan 14 00:17:50 +0000 2020',
  'text': 'RT @nep_developer: Day: 08 of #100DaysOfCode \n-Pause the Tracker App(for a week)\n-Started a new project Planner that used firebase,\n\n------…'},
 {'created_at': 'Tue Jan 14 00:17:54 +0000 2020',
  'text': 'RT @NoContextVinny: And we return to your regular programming. https://t.co/N9bbwoYtkp'},
 {'created_at': 'Tue Jan 14 00:17:54 +0000 2020',
  'text': 'Current standard of discourse on the net: "I know nothing I write here will change your mind, because you are alrea… https://t.co/OMa09Z0Gz6'},
 {'created_at': 'Tue Jan 14 00:17:55 +0000 2020',
  'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5'},
 {'created_at': 'Tue Jan 14 00:17:56 +0000 2020',
  'text': 'RT @neilonsoftware: "They are typically very experienced, having worked on many different projects under a wide variety of circumstances."…'},
 {'created_at': 'Tue Jan 14 00:17:56 +0000 2020',
  'text': 'actual footage of me because i have to TA  programming classes tomorrow for a total of 4 hours'},
 {'created_at': 'Tue Jan 14 00:18:01 +0000 2020',
  'text': 'Take part in the #SPIE Career Summit, our professional development programming at #PhotonicsWest 2020! \n\nCheck out… https://t.co/L1ej80GLtq'},
 {'created_at': 'Tue Jan 14 00:17:58 +0000 2020',
  'text': '@Mandoline_Blue Those energies, hard coded into our genetic programming, can (not always) find a twisted way out if… https://t.co/TLAJEnJc6h'},
 {'created_at': 'Tue Jan 14 00:18:02 +0000 2020',
  'text': 'もう火曜日。\nImperative  programming vs. Declarative :\n命令型プログラミング vs. 宣言型プログラミング'},
 {'created_at': 'Tue Jan 14 00:18:02 +0000 2020',
  'text': 'Itu csy kalo suatu saat nongol di Java Jazz, gue ga heran'},
 {'created_at': 'Tue Jan 14 00:18:03 +0000 2020',
  'text': 'Medical identity theft can leave you with big bills for procedures, treatment and equipment you never asked for or… https://t.co/hikhwEFoPo'},
 {'created_at': 'Tue Jan 14 00:18:06 +0000 2020',
  'text': '[Feature] Babel plugin: Add import URL version tag https://t.co/uObz0wNfua #github #JavaScript #TypeScript #CSS #HTML'},
 {'created_at': 'Tue Jan 14 00:18:03 +0000 2020',
  'text': 'There are many ways to profit off your health data, which leaves you with a big and sometimes life-threatening mess… https://t.co/nMhkQ793oe'},
 {'created_at': 'Tue Jan 14 00:18:07 +0000 2020',
  'text': 'RT @javascriptflx: 30 Free Resources To Help You Learn JavaScript Fundamentals https://t.co/W1C5eXVUkp  #Javascript'},
 {'created_at': 'Tue Jan 14 00:18:07 +0000 2020',
  'text': "Sr DevOps Developer - perm/downtown Toronto - Java/Python/Ruby or C req'd - build software to improve build/release… https://t.co/3qmpVgWt9Q"},
 {'created_at': 'Tue Jan 14 00:18:17 +0000 2020',
  'text': 'Malicious JavaScript package was only active on the npm repository for two weeks. Microsoft spots malicious npm pac… https://t.co/hZHWiiadOh'},
 {'created_at': 'Tue Jan 14 00:18:19 +0000 2020',
  'text': 'RT @SevenHillsUlti: We are submitting bids for YCC this summer! For more details or answers to some questions, check out our website: https…'},
 {'created_at': 'Tue Jan 14 00:18:21 +0000 2020',
  'text': "RT @juddy_96: Let me put Japan's situation in smash terms. Smash 4 Shulk. Hey he has all this great stuff. Let's give him shit frame data.…"},
 {'created_at': 'Tue Jan 14 00:18:22 +0000 2020',
  'text': 'RT @BenjySarlin: A realistic scenario right now:\n\n-Trump WH asks courts to end protections for pre-existing conditions\n\n-Trump re-elected w…'},
 {'created_at': 'Tue Jan 14 00:18:22 +0000 2020',
  'text': "RT @Brilliance100: We'll give you A's in your classes. Pay us for\n#essay\n#homework\n#assignment\n#discussion\n#code Java PHP C#\n#Programming p…"},
 {'created_at': 'Tue Jan 14 00:18:22 +0000 2020',
  'text': 'RT @sicsuper: ¡Proteger tus datos personales es muy importante!\nEncuentra las recomendaciones que Big Data y la #SICSuper te dejamos aquí 👉…'},
 {'created_at': 'Tue Jan 14 00:18:25 +0000 2020',
  'text': 'We back to regular programming boiiiis'},
 {'created_at': 'Tue Jan 14 00:18:27 +0000 2020',
  'text': "RT @Cawfree: Here's the Boston Housing dataset for training #regression networks in #tensorflow #NeuralNetworks in #javascript.\n\nhttps://t.…"},
 {'created_at': 'Tue Jan 14 00:18:28 +0000 2020',
  'text': 'RT @nytimesworld: “There aren’t that many things that are quintessentially Canadian, but skating is one of them,” said a university profess…'},
 {'created_at': 'Tue Jan 14 00:18:34 +0000 2020',
  'text': 'What to Pay #JavaScript #Developers in 2020 via https://t.co/prqxSCAEJ8 https://t.co/3nNlRg8PQK'},
 {'created_at': 'Tue Jan 14 00:18:35 +0000 2020',
  'text': '@msRachel9 As soon as we have programming news we’ll announce it here 😘'},
 {'created_at': 'Tue Jan 14 00:18:39 +0000 2020',
  'text': "My father just discovered that Steven Seagal was a real cop. Well he discovered Steven Seagal Law Man.\n\nThat's what… https://t.co/B1BMeIi25n"},
 {'created_at': 'Tue Jan 14 00:18:42 +0000 2020',
  'text': 'RT @RiverVanRain: What to Pay #JavaScript #Developers in 2020 via https://t.co/prqxSCAEJ8 https://t.co/3nNlRg8PQK'},
 {'created_at': 'Tue Jan 14 00:18:42 +0000 2020',
  'text': 'RT @MauraAlwyen: Science has just as many false prophets as religion and American politics does. Data, the Scriptures, and the Constitution…'},
 {'created_at': 'Tue Jan 14 00:18:49 +0000 2020',
  'text': 'RT @MattKresslein: Join us for the SOKY Robot Royale on Feb. 26th @GRRECKY!  EV3 &amp; Sphero Competitions, Drone Programming/Flying, @Scribit_…'},
 {'created_at': 'Tue Jan 14 00:18:50 +0000 2020',
  'text': 'RT @WjgotINrU14Z1fB: Javaで3年くらいやると、他言語の実業務に参加可能になるやつが増えてくる。\n\nなんでJavaだとそうなのかはわからないが、お堅い言語であるが故、信用されてる部分があるっぽい。\n\n実際のところ、言語転換の際に現場で困った話も聞かない。…'},
 {'created_at': 'Tue Jan 14 00:18:50 +0000 2020',
  'text': 'RT @Gurgling_MrD: Malicious JavaScript package was only active on the npm repository for two weeks. Microsoft spots malicious npm package s…'},
 {'created_at': 'Tue Jan 14 00:18:52 +0000 2020',
  'text': "RT @JamesFourM: @dark_wisdom_ @b_ofrights @TrickFreee @dcpoll @ninaandtito @3L3V3NTH @CORLEBRA777 Hey bruh. Let's not forget Bob Dole ➡️ Ma…"},
 {'created_at': 'Tue Jan 14 00:18:53 +0000 2020',
  'text': 'RT @platzi: 📚 Seis Libros para mejorar tu conocimiento de Data Science 👇\n#NuncaParesDeAprender\nhttps://t.co/569j3rREx0 https://t.co/69KqUNy…'},
 {'created_at': 'Tue Jan 14 00:18:53 +0000 2020',
  'text': 'Applied for college and university today, mainly computer programming for Colledge and a English major for universi… https://t.co/WhrU7gq7Q9'},
 {'created_at': 'Tue Jan 14 00:18:58 +0000 2020',
  'text': 'RT @JamesFourM: @CORLEBRA777\n@ninaandtito\n\nFounder &amp; pres of Grassroots Targeting worked for Bob &amp; Elizabeth Dole &amp; as  adviser to Reince P…'},
 {'created_at': 'Tue Jan 14 00:19:00 +0000 2020',
  'text': "RT @sarah_edo: 🎉 If you're interested in learning how to animate on the web with JavaScript, I wrote up a post on how to animate with @gree…"},
 {'created_at': 'Tue Jan 14 00:19:02 +0000 2020',
  'text': 'RT @RobotMakerGirl: The first part of the “thing” is officially built and tested. Now on to the programming stage! Then the woodworking sta…'},
 {'created_at': 'Tue Jan 14 00:19:02 +0000 2020',
  'text': 'Moderated a data science panel yesterday\n当我准备总结一个数据科学研讨环节时,问三位嘉宾:假如,您公司现在就开始没有数据,您的业务将会怎样?他们那惊讶的神情,告诉了我们数据对业务发展的重要性… https://t.co/JXnU7igBRD'},
 {'created_at': 'Tue Jan 14 00:19:06 +0000 2020',
  'text': 'Hi, I can do the class for you\nDM or Email✉ EssayNerd7@gmail.com \n\nGuarantees:\n✴an A+ Grade√√\n✴Timely Completion ⏱… https://t.co/UBs4lIMgBG'},
 {'created_at': 'Tue Jan 14 00:19:08 +0000 2020',
  'text': 'For some reason remembering languages/tools I’ve developed in I haven’t heard much about in years.\n#Powerbuilder,… https://t.co/CcYD8Ux1pX'},
 {'created_at': 'Tue Jan 14 00:19:09 +0000 2020',
  'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'},
 {'created_at': 'Tue Jan 14 00:19:09 +0000 2020',
  'text': 'Gina Carano in a suit.....thats is all, we will now go back to your regularly scheduled programming #thisistheway https://t.co/QIC4xdsuhv'},
 {'created_at': 'Tue Jan 14 00:19:10 +0000 2020',
  'text': 'RT @spring_io: First milestone of Spring Boot 2.3 will be released this Thursday and will GA two weeks before Spring I/O.\n\nDon’t miss out a…'},
 {'created_at': 'Tue Jan 14 00:19:11 +0000 2020',
  'text': 'RT @genentech: Heading to #JPM20? Download S3E05 of our #podcast and find out more about the role of big data in #PersonalizedMedicine from…'},
 {'created_at': 'Tue Jan 14 00:19:12 +0000 2020',
  'text': 'おはようございます☀\n\n#今日の積み上げ  予定\n✅#30DAYSトライアル 2nd Day3\n\n引き続きJavaScriptの学習です🏃\u200d♂️\n\n通勤往復中にProgateアプリ版→帰宅後パソコン版の流れ最強だったので本日も同じスタイルでいきます💪\n\n#駆け出しエンジニア'},
 {'created_at': 'Tue Jan 14 00:19:12 +0000 2020',
  'text': 'RT @PVNCCDSB: As a result of a planned one-day full withdrawal of service by our teachers on Tuesday, Jan. 21, 2020, the Board will be clos…'},
 {'created_at': 'Tue Jan 14 00:19:15 +0000 2020',
  'text': 'Tapos na event so wala na akong ipopost na annoucements and shiz I am back to regular programming welcome to my kal… https://t.co/NGsR2RSEtm'},
 {'created_at': 'Tue Jan 14 00:19:16 +0000 2020',
  'text': 'RT @platzi: 📚 Seis Libros para mejorar tu conocimiento de Data Science 👇\n#NuncaParesDeAprender\nhttps://t.co/569j3rREx0 https://t.co/69KqUNy…'},
 {'created_at': 'Tue Jan 14 00:19:17 +0000 2020',
  'text': 'RT @strnr: Eleven tips for working with big data https://t.co/KrdaN4gxSh\nKeep raw data raw\nViz\nRecord workflow\nUse version ctrl\nRecord meta…'},
 {'created_at': 'Tue Jan 14 00:19:17 +0000 2020',
  'text': '@AnimalDefenceBZ @DataCassette Please enforce the law against dog and wild boar fighting! Plz sign: https://t.co/n3pdX3hOP8'},
 {'created_at': 'Tue Jan 14 00:19:20 +0000 2020',
  'text': 'Rock it: A Cradle Story — An Arduino-powered Baby Crib Rocker\n\n☞ https://t.co/jrrPvUwrGv\n\n#arduino #programming https://t.co/niOfINyVkE'},
 {'created_at': 'Tue Jan 14 00:19:22 +0000 2020',
  'text': 'RT @xximbecile: Bullshit. I was born in Madiun, live most of my youth without internet because my family is poor. And I know I read a lot.…'},
 {'created_at': 'Tue Jan 14 00:19:24 +0000 2020',
  'text': 'RT @sethrosen: Just converted to @webflow after years of preaching squarespace. Wow - just wow. \n\nI truly see why *this* is called no-code.…'},
 {'created_at': 'Tue Jan 14 00:19:24 +0000 2020',
  'text': "@SimonJo37129961 @Rectitude20 On the contrary, you're not appealing to the science &amp; data because epidemiological s… https://t.co/sqR3pkPIeR"},
 {'created_at': 'Tue Jan 14 00:19:26 +0000 2020',
  'text': "Always the best bang for your buck of any pod out there, thank you guys. Y'all gotta check them out… https://t.co/gwg4EZKx58"},
 {'created_at': 'Tue Jan 14 00:19:29 +0000 2020',
  'text': 'RT @bass_analytics: An Effective Python Environment: Making Yourself at Home\n@realpython #Python #programming #coding\nhttps://t.co/jMkY3xyU…'},
 {'created_at': 'Tue Jan 14 00:19:30 +0000 2020',
  'text': 'RT @thegrugq: Alternative take: knowing Haskell will get you a job delivering pizza, but JavaScript will get you a job at the big 5 https:/…'},
 {'created_at': 'Tue Jan 14 00:19:31 +0000 2020',
  'text': 'Acquista il libro "Big Data, WebFare e Reddito per tutti. Quaderni per il Reddito n°9". Sostieni il BIN Italia - BI… https://t.co/R55bbOsxa3'},
 {'created_at': 'Tue Jan 14 00:19:33 +0000 2020',
  'text': 'RT @MajoLedes: ✨Dejo esto por aquí.. \n\nHice un apunte de 24 páginas sobre conceptos principales de ReactJS🙈\n\nPueden ver el apunte completo…'},
 {'created_at': 'Tue Jan 14 00:19:33 +0000 2020',
  'text': 'RT @iowahawkblog: fun fact: this advanced state-of-the are artificial intelligence powered big data pizza thinkbot system was invented by T…'},
 {'created_at': 'Tue Jan 14 00:19:35 +0000 2020',
  'text': 'RT @javascriptflx: Hermes: A new open source JavaScript engine optimized for mobile apps https://t.co/Zn7Zed8SkV  #Javascript'},
 {'created_at': 'Tue Jan 14 00:19:40 +0000 2020',
  'text': "RT @parscale: Big data from Toledo:\n\n✅ 22,927 Voters Identified\n\n✅ 18,210 Voters From Ohio\n\n✅ 5,216 Registrants Didn't Vote in 2016\n\n✅ 21.9…"},
 {'created_at': 'Tue Jan 14 00:19:41 +0000 2020',
  'text': 'Big 5 Sporting Goods $BGFV Anticipates Fiscal 2019 Fourth Quarter EPS to Exceed High End of Prior Guidance Range… https://t.co/fCTX0sWhon'},
 {'created_at': 'Tue Jan 14 00:19:42 +0000 2020',
  'text': 'RT @Arthur81288011: @A_Chapman101 @Jack62084141 Clear @HMRCgovuk must NOT be given new powers to automate processes that could cause distre…'},
 {'created_at': 'Tue Jan 14 00:19:46 +0000 2020',
  'text': '@RandallKopchak @OptimistPanda The problem (if you can call it that) was that DS9 was way ahead of its time in term… https://t.co/y2UI7XQjYm'},
 {'created_at': 'Tue Jan 14 00:19:51 +0000 2020',
  'text': 'This thing is only growing. Excited to see what Gatsby will be like even 5 years from now.'},
 {'created_at': 'Tue Jan 14 00:19:52 +0000 2020',
  'text': "2.  but oh well, it's cool data science!"},
 {'created_at': 'Tue Jan 14 00:19:53 +0000 2020',
  'text': 'RT @KinarmLab: Kinarm Camp registration is now open!  Come join us June 8-12th in beautiful #ygk for a week of intensive #kinarm programmin…'},
 {'created_at': 'Tue Jan 14 00:19:56 +0000 2020',
  'text': 'RT @ElemTeachersTO: The #TDSB has cut $13 million dollars of French programming and is planning to eliminate Extended French starting next…'},
 {'created_at': 'Tue Jan 14 00:19:56 +0000 2020',
  'text': 'RT @byLilyV: FEATURED #COURSES\n\nThe #Data #Science #Course 2019: Complete Data Science Bootcamp\n\nBest Seller 144,730 students enrolled\n\nCom…'},
 {'created_at': 'Tue Jan 14 00:20:00 +0000 2020',
  'text': 'How to pack #Angular 8 applications on regular war files https://t.co/t1AXyA1wD1 #javascript #typescript #frontend #webdev'},
 {'created_at': 'Tue Jan 14 00:20:00 +0000 2020',
  'text': 'CoStar Group (@TheCoStarGroup) is hiring https://t.co/cWm6u5KE5o #reactjs #angularjs'},
 {'created_at': 'Tue Jan 14 00:20:02 +0000 2020',
  'text': 'RT @NexWebSites: #Programming\n👇\nVisual Studio @code Keyboard Board Shortcuts for:\n \n👉Windows : PDF🔗: https://t.co/xxPqHUMjS3\n 👉#Linux : PDF…'},
 {'created_at': 'Tue Jan 14 00:20:03 +0000 2020',
  'text': 'Everyone has his or her own way of analyzing data to find the right answers. This is why self-service in a business… https://t.co/264klNDvA1'},
 {'created_at': 'Tue Jan 14 00:20:09 +0000 2020',
  'text': 'RT @Payara_Fish: JavaFX Strikes Back - Latest #Airhacks podcast from @AdamBien\nCatching up with Gluons @johanvos, talking about advantages…'},
 {'created_at': 'Tue Jan 14 00:20:13 +0000 2020',
  'text': '32 Tips For Every #WebDeveloper In 2020 #BetterProgramming via https://t.co/Q6JBQhnTTy https://t.co/3hwgAJhmSs'}]
In [279]:
import pandas as pd

# Turn the records held in `dataset` into a DataFrame and preview the
# first 20 rows as the cell's output.
df = pd.DataFrame(data=dataset)
df.head(n=20)
Out[279]:
created_at text
0 Tue Jan 14 00:14:44 +0000 2020 RT @dcumoviepage: #ReleaseTheSnyderCut
1 Tue Jan 14 00:15:41 +0000 2020 RT @InfluxDB: Discover how a new #fluxlang fea...
2 Tue Jan 14 00:15:51 +0000 2020 @realDonaldTrump Trump thinks his voters are d...
3 Tue Jan 14 00:15:54 +0000 2020 RT @SethAbramson: 25/ Joel Zamel, a man close ...
4 Tue Jan 14 00:16:05 +0000 2020 @Jhonitrejos @JorgeIvanOspina @lunadavid @kevi...
5 Tue Jan 14 00:16:08 +0000 2020 RT @sicsuper: ¡Proteger tus datos personales e...
6 Tue Jan 14 00:16:33 +0000 2020 RT @CatalogueBack: We interrupt our regular pr...
7 Tue Jan 14 00:16:35 +0000 2020 RT @NomadXrp: ⏰ PRICE UPDATE 🚀 \n\n⭐️ $XRP $...
8 Tue Jan 14 00:16:36 +0000 2020 BIG KETS ARE STILL KETS 😻😻😻😻
9 Tue Jan 14 00:16:38 +0000 2020 [Cheat Sheet] Python Basics For Data Science h...
10 Tue Jan 14 00:16:39 +0000 2020 RT @Justin_Stolpe: Happy Monday! Learning abou...
11 Tue Jan 14 00:16:39 +0000 2020 RT @davarcar1: @Jhonitrejos @JorgeIvanOspina @...
12 Tue Jan 14 00:16:47 +0000 2020 "They are typically very experienced, having w...
13 Tue Jan 14 00:16:51 +0000 2020 @iceagereentry @rcsteeb Don’t worry, all is we...
14 Tue Jan 14 00:16:51 +0000 2020 It "amazes" ME how an "influencer" like @Mark...
15 Tue Jan 14 00:16:54 +0000 2020 RT @neilonsoftware: "They are typically very e...
16 Tue Jan 14 00:16:55 +0000 2020 RT @HawkinsTammy: Know #javascript and looking...
17 Tue Jan 14 00:16:55 +0000 2020 Coffee and code. NodeJs tutorial. Then I will ...
18 Tue Jan 14 00:17:00 +0000 2020 RT @neilonsoftware: "They are typically very e...
19 Tue Jan 14 00:17:01 +0000 2020 📚 Wiley's Professional JavaScript for Web Deve...
In [274]:
from sklearn.feature_extraction.text import CountVectorizer
In [278]:
# Fit a default-configured CountVectorizer on the tweet text column and keep
# the resulting count matrix for the word-frequency table built afterwards.
cv = CountVectorizer()
count_matrix = cv.fit_transform(df["text"])
In [284]:
# Build a word-frequency table from the fitted vectorizer.
# CountVectorizer.get_feature_names() was deprecated in scikit-learn 1.0 and
# removed in 1.2, so prefer get_feature_names_out() and only fall back to the
# old accessor when running on an older scikit-learn.
if hasattr(cv, "get_feature_names_out"):
    vocabulary = list(cv.get_feature_names_out())
else:
    vocabulary = list(cv.get_feature_names())

word_count = pd.DataFrame(vocabulary, columns=["word"])
# Summing over axis 0 collapses the rows, leaving one total per vocabulary
# term; the result is a 1 x n_terms matrix, hence the [0] after tolist().
word_count["count"] = count_matrix.sum(axis=0).tolist()[0]
# Most frequent words first, with a clean 0..n-1 index.
word_count = word_count.sort_values("count", ascending=False).reset_index(drop=True)
In [289]:
# Show the 50 most frequent words (word_count is already sorted descending).
word_count.head(50)
Out[289]:
word count
0 rt 73
1 https 71
2 co 65
3 the 43
4 of 39
5 for 37
6 to 34
7 data 29
8 you 28
9 and 28
10 in 26
11 javascript 23
12 big 22
13 programming 21
14 are 19
15 will 19
16 on 17
17 is 14
18 science 14
19 job 14
20 that 12
21 get 12
22 this 11
23 with 11
24 we 11
25 at 10
26 but 10
27 was 9
28 new 9
29 amp 8
30 many 8
31 now 7
32 not 7
33 pizza 7
34 an 7
35 java 7
36 take 7
37 as 7
38 your 7
39 out 7
40 how 6
41 knowing 6
42 from 6
43 what 6
44 it 6
45 our 6
46 can 6
47 delivering 6
48 alternative 6
49 thegrugq 6