In [5]:
import tweepy 
import numpy as np 
import csv
import pandas as pd
import sqlite3
import matplotlib.pyplot as plt
conn = sqlite3.connect('tweets.db')
c = conn.cursor()

data = pd.read_sql('select * from crypto',conn)
#data.to_csv("text.csv")
data
Out[5]:
id geo created retweet_count coordinates user_name user_created user_followers user_bg_color user_location id_str user_description polarity subjectivity text
0 1 None 2017-12-22 18:10:02.000000 0 None lucier_naga25 2010-07-02 21:44:34.000000 49 C0DEED None 944268810240057344 None 0.000000 0.000000 RT @Milenio: #Bitcoin pierde 25% de su valor e...
1 2 None 2017-12-22 18:10:02.000000 0 None marionnoeske181 2017-10-19 07:52:15.000000 1 F5F8FA None 944268808587481090 ET CHCKS 0.000000 0.000000 RT @RandyHilarski: #Bitcoin News Stocks That S...
2 3 None 2017-12-22 18:10:02.000000 0 None EurVirtualCoins 2012-07-11 19:40:16.000000 167 000000 None 944268811007676417 Main virtual coin values in dollars and euros.... 0.000000 0.000000 1 bitcoin = $13081.4 / 11049.963€\n1 bitcoin-c...
3 4 None 2017-12-22 18:10:02.000000 0 None RobbieTay24 2011-02-19 11:55:59.000000 69 C0DEED suffolk 944268811309649922 None 0.000000 0.000000 RT @SPEEROTHEKID: $4,000\nBitcoin will crash\n...
4 5 None 2017-12-22 18:10:02.000000 0 None zwoelfzwanzig 2017-08-29 14:55:16.000000 161 000000 wien 22 944268810995068930 wenn nicht mit rap dann mit den punkern 0.000000 0.000000 RT @zachbraff: Bitcoin to investors today. htt...
5 6 None 2017-12-22 18:10:02.000000 0 None ChokseRamirez 2017-06-23 00:03:24.000000 614 F5F8FA Cleveland, OH 944268811418656770 @merryflashmas @Clefanforlife @jonmikey34 @eva... 0.000000 0.000000 RT @IsiahWhitlockJr: You bought #Bitcoin three...
6 7 None 2017-12-22 18:10:02.000000 0 None RamizKaraeski61 2016-08-26 11:30:46.000000 1403 F5F8FA Dünya 944268811494191104 Biz bu davayı yolda bulmadık 0.000000 0.000000 RT @AmiralYamamoto: Bitcoin sert bir sekilde d...
7 8 None 2017-12-22 18:10:02.000000 0 None Gmelanie13 2013-01-21 12:19:29.000000 5163 C0DEED Троицк 944268808847527937 Совесть - это тонкая материя, поэтому у толсто... 0.000000 0.000000 https://t.co/5kWOovgrHz
8 9 None 2017-12-22 18:10:02.000000 0 None LaurenceTheBird 2013-09-16 23:26:01.000000 347 C0DEED ...living in the moment 944268808486875137 See it, say it , act ! 🤜🏻🤛🏻 0.000000 0.000000 RT @_tm3k: Bitcoin price today https://t.co/2y...
9 10 None 2017-12-22 18:10:03.000000 0 None giov_nigro 2010-06-16 10:48:01.000000 164 0099B9 None 944268812983111682 Studio Giurisprudenza all'Università di Pisa 0.000000 0.000000 RT @NenciniPsi: Bitcoin è una criptomoneta che...
10 11 None 2017-12-22 18:10:03.000000 0 None Ajsoti 2010-07-21 20:26:16.000000 1996 C0DEED None 944268813373202433 NY, NY / Sports, Politics, & BS Takes. Liberal... 0.800000 0.700000 @scarmozzinoBiz It has no value yet its beginn...
11 12 None 2017-12-22 18:10:03.000000 0 None sobaliving 2008-12-07 16:44:04.000000 87506 C0DEED AZ, CA, NJ, TX 944268811720646658 We are an addiction treatment center with seve... 0.059091 0.238636 Sober Recovery Center New video https://t.co/...
12 13 None 2017-12-22 18:10:03.000000 0 None bituccar 2015-08-22 16:20:26.000000 88214 000000 İstanbul, Türkiye 944268813704531968 Trying to conquer darkness by $BTC and remembe... 0.000000 0.000000 Varsayalım ki bu ihracatın tamamında ödemeler ...
13 14 None 2017-12-22 18:10:03.000000 0 None miyabi93yp 2012-03-31 12:49:22.000000 610 1A1B1F 修羅 944268814463655936 クソリプマン。\n みやびと呼んで下さいな。\nシャドバ。\n遊戯王やってた。九産杯主催。人... 0.000000 0.000000 BTC!BTC!さっさとBTC!上がれよ!!
14 15 None 2017-12-22 18:10:03.000000 0 None paulinebankoff3 2017-02-26 14:13:29.000000 1 F5F8FA None 944268814929276929 howtospellguys How To Spell FOLLOWES? L--V-E-Y... 0.095833 0.300000 RT @officialmcafee: Coin of the day: BURST -- ...
15 16 None 2017-12-22 18:10:03.000000 0 None andersonhoje 2009-07-13 17:41:12.000000 44912 BDBDBD República Rio-Grandense, tchê! 944268815277359104 YAAKOV יעקב - Gaúcho, separatista, judeu, sion... 1.000000 0.300000 RT @andersonhoje: Now is the best time to buy ...
16 17 None 2017-12-22 18:10:03.000000 0 None horselythighs 2012-08-30 02:15:23.000000 3619 FFFFFF None 944268815302578177 the end is neigh. -0.400000 0.600000 This is my son, bitcoin, and my daughter, EVER...
17 18 None 2017-12-22 18:10:03.000000 0 None sandeep_rupani 2017-11-22 06:08:52.000000 30 F5F8FA Bangalore , Karnataka ,India 944268815432585216 None 0.600000 0.700000 RT @barronsonline: Why it's wise to be more ca...
18 19 None 2017-12-22 18:10:04.000000 0 None MuchSalty 2015-12-20 04:36:47.000000 18 000000 Weenie Hut Juniors 944268815902367744 None 0.000000 0.000000 RT @_tm3k: Bitcoin price today https://t.co/2y...
19 20 None 2017-12-22 18:10:04.000000 0 None L00Y 2013-10-01 03:16:53.000000 1299 C0DEED (テスト運用中) 944268816036405248 10分に1度ビットコインの価格を呟きます。 0.000000 0.000000 12/23 03:10 現在のビットコインの価格\nBTC/JPY bid: 1,767,4...
20 21 None 2017-12-22 18:10:04.000000 0 None talha32481 2017-12-21 21:00:06.000000 1 F5F8FA None 944268816250523651 None 0.042262 0.525595 RT @WhiteBitcoin: BitcoinWhite platform makes ...
21 22 None 2017-12-22 18:10:04.000000 0 None aacificBamboo 2014-03-23 09:00:36.000000 27 C6E2EE Sulphur Springs, Texas 944268816913260545 Supporting sustainable agriculture, bamboo re... 0.500000 0.500000 RT @RachelleJervis: I have more sensible shoes...
22 23 None 2017-12-22 18:10:04.000000 0 None DiogeneofSinope 2014-11-14 04:16:47.000000 2131 000000 Ponce, USA 944268817143869442 Of what use is a philosopher who doesn't hurt ... 0.000000 0.000000 @addiction82 Yeah but we know bitcoin will bpunce
23 24 None 2017-12-22 18:10:04.000000 0 None addiktoo 2015-08-14 09:58:53.000000 3134 C0DEED None 944268817114521600 None -0.250000 0.250000 RT @CharlieShrem: LISTEN: For those who’ve cal...
24 25 None 2017-12-22 18:10:03.000000 0 None janellekuprewic 2017-08-10 09:19:52.000000 7162 F5F8FA None 944268813511434240 None 0.000000 0.000000 RT @turnkeyfans: HOW TO MAKE #MONEY \n\n1.) BU...
25 26 None 2017-12-22 18:10:04.000000 0 None hffdmjeafyxruv1 2017-01-27 16:54:25.000000 1 F5F8FA None 944268817802387456 Not your typica black man. Into various things... 0.000000 0.100000 RT @MarketStockNewz: $VIDA Big News Out - Phiv...
26 27 None 2017-12-22 18:10:04.000000 0 None alexthebean 2010-05-14 10:06:33.000000 276 FFFFFF London 944268817638752257 Energetic and enthusiatic individual...always ... 0.066667 0.200000 Bitcoin loses more than a third of value over ...
27 28 None 2017-12-22 18:10:04.000000 0 None JuIes10857 2010-02-06 03:49:39.000000 44193 000000 None 944268818603433984 Consultant Bitcoin | https://t.me/CryptoJ0ules... 0.375000 0.475000 @Manisha3005 @BTCTN Bitcoin Diamond ($BCD) suc...
28 29 None 2017-12-22 18:10:04.000000 0 None carmengonz02 2016-09-15 20:23:58.000000 626 000000 Cartagena, Colombia 944268818817409024 El sol no brilla para unas pocas flores y árbo... 0.000000 0.000000 RT @ELTIEMPO: El bitcoin se encamina a cerrar ...
29 30 None 2017-12-22 18:10:04.000000 0 None Kurghen 2009-04-30 07:37:23.000000 490 C0DEED Florida 944268818909749248 Founder & CEO, @MeraglimAI Predictive Data Ana... 0.250000 0.250000 RT @OnTheMoneyCBC: Bitcoin is a fraud: One of ...
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
499949 499950 None 2018-02-06 18:48:31.000000 0 None DouglasABailey 2009-07-16 02:43:23.000000 295 1A1B1F Sydney 960948336307007493 Business Intelligence Analyst, Camera Operator... 0.000000 0.000000 @Laface88 @stephanlivera I purchase XRP with f...
499950 499951 None 2018-02-06 18:48:31.000000 0 None lostonwallst_ 2016-11-16 01:15:36.000000 302 F5F8FA New York, NY 960948337733197824 A "DIY" business website. Empowering people to... 0.000000 0.750000 Yeah, that makes total sense. #Bitcoin #stocks...
499951 499952 None 2018-02-06 18:48:32.000000 0 None DmitryYudin6 2017-10-15 16:03:25.000000 2699 F5F8FA None 960948339431886849 #btc #Trading #bounty #Altcoins #eth #Cryptocu... 0.000000 0.000000 RT @FireLottery: @FireLottery started publicat...
499952 499953 None 2018-02-06 18:48:32.000000 0 None 6189_ryu 2011-10-22 13:44:52.000000 316 C0DEED None 960948339842822144 個人トレーダー。仮想通貨ではなく電子金貨だと捉えてます。金融専門家ではありませんが、色々考え... 0.000000 0.000000 RT @s091084: ブラックロックは、世界最大の資産運用会社。運用資産規模は、なんと6...
499953 499954 None 2018-02-06 18:48:32.000000 0 None real_vijay 2009-12-06 20:29:33.000000 4529 FFF04D The Emerald City 960948341600223232 Tu ne cede malis, sed contra audentior ito 0.200000 0.383333 @elonmusk For a second I thought this was some...
499954 499955 None 2018-02-06 18:48:33.000000 0 None Bertskie 2009-05-25 05:45:58.000000 82 C0DEED Manila 960948342401486848 None 0.000000 0.000000 #Airdrop #Bitcoin #Blockchain #Bilibit #XRP \n...
499955 499956 None 2018-02-06 18:48:33.000000 0 None Nikkau 2007-10-03 21:20:39.000000 955 C0DEED Paris, France 960948345446567936 None 0.500000 0.500000 RT @BryceElder: Okay, so Bitcoin.
499956 499957 None 2018-02-06 18:48:34.000000 0 None Shillman_Crypto 2017-12-04 12:43:23.000000 2151 F5F8FA None 960948346696368128 Political Scientist specialized in governance,... -0.050000 0.400000 RT @CryptoRampage: Inverse H&S forming and...
499957 499958 None 2018-02-06 18:48:34.000000 0 None lB9WQgHSIwFO71s 2017-08-27 11:08:44.000000 0 F5F8FA None 960948346516070400 None 0.375000 0.475000 @CoinAxis Bitcoin Gold (BTG) successfully laun...
499958 499959 None 2018-02-06 18:48:34.000000 0 None mlsbd100 2017-11-01 10:47:12.000000 5951 F5F8FA None 960948347371581440 Follow me i will follow back 100% 0.275000 0.666667 RT @Quantum1Net: "The first person or group to...
499959 499960 None 2018-02-06 18:48:34.000000 0 None ChrisEli705 2016-10-28 21:05:19.000000 46 F5F8FA Paris, France 960948347552124929 #digital #BI #BigData #life 0.000000 0.000000 RT @jblefevre60: 4 Areas Of #Blockchain Applic...
499960 499961 None 2018-02-06 18:48:34.000000 0 None SeattleCoug88 2011-03-19 03:07:52.000000 245 1A1B1F Cascadia 960948349170937858 Sports, Politics, Finance, Tech, #GoCougs 0.000000 0.000000 RT @eringriffith: teachable moment in r/bitcoi...
499961 499962 None 2018-02-06 18:48:34.000000 0 None Anvar_ub 2017-12-21 19:53:30.000000 35 F5F8FA Uzbekistan 960948349712175104 None 0.700000 0.600000 RT @DigitalLawrence: 💎🔥 Looking good... #crypt...
499962 499963 None 2018-02-06 18:48:35.000000 0 None cryptobuzzwords 2017-11-18 08:53:09.000000 6 F5F8FA None 960948351498846208 The most efficient way to follow the latest cr... 0.000000 0.000000 Without Bitcoin, There Would Be No Blockchain:...
499963 499964 None 2018-02-06 18:48:35.000000 0 None DetroitCrypto 2017-07-06 19:56:05.000000 12 F5F8FA None 960948352799203328 None 0.000000 0.000000 Cryptocurrency: #HempCoin\nPrice USD: 0.134043...
499964 499965 None 2018-02-06 18:48:35.000000 0 None lB9WQgHSIwFO71s 2017-08-27 11:08:44.000000 0 F5F8FA None 960948352635596800 None 0.375000 0.475000 @AlexxxTekilla Bitcoin Gold (BTG) successfully...
499965 499966 None 2018-02-06 18:48:35.000000 0 None cecilyparmar241 2018-02-06 18:18:56.000000 0 F5F8FA Drigh Road, Pakistan 960948353122095104 None 0.000000 0.000000 RT @applancer_crypt: Goldman Sachman Bitcoin t...
499966 499967 None 2018-02-06 18:48:35.000000 0 None AleksandrClever 2018-01-14 09:11:45.000000 1340 F5F8FA Санкт-Петербург, Россия 960948353797382150 #Blockchain #Cryptocurrency #Bitcoin #Followback 0.000000 0.000000 ICO Paymon уже идёт! https://t.co/Jihfc097yr
499967 499968 None 2018-02-06 18:48:35.000000 0 None Helloshanugupta 2017-10-25 09:19:58.000000 70 F5F8FA India 960948354262814720 Unemployed \n\nXRP\nAdd: rEb8TK3gBgk5auZkwc6sH... -0.700000 0.666667 @BTCTN XRP BTC ETH are so badly connected \nXT...
499968 499969 None 2018-02-06 18:48:36.000000 0 None nicollyons437 2018-02-04 13:17:31.000000 1 F5F8FA None 960948354904743939 26CF8F2 - arguen 0.200000 0.300000 RT @The1000pClub: ATH (Athenian Warrior Token)...
499969 499970 None 2018-02-06 18:48:36.000000 0 None AdioFanky 2017-05-05 14:42:28.000000 92 F5F8FA 北海道 960948355160457216 歩くadidasこと★FANKY-ADIO★と申します!MMA(RIZIN・DEEP・JEW... 0.000000 0.000000 RT @Nakman27: Tether問題がスルーだったことで、暴落は避けた形。\nただ、...
499970 499971 None 2018-02-06 18:48:36.000000 0 None HotBTCNews 2017-12-03 06:39:59.000000 8 F5F8FA Lille, France 960948355445661696 None 0.000000 0.000000 #XinFin ICO token sale https://t.co/GZyhpaerey...
499971 499972 None 2018-02-06 18:48:36.000000 0 None DmitryYudin6 2017-10-15 16:03:25.000000 2699 F5F8FA None 960948355844268034 #btc #Trading #bounty #Altcoins #eth #Cryptocu... 0.000000 0.000000 RT @FireLottery: @FireLottery on #ICETotallyG...
499972 499973 None 2018-02-06 18:48:36.000000 0 None DmitrSmironv 2017-07-25 17:20:38.000000 2130 F5F8FA None 960948356645359616 None 0.000000 0.000000 RT @REGA20847530: You can send it to your mom ...
499973 499974 None 2018-02-06 18:48:36.000000 0 None A_CRyptoLoRD 2017-12-29 12:29:37.000000 79 F5F8FA Future Past Present 960948357161209856 Tardis, EOS and Sunset lover. Time traveler + ... 0.700000 0.600000 RT @CryptoSays: I am getting lots of DMs about...
499974 499975 None 2018-02-06 18:48:36.000000 0 None lB9WQgHSIwFO71s 2017-08-27 11:08:44.000000 0 F5F8FA None 960948358855712769 None 0.375000 0.475000 @ButerinVitalyk @officialmcafee Bitcoin Gold (...
499975 499976 None 2018-02-06 18:48:37.000000 0 None Khadeermohmmed 2010-07-12 03:50:46.000000 18 C0DEED None 960948359132536832 None 0.625000 0.800000 Free หารายได้เสริม จากการเก็บ Bitcoin เก็บฟรี....
499976 499977 None 2018-02-06 18:48:37.000000 0 None CyberDomain 2010-10-23 18:38:38.000000 17556 131516 Cyber Domain 960948359501631488 It took only 14 days to decode 9EC4C12949A4F31... 0.100000 0.100000 The Megaphone Desktop Tool is a Windows "actio...
499977 499978 None 2018-02-06 18:48:38.000000 0 None _timo_t_ 2009-11-25 06:10:11.000000 46 B2DFDA None 960948363549138945 None 0.000000 1.000000 RT @coinbase: Our engineering team has begun t...
499978 499979 None 2018-02-06 18:48:38.000000 0 None Dantu_u 2013-08-27 15:45:17.000000 381 000000 Guatemala 960948363540676608 Programando mi vida y desarrollando la mejor e... 0.000000 0.000000 RT @josedlujan: Buenos días a todos, como les ...

499979 rows × 15 columns

In [6]:
from textblob import TextBlob
import re

def clean_tweet(tweet):
    '''
    Utility function to clean the text in a tweet by removing 
    links and special characters using regex.
    '''
    return ' '.join(re.sub("(@[A-Za-z0-9]+)|([^0-9A-Za-z \t])|(\w+:\/\/\S+)", " ", tweet).split())

def analize_sentiment(tweet):
    '''
    Utility function to classify the polarity of a tweet
    using textblob.
    '''
    analysis = TextBlob(clean_tweet(tweet))
    if analysis.sentiment.polarity > 0:
        return 1
    elif analysis.sentiment.polarity == 0:
        return 0
    else:
        return -1
In [7]:
# We create a column with the result of the analysis:
data['SA'] = np.array([ analize_sentiment(tweet) for tweet in data['text'] ])

# We display the updated dataframe with the new column:
data.head()
#data.to_csv("rocket_ship.csv")
Out[7]:
id geo created retweet_count coordinates user_name user_created user_followers user_bg_color user_location id_str user_description polarity subjectivity text SA
0 1 None 2017-12-22 18:10:02.000000 0 None lucier_naga25 2010-07-02 21:44:34.000000 49 C0DEED None 944268810240057344 None 0.0 0.0 RT @Milenio: #Bitcoin pierde 25% de su valor e... 0
1 2 None 2017-12-22 18:10:02.000000 0 None marionnoeske181 2017-10-19 07:52:15.000000 1 F5F8FA None 944268808587481090 ET CHCKS 0.0 0.0 RT @RandyHilarski: #Bitcoin News Stocks That S... 0
2 3 None 2017-12-22 18:10:02.000000 0 None EurVirtualCoins 2012-07-11 19:40:16.000000 167 000000 None 944268811007676417 Main virtual coin values in dollars and euros.... 0.0 0.0 1 bitcoin = $13081.4 / 11049.963€\n1 bitcoin-c... 0
3 4 None 2017-12-22 18:10:02.000000 0 None RobbieTay24 2011-02-19 11:55:59.000000 69 C0DEED suffolk 944268811309649922 None 0.0 0.0 RT @SPEEROTHEKID: $4,000\nBitcoin will crash\n... 0
4 5 None 2017-12-22 18:10:02.000000 0 None zwoelfzwanzig 2017-08-29 14:55:16.000000 161 000000 wien 22 944268810995068930 wenn nicht mit rap dann mit den punkern 0.0 0.0 RT @zachbraff: Bitcoin to investors today. htt... 0
In [8]:
# We construct lists with classified tweets:

pos_tweets = [ tweet for index, tweet in enumerate(data['text']) if data['SA'][index] > 0]
neu_tweets = [ tweet for index, tweet in enumerate(data['text']) if data['SA'][index] == 0]
neg_tweets = [ tweet for index, tweet in enumerate(data['text']) if data['SA'][index] < 0]
In [9]:
print("Percentage of positive tweets: {}%".format(len(pos_tweets)*100/len(data['text'])))
print("Percentage of neutral tweets: {}%".format(len(neu_tweets)*100/len(data['text'])))
print("Percentage de negative tweets: {}%".format(len(neg_tweets)*100/len(data['text'])))
Percentage of positive tweets: 33.33800019600823%
Percentage of neutral tweets: 55.51153148432234%
Percentage de negative tweets: 11.150468319669427%
In [10]:
sen_pos = format(len(pos_tweets)*100/len(data['text']))
sen_neu = format(len(neu_tweets)*100/len(data['text']))
sen_neg = format(len(neg_tweets)*100/len(data['text']))
In [11]:
fig = plt.figure()
fig.suptitle('Twitter Sentiment for Keyword Bitcoin', fontsize=14, fontweight='bold')

labels = "positive","neutral","Negitive"
sizes = [sen_pos,sen_neu,sen_neg]
colors = ['green', 'gold', 'red']
explode = (0.1,0.1,0)  # "explode" Slices for looks

plt.pie(sizes, explode=explode, labels=labels, colors=colors,
        autopct='%1.1f%%', shadow=True, startangle=90)
# Set aspect ratio to be equal so that pie is drawn as a circle.
plt.axis('equal')

plt.show()