%matplotlib inline

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

# Data source: https://www.blockchain.com/ko/charts/market-price?timespan=60days
# Load the market-price CSV, labelling its two columns 'day' and 'price'.
file_path = '/home/jaeyoon89/python-data-analysis/data/market-price.csv'
bitcoin_df = pd.read_csv(file_path, names=['day', 'price'])

print(bitcoin_df.shape)
# DataFrame.info() writes its report to stdout itself and returns None, so
# wrapping it in print() only appended a stray "None" line to the output.
bitcoin_df.info()
# Trailing expression: the notebook displays the last five rows.
bitcoin_df.tail()

(365, 2)
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 365 entries, 0 to 364
Data columns (total 2 columns):
 #   Column  Non-Null Count  Dtype  
---  ------  --------------  -----  
 0   day     365 non-null    object 
 1   price   365 non-null    float64
dtypes: float64(1), object(1)
memory usage: 5.8+ KB
None


# Parse the 'day' strings into datetimes, then move that column into the
# index so the frame is keyed by date.  set_index() on its own does this;
# the earlier extra `bitcoin_df.index = bitcoin_df['day']` assignment was
# redundant and has been dropped.
bitcoin_df['day'] = pd.to_datetime(bitcoin_df['day'])
bitcoin_df.set_index('day', inplace=True)

# Plot the remaining 'price' column against the date index.
bitcoin_df.plot()
plt.show()


from statsmodels.tsa.arima_model import ARIMA
import statsmodels.api as sm

# Fit an ARIMA model of order (2, 1, 2) on the raw price array.
# NOTE: the recorded output shows statsmodels emitting a FutureWarning that
# statsmodels.tsa.arima_model.ARIMA is deprecated in favour of
# statsmodels.tsa.arima.model.ARIMA.  The later cells index the forecast
# result positionally, so any migration has to update them together.
model = ARIMA(bitcoin_df['price'].values, order=(2, 1, 2))
model_fit = model.fit(trend='c', full_output=True, disp=True)

# Print the coefficient table and fit statistics.
print(model_fit.summary())

/home/jaeyoon89/.local/lib/python3.6/site-packages/statsmodels/tsa/arima_model.py:472: FutureWarning: 
statsmodels.tsa.arima_model.ARMA and statsmodels.tsa.arima_model.ARIMA have
been deprecated in favor of statsmodels.tsa.arima.model.ARIMA (note the .
between arima and model) and
statsmodels.tsa.SARIMAX. These will be removed after the 0.12 release.

statsmodels.tsa.arima.model.ARIMA makes use of the statespace framework and
is both well tested and maintained.

To silence this warning and continue using ARMA and ARIMA until they are
removed, use:

import warnings
warnings.filterwarnings('ignore', 'statsmodels.tsa.arima_model.ARMA',
                        FutureWarning)
warnings.filterwarnings('ignore', 'statsmodels.tsa.arima_model.ARIMA',
                        FutureWarning)

  warnings.warn(ARIMA_DEPRECATION_WARN, FutureWarning)

                             ARIMA Model Results                              
==============================================================================
Dep. Variable:                    D.y   No. Observations:                  364
Model:                 ARIMA(2, 1, 2)   Log Likelihood               -2787.553
Method:                       css-mle   S.D. of innovations            512.415
Date:                Wed, 14 Apr 2021   AIC                           5587.107
Time:                        23:13:52   BIC                           5610.490
Sample:                             1   HQIC                          5596.400
                                                                              
==============================================================================
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          6.3192     27.794      0.227      0.820     -48.156      60.795
ar.L1.D.y     -0.3788      1.827     -0.207      0.836      -3.959       3.201
ar.L2.D.y      0.1586      1.191      0.133      0.894      -2.175       2.492
ma.L1.D.y      0.4569      1.822      0.251      0.802      -3.115       4.028
ma.L2.D.y     -0.1941      1.337     -0.145      0.885      -2.816       2.427
                                    Roots                                    
=============================================================================
                  Real          Imaginary           Modulus         Frequency
-----------------------------------------------------------------------------
AR.1           -1.5864           +0.0000j            1.5864            0.5000
AR.2            3.9753           +0.0000j            3.9753            0.0000
MA.1           -1.3797           +0.0000j            1.3797            0.5000
MA.2            3.7332           +0.0000j            3.7332            0.0000
-----------------------------------------------------------------------------

/home/jaeyoon89/.local/lib/python3.6/site-packages/statsmodels/tsa/arima_model.py:472: FutureWarning: 
statsmodels.tsa.arima_model.ARMA and statsmodels.tsa.arima_model.ARIMA have
been deprecated in favor of statsmodels.tsa.arima.model.ARIMA (note the .
between arima and model) and
statsmodels.tsa.SARIMAX. These will be removed after the 0.12 release.

statsmodels.tsa.arima.model.ARIMA makes use of the statespace framework and
is both well tested and maintained.

To silence this warning and continue using ARMA and ARIMA until they are
removed, use:

import warnings
warnings.filterwarnings('ignore', 'statsmodels.tsa.arima_model.ARMA',
                        FutureWarning)
warnings.filterwarnings('ignore', 'statsmodels.tsa.arima_model.ARIMA',
                        FutureWarning)

  warnings.warn(ARIMA_DEPRECATION_WARN, FutureWarning)


# Draw the fitted model's predictions.
fig = model_fit.plot_predict()

# Wrap the fit residuals in a DataFrame and plot them; the trailing
# expression is what the notebook echoes for this cell.
residuals = pd.DataFrame(data=model_fit.resid)
residuals.plot()

<AxesSubplot:>


# Forecast the next five steps with the fitted ARIMA model.  As used below,
# element [0] of the result holds the point forecasts and element [2] holds
# one (lower, upper) bound pair per step; element [1] is not used here.
forecast_data = model_fit.forecast(steps=5)

# Load the hold-out prices to compare against, labelling columns 'ds' and 'y'.
test_file_path = '/home/jaeyoon89/python-data-analysis/data/market-price-test.csv'
bitcoin_test_df = pd.read_csv(test_file_path, names=['ds', 'y'])

pred_y = forecast_data[0].tolist()
test_y = bitcoin_test_df.y.values

# Split the (lower, upper) pairs into two parallel lists.  Comprehensions
# replace the previous manual append loop and yield the same values.
pred_y_lower = [bounds[0] for bounds in forecast_data[2]]
pred_y_upper = [bounds[1] for bounds in forecast_data[2]]


# Overlay the ARIMA forecast, its bounds and the actual test prices.
# gold = forecast, red = lower bound, blue = upper bound, green = actual.
plt.plot(pred_y, color="gold")
plt.plot(pred_y_lower, color="red")
plt.plot(pred_y_upper, color="blue")
plt.plot(test_y, color="green")

[<matplotlib.lines.Line2D at 0x7fa1dc736a90>]


# Same comparison without the bounds: gold = forecast, green = actual.
plt.plot(pred_y, color="gold")
plt.plot(test_y, color="green")

[<matplotlib.lines.Line2D at 0x7fa1e41034a8>]


from sklearn.metrics import mean_squared_error, r2_score
from math import sqrt

# Root-mean-squared error between the actual test prices and the forecast.
# Arguments are passed by keyword in sklearn's (y_true, y_pred) order; the
# squared error is symmetric, so the value is the same as before.
rmse = sqrt(mean_squared_error(y_true=test_y, y_pred=pred_y))
print(rmse)

270.85258806066304


from fbprophet import Prophet


# Reload the training CSV with the column names 'ds' (date) and 'y' (value),
# which is the naming the Prophet model is fitted on below.
bitcoin_df = pd.read_csv(file_path, names=['ds', 'y'])

# NOTE(review): the recorded forecast output shows the `daily` component as
# the same value (10.907431) on every row - confirm that enabling
# daily_seasonality is intended for this data.
prophet = Prophet(
    seasonality_mode='multiplicative',
    yearly_seasonality=True,
    weekly_seasonality=True,
    daily_seasonality=True,
    changepoint_prior_scale=0.5,
)
prophet.fit(bitcoin_df)

<fbprophet.forecaster.Prophet at 0x7fa1dc9821d0>


# Extend the fitted date range by five daily periods and predict over it.
future_data = prophet.make_future_dataframe(freq='d', periods=5)
forecast_data = prophet.predict(future_data)


# Display the last five rows of the forecast, i.e. the five added periods.
forecast_data.iloc[-5:]


# Display only the date, point forecast and interval for those rows.
forecast_data.iloc[-5:][['ds', 'yhat', 'yhat_lower', 'yhat_upper']]


# Plot the forecast.
fig1 = prophet.plot(forecast_data)


# Plot the individual forecast components.
fig2 = prophet.plot_components(forecast_data)

/home/jaeyoon89/.local/lib/python3.6/site-packages/fbprophet/plot.py:422: UserWarning: FixedFormatter should only be used together with FixedLocator
  ax.set_yticklabels(yticklabels)
/home/jaeyoon89/.local/lib/python3.6/site-packages/fbprophet/plot.py:422: UserWarning: FixedFormatter should only be used together with FixedLocator
  ax.set_yticklabels(yticklabels)
/home/jaeyoon89/.local/lib/python3.6/site-packages/fbprophet/plot.py:422: UserWarning: FixedFormatter should only be used together with FixedLocator
  ax.set_yticklabels(yticklabels)


# Load the hold-out prices again and take the last five forecast rows
# (the five periods appended by make_future_dataframe) for comparison.
bitcoin_test_df = pd.read_csv(test_file_path, names=['ds', 'y'])

test_y = bitcoin_test_df['y'].values
pred_y = forecast_data['yhat'].values[-5:]
pred_y_lower = forecast_data['yhat_lower'].values[-5:]
pred_y_upper = forecast_data['yhat_upper'].values[-5:]


# Overlay the Prophet forecast, its interval and the actual test prices.
# gold = forecast, red = lower bound, blue = upper bound, green = actual.
plt.plot(pred_y, color="gold") 
plt.plot(pred_y_lower, color="red")
plt.plot(pred_y_upper, color="blue") 
plt.plot(test_y, color="green")

[<matplotlib.lines.Line2D at 0x7fa1dc847080>]


# Same comparison without the interval: gold = forecast, green = actual.
plt.plot(pred_y, color="gold")
plt.plot(test_y, color="green")

[<matplotlib.lines.Line2D at 0x7fa1dc6f4f28>]


# Root-mean-squared error between the actual test prices and the forecast.
# Arguments are passed by keyword in sklearn's (y_true, y_pred) order; the
# squared error is symmetric, so the value is the same as before.
rmse = sqrt(mean_squared_error(y_true=test_y, y_pred=pred_y))
print(rmse)

105.41853842279897


# Reload the training data and attach a constant 'cap' column of 20000,
# which the logistic-growth model below is fitted with.
bitcoin_df = pd.read_csv(file_path, names=['ds', 'y']).assign(cap=20000)

# Same settings as the earlier Prophet model, plus growth='logistic'.
prophet = Prophet(
    growth='logistic',
    seasonality_mode='multiplicative',
    yearly_seasonality=True,
    weekly_seasonality=True,
    daily_seasonality=True,
    changepoint_prior_scale=0.5,
)
prophet.fit(bitcoin_df)

<fbprophet.forecaster.Prophet at 0x7fa2193723c8>


# Build the five-day future frame and give it the same 20000 'cap' column
# that was attached to the training frame, then predict and plot.
future_data = prophet.make_future_dataframe(periods=5, freq='d').assign(cap=20000)
forecast_data = prophet.predict(future_data)

fig = prophet.plot(forecast_data)


# Load the hold-out prices and take the last five rows of the
# logistic-growth forecast for comparison.
bitcoin_test_df = pd.read_csv(test_file_path, names=['ds', 'y'])

test_y = bitcoin_test_df['y'].values
pred_y = forecast_data['yhat'].values[-5:]
pred_y_lower = forecast_data['yhat_lower'].values[-5:]
pred_y_upper = forecast_data['yhat_upper'].values[-5:]


# Overlay the logistic-growth forecast, its interval and the actual prices.
# gold = forecast, red = lower bound, blue = upper bound, green = actual.
plt.plot(pred_y, color="gold") 
plt.plot(pred_y_lower, color="red") 
plt.plot(pred_y_upper, color="blue") 
plt.plot(test_y, color="green")

[<matplotlib.lines.Line2D at 0x7fa21920f470>]


# Reload the training data and blank out every price above 18000 so those
# rows carry a missing value instead of the observed price.
bitcoin_df = pd.read_csv(file_path, names=['ds', 'y'])
bitcoin_df['y'] = bitcoin_df['y'].mask(bitcoin_df['y'] > 18000)


# Refit Prophet with the original (non-logistic) settings on the current
# bitcoin_df, then forecast five further daily periods and plot the result.
prophet = Prophet(
    seasonality_mode='multiplicative',
    yearly_seasonality=True,
    weekly_seasonality=True,
    daily_seasonality=True,
    changepoint_prior_scale=0.5,
)

prophet.fit(bitcoin_df)

future_data = prophet.make_future_dataframe(freq='d', periods=5)
forecast_data = prophet.predict(future_data)

fig = prophet.plot(forecast_data)


# Load the hold-out prices and take the last five rows of the latest
# forecast for comparison.
bitcoin_test_df = pd.read_csv(test_file_path, names=['ds', 'y'])

test_y = bitcoin_test_df['y'].values
pred_y = forecast_data['yhat'].values[-5:]
pred_y_lower = forecast_data['yhat_lower'].values[-5:]
pred_y_upper = forecast_data['yhat_upper'].values[-5:]


# Overlay the latest forecast, its interval and the actual test prices.
# gold = forecast, red = lower bound, blue = upper bound, green = actual.
plt.plot(pred_y, color="gold") 
plt.plot(pred_y_lower, color="red") 
plt.plot(pred_y_upper, color="blue") 
plt.plot(test_y, color="green")

[<matplotlib.lines.Line2D at 0x7fa1dcad5748>]


# Same comparison without the interval: gold = forecast, green = actual.
plt.plot(pred_y, color="gold")
plt.plot(test_y, color="green")

[<matplotlib.lines.Line2D at 0x7fa1dcc2d198>]


# Root-mean-squared error between the actual test prices and the forecast.
# Arguments are passed by keyword in sklearn's (y_true, y_pred) order; the
# squared error is symmetric, so the value is the same as before.
rmse = sqrt(mean_squared_error(y_true=test_y, y_pred=pred_y))
print(rmse)

171.83159828333595

	day	price
360	2018-08-22 00:00:00	6575.229167
361	2018-08-23 00:00:00	6434.881667
362	2018-08-24 00:00:00	6543.645714
363	2018-08-25 00:00:00	6719.429231
364	2018-08-26 00:00:00	6673.274167

	ds	trend	yhat_lower	yhat_upper	trend_lower	trend_upper	daily	daily_lower	daily_upper	multiplicative_terms	...	weekly	weekly_lower	weekly_upper	yearly	yearly_lower	yearly_upper	yhat
365	2018-08-27	595.073916	6244.684071	7541.386994	595.073916	595.073916	10.907431	10.907431	10.907431	10.544862	...	-0.007796	-0.007796	-0.007796	-0.354773	-0.354773	-0.354773	6870.046369
366	2018-08-28	598.125014	6283.276467	7646.269844	598.125014	598.125014	10.907431	10.907431	10.907431	10.633309	...	0.026363	0.026363	0.026363	-0.300485	-0.300485	-0.300485	6958.173352
367	2018-08-29	601.176113	6245.853845	7709.353527	601.176113	601.176113	10.907431	10.907431	10.907431	10.588920	...	-0.055193	-0.055193	-0.055193	-0.263318	-0.263318	-0.263318	6966.981989
368	2018-08-30	604.227211	6274.519297	7786.241714	595.135376	610.384660	10.907431	10.907431	10.907431	10.631542	...	-0.029402	-0.029402	-0.029402	-0.246487	-0.246487	-0.246487	7028.094432
369	2018-08-31	607.278310	6245.421765	7895.588102	585.171677	621.710651	10.907431	10.907431	10.907431	10.694373	...	0.039476	0.039476	0.039476	-0.252535	-0.252535	-0.252535	7101.738804

	ds	yhat	yhat_lower	yhat_upper
365	2018-08-27	6870.046369	6244.684071	7541.386994
366	2018-08-28	6958.173352	6283.276467	7646.269844
367	2018-08-29	6966.981989	6245.853845	7709.353527
368	2018-08-30	7028.094432	6274.519297	7786.241714
369	2018-08-31	7101.738804	6245.421765	7895.588102

이것이 데이터 분석이다 with 파이썬 ch4-1(타이타닉 생존자 가려내기) (0)	2021.04.16
이것이 데이터 분석이다 with 파이썬 ch3-3(미래에 볼 영화의 평점 예측하기) (0)	2021.04.15
이것이 데이터 분석이다 with 파이썬 ch3-1(프로야구 선수의 다음 해 연봉 예측하기) (0)	2021.04.12
이것이 데이터 분석이다 with 파이썬 ch1-2(국가별 음주 데이터 분석하기) (0)	2021.04.11
이것이 데이터 분석이다 with 파이썬 ch1-1(chipotle 주문 데이터 분석하기) (0)	2021.04.09

speed&direction

티스토리 뷰

이것이 데이터 분석이다 with 파이썬 ch3-2(비트코인 시세 예측하기)

3.2 비트코인 시세 예측하기

step.1 탐색: 시간 정보가 포함된 데이터 살펴보기

step.2 예측: 파이썬 라이브러리를 활용해 시세 예측하기

step.3 활용: 더 나은 결과를 위한 방법

'이것이 데이터분석이다 with 파이썬' 카테고리의 다른 글

티스토리툴바

« 2025/07 »
일	월	화	수	목	금	토
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30	31