0% found this document useful (0 votes)

22 views1 page

( ) - ( ) ( ('Lower New - Vaccinations - Smoothed') ) ( ('Upper New - Vaccinations - Smoothed') ) - (., ,, 'B', )

Uploaded by

Nathaniel Handan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

22 views1 page

( ) - ( ) ( ('Lower New - Vaccinations - Smoothed') ) ( ('Upper New - Vaccinations - Smoothed') ) - (., ,, 'B', )

Uploaded by

Nathaniel Handan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 1

In [ ]: # IMPORTANT: RUN THIS CELL IN ORDER TO IMPORT YOUR KAGGLE DATA SOURCES

# TO THE CORRECT LOCATION (/kaggle/input) IN YOUR NOTEBOOK,

# THEN FEEL FREE TO DELETE THIS CELL.
# NOTE: THIS NOTEBOOK ENVIRONMENT DIFFERS FROM KAGGLE'S PYTHON
# ENVIRONMENT SO THERE MAY BE MISSING LIBRARIES USED BY YOUR
# NOTEBOOK.

import os
import sys
from tempfile import NamedTemporaryFile
from urllib.request import urlopen
from urllib.parse import unquote, urlparse
from urllib.error import HTTPError
from zipfile import ZipFile
import tarfile
import shutil

CHUNK_SIZE = 40960
DATA_SOURCE_MAPPING = 'latest-covid-19-dataset-worldwide:https%3A%2F%2Fsiteproxy.ruqli.workers.dev%3A443%2Fhttps%2Fstorage.googleapis.com%2Fkaggle-data-sets%2F1852043%2F3023973%2Fbundle%2Farc

KAGGLE_INPUT_PATH='/kaggle/input'
KAGGLE_WORKING_PATH='/kaggle/working'
KAGGLE_SYMLINK='kaggle'

!umount /kaggle/input/ 2> /dev/null

shutil.rmtree('/kaggle/input', ignore_errors=True)
os.makedirs(KAGGLE_INPUT_PATH, 0o777, exist_ok=True)
os.makedirs(KAGGLE_WORKING_PATH, 0o777, exist_ok=True)

try:
os.symlink(KAGGLE_INPUT_PATH, os.path.join("..", 'input'), target_is_directory=True)
except FileExistsError:
pass
try:
os.symlink(KAGGLE_WORKING_PATH, os.path.join("..", 'working'), target_is_directory=True)
except FileExistsError:
pass

for data_source_mapping in DATA_SOURCE_MAPPING.split(','):

directory, download_url_encoded = data_source_mapping.split(':')
download_url = unquote(download_url_encoded)
filename = urlparse(download_url).path
destination_path = os.path.join(KAGGLE_INPUT_PATH, directory)
try:
with urlopen(download_url) as fileres, NamedTemporaryFile() as tfile:
total_length = fileres.headers['content-length']
print(f'Downloading {directory}, {total_length} bytes compressed')
dl = 0
data = fileres.read(CHUNK_SIZE)
while len(data) > 0:
dl += len(data)
tfile.write(data)
done = int(50 * dl / int(total_length))
sys.stdout.write(f"\r[{'=' * done}{' ' * (50-done)}] {dl} bytes downloaded")
sys.stdout.flush()
data = fileres.read(CHUNK_SIZE)
if filename.endswith('.zip'):
with ZipFile(tfile) as zfile:
zfile.extractall(destination_path)
else:
with tarfile.open(tfile.name) as tarfile:
tarfile.extractall(destination_path)
print(f'\nDownloaded and uncompressed: {directory}')
except HTTPError as e:
print(f'Failed to load (likely expired) {download_url} to path {destination_path}')
continue
except OSError as e:
print(f'Failed to load {download_url} to path {destination_path}')
continue

print('Data source import complete.')

Downloading latest-covid-19-dataset-worldwide, 8526536 bytes compressed

[==================================================] 8526536 bytes downloaded
Downloaded and uncompressed: latest-covid-19-dataset-worldwide
Data source import complete.

In [ ]: import numpy as np # Lineal algebra

import pandas as pd # Data wrangling
from statsmodels.tsa.arima.model import ARIMA #ARIMA model (arima_model is deprecated, use this one instead!)
from statsmodels.tsa.stattools import adfuller #Dickey-Fuller test for stationarity

# Plotting
import seaborn as sns
import matplotlib.pyplot as plt
from statsmodels.graphics.tsaplots import plot_acf, plot_pacf

In [ ]: df = pd.read_csv('../input/latest-covid-19-dataset-worldwide/owid-covid-data (2).csv')

In [ ]: df['date'] = pd.to_datetime(df['date'])
df = df[df['iso_code']=='NGA']
df = df.set_index('date')
hospitalized = df[['new_vaccinations_smoothed']]
hospitalized = hospitalized.resample('W-MON').mean()

In [ ]: hospitalized.plot()

Out[ ]: <Axes: xlabel='date'>

In [ ]: hospitalized = hospitalized.dropna()

In [ ]: hospitalized.plot()

Out[ ]: <Axes: xlabel='date'>

In [ ]: #hospitalized = np.log(hospitalized) # Apply a log transformation to reduce heterocedasticity

hospitalized.plot()

Out[ ]: <Axes: xlabel='date'>

In [ ]: result = adfuller(hospitalized)
print('ADF Statistic: %f' % result[0])
print('p-value: %f' % result[1])

ADF Statistic: -1.904860

p-value: 0.329778

In [ ]: diffhosp = hospitalized.diff().dropna() # Save the first difference

result = adfuller(diffhosp)
print('ADF Statistic: %f' % result[0])
print('p-value: %f' % result[1])

ADF Statistic: -5.184212

p-value: 0.000009

In [ ]: diffhosp.plot()
pacf = plot_pacf(diffhosp)
acf = plot_acf(diffhosp)

In [ ]: model = ARIMA(hospitalized,order= (2,1,2)).fit()

model.summary()

Out[ ]: SARIMAX Results

Dep. Variable: new_vaccinations_smoothed No. Observations: 45

Model: ARIMA(2, 1, 2) Log Likelihood -500.258

Date: Thu, 02 May 2024 AIC 1010.516

Time: 13:12:17 BIC 1019.436

Sample: 03-08-2021 HQIC 1013.824

- 01-10-2022

Covariance Type: opg

coef std err z P>|z| [0.025 0.975]

ar.L1 0.1947 0.569 0.342 0.732 -0.920 1.310

ar.L2 0.3753 0.587 0.639 0.523 -0.776 1.526

ma.L1 0.0333 0.501 0.066 0.947 -0.949 1.016

ma.L2 -0.7574 0.533 -1.421 0.155 -1.802 0.287

sigma2 4.906e+08 3.17e-09 1.55e+17 0.000 4.91e+08 4.91e+08

Ljung-Box (L1) (Q): 0.01 Jarque-Bera (JB): 1.58

Prob(Q): 0.92 Prob(JB): 0.45

Heteroskedasticity (H): 2.53 Skew: 0.29

Prob(H) (two-sided): 0.08 Kurtosis: 3.73

Warnings:
[1] Covariance matrix calculated using the outer product of gradients (complex-step).
[2] Covariance matrix is singular or near-singular, with condition number 4.63e+32. Standard errors may be unstable.

In [ ]: predictions = model.predict()
plt.figure(figsize=(15,10))
plt.plot(predictions[1:])
plt.plot(hospitalized)

Out[ ]: [<matplotlib.lines.Line2D at 0x7c9e30a300d0>]

In [ ]: train = hospitalized[:-5]
test = hospitalized[-5:]
model = ARIMA(train,order= (2,1,2)).fit()
model.summary()

Out[ ]: SARIMAX Results

Dep. Variable: new_vaccinations_smoothed No. Observations: 40

Model: ARIMA(2, 1, 2) Log Likelihood -439.084

Date: Thu, 02 May 2024 AIC 888.168

Time: 13:13:46 BIC 896.486

Sample: 03-08-2021 HQIC 891.153

- 12-06-2021

Covariance Type: opg

coef std err z P>|z| [0.025 0.975]

ar.L1 0.7882 0.495 1.591 0.112 -0.183 1.759

ar.L2 -0.3523 0.380 -0.927 0.354 -1.097 0.392

ma.L1 -0.5648 0.619 -0.913 0.361 -1.777 0.648

ma.L2 -0.2435 0.560 -0.435 0.664 -1.341 0.854

sigma2 3.94e+08 1.83e-09 2.16e+17 0.000 3.94e+08 3.94e+08

Ljung-Box (L1) (Q): 0.14 Jarque-Bera (JB): 7.62

Prob(Q): 0.71 Prob(JB): 0.02

Heteroskedasticity (H): 1.29 Skew: 0.62

Prob(H) (two-sided): 0.65 Kurtosis: 4.78

Warnings:
[1] Covariance matrix calculated using the outer product of gradients (complex-step).
[2] Covariance matrix is singular or near-singular, with condition number 2.09e+33. Standard errors may be unstable.

In [ ]: predictions = model.get_forecast(5,alpha = 0.95)

plt.figure(figsize=(15,10))
plt.plot((train))
plt.plot((predictions.predicted_mean))
plt.plot((test))
conf= predictions.conf_int(alpha=0.05)
upper = (conf['lower new_vaccinations_smoothed'])
lower = (conf['upper new_vaccinations_smoothed'])
plt.fill_between(upper.index, upper,lower, color='b', alpha=.1)

---------------------------------------------------------------------------
IndexError Traceback (most recent call last)
<ipython-input-29-c01453b67fd5> in <cell line: 7>()
5 plt.plot((test))
6 conf= predictions.conf_int(alpha=0.05)
----> 7 upper = (conf['lower new_vaccinations_smoothed'])
8 lower = (conf['upper new_vaccinations_smoothed'])
9 plt.fill_between(upper.index, upper,lower, color='b', alpha=.1)

IndexError: only integers, slices (`:`), ellipsis (`...`), numpy.newaxis (`None`) and integer or boolean arrays are valid indices

In [ ]: size = int(len(hospitalized) * 0.66)

train, test = hospitalized[0:size], hospitalized[size:len(hospitalized)]
prediction = []
data = train.values
for t in test.values:
model = model = ARIMA(data,order= (2,1,2)).fit()
y = model.forecast()
prediction.append(y[0])
data = np.append(data, t)
test_res = pd.DataFrame(test)
test_res['preds'] = prediction

In [ ]: plt.figure(figsize=(15,6))
plt.plot((train))
plt.plot((test_res))

Out[ ]: [<matplotlib.lines.Line2D at 0x7c9e2ceb7010>,

<matplotlib.lines.Line2D at 0x7c9e2ceb6fe0>]

In [ ]: for column_name in df.columns:

df[column_name] = pd.to_numeric(df[column_name], errors='coerce')

corr = df.corr()
hospcorr = corr['new_vaccinations_smoothed']
hospcorr = hospcorr[np.abs(hospcorr)>0.4]
hospcorr.sort_values()

Out[ ]: stringency_index -0.574414

new_cases_smoothed 0.498517
new_cases_smoothed_per_million 0.498526
positive_rate 0.506732
total_tests 0.651580
total_tests_per_thousand 0.651585
total_deaths_per_million 0.686572
total_deaths 0.686583
total_cases_per_million 0.707083
total_cases 0.707083
people_fully_vaccinated 0.719701
people_fully_vaccinated_per_hundred 0.720430
total_vaccinations_per_hundred 0.770341
total_vaccinations 0.770371
people_vaccinated_per_hundred 0.778505
people_vaccinated 0.778598
new_vaccinations 0.804425
new_people_vaccinated_smoothed 0.947457
new_people_vaccinated_smoothed_per_hundred 0.947986
new_vaccinations_smoothed_per_million 0.999999
new_vaccinations_smoothed 1.000000
Name: new_vaccinations_smoothed, dtype: float64

In [ ]: exogfeats = df[['stringency_index','total_deaths_per_million','total_cases_per_million']]

In [ ]: for column in exogfeats.columns:

exogfeats[column]= exogfeats[column].fillna(exogfeats[column].mean())

In [ ]: exogfeats = exogfeats.resample('W-MON').mean()
exogfeats = exogfeats.iloc[(exogfeats.index >= hospitalized.first_valid_index()) & (exogfeats.index<= hospitalized.last_valid_index())]

In [ ]: fig, ax = plt.subplots(3, 1, figsize=(12, 8), tight_layout=True)

exogfeats.plot(ax=ax, subplots=True, rot=60)

Out[ ]: array([<Axes: xlabel='date'>, <Axes: xlabel='date'>,

<Axes: xlabel='date'>], dtype=object)

In [ ]: model = ARIMA(hospitalized,order= (2,1,2),exog=exogfeats).fit()

predictions = model.predict()
model.summary()

Out[ ]: SARIMAX Results

Dep. Variable: new_vaccinations_smoothed No. Observations: 45

Model: ARIMA(2, 1, 2) Log Likelihood -497.400

Date: Thu, 02 May 2024 AIC 1010.800

Time: 13:24:52 BIC 1025.074

Sample: 03-08-2021 HQIC 1016.094

- 01-10-2022

Covariance Type: opg

coef std err z P>|z| [0.025 0.975]

stringency_index -145.7513 1080.049 -0.135 0.893 -2262.608 1971.106

total_deaths_per_million 4.708e+04 2.33e+04 2.019 0.044 1365.727 9.28e+04

total_cases_per_million -164.9822 269.965 -0.611 0.541 -694.104 364.140

ar.L1 0.9271 0.176 5.279 0.000 0.583 1.271

ar.L2 -0.9354 0.162 -5.759 0.000 -1.254 -0.617

ma.L1 -0.8978 0.290 -3.092 0.002 -1.467 -0.329

ma.L2 0.8878 0.237 3.744 0.000 0.423 1.353

sigma2 4.544e+08 0.191 2.37e+09 0.000 4.54e+08 4.54e+08

Ljung-Box (L1) (Q): 0.66 Jarque-Bera (JB): 1.95

Prob(Q): 0.42 Prob(JB): 0.38

Heteroskedasticity (H): 4.95 Skew: -0.46

Prob(H) (two-sided): 0.00 Kurtosis: 3.45

Warnings:
[1] Covariance matrix calculated using the outer product of gradients (complex-step).
[2] Covariance matrix is singular or near-singular, with condition number 5.09e+26. Standard errors may be unstable.

In [ ]: plt.figure(figsize=(15,6))
plt.legend(["a","b"])
plt.plot(hospitalized)
plt.plot(predictions[1:])
plt.show()

In [ ]: test_length = 5
train = hospitalized[:-test_length]
test = hospitalized[-test_length:]
train_exog = exogfeats[:-test_length]
test_exog = exogfeats[-test_length:]
model = ARIMA(train,order= (2,1,2),exog=train_exog).fit()

In [ ]: predictions = model.get_forecast(5,exog = test_exog,alpha = 0.95)

Out[ ]: <matplotlib.collections.PolyCollection at 0x7c9e2c72dd20>

In [ ]:

Maxbox Starter149 Statistic Package Statsmodels
No ratings yet
Maxbox Starter149 Statistic Package Statsmodels
9 pages
Sales Forecasting
100% (1)
Sales Forecasting
10 pages
ML Lab6.Ipynb - Colaboratory
100% (1)
ML Lab6.Ipynb - Colaboratory
5 pages
Regression Anallysis Hands0n 1
100% (1)
Regression Anallysis Hands0n 1
3 pages
FINALREPORTGROUP
No ratings yet
FINALREPORTGROUP
41 pages
CS2 CMP Upgrade 2022
No ratings yet
CS2 CMP Upgrade 2022
148 pages
18BCE10291 - Outliers Assignment
No ratings yet
18BCE10291 - Outliers Assignment
10 pages
TP Regression
100% (1)
TP Regression
1 page
EVS-EN ISO 19650-4
No ratings yet
EVS-EN ISO 19650-4
20 pages
CS2 CMP Upgrade 2022
No ratings yet
CS2 CMP Upgrade 2022
128 pages
M4M 30 - User - Manual - PDF
No ratings yet
M4M 30 - User - Manual - PDF
84 pages
Distributed Operating System - Wikipedia
No ratings yet
Distributed Operating System - Wikipedia
53 pages
Kata Pengantar Vano
No ratings yet
Kata Pengantar Vano
86 pages
Cyber Security Notes Unit 4
No ratings yet
Cyber Security Notes Unit 4
15 pages
AZURE HANDOUTS
No ratings yet
AZURE HANDOUTS
45 pages
30-Day Planner
No ratings yet
30-Day Planner
29 pages
DIT 0102 - Word Manual
No ratings yet
DIT 0102 - Word Manual
58 pages
Multi-Programmer User Guide (PC+Tool)
No ratings yet
Multi-Programmer User Guide (PC+Tool)
32 pages
Teste
No ratings yet
Teste
42 pages
Chapter 4 Compute Architecture and s 2023 Programming Massively Parallel P
No ratings yet
Chapter 4 Compute Architecture and s 2023 Programming Massively Parallel P
24 pages
SRM Instructions UG
No ratings yet
SRM Instructions UG
38 pages
ARIMA Models in Python Chapter2
No ratings yet
ARIMA Models in Python Chapter2
43 pages
Unit 4 - Games
No ratings yet
Unit 4 - Games
23 pages
Onboarding Guide
No ratings yet
Onboarding Guide
21 pages
Tutorial - How To Use Dropbox Behind A Corporate Proxy Server Using CNTLM - I Code and Code
No ratings yet
Tutorial - How To Use Dropbox Behind A Corporate Proxy Server Using CNTLM - I Code and Code
12 pages
Apoorva p 17th March TSF
No ratings yet
Apoorva p 17th March TSF
47 pages
ForecastingIndividualassignment MohammadMujtaba 12020063
No ratings yet
ForecastingIndividualassignment MohammadMujtaba 12020063
20 pages
Kotlin 1 5 If - When
No ratings yet
Kotlin 1 5 If - When
12 pages
Tarea de Ma
No ratings yet
Tarea de Ma
18 pages
Bda Assign
No ratings yet
Bda Assign
15 pages
PPP Models - GARCH & NARNN - Ipynb - Colaboratory
No ratings yet
PPP Models - GARCH & NARNN - Ipynb - Colaboratory
13 pages
Agreed Terms & Condition
No ratings yet
Agreed Terms & Condition
15 pages
Sen Answer Class Test 1
No ratings yet
Sen Answer Class Test 1
14 pages
Huraira
No ratings yet
Huraira
26 pages
Unit 4: Process Automation in Manufacturing and Supply Chain - Part 1
No ratings yet
Unit 4: Process Automation in Manufacturing and Supply Chain - Part 1
8 pages
Data Analytics
No ratings yet
Data Analytics
18 pages
Hasil Dan Analisa Data Bru
No ratings yet
Hasil Dan Analisa Data Bru
25 pages
AQL Based Acceptance Sampling Schemes
No ratings yet
AQL Based Acceptance Sampling Schemes
11 pages
FCUBS 14.5 - L1 Technical Training Plan - BB Bank - v1
No ratings yet
FCUBS 14.5 - L1 Technical Training Plan - BB Bank - v1
9 pages
Society Management System
No ratings yet
Society Management System
8 pages
Interview Questions Part 1
No ratings yet
Interview Questions Part 1
8 pages
PPP Models - ARIMA & NARNN - Ipynb - Colaboratory
No ratings yet
PPP Models - ARIMA & NARNN - Ipynb - Colaboratory
8 pages
Exercise 6: Time Series Analysis and Stochastic Modelling
No ratings yet
Exercise 6: Time Series Analysis and Stochastic Modelling
18 pages
Soruma SECOND ASSEsiment Final l Reg
No ratings yet
Soruma SECOND ASSEsiment Final l Reg
34 pages
FINAL (اسئلة متوقعة تيجي في الامتحان)
No ratings yet
FINAL (اسئلة متوقعة تيجي في الامتحان)
7 pages
CPI.vt (1)
No ratings yet
CPI.vt (1)
11 pages
R Abal
No ratings yet
R Abal
13 pages
Modules
No ratings yet
Modules
12 pages
Sarima
No ratings yet
Sarima
7 pages
PPP Models - SARIMA & NARNN - Ipynb - Colaboratory
No ratings yet
PPP Models - SARIMA & NARNN - Ipynb - Colaboratory
8 pages
Untitled 11
No ratings yet
Untitled 11
12 pages
Output - Group - Work - Project - 4652 - GWP1.ipynb - Colaboratory
No ratings yet
Output - Group - Work - Project - 4652 - GWP1.ipynb - Colaboratory
6 pages
EJEMPLO
No ratings yet
EJEMPLO
11 pages
Arima Model
No ratings yet
Arima Model
6 pages
TestExercise 3.ipynb - Colab
No ratings yet
TestExercise 3.ipynb - Colab
8 pages
Ilovepdf Merged
No ratings yet
Ilovepdf Merged
13 pages
Week 2 MrSumanBera HandsOn
No ratings yet
Week 2 MrSumanBera HandsOn
9 pages
Practicals Data
No ratings yet
Practicals Data
26 pages
Pronóstico: Leer Datos
No ratings yet
Pronóstico: Leer Datos
5 pages
Maisam CV Latest
No ratings yet
Maisam CV Latest
3 pages
Simple_and_Multiple_Regression
No ratings yet
Simple_and_Multiple_Regression
9 pages
Ausimm Paper Template
No ratings yet
Ausimm Paper Template
3 pages
Unit 1 - Unit 4 Links Crypto
No ratings yet
Unit 1 - Unit 4 Links Crypto
3 pages
Linear Regression
No ratings yet
Linear Regression
7 pages
OLSLinear Regquestion
No ratings yet
OLSLinear Regquestion
5 pages
Assignment 6
No ratings yet
Assignment 6
6 pages
Da 5
No ratings yet
Da 5
3 pages
Kuldeep Cv
No ratings yet
Kuldeep Cv
2 pages
DA EXP 07
No ratings yet
DA EXP 07
6 pages
percobaan 3
No ratings yet
percobaan 3
14 pages
run stata 17-11
No ratings yet
run stata 17-11
7 pages
Percobaan 16 Nov(2)
No ratings yet
Percobaan 16 Nov(2)
7 pages
Uji Asumsi Klasik 1
No ratings yet
Uji Asumsi Klasik 1
6 pages
Itvoyagers Bi Practical 10 Mu Tyit
No ratings yet
Itvoyagers Bi Practical 10 Mu Tyit
8 pages
Ecotric Project
No ratings yet
Ecotric Project
3 pages
TMT Procedure - Management Review P2
No ratings yet
TMT Procedure - Management Review P2
1 page
assignment2
No ratings yet
assignment2
5 pages
7
No ratings yet
7
5 pages
9
No ratings yet
9
5 pages
Transport Sync-Up Process Document: Sap/ Sunil Ghatage
No ratings yet
Transport Sync-Up Process Document: Sap/ Sunil Ghatage
8 pages
samp_doc
No ratings yet
samp_doc
4 pages
R-code
No ratings yet
R-code
7 pages
Percobaan 19 Nov
No ratings yet
Percobaan 19 Nov
7 pages
ARIMA Predict Forecast
No ratings yet
ARIMA Predict Forecast
1 page
Percobaan 19 Nov 15-19
No ratings yet
Percobaan 19 Nov 15-19
4 pages
annotated-Lab 1 Spring 2025 Assignment.Rmd
No ratings yet
annotated-Lab 1 Spring 2025 Assignment.Rmd
3 pages
Pregunta 5
No ratings yet
Pregunta 5
2 pages
Assignment_1_Tuneer (1)
No ratings yet
Assignment_1_Tuneer (1)
5 pages
Project
No ratings yet
Project
16 pages
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet