By: Akul Gokaram
For as long as civilization has existed, people have pursued wealth. Opulent depictions of overflowing riches stir a drive in just about anyone. Desire aside, in the modern world wealth is practically synonymous with living, in the sense that the world revolves around money. Today, many people relentlessly strive toward the financial freedom that will allow them to do what they desire. With the development of technology, that goal has become even more reachable. Among the wealth of information online about income stream diversification and other wealth management techniques, one concept has stood out the most: investing.
Investing in real estate, the stock market, and other commodities has long been a common path toward financial stability and building wealth. As technology developed, the next innovation came along and revolutionized the game in many ways: blockchain technology. With the way blockchain transformed how data is held, it was bound for success. A surge of interest grew around this new technology and a market developed with it, transforming old industries and giving birth to new ones. One of the things that came about through blockchain technology is cryptocurrency: a digital currency that completely changed the game. The market for cryptocurrencies grew from its initial start years ago until a recent surge driven by key events. At one point, one of the most popular cryptocurrencies, Bitcoin, nearly reached a staggering peak value of $70,000 USD.
In the stock market, it is common to use computers and algorithms to predict market trends and invest according to those predictions, a practice commonly known as algorithmic trading. The same concept translates naturally to cryptocurrencies, since they trade much like stocks while representing something entirely different. Additionally, cryptocurrencies are not yet as tightly regulated as traditional stocks, which some people would consider a positive. So what better time than now to take advantage of this? With the power of data science and the internet, we can use cryptocurrency to pursue a more financially secure life.
In this tutorial, our goal is to analyze historical OHLCV (open, high, low, close, volume) data for the current top cryptocurrencies, examine correlations in the characteristics of that data, and create a model to predict the OHLCV of those top 10 cryptocurrencies. We can do this by following the steps of the data science lifecycle, which consists of:
Okay, now that we have a basic understanding of what our data is and what our objectives are, we can get started. So let's get to it!
These are all of the libraries that we will be using in this tutorial to carry out various steps of the data science lifecycle.
import requests as r
from bs4 import BeautifulSoup
import json
import pandas as pd
from Historic_Crypto import HistoricalData
from Historic_Crypto import Cryptocurrencies
from datetime import datetime
import datetime as dt
import numpy as np
import plotly.io as pio
import plotly.graph_objects as go
import plotly.express as px
from plotly.subplots import make_subplots
from sklearn.preprocessing import MinMaxScaler
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_squared_error, r2_score
from sklearn.model_selection import train_test_split
from keras.models import Sequential
from keras.layers import LSTM, Dense
# Required settings in order for plotly to render properly. Will cover plotly later in the tutorial
pio.renderers.default = "notebook+plotly_mimetype+png+jpeg+svg+pdf"
Okay, now that we have imported all of our relevant libraries, we can go ahead and move onto the first part of the data science lifecycle: data collection.
To gather our data, we are going to do a couple of things. We need to know the top 10 cryptocurrencies by market cap, so we will web scrape to find them. Additionally, we need historical data for those cryptocurrencies. For this, we have a CSV file that contains the majority of the data we are looking for. However, we run into an issue here: the data only runs up to October 2022. To get the rest of the data we need a different source, so we will use a price-tracking service to fill in the remainder. We will handle that part of the collection later, as we need to follow a certain order of operations to make sure we don't gather more data than we need. More on this later.
Okay, to find the current top cryptocurrencies we can scrape CoinMarketCap, a price-tracking service for cryptoassets. We will grab the table of cryptocurrencies ordered by descending market cap from its homepage, which is the criterion we are using to determine the "top" cryptocurrencies. You can view a picture of the homepage and part of the target table below:
In order to do this, we can use the requests library and then use BeautifulSoup to filter through the results and find the current top cryptocurrencies. The requests library is an HTTP library for Python; if you would like to learn more, click here.
After we find the top cryptocurrencies, we can cross-check them against a Kaggle dataset that contains historical data on various cryptocurrencies from 2013 through October 2022. To view the dataset on Kaggle, click here.
Okay, now that we know what we are collecting, we can get started. First, we will get the list of the top cryptocurrencies, where "top" is determined by market cap.
# Defining the URL of the webpage that we would like to make a GET request.
cmp_url = "https://coinmarketcap.com/"
# Executing the GET request using requests library.
result = r.get(cmp_url)
# Printing to see if the request went through and what the status of the request is.
print(result)
<Response [200]>
Okay great! It looks like our request for the HTML was successful, as indicated by the output: a 200 response means that the GET request was OK. If you would like to learn more about response codes and what they mean, check out this [link](https://learning.mlytics.com/the-internet/http-response-status-codes/#:~:text=HTTP%20response%20status%20codes%20(or,responded%20to%20the%20client%27s%20request.).
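As a quick stdlib-only sketch of the status-code families (illustrative, not part of the scraping pipeline), Python's `http.HTTPStatus` enum maps codes to their meanings:

```python
from http import HTTPStatus

# 2xx codes indicate success, 4xx client errors, 5xx server errors.
status = HTTPStatus(200)
print(status.phrase)            # "OK" -- the reason phrase for the code
print(200 <= status < 300)      # True -- falls in the success family
print(HTTPStatus(404).phrase)   # "Not Found" -- a client error
```

A common defensive pattern with requests is `result.raise_for_status()`, which raises an exception for any 4xx/5xx response instead of silently continuing.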
Now that we have the response from our GET request, we can use BeautifulSoup to process the HTML and get the names of the top cryptocurrencies. BeautifulSoup is a library that makes it easy to scrape information from web pages, such as the HTML our request returns. We will be using the find function to locate the table. The find function returns the first tag that meets the criteria specified in its parameters, within the segment of HTML currently being searched. To learn more about BeautifulSoup, click here.
After locating the HTML segment, we want to read it in and turn it into something easier to use for analysis; we will use Pandas for this. Pandas is one of the most popular Python libraries for data analysis. It stores data in a tabular format called a dataframe, on which we can execute a multitude of operations to better analyze the data. If you would like to learn more about Pandas, click here.
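Before running this on the real page, here is a small self-contained sketch of the find-then-dataframe pattern on a toy HTML snippet (the class name and values here are invented for illustration):

```python
from bs4 import BeautifulSoup
import pandas as pd

# A toy HTML snippet standing in for the real page.
html = """
<body>
  <div class="table-wrapper">
    <table>
      <tr><th>Name</th><th>Price</th></tr>
      <tr><td>Bitcoin</td><td>26467.81</td></tr>
      <tr><td>Ethereum</td><td>1788.10</td></tr>
    </table>
  </div>
</body>
"""

root = BeautifulSoup(html, "html.parser")
# find() returns the first matching tag; a dict narrows the match by attributes.
table = root.find("div", {"class": "table-wrapper"}).find("table")

# Pull the header and body cells out of the located table and load them into a dataframe.
header = [th.get_text() for th in table.find_all("th")]
rows = [[td.get_text() for td in tr.find_all("td")] for tr in table.find_all("tr")[1:]]
df = pd.DataFrame(rows, columns=header)
print(df.shape)  # (2, 2)
```

On the real page we will let `pd.read_html` do this cell extraction for us, but the idea is the same: navigate to the table with find, then hand it to pandas.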
# Passing in the raw HTML content (and an explicit parser) to set up BeautifulSoup for data extraction.
root = BeautifulSoup(result.content, "html.parser")
# Getting to the body of the HTML document so that we can start searching for the table
root = root.find("body", {"class": "DAY"})
# Navigating through body to get to the page division that contains the table
root = root.find("div").find("div").find("div").find("div", {"class" : "cmc-body-wrapper"}).find("div") \
.find("div").find("div", {"class" : "sc-beb003d5-2 bkNrIb"}).find("table")
# Utilizing the built in function for reading HTML to process the data into a list of information
top_crypto_df_list = pd.read_html(root.prettify())
# Putting together the elements of the list of information to form a dataframe
top_crypto_df = pd.concat(top_crypto_df_list)
# Viewing the first 10 entries in the dataframe
top_crypto_df.head(10)
Unnamed: 0 | # | Name | Price | 1h % | 24h % | 7d % | Market Cap | Volume(24h) | Circulating Supply | Last 7 Days | Unnamed: 11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | NaN | 1.0 | Bitcoin 1 BTC | $26,467.81 | 0.64% | 1.45% | 10.31% | $512.52B $512,517,484,139 | $17,908,091,334 676,863 BTC | 19,371,375 BTC | NaN | NaN |
1 | NaN | 2.0 | Ethereum 2 ETH | $1,788.10 | 0.99% | 0.10% | 10.02% | $220.01B $220,005,830,732 | $8,338,380,767 4,654,292 ETH | 122,802,176 ETH | NaN | NaN |
2 | NaN | 3.0 | Tether 3 USDT | $1.00 | 0.04% | 0.05% | 0.02% | $82.79B $82,788,137,577 | $26,881,856,452 26,861,845,571 USDT | 82,726,510,004 USDT | NaN | NaN |
3 | NaN | 4.0 | BNB 4 BNB | $306.26 | 0.21% | 0.06% | 6.18% | $47.75B $47,752,156,743 | $487,392,775 1,590,821 BNB | 155,860,209 BNB | NaN | NaN |
4 | NaN | 5.0 | USD Coin 5 USDC | $1.00 | 0.04% | 0.06% | 0.02% | $29.97B $29,967,992,391 | $3,962,403,789 3,961,076,343 USDC | 29,957,952,807 USDC | NaN | NaN |
5 | NaN | 6.0 | XRP 6 XRP | $0.4249 | 0.48% | 2.16% | 9.20% | $22.03B $22,026,197,113 | $1,150,113,730 2,706,749,094 XRP | 51,837,820,505 XRP | NaN | NaN |
6 | NaN | 7.0 | Cardano 7 ADA | $0.3608 | 0.23% | 2.00% | 8.48% | $12.57B $12,571,058,654 | $243,247,046 674,180,030 ADA | 34,841,766,154 ADA | NaN | NaN |
7 | NaN | 8.0 | Dogecoin 8 DOGE | $0.07128 | 0.13% | 1.35% | 10.29% | $9.93B $9,930,789,434 | $373,075,835 5,233,844,884 DOGE | 139,318,086,384 DOGE | NaN | NaN |
8 | NaN | 9.0 | Solana 9 SOL | $20.49 | 0.71% | 2.38% | 10.57% | $8.10B $8,102,862,403 | $326,094,987 15,912,803 SOL | 395,403,978 SOL | NaN | NaN |
9 | NaN | 10.0 | Polygon 10 MATIC | $0.8479 | 1.43% | 1.22% | 15.43% | $7.84B $7,842,302,945 | $439,832,282 518,752,605 MATIC | 9,249,469,069 MATIC | NaN | NaN |
Okay, nice! What we see above are the first 10 entries of the CoinMarketCap website table. The table looks somewhat unpleasant, and the name is difficult to extract, but this will be resolved when we clean the table later.
Now that we have our top cryptocurrencies by market cap, the next thing we must do is read in the CSV containing the historical dataset. A CSV is a comma-separated values text file and is a common way of storing data. If you would like to learn more about CSVs, please click here.
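As a tiny illustration of the format (the values here are invented), a CSV is just text with one record per line and commas between fields, which read_csv parses straight into a dataframe. An in-memory file-like object stands in for a file on disk:

```python
import pandas as pd
from io import StringIO

# An in-memory stand-in for a CSV file on disk; the values are made up for illustration.
csv_text = """crypto_name,date,close
Bitcoin,2013-05-05,115.910004
Litecoin,2013-05-05,3.590890
"""

# read_csv accepts a file path or any file-like object.
df = pd.read_csv(StringIO(csv_text))
print(df.shape)  # (2, 3)
```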
I have downloaded the CSV file to the folder that contains this notebook so that I can reference it by relative path, and I would advise you to do the same to follow along with this tutorial. To load our CSV, we can use pandas' built-in read_csv function.
# Reading in CSV of historical data
historical_data_df = pd.read_csv('dataset.csv')
# Viewing the dataframe constructed from the CSV.
historical_data_df
Unnamed: 0 | open | high | low | close | volume | marketCap | timestamp | crypto_name | date | |
---|---|---|---|---|---|---|---|---|---|---|
0 | 0 | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 1.288693e+09 | 2013-05-05T23:59:59.999Z | Bitcoin | 2013-05-05 |
1 | 1 | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 | 6.229819e+07 | 2013-05-05T23:59:59.999Z | Litecoin | 2013-05-05 |
2 | 2 | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 1.249023e+09 | 2013-05-06T23:59:59.999Z | Bitcoin | 2013-05-06 |
3 | 3 | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 | 5.859436e+07 | 2013-05-06T23:59:59.999Z | Litecoin | 2013-05-06 |
4 | 4 | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 1.240594e+09 | 2013-05-07T23:59:59.999Z | Bitcoin | 2013-05-07 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
72941 | 72941 | 0.022604 | 0.022988 | 0.022197 | 0.022796 | 4.040134e+07 | 1.652957e+09 | 2022-10-23T23:59:59.999Z | VeChain | 2022-10-23 |
72942 | 72942 | 1.468244 | 1.530464 | 1.435415 | 1.517878 | 2.844351e+07 | 1.572825e+09 | 2022-10-23T23:59:59.999Z | Flow | 2022-10-23 |
72943 | 72943 | 4.950431 | 5.148565 | 4.945280 | 5.117206 | 1.069497e+08 | 1.559551e+09 | 2022-10-23T23:59:59.999Z | Filecoin | 2022-10-23 |
72944 | 72944 | 0.000233 | 0.000243 | 0.000226 | 0.000239 | 2.143268e+08 | 1.576291e+09 | 2022-10-23T23:59:59.999Z | Terra Classic | 2022-10-23 |
72945 | 72945 | 0.465490 | 0.471006 | 0.453438 | 0.469033 | 9.509743e+08 | 2.339868e+10 | 2022-10-23T23:59:59.999Z | XRP | 2022-10-23 |
72946 rows × 10 columns
Nice! We can see that we have successfully loaded our data from the CSV into a dataframe. Now that we have the majority of the data, we need to supplement the rest so that we have more up-to-date information. To do this, we will use a library that fetches it for us.
In this part of the data science lifecycle, what we typically do is scrub the data that we have gathered. This can consist of many different actions and is dependent on what you want to do with your data. Some common actions are reformulating column values, removing missing or null values and combining dataframes into structures that are easier to use.
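The common actions mentioned above can be sketched on a toy dataframe (the values here are invented for illustration):

```python
import pandas as pd
import numpy as np

# Two small dataframes with a missing value, standing in for freshly gathered data.
a = pd.DataFrame({"Name": ["Bitcoin", "Ethereum"], "Price": [26467.81, np.nan]})
b = pd.DataFrame({"Name": ["Tether"], "Price": [1.00]})

# Combining dataframes into one structure that is easier to use...
combined = pd.concat([a, b], ignore_index=True)
# ...removing rows with missing or null values...
cleaned = combined.dropna()
# ...and reformulating a column's values.
cleaned = cleaned.assign(Price=cleaned["Price"].round(0))
print(len(cleaned))  # 2 -- the row with the missing price is gone
```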
In our case, what we need to do is clean up our top 10 cryptocurrencies list and retrieve a proper list of the top 10 cryptocurrencies names so that we can then gather only that data from our historical cryptocurrency dataframe. Additionally, we need to clean up some of the columns in our dataframe so that the values are more understandable.
Here are the specifics for both of the data sources:
Okay, now that we know what we are doing, let's get to it!
Okay, let's get started on cleaning the top 10 dataframe and retrieving our top 10 list.
The first thing we are going to do is clean this dataset a little by getting rid of columns that hold no useful values. We can see from the output above that some columns turned out a bit weird from the scraping, so we will get rid of those. In particular, we will drop the columns "#", "Last 7 Days", "Unnamed: 0", and "Unnamed: 11", using the drop function built into pandas.
top_crypto_df = top_crypto_df.drop(columns=['Last 7 Days', 'Unnamed: 0', 'Unnamed: 11', '#'])
top_crypto_df
Name | Price | 1h % | 24h % | 7d % | Market Cap | Volume(24h) | Circulating Supply | |
---|---|---|---|---|---|---|---|---|
0 | Bitcoin 1 BTC | $26,467.81 | 0.64% | 1.45% | 10.31% | $512.52B $512,517,484,139 | $17,908,091,334 676,863 BTC | 19,371,375 BTC |
1 | Ethereum 2 ETH | $1,788.10 | 0.99% | 0.10% | 10.02% | $220.01B $220,005,830,732 | $8,338,380,767 4,654,292 ETH | 122,802,176 ETH |
2 | Tether 3 USDT | $1.00 | 0.04% | 0.05% | 0.02% | $82.79B $82,788,137,577 | $26,881,856,452 26,861,845,571 USDT | 82,726,510,004 USDT |
3 | BNB 4 BNB | $306.26 | 0.21% | 0.06% | 6.18% | $47.75B $47,752,156,743 | $487,392,775 1,590,821 BNB | 155,860,209 BNB |
4 | USD Coin 5 USDC | $1.00 | 0.04% | 0.06% | 0.02% | $29.97B $29,967,992,391 | $3,962,403,789 3,961,076,343 USDC | 29,957,952,807 USDC |
... | ... | ... | ... | ... | ... | ... | ... | ... |
95 | PancakeSwap CAKE | $ 1.79 | NaN | NaN | NaN | NaN | NaN | NaN |
96 | Convex Finance CVX | $ 4.45 | NaN | NaN | NaN | NaN | NaN | NaN |
97 | FLOKI FLOKI | $ 0.00 | NaN | NaN | NaN | NaN | NaN | NaN |
98 | 1inch Network 1INCH | $ 0.41 | NaN | NaN | NaN | NaN | NaN | NaN |
99 | Enjin Coin ENJ | $ 0.33 | NaN | NaN | NaN | NaN | NaN | NaN |
100 rows × 8 columns
Okay, nice! This is already looking much better. Now that we have gotten rid of the columns that have no value, the next step is to reformulate the name column to contain only the name, rather than extraneous information that would make it hard to process the historical dataframe.
What we are going to do is process the string in the name field and split it by spaces. Then we can keep the first part of the split, which is the name of the coin, and the last part, which is the ticker. We discard the number, since the natural ordering of the dataframe already gives us what we want. We can carry this out as a column operation so that we don't have to loop through the table manually: we cast the column data to type string and then use the split() function to break each string into a list of substrings, split on the separator we specify. After that, we can use indexing and save the data accordingly.
# Carrying out as a column operation.
# Taking the value in name, splitting it, and putting the last element of the resultant list as the ticker
# and making the first value of the resultant list the name
top_crypto_df['Ticker'] = top_crypto_df['Name'].str.split(" ").str[-1] # Gets the last element in the list
top_crypto_df['Name'] = top_crypto_df['Name'].str.split(" ").str[0]
top_crypto_df
Name | Price | 1h % | 24h % | 7d % | Market Cap | Volume(24h) | Circulating Supply | Ticker | |
---|---|---|---|---|---|---|---|---|---|
0 | Bitcoin | $26,467.81 | 0.64% | 1.45% | 10.31% | $512.52B $512,517,484,139 | $17,908,091,334 676,863 BTC | 19,371,375 BTC | Bitcoin |
1 | Ethereum | $1,788.10 | 0.99% | 0.10% | 10.02% | $220.01B $220,005,830,732 | $8,338,380,767 4,654,292 ETH | 122,802,176 ETH | Ethereum |
2 | Tether | $1.00 | 0.04% | 0.05% | 0.02% | $82.79B $82,788,137,577 | $26,881,856,452 26,861,845,571 USDT | 82,726,510,004 USDT | Tether |
3 | BNB | $306.26 | 0.21% | 0.06% | 6.18% | $47.75B $47,752,156,743 | $487,392,775 1,590,821 BNB | 155,860,209 BNB | BNB |
4 | USD | $1.00 | 0.04% | 0.06% | 0.02% | $29.97B $29,967,992,391 | $3,962,403,789 3,961,076,343 USDC | 29,957,952,807 USDC | USD |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
95 | PancakeSwap | $ 1.79 | NaN | NaN | NaN | NaN | NaN | NaN | PancakeSwap |
96 | Convex | $ 4.45 | NaN | NaN | NaN | NaN | NaN | NaN | Convex |
97 | FLOKI | $ 0.00 | NaN | NaN | NaN | NaN | NaN | NaN | FLOKI |
98 | 1inch | $ 0.41 | NaN | NaN | NaN | NaN | NaN | NaN | 1inch |
99 | Enjin | $ 0.33 | NaN | NaN | NaN | NaN | NaN | NaN | Enjin |
100 rows × 9 columns
Okay, now when you look at the name column, you see only the name of the coin, as expected. Additionally, the ticker has been added at the end, just in case. Now we can extract a list of the top 10 cryptocurrencies by market cap, as we will need it for the next dataset we are cleaning.
# Here, we get the top 10 rows and then take the Name column, giving us a Pandas series of the top 10 names.
top_10_list = top_crypto_df.head(10)['Name']
# Now we want the series as a list of strings, so we cast the series to string type and then convert it
# to a list using the built-in function.
top_10_list = top_10_list.astype(str).tolist()
print(top_10_list)
['Bitcoin', 'Ethereum', 'Tether', 'BNB', 'USD', 'XRP', 'Cardano', 'Dogecoin', 'Solana', 'Polygon']
As we can see, we can now retrieve a list of the cryptocurrencies with the 10 largest market caps (note that "USD" above is an artifact of splitting "USD Coin" on spaces). However, we must cross-reference this with our data sources to see whether they cover these 10, and then select the 10 biggest that are available in all of our sources.
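One way to sketch that cross-check (the lists here are illustrative; the column name follows the historical dataframe loaded earlier) is to keep only the scraped names that the historical source actually covers, preserving rank order:

```python
import pandas as pd

# Illustrative stand-ins: names scraped from the site and names present in the historical CSV.
scraped_names = ["Bitcoin", "Ethereum", "Tether", "USD", "XRP"]
historical = pd.DataFrame({"crypto_name": ["Bitcoin", "Ethereum", "Tether", "XRP", "Litecoin"]})

# Keep only the scraped names the historical source covers, preserving market-cap order.
covered = set(historical["crypto_name"])
available_names = [n for n in scraped_names if n in covered]
print(available_names)  # ['Bitcoin', 'Ethereum', 'Tether', 'XRP']
```

In the actual pipeline below we additionally check availability against the Coinbase Pro API, but the filtering idea is the same.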
Okay, now that our top 10 dataframe is cleaned up and we have a list of the data we would like to keep, we can go about cleaning the historical dataframe so that it contains daily data pertaining only to the cryptocurrencies we are interested in, and make sure the data is as recent as possible.
Before we clean, we need to make sure our data is complete and up to date. To do that, we can use a Python library that calls the Coinbase Pro API to retrieve the data for us. API stands for Application Programming Interface; if you would like to learn more, click here. We will only retrieve the missing data for our top 10, as it is pointless to gather data for the rest when we don't need it.
Retrieving our top 10 is not as simple as pulling the 10 entries with the largest market capitalizations. We need to double-check that, for each of the topmost entries, the Coinbase Pro API our library interacts with supports that cryptocurrency. When that criterion is met, the next thing to check is that the information on that coin is currently retrievable. If either condition is not met, we exclude that currency from our top 10 and move further down the list until we find a combination of cryptocurrencies that meets our requirements.
# We need to check if the library can get data on our top 10; if not, we can just shift further down
# the list and get the top 10 that are retrievable.
# The library returns all of the possible tickers if none match the search criteria. In order to figure
# out if this is what happened, we call it once with no search string and save the number of rows returned.
not_possible = (Cryptocurrencies(extended_output=False).find_crypto_pairs()).shape[0]
available = []
count = 10
while len(available) != 10:
    # Since the library function requires the ticker and currency, we can get the tickers for the top
    # entries in top_crypto_df and then append USD to the value, since the rest of our data is in USD as well.
    top_10_ticker_list = top_crypto_df.head(count)['Ticker']
    top_10_name_list = top_crypto_df.head(count)['Name']
    top_10_ticker_list = top_10_ticker_list.astype(str).tolist()
    top_10_name_list = top_10_name_list.astype(str).tolist()
    combined_top_10_list = list(zip(top_10_name_list, top_10_ticker_list))
    # Resetting for this iteration
    available = []
    # Looping through the current options and checking which are available and which are not
    for name, ticker in combined_top_10_list:
        ticker_info = ticker + '-USD'
        options = Cryptocurrencies(coin_search=ticker_info, extended_output=False).find_crypto_pairs()
        # Okay, so we know that the symbol is available; now we need to check that the specific one
        # that we want is online
        if options.shape[0] != not_possible:
            if 'delisted' not in options.loc[options['id'] == ticker_info]['status'].astype('str').tolist():
                available.append((name, ticker))
    count += 1

# Looping through and printing out the results
idx = 1
print("Our list is as follows\n")
for name, ticker in available:
    print(f"{idx}: {name} - {ticker}")
    idx += 1
print("\n")
top_10_list = available
Connected to the CoinBase Pro API. Extended Output is False, returning reduced dataset.
Connected to the CoinBase Pro API. Found 4 instances containing the term BTC-USD. Extended Output is False, returning reduced dataset.
Connected to the CoinBase Pro API. Found 5 instances containing the term ETH-USD. Extended Output is False, returning reduced dataset.
Connected to the CoinBase Pro API. Found 2 instances containing the term USDT-USD. Extended Output is False, returning reduced dataset.
Connected to the CoinBase Pro API. Unable to find specific search term, returning all available data. Extended Output is False, returning reduced dataset.
...
Connected to the CoinBase Pro API. Found 2 instances containing the term SHIB-USD. Extended Output is False, returning reduced dataset.

Our list is as follows

1: Bitcoin - BTC
2: Ethereum - ETH
3: Tether - USDT
4: Cardano - ADA
5: Dogecoin - DOGE
6: Solana - SOL
7: Polygon - MATIC
8: Polkadot - DOT
9: Litecoin - LTC
10: Shiba - SHIB
If we look closely, we can see that at the bottom of the execution output there is a list of 10 cryptocurrencies with their tickers. Now that we have our top 10 that are available to get data for, we can go ahead and retrieve the data for them and save it to our dataframe. We will do this by making a new empty dataframe to hold the consolidated results, then iterating through our top 10 list and using our library to gather the relevant information.
# We will loop through the top 10 list we made and gather the data for each coin in a new dataframe.
# Making an empty dataframe so we can store the data.
top_10_recent = pd.DataFrame()
# Since our start date from when we want to start gathering data doesn't change, we can just hardcode it.
start_date = '2022-10-24-00-00'
for name, ticker in top_10_list:
    ticker_info = ticker + '-USD'
    # This is the interval between datapoints; 86400 seconds is one day, which is what we want.
    granularity = 86400
    request_df = HistoricalData(ticker_info, granularity, start_date).retrieve_data()
    # Adding name and ticker to the resulting df for consistency with the other data source
    # and so that we know what coin the data corresponds to.
    request_df['Name'] = name
    request_df['Ticker'] = ticker
    # Adding the result data to the dataframe holding the results of all the top 10.
    top_10_recent = pd.concat([top_10_recent, request_df])
top_10_recent
Checking input parameters are in the correct format. Formatting Dates. Checking if user supplied is available on the CoinBase Pro API. Connected to the CoinBase Pro API. Ticker 'BTC-USD' found at the CoinBase Pro API, continuing to extraction. Retrieved Data from Coinbase Pro API. Returning data. [The same log sequence repeats for ETH-USD, USDT-USD, ADA-USD, DOGE-USD, SOL-USD, MATIC-USD, DOT-USD, LTC-USD, and SHIB-USD.]
low | high | open | close | volume | Name | Ticker | |
---|---|---|---|---|---|---|---|
time | |||||||
2022-10-24 | 19159.350000 | 19603.570000 | 19572.200000 | 19330.410000 | 2.943258e+04 | Bitcoin | BTC |
2022-10-25 | 19240.760000 | 20420.880000 | 19332.110000 | 20086.280000 | 4.245234e+04 | Bitcoin | BTC |
2022-10-26 | 20055.850000 | 21022.810000 | 20086.270000 | 20775.400000 | 4.361899e+04 | Bitcoin | BTC |
2022-10-27 | 20196.010000 | 20878.170000 | 20773.590000 | 20296.970000 | 3.412358e+04 | Bitcoin | BTC |
2022-10-28 | 20000.000000 | 20755.090000 | 20295.770000 | 20597.910000 | 2.958175e+04 | Bitcoin | BTC |
... | ... | ... | ... | ... | ... | ... | ... |
2023-05-08 | 0.000008 | 0.000009 | 0.000009 | 0.000009 | 1.680438e+12 | Shiba | SHIB |
2023-05-09 | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.494224e+11 | Shiba | SHIB |
2023-05-10 | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.374366e+11 | Shiba | SHIB |
2023-05-11 | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.152456e+11 | Shiba | SHIB |
2023-05-12 | 0.000008 | 0.000009 | 0.000009 | 0.000009 | 7.590283e+11 | Shiba | SHIB |
2010 rows × 7 columns
We have now retrieved the more recent OHLCV data for our top 10 and added the name and ticker as columns as well. What we need to do next is refine both sets and put them together to form our final dataset for analysis.
Now that we have our more recent data, which is from October 24th 2022 to the most recent data, we can now prepare this dataset to join into our main dataset.
The first step in cleaning the recent data is to fix the date column. As we can see in the output above, the date column is labeled time and serves as the index of the dataframe. We will need to change this to make sure that this data joins smoothly with the historical dataframe. After we fix the date column, we will change the types of the name and ticker columns so that they are strings.
top_10_recent.info()
<class 'pandas.core.frame.DataFrame'> DatetimeIndex: 2010 entries, 2022-10-24 to 2023-05-12 Data columns (total 7 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 low 2010 non-null float64 1 high 2010 non-null float64 2 open 2010 non-null float64 3 close 2010 non-null float64 4 volume 2010 non-null float64 5 Name 2010 non-null object 6 Ticker 2010 non-null object dtypes: float64(5), object(2) memory usage: 125.6+ KB
As we can see here, the time column does not even show up, as it has been set as the index. To fix this we will call the pandas reset_index
function, which will have the dataframe use a default index and take the old index and append it as a column to the dataframe.
top_10_recent = top_10_recent.reset_index()
top_10_recent
time | low | high | open | close | volume | Name | Ticker | |
---|---|---|---|---|---|---|---|---|
0 | 2022-10-24 | 19159.350000 | 19603.570000 | 19572.200000 | 19330.410000 | 2.943258e+04 | Bitcoin | BTC |
1 | 2022-10-25 | 19240.760000 | 20420.880000 | 19332.110000 | 20086.280000 | 4.245234e+04 | Bitcoin | BTC |
2 | 2022-10-26 | 20055.850000 | 21022.810000 | 20086.270000 | 20775.400000 | 4.361899e+04 | Bitcoin | BTC |
3 | 2022-10-27 | 20196.010000 | 20878.170000 | 20773.590000 | 20296.970000 | 3.412358e+04 | Bitcoin | BTC |
4 | 2022-10-28 | 20000.000000 | 20755.090000 | 20295.770000 | 20597.910000 | 2.958175e+04 | Bitcoin | BTC |
... | ... | ... | ... | ... | ... | ... | ... | ... |
2005 | 2023-05-08 | 0.000008 | 0.000009 | 0.000009 | 0.000009 | 1.680438e+12 | Shiba | SHIB |
2006 | 2023-05-09 | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.494224e+11 | Shiba | SHIB |
2007 | 2023-05-10 | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.374366e+11 | Shiba | SHIB |
2008 | 2023-05-11 | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.152456e+11 | Shiba | SHIB |
2009 | 2023-05-12 | 0.000008 | 0.000009 | 0.000009 | 0.000009 | 7.590283e+11 | Shiba | SHIB |
2010 rows × 8 columns
As we can see, the time column has been shifted over to become the leftmost column of the dataframe, with a default index taking over as the index.
top_10_recent.info()
<class 'pandas.core.frame.DataFrame'> RangeIndex: 2010 entries, 0 to 2009 Data columns (total 8 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 time 2010 non-null datetime64[ns] 1 low 2010 non-null float64 2 high 2010 non-null float64 3 open 2010 non-null float64 4 close 2010 non-null float64 5 volume 2010 non-null float64 6 Name 2010 non-null object 7 Ticker 2010 non-null object dtypes: datetime64[ns](1), float64(5), object(2) memory usage: 125.8+ KB
Now that we have shifted the time back into the dataframe, we can see that it appears as a regular column. Even better, it is already a datetime object, which saves us the trouble of converting it ourselves. Now all we need to do is change the types of the name and ticker columns.
top_10_recent[['Name', 'Ticker']] = top_10_recent[['Name', 'Ticker']].astype('string')
top_10_recent.info()
<class 'pandas.core.frame.DataFrame'> RangeIndex: 2010 entries, 0 to 2009 Data columns (total 8 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 time 2010 non-null datetime64[ns] 1 low 2010 non-null float64 2 high 2010 non-null float64 3 open 2010 non-null float64 4 close 2010 non-null float64 5 volume 2010 non-null float64 6 Name 2010 non-null string 7 Ticker 2010 non-null string dtypes: datetime64[ns](1), float64(5), string(2) memory usage: 125.8 KB
Nice! Now if we look at the types of the dataframe, we can see that the name and ticker columns are of type string as expected and the time column is a datetime object. All that is left now is to fix any inconsistencies in the data and rearrange the dataframe.
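For anyone unfamiliar with pandas' dedicated string dtype, the difference from the default object dtype is easy to see on a toy Series (the values here are just illustrative):

```python
import pandas as pd

# By default pandas stores text in a generic object column; astype('string')
# switches it to the dedicated string dtype, as done above for Name and Ticker.
s = pd.Series(['Bitcoin', 'Litecoin'])
print(s.dtype)                   # object
print(s.astype('string').dtype)  # string
```

The string dtype gives stricter type guarantees (only strings and missing values) than a catch-all object column.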
If you look at the historical dataframe that we read in and compare it with the data gathered for our top 10, there is a slight issue. In the historical dataframe the coin SHIB has its name registered as "Shiba Inu", whereas in our recent data it is just "Shiba". To be able to join our dataframes successfully, and to avoid issues later when accessing the data for this cryptocurrency, we will rename the field here to "Shiba Inu" as well. We will use the replace
function in pandas to do this.
Additionally, the column names do not look consistent since some are capitalized while others are not. To fix this we will rename the columns with capitalization and rename the time column to Date, as that is more accurate. We will then rearrange the columns into a more logical order using the pandas iloc
function.
# Changing instances of Shiba in the dataframe to Shiba Inu
top_10_recent = top_10_recent.replace('Shiba', 'Shiba Inu')
# Reassigning columns attribute of dataframe so that the column names are all capitalized.
top_10_recent.columns = ['Date', 'Low', 'High', 'Open', 'Close', 'Volume', 'Name', 'Ticker']
# Using the iloc function to get the columns and put them in a more logical order. Numbers correspond to the index
# of the column in terms of the list of column names passed in above.
top_10_recent = top_10_recent.iloc[:, [0,6,7,3,2,1,4,5]]
top_10_recent
Date | Name | Ticker | Open | High | Low | Close | Volume | |
---|---|---|---|---|---|---|---|---|
0 | 2022-10-24 | Bitcoin | BTC | 19572.200000 | 19603.570000 | 19159.350000 | 19330.410000 | 2.943258e+04 |
1 | 2022-10-25 | Bitcoin | BTC | 19332.110000 | 20420.880000 | 19240.760000 | 20086.280000 | 4.245234e+04 |
2 | 2022-10-26 | Bitcoin | BTC | 20086.270000 | 21022.810000 | 20055.850000 | 20775.400000 | 4.361899e+04 |
3 | 2022-10-27 | Bitcoin | BTC | 20773.590000 | 20878.170000 | 20196.010000 | 20296.970000 | 3.412358e+04 |
4 | 2022-10-28 | Bitcoin | BTC | 20295.770000 | 20755.090000 | 20000.000000 | 20597.910000 | 2.958175e+04 |
... | ... | ... | ... | ... | ... | ... | ... | ... |
2005 | 2023-05-08 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000008 | 0.000009 | 1.680438e+12 |
2006 | 2023-05-09 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.494224e+11 |
2007 | 2023-05-10 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.374366e+11 |
2008 | 2023-05-11 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.152456e+11 |
2009 | 2023-05-12 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000008 | 0.000009 | 7.590283e+11 |
2010 rows × 8 columns
Much better. Now our recent data is organized and ready for combining into the historical frame, but before we can do that we must clean the historical dataframe.
historical_data_df
Unnamed: 0 | open | high | low | close | volume | marketCap | timestamp | crypto_name | date | |
---|---|---|---|---|---|---|---|---|---|---|
0 | 0 | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 1.288693e+09 | 2013-05-05T23:59:59.999Z | Bitcoin | 2013-05-05 |
1 | 1 | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 | 6.229819e+07 | 2013-05-05T23:59:59.999Z | Litecoin | 2013-05-05 |
2 | 2 | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 1.249023e+09 | 2013-05-06T23:59:59.999Z | Bitcoin | 2013-05-06 |
3 | 3 | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 | 5.859436e+07 | 2013-05-06T23:59:59.999Z | Litecoin | 2013-05-06 |
4 | 4 | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 1.240594e+09 | 2013-05-07T23:59:59.999Z | Bitcoin | 2013-05-07 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
72941 | 72941 | 0.022604 | 0.022988 | 0.022197 | 0.022796 | 4.040134e+07 | 1.652957e+09 | 2022-10-23T23:59:59.999Z | VeChain | 2022-10-23 |
72942 | 72942 | 1.468244 | 1.530464 | 1.435415 | 1.517878 | 2.844351e+07 | 1.572825e+09 | 2022-10-23T23:59:59.999Z | Flow | 2022-10-23 |
72943 | 72943 | 4.950431 | 5.148565 | 4.945280 | 5.117206 | 1.069497e+08 | 1.559551e+09 | 2022-10-23T23:59:59.999Z | Filecoin | 2022-10-23 |
72944 | 72944 | 0.000233 | 0.000243 | 0.000226 | 0.000239 | 2.143268e+08 | 1.576291e+09 | 2022-10-23T23:59:59.999Z | Terra Classic | 2022-10-23 |
72945 | 72945 | 0.465490 | 0.471006 | 0.453438 | 0.469033 | 9.509743e+08 | 2.339868e+10 | 2022-10-23T23:59:59.999Z | XRP | 2022-10-23 |
72946 rows × 10 columns
As we can see, there are a couple of things that we need to do to this dataframe before it is ready to be put together with the more recent data. So let's get to it!
If we look at the dataframe, there are a couple of columns that serve no purpose. The Unnamed: 0 column is of no use to us since it holds the exact same values as the index. The timestamp column also adds nothing, as we do not need exact timestamp data for our analysis. We will remove these columns in a similar fashion to how we handled the recent data.
historical_data_df = historical_data_df.drop(columns=['Unnamed: 0', 'timestamp'])
historical_data_df
open | high | low | close | volume | marketCap | crypto_name | date | |
---|---|---|---|---|---|---|---|---|
0 | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 1.288693e+09 | Bitcoin | 2013-05-05 |
1 | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 | 6.229819e+07 | Litecoin | 2013-05-05 |
2 | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 1.249023e+09 | Bitcoin | 2013-05-06 |
3 | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 | 5.859436e+07 | Litecoin | 2013-05-06 |
4 | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 1.240594e+09 | Bitcoin | 2013-05-07 |
... | ... | ... | ... | ... | ... | ... | ... | ... |
72941 | 0.022604 | 0.022988 | 0.022197 | 0.022796 | 4.040134e+07 | 1.652957e+09 | VeChain | 2022-10-23 |
72942 | 1.468244 | 1.530464 | 1.435415 | 1.517878 | 2.844351e+07 | 1.572825e+09 | Flow | 2022-10-23 |
72943 | 4.950431 | 5.148565 | 4.945280 | 5.117206 | 1.069497e+08 | 1.559551e+09 | Filecoin | 2022-10-23 |
72944 | 0.000233 | 0.000243 | 0.000226 | 0.000239 | 2.143268e+08 | 1.576291e+09 | Terra Classic | 2022-10-23 |
72945 | 0.465490 | 0.471006 | 0.453438 | 0.469033 | 9.509743e+08 | 2.339868e+10 | XRP | 2022-10-23 |
72946 rows × 8 columns
Now that we got rid of the columns, the next thing is to make sure that the columns are of the right type. We can take a look at their types using the info
function.
historical_data_df.info()
<class 'pandas.core.frame.DataFrame'> RangeIndex: 72946 entries, 0 to 72945 Data columns (total 8 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 open 72946 non-null float64 1 high 72946 non-null float64 2 low 72946 non-null float64 3 close 72946 non-null float64 4 volume 72946 non-null float64 5 marketCap 72946 non-null float64 6 crypto_name 72946 non-null object 7 date 72946 non-null object dtypes: float64(6), object(2) memory usage: 4.5+ MB
As we can see from the dataframe's information, the date column appears as a pandas object. We would like this to be a datetime object, so we will convert it using the pandas function to_datetime
. Additionally, we would like the crypto_name column to be a string.
historical_data_df['date'] = pd.to_datetime(historical_data_df['date'])
historical_data_df['crypto_name'] = historical_data_df['crypto_name'].astype('string')
historical_data_df.info()
<class 'pandas.core.frame.DataFrame'> RangeIndex: 72946 entries, 0 to 72945 Data columns (total 8 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 open 72946 non-null float64 1 high 72946 non-null float64 2 low 72946 non-null float64 3 close 72946 non-null float64 4 volume 72946 non-null float64 5 marketCap 72946 non-null float64 6 crypto_name 72946 non-null string 7 date 72946 non-null datetime64[ns] dtypes: datetime64[ns](1), float64(6), string(1) memory usage: 4.5 MB
As we can see now, the date column is of type datetime and the crypto_name column is of type string. This is all we need to do in terms of fixing the dtypes of our dataframe. Now it is time to get rid of unnecessary data in our dataframe.
Now that we have the types sorted out and the useless columns removed, we can filter the dataframe so that it only contains the data for our top 10 cryptocurrencies. To do this we will get the names of our top 10 cryptocurrencies and then keep only the rows whose name appears in that list. The filtering condition will be handled by the pandas isin
function.
# Using list comprehension to get the names of the top 10
name_list = [name for name,ticker in top_10_list]
# Accounting for the inconsistency in name
name_list[-1] = 'Shiba Inu'
# Using the pandas isin function to keep only the rows belonging to our top 10
historical_data_df = historical_data_df[historical_data_df['crypto_name'].isin(name_list)]
historical_data_df
open | high | low | close | volume | marketCap | crypto_name | date | |
---|---|---|---|---|---|---|---|---|
0 | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 1.288693e+09 | Bitcoin | 2013-05-05 |
1 | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 | 6.229819e+07 | Litecoin | 2013-05-05 |
2 | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 1.249023e+09 | Bitcoin | 2013-05-06 |
3 | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 | 5.859436e+07 | Litecoin | 2013-05-06 |
4 | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 1.240594e+09 | Bitcoin | 2013-05-07 |
... | ... | ... | ... | ... | ... | ... | ... | ... |
72923 | 28.013676 | 29.331540 | 27.857959 | 29.270071 | 6.331571e+08 | 1.048962e+10 | Solana | 2022-10-23 |
72924 | 0.000010 | 0.000010 | 0.000010 | 0.000010 | 1.138769e+08 | 5.573157e+09 | Shiba Inu | 2022-10-23 |
72928 | 0.832370 | 0.901422 | 0.822506 | 0.899837 | 3.701980e+08 | 7.859466e+09 | Polygon | 2022-10-23 |
72929 | 5.847780 | 5.968046 | 5.776710 | 5.960239 | 2.014905e+08 | 6.731207e+09 | Polkadot | 2022-10-23 |
72935 | 52.181555 | 53.950366 | 51.944883 | 53.950366 | 3.446915e+08 | 3.854806e+09 | Litecoin | 2022-10-23 |
19143 rows × 8 columns
Nice, we have drastically reduced the size of our dataframe, from roughly 73,000 rows down to about 19,000. This will make future operations less resource intensive. Now that we have the content that we would like to focus on, let's move on and carry out the next step in cleaning the data.
Now that our types are correct and we have filtered the data accordingly, we can add the column that we are missing which is the ticker information. After that, we will rename the columns for naming consistency and rearrange the columns to be in a more logical order.
# Fix discrepancy mistake
top_10_list[-1] = ('Shiba Inu', 'SHIB')
# Set up dictionary mapping names to tickers
name_to_ticker_dict = {}
# Inserting into dictionary
for name, ticker in top_10_list:
    name_to_ticker_dict[name] = ticker
# Adding column to dataframe w/ temp values
historical_data_df.insert(0, 'Ticker', np.nan)
# Setting ticker values for the dataframe
for index, row in historical_data_df.iterrows():
    historical_data_df.at[index, 'Ticker'] = name_to_ticker_dict[historical_data_df.at[index, 'crypto_name']]
historical_data_df
Ticker | open | high | low | close | volume | marketCap | crypto_name | date | |
---|---|---|---|---|---|---|---|---|---|
0 | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 1.288693e+09 | Bitcoin | 2013-05-05 |
1 | LTC | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 | 6.229819e+07 | Litecoin | 2013-05-05 |
2 | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 1.249023e+09 | Bitcoin | 2013-05-06 |
3 | LTC | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 | 5.859436e+07 | Litecoin | 2013-05-06 |
4 | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 1.240594e+09 | Bitcoin | 2013-05-07 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
72923 | SOL | 28.013676 | 29.331540 | 27.857959 | 29.270071 | 6.331571e+08 | 1.048962e+10 | Solana | 2022-10-23 |
72924 | SHIB | 0.000010 | 0.000010 | 0.000010 | 0.000010 | 1.138769e+08 | 5.573157e+09 | Shiba Inu | 2022-10-23 |
72928 | MATIC | 0.832370 | 0.901422 | 0.822506 | 0.899837 | 3.701980e+08 | 7.859466e+09 | Polygon | 2022-10-23 |
72929 | DOT | 5.847780 | 5.968046 | 5.776710 | 5.960239 | 2.014905e+08 | 6.731207e+09 | Polkadot | 2022-10-23 |
72935 | LTC | 52.181555 | 53.950366 | 51.944883 | 53.950366 | 3.446915e+08 | 3.854806e+09 | Litecoin | 2022-10-23 |
19143 rows × 9 columns
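As an aside, the same ticker assignment can be done without an explicit iterrows loop: pandas' Series.map performs the dictionary lookup in one vectorized pass, which is typically much faster on large frames. A minimal sketch on a toy frame (the column name mirrors the real one above):

```python
import pandas as pd

# Toy frame mirroring the crypto_name column of the historical data.
df = pd.DataFrame({'crypto_name': ['Bitcoin', 'Litecoin', 'Bitcoin']})
name_to_ticker = {'Bitcoin': 'BTC', 'Litecoin': 'LTC'}

# Series.map looks every name up in the dictionary at once,
# avoiding row-by-row iteration entirely.
df.insert(0, 'Ticker', df['crypto_name'].map(name_to_ticker))
print(df['Ticker'].tolist())  # ['BTC', 'LTC', 'BTC']
```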
We now have the ticker column, so let's rearrange the columns and change the naming so it looks better.
historical_data_df.columns = ['Ticker', 'Open', 'High', 'Low', 'Close', 'Volume', 'Market Cap.', 'Name', 'Date']
historical_data_df = historical_data_df.iloc[:, [8,7,0,1,2,3,4,5,6]]
historical_data_df
Date | Name | Ticker | Open | High | Low | Close | Volume | Market Cap. | |
---|---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 1.288693e+09 |
1 | 2013-05-05 | Litecoin | LTC | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 | 6.229819e+07 |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 1.249023e+09 |
3 | 2013-05-06 | Litecoin | LTC | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 | 5.859436e+07 |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 1.240594e+09 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
72923 | 2022-10-23 | Solana | SOL | 28.013676 | 29.331540 | 27.857959 | 29.270071 | 6.331571e+08 | 1.048962e+10 |
72924 | 2022-10-23 | Shiba Inu | SHIB | 0.000010 | 0.000010 | 0.000010 | 0.000010 | 1.138769e+08 | 5.573157e+09 |
72928 | 2022-10-23 | Polygon | MATIC | 0.832370 | 0.901422 | 0.822506 | 0.899837 | 3.701980e+08 | 7.859466e+09 |
72929 | 2022-10-23 | Polkadot | DOT | 5.847780 | 5.968046 | 5.776710 | 5.960239 | 2.014905e+08 | 6.731207e+09 |
72935 | 2022-10-23 | Litecoin | LTC | 52.181555 | 53.950366 | 51.944883 | 53.950366 | 3.446915e+08 | 3.854806e+09 |
19143 rows × 9 columns
top_10_recent
Date | Name | Ticker | Open | High | Low | Close | Volume | |
---|---|---|---|---|---|---|---|---|
0 | 2022-10-24 | Bitcoin | BTC | 19572.200000 | 19603.570000 | 19159.350000 | 19330.410000 | 2.943258e+04 |
1 | 2022-10-25 | Bitcoin | BTC | 19332.110000 | 20420.880000 | 19240.760000 | 20086.280000 | 4.245234e+04 |
2 | 2022-10-26 | Bitcoin | BTC | 20086.270000 | 21022.810000 | 20055.850000 | 20775.400000 | 4.361899e+04 |
3 | 2022-10-27 | Bitcoin | BTC | 20773.590000 | 20878.170000 | 20196.010000 | 20296.970000 | 3.412358e+04 |
4 | 2022-10-28 | Bitcoin | BTC | 20295.770000 | 20755.090000 | 20000.000000 | 20597.910000 | 2.958175e+04 |
... | ... | ... | ... | ... | ... | ... | ... | ... |
2005 | 2023-05-08 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000008 | 0.000009 | 1.680438e+12 |
2006 | 2023-05-09 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.494224e+11 |
2007 | 2023-05-10 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.374366e+11 |
2008 | 2023-05-11 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000009 | 0.000009 | 9.152456e+11 |
2009 | 2023-05-12 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000008 | 0.000009 | 7.590283e+11 |
2010 rows × 8 columns
Great! As we can see both of our OHLCV data components are prepped and ready to put together. Now we can go ahead and do that.
# Putting together two data sources
final_df = pd.concat([historical_data_df, top_10_recent])
# Sorting the combined dataset first by date and then by name within organized dates
final_df.sort_values(by=['Date', 'Name'], inplace=True)
# Since market capitalization data is missing in our more recent data, we can get rid of the column as it is
# of no use to us if it isn't complete
final_df = final_df.drop(columns=['Market Cap.'])
final_df
Date | Name | Ticker | Open | High | Low | Close | Volume | |
---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 |
1 | 2013-05-05 | Litecoin | LTC | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 |
3 | 2013-05-06 | Litecoin | LTC | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 |
... | ... | ... | ... | ... | ... | ... | ... | ... |
1607 | 2023-05-12 | Polkadot | DOT | 5.285000 | 5.314000 | 5.120000 | 5.264000 | 7.401615e+05 |
1406 | 2023-05-12 | Polygon | MATIC | 0.841100 | 0.874100 | 0.818800 | 0.850800 | 1.865495e+07 |
2009 | 2023-05-12 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000008 | 0.000009 | 7.590283e+11 |
1205 | 2023-05-12 | Solana | SOL | 20.180000 | 20.750000 | 19.810000 | 20.620000 | 1.044406e+06 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 |
21153 rows × 8 columns
We now have our final dataset! The next step is to take this completed dataset and carry out some analysis and visualization to get a better understanding of the data.
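One thing worth noting: pd.concat keeps each source frame's original index, which is why row labels like 1607 and 2009 reappear out of order in the output above. If a clean sequential index is ever needed, reset_index(drop=True) (or concat's ignore_index=True option) renumbers the rows. A quick sketch with toy frames:

```python
import pandas as pd

# Each source frame keeps its own index through concat, so labels repeat.
a = pd.DataFrame({'x': [1, 2]})  # index 0, 1
b = pd.DataFrame({'x': [3, 4]})  # index 0, 1 again
combined = pd.concat([a, b])
print(combined.index.tolist())    # [0, 1, 0, 1]

# reset_index(drop=True) renumbers the rows into a single 0..n-1 range.
renumbered = combined.reset_index(drop=True)
print(renumbered.index.tolist())  # [0, 1, 2, 3]
```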
In this part of the data lifecycle, we really focus on manipulating the data to understand how it ties together and the structure that exists within it. To do this we are going to do a couple things. We will focus on calculating quantities that will help us better understand the data and then visualize the data through different representations and formats.
In this portion, we utilize a library called Plotly to generate our plots. To learn more about the library click here.
The first thing that we should do is make a copy and execute our actions on that copy, just in case we want the original version of our final dataset at any point.
# creating a copy just in case dataset gets messed up and original is needed.
final_cp = final_df.copy()
final_cp
Date | Name | Ticker | Open | High | Low | Close | Volume | |
---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 |
1 | 2013-05-05 | Litecoin | LTC | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 |
3 | 2013-05-06 | Litecoin | LTC | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 |
... | ... | ... | ... | ... | ... | ... | ... | ... |
1607 | 2023-05-12 | Polkadot | DOT | 5.285000 | 5.314000 | 5.120000 | 5.264000 | 7.401615e+05 |
1406 | 2023-05-12 | Polygon | MATIC | 0.841100 | 0.874100 | 0.818800 | 0.850800 | 1.865495e+07 |
2009 | 2023-05-12 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000008 | 0.000009 | 7.590283e+11 |
1205 | 2023-05-12 | Solana | SOL | 20.180000 | 20.750000 | 19.810000 | 20.620000 | 1.044406e+06 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 |
21153 rows × 8 columns
This is referred to as OHLCV data, representing Open, High, Low, Close, and Volume over a set interval for an asset, and the most natural way to visualize it is through what is known as an OHLC chart. We will do this first to get a basic understanding of what this data looks like. We will generate an OHLC chart for each of our 10 cryptocurrencies, since the time interval covered by the data differs from coin to coin and a single aggregated chart would not do justice to each coin's behavior.
Just a warning in advance: this might take some time to render, as there is a lot of data in graphs with many features and sharp display. It is normal for the charts to take a couple of minutes to show up, so we advise waiting up to 5 minutes before checking whether there are any issues.
for name in name_list:
    temp_df = final_cp[final_cp['Name'] == name]
    trace = go.Ohlc(x=temp_df['Date'], open=temp_df['Open'], high=temp_df['High'], low=temp_df['Low'],
                    close=temp_df['Close'])
    fig = go.Figure(data=trace)
    fig.update_layout(
        title=f"OHLC for {name} Over Time",
        xaxis_title='Year', yaxis_title='Price per Coin (USD)')
    fig.show()
Taking a look at these graphs, we can see that they all have a huge peak followed by a sharp drop, and are now holding at lower levels closer to the present day. For all of these currencies, the surge and peak appears to fall somewhere around 2021-2022.
This makes sense given that there was a huge cryptocurrency popularity surge around that time due to a multitude of factors. Here is an article around that time talking about key crypto moments in 2021 by CNBC. Another article to check out around that time is a specific analysis on the trends of Bitcoin in that timeframe by Outlook.
This goes to show that there might be some correlating factors worth examining. To see the general trend with less of this volatility, we can plot each cryptocurrency's average price over time.
We can calculate the average price on a day by just taking the mean of the open and close price for that date:
$$\Large avg = \frac{open + close}{2} $$

final_cp.insert(8, 'Average', np.nan)
final_cp['Average'] = (final_cp['Open'] + final_cp['Close']) / 2
final_cp
Date | Name | Ticker | Open | High | Low | Close | Volume | Average | |
---|---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 114.405003 |
1 | 2013-05-05 | Litecoin | LTC | 3.493130 | 3.692460 | 3.346060 | 3.590890 | 0.000000e+00 | 3.542010 |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 114.140003 |
3 | 2013-05-06 | Litecoin | LTC | 3.594220 | 3.781020 | 3.116020 | 3.371250 | 0.000000e+00 | 3.482735 |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 111.875000 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
1607 | 2023-05-12 | Polkadot | DOT | 5.285000 | 5.314000 | 5.120000 | 5.264000 | 7.401615e+05 | 5.274500 |
1406 | 2023-05-12 | Polygon | MATIC | 0.841100 | 0.874100 | 0.818800 | 0.850800 | 1.865495e+07 | 0.845950 |
2009 | 2023-05-12 | Shiba Inu | SHIB | 0.000009 | 0.000009 | 0.000008 | 0.000009 | 7.590283e+11 | 0.000009 |
1205 | 2023-05-12 | Solana | SOL | 20.180000 | 20.750000 | 19.810000 | 20.620000 | 1.044406e+06 | 20.400000 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 | 1.000350 |
21153 rows × 9 columns
Nice, now we have calculated the average price per day in USD. We can go ahead and plot these values for our 10 cryptocurrencies once again and see what they show us. This time, we will put them all on the same graph so we can view their growth relative to each other.
# Using plotly express to create the graph
fig = px.line(final_cp, x='Date', y='Average', color='Name', symbol='Ticker')
# adding title and labeling axis
fig.update_layout(title=f"Average Price Over Time", xaxis_title='Year', yaxis_title='Price per Coin (USD)')
fig.show()
Okay, it looks like Bitcoin's change relative to the others was immense, which is expected given the values in our dataset. Ethereum's trend is also somewhat visible. To better see any correlation among the rest, it is better to exclude Bitcoin and Ethereum, since their scale dwarfs everything else.
# Coins to exclude
remove = ['Bitcoin', 'Ethereum']
# Keeping rows that do not have information pertaining to Bitcoin or Ethereum
final_cp_2 = final_cp[~final_cp['Name'].isin(remove)]
# Plotting remaining data
fig = px.line(final_cp_2, x='Date', y='Average', color='Name', symbol='Ticker')
# Setting plot title and axis labels
fig.update_layout(title=f"Average Price Over Time", xaxis_title='Year', yaxis_title='Price per Coin (USD)')
fig.show()
Interestingly, with Bitcoin and Ethereum excluded, it appears that Litecoin, Solana, and Polkadot show much more relative growth than Cardano, Dogecoin, Tether, Shiba Inu, and Polygon. This makes sense: Litecoin is based on the Bitcoin protocol, so the mass popularity around Bitcoin would logically spill over to it, while Solana and Polkadot are both successful products built on aspects of blockchain technology, hence the growth in their value.
The results for Dogecoin and Shiba Inu are expected given that they are considered "meme coins". It also makes sense that Tether does not shift much, as it is a stablecoin. The same logic applies to Cardano: it is a proof-of-stake blockchain platform founded back in 2017, so its market share is not as massive as Ethereum's. Finally, Polygon is a tool for Ethereum scaling, which explains why its growth is limited, since its scope is much narrower than Bitcoin's.
Overall, the trend is that massive fluctuations belong to the more popular coins backed by successful technologies, which fits the volatile popularity and shifting economy we have witnessed over the past couple of years in the aftermath of COVID-19. Other coins have held their own without drastic changes simply because they are newer and smaller in scale. Coins whose value swings much more widely introduce a bias that makes the smaller trends hard to read.
To further confirm and corroborate this idea, we can take a look at some simple moving averages to see whether they could be good predictors of cryptocurrency changes. A simple moving average is just the average of a selected range of prices over the number of periods in that range. In our case we will calculate a few of them, using our average price as the value summed over each range. The formula we will be using is the following:
$$\Large SMA = \frac{A_1 + A_2 + A_3 + ... + A_n}{n} $$

Note that in this case n is the number of periods in the range.
We will plot a 25, 50, and 100 day simple moving average and see how it correlates with the change of a cryptocurrency.
# reordering for calculation of SMA's
final_cp = final_cp.sort_values(['Name', 'Date'])
# calculating SMA's
final_cp['SMA25'] = final_cp.groupby('Name')['Average'].rolling(window = 25).mean().reset_index(0, drop=True)
final_cp['SMA50'] = final_cp.groupby('Name')['Average'].rolling(window = 50).mean().reset_index(0, drop=True)
final_cp['SMA100'] = final_cp.groupby('Name')['Average'].rolling(window = 100).mean().reset_index(0, drop=True)
for name in name_list:
    fig = make_subplots(rows=1, cols=1)
    # Filtering to only the data for the coin we are currently looking at
    filtered_df = (final_cp[final_cp['Name'] == name]).copy()
    # Creating graph components for each line
    trace1 = go.Scatter(x=filtered_df['Date'], y=filtered_df['Average'], name="Average")
    trace2 = go.Scatter(x=filtered_df['Date'], y=filtered_df['SMA25'], name="SMA25")
    trace3 = go.Scatter(x=filtered_df['Date'], y=filtered_df['SMA50'], name="SMA50")
    trace4 = go.Scatter(x=filtered_df['Date'], y=filtered_df['SMA100'], name="SMA100")
    # Putting the lines onto the figure
    fig.add_trace(trace1)
    fig.add_trace(trace2)
    fig.add_trace(trace3)
    fig.add_trace(trace4)
    # Setting title and axis labels
    fig.update_layout(title=f"Price of {name} with 25, 50, and 100 day SMAs",
                      xaxis_title="Date", yaxis_title="Price per Coin (USD)")
    fig.show()
Okay, we have now graphed our 10 cryptocurrencies with their 25, 50, and 100 day simple moving averages. A common pattern is that when the averages intersect and start moving together, and the slower averages move more sharply than usual, an extreme shift in either direction tends to follow. There is clearly some correlation between changes in a moving average and shifts in a cryptocurrency's price.
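The crossover behavior described above can also be detected programmatically rather than by eye. Below is a minimal sketch, assuming a frame with SMA25 and SMA50 columns like ours; the values here are made up purely for illustration.

```python
import pandas as pd

# Hypothetical mini-frame standing in for one coin's SMA columns
# (values are made up for illustration).
df = pd.DataFrame({
    'SMA25': [10, 11, 12, 13, 12, 11],
    'SMA50': [12, 12, 12, 12, 12, 12],
})

# A crossover ("golden cross") occurs where the faster average
# moves from below the slower average to above it.
above = df['SMA25'] > df['SMA50']
crosses_up = above & ~above.shift(fill_value=False)
print(crosses_up.tolist())  # → [False, False, False, True, False, False]
```

The same mask with the comparison flipped would flag "death cross" points where the faster average drops below the slower one.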
Another factor that should let us see trends more clearly is growth, which evaluates the change in value relative to itself rather than the absolute value. Cryptocurrencies showing strong growth indicate popularity and good performance without being skewed by price, and that is exactly what we are after: finding assets with good growth so that we can invest in them. To calculate growth, we can use the following formula:
$$\Large Growth = (\frac{Close}{Open} - 1) * 100 $$

# generating new column filled with NaN
final_cp.insert(12, 'Growth', np.nan)
# formula for calculating growth
final_cp['Growth'] = ((final_cp['Close'] / final_cp['Open']) - 1) * 100
final_cp
Date | Name | Ticker | Open | High | Low | Close | Volume | Average | SMA25 | SMA50 | SMA100 | Growth | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 114.405003 | NaN | NaN | NaN | 2.666078 |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 114.140003 | NaN | NaN | NaN | -3.172961 |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 111.875000 | NaN | NaN | NaN | -0.668151 |
7 | 2013-05-08 | Bitcoin | BTC | 109.599998 | 115.779999 | 109.599998 | 113.566002 | 0.000000e+00 | 111.583000 | NaN | NaN | NaN | 3.618616 |
9 | 2013-05-09 | Bitcoin | BTC | 113.199997 | 113.459999 | 109.260002 | 112.669998 | 0.000000e+00 | 112.934998 | NaN | NaN | NaN | -0.468197 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
598 | 2023-05-08 | Tether | USDT | 1.001390 | 1.001660 | 1.000600 | 1.000840 | 1.071410e+08 | 1.001115 | 1.000535 | 1.000755 | 1.000828 | -0.054924 |
599 | 2023-05-09 | Tether | USDT | 1.000840 | 1.001770 | 1.000290 | 1.000540 | 7.751265e+07 | 1.000690 | 1.000522 | 1.000702 | 1.000834 | -0.029975 |
600 | 2023-05-10 | Tether | USDT | 1.000540 | 1.000870 | 1.000200 | 1.000790 | 1.013193e+08 | 1.000665 | 1.000512 | 1.000648 | 1.000840 | 0.024987 |
601 | 2023-05-11 | Tether | USDT | 1.000780 | 1.000790 | 1.000000 | 1.000430 | 9.465740e+07 | 1.000605 | 1.000504 | 1.000602 | 1.000845 | -0.034973 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 | 1.000350 | 1.000489 | 1.000562 | 1.000848 | -0.013994 |
21153 rows × 13 columns
Now that we have growth calculated, let us plot it over time for all of the cryptocurrencies we are looking at, so that we can compare the scale of growth in each rather than the raw price. To do this we can just use plotly express.
# Generating growth over time graph for all of the cryptocurrencies we are looking at
fig = px.line(final_cp, x='Date', y='Growth', color='Name', symbol='Ticker')
fig.update_layout(title="Growth of Cryptocurrencies Over Time",
                  xaxis_title="Date", yaxis_title="Growth (%)")
fig.show()
Looking at this graph, surprisingly, the cryptocurrency with the largest growth during the crypto surge was actually Shiba Inu rather than Bitcoin. Although a single Bitcoin was worth far more, someone who invested enough into Shiba Inu at the right time would have seen profits that dwarfed those made in Bitcoin. In general, each of these currencies hit a growth peak at some point, came back down, and then fluctuated slightly here and there. The more stable growth belongs to coins like Bitcoin or Ethereum. Higher prices seem to indicate more stability, so there might be a correlation between price and growth beyond the obvious connotation linking the two.
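To pin down which coin peaked when, one could pull each coin's single best growth day with a groupby. A minimal sketch on a toy frame shaped like our Name/Date/Growth columns (the values below are made up):

```python
import pandas as pd

# Toy frame shaped like our Name/Date/Growth columns (values made up).
df = pd.DataFrame({
    'Name': ['Bitcoin', 'Bitcoin', 'Shiba Inu', 'Shiba Inu'],
    'Date': pd.to_datetime(['2021-01-01', '2021-11-09', '2021-05-01', '2021-10-27']),
    'Growth': [4.2, -2.0, 30.0, 45.0],
})

# idxmax gives the row index of each coin's largest daily growth,
# and .loc pulls those rows back out of the frame.
peaks = df.loc[df.groupby('Name')['Growth'].idxmax()]
print(peaks['Growth'].tolist())  # → [4.2, 45.0]
```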
Another aspect worth looking at is the relationship between volume and growth. In theory at least, it makes sense that price would shift if a lot of coins are sold or purchased: a spike in volume could mean a coin has lost a lot of profitability and people are rushing to sell, or the reverse, where a cryptocurrency is doing extremely well and people are rushing to buy in.
final_cp['Volume']
0      0.000000e+00
2      0.000000e+00
4      0.000000e+00
7      0.000000e+00
9      0.000000e+00
           ...
598    1.071410e+08
599    7.751265e+07
600    1.013193e+08
601    9.465740e+07
602    8.327807e+07
Name: Volume, Length: 21153, dtype: float64
Looking at the data here, we can see that the volume quantity grows to extremely large sizes. If we want to keep things close in value we need to figure out some sort of scaling transformation or calculation to apply to volume traded so that we can see any possible trend.
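As a hedged sketch of the kinds of scaling one might reach for here, percentage change and a log transform are two common options; the series values below are made up, and this is only an illustration of the idea, not the transformation the analysis settles on.

```python
import numpy as np
import pandas as pd

# Made-up volume figures spanning several orders of magnitude.
vol = pd.Series([1e3, 5e3, 1e8, 2e8], name='Volume')

# Percentage change measures each day relative to the previous one...
pct = vol.pct_change() * 100
# ...while log1p compresses the huge absolute range onto a tame scale.
log_vol = np.log1p(vol)
print(pct.tolist())  # first entry is NaN since there is no prior day
```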
If we think about it, what we really care about is not the raw amount of volume traded but rapid changes in it, and what happens to growth when they occur. In that case, we need the difference between the previous day's volume and the current day's. To do this we can just offset the column and take the difference.
# Resorting dataframe for easier calculation of volume changed
final_cp = final_cp.sort_values(['Name', 'Date'])
final_cp['C_Volume'] = final_cp.groupby('Name')['Volume'].diff()
final_cp
Date | Name | Ticker | Open | High | Low | Close | Volume | Average | SMA25 | SMA50 | SMA100 | Growth | C_Volume | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 114.405003 | NaN | NaN | NaN | 2.666078 | NaN |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 114.140003 | NaN | NaN | NaN | -3.172961 | 0.00 |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 111.875000 | NaN | NaN | NaN | -0.668151 | 0.00 |
7 | 2013-05-08 | Bitcoin | BTC | 109.599998 | 115.779999 | 109.599998 | 113.566002 | 0.000000e+00 | 111.583000 | NaN | NaN | NaN | 3.618616 | 0.00 |
9 | 2013-05-09 | Bitcoin | BTC | 113.199997 | 113.459999 | 109.260002 | 112.669998 | 0.000000e+00 | 112.934998 | NaN | NaN | NaN | -0.468197 | 0.00 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
598 | 2023-05-08 | Tether | USDT | 1.001390 | 1.001660 | 1.000600 | 1.000840 | 1.071410e+08 | 1.001115 | 1.000535 | 1.000755 | 1.000828 | -0.054924 | 62362190.82 |
599 | 2023-05-09 | Tether | USDT | 1.000840 | 1.001770 | 1.000290 | 1.000540 | 7.751265e+07 | 1.000690 | 1.000522 | 1.000702 | 1.000834 | -0.029975 | -29628362.87 |
600 | 2023-05-10 | Tether | USDT | 1.000540 | 1.000870 | 1.000200 | 1.000790 | 1.013193e+08 | 1.000665 | 1.000512 | 1.000648 | 1.000840 | 0.024987 | 23806631.47 |
601 | 2023-05-11 | Tether | USDT | 1.000780 | 1.000790 | 1.000000 | 1.000430 | 9.465740e+07 | 1.000605 | 1.000504 | 1.000602 | 1.000845 | -0.034973 | -6661882.15 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 | 1.000350 | 1.000489 | 1.000562 | 1.000848 | -0.013994 | -11379326.46 |
21153 rows × 14 columns
Okay now that we have the change in the volume of coins traded with respect to the previous day, we can go ahead and make a plot of growth over volume change and see the trend to verify our results. To do this we will make a scatterplot using plotly.
# Generating scatterplot of data points
fig = px.scatter(final_cp, x='C_Volume', y='Growth', color='Name', symbol='Ticker')
# Adding title and axis labels
fig.update_layout(title="Growth of Cryptocurrencies over Volume Traded",
                  xaxis_title="Change in Volume of Coins Traded", yaxis_title="Growth (%)")
fig.show()
Wow, our hypothesis about changes in volume correlating with growth appears to be wrong. Apart from a few outliers that saw some profit on large volume swings, the density of the data sits near the origin of the graph. That is, positive growth most commonly occurs when the change in volume traded is minimal, with the tail leaning toward positive growth.
There may be some correlation between instability and large changes in volume, which makes a bit of sense, but the extremity of such situations seems to outweigh the gain; slow and steady appears to win the growth race.
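To put a number on this impression, one could compute the Pearson correlation between the volume-change and growth columns. A minimal sketch with made-up values standing in for C_Volume and Growth:

```python
import pandas as pd

# Made-up values standing in for the C_Volume and Growth columns.
df = pd.DataFrame({
    'C_Volume': [1.0e6, -2.0e6, 5.0e5, 3.0e6, -1.0e6],
    'Growth': [0.5, -0.3, 1.2, -0.8, 0.1],
})

# Pearson correlation; a value near 0 supports the "no strong
# linear link between volume swings and growth" reading.
r = df['C_Volume'].corr(df['Growth'])
print(round(r, 3))
```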
Another factor that we can calculate is the [Average True Range](https://www.wallstreetmojo.com/average-true-range/#:~:text=The%20ATR%20formula%20is%20%E2%80%9C%5B(,calculated%20on%2014%2Dday%20periods.), or ATR for short. ATR is a technical analysis indicator of market or price volatility. It captures how much an asset's price tends to move, helping an investor pick better times to trade and achieve consistency. In our case, we can use it to see the range in which a value can change and how it correlates with other measures of volatility like the change in volume traded.
We need several formulas to calculate ATR and they are below:
$$\Large TR = max[(H - L), \left\lvert H - C_p\right\rvert, \left\lvert L - C_p\right\rvert]$$

$$\Large ATR = \frac{1}{n}*\sum \limits_{i=1}^{n} TR_{i}$$

To calculate this, we will sort the dataset first by name and then by date, and then carry out the steps in this guide. We will be calculating a 14-day ATR, so our window for the moving average is 14.
# sorting dataset for groupby to work properly
final_cp = final_cp.sort_values(['Name', 'Date'])
# Calculating ranges and saving as column
final_cp['H-L'] = final_cp.groupby('Name').apply(lambda x: x['High'] - x['Low']).reset_index(0, drop=True)
final_cp['H-C1'] = final_cp.groupby('Name').apply(lambda x: np.abs(x['High'] -
x['Close'].shift())).reset_index(0, drop=True)
final_cp['L-C1'] = final_cp.groupby('Name').apply(lambda x: np.abs(x['Low'] -
x['Close'].shift())).reset_index(0, drop=True)
# Calculating the true range, which is the largest of the three ranges calculated before
final_cp['TR'] = final_cp.groupby('Name').apply(lambda x: np.max(pd.concat([x['H-L'], x['H-C1'], x['L-C1']], axis=1), axis=1)).reset_index(0, drop=True)
# We are calculating 14 day ATR
final_cp['ATR'] = final_cp.groupby('Name')['TR'].rolling(14).mean().reset_index(0, drop=True)
final_cp = final_cp.drop(columns=['H-L', 'H-C1', 'L-C1', 'TR'])
final_cp
Date | Name | Ticker | Open | High | Low | Close | Volume | Average | SMA25 | SMA50 | SMA100 | Growth | C_Volume | ATR | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 114.405003 | NaN | NaN | NaN | 2.666078 | NaN | NaN |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 114.140003 | NaN | NaN | NaN | -3.172961 | 0.00 | NaN |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 111.875000 | NaN | NaN | NaN | -0.668151 | 0.00 | NaN |
7 | 2013-05-08 | Bitcoin | BTC | 109.599998 | 115.779999 | 109.599998 | 113.566002 | 0.000000e+00 | 111.583000 | NaN | NaN | NaN | 3.618616 | 0.00 | NaN |
9 | 2013-05-09 | Bitcoin | BTC | 113.199997 | 113.459999 | 109.260002 | 112.669998 | 0.000000e+00 | 112.934998 | NaN | NaN | NaN | -0.468197 | 0.00 | NaN |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
598 | 2023-05-08 | Tether | USDT | 1.001390 | 1.001660 | 1.000600 | 1.000840 | 1.071410e+08 | 1.001115 | 1.000535 | 1.000755 | 1.000828 | -0.054924 | 62362190.82 | 0.001539 |
599 | 2023-05-09 | Tether | USDT | 1.000840 | 1.001770 | 1.000290 | 1.000540 | 7.751265e+07 | 1.000690 | 1.000522 | 1.000702 | 1.000834 | -0.029975 | -29628362.87 | 0.000922 |
600 | 2023-05-10 | Tether | USDT | 1.000540 | 1.000870 | 1.000200 | 1.000790 | 1.013193e+08 | 1.000665 | 1.000512 | 1.000648 | 1.000840 | 0.024987 | 23806631.47 | 0.000914 |
601 | 2023-05-11 | Tether | USDT | 1.000780 | 1.000790 | 1.000000 | 1.000430 | 9.465740e+07 | 1.000605 | 1.000504 | 1.000602 | 1.000845 | -0.034973 | -6661882.15 | 0.000916 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 | 1.000350 | 1.000489 | 1.000562 | 1.000848 | -0.013994 | -11379326.46 | 0.000886 |
21153 rows × 15 columns
Okay, now that we have ATR calculated, we can plot close prices against ATR to see the correlation between the two.
for name in name_list:
    # Filtering to only the data for the coin we are currently looking at
    filtered_df = (final_cp[final_cp['Name'] == name]).copy()
    fig = px.scatter(filtered_df, x='ATR', y='Close', trendline='ols')
    # Setting title and axis labels
    fig.update_layout(title=f"Close Price of {name} over ATR",
                      xaxis_title="ATR (USD)", yaxis_title="Price per Coin (USD)")
    fig.show()
Looking at these plots, there is clearly a strong correlation between ATR and close price. The OLS regression line covers the spread of the data quite well apart from a few outliers, with R^2 values ranging from 0.6 to 0.9, indicating that a good portion of the variance in the data is explained by the model. These graphs establish an important fact: the two are strongly correlated.
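The R^2 statistic that the OLS trendlines report can be recomputed by hand, which makes it clearer what the 0.6-0.9 range means. A minimal sketch with hypothetical ATR and close values (made up for illustration):

```python
import numpy as np

# Hypothetical ATR and close values for one coin (made up).
atr = np.array([1.0, 2.0, 3.0, 4.0, 5.0])
close = np.array([10.0, 14.0, 15.0, 22.0, 24.0])

# Fit a least-squares line, then compute R^2 as the share of
# variance in close explained by the fit.
slope, intercept = np.polyfit(atr, close, 1)
pred = slope * atr + intercept
ss_res = ((close - pred) ** 2).sum()
ss_tot = ((close - close.mean()) ** 2).sum()
r2 = 1 - ss_res / ss_tot
print(round(r2, 3))  # → 0.953
```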
Now that we have calculated ATR, we can calculate another indicator that is related to it and will help us understand our data better.
We will now look at ADX, the Average Directional Index, an extremely popular technical analysis indicator. ADX tells you whether your chart data is trending or ranging; in other words, how strong the trend in the data is. If we are on an upward trend, it tells us whether that trend is still going strong or is weakening toward a plateau or a drop in price. To calculate ADX, we need a couple of formulas.
$$\Large +DM = Current High - Previous High $$

$$\Large -DM = Previous Low - Current Low $$

$$\Large +DI = \frac{Smoothed(+DM)}{ATR}$$

$$\Large -DI = \frac{Smoothed(-DM)}{ATR}$$

$$\Large ADX = 100 * (\frac{\left\lvert +DI - (-DI) \right\rvert}{\left\lvert +DI + (-DI) \right\rvert})$$

Okay, now that we know our formulas and already have ATR, we will calculate ADX, starting with +/-DM and +/-DI since those are all that remain. We will reuse our 14-day ATR as the denominator and smooth the directional movement over a short 5-day window.
interval = 5
# Preparing dataset by sorting for groupby's
final_cp = final_cp.sort_values(['Name', 'Date'])
# Calculating positive and negative changes
final_cp['h_diff'] = final_cp.groupby('Name')['High'].diff()
final_cp['l_diff'] = final_cp.groupby('Name').apply(lambda x: x['Low'].shift() - x['Low']).reset_index(0, drop=True)
# Calculating the positive and negative directional movement
final_cp['+DM'] = final_cp.apply(lambda x: x['h_diff'] if x['h_diff'] > x['l_diff'] else 0, axis=1)
final_cp['-DM'] = final_cp.apply(lambda x: x['l_diff'] if x['l_diff'] > x['h_diff'] else 0, axis=1)
# Calculating Smoothed positive and negative directional movement
final_cp['+DM_s'] = final_cp.groupby('Name')['+DM'].rolling(interval).mean().reset_index(0, drop=True)
final_cp['-DM_s'] = final_cp.groupby('Name')['-DM'].rolling(interval).mean().reset_index(0, drop=True)
# Calculating positive and negative directional index
final_cp['+DI'] = final_cp['+DM_s'] / final_cp['ATR']
final_cp['-DI'] = final_cp['-DM_s'] / final_cp['ATR']
# Using formula, calculating ADX
final_cp['ADX'] = 100 * (np.abs(final_cp['+DI'] - final_cp['-DI']) / np.abs(final_cp['+DI'] + final_cp['-DI']))
final_cp = final_cp.drop(columns=['h_diff', 'l_diff', '+DM', '-DM', '+DM_s', '-DM_s', '+DI', '-DI'])
final_cp
Date | Name | Ticker | Open | High | Low | Close | Volume | Average | SMA25 | SMA50 | SMA100 | Growth | C_Volume | ATR | ADX | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 114.405003 | NaN | NaN | NaN | 2.666078 | NaN | NaN | NaN |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 114.140003 | NaN | NaN | NaN | -3.172961 | 0.00 | NaN | NaN |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 111.875000 | NaN | NaN | NaN | -0.668151 | 0.00 | NaN | NaN |
7 | 2013-05-08 | Bitcoin | BTC | 109.599998 | 115.779999 | 109.599998 | 113.566002 | 0.000000e+00 | 111.583000 | NaN | NaN | NaN | 3.618616 | 0.00 | NaN | NaN |
9 | 2013-05-09 | Bitcoin | BTC | 113.199997 | 113.459999 | 109.260002 | 112.669998 | 0.000000e+00 | 112.934998 | NaN | NaN | NaN | -0.468197 | 0.00 | NaN | NaN |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
598 | 2023-05-08 | Tether | USDT | 1.001390 | 1.001660 | 1.000600 | 1.000840 | 1.071410e+08 | 1.001115 | 1.000535 | 1.000755 | 1.000828 | -0.054924 | 62362190.82 | 0.001539 | 33.720930 |
599 | 2023-05-09 | Tether | USDT | 1.000840 | 1.001770 | 1.000290 | 1.000540 | 7.751265e+07 | 1.000690 | 1.000522 | 1.000702 | 1.000834 | -0.029975 | -29628362.87 | 0.000922 | 9.278351 |
600 | 2023-05-10 | Tether | USDT | 1.000540 | 1.000870 | 1.000200 | 1.000790 | 1.013193e+08 | 1.000665 | 1.000512 | 1.000648 | 1.000840 | 0.024987 | 23806631.47 | 0.000914 | 19.018405 |
601 | 2023-05-11 | Tether | USDT | 1.000780 | 1.000790 | 1.000000 | 1.000430 | 9.465740e+07 | 1.000605 | 1.000504 | 1.000602 | 1.000845 | -0.034973 | -6661882.15 | 0.000916 | 114.678899 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 | 1.000350 | 1.000489 | 1.000562 | 1.000848 | -0.013994 | -11379326.46 | 0.000886 | 122.857143 |
21153 rows × 16 columns
Now that we have calculated our ADX, we should plot it to see how it correlates with the other statistics we have. The most logical general approach is to plot it alongside the price averages, to see exactly how it lines up with whether a chart is trending or not.
for name in name_list:
    fig = make_subplots(specs=[[{"secondary_y": True}]])
    # Filtering to only the data for the coin we are currently looking at
    filtered_df = (final_cp[final_cp['Name'] == name]).copy()
    # Creating graph components for each line
    trace1 = go.Scatter(x=filtered_df['Date'], y=filtered_df['ADX'], name="ADX")
    trace2 = go.Scatter(x=filtered_df['Date'], y=filtered_df['Average'], name="Average")
    trace3 = go.Scatter(x=filtered_df['Date'], y=filtered_df['SMA25'], name="SMA25")
    trace4 = go.Scatter(x=filtered_df['Date'], y=filtered_df['SMA50'], name="SMA50")
    trace5 = go.Scatter(x=filtered_df['Date'], y=filtered_df['SMA100'], name="SMA100")
    # ADX goes on its own secondary axis since its scale differs from price
    fig.add_trace(trace1, secondary_y=True)
    fig.add_trace(trace2, secondary_y=False)
    fig.add_trace(trace3, secondary_y=False)
    fig.add_trace(trace4, secondary_y=False)
    fig.add_trace(trace5, secondary_y=False)
    # Setting title and axis labels
    fig.update_layout(title=f"Averages of {name} with ADX over Time",
                      xaxis_title="Date", yaxis_title="Price per Coin (USD)")
    fig.show()
Looking at the graphs, there appears to be no correlation between ADX and the average price, as the spikes in ADX do not line up with the changes in the price graph. They sparsely do in some cases, but not closely enough to count as a significant correlation. We can conclude that ADX is an important indicator and will be utilized in predictions, but we do not need to worry about correlations between potential independent parameters.
Another indicator that can give us more insight into the relations within our data is RSI, the Relative Strength Index. RSI is an important momentum indicator that is commonly used with OHLC charts. It measures the speed and magnitude of an asset's recent price changes to evaluate overvalued or undervalued conditions in the price of that asset. The formulas for RSI are as follows:
$$\Large RS = \frac{Average Gain}{Average Loss}$$

$$\Large RSI = 100 - \frac{100}{1 + RS}$$

We will calculate this in a similar manner to how we calculated ATR. Just like ATR, we will be calculating a 14-day RSI, so our interval is 14.
# Sorting dataset properly in order for groupby to work properly
final_cp = final_cp.sort_values(['Name', 'Date'])
# Calculating day-over-day close-price differences
final_cp['C_Close'] = final_cp.groupby('Name')['Close'].diff()
# Calculating the closing price difference up an down
final_cp['C_Close_Up'] = final_cp['C_Close'].clip(lower=0)
final_cp['C_Close_Down'] = -1 * final_cp['C_Close'].clip(upper=0)
# Calculating the Average Gain and Average Loss
final_cp['Avg_Up'] = final_cp.groupby('Name')['C_Close_Up'].rolling(14).mean().reset_index(0, drop=True)
final_cp['Avg_Down'] = final_cp.groupby('Name')['C_Close_Down'].rolling(14).mean().reset_index(0, drop=True)
# Using RSI formula and calculating
final_cp['RS'] = final_cp['Avg_Up'] / final_cp['Avg_Down']
final_cp['RSI'] = 100 - ( 100 / (1 + final_cp['RS']) )
final_cp = final_cp.drop(columns=['C_Close', 'C_Close_Up', 'C_Close_Down', 'Avg_Up', 'Avg_Down', 'RS'])
final_cp
Date | Name | Ticker | Open | High | Low | Close | Volume | Average | SMA25 | SMA50 | SMA100 | Growth | C_Volume | ATR | ADX | RSI | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 114.405003 | NaN | NaN | NaN | 2.666078 | NaN | NaN | NaN | NaN |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 114.140003 | NaN | NaN | NaN | -3.172961 | 0.00 | NaN | NaN | NaN |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 111.875000 | NaN | NaN | NaN | -0.668151 | 0.00 | NaN | NaN | NaN |
7 | 2013-05-08 | Bitcoin | BTC | 109.599998 | 115.779999 | 109.599998 | 113.566002 | 0.000000e+00 | 111.583000 | NaN | NaN | NaN | 3.618616 | 0.00 | NaN | NaN | NaN |
9 | 2013-05-09 | Bitcoin | BTC | 113.199997 | 113.459999 | 109.260002 | 112.669998 | 0.000000e+00 | 112.934998 | NaN | NaN | NaN | -0.468197 | 0.00 | NaN | NaN | NaN |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
598 | 2023-05-08 | Tether | USDT | 1.001390 | 1.001660 | 1.000600 | 1.000840 | 1.071410e+08 | 1.001115 | 1.000535 | 1.000755 | 1.000828 | -0.054924 | 62362190.82 | 0.001539 | 33.720930 | 58.581236 |
599 | 2023-05-09 | Tether | USDT | 1.000840 | 1.001770 | 1.000290 | 1.000540 | 7.751265e+07 | 1.000690 | 1.000522 | 1.000702 | 1.000834 | -0.029975 | -29628362.87 | 0.000922 | 9.278351 | 54.623656 |
600 | 2023-05-10 | Tether | USDT | 1.000540 | 1.000870 | 1.000200 | 1.000790 | 1.013193e+08 | 1.000665 | 1.000512 | 1.000648 | 1.000840 | 0.024987 | 23806631.47 | 0.000914 | 19.018405 | 54.329004 |
601 | 2023-05-11 | Tether | USDT | 1.000780 | 1.000790 | 1.000000 | 1.000430 | 9.465740e+07 | 1.000605 | 1.000504 | 1.000602 | 1.000845 | -0.034973 | -6661882.15 | 0.000916 | 114.678899 | 51.120163 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 | 1.000350 | 1.000489 | 1.000562 | 1.000848 | -0.013994 | -11379326.46 | 0.000886 | 122.857143 | 44.078947 |
21153 rows × 17 columns
Interestingly enough, the smaller coins appear to be much more heavily traded and frequently have RSI values below 30 or above 70, which indicate oversold or overbought positions. Big coins like Bitcoin, however, appear to have relatively stable RSIs. There might be some relation between RSI and Growth, as these results resemble those from plotting growth. We can plot both on a graph with scaled axes to see if there is any correlation between the two.
for name in name_list:
    fig = make_subplots(specs=[[{"secondary_y": True}]])
    # Filtering to only the data for the coin we are currently looking at
    filtered_df = (final_cp[final_cp['Name'] == name]).copy()
    # Creating graph components for each line
    trace1 = go.Scatter(x=filtered_df['Date'], y=filtered_df['Average'], name="Average")
    trace2 = go.Scatter(x=filtered_df['Date'], y=filtered_df['RSI'], name="RSI")
    trace3 = go.Scatter(x=filtered_df['Date'], y=filtered_df['High'], name="High")
    trace4 = go.Scatter(x=filtered_df['Date'], y=filtered_df['Low'], name="Low")
    # RSI goes on its own secondary axis since it is bounded between 0 and 100
    fig.add_trace(trace1, secondary_y=False)
    fig.add_trace(trace2, secondary_y=True)
    fig.add_trace(trace3, secondary_y=False)
    fig.add_trace(trace4, secondary_y=False)
    # Setting title and axis labels
    fig.update_layout(title=f"Price of {name} with Low, High, Average, and RSI",
                      xaxis_title="Date", yaxis_title="Price per Coin (USD)")
    fig.show()
It appears that RSI rapidly increases or decreases when more significant trends in prices occur, as is visible in the graphs for some of the cryptocurrencies. Seeing the similar flowing pattern, it is safe to conclude that there is some correlation between RSI and the OHLC data as a whole, and that it can help us understand the momentum of our currency data. Additionally, RSI shows us rapid relative fluctuations in a currency that we sometimes cannot see otherwise: a massive gain stretches the y-axis to a larger scale, which compresses the trends in the lower-value regions.
In this section we spent some time looking at our data, calculating all kinds of indicators, and visualizing them alongside other data to look for trends, which let us hypothesize about and explore relations in the data. Now that we have calculated some new fields in our dataset and identified where correlations between variables do or do not exist, we can move on to the next step in the data science lifecycle.
Now that we have a solid understanding of our data and have generated a few quantities that reveal characteristics that weren't visible before, we can put together a model to build a deeper understanding of the data and apply it to circumstances beyond the data itself. To figure out what we are going to do, let us first take a look at our data with everything calculated.
final_ml = final_cp.copy()
final_ml
 | Date | Name | Ticker | Open | High | Low | Close | Volume | Average | SMA25 | SMA50 | SMA100 | Growth | C_Volume | ATR | ADX | RSI
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---
0 | 2013-05-05 | Bitcoin | BTC | 112.900002 | 118.800003 | 107.142998 | 115.910004 | 0.000000e+00 | 114.405003 | NaN | NaN | NaN | 2.666078 | NaN | NaN | NaN | NaN |
2 | 2013-05-06 | Bitcoin | BTC | 115.980003 | 124.663002 | 106.639999 | 112.300003 | 0.000000e+00 | 114.140003 | NaN | NaN | NaN | -3.172961 | 0.00 | NaN | NaN | NaN |
4 | 2013-05-07 | Bitcoin | BTC | 112.250000 | 113.444000 | 97.699997 | 111.500000 | 0.000000e+00 | 111.875000 | NaN | NaN | NaN | -0.668151 | 0.00 | NaN | NaN | NaN |
7 | 2013-05-08 | Bitcoin | BTC | 109.599998 | 115.779999 | 109.599998 | 113.566002 | 0.000000e+00 | 111.583000 | NaN | NaN | NaN | 3.618616 | 0.00 | NaN | NaN | NaN |
9 | 2013-05-09 | Bitcoin | BTC | 113.199997 | 113.459999 | 109.260002 | 112.669998 | 0.000000e+00 | 112.934998 | NaN | NaN | NaN | -0.468197 | 0.00 | NaN | NaN | NaN |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
598 | 2023-05-08 | Tether | USDT | 1.001390 | 1.001660 | 1.000600 | 1.000840 | 1.071410e+08 | 1.001115 | 1.000535 | 1.000755 | 1.000828 | -0.054924 | 62362190.82 | 0.001539 | 33.720930 | 58.581236 |
599 | 2023-05-09 | Tether | USDT | 1.000840 | 1.001770 | 1.000290 | 1.000540 | 7.751265e+07 | 1.000690 | 1.000522 | 1.000702 | 1.000834 | -0.029975 | -29628362.87 | 0.000922 | 9.278351 | 54.623656 |
600 | 2023-05-10 | Tether | USDT | 1.000540 | 1.000870 | 1.000200 | 1.000790 | 1.013193e+08 | 1.000665 | 1.000512 | 1.000648 | 1.000840 | 0.024987 | 23806631.47 | 0.000914 | 19.018405 | 54.329004 |
601 | 2023-05-11 | Tether | USDT | 1.000780 | 1.000790 | 1.000000 | 1.000430 | 9.465740e+07 | 1.000605 | 1.000504 | 1.000602 | 1.000845 | -0.034973 | -6661882.15 | 0.000916 | 114.678899 | 51.120163 |
602 | 2023-05-12 | Tether | USDT | 1.000420 | 1.000670 | 1.000220 | 1.000280 | 8.327807e+07 | 1.000350 | 1.000489 | 1.000562 | 1.000848 | -0.013994 | -11379326.46 | 0.000886 | 122.857143 | 44.078947 |
21153 rows × 17 columns
If we look at our data, we have a lot of factors that we can take into account. In particular, we saw a correlation between ATR and close price, so we can put those two together in some sort of prediction model. Additionally, we can build the model around OHLCV data, as that is the backbone of the other metrics. We also saw that RSI can indicate whether a price is overbought or oversold, so we can factor that in. Finally, in predicting a trend, we can utilize ADX to tell us the strength of the trend and give some insight into whether a cryptocurrency will continue moving in the direction it is going. We should build a hypothesis and model around these factors.
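Before committing to a model, one quick sanity check is to compute pairwise correlations among the numeric columns and see which indicators move with the average. This is a sketch using pandas' built-in corr() on a small synthetic frame whose column names merely mirror ours (in practice you would call it on the real dataframe):

```python
import numpy as np
import pandas as pd

rng = np.random.default_rng(0)
close = rng.random(100).cumsum() + 10  # a drifting price-like series

# Illustrative frame: Average tracks Close closely, RSI is unrelated noise here
df = pd.DataFrame({
    "Close": close,
    "Average": close + rng.normal(0, 0.1, 100),
    "RSI": rng.uniform(20, 80, 100),
})

# Pairwise Pearson correlations among the numeric columns
corr = df.corr()
print(corr["Average"].sort_values(ascending=False))
```

Columns with correlations near ±1 against Average are strong linear candidates; values near 0 (like the synthetic RSI here) suggest any relationship, if present, is nonlinear.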
Let us set a hypothesis to validate our claims from the exploratory data analysis and visualization. We will follow the standard assumption that the selected variables have no correlation with the dependent variable. In our case specifically, let us state as a null hypothesis that all of the factors, excluding the non-numeric columns and the average itself, have no correlation with the average. Our alternative hypothesis is that this is not the case and that they do relate to each other.
Okay, with our understanding of the factors reviewed and our hypothesis set, let us now go ahead and figure out the model that will utilize all of those factors and help us test our hypothesis.
Taking all of this into account, what we can try to do for our model is predict the average price of a cryptocurrency on the next day based on the previous day's OHLC data along with our calculated indicators, through a supervised learning model. It would be difficult to figure out and verify the relationship between the dependent and independent variables through a neural network, so we will utilize a regression model. This will allow us to hypothesize about the correlation of those variables and determine whether they really do play some part in indicating how the average price moves.
Now that we know we will utilize a regression model, we need to select which one. A quick look at the data and our graphs indicates that there is not a lot of linearity in the relationships the data exhibits. As such, it would not be a good idea to utilize a linear regression model here. What we can utilize instead is a supervised learning technique that builds a regression model for us: Random Forest Regression.
As stated previously, a simple regression would not cut it, as the movements of the assets are complicated enough that a linear relation cannot express with certainty the trend an asset is following. Random Forest Regression is an application of ensemble learning and is well suited to regression problems. To learn more about Random Forest Regression and see the reference used in putting together this tutorial, check out the article linked here.
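To make the nonlinearity point concrete, here is a minimal sketch on synthetic data (not our price series) where a random forest captures a curved relationship that a straight line cannot:

```python
import numpy as np
from sklearn.ensemble import RandomForestRegressor
from sklearn.linear_model import LinearRegression
from sklearn.metrics import r2_score

rng = np.random.default_rng(0)
X = np.sort(rng.uniform(0, 10, 300)).reshape(-1, 1)
y = np.sin(X).ravel() + rng.normal(0, 0.1, 300)  # nonlinear signal with noise

lin = LinearRegression().fit(X, y)
rf = RandomForestRegressor(n_estimators=50, random_state=0).fit(X, y)

# The straight line can barely explain a sine wave; the forest tracks it closely
print("linear R^2:", r2_score(y, lin.predict(X)))
print("forest R^2:", r2_score(y, rf.predict(X)))
```

The forest achieves this by averaging many decision trees fit on bootstrap samples, each of which partitions the input space into piecewise-constant regions, so no global linear form is ever assumed.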
Okay, we will use the RandomForestRegressor() built into scikit-learn to try and create a model to predict cryptocurrency data. The documentation is linked here. What we will do is build a regression model for each of the 10 cryptocurrencies we decided to look at, and pass in the data points and indicators we have for that asset to create an average-price prediction model through regression.
for name in name_list:
    # Narrow the data down to one coin at a time since the model predicts per asset
    regressor_df = (final_ml[final_ml['Name'] == name]).copy()
    # Sorting by date so that the rows are in proper chronological order
    regressor_df = regressor_df.sort_values(['Date'])
    regressor_df = regressor_df.set_index('Date')
    # Dropping non-numerical columns and quantities we don't want used for regression
    regressor_df = regressor_df.drop(columns=['Volume', 'Name', 'Ticker'])
    # Removing all rows with NaN or inf values
    regressor_df = regressor_df.dropna()
    regressor_df = regressor_df[~regressor_df.isin([np.nan, np.inf, -np.inf]).any(axis=1)]
    # Shift the features down 1 so that yesterday's data predicts today's average
    regressor_shifted = pd.concat([regressor_df.iloc[:, 1:4].shift(1),
                                   regressor_df['Average'],
                                   regressor_df.iloc[:, 5:].shift(1)], axis=1)
    # Clean up the NaN row introduced by the shift
    regressor_shifted = regressor_shifted.dropna()
    # Splitting into training and test data
    x_train, x_test, y_train, y_test = train_test_split(regressor_shifted.drop(columns=['Average']),
                                                        regressor_shifted['Average'])
    # Creating a Random Forest Regressor with base parameters and training it
    rf = RandomForestRegressor(n_estimators=50, random_state=0).fit(x_train, y_train)
    # Using the trained model to predict on the test data
    prediction = rf.predict(x_test)
    # Combining the results into a dataframe for visualization
    x_test = x_test.reset_index()
    actual_y = y_test.reset_index().sort_values('Date')
    combined_results = pd.concat([x_test, pd.Series(prediction, name="Predicted")], axis=1)
    combined_results = combined_results.sort_values('Date')
    fig = make_subplots(rows=1, cols=1)
    # Creating traces for the actual and predicted averages
    trace1 = go.Scatter(x=combined_results['Date'], y=combined_results['Predicted'], name="Predicted")
    trace2 = go.Scatter(x=actual_y['Date'], y=actual_y['Average'], name="Actual")
    fig.add_trace(trace1, row=1, col=1)
    fig.add_trace(trace2, row=1, col=1)
    # Setting title and axis labels
    fig.update_layout(title=f"Actual and Predicted Average Price of {name} Over Time",
                      xaxis_title="Date", yaxis_title="Price per Coin (USD)")
    fig.show()
    # Calculating MSE, RMSE, and the R^2 value to see how well the model did
    mse = mean_squared_error(y_test, prediction)
    rmse = mean_squared_error(y_test, prediction, squared=False)
    r_2 = r2_score(y_test, prediction)
    print(f'Random Forest Regressor Model for {name}')
    print('Mean squared error:', mse)
    print('Root mean squared error:', rmse)
    print('R-squared:', r_2)
    print("\n")
Random Forest Regressor Model for Bitcoin
Mean squared error: 286973.5969311636
Root mean squared error: 535.6991664462095
R-squared: 0.9986472716405851

Random Forest Regressor Model for Ethereum
Mean squared error: 2005.4328645104265
Root mean squared error: 44.782059627828936
R-squared: 0.9980645002297991

Random Forest Regressor Model for Tether
Mean squared error: 1.036084692556676e-05
Root mean squared error: 0.0032188269486828213
R-squared: 0.865471259588598

Random Forest Regressor Model for Cardano
Mean squared error: 0.0009526060586103359
Root mean squared error: 0.03086431691468865
R-squared: 0.997058372751413

Random Forest Regressor Model for Dogecoin
Mean squared error: 3.969158945535347e-05
Root mean squared error: 0.006300126145987354
R-squared: 0.9938422023954274

Random Forest Regressor Model for Solana
Mean squared error: 15.736115639046183
Root mean squared error: 3.966877315855153
R-squared: 0.9950806564738562

Random Forest Regressor Model for Polygon
Mean squared error: 0.0037114403102814987
Root mean squared error: 0.06092159149498229
R-squared: 0.9911664148045579

Random Forest Regressor Model for Polkadot
Mean squared error: 1.2741498782012448
Root mean squared error: 1.12878247603391
R-squared: 0.9932244691495107

Random Forest Regressor Model for Litecoin
Mean squared error: 14.233409907159855
Root mean squared error: 3.772719166219486
R-squared: 0.9965445641672661

Random Forest Regressor Model for Shiba Inu
Mean squared error: 2.3202678348126907e-12
Root mean squared error: 1.523242539720018e-06
R-squared: 0.9892966258211765
Amazing! Our R^2 is greater than 0.95 for most of the currencies, with Tether being the exception. We can see this visually as well in how closely our predicted values map to the actual values. Tether's lower score could be due to different behavior shown by that currency, or the default parameters used for the Random Forest Regressor may simply not suit it. A way to fix that would be to fine-tune the model; however, 0.87 is still an acceptable R^2, so we will not delve further into it. To see how fine-tuning utilizing grid search could be done, check out the articles linked earlier.
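For completeness, a grid search over the forest's parameters might look like the following sketch. The parameter grid and synthetic data are illustrative assumptions, not tuned values for our dataset:

```python
import numpy as np
from sklearn.ensemble import RandomForestRegressor
from sklearn.model_selection import GridSearchCV

rng = np.random.default_rng(0)
X = rng.random((200, 3))
y = X @ np.array([2.0, -1.0, 0.5]) + rng.normal(0, 0.05, 200)

# Candidate values to sweep; cross-validation picks the best combination
param_grid = {"n_estimators": [25, 50], "max_depth": [5, None]}
search = GridSearchCV(RandomForestRegressor(random_state=0), param_grid, cv=3)
search.fit(X, y)
print(search.best_params_)
```

GridSearchCV refits every parameter combination on each cross-validation fold, so the sweep cost grows multiplicatively with the grid size; keeping the grid small, as here, is usually the practical starting point.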
On another note, we can reject our null hypothesis. Given the very high R^2 values and the very low errors, it is safe to conclude that the factors produce a good fit to the data. As such, we reject the null hypothesis and accept the alternative: there is a relationship between our independent factors and the dependent variable.
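One way to back up that conclusion on a per-feature basis is the forest's built-in feature_importances_ attribute, sketched here on synthetic data with one informative column and one pure-noise column (the column names are hypothetical, not from our dataset):

```python
import numpy as np
import pandas as pd
from sklearn.ensemble import RandomForestRegressor

rng = np.random.default_rng(0)
X = pd.DataFrame({"signal": rng.random(300), "noise": rng.random(300)})
y = 3 * X["signal"] + rng.normal(0, 0.05, 300)  # only "signal" drives the target

rf = RandomForestRegressor(n_estimators=50, random_state=0).fit(X, y)
# Impurity-based importance: how much each column reduces error across the trees
importances = dict(zip(X.columns, rf.feature_importances_))
print(importances)
```

Running the same idea on the trained per-coin models would show which of the OHLC columns and indicators the forest actually leans on when predicting the average.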
Well, we've reached the end of the journey. I hope that after this tutorial you have developed a better understanding of how to analyze cryptoasset data and how to train a machine to make predictions about some aspect of that data. While this model is extremely simple and not designed for high-frequency trading, it still gets the point across that we are able to analyze the data on some level and make a more informed decision than blindly spending money in some ineffective manner. In terms of a strategy you could employ utilizing the model, you could construct a basic "Buy-Low Sell-High" strategy around the movements of the average price of an asset you are interested in. As time progresses and technology develops, it will become even easier to develop these tools for our own use. Time waits for nobody; I hope that you seize the moment and take advantage of the resources around you as you pave the way towards a financially free future.
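As a closing illustration, that "Buy-Low Sell-High" idea could be sketched as a simple signal rule comparing today's average to the model's next-day prediction. The numbers below are hypothetical, not actual model output, and none of this is financial advice:

```python
import pandas as pd

# Hypothetical series: today's average price and the model's next-day prediction
df = pd.DataFrame({
    "today_avg": [100.0, 98.0, 101.0, 105.0],
    "predicted_next_avg": [98.0, 102.0, 104.0, 103.0],
})

# Buy when the model expects a rise, sell when it expects a fall
df["signal"] = df.apply(
    lambda r: "buy" if r["predicted_next_avg"] > r["today_avg"] else "sell", axis=1
)
print(df["signal"].tolist())  # ['sell', 'buy', 'buy', 'sell']
```

A real strategy would layer on transaction costs, position sizing, and a tolerance band around zero so tiny predicted moves don't trigger trades.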