import fredapi as fa
import pandas as pd
import numpy as np
from dotenv import load_dotenv
import os
import matplotlib.pyplot as plt


# Load the two export files of each metal. Only the date, price and daily
# change columns are kept, and the parsed dates become the index.
_read_opts = dict(
    usecols=["Date", "Price", "Change %"],
    index_col="Date",
    parse_dates=["Date"],
)
silver = pd.read_csv('XAG_USD Historical Data.csv', **_read_opts)
silver_2 = pd.read_csv('XAG_USD Historical Data_2.csv', **_read_opts)
gold = pd.read_csv('XAU_USD Historical Data.csv', **_read_opts)
gold_2 = pd.read_csv('XAU_USD Historical Data_2.csv', **_read_opts)


# Stack the two files of each metal into a single frame and switch to
# snake_case column names in the same step.
_column_names = {'Price': 'price', 'Change %': 'pct_change'}
df_silver = pd.concat([silver, silver_2]).rename(columns=_column_names)
df_gold = pd.concat([gold_2, gold]).rename(columns=_column_names)


# Show the column dtypes of both frames to spot columns that were read as text.
for _label, _frame, _tail in (('Gold', df_gold, '\n'), ('Silver', df_silver, '')):
    print(f'{_label}:\n {_frame.dtypes}{_tail}')

Gold:
 price         object
pct_change    object
dtype: object

Silver:
 price         float64
pct_change     object
dtype: object


# The gold price column is read as text (presumably because of ',' thousands
# separators — confirm against the CSV); remove the commas, then cast to float.
_gold_price_text = df_gold['price'].str.replace(',', '')
df_gold['price'] = _gold_price_text.astype(float)


# The daily change column is text with a '%' sign in both data sets:
# strip the sign and cast to float.
for _frame in (df_gold, df_silver):
    _frame['pct_change'] = _frame['pct_change'].str.replace('%', '').astype(float)


# Do both metals have the same number of rows?
df_silver.shape[0] == df_gold.shape[0]

False


# Merging both datasets
# Outer join on the date index keeps dates present in only one of the two
# frames; the shared column names get a per-metal suffix.
df_combined = pd.merge(
    df_silver,
    df_gold,
    how='outer',
    left_index=True,
    right_index=True,
    suffixes=('_silver', '_gold'),
).sort_index()


df_combined.head()


# Identifying missing values: rows where at least one metal has no price

_price_gaps = df_combined[['price_silver', 'price_gold']].isnull().any(axis=1)
df_combined[_price_gaps]


# Expose the calendar day and month of the date index as regular columns.
for _part in ('day', 'month'):
    df_combined[_part] = getattr(df_combined.index, _part)


# Inspect every row dated 25 December.
_is_dec_25 = df_combined['day'].eq(25) & df_combined['month'].eq(12)
df_combined[_is_dec_25]


# Work on a copy so the merged frame stays untouched.
df_imputed = df_combined.copy()


# Hand-picked replacement prices for the dates where one metal has no quote.
_manual_prices = {
    # silver
    'silver': {
        "1995-12-25": 5.16,
        "2019-12-25": 17.765,
    },
    # gold
    'gold': {
        "2006-01-02": 517.12,
        "2014-12-25": 1173.6,
        "2018-12-25": 1269.8,
        "2019-04-19": 1275.51,
    },
}

for _metal, _fills in _manual_prices.items():
    _price_col = f"price_{_metal}"
    _pct_col = f"pct_change_{_metal}"
    for _date, _price in _fills.items():
        # The daily change is recomputed against the price in the preceding row.
        _previous = df_imputed[_price_col].shift(1).loc[_date]
        df_imputed.loc[_date, [_price_col, _pct_col]] = [_price, (_price / _previous - 1) * 100]


# check: display the six dates that received a manual price
_patched_dates = ['1995-12-25', '2006-01-02', '2014-12-25', '2018-12-25', '2019-04-19', '2019-12-25']
df_imputed[df_imputed.index.isin(_patched_dates)]


# List the style names matplotlib offers so one can be picked for the charts.
plt.style.available # choosing the style for charts

['Solarize_Light2',
 '_classic_test_patch',
 '_mpl-gallery',
 '_mpl-gallery-nogrid',
 'bmh',
 'classic',
 'dark_background',
 'fast',
 'fivethirtyeight',
 'ggplot',
 'grayscale',
 'seaborn-v0_8',
 'seaborn-v0_8-bright',
 'seaborn-v0_8-colorblind',
 'seaborn-v0_8-dark',
 'seaborn-v0_8-dark-palette',
 'seaborn-v0_8-darkgrid',
 'seaborn-v0_8-deep',
 'seaborn-v0_8-muted',
 'seaborn-v0_8-notebook',
 'seaborn-v0_8-paper',
 'seaborn-v0_8-pastel',
 'seaborn-v0_8-poster',
 'seaborn-v0_8-talk',
 'seaborn-v0_8-ticks',
 'seaborn-v0_8-white',
 'seaborn-v0_8-whitegrid',
 'tableau-colorblind10']


# Histogram of daily returns: gold as a red outline drawn together with
# silver as filled bars, both in percent.
plt.style.use('bmh')
_fig, _ax = plt.subplots(figsize=(10, 5))
_ax.hist(
    df_imputed['pct_change_gold'],
    bins=100,
    histtype='step',
    linewidth=1,
    color='red',
    label='gold daily returns',
)
_ax.hist(
    df_imputed['pct_change_silver'],
    bins=100,
    alpha=0.8,
    label='silver daily returns',
)
_ax.set_title('Distribution of daily returns Gold vs Silver')
_ax.set_xlabel('Daily returns %')
_ax.legend()
plt.show()


# Yearly simple return of silver in percent, based on the last available
# price of each calendar year. The first year has no predecessor and is dropped.
# NOTE(review): newer pandas releases deprecate the 'Y' alias in favour of
# 'YE' — confirm against the installed version before changing it.
_silver_year_end = df_imputed['price_silver'].resample('Y').last()
silver_annual_returns = (
    (_silver_year_end.pct_change() * 100)
    .rename('returns')
    .to_frame()
    .dropna()
)


silver_annual_returns.head()


# Bar chart of silver's yearly returns. The newest bar is flagged with an
# "Ongoing" arrow.
plt.figure(figsize=(12, 5))
plt.bar(silver_annual_returns.index, silver_annual_returns['returns'], width=200)
plt.xticks(silver_annual_returns.index, rotation=90)

# Anchor the annotation on the last row rather than a fixed position, so it
# keeps pointing at the newest year when the data range changes.
_latest_year = silver_annual_returns.index[-1]
_latest_return = silver_annual_returns['returns'].iloc[-1]
plt.annotate('Ongoing',
             xy=(_latest_year, _latest_return),
             fontsize=13,
             xytext=(_latest_year, _latest_return + 15),  # text 15 points above the bar value
             arrowprops=dict(facecolor='black', width=1))
plt.title("Silver's annual returns")
plt.ylabel('Returns [%]')
plt.xlabel('Year')
plt.show()


# Yearly simple return of gold in percent, based on the last available
# price of each calendar year. The first year has no predecessor and is dropped.
# NOTE(review): newer pandas releases deprecate the 'Y' alias in favour of
# 'YE' — confirm against the installed version before changing it.
_gold_year_end = df_imputed['price_gold'].resample('Y').last()
gold_annual_returns = (
    (_gold_year_end.pct_change() * 100)
    .rename('returns')
    .to_frame()
    .dropna()
)


# Bar chart of gold's yearly returns. The newest bar is flagged with an
# "Ongoing" arrow.
plt.figure(figsize=(12, 5))
plt.bar(gold_annual_returns.index, gold_annual_returns['returns'], width=200)
plt.xticks(gold_annual_returns.index, rotation=90)

# Anchor the annotation on the last row rather than a fixed position, so it
# keeps pointing at the newest year when the data range changes.
_latest_year = gold_annual_returns.index[-1]
_latest_return = gold_annual_returns['returns'].iloc[-1]
plt.annotate('Ongoing',
             xy=(_latest_year, _latest_return),
             fontsize=13,
             xytext=(_latest_year, _latest_return + 15),  # text 15 points above the bar value
             arrowprops=dict(facecolor='black', width=1))
plt.title("Gold's annual returns")
plt.ylabel('Returns [%]')
plt.xlabel('Year')
plt.show()


# Daily log returns: natural log of each price divided by the previous row's
# price. The first row has no predecessor and therefore stays NaN.
for _metal in ('gold', 'silver'):
    _price = df_imputed[f'price_{_metal}']
    df_imputed[f'log_returns_{_metal}'] = np.log(_price / _price.shift(1))


df_imputed


# Total growth factor of gold over the whole sample: the daily log returns
# add up, so exponentiating their sum gives last price / first price.
np.exp(df_imputed['log_returns_gold'].sum())

7.661620775153328


# Total growth factor of silver over the whole sample: the daily log returns
# add up, so exponentiating their sum gives last price / first price.
np.exp(df_imputed['log_returns_silver'].sum())

6.687832310838415


# Annual mean log return of gold: average daily log return scaled by 252.
# NOTE(review): 252 is the usual trading-days-per-year factor, but this data
# set also has rows on dates such as 25 December, so a year may hold more
# than 252 rows — confirm the scaling factor.
df_imputed['log_returns_gold'].mean() * 252

0.06539165729650645


# Annual mean log return of silver: average daily log return scaled by 252.
# NOTE(review): 252 is the usual trading-days-per-year factor, but this data
# set also has rows on dates such as 25 December, so a year may hold more
# than 252 rows — confirm the scaling factor.
df_imputed['log_returns_silver'].mean() * 252

0.06102625591775513


# Annualised volatility of gold: standard deviation of the daily log returns
# scaled by the square root of 252 periods.
df_imputed['log_returns_gold'].std() * np.sqrt(252)

0.15873235673833885


# Annualised volatility of silver: standard deviation of the daily log returns
# scaled by the square root of 252 periods.
df_imputed['log_returns_silver'].std() * np.sqrt(252)

0.2854965823065996


# Cumulative growth factor per metal: running sum of the daily log returns,
# mapped back from log space with exp.
for _metal in ('gold', 'silver'):
    _running_log = df_imputed[f'log_returns_{_metal}'].cumsum()
    df_imputed[f'cum_returns_{_metal}'] = _running_log.apply(np.exp)


# Compare the cumulative growth of gold and silver on one chart.
# The plotted columns are exp(cumsum(log returns)), i.e. a growth multiple of
# the starting price, so the y-axis is labelled as the value of 1 USD
# invested rather than as a plain USD amount.
plt.figure(figsize=(12,7))
df_imputed['cum_returns_gold'].plot(label = 'gold')
df_imputed['cum_returns_silver'].plot(label = 'silver', alpha=0.5)
plt.title("Cumulative returns Gold vs Silver")
plt.ylabel('Cumulative returns [growth of 1 USD]')
plt.xlabel('Date')
plt.legend()
plt.show()


# Running peak of each cumulative-return curve.
for _metal in ('gold', 'silver'):
    df_imputed[f'cummax_{_metal}'] = df_imputed[f'cum_returns_{_metal}'].cummax()


# One chart per metal: the curve together with its running peak.
for _metal in ('gold', 'silver'):
    df_imputed[[f'cum_returns_{_metal}', f'cummax_{_metal}']].plot()
plt.show()


# Absolute drawdown: distance between the running peak and the current
# cumulative return.
for _metal in ('gold', 'silver'):
    _peak = df_imputed[f'cummax_{_metal}']
    df_imputed[f'drawdown_{_metal}'] = _peak - df_imputed[f'cum_returns_{_metal}']
df_imputed.head()


# Largest gap between gold's running peak and its cumulative return.
df_imputed['drawdown_gold'].max() # gold's biggest drawdown - dollar perspective

2.215189873417721


# Index label (date) of the row holding gold's largest absolute drawdown.
df_imputed['drawdown_gold'].idxmax() # when it took place

Timestamp('2015-12-17 00:00:00')


# Cumulative return and running peak of gold on 2015-12-17.
df_imputed.loc['2015-12-17',['cum_returns_gold','cummax_gold']]

cum_returns_gold    2.744982
cummax_gold         4.960172
Name: 2015-12-17 00:00:00, dtype: float64


# Largest gap between silver's running peak and its cumulative return.
df_imputed['drawdown_silver'].max()

7.458077709611461


# Index label (date) of the row holding silver's largest absolute drawdown.
df_imputed['drawdown_silver'].idxmax()

Timestamp('2020-03-18 00:00:00')


# Cumulative return and running peak of silver on 2020-03-18.
df_imputed.loc['2020-03-18',['cum_returns_silver','cummax_silver']]

cum_returns_silver    2.449898
cummax_silver         9.907975
Name: 2020-03-18 00:00:00, dtype: float64


# Relative drawdown: the gap to the running peak expressed as a fraction of
# that peak.
for _metal in ('gold', 'silver'):
    _peak = df_imputed[f'cummax_{_metal}']
    _current = df_imputed[f'cum_returns_{_metal}']
    df_imputed[f'%drawdown_{_metal}'] = (_peak - _current) / _peak
df_imputed.head()


# Gold's deepest drawdown as a fraction of the running peak.
df_imputed['%drawdown_gold'].max()

0.44659535172508297


# Index label (date) of gold's deepest relative drawdown.
df_imputed['%drawdown_gold'].idxmax()

Timestamp('2015-12-17 00:00:00')


# Silver's deepest drawdown as a fraction of the running peak.
df_imputed['%drawdown_silver'].max()

0.7527347781217767


# Index label (date) of silver's deepest relative drawdown.
df_imputed['%drawdown_silver'].idxmax()

Timestamp('2020-03-18 00:00:00')


# Gold/silver ratio: gold price divided by silver price, rounded to 2 decimals.
_raw_ratio = df_imputed['price_gold'] / df_imputed['price_silver']
df_imputed['ratio'] = _raw_ratio.round(2)


# Gold/silver ratio over time with the 40-80 band shaded in green.
# NOTE(review): presumably 40-80 marks the range regarded as typical for the
# ratio — confirm the intended meaning of the band.
plt.style.use('bmh')
_fig, _ax = plt.subplots(figsize=(10, 5))
_ax.plot(df_imputed['ratio'], label='gold/silver ratio')
_ax.axhspan(40, 80, color='green', alpha=0.3)
_ax.legend()
plt.show()


# Load variables from a .env file into the environment, then create the FRED
# client with the key stored under the 'FredAPI' variable.
load_dotenv()
api_key = os.getenv('FredAPI')
fred = fa.Fred(api_key=api_key)


# Search FRED for recession-related series. The result is stored so the
# notes lookup below reuses it instead of sending the same search request
# a second time.
recession_search = fred.search('Recession')
recession_search


# Read the notes to understand the data
recession_search.loc['JHDUSRGDPBR','notes']

'The series assigns dates to U.S. recessions based on a mathematical model of the way that recessions differ from expansions. Whereas the NBER business cycle dates are based on a subjective assessment of a variety of indicators, the dates here are entirely mechanical and are calculated solely from historically reported GDP data. Whenever the GDP-based recession indicator index rises above 67%, the economy is determined to be in a recession. The date that the recession is determined to have begun is the first quarter prior to that date for which the inference from the mathematical model using all data available at that date would have been above 50%. The next time the GDP-based recession indicator index falls below 33%, the recession is determined to be over, and the last quarter of the recession is the first quarter for which the inference from the mathematical model using all available data at that date would have been below 50%.  For more information about this series visit http://econbrowser.com/recession-index.'


# Download the GDP-based recession indicator series.
recession = fred.get_series('JHDUSRGDPBR')
# Filter recession quarters starting from 1995 (a value of 1 marks a recession quarter)
_in_recession = recession.eq(1)
recession[_in_recession].loc['1995':]

2001-01-01    1.0
2001-04-01    1.0
2001-07-01    1.0
2007-10-01    1.0
2008-01-01    1.0
2008-04-01    1.0
2008-07-01    1.0
2008-10-01    1.0
2009-01-01    1.0
2009-04-01    1.0
2020-01-01    1.0
2020-04-01    1.0
dtype: float64


# Prepare recession ranges to be plotted according to the rules stated in the notes.
# Each window opens one quarter before the first flagged quarter of a
# recession and closes on the date of its last flagged quarter.
rec_periods = [
    ('2000-10-01', '2001-07-01'),  # first recession
    ('2007-07-01', '2009-04-01'),  # second recession
    ('2019-10-01', '2020-04-01'),  # third recession
]

# Individual boundaries, kept available under their own names.
(x1_min, x1_max), (x2_min, x2_max), (x3_min, x3_max) = rec_periods


# Three stacked panels (gold price, silver price, gold/silver ratio), each
# with every recession window shaded in green.
plt.style.use('bmh')
plt.figure(figsize=(15,10))
plt.subplots_adjust(hspace=0.5)

titles = ["Gold performance during recessions", 
          "Silver performance during recessions", 
          "Gold/Silver ratio performance during recessions"]

columns = ['price_gold', 'price_silver', 'ratio']

# Parse the window boundaries once. Handing real timestamps to axvspan means
# the shading does not depend on which date converter happens to be
# registered for the axis (plain strings are only understood by some).
_rec_spans = [(pd.Timestamp(start), pd.Timestamp(end)) for start, end in rec_periods]

for i, (title, col) in enumerate(zip(titles, columns), 1):
    plt.subplot(3, 1, i)
    plt.plot(df_imputed[col], label=col)
    plt.title(title)
    plt.legend()

    for span_start, span_end in _rec_spans:
        plt.axvspan(span_start, span_end, color='green', alpha=0.4)

plt.show()

	price_silver	pct_change_silver	price_gold	pct_change_gold
Date
1995-01-02	4.89	0.00	383.15	0.08
1995-01-03	4.75	-2.86	379.70	-0.90
1995-01-04	4.62	-2.74	374.55	-1.36
1995-01-05	4.71	1.95	375.55	0.27
1995-01-06	4.64	-1.49	371.95	-0.96

	price_silver	pct_change_silver	price_gold	pct_change_gold
Date
1995-12-25	NaN	NaN	387.50	0.06
2006-01-02	8.84	0.23	NaN	NaN
2014-12-25	15.74	0.13	NaN	NaN
2018-12-25	14.78	0.03	NaN	NaN
2019-04-19	14.93	-0.40	NaN	NaN
2019-12-25	NaN	NaN	1499.55	0.00

	price_silver	pct_change_silver	price_gold	pct_change_gold	day	month
Date
1995-12-25	NaN	NaN	387.50	0.06	25	12
1996-12-25	4.8500	0.00	368.90	0.01	25	12
1997-12-25	6.3900	0.00	296.75	0.10	25	12
1998-12-25	4.9400	0.00	286.75	0.14	25	12
2000-12-25	4.6200	0.00	274.05	0.04	25	12
2001-12-25	4.5400	0.00	279.50	0.52	25	12
2002-12-25	4.6500	0.00	345.50	-0.39	25	12
2003-12-25	5.7700	0.00	412.00	0.00	25	12
2006-12-25	12.5900	-0.08	620.75	-0.04	25	12
2007-12-25	14.4100	-0.89	807.00	-0.60	25	12
2008-12-25	10.3800	0.00	846.00	-0.18	25	12
2009-12-25	17.5500	0.40	1104.50	-0.09	25	12
2012-12-25	29.8800	-0.10	1658.90	0.09	25	12
2013-12-25	19.5100	0.52	1204.70	0.03	25	12
2014-12-25	15.7400	0.13	NaN	NaN	25	12
2015-12-25	14.3700	-0.07	1075.88	0.00	25	12
2017-12-25	16.3800	0.06	1275.24	0.02	25	12
2018-12-25	14.7800	0.03	NaN	NaN	25	12
2019-12-25	NaN	NaN	1499.55	0.00	25	12
2020-12-25	25.8500	0.04	1875.82	-0.04	25	12
2023-12-25	24.2365	0.29	2054.93	0.10	25	12

	returns
Date
1996-12-31	-7.899807
1997-12-31	25.523013
1998-12-31	-16.000000
1999-12-31	7.539683
2000-12-31	-15.129151

	price_silver	pct_change_silver	price_gold	pct_change_gold	day	month	log_returns_gold	log_returns_silver
Date
1995-01-02	4.8900	0.00	383.15	0.08	2	1	NaN	NaN
1995-01-03	4.7500	-2.86	379.70	-0.90	3	1	-0.009045	-0.029048
1995-01-04	4.6200	-2.74	374.55	-1.36	4	1	-0.013656	-0.027750
1995-01-05	4.7100	1.95	375.55	0.27	5	1	0.002666	0.019293
1995-01-06	4.6400	-1.49	371.95	-0.96	6	1	-0.009632	-0.014974
...	...	...	...	...	...	...	...	...
2025-02-13	32.3595	0.44	2929.03	0.87	13	2	0.008699	0.004358
2025-02-14	32.1367	-0.69	2883.18	-1.57	14	2	-0.015777	-0.006909
2025-02-17	32.7900	2.03	2897.66	0.50	17	2	0.005010	0.020125
2025-02-18	32.8691	0.24	2935.58	1.31	18	2	0.013002	0.002409
2025-02-19	32.7035	-0.50	2935.55	0.00	19	2	-0.000010	-0.005051

Analysis of gold and silver performance over the last 30 years

Data loading

Data cleaning

Data analysis

Simple returns year by year

Exploring Gold/Silver ratio

Performance during recessions

Summary

	price_silver	pct_change_silver	price_gold	pct_change_gold	day	month
Date
1995-12-25	5.160	-0.193424	387.50	0.060000	25	12
2006-01-02	8.840	0.230000	517.12	-0.092736	2	1
2014-12-25	15.740	0.130000	1173.60	-0.017039	25	12
2018-12-25	14.780	0.030000	1269.80	0.052792	25	12
2019-04-19	14.930	-0.400000	1275.51	0.009409	19	4
2019-12-25	17.765	-0.112454	1499.55	0.000000	25	12

	id	realtime_start	realtime_end	title	observation_start	observation_end	frequency	frequency_short	units	units_short	seasonal_adjustment	seasonal_adjustment_short	last_updated	popularity	notes
series id
SAHMREALTIME	SAHMREALTIME	2025-02-27	2025-02-27	Real-time Sahm Rule Recession Indicator	1959-12-01	2025-01-01	Monthly	M	Percentage Points	Percentage Points	Seasonally Adjusted	SA	2025-02-07 07:59:03-06:00	80	Sahm Recession Indicator signals the start of ...
RECPROUSM156N	RECPROUSM156N	2025-02-27	2025-02-27	Smoothed U.S. Recession Probabilities	1967-06-01	2024-12-01	Monthly	M	Percent	%	Not Seasonally Adjusted	NSA	2025-02-03 09:54:02-06:00	73	Smoothed recession probabilities for the Unite...
JHDUSRGDPBR	JHDUSRGDPBR	2025-02-27	2025-02-27	Dates of U.S. recessions as inferred by GDP-ba...	1967-10-01	2024-07-01	Quarterly	Q	+1 or 0	+1 or 0	Not Seasonally Adjusted	NSA	2025-01-30 19:01:01-06:00	69	The series assigns dates to U.S. recessions ba...
USREC	USREC	2025-02-27	2025-02-27	NBER based Recession Indicators for the United...	1854-12-01	2025-01-01	Monthly	M	+1 or 0	+1 or 0	Not Seasonally Adjusted	NSA	2025-02-03 18:01:01-06:00	69	This time series is an interpretation of US Bu...
USRECD	USRECD	2025-02-27	2025-02-27	NBER based Recession Indicators for the United...	1854-12-01	2025-02-25	Daily, 7-Day	D	+1 or 0	+1 or 0	Not Seasonally Adjusted	NSA	2025-02-26 18:02:04-06:00	53	This time series is an interpretation of US Bu...
...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...
DHIDFHRVIEHS	DHIDFHRVIEHS	2025-02-27	2025-02-27	DHI-DFH Index of Recruiting Intensity per Vaca...	2001-01-01	2018-04-01	Monthly	M	Index	Index	Not Seasonally Adjusted	NSA	2018-06-11 09:21:04-05:00	1	Monthly updates of the DHI Hiring Indicators h...
DHIDFHRIVMW	DHIDFHRIVMW	2025-02-27	2025-02-27	DHI-DFH Index of Recruiting Intensity per Vaca...	2001-01-01	2018-04-01	Monthly	M	Index	Index	Not Seasonally Adjusted	NSA	2018-06-11 09:21:04-05:00	0	Monthly updates of the DHI Hiring Indicators h...
DHIDFHRVIHS	DHIDFHRVIHS	2025-02-27	2025-02-27	DHI-DFH Index of Recruiting Intensity per Vaca...	2001-01-01	2018-04-01	Monthly	M	Index	Index	Not Seasonally Adjusted	NSA	2018-06-11 09:21:04-05:00	0	Monthly updates of the DHI Hiring Indicators h...
DHIDFHRVIFS	DHIDFHRVIFS	2025-02-27	2025-02-27	DHI-DFH Index of Recruiting Intensity per Vaca...	2001-01-01	2018-04-01	Monthly	M	Index	Index	Not Seasonally Adjusted	NSA	2018-06-11 09:21:04-05:00	0	Monthly updates of the DHI Hiring Indicators h...
DHIDFHRVIWTU	DHIDFHRVIWTU	2025-02-27	2025-02-27	DHI-DFH Index of Recruiting Intensity per Vaca...	2001-01-01	2018-04-01	Monthly	M	Index	Index	Not Seasonally Adjusted	NSA	2018-06-11 09:21:03-05:00	0	Monthly updates of the DHI Hiring Indicators h...