library(data.table)
library(readr)


#setwd('')
# Load the daily industry portfolio returns and the Fama-French research
# factors, discarding every row that contains a missing value.
industry_portfolios <- read.csv("US_Industry_Portfolios_Daily.csv")
industry_portfolios <- na.omit(industry_portfolios)

factors <- read.csv("F-F_Research_Data_Factors_daily.csv")
factors <- na.omit(factors)
names(factors)[1] <- "Date"

# Keep factor rows 20113 through 25419 (selected by position, after the
# NA rows were dropped).
# NOTE(review): presumably this window lines the factors up with the rows of
# the industry file - confirm against the Date columns.
factors <- factors[20113:25419, ]

# Remove the Date column from both tables.
industry_portfolios[["Date"]] <- NULL
factors[["Date"]] <- NULL

# Three-factor regressions: for every column of `industry_portfolios`, regress
# its excess return (column minus factors$RF) on Mkt.RF, SMB and HML.
# The results are collected in four lists, each named by portfolio column:
#   betas     - the three factor slopes (coefficients 2 to 4)
#   alphas    - the intercept multiplied by 252 (yearly alpha)
#   r_squares - the regression R-squared
#   t_stats   - column 3 of the summary coefficient table (the t values)
#               for the three factor slopes
portfolio_names <- colnames(industry_portfolios)

# Preallocate named result lists instead of growing them inside the loop.
betas <- setNames(vector("list", length(portfolio_names)), portfolio_names)
alphas <- setNames(vector("list", length(portfolio_names)), portfolio_names)
r_squares <- setNames(vector("list", length(portfolio_names)), portfolio_names)
t_stats <- setNames(vector("list", length(portfolio_names)), portfolio_names)

# seq_len() yields an empty sequence when there are no columns, whereas
# 1:ncol() would iterate over c(1, 0).
for (i in seq_len(ncol(industry_portfolios))) {
  # Fit the model once per portfolio and reuse it for every statistic.
  fit <- lm(industry_portfolios[, i] - factors$RF ~
              factors$Mkt.RF + factors$SMB + factors$HML)
  fit_summary <- summary(fit)
  estimates <- coef(fit)

  betas[[i]] <- estimates[2:4]
  alphas[[i]] <- estimates[1] * 252 # Yearly alpha.
  r_squares[[i]] <- fit_summary$r.squared
  t_stats[[i]] <- fit_summary$coefficients[2:4, 3]
}


# Turn each per-portfolio result list into a data frame with one row per
# portfolio, label rows and columns, then bind everything into `stats`.
portfolio_names <- colnames(industry_portfolios)

betas <- transpose(as.data.frame(betas))
dimnames(betas) <- list(portfolio_names, c("MKT_RF", "SMB", "HML"))

alphas <- transpose(as.data.frame(alphas))
dimnames(alphas) <- list(portfolio_names, "Yearly Alphas")

r_squares <- transpose(as.data.frame(r_squares))
dimnames(r_squares) <- list(portfolio_names, "R_Squares")

t_stats <- transpose(as.data.frame(t_stats))
dimnames(t_stats) <- list(
  portfolio_names,
  c("Tstat_MKT_RF", "Tstat_SMB", "Tstat_HML")
)

# Column order: betas, yearly alpha, R-squared, t-statistics.
stats <- cbind(betas, alphas, r_squares, t_stats)


# Horizontal bar charts of the three-factor betas, one chart per factor.
# Each chart uses a copy of `stats` sorted by ascending beta for that factor,
# with the row names of the sorted table as bar labels.
# The plots read the sorted tables (MKT, SMB, HML) created right above each
# call; the names x1, x2 and x3 are never defined in this script.

MKT <- stats[order(stats$MKT_RF, decreasing = FALSE), ]
barplot(MKT$MKT_RF, horiz = TRUE, cex.names = 0.7, col = "blue4", las = 1,
        names.arg = rownames(MKT), main = "Market Betas", xlim = c(0, 1.5))


SMB <- stats[order(stats$SMB, decreasing = FALSE), ]
barplot(SMB$SMB, horiz = TRUE, cex.names = 0.7, col = "blue4", las = 1,
        names.arg = rownames(SMB), main = "Size Betas", xlim = c(-0.3, 1))


HML <- stats[order(stats$HML, decreasing = FALSE), ]
barplot(HML$HML, horiz = TRUE, cex.names = 0.7, col = "blue4", las = 1,
        names.arg = rownames(HML), main = "Value Betas")


# Load the daily momentum factor and prepare it for the regressions.
mom_factors <- read.csv("F-F_Momentum_Factor_daily.csv")
mom_factors <- na.omit(mom_factors) # Drop rows with missing values
names(mom_factors)[1] <- "Date" # The first column is renamed to "Date"

# Keep rows 20012 through 25318 (selected by position, after NA removal).
# NOTE(review): presumably this window covers the same dates as the other
# factor table - confirm against the Date columns.
mom_factors <- mom_factors[20012:25318, ]
mom_factors[["Date"]] <- NULL # The date column is dropped

# Four-factor regressions: for every column of `industry_portfolios`, regress
# its excess return (column minus factors$RF) on Mkt.RF, SMB, HML and the
# momentum factor mom_factors$Mom.
# The results are collected in four lists, each named by portfolio column:
#   betas     - the four factor slopes (coefficients 2 to 5)
#   alphas    - the intercept multiplied by 252 (annualized alpha)
#   r_squares - the regression R-squared
#   t_stats   - column 3 of the summary coefficient table (the t values)
#               for the four factor slopes
portfolio_names <- colnames(industry_portfolios)

# Preallocate named result lists instead of growing them inside the loop.
betas <- setNames(vector("list", length(portfolio_names)), portfolio_names)
alphas <- setNames(vector("list", length(portfolio_names)), portfolio_names)
r_squares <- setNames(vector("list", length(portfolio_names)), portfolio_names)
t_stats <- setNames(vector("list", length(portfolio_names)), portfolio_names)

# seq_len() yields an empty sequence when there are no columns, whereas
# 1:ncol() would iterate over c(1, 0).
for (i in seq_len(ncol(industry_portfolios))) {
  # Fit the model once per portfolio and reuse it for every statistic.
  # `$` access is kept on purpose: unlike `[[`, it tolerates partially
  # matching column names (NOTE(review): confirm the exact CSV headers).
  fit <- lm(industry_portfolios[, i] - factors$RF ~
              factors$Mkt.RF + factors$SMB + factors$HML + mom_factors$Mom)
  fit_summary <- summary(fit)
  estimates <- coef(fit)

  betas[[i]] <- estimates[2:5] # Beta coefficients
  alphas[[i]] <- estimates[1] * 252 # Annualized alpha
  r_squares[[i]] <- fit_summary$r.squared # R-squared value
  t_stats[[i]] <- fit_summary$coefficients[2:5, 3] # t-statistics
}


# Turn each per-portfolio result list of the four-factor model into a data
# frame with one row per portfolio, label rows and columns, then bind
# everything into `stats`.
portfolio_names <- colnames(industry_portfolios)

betas <- transpose(as.data.frame(betas))
dimnames(betas) <- list(portfolio_names, c("MKT_RF", "SMB", "HML", "WML"))

alphas <- transpose(as.data.frame(alphas))
dimnames(alphas) <- list(portfolio_names, "Yearly Alphas")

r_squares <- transpose(as.data.frame(r_squares))
dimnames(r_squares) <- list(portfolio_names, "R_Squares")

t_stats <- transpose(as.data.frame(t_stats))
dimnames(t_stats) <- list(
  portfolio_names,
  c("Tstat_MKT_RF", "Tstat_SMB", "Tstat_HML", "Tstat_WML")
)

# Column order: betas, yearly alpha, R-squared, t-statistics.
stats <- cbind(betas, alphas, r_squares, t_stats)


# Horizontal bar charts of the four-factor betas, one chart per factor.
# Each chart uses a copy of `stats` sorted by ascending beta for that factor,
# with the row names of the sorted table as bar labels.
# The plots read the sorted tables (Market, Size, Value, Momentum) created
# right above each call; the names x1 to x4 are never defined in this script.

Market <- stats[order(stats$MKT_RF, decreasing = FALSE), ]
barplot(Market$MKT_RF, horiz = TRUE, cex.names = 0.7, col = "blue4", las = 1,
        names.arg = rownames(Market), main = "Market Betas",
        xlim = c(0, 1.5))


Size <- stats[order(stats$SMB, decreasing = FALSE), ]
barplot(Size$SMB, horiz = TRUE, cex.names = 0.7, col = "blue4", las = 1,
        names.arg = rownames(Size), main = "Size Betas", xlim = c(-0.3, 1))


Value <- stats[order(stats$HML, decreasing = FALSE), ]
barplot(Value$HML, horiz = TRUE, cex.names = 0.7, col = "blue4", las = 1,
        names.arg = rownames(Value), main = "Value Betas")


Momentum <- stats[order(stats$WML, decreasing = FALSE), ]
barplot(Momentum$WML, horiz = TRUE, cex.names = 0.7, col = "blue4", las = 1,
        names.arg = rownames(Momentum), main = "Momentum Betas")

$$USA\ INDUSTRY\ DAILY\ RETURN\ AND\\ FAMA\text{-}FRENCH\ 3\ FACTOR\ DAILY\ RETURN$$

1. Using the “US_Industry_Portfolios_Daily.csv” data and the Fama-French three-factor daily returns, run the following regression for each sector portfolio $i$.

$$R_{it}-R_{ft}=\alpha_{i}+\beta_{i1}(R_{mt}-R_{ft})+\beta_{i2}SMB_{t}+\beta_{i3}HML_{t}+e_{it}$$

> website: All exercises are based on the R programming language.

a) Compute the alphas, factor betas and $R^2$ for each sector portfolio.

Do you think that SMB and HML are priced factors?

Compute the alphas, factor betas and $R^2$ for each sector portfolio. Discuss your observations.

Do you think that SMB and HML are priced factors? Why?

2. Add the daily momentum factor, which is also available from Kenneth French’s website.

Do your results change? Is a four-factor model better at capturing the fluctuations in sector portfolio returns? Discuss your observations.

$$R_{it}-R_{ft}=\alpha_{i}+\beta_{i1}(R_{mt}-R_{ft})+\beta_{i2}SMB_{t}+\beta_{i3}HML_{t}+\beta_{i4}WML_{t}+e_{it}$$