This is an R Markdown Notebook. When you execute code within the notebook, the results appear beneath the code.

Try executing this chunk by clicking the Run button within the chunk or by placing your cursor inside it and pressing Ctrl+Shift+Enter.

library(ggplot2)
library(plotly)
library(dplyr)
library(readr)
library(lubridate)
library(stringr)
library(ggthemes)
library(extrafont)
library(gapminder)
# Read the official data file.
# check.names = FALSE keeps the CSV column headers exactly as written and
# stringsAsFactors = FALSE leaves text columns as character vectors.
# (Spelled-out FALSE is used because the shorthand F can be reassigned.)
official_table <- read.csv(
  file = "AAPL_Pre_Official_DB_7_31.csv",
  check.names = FALSE,
  stringsAsFactors = FALSE
)

# Summary table: mean of Volume for each Month.
# NOTE(review): subset() with no condition keeps every row; it is left in
# place so the pipeline input is unchanged.
month_summary <- subset(official_table) %>%
  group_by(Month) %>%
  summarize(Mean_volume = mean(Volume), .groups = "keep")

# Base plot object: Month on the x axis, mean volume on the y axis.
month_plt <- ggplot(month_summary, aes(x = Month, y = Mean_volume))

# Line chart of the monthly means.
# group = 1 puts all rows into a single line; without it geom_line() draws
# nothing when x is discrete (e.g. if Month is read as character). It has no
# effect when Month is numeric. The previous scale_fill_gradient() call was
# dropped because no layer maps a fill aesthetic, and the title now names the
# statistic that is actually plotted (a mean, not a total).
month_plt +
  geom_line(aes(group = 1)) +
  theme_minimal() +
  labs(title = "Mean Volume by Month") +
  theme(
    panel.grid.major = element_blank(),
    panel.grid.minor = element_blank(),
    text = element_text(family = "DM Sans"),
    plot.title = element_text(hjust = 0.5),
    legend.position = "none"
  )

# Summary table: mean of Volume for every Year/Season pair.
# subset() is called without a condition, so all rows are passed on.
year_summary_season <- official_table %>%
  subset() %>%
  group_by(Year, Season) %>%
  summarize(Mean_volume = mean(Volume), .groups = "keep")

# Base plot object: Year on x, mean volume on y, coloured by Season.
plt_year_summary_season <- ggplot(
  data = year_summary_season,
  mapping = aes(x = Year, y = Mean_volume, color = Season)
)

# Scatter plot with explicit axis, legend and title text.
plt_year_summary_season +
  geom_point() +
  labs(
    title = "Summary of Volume per Season & Year",
    x = "Year",
    y = "Mean_volume",
    color = "Season"
  )

# Summary table: mean of Volume per Year/Season, restricted to rows where
# Year > 2015 and Year <= 2020.
# NOTE(review): the object name says "Ten" but the filter and the plot title
# both describe five years - confirm which is intended before renaming.
year_lastTenSeason <-
  subset(official_table, Year > 2015 & Year <= 2020) %>%
  group_by(Year, Season) %>%
  summarize(Mean_volume = mean(Volume), .groups = "keep")

# Base plot object: Year on x, mean volume on y, coloured by Season.
plt_year_lastTenSeason <- ggplot(
  data = year_lastTenSeason,
  mapping = aes(x = Year, y = Mean_volume, color = Season)
)

# Scatter plot with explicit axis, legend and title text.
plt_year_lastTenSeason +
  geom_point() +
  labs(
    title = "Summary of Volume in Last 5 Years for Seasons",
    x = "Year",
    y = "Mean_volume",
    color = "Season"
  )

# Summary table: mean of Volume for every Year/Quarter pair.
# NOTE(review): subset() with no condition keeps every row; it is left in
# place so the pipeline input is unchanged.
year_summary_quarter <- subset(official_table) %>%
  group_by(Year, Quarter) %>%
  summarize(Mean_volume = mean(Volume), .groups = "keep")

# Base plot object: Year on x, mean volume on y, coloured by Quarter.
plt_year_summary_quarter <- ggplot(
  year_summary_quarter,
  aes(x = Year, y = Mean_volume, color = Quarter)
)

# Scatter plot with explicit axis, legend and title text.
# The bare `NA` expressions that used to follow this plot were removed: they
# computed nothing and only printed "[1] NA" after the figure.
plt_year_summary_quarter +
  geom_point() +
  labs(
    x = "Year",
    y = "Mean_volume",
    color = "Quarter",
    title = "Summary of Volume per Quarters & Year"
  )
# Summary table: mean of Volume per Year/Quarter, restricted to rows where
# Year > 2015 and Year <= 2020.
# NOTE(review): the object name says "Ten" but the filter and the plot title
# both describe five years - confirm which is intended before renaming.
year_lastTenQuarter <-
  subset(official_table, Year > 2015 & Year <= 2020) %>%
  group_by(Year, Quarter) %>%
  summarize(Mean_volume = mean(Volume), .groups = "keep")

# Base plot object: Year on x, mean volume on y, coloured by Quarter.
plt_year_lastTenQuarter <- ggplot(
  data = year_lastTenQuarter,
  mapping = aes(x = Year, y = Mean_volume, color = Quarter)
)

# Scatter plot with explicit axis, legend and title text.
plt_year_lastTenQuarter +
  geom_point() +
  labs(
    title = "Summary of Volume in Last 5 Years for Quarters",
    x = "Year",
    y = "Mean_volume",
    color = "Quarters"
  )

# Summary table: mean of Volume for every combination of Gain_Loss_Open,
# Month and Season. subset() has no condition, so all rows are passed on.
month_summary_Gain_Loss_Open_season <- official_table %>%
  subset() %>%
  group_by(Gain_Loss_Open, Month, Season) %>%
  summarize(Mean_volume = mean(Volume), .groups = "keep")

# Base plot object: Month on x, mean volume on y, colour taken from Season
# and point shape taken from Gain_Loss_Open.
plt_month_summary_Gain_Loss_Open_season <- ggplot(
  data = month_summary_Gain_Loss_Open_season,
  mapping = aes(
    x = Month,
    y = Mean_volume,
    color = Season,
    shape = Gain_Loss_Open
  )
)

# Scatter plot with explicit axis and legend text (no title is set).
plt_month_summary_Gain_Loss_Open_season +
  geom_point() +
  labs(
    x = "Month",
    y = "Mean_volume",
    color = "Season",
    shape = "Gain_Loss_Open"
  )



# Summary table: mean of Volume for every combination of Gain_Loss_Open,
# Month and Quarter. subset() has no condition, so all rows are passed on.
month_summary_Gain_Loss_Open_quarter <- official_table %>%
  subset() %>%
  group_by(Gain_Loss_Open, Month, Quarter) %>%
  summarize(Mean_volume = mean(Volume), .groups = "keep")

# Base plot object: Month on x, mean volume on y, colour taken from Quarter
# and point shape taken from Gain_Loss_Open.
plt_month_summary_Gain_Loss_Open <- ggplot(
  data = month_summary_Gain_Loss_Open_quarter,
  mapping = aes(
    x = Month,
    y = Mean_volume,
    color = Quarter,
    shape = Gain_Loss_Open
  )
)

# Scatter plot with explicit axis and legend text (no title is set).
plt_month_summary_Gain_Loss_Open +
  geom_point() +
  labs(
    x = "Month",
    y = "Mean_volume",
    color = "Quarter",
    shape = "Gain_Loss_Open"
  )


# Mean Volume by Quarter / Season and gain-loss flag ----
#
# The eight plots below all follow the same recipe (summarise -> base ggplot
# -> scatter with labels), so the recipe lives in three small helpers and each
# plot is three short statements. Every object name that existed before the
# refactor is still assigned, and each plot is still printed at top level.

# Mean of Volume for every combination of the columns named in `group_cols`.
#   data        data frame with a Volume column and the grouping columns
#   group_cols  character vector of column names, in grouping order
# Returns one row per combination with a Mean_volume column; the result stays
# grouped by `group_cols` (.groups = "keep").
summarise_mean_volume <- function(data, group_cols) {
  # NOTE(review): subset() without a condition keeps every row. It is retained
  # so the data entering group_by() is exactly what it was before; drop it
  # once confirmed unnecessary.
  subset(data) %>%
    group_by(across(all_of(group_cols))) %>%
    summarize(Mean_volume = mean(Volume), .groups = "keep")
}

# Base ggplot (no layers) for a summary built by summarise_mean_volume().
#   summary_tbl  summary table containing `period_col`, `flag_col`, Mean_volume
#   period_col   name of the column used for the x axis and the colour
#   flag_col     name of the column used for the point shape
# Labels are set here because aes() sees `.data[[...]]` rather than a bare
# column name; the label text equals the column names.
base_gain_loss_plot <- function(summary_tbl, period_col, flag_col) {
  ggplot(
    summary_tbl,
    aes(
      x = .data[[period_col]],
      y = Mean_volume,
      color = .data[[period_col]],
      shape = .data[[flag_col]]
    )
  ) +
    labs(x = period_col, y = "Mean_volume",
         color = period_col, shape = flag_col)
}

# Add the scatter layer and the title to a base plot.
# The default title is "<period>_G/L_<suffix>", where <suffix> is `flag_col`
# without its "Gain_Loss_" prefix (e.g. "Quarter_G/L_Open").
gain_loss_scatter <- function(base_plot, period_col, flag_col,
                              title = paste0(period_col, "_G/L_",
                                             sub("^Gain_Loss_", "", flag_col))) {
  base_plot +
    geom_point() +
    labs(title = title)
}

## Quarter ----

# Summary table for quarter by volume.
quarter_summary_ <- summarise_mean_volume(official_table, "Quarter")

# Gain_Loss_Open in each quarter.
quarter_summary_Gain_Loss_Open <-
  summarise_mean_volume(official_table, c("Gain_Loss_Open", "Quarter"))
plt_quarter_summary_Gain_Loss_Open <- base_gain_loss_plot(
  quarter_summary_Gain_Loss_Open, "Quarter", "Gain_Loss_Open"
)
gain_loss_scatter(
  plt_quarter_summary_Gain_Loss_Open, "Quarter", "Gain_Loss_Open"
)

# Gain_Loss_Close in each quarter.
quarter_summary_Gain_Loss_Close <-
  summarise_mean_volume(official_table, c("Gain_Loss_Close", "Quarter"))
plt_quarter_summary_Gain_Loss_Close <- base_gain_loss_plot(
  quarter_summary_Gain_Loss_Close, "Quarter", "Gain_Loss_Close"
)
gain_loss_scatter(
  plt_quarter_summary_Gain_Loss_Close, "Quarter", "Gain_Loss_Close"
)

# Gain_Loss_High in each quarter.
quarter_summary_Gain_Loss_High <-
  summarise_mean_volume(official_table, c("Gain_Loss_High", "Quarter"))
plt_quarter_summary_Gain_Loss_High <- base_gain_loss_plot(
  quarter_summary_Gain_Loss_High, "Quarter", "Gain_Loss_High"
)
gain_loss_scatter(
  plt_quarter_summary_Gain_Loss_High, "Quarter", "Gain_Loss_High"
)

# Gain_Loss_Low in each quarter.
quarter_summary_Gain_Loss_Low <-
  summarise_mean_volume(official_table, c("Gain_Loss_Low", "Quarter"))
plt_quarter_summary_Gain_Loss_Low <- base_gain_loss_plot(
  quarter_summary_Gain_Loss_Low, "Quarter", "Gain_Loss_Low"
)
gain_loss_scatter(
  plt_quarter_summary_Gain_Loss_Low, "Quarter", "Gain_Loss_Low"
)

## Season ----

# Summary table for season by volume.
season_summary_ <- summarise_mean_volume(official_table, "Season")

# Gain_Loss_Open in each season.
season_summary_Gain_Loss_Open <-
  summarise_mean_volume(official_table, c("Gain_Loss_Open", "Season"))
plt_season_summary_Gain_Loss_Open <- base_gain_loss_plot(
  season_summary_Gain_Loss_Open, "Season", "Gain_Loss_Open"
)
gain_loss_scatter(
  plt_season_summary_Gain_Loss_Open, "Season", "Gain_Loss_Open"
)

# Gain_Loss_Close in each season.
season_summary_Gain_Loss_Close <-
  summarise_mean_volume(official_table, c("Gain_Loss_Close", "Season"))
plt_season_summary_Gain_Loss_Close <- base_gain_loss_plot(
  season_summary_Gain_Loss_Close, "Season", "Gain_Loss_Close"
)
gain_loss_scatter(
  plt_season_summary_Gain_Loss_Close, "Season", "Gain_Loss_Close"
)

# Gain_Loss_High in each season.
season_summary_Gain_Loss_High <-
  summarise_mean_volume(official_table, c("Gain_Loss_High", "Season"))
plt_season_summary_Gain_Loss_High <- base_gain_loss_plot(
  season_summary_Gain_Loss_High, "Season", "Gain_Loss_High"
)
gain_loss_scatter(
  plt_season_summary_Gain_Loss_High, "Season", "Gain_Loss_High"
)

# Gain_Loss_Low in each season.
season_summary_Gain_Loss_Low <-
  summarise_mean_volume(official_table, c("Gain_Loss_Low", "Season"))
plt_season_summary_Gain_Loss_Low <- base_gain_loss_plot(
  season_summary_Gain_Loss_Low, "Season", "Gain_Loss_Low"
)
gain_loss_scatter(
  plt_season_summary_Gain_Loss_Low, "Season", "Gain_Loss_Low"
)

# The bare `NA` expressions that used to end this section were removed: they
# computed nothing and only printed "[1] NA".
