# simulations_with_percents.R

# Step 1 - load the BAR implementation to be tested (only needed when it is
#          not already defined in the workspace)
# Step 2 - load the time and data generating functions (see data_for_trials)

setwd("/Users/khaglich/Desktop/Edited REU Main/Variations_of_bars")
source("baar.R")

setwd("/Users/khaglich/Desktop/Edited REU Main")
source("data_for_trials.R")

# Step 3 - configuration for the simulation
# Lines tagged "edit here !!!" are the ones expected to change between
# experiments.
data_fun <- test_data_0_a # edit here !!! (function that generates the draws)
title <- "Current Test Data" # edit here !!! (title for graphing)
runs <- 9 # number of BAR runs performed by simulation()
iterations <- 2000 # forwarded to current_bar on every run
# edit here !!! (which version of bars is being run)
# NOTE(review): the original remark here read "barA - think that's ol";
# confirm which variant `baar` corresponds to.
current_bar <- baar
save_name <- "TestList.RData" # edit here !!! (format: "bar#_data#.RData")
make <- 0.3 # forwarded unchanged to current_bar
percent <- 0.03 # forwarded unchanged to current_bar
# number of columns needed for Proposed/AcceptedSteps (either 3 or 4);
# simulation() reads this value from the global environment
col_num <- 3
lambda <- 1 # forwarded unchanged to current_bar

#Step 4 - run simulation

# Runs `current_bar` on `runs` freshly generated data sets and pools the output.
#
# Arguments:
#   data_fun    - zero-argument function; every call must return one data set.
#                 Column 1 is used as the regressor and column 2 as the
#                 response, both for the Bai-Perron fit and for `current_bar`.
#   runs        - number of independent runs; 0 yields the empty containers.
#   iterations  - forwarded to `current_bar`; also the row count of the empty
#                 MSE / BIC / Breakpoints / NumBkpts tables.
#   current_bar - function called as
#                 current_bar(starting_breakpoints, x, y, iterations,
#                             make, percent, lambda).
#                 It must return a list with the elements AcceptRate,
#                 ProposedSteps, AcceptedSteps, MSE, BIC, Breakpoints and
#                 NumBkpts.
#   make, percent, lambda - forwarded unchanged to `current_bar`.
#
# Returns:
#   A named list with AcceptRate (values concatenated across runs),
#   ProposedSteps and AcceptedSteps (row-bound across runs), and MSE, BIC,
#   Breakpoints and NumBkpts (column-bound across runs).
#
# Note: the width of the empty ProposedSteps/AcceptedSteps tables is read from
# the variable `col_num`, which is not a parameter and therefore has to exist
# in an enclosing (normally the global) environment.
simulation <- function(data_fun, runs, iterations, current_bar, make, percent, lambda){

  #initializing storage for returns from all BAR runs
  current_list = list()
  current_list[[1]] = list() #AcceptRate
  current_list[[2]] = data.frame(matrix(ncol=col_num, nrow=0)) #ProposedSteps
  current_list[[3]] = data.frame(matrix(ncol=col_num, nrow=0)) #AcceptedSteps
  current_list[[4]] = data.frame(matrix(ncol=0, nrow=iterations)) #MSE
  current_list[[5]] = data.frame(matrix(ncol=0, nrow=iterations)) #BIC
  current_list[[6]] = data.frame(matrix(ncol=0, nrow=iterations)) #Breakpoints
  current_list[[7]] = data.frame(matrix(ncol=0, nrow=iterations)) #NumBkpts
  names(current_list) = c("AcceptRate", "ProposedSteps", "AcceptedSteps", "MSE", "BIC", "Breakpoints", "NumBkpts")

  #breakpoints() used below for the initial points (Bai-Perron test) comes from
  #strucchange; the package is attached here exactly as before
  library("strucchange")

  #running BAR the specified number of times and storing the results
  #seq_len() makes runs = 0 skip the loop; 1:runs would iterate over 1 and 0
  for(i in seq_len(runs)){

    current_data = data_fun()
    break_p = breakpoints(current_data[,2] ~ current_data[,1], breaks = 5, h = 0.1)
    starting_breakpoints = break_p$breakpoints
    current_result = current_bar(starting_breakpoints, current_data[,1], current_data[,2], iterations, make, percent, lambda)

    #`$` on an atomic vector fails with "$ operator is invalid for atomic
    #vectors"; report which run produced the unusable value instead
    if(!is.list(current_result)){
      stop("current_bar must return a list with elements AcceptRate, ProposedSteps, ",
           "AcceptedSteps, MSE, BIC, Breakpoints and NumBkpts; run ", i,
           " returned an object of class '", class(current_result)[1], "'",
           call. = FALSE)
    }

    #the argument expressions below are kept verbatim on purpose: the column
    #labels of the pooled tables can be derived from them
    current_list[[1]] = c(current_list[[1]], current_result$AcceptRate[[1]], recursive = TRUE)
    current_list[[2]] = rbind(current_list[[2]], current_result$ProposedSteps)
    current_list[[3]] = rbind(current_list[[3]], current_result$AcceptedSteps)
    current_list[[4]] = cbind(current_list[[4]], current_result$MSE)
    current_list[[5]] = cbind(current_list[[5]], current_result$BIC)
    current_list[[6]] = cbind(current_list[[6]], current_result$Breakpoints)
    current_list[[7]] = cbind(current_list[[7]], current_result$NumBkpts)

  }

  #returning results of all BAR runs
  return(current_list)
}

sim_list = simulation(data_fun, runs, iterations, current_bar, make, percent, lambda)

#Step 5 - clean up and define final version of $Breakpoints from simulation results
#
#sim_list[[6]] holds the breakpoint columns of all runs side by side. A run
#that contributed a single column arrives with an auto-generated label; it is
#renamed to "X1" so that every run starts with a column whose name ends in "X1".

colnames(sim_list[[6]]) <- gsub(x = colnames(sim_list[[6]]), pattern = "all_k_best...c..1...ncol.all_k_best...", replacement = "X1")

split_num = NULL #column indices (after the first) at which a new run starts
final_list = list() #one entry per run

bkpt_ncol = ncol(sim_list[[6]])

if(bkpt_ncol > 0){

	#detecting where to split up columns in $Breakpoint object; column 1 always
	#opens the first run, so only later columns count as split points
	split_num = which(endsWith(colnames(sim_list[[6]]), "X1"))
	split_num = split_num[split_num > 1]

	#first and last column of every run; this also covers one run (no split
	#point) and two runs (one split point), where an if/else chain keyed on
	#the position in split_num would fail or drop the final run
	run_first = c(1, split_num)
	run_last = c(split_num - 1, bkpt_ncol)

	#splitting up columns in $Breakpoint object; a run with a single column is
	#deliberately left to collapse to a plain vector (default drop behaviour)
	final_list = lapply(seq_along(run_first), function(k){
		sim_list[[6]][,run_first[k]:run_last[k]]
	})

}

sim_list[[6]] = final_list #saving final version of $Breakpoint object

#Step 6 - saving the final list, make sure working directory goes to correct folder

saveRDS(sim_list, file=save_name) #edit name here !!!

#sim_list = readRDS() #to load an existing RDS

#Step 7 - graphing

#which_run = 1 #which run you want to plot

#plotting the MSE
#plot(sim_list$MSE[,which_run], ylab = "MSE" , xlab = "time", main = title)

#setup for plotting histograms 
#x.label = "Location of Breakpoint" #label setup

#frequency of breakpoints 
#if(is.atomic(sim_list$Breakpoints[[which_run]]) == TRUE) {
#	hist(sim_list$Breakpoints[[which_run]], xlab = x.label, main = title, col="red", breaks=max(time), xlim=c(0,max(time))) 
#}else if(dim(sim_list$Breakpoints[[which_run]])[2] >= 2) {
#	column_list = NULL
#	for(i in 1:dim(sim_list$Breakpoints[[which_run]])[2]){
#		column_list = c(column_list, sim_list$Breakpoints[[which_run]][,i], recursive=TRUE)
#	}
#	hist(column_list, xlab = x.label, main = title, col="red", breaks=max(time), xlim=c(0,max(time))) 
#}