# NOT RUN {
# Load the three example datasets used throughout this script in one call.
# NOTE(review): the datasets and the csu_* functions are not defined in this
# file; presumably the providing package must be attached first -- confirm.
data(data_individual_file, data_population_file, ICD_group_GLOBOCAN)
# Group the individual records by:
#   - 5-year age group
#   - ICD grouping taken from the ICD_group_GLOBOCAN data frame
#   - year, extracted from the date of incidence ("doi")
# in addition to the sex and registry columns listed in `group_by`.
df_data_year <- csu_group_cases(
  data_individual_file,
  var_age = "age",
  group_by = c("sex", "regcode", "reglabel"),
  df_ICD = ICD_group_GLOBOCAN,
  var_ICD = "site",
  var_year = "doi"
)
# Attach population counts to the 5-year age-grouped cases.
# The merge is done by sex (given explicitly) and by year (handled
# automatically by csu_merge_cases_pop).
df_data <- csu_merge_cases_pop(
  df_data_year,
  data_population_file,
  var_age = "age_group",
  var_cases = "cases",
  var_py = "pop",
  group_by = "sex"
)
# Compute the age-standardized rate (ASR) for each sex and cancer site.
# NOTE(review): missing_age = 19 presumably is the age-group code used for
# cases with unknown age -- confirm against the csu_asr documentation.
df_asr <- csu_asr(
  df_data,
  var_age = "age_group",
  var_cases = "cases",
  var_py = "pop",
  group_by = c("sex", "ICD_group", "LABEL"),
  missing_age = 19
)
# Drop the catch-all categories "Other" and "Other skin" in a single pass.
df_asr <- df_asr[df_asr$LABEL != "Other" & df_asr$LABEL != "Other skin", ]
# Male-only subset (sex coded as 1), used for the single-sided plot.
df_asr_M <- df_asr[df_asr[["sex"]] == 1, ]
# Single-sided bar plot: top 10 cancer sites among males, ranked by the
# number of cases. The value returned by csu_bar_top is kept in data1.
data1 <- csu_bar_top(
  df_asr_M,
  var_value = "cases",
  var_bar = "LABEL",
  nb_top = 10,
  plot_title = "Top 10 cancer sites",
  xtitle = "Number of cases",
  color = "#2c7bb6",
  digits = 0
)
# Double-sided bar plot, example 1: top 15 cancer sites by number of cases,
# with one side per sex (labelled "Male" / "Female", one color each).
data2 <- csu_bar_top(
  df_asr,
  var_value = "cases",
  var_bar = "LABEL",
  group_by = "sex",
  nb_top = 15,
  plot_title = "Top 15 cancer sites",
  xtitle = "Number of cases",
  label_by = c("Male", "Female"),
  color = c("#2c7bb6", "#b62ca1"),
  digits = 0
)
# Double-sided bar plot, example 2: top 10 cancer sites by age-standardized
# rate, with one side per sex and values shown with one decimal digit.
data3 <- csu_bar_top(
  df_asr,
  var_value = "asr",
  var_bar = "LABEL",
  group_by = "sex",
  nb_top = 10,
  plot_title = "Top 10 cancer sites",
  xtitle = "Age-standardized rate per 100,000",
  label_by = c("Male", "Female"),
  color = c("#2c7bb6", "#b62ca1"),
  digits = 1
)
# }
# Run the code above in your browser using DataLab