Click the see the code
# importing necessary packages
library(tidyverse)
library(readxl)
library(readr)
library(gridExtra)
library(dplyr)
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx")
population names(population) <- c('IDD','city','regionid','regions','totalpop','male','female','age04','age59','age1014','age1519','age2024','age2529','age3034','age3539','age4044','otherage','unknowns','doctorate','primaryedu','elementaryedu','highschool','literatebutnoschool','notliterate','middleschool','master','university','fertilityrate','electricity','numberofattempts','housingsalesnumbers')
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx", sheet = "Bolge26")
region26 names(region26) <- c('region','region2id','workforce15plus','workforce1564','usableincome')
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx")
migration <- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx")
population names(population) <- c('IDD','city','regionid','regions','totalpop','male','female','age04','age59','age1014','age1519','age2024','age2529','age3034','age3539','age4044','otherage','unknowns','doctorate','primaryedu','elementaryedu','highschool','literatebutnoschool','notliterate','middleschool','master','university','fertilityrate','electricity','numberofattempts','housingsalesnumbers')
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx", sheet = "Bolge26")
region26 names(region26) <- c('region','region2id','workforce15plus','workforce1564','usableincome')
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx", sheet = "Goc Bilgileri")
migration
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx")
population names(population) <- c('IDD','city','regionid','regions','totalpop','male','female','age04','age59','age1014','age1519','age2024','age2529','age3034','age3539','age4044','otherage','unknowns','doctorate','primaryedu','elementaryedu','highschool','literatebutnoschool','notliterate','middleschool','master','university','fertilityrate','electricity','numberofattempts','housingsalesnumbers')
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx", sheet = "Bolge26")
region26 names(region26) <- c('region','region2id','workforce15plus','workforce1564','usableincome')
<- read_excel("C:\\Users\\melike\\desktop\\DataVizards_FinalDataFrame.xlsx", sheet = "Goc Bilgileri")
migration
names(migration) <- c('IDD','male2','female2','turnbackfamily','unknowns2','betterlifecond','others','education','retirement','buyhome','familymig','finjob','maritalstatuschange','health','appointment','age04_2','age59_2','age1014_2','age1519_2','age2024_2','age2529_2','age3034_2','age3539_2','age4044_2','university2','highschool2','middleschool2', 'elementaryschool2')
# tidy migration dataset
$city <- population$city
migration$regions <- population$regions
migration
<- migration |> pivot_longer(c(male2,female2),names_to = "gender2",values_to = "gender_value2")
tidy_data_gender
<- tidy_data_gender |> pivot_longer(c(turnbackfamily,unknowns2,betterlifecond,others,education,
tidy_data_causes names_to = "migrationcauses",values_to = "migrationcauses_value")
retirement,buyhome,familymig,finjob,maritalstatuschange,health,appointment),
<- tidy_data_causes |> pivot_longer(c(age04_2,age59_2,age1014_2,age1519_2,
tidy_data_age names_to = "agerange2",values_to = "agerange_value2")
age2024_2,age2529_2,age3034_2,age3539_2,age4044_2),
<- tidy_data_age |> pivot_longer(c(university2,highschool2,middleschool2,elementaryschool2),names_to = "education2",values_to = "education_value2")
last_migration_tidy_data head(last_migration_tidy_data)
# A tibble: 6 × 11
IDD city regions gender2 gender_value2 migrationcauses
<dbl> <chr> <chr> <chr> <dbl> <chr>
1 1 Adana Akdeniz Bölgesi male2 25200 turnbackfamily
2 1 Adana Akdeniz Bölgesi male2 25200 turnbackfamily
3 1 Adana Akdeniz Bölgesi male2 25200 turnbackfamily
4 1 Adana Akdeniz Bölgesi male2 25200 turnbackfamily
5 1 Adana Akdeniz Bölgesi male2 25200 turnbackfamily
6 1 Adana Akdeniz Bölgesi male2 25200 turnbackfamily
# ℹ 5 more variables: migrationcauses_value <dbl>, agerange2 <chr>,
# agerange_value2 <dbl>, education2 <chr>, education_value2 <dbl>
Click the see the code
# tidy region26 dataset
<- region26 |> pivot_longer(c(workforce15plus,workforce1564),names_to = "workforce",values_to = "workforce_values")
tidy_region26 head(tidy_region26)
# A tibble: 6 × 5
region region2id usableincome workforce workforce_values
<chr> <chr> <dbl> <chr> <dbl>
1 Adana, Mersin TR62 0.382 workforce1… 1579
2 Adana, Mersin TR62 0.382 workforce1… 1528
3 Ağrı, Kars, Iğdır, Ardahan TRA2 0.381 workforce1… 383
4 Ağrı, Kars, Iğdır, Ardahan TRA2 0.381 workforce1… 369
5 Ankara TR51 0.353 workforce1… 2341
6 Ankara TR51 0.353 workforce1… 2308
Click the see the code
# tidy population dataset
<- population |> pivot_longer(c(male,female),names_to = "gender",values_to = "gender_value")
tidy_data_gender2
<- tidy_data_gender2 |> pivot_longer(c(age04,age59,age1014,age1519,
tidy_data_age names_to = "agerange",values_to = "agerange_value")
age2024,age2529,age3034,age3539,age4044,otherage),
<- tidy_data_age |> pivot_longer(c(unknowns,literatebutnoschool,notliterate),names_to = "literate",values_to = "literate_values")
tidy_literate
<- tidy_literate|> pivot_longer(c(university,highschool,middleschool,elementaryedu,doctorate,primaryedu,master),names_to = "education",values_to = "education_value")
last_tidy_data_education2
<- last_tidy_data_education2 |> pivot_longer(c(fertilityrate,electricity,numberofattempts,housingsalesnumbers),names_to = "othervariables",values_to = "othervariables_value")
last_population_tidy_data head(last_population_tidy_data)
# A tibble: 6 × 15
IDD city regionid regions totalpop gender gender_value agerange
<dbl> <chr> <chr> <chr> <dbl> <chr> <dbl> <chr>
1 1 Adana A Akdeniz Bölgesi 2263373 male 1130862 age04
2 1 Adana A Akdeniz Bölgesi 2263373 male 1130862 age04
3 1 Adana A Akdeniz Bölgesi 2263373 male 1130862 age04
4 1 Adana A Akdeniz Bölgesi 2263373 male 1130862 age04
5 1 Adana A Akdeniz Bölgesi 2263373 male 1130862 age04
6 1 Adana A Akdeniz Bölgesi 2263373 male 1130862 age04
# ℹ 7 more variables: agerange_value <dbl>, literate <chr>,
# literate_values <dbl>, education <chr>, education_value <dbl>,
# othervariables <chr>, othervariables_value <dbl>
Click the see the code
$`region2id`<- ""
populationfor (i in 1:nrow(population)) {
<- population$city[i]
city
for (j in 1:length(region26$region)) {
if (grepl(city, region26$region[j])) {
$`region2id`[i] <- paste(region26$`region2id`[j])
populationbreak
}
} }