• R/O
  • SSH

提交

标签
No Tags

Frequently used words (click to add to your profile)

java, c++, android, linux, c#, windows, objective-c, cocoa, 誰得, qt, python, php, ruby, game, gui, bathyscaphe, c, 計画中(planning stage), 翻訳, omegat, framework, twitter, dom, test, vb.net, directx, ゲームエンジン, btron, arduino, previewer

Commit MetaInfo

修订版: 171bb0230e69fb3df7af8ab5f22703244d890119 (tree)
时间: 2023-01-31 06:19:29
作者: Lorenzo Isella <lorenzo.isella@gmai...>
Committer: Lorenzo Isella

Log Message

I added the option to save/read the ESTAT downloaded data.

更改概述

差异

diff -r 570dc39f106f -r 171bb0230e69 R-codes/process_tam_RO.R
--- a/R-codes/process_tam_RO.R Sun Jan 29 21:39:00 2023 +0100
+++ b/R-codes/process_tam_RO.R Mon Jan 30 22:19:29 2023 +0100
@@ -21,10 +21,15 @@
2121 ## clean_names
2222
2323
24+read_estat <- 0
25+
2426 df_ro_ini <- read_csv("Copy_of_ExportTransparenta_20220919.csv") |>
2527 clean_names()
2628
29+repeated_entries <- df_ro_ini |>
30+ get_dupes_short()
2731
32+save_excel(repeated_entries, "repeated_entries_Romania.xlsx")
2833
2934 ## tam <- read_parquet("tam.parquet") |>
3035 ## slice(1:5)
@@ -63,7 +68,8 @@
6368
6469 df_ro_name <- df_ro |>
6570 rename_many(df_name$english,ini_names) |>
66- clean_data() |>
71+ clean_data( remove_duplicated_rows=F
72+ ) |>
6773 select(-national_identification_for_other_categories_foreign_undertakings) |>
6874 mutate(aid_award_granted_date=dmy(aid_award_granted_date)) |>
6975 mutate(year=year(aid_award_granted_date),
@@ -83,12 +89,21 @@
8389
8490
8591
86-
92+if (read_estat!=1){
8793
8894 all_rates_ini <- estat_retrieval(query) |>
8995 clean_names() |>
9096 select(time_period, obs_value) |>
9197 mutate(time_period=as.numeric(time_period))
98+ saveRDS(all_rates_ini, "all_rates.RDS")
99+
100+
101+
102+} else{
103+
104+all_rates_ini <- readRDS("all_rates.RDS")
105+
106+}
92107
93108
94109
@@ -166,6 +181,8 @@
166181 covid <- read_excel("SA-Covid19.xlsx") |>
167182 clean_names()
168183
184+nace <- readRDS("../nace_codes/df_nace.RDS") |>
185+ select(-code)
169186
170187 df.out <- df_temp |>
171188 rename("aid_award_instrument"="aid_award_instrument_other_english") |>
@@ -175,8 +192,16 @@
175192 granted_value_extended_eur=granted_aid_absolute_eur,
176193 is_covid_case=if_else(case_reference %in% covid$case_reference, "Yes", "No")) |>
177194 mutate(granted_value_extended_eur=if_else(is_covid_case=="No", granted_value_extended_eur, NA_real_)) |>
178- filter(year!=2022)
195+ filter(year!=2022) |>
196+ mutate(beneficiary_sector=if_else(nchar(beneficiary_sector)==3,
197+ paste("0", beneficiary_sector, sep=""), beneficiary_sector)) |>
198+ left_join(y=nace, by=c("beneficiary_sector"="code2")) |>
199+ mutate(beneficiary_sector=paste(beneficiary_sector, description,
200+ sep=" - ")) |>
201+ select(-description)
179202
203+## test <- df.out |>
204+## filter(is.na(description))
180205
181206
182207 save_excel(df.out, "romania_extra_tam.xlsx")