Revisión | fc61ccc61df4069e9df1def452aa45aef27b70ec (tree) |
---|---|
Tiempo | 2024-07-19 22:58:04 |
Autor | Lorenzo Isella <lorenzo.isella@gmai...> |
Committer | Lorenzo Isella |
I fixed a bug (the jobs in English were being saved twice: the non-English output also contained the English jobs!).
@@ -5,12 +5,12 @@ | ||
5 | 5 | source("/home/lorenzo/myprojects-hg/R-codes/stat_lib.R") |
6 | 6 | |
7 | 7 | |
8 | -from_scratch <- 0 | |
8 | +from_scratch <- 1 | |
9 | 9 | |
10 | -df_jobs <- read_csv("wi_dataset.csv") | |
10 | +df_jobs <- read_csv("../input/wi_dataset.csv") | |
11 | 11 | |
12 | 12 | |
13 | -labels <- read_csv("wi_labels.csv") | |
13 | +labels <- read_csv("../input/wi_labels.csv") | |
14 | 14 | |
15 | 15 | jobs <- df_jobs |> |
16 | 16 | pull(description) |
@@ -37,23 +37,23 @@ | ||
37 | 37 | } |
38 | 38 | |
39 | 39 | |
40 | -saveRDS(job_language, "job_language_list.RDS") | |
40 | +saveRDS(job_language, "../output/job_language_list.RDS") | |
41 | 41 | } else { |
42 | 42 | |
43 | - job_language <- readRDS("job_language_list.RDS") | |
43 | + job_language <- readRDS("../output/job_language_list.RDS") | |
44 | 44 | } |
45 | 45 | |
46 | 46 | df_jobs_en <- df_jobs |> |
47 | 47 | filter(job_language=="en") |
48 | 48 | |
49 | -saveRDS(df_jobs_en, "jobs_in_english.RDS") | |
49 | +saveRDS(df_jobs_en, "../output/jobs_in_english.RDS") | |
50 | 50 | |
51 | 51 | |
52 | 52 | df_jobs_non_en <- df_jobs |> |
53 | - filter(job_language=="en") | |
53 | + filter(job_language!="en") | |
54 | 54 | |
55 | 55 | |
56 | -saveRDS(df_jobs_non_en, "jobs_not_in_english.RDS") | |
56 | +saveRDS(df_jobs_non_en, "../output/jobs_not_in_english.RDS") | |
57 | 57 | |
58 | 58 | |
59 | 59 |