Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
68 commits
Select commit Hold shift + click to select a range
8688fe8
Updated links.
massaoHigaskino Oct 12, 2019
d6953a9
Merge branch 'master' of https://github.com/massaoHigaskino/DSWP
massaoHigaskino Oct 12, 2019
6ba9ce5
Testing relative pathing
massaoHigaskino Oct 12, 2019
b83b91f
Changed Material folder references to relative paths.
massaoHigaskino Oct 12, 2019
547ce3d
Testing Dataframes relative pathing.
massaoHigaskino Oct 12, 2019
fb93975
Changed Material folder references to relative paths.
massaoHigaskino Oct 12, 2019
1b8af5b
Reverted Notebook changes
massaoHigaskino Oct 12, 2019
ef8252d
Edited gitignore
massaoHigaskino Oct 12, 2019
7975679
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 12, 2019
4123b50
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 12, 2019
19369ec
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 12, 2019
a06c37c
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 12, 2019
c11bc3f
Laboratory 01
massaoHigaskino Oct 12, 2019
66d49b3
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
8081002
Merge branch 'master' into 2019_10_12_lecture
massaoHigaskino Oct 19, 2019
8b7628d
Revert "Merge branch 'master' into 2019_10_12_lecture"
massaoHigaskino Oct 19, 2019
f8ba896
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
3a92504
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 19, 2019
32a8eb5
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
cf187c6
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 19, 2019
a5d5df4
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
a200e4f
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 19, 2019
b1b99e5
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
debe4bb
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 19, 2019
1eda87c
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
d0808fc
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 19, 2019
76b70eb
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
493f62e
Merge remote-tracking branch 'origin/2019_10_19_lecture' into 2019_10…
massaoHigaskino Oct 19, 2019
69cfa77
Revert "Merge remote-tracking branch 'origin/2019_10_19_lecture' into…
massaoHigaskino Oct 19, 2019
aa77202
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
1d13655
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 19, 2019
9fd341b
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 19, 2019
63ef44d
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 19, 2019
5b61494
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 25, 2019
99cef86
Merge branch 'master' into 2019_10_19_lecture
massaoHigaskino Oct 25, 2019
2f8fd3d
Fixed some issues. Loaded first exercise.
massaoHigaskino Oct 25, 2019
10857e7
Solved exercise 1
massaoHigaskino Oct 25, 2019
d71dbd3
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 26, 2019
56d9921
Merge
massaoHigaskino Oct 26, 2019
c9a7925
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 26, 2019
b339b7a
Merge
massaoHigaskino Oct 26, 2019
ad1549a
Merge remote-tracking branch 'upstream/master' into 2019_10_26_lecture
massaoHigaskino Oct 26, 2019
b713af2
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 26, 2019
41568e0
Revert "Merge remote-tracking branch 'upstream/master' into 2019_10_2…
massaoHigaskino Oct 26, 2019
dab397a
Merge branch 'master' into 2019_10_26_lecture
massaoHigaskino Oct 26, 2019
dedfe27
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 26, 2019
345aeb1
Merge branch 'master' into 2019_10_26_lecture
massaoHigaskino Oct 26, 2019
82b57c5
Iris exercise.
massaoHigaskino Oct 26, 2019
5529d0f
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Oct 26, 2019
fc8acdf
Merge
massaoHigaskino Oct 26, 2019
dcfdba5
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Nov 6, 2019
b8ccfcb
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Nov 9, 2019
534f0c9
Merge branch 'master' into lectures/2019_11_10
massaoHigaskino Nov 9, 2019
162b4f7
Prepared datasets for DB import
massaoHigaskino Nov 9, 2019
d5d1fd7
Added files working with postgresql.
massaoHigaskino Nov 9, 2019
9a9b355
Merge branch 'master' into lectures/2019_10_12
massaoHigaskino Nov 9, 2019
220d33e
Merge branch 'master' into lectures/2019_10_19
massaoHigaskino Nov 9, 2019
34722da
Merge branch 'master' into lectures/2019_10_26
massaoHigaskino Nov 9, 2019
ed54532
Merge branch 'lectures/2019_10_12'
massaoHigaskino Nov 9, 2019
d8e132e
Merge branch 'lectures/2019_10_19'
massaoHigaskino Nov 9, 2019
6242be2
Merge branch 'lectures/2019_10_26'
massaoHigaskino Nov 9, 2019
20c6ea3
Added some scripts to create views to prepare to application.
massaoHigaskino Nov 9, 2019
aee76c3
Merge branch 'master' into lectures/2019_11_09
massaoHigaskino Nov 9, 2019
008feb7
Merge branch 'lectures/2019_11_09'
massaoHigaskino Nov 9, 2019
5144f70
Merge branch 'master' into upstream/master
massaoHigaskino Nov 16, 2019
2202770
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Nov 16, 2019
fd3c3b0
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Nov 16, 2019
c111a93
Merge remote-tracking branch 'upstream/master'
massaoHigaskino Apr 27, 2020
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -102,3 +102,6 @@ venv.bak/

# mypy
.mypy_cache/

# Jetbrains IDEs
.idea/
30,001 changes: 30,001 additions & 0 deletions Dataframes/Viagem_test.csv

Large diffs are not rendered by default.

50,001 changes: 50,001 additions & 0 deletions Dataframes/Viagem_train.csv

Large diffs are not rendered by default.

1 change: 1 addition & 0 deletions Dataframes/adult.data
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
age, workclass, fnlwgt, education, education-num, marital-status, occupation, relationship, race, sex, capital-gain, capital-loss, hours-per-week, native-country, target
39, State-gov, 77516, Bachelors, 13, Never-married, Adm-clerical, Not-in-family, White, Male, 2174, 0, 40, United-States, <=50K
50, Self-emp-not-inc, 83311, Bachelors, 13, Married-civ-spouse, Exec-managerial, Husband, White, Male, 0, 0, 13, United-States, <=50K
38, Private, 215646, HS-grad, 9, Divorced, Handlers-cleaners, Not-in-family, White, Male, 0, 0, 40, United-States, <=50K
Expand Down
1 change: 1 addition & 0 deletions Dataframes/adult.test
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
|1x3 Cross validator
age, workclass, fnlwgt, education, education-num, marital-status, occupation, relationship, race, sex, capital-gain, capital-loss, hours-per-week, native-country, target
25, Private, 226802, 11th, 7, Never-married, Machine-op-inspct, Own-child, Black, Male, 0, 0, 40, United-States, <=50K.
38, Private, 89814, HS-grad, 9, Married-civ-spouse, Farming-fishing, Husband, White, Male, 0, 0, 50, United-States, <=50K.
28, Local-gov, 336951, Assoc-acdm, 12, Married-civ-spouse, Protective-serv, Husband, White, Male, 0, 0, 40, United-States, >50K.
Expand Down
16,283 changes: 16,283 additions & 0 deletions Dataframes/adult2.test

Large diffs are not rendered by default.

59 changes: 59 additions & 0 deletions Execution/adult_50k/adult_50k.sql
Original file line number Diff line number Diff line change
@@ -0,0 +1,59 @@
-- Ad-hoc sanity checks. The first three queries read from the banking_aws
-- schema; the last one dumps adult_50k.adult_data.

-- Row count of banking_aws.t_50k_adult_data.
select count(*)
from banking_aws.t_50k_adult_data;

-- Non-null occurrences of each job value.
select
    bank.job,
    count(bank.job)
from banking_aws.banking_aws as bank
group by bank.job;

-- Non-null occurrences of each marital value.
select
    bank.marital,
    count(bank.marital)
from banking_aws.banking_aws as bank
group by bank.marital;

-- Full dump of the adult_data table for eyeballing.
select *
from adult_50k.adult_data;

-- Strip leading/trailing spaces from every text column of adult_test.
-- There is no WHERE clause: every row of the table is rewritten.
-- Two columns are still addressed by their hyphenated names here, so this
-- statement has to run before those columns are renamed.
-- NOTE(review): presumably needed because the imported CSV has a space
-- after each comma -- confirm against the import step.
update adult_50k.adult_test
set
    workclass        = btrim(workclass),
    education        = btrim(education),
    "marital-status" = btrim("marital-status"),
    occupation       = btrim(occupation),
    relationship     = btrim(relationship),
    race             = btrim(race),
    sex              = btrim(sex),
    "native-country" = btrim("native-country"),
    target           = btrim(target);

-- Replace the hyphenated column names of adult_test with snake_case names
-- so they can be referenced without double quotes.
-- Each rename is its own statement.
alter table adult_50k.adult_test
    rename column "education-num" to education_num;

alter table adult_50k.adult_test
    rename column "marital-status" to marital_status;

alter table adult_50k.adult_test
    rename column "capital-gain" to capital_gain;

alter table adult_50k.adult_test
    rename column "capital-loss" to capital_loss;

alter table adult_50k.adult_test
    rename column "hours-per-week" to hours_per_week;

alter table adult_50k.adult_test
    rename column "native-country" to native_country;




-- Profiling queries for adult_50k.adult_data: total row count, then the
-- number of non-null occurrences of each value per categorical column.
select count(*)
from adult_50k.adult_data;

select
    ad.workclass,
    count(ad.workclass)
from adult_50k.adult_data as ad
group by ad.workclass;

select
    ad.education,
    count(ad.education)
from adult_50k.adult_data as ad
group by ad.education;

select
    ad.marital_status,
    count(ad.marital_status)
from adult_50k.adult_data as ad
group by ad.marital_status;

select
    ad.occupation,
    count(ad.occupation)
from adult_50k.adult_data as ad
group by ad.occupation;

select
    ad.relationship,
    count(ad.relationship)
from adult_50k.adult_data as ad
group by ad.relationship;

select
    ad.race,
    count(ad.race)
from adult_50k.adult_data as ad
group by ad.race;

select
    ad.sex,
    count(ad.sex)
from adult_50k.adult_data as ad
group by ad.sex;

select
    ad.native_country,
    count(ad.native_country)
from adult_50k.adult_data as ad
group by ad.native_country;

-- Give both tables an auto-numbered surrogate key named id, declared as
-- the primary key.
alter table adult_50k.adult_data
    add column id serial primary key;

alter table adult_50k.adult_test
    add column id serial primary key;

32,562 changes: 32,562 additions & 0 deletions Execution/adult_50k/datascience_adult_50k_adult_data.csv

Large diffs are not rendered by default.

16,282 changes: 16,282 additions & 0 deletions Execution/adult_50k/datascience_adult_50k_adult_test.csv

Large diffs are not rendered by default.

55 changes: 55 additions & 0 deletions Execution/adult_50k/t1_views.sql
Original file line number Diff line number Diff line change
@@ -0,0 +1,55 @@


-- Binary label view for the training table: one row per adult_data row,
-- with target = 1 when the income label is '>50K' and 0 otherwise
-- (a NULL label also maps to 0).
-- The label is normalised before the comparison (surrounding spaces and
-- any trailing period removed) so a value such as ' >50K' or '>50K.' is
-- still recognised instead of silently becoming 0.
drop view if exists adult_50k.v_t1_adult_data_target;

create view adult_50k.v_t1_adult_data_target as
select
    id,
    case
        when rtrim(trim(target), '.') = '>50K' then 1
        else 0
    end as target
from adult_50k.adult_data;

-- Feature view for the training table: id plus every column of adult_data
-- except the target label.
drop view if exists adult_50k.v_t1_adult_data_dataset;

create view adult_50k.v_t1_adult_data_dataset as
select
    src.id,
    src.age,
    src.workclass,
    src.fnlwgt,
    src.education,
    src.education_num,
    src.marital_status,
    src.occupation,
    src.relationship,
    src.race,
    src.sex,
    src.capital_gain,
    src.capital_loss,
    src.hours_per_week,
    src.native_country
from adult_50k.adult_data as src;


-- Binary label view for the test table: one row per adult_test row, with
-- target = 1 when the income label is '>50K' and 0 otherwise (a NULL label
-- also maps to 0).
-- The labels in the adult.test file end with a period ('<=50K.', '>50K.'),
-- so an exact comparison with '>50K' never matches and every row would be
-- labelled 0. Surrounding spaces and the trailing period are stripped
-- before comparing.
drop view if exists adult_50k.v_t1_adult_test_target;

create view adult_50k.v_t1_adult_test_target as
select
    id,
    case
        when rtrim(trim(target), '.') = '>50K' then 1
        else 0
    end as target
from adult_50k.adult_test;

-- Feature view for the test table: id plus every column of adult_test
-- except the target label.
drop view if exists adult_50k.v_t1_adult_test_dataset;

create view adult_50k.v_t1_adult_test_dataset as
select
    src.id,
    src.age,
    src.workclass,
    src.fnlwgt,
    src.education,
    src.education_num,
    src.marital_status,
    src.occupation,
    src.relationship,
    src.race,
    src.sex,
    src.capital_gain,
    src.capital_loss,
    src.hours_per_week,
    src.native_country
from adult_50k.adult_test as src;
Binary file added Material/Test_Data Scientist_eDreams ODIGEO.pdf
Binary file not shown.
Loading