diff --git a/exercicios/para-casa/Rafaella-Fiel/tarefa.ipynb b/exercicios/para-casa/Rafaella-Fiel/tarefa.ipynb new file mode 100644 index 0000000..3a5aa5d --- /dev/null +++ b/exercicios/para-casa/Rafaella-Fiel/tarefa.ipynb @@ -0,0 +1,2379 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Importando as planilhas" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | customer_id | \n", + "customer_unique_id | \n", + "zip_code_prefix | \n", + "customer_city | \n", + "customer_state | \n", + "
---|---|---|---|---|---|
0 | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "861eff4711a542e4b93843c6dd7febb0 | \n", + "14409 | \n", + "franca | \n", + "SP | \n", + "
1 | \n", + "18955e83d337fd6b2def6b18a428ac77 | \n", + "290c77bc529b7ac935b93aa66c333dc3 | \n", + "9790 | \n", + "sao bernardo do campo | \n", + "SP | \n", + "
2 | \n", + "4e7b3e00288586ebd08712fdd0374a03 | \n", + "060e732b5b29e8181a18229c7b0b2b5e | \n", + "1151 | \n", + "sao paulo | \n", + "SP | \n", + "
3 | \n", + "b2b6027bc5c5109e529d4dc6358b12c3 | \n", + "259dac757896d24d7702b9acbbff3f3c | \n", + "8775 | \n", + "mogi das cruzes | \n", + "SP | \n", + "
4 | \n", + "4f2d8ab171c80ec8364f7c12e35b23ad | \n", + "345ecd01c38d18a9036ed96c73b8d066 | \n", + "13056 | \n", + "campinas | \n", + "SP | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
99436 | \n", + "17ddf5dd5d51696bb3d7c6291687be6f | \n", + "1a29b476fee25c95fbafc67c5ac95cf8 | \n", + "3937 | \n", + "sao paulo | \n", + "SP | \n", + "
99437 | \n", + "e7b71a9017aa05c9a7fd292d714858e8 | \n", + "d52a67c98be1cf6a5c84435bd38d095d | \n", + "6764 | \n", + "taboao da serra | \n", + "SP | \n", + "
99438 | \n", + "5e28dfe12db7fb50a4b2f691faecea5e | \n", + "e9f50caf99f032f0bf3c55141f019d99 | \n", + "60115 | \n", + "fortaleza | \n", + "CE | \n", + "
99439 | \n", + "56b18e2166679b8a959d72dd06da27f9 | \n", + "73c2643a0a458b49f58cea58833b192e | \n", + "92120 | \n", + "canoas | \n", + "RS | \n", + "
99440 | \n", + "274fa6071e5e17fe303b9748641082c8 | \n", + "84732c5050c01db9b23e19ba39899398 | \n", + "6703 | \n", + "cotia | \n", + "SP | \n", + "
99441 rows × 5 columns
\n", + "\n", + " | zip_code_prefix | \n", + "geolocation_lat | \n", + "geolocation_lng | \n", + "geolocation_city | \n", + "geolocation_state | \n", + "
---|---|---|---|---|---|
0 | \n", + "1037 | \n", + "-23.545621 | \n", + "-46.639292 | \n", + "sao paulo | \n", + "SP | \n", + "
1 | \n", + "1046 | \n", + "-23.546081 | \n", + "-46.644820 | \n", + "sao paulo | \n", + "SP | \n", + "
2 | \n", + "1046 | \n", + "-23.546129 | \n", + "-46.642951 | \n", + "sao paulo | \n", + "SP | \n", + "
3 | \n", + "1041 | \n", + "-23.544392 | \n", + "-46.639499 | \n", + "sao paulo | \n", + "SP | \n", + "
4 | \n", + "1035 | \n", + "-23.541578 | \n", + "-46.641607 | \n", + "sao paulo | \n", + "SP | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
1000158 | \n", + "99950 | \n", + "-28.068639 | \n", + "-52.010705 | \n", + "tapejara | \n", + "RS | \n", + "
1000159 | \n", + "99900 | \n", + "-27.877125 | \n", + "-52.224882 | \n", + "getulio vargas | \n", + "RS | \n", + "
1000160 | \n", + "99950 | \n", + "-28.071855 | \n", + "-52.014716 | \n", + "tapejara | \n", + "RS | \n", + "
1000161 | \n", + "99980 | \n", + "-28.388932 | \n", + "-51.846871 | \n", + "david canabarro | \n", + "RS | \n", + "
1000162 | \n", + "99950 | \n", + "-28.070104 | \n", + "-52.018658 | \n", + "tapejara | \n", + "RS | \n", + "
1000163 rows × 5 columns
\n", + "\n", + " | seller_id | \n", + "zip_code_prefix | \n", + "seller_city | \n", + "seller_state | \n", + "
---|---|---|---|---|
0 | \n", + "3442f8959a84dea7ee197c632cb2df15 | \n", + "13023 | \n", + "campinas | \n", + "SP | \n", + "
1 | \n", + "d1b65fc7debc3361ea86b5f14c68d2e2 | \n", + "13844 | \n", + "mogi guacu | \n", + "SP | \n", + "
2 | \n", + "ce3ad9de960102d0677a81f5d0bb7b2d | \n", + "20031 | \n", + "rio de janeiro | \n", + "RJ | \n", + "
3 | \n", + "c0f3eea2e14555b6faeea3dd58c1b1c3 | \n", + "4195 | \n", + "sao paulo | \n", + "SP | \n", + "
4 | \n", + "51a04a8a6bdcb23deccc82b0b80742cf | \n", + "12914 | \n", + "braganca paulista | \n", + "SP | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
3090 | \n", + "98dddbc4601dd4443ca174359b237166 | \n", + "87111 | \n", + "sarandi | \n", + "PR | \n", + "
3091 | \n", + "f8201cab383e484733266d1906e2fdfa | \n", + "88137 | \n", + "palhoca | \n", + "SC | \n", + "
3092 | \n", + "74871d19219c7d518d0090283e03c137 | \n", + "4650 | \n", + "sao paulo | \n", + "SP | \n", + "
3093 | \n", + "e603cf3fec55f8697c9059638d6c8eb5 | \n", + "96080 | \n", + "pelotas | \n", + "RS | \n", + "
3094 | \n", + "9e25199f6ef7e7c347120ff175652c3b | \n", + "12051 | \n", + "taubate | \n", + "SP | \n", + "
3095 rows × 4 columns
\n", + "\n", + " | customer_id | \n", + "zip_code_prefix | \n", + "customer_city | \n", + "customer_state | \n", + "
---|---|---|---|---|
0 | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "14409 | \n", + "franca | \n", + "SP | \n", + "
1 | \n", + "18955e83d337fd6b2def6b18a428ac77 | \n", + "9790 | \n", + "sao bernardo do campo | \n", + "SP | \n", + "
2 | \n", + "4e7b3e00288586ebd08712fdd0374a03 | \n", + "1151 | \n", + "sao paulo | \n", + "SP | \n", + "
3 | \n", + "b2b6027bc5c5109e529d4dc6358b12c3 | \n", + "8775 | \n", + "mogi das cruzes | \n", + "SP | \n", + "
4 | \n", + "4f2d8ab171c80ec8364f7c12e35b23ad | \n", + "13056 | \n", + "campinas | \n", + "SP | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
99436 | \n", + "17ddf5dd5d51696bb3d7c6291687be6f | \n", + "3937 | \n", + "sao paulo | \n", + "SP | \n", + "
99437 | \n", + "e7b71a9017aa05c9a7fd292d714858e8 | \n", + "6764 | \n", + "taboao da serra | \n", + "SP | \n", + "
99438 | \n", + "5e28dfe12db7fb50a4b2f691faecea5e | \n", + "60115 | \n", + "fortaleza | \n", + "CE | \n", + "
99439 | \n", + "56b18e2166679b8a959d72dd06da27f9 | \n", + "92120 | \n", + "canoas | \n", + "RS | \n", + "
99440 | \n", + "274fa6071e5e17fe303b9748641082c8 | \n", + "6703 | \n", + "cotia | \n", + "SP | \n", + "
99441 rows × 4 columns
\n", + "\n", + " | customer_id | \n", + "zip_code_prefix | \n", + "customer_city | \n", + "customer_state | \n", + "
---|---|---|---|---|
count | \n", + "99441 | \n", + "99441.000000 | \n", + "99441 | \n", + "99441 | \n", + "
unique | \n", + "99441 | \n", + "NaN | \n", + "4119 | \n", + "27 | \n", + "
top | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "NaN | \n", + "sao paulo | \n", + "SP | \n", + "
freq | \n", + "1 | \n", + "NaN | \n", + "15540 | \n", + "41746 | \n", + "
mean | \n", + "NaN | \n", + "35137.474583 | \n", + "NaN | \n", + "NaN | \n", + "
std | \n", + "NaN | \n", + "29797.938996 | \n", + "NaN | \n", + "NaN | \n", + "
min | \n", + "NaN | \n", + "1003.000000 | \n", + "NaN | \n", + "NaN | \n", + "
25% | \n", + "NaN | \n", + "11347.000000 | \n", + "NaN | \n", + "NaN | \n", + "
50% | \n", + "NaN | \n", + "24416.000000 | \n", + "NaN | \n", + "NaN | \n", + "
75% | \n", + "NaN | \n", + "58900.000000 | \n", + "NaN | \n", + "NaN | \n", + "
max | \n", + "NaN | \n", + "99990.000000 | \n", + "NaN | \n", + "NaN | \n", + "
\n", + " | zip_code_prefix | \n", + "geolocation_lat | \n", + "geolocation_lng | \n", + "geolocation_city | \n", + "geolocation_state | \n", + "
---|---|---|---|---|---|
count | \n", + "1.000163e+06 | \n", + "1.000163e+06 | \n", + "1.000163e+06 | \n", + "1000163 | \n", + "1000163 | \n", + "
unique | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "8011 | \n", + "27 | \n", + "
top | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "sao paulo | \n", + "SP | \n", + "
freq | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "135800 | \n", + "404268 | \n", + "
mean | \n", + "3.657417e+04 | \n", + "-2.117615e+01 | \n", + "-4.639054e+01 | \n", + "NaN | \n", + "NaN | \n", + "
std | \n", + "3.054934e+04 | \n", + "5.715866e+00 | \n", + "4.269748e+00 | \n", + "NaN | \n", + "NaN | \n", + "
min | \n", + "1.001000e+03 | \n", + "-3.660537e+01 | \n", + "-1.014668e+02 | \n", + "NaN | \n", + "NaN | \n", + "
25% | \n", + "1.107500e+04 | \n", + "-2.360355e+01 | \n", + "-4.857317e+01 | \n", + "NaN | \n", + "NaN | \n", + "
50% | \n", + "2.653000e+04 | \n", + "-2.291938e+01 | \n", + "-4.663788e+01 | \n", + "NaN | \n", + "NaN | \n", + "
75% | \n", + "6.350400e+04 | \n", + "-1.997962e+01 | \n", + "-4.376771e+01 | \n", + "NaN | \n", + "NaN | \n", + "
max | \n", + "9.999000e+04 | \n", + "4.506593e+01 | \n", + "1.211054e+02 | \n", + "NaN | \n", + "NaN | \n", + "
\n", + " | seller_id | \n", + "zip_code_prefix | \n", + "seller_city | \n", + "seller_state | \n", + "
---|---|---|---|---|
count | \n", + "3095 | \n", + "3095.000000 | \n", + "3095 | \n", + "3095 | \n", + "
unique | \n", + "3095 | \n", + "NaN | \n", + "611 | \n", + "23 | \n", + "
top | \n", + "3442f8959a84dea7ee197c632cb2df15 | \n", + "NaN | \n", + "sao paulo | \n", + "SP | \n", + "
freq | \n", + "1 | \n", + "NaN | \n", + "694 | \n", + "1849 | \n", + "
mean | \n", + "NaN | \n", + "32291.059451 | \n", + "NaN | \n", + "NaN | \n", + "
std | \n", + "NaN | \n", + "32713.453830 | \n", + "NaN | \n", + "NaN | \n", + "
min | \n", + "NaN | \n", + "1001.000000 | \n", + "NaN | \n", + "NaN | \n", + "
25% | \n", + "NaN | \n", + "7093.500000 | \n", + "NaN | \n", + "NaN | \n", + "
50% | \n", + "NaN | \n", + "14940.000000 | \n", + "NaN | \n", + "NaN | \n", + "
75% | \n", + "NaN | \n", + "64552.500000 | \n", + "NaN | \n", + "NaN | \n", + "
max | \n", + "NaN | \n", + "99730.000000 | \n", + "NaN | \n", + "NaN | \n", + "
\n", + " | customer_id | \n", + "zip_code_prefix | \n", + "customer_city | \n", + "customer_state | \n", + "geolocation_lat | \n", + "geolocation_lng | \n", + "geolocation_city | \n", + "geolocation_state | \n", + "
---|---|---|---|---|---|---|---|---|
0 | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "14409 | \n", + "franca | \n", + "SP | \n", + "-20.509897 | \n", + "-47.397866 | \n", + "franca | \n", + "SP | \n", + "
1 | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "14409 | \n", + "franca | \n", + "SP | \n", + "-20.497396 | \n", + "-47.399241 | \n", + "franca | \n", + "SP | \n", + "
2 | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "14409 | \n", + "franca | \n", + "SP | \n", + "-20.510459 | \n", + "-47.399553 | \n", + "franca | \n", + "SP | \n", + "
3 | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "14409 | \n", + "franca | \n", + "SP | \n", + "-20.480940 | \n", + "-47.394161 | \n", + "franca | \n", + "SP | \n", + "
4 | \n", + "06b8999e2fba1a1fbc88172c00ba8bc7 | \n", + "14409 | \n", + "franca | \n", + "SP | \n", + "-20.515413 | \n", + "-47.398194 | \n", + "franca | \n", + "SP | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
15083450 | \n", + "d9110683c7a282144e9fc97660026a28 | \n", + "74980 | \n", + "aparecida de goiania | \n", + "GO | \n", + "-16.821866 | \n", + "-49.244027 | \n", + "aparecida de goiania | \n", + "GO | \n", + "
15083451 | \n", + "d9110683c7a282144e9fc97660026a28 | \n", + "74980 | \n", + "aparecida de goiania | \n", + "GO | \n", + "-16.821866 | \n", + "-49.244027 | \n", + "aparecida de goiania | \n", + "GO | \n", + "
15083452 | \n", + "d9110683c7a282144e9fc97660026a28 | \n", + "74980 | \n", + "aparecida de goiania | \n", + "GO | \n", + "-16.822945 | \n", + "-49.244615 | \n", + "aparecida de goiania | \n", + "GO | \n", + "
15083453 | \n", + "6fb4f2354f36e554ac80141e9128f528 | \n", + "99043 | \n", + "passo fundo | \n", + "RS | \n", + "-28.226596 | \n", + "-52.467505 | \n", + "passo fundo | \n", + "RS | \n", + "
15083454 | \n", + "6fb4f2354f36e554ac80141e9128f528 | \n", + "99043 | \n", + "passo fundo | \n", + "RS | \n", + "-28.226596 | \n", + "-52.467505 | \n", + "passo fundo | \n", + "RS | \n", + "
15083455 rows × 8 columns
\n", + "\n", + " | customer_id | \n", + "zip_code_prefix | \n", + "customer_city | \n", + "customer_state | \n", + "geolocation_lat | \n", + "geolocation_lng | \n", + "geolocation_city | \n", + "geolocation_state | \n", + "seller_id | \n", + "seller_city | \n", + "seller_state | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "4f2d8ab171c80ec8364f7c12e35b23ad | \n", + "13056 | \n", + "campinas | \n", + "SP | \n", + "-22.987222 | \n", + "-47.151073 | \n", + "campinas | \n", + "SP | \n", + "8d46553a36e68f95350a200c12f8f2e2 | \n", + "campinas | \n", + "SP | \n", + "
1 | \n", + "4f2d8ab171c80ec8364f7c12e35b23ad | \n", + "13056 | \n", + "campinas | \n", + "SP | \n", + "-22.964194 | \n", + "-47.146534 | \n", + "campinas | \n", + "SP | \n", + "8d46553a36e68f95350a200c12f8f2e2 | \n", + "campinas | \n", + "SP | \n", + "
2 | \n", + "4f2d8ab171c80ec8364f7c12e35b23ad | \n", + "13056 | \n", + "campinas | \n", + "SP | \n", + "-22.961982 | \n", + "-47.146298 | \n", + "campinas | \n", + "SP | \n", + "8d46553a36e68f95350a200c12f8f2e2 | \n", + "campinas | \n", + "SP | \n", + "
3 | \n", + "4f2d8ab171c80ec8364f7c12e35b23ad | \n", + "13056 | \n", + "campinas | \n", + "SP | \n", + "-22.968059 | \n", + "-47.147139 | \n", + "campinas | \n", + "SP | \n", + "8d46553a36e68f95350a200c12f8f2e2 | \n", + "campinas | \n", + "SP | \n", + "
4 | \n", + "4f2d8ab171c80ec8364f7c12e35b23ad | \n", + "13056 | \n", + "campinas | \n", + "SP | \n", + "-22.977905 | \n", + "-47.145693 | \n", + "campinas | \n", + "SP | \n", + "8d46553a36e68f95350a200c12f8f2e2 | \n", + "campinas | \n", + "SP | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
11492510 | \n", + "7fb62e47282b83f023cf1fef8d8309c9 | \n", + "4319 | \n", + "sao paulo | \n", + "SP | \n", + "-23.646627 | \n", + "-46.638771 | \n", + "sao paulo | \n", + "SP | \n", + "ab91571efab27993ff2f6b36e38055c3 | \n", + "sao paulo | \n", + "SP | \n", + "
11492511 | \n", + "7fb62e47282b83f023cf1fef8d8309c9 | \n", + "4319 | \n", + "sao paulo | \n", + "SP | \n", + "-23.647430 | \n", + "-46.636954 | \n", + "sao paulo | \n", + "SP | \n", + "ab91571efab27993ff2f6b36e38055c3 | \n", + "sao paulo | \n", + "SP | \n", + "
11492512 | \n", + "7fb62e47282b83f023cf1fef8d8309c9 | \n", + "4319 | \n", + "sao paulo | \n", + "SP | \n", + "-23.647765 | \n", + "-46.635971 | \n", + "sao paulo | \n", + "SP | \n", + "ab91571efab27993ff2f6b36e38055c3 | \n", + "sao paulo | \n", + "SP | \n", + "
11492513 | \n", + "7fb62e47282b83f023cf1fef8d8309c9 | \n", + "4319 | \n", + "sao paulo | \n", + "SP | \n", + "-23.647430 | \n", + "-46.636954 | \n", + "sao paulo | \n", + "SP | \n", + "ab91571efab27993ff2f6b36e38055c3 | \n", + "sao paulo | \n", + "SP | \n", + "
11492514 | \n", + "7fb62e47282b83f023cf1fef8d8309c9 | \n", + "4319 | \n", + "sao paulo | \n", + "SP | \n", + "-23.647471 | \n", + "-46.636862 | \n", + "são paulo | \n", + "SP | \n", + "ab91571efab27993ff2f6b36e38055c3 | \n", + "sao paulo | \n", + "SP | \n", + "
11492515 rows × 11 columns
\n", + "\n", + " | customer_id | \n", + "
---|---|
zip_code_prefix | \n", + "\n", + " |
22790 | \n", + "142 | \n", + "
22793 | \n", + "121 | \n", + "
22775 | \n", + "110 | \n", + "
29101 | \n", + "101 | \n", + "
13212 | \n", + "95 | \n", + "
... | \n", + "... | \n", + "
87230 | \n", + "1 | \n", + "
6696 | \n", + "1 | \n", + "
6513 | \n", + "1 | \n", + "
6506 | \n", + "1 | \n", + "
99730 | \n", + "1 | \n", + "
2160 rows × 1 columns
\n", + "