From b561ae73ad9ab1facd626dd44acd63448f67218e Mon Sep 17 00:00:00 2001 From: Daniel Young Date: Tue, 2 Apr 2024 09:39:33 -0700 Subject: [PATCH 1/4] Linted some more of project. Ignore ESP file. Clean redundancy in CI script --- .github/workflows/eluc.yml | 2 +- use_cases/eluc/.pylintrc | 8 ++++++-- use_cases/eluc/README.md | 2 +- use_cases/eluc/data/conversion.py | 4 +++- use_cases/eluc/prescriptors/nsga2/nsga2_utils.py | 2 +- .../eluc/prescriptors/nsga2/torch_prescriptor.py | 16 ++++++++-------- use_cases/eluc/tests/test_nsga2.py | 4 ++-- 7 files changed, 22 insertions(+), 16 deletions(-) diff --git a/.github/workflows/eluc.yml b/.github/workflows/eluc.yml index d5a9ec1..1e6241a 100644 --- a/.github/workflows/eluc.yml +++ b/.github/workflows/eluc.yml @@ -30,7 +30,7 @@ jobs: pip install pylint if [ -f requirements.txt ]; then pip install -r requirements.txt; fi - name: Lint with PyLint - run: pylint --ignore="demo" --recursive=y --fail-under=9 ./* + run: pylint ./* - name: Run unit tests run: python -m unittest diff --git a/use_cases/eluc/.pylintrc b/use_cases/eluc/.pylintrc index 036fe36..b65f941 100644 --- a/use_cases/eluc/.pylintrc +++ b/use_cases/eluc/.pylintrc @@ -1,5 +1,9 @@ [MASTER] -ignore=demo +ignore=demo, prescriptors/esp + +recursive=y + +fail-under=9.0 jobs=0 @@ -7,4 +11,4 @@ max-line-length=120 suggestion-mode=yes -good-names=X_train, X_val, X_test, y_train, y_val, y_test, X, Y, y, X_test_scaled \ No newline at end of file +good-names=X_train, X_val, X_test, y_train, y_val, y_test, X, Y, y, X_test_scaled, df, da, ds, i, n \ No newline at end of file diff --git a/use_cases/eluc/README.md b/use_cases/eluc/README.md index b334648..c19d9d6 100644 --- a/use_cases/eluc/README.md +++ b/use_cases/eluc/README.md @@ -23,7 +23,7 @@ BLUE simulations with committed emissions could be used to estimate the long-ter "Committed emissions" means all the emissions that are caused by a land-use change event are attributed to the year of the event. BLUE (bookkeeping of land use emissions) is a bookkeeping model that attributes carbon fluxes to land use activities. -See [BLUE: Bookkeeping of land use emissions](https://doi.org/10.1002/2014GB004997) for more details. +See [BLUE: Bookkeeping of Land Use Emissions](https://doi.org/10.1002/2014GB004997) for more details. ### LUC diff --git a/use_cases/eluc/data/conversion.py b/use_cases/eluc/data/conversion.py index f71e099..efe1e72 100644 --- a/use_cases/eluc/data/conversion.py +++ b/use_cases/eluc/data/conversion.py @@ -58,6 +58,8 @@ def construct_countries_df(): for i in range(len(countries_df)): old_abbrev = countries_df.iloc[i]["abbrevs"] if old_abbrev in MANUAL_MAP and MANUAL_MAP[old_abbrev] in codes_df["Numeric code"].unique(): - countries_df.iloc[i]["abbrevs"] = codes_df[codes_df["Numeric code"] == MANUAL_MAP[old_abbrev]]["Alpha-2 code"].iloc[0] + numeric_code = codes_df["Numeric code"] + old_abbrev = MANUAL_MAP[old_abbrev] + countries_df.iloc[i]["abbrevs"] = codes_df[numeric_code == old_abbrev]["Alpha-2 code"].iloc[0] return countries_df \ No newline at end of file diff --git a/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py b/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py index 7f39cc8..72f92c6 100644 --- a/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py +++ b/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py @@ -64,7 +64,7 @@ def calculate_crowding_distance(front): n_objectives = len(front[0].metrics) distances = [0 for _ in range(len(front))] for m in range(n_objectives): - front.sort(key=lambda c: c.metrics[m]) + front.sort(key=lambda cand: cand.metrics[m]) obj_min = front[0].metrics[m] obj_max = front[-1].metrics[m] distances[0] = float('inf') diff --git a/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py b/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py index 5b06b62..cf0ed81 100644 --- a/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py +++ b/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py @@ -32,7 +32,7 @@ def __init__(self, batch_size: int, candidate_params: dict, seed_dir=None): - + self.candidate_params = candidate_params self.pop_size = pop_size self.n_generations = n_generations @@ -149,7 +149,7 @@ def _select_parents(self, candidates: list[Candidate], n_parents: int) -> list[C for candidate, distance in zip(front, crowding_distance): candidate.distance = distance if len(parents) + len(front) > n_parents: # If adding this front exceeds num_parents - front = sorted(front, key=lambda c: c.distance, reverse=True) + front = sorted(front, key=lambda cand: cand.distance, reverse=True) parents += front[:n_parents - len(parents)] break parents += front @@ -169,7 +169,7 @@ def _make_new_pop(self, parents: list[Candidate], pop_size: int, gen:int) -> lis Makes new population by creating children from parents. We use tournament selection to select parents for crossover. """ - sorted_parents = sorted(parents, key=lambda c: (c.rank, -c.distance)) + sorted_parents = sorted(parents, key=lambda cand: (cand.rank, -cand.distance)) children = [] for i in range(pop_size): parent1, parent2 = self._tournament_selection(sorted_parents) @@ -226,15 +226,15 @@ def _record_gen_results(self, gen: int, candidates: list[Candidate], save_path: Save the pareto front to disk. """ # Save statistics of candidates - gen_results = [c.record_state() for c in candidates] + gen_results = [cand.record_state() for cand in candidates] gen_results_df = pd.DataFrame(gen_results) gen_results_df.to_csv(save_path / f"{gen}.csv", index=False) # Save rank 1 candidate state dicts (save_path / f"{gen}").mkdir(parents=True, exist_ok=True) - pareto_candidates = [c for c in candidates if c.rank == 1] - for c in pareto_candidates: - torch.save(c.state_dict(), save_path / f"{gen}" / f"{c.gen}_{c.cand_id}.pt") + pareto_candidates = [cand for cand in candidates if cand.rank == 1] + for cand in pareto_candidates: + torch.save(cand.state_dict(), save_path / f"{gen}" / f"{cand.gen}_{cand.cand_id}.pt") def _record_candidate_avgs(self, gen: int, candidates: list[Candidate]) -> dict: """ @@ -242,7 +242,7 @@ def _record_candidate_avgs(self, gen: int, candidates: list[Candidate]) -> dict: """ avg_eluc = np.mean([c.metrics[0] for c in candidates]) avg_change = np.mean([c.metrics[1] for c in candidates]) - return {"gen": gen, "eluc": avg_eluc, "change": avg_change} + return {"gen": gen, "eluc": avg_eluc, "change": avg_change} def prescribe_land_use(self, context_df: pd.DataFrame, **kwargs) -> pd.DataFrame: """ diff --git a/use_cases/eluc/tests/test_nsga2.py b/use_cases/eluc/tests/test_nsga2.py index 4e965ff..6dcfb20 100644 --- a/use_cases/eluc/tests/test_nsga2.py +++ b/use_cases/eluc/tests/test_nsga2.py @@ -21,7 +21,7 @@ def get_fields(df): Dummy fields method to create the encoder for dummy data. """ fields_df = df[constants.CAO_MAPPING["context"] + constants.CAO_MAPPING["actions"] + ["ELUC"]].astype("float64") - fields = dict() + fields = {} for col in constants.CAO_MAPPING["context"] + constants.CAO_MAPPING["actions"] + ["ELUC"]: # Set range of land and diff land uses manually to their true ranges because they # do not need to be scaled @@ -52,7 +52,7 @@ def get_fields(df): "valued": "CONTINUOUS" } - return fields + return fields class TestTorchPrescriptor(unittest.TestCase): """ From 91d774cbdff880808595def1cfd35fa8ce65801b Mon Sep 17 00:00:00 2001 From: Daniel Young Date: Tue, 14 May 2024 09:50:36 -0700 Subject: [PATCH 2/4] changed cand to candidate, ignore md files in pylint --- use_cases/eluc/.pylintrc | 2 ++ use_cases/eluc/prescriptors/nsga2/candidate.py | 2 +- use_cases/eluc/prescriptors/nsga2/nsga2_utils.py | 2 +- .../eluc/prescriptors/nsga2/torch_prescriptor.py | 12 ++++++------ 4 files changed, 10 insertions(+), 8 deletions(-) diff --git a/use_cases/eluc/.pylintrc b/use_cases/eluc/.pylintrc index b65f941..d10bd76 100644 --- a/use_cases/eluc/.pylintrc +++ b/use_cases/eluc/.pylintrc @@ -1,6 +1,8 @@ [MASTER] ignore=demo, prescriptors/esp +ignore-patterns=*.md + recursive=y fail-under=9.0 diff --git a/use_cases/eluc/prescriptors/nsga2/candidate.py b/use_cases/eluc/prescriptors/nsga2/candidate.py index aaa6035..43fec5b 100644 --- a/use_cases/eluc/prescriptors/nsga2/candidate.py +++ b/use_cases/eluc/prescriptors/nsga2/candidate.py @@ -43,7 +43,7 @@ def __init__(self, in_size: int, hidden_size: int, out_size: int, self.parents = parents @classmethod - def from_crossover(cls, parent1, parent2, p_mutation: float, gen: int, cand_id: int): + def from_crossover(cls, parent1, parent2, p_mutation: float, gen: int, cand_id: int) -> "Candidate": """ Crossover two parents to create a child. Take a random 50/50 choice of either parent's weights diff --git a/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py b/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py index 72f92c6..0340294 100644 --- a/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py +++ b/use_cases/eluc/prescriptors/nsga2/nsga2_utils.py @@ -64,7 +64,7 @@ def calculate_crowding_distance(front): n_objectives = len(front[0].metrics) distances = [0 for _ in range(len(front))] for m in range(n_objectives): - front.sort(key=lambda cand: cand.metrics[m]) + front.sort(key=lambda candidate: candidate.metrics[m]) obj_min = front[0].metrics[m] obj_max = front[-1].metrics[m] distances[0] = float('inf') diff --git a/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py b/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py index cf0ed81..5a32874 100644 --- a/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py +++ b/use_cases/eluc/prescriptors/nsga2/torch_prescriptor.py @@ -149,7 +149,7 @@ def _select_parents(self, candidates: list[Candidate], n_parents: int) -> list[C for candidate, distance in zip(front, crowding_distance): candidate.distance = distance if len(parents) + len(front) > n_parents: # If adding this front exceeds num_parents - front = sorted(front, key=lambda cand: cand.distance, reverse=True) + front = sorted(front, key=lambda candidate: candidate.distance, reverse=True) parents += front[:n_parents - len(parents)] break parents += front @@ -169,7 +169,7 @@ def _make_new_pop(self, parents: list[Candidate], pop_size: int, gen:int) -> lis Makes new population by creating children from parents. We use tournament selection to select parents for crossover. """ - sorted_parents = sorted(parents, key=lambda cand: (cand.rank, -cand.distance)) + sorted_parents = sorted(parents, key=lambda candidate: (candidate.rank, -candidate.distance)) children = [] for i in range(pop_size): parent1, parent2 = self._tournament_selection(sorted_parents) @@ -226,15 +226,15 @@ def _record_gen_results(self, gen: int, candidates: list[Candidate], save_path: Save the pareto front to disk. """ # Save statistics of candidates - gen_results = [cand.record_state() for cand in candidates] + gen_results = [candidate.record_state() for candidate in candidates] gen_results_df = pd.DataFrame(gen_results) gen_results_df.to_csv(save_path / f"{gen}.csv", index=False) # Save rank 1 candidate state dicts (save_path / f"{gen}").mkdir(parents=True, exist_ok=True) - pareto_candidates = [cand for cand in candidates if cand.rank == 1] - for cand in pareto_candidates: - torch.save(cand.state_dict(), save_path / f"{gen}" / f"{cand.gen}_{cand.cand_id}.pt") + pareto_candidates = [candidate for candidate in candidates if candidate.rank == 1] + for candidate in pareto_candidates: + torch.save(candidate.state_dict(), save_path / f"{gen}" / f"{candidate.gen}_{candidate.cand_id}.pt") def _record_candidate_avgs(self, gen: int, candidates: list[Candidate]) -> dict: """ From 6a70c0c58a0f5e2ed808fda33cd50f7c08c7567b Mon Sep 17 00:00:00 2001 From: Daniel Young Date: Tue, 14 May 2024 10:14:15 -0700 Subject: [PATCH 3/4] Fixed requirements so that wcwidth will not error --- use_cases/eluc/requirements.txt | 1 + 1 file changed, 1 insertion(+) diff --git a/use_cases/eluc/requirements.txt b/use_cases/eluc/requirements.txt index 5f5e9b3..ade7bf8 100644 --- a/use_cases/eluc/requirements.txt +++ b/use_cases/eluc/requirements.txt @@ -171,6 +171,7 @@ traitlets==5.9.0 transformers==4.31.0 typing_extensions==4.6.2 uri-template==1.2.0 +wcwidth==0.2.13 webcolors==1.13 webencodings==0.5.1 websocket-client==1.5.3 From 7d7434ad17bf371b51ee4d97ebbf0db96c88d5ee Mon Sep 17 00:00:00 2001 From: Daniel Young Date: Tue, 14 May 2024 10:34:01 -0700 Subject: [PATCH 4/4] Ignore readme for some reason --- use_cases/eluc/.pylintrc | 2 -- 1 file changed, 2 deletions(-) diff --git a/use_cases/eluc/.pylintrc b/use_cases/eluc/.pylintrc index d10bd76..b65f941 100644 --- a/use_cases/eluc/.pylintrc +++ b/use_cases/eluc/.pylintrc @@ -1,8 +1,6 @@ [MASTER] ignore=demo, prescriptors/esp -ignore-patterns=*.md - recursive=y fail-under=9.0