-
Notifications
You must be signed in to change notification settings - Fork 10
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Implement fully parallel upload processing
This adds another variant to the `PARALLEL_PROCESSING` feature/rollout flag which prefers the parallel upload processing pipeline in favor of running it as an experiment. Upload Processing can run in essentially 4 modes: - Completely serial processing - Serial processing, but running "experiment" code (`EXPERIMENT_SERIAL`): - In this mode, the final (`is_final`) `UploadProcessor` task saves a copy of the final report for later verification. - Parallel processing, but running "experiment" code (`EXPERIMENT_PARALLEL`): - In this mode, another parallel set of `UploadProcessor` tasks runs *after* the main set up tasks. - These tasks are not persisting any of their results in the database, instead the final `UploadFinisher` task will launch the `ParallelVerification` task. - Fully parallel processing (`PARALLEL`): - In this mode, the final `UploadFinisher` task is responsible for merging the final report and persisting it. An example Task chain might look like this, in "experiment" mode: - Upload - UploadProcessor - UploadProcessor - UploadProcessor (`EXPERIMENT_SERIAL` (the final one)) - UploadFinisher - UploadProcessor (`EXPERIMENT_PARALLEL`) - UploadProcessor (`EXPERIMENT_PARALLEL`) - UploadProcessor (`EXPERIMENT_PARALLEL`) - UploadFinisher (`EXPERIMENT_PARALLEL`) - ParallelVerification The `PARALLEL` mode looks like this: - Upload - UploadProcessor (`PARALLEL`) - UploadProcessor (`PARALLEL`) - UploadProcessor (`PARALLEL`) - UploadFinisher (`PARALLEL`)
- Loading branch information
Showing
7 changed files
with
322 additions
and
156 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,96 @@ | ||
from __future__ import annotations | ||
|
||
from enum import Enum | ||
|
||
from rollouts import PARALLEL_UPLOAD_PROCESSING_BY_REPO | ||
|
||
""" | ||
This encapsulates Parallel Upload Processing logic | ||
Upload Processing can run in essentially 4 modes: | ||
- Completely serial processing | ||
- Serial processing, but running "experiment" code (`EXPERIMENT_SERIAL`): | ||
- In this mode, the final (`is_final`) `UploadProcessor` task saves a copy | ||
of the final report for later verification. | ||
- Parallel processing, but running "experiment" code (`EXPERIMENT_PARALLEL`): | ||
- In this mode, another parallel set of `UploadProcessor` tasks runs *after* | ||
the main set up tasks. | ||
- These tasks are not persisting any of their results in the database, | ||
instead the final `UploadFinisher` task will launch the `ParallelVerification` task. | ||
- Fully parallel processing (`PARALLEL`): | ||
- In this mode, the final `UploadFinisher` task is responsible for merging | ||
the final report and persisting it. | ||
An example Task chain might look like this, in "experiment" mode: | ||
- Upload | ||
- UploadProcessor | ||
- UploadProcessor | ||
- UploadProcessor (`EXPERIMENT_SERIAL` (the final one)) | ||
- UploadFinisher | ||
- UploadProcessor (`EXPERIMENT_PARALLEL`) | ||
- UploadProcessor (`EXPERIMENT_PARALLEL`) | ||
- UploadProcessor (`EXPERIMENT_PARALLEL`) | ||
- UploadFinisher (`EXPERIMENT_PARALLEL`) | ||
- ParallelVerification | ||
The `PARALLEL` mode looks like this: | ||
- Upload | ||
- UploadProcessor (`PARALLEL`) | ||
- UploadProcessor (`PARALLEL`) | ||
- UploadProcessor (`PARALLEL`) | ||
- UploadFinisher (`PARALLEL`) | ||
""" | ||
|
||
|
||
class ParallelFeature(Enum): | ||
SERIAL = "serial" | ||
EXPERIMENT = "experiment" | ||
PARALLEL = "parallel" | ||
|
||
@classmethod | ||
def load(cls, repoid: int) -> ParallelFeature: | ||
feature = PARALLEL_UPLOAD_PROCESSING_BY_REPO.check_value( | ||
identifier=repoid, default="serial" | ||
) | ||
|
||
if feature == "experiment" or feature is True: | ||
return ParallelFeature.EXPERIMENT | ||
if feature == "parallel": | ||
return ParallelFeature.PARALLEL | ||
return ParallelFeature.SERIAL | ||
|
||
|
||
class ParallelProcessing(Enum): | ||
SERIAL = "serial" | ||
EXPERIMENT_SERIAL = "experiment-serial" | ||
EXPERIMENT_PARALLEL = "experiment-parallel" | ||
PARALLEL = "parallel" | ||
|
||
@property | ||
def is_parallel(self) -> bool: | ||
return ( | ||
self is ParallelProcessing.EXPERIMENT_PARALLEL | ||
or self is ParallelProcessing.PARALLEL | ||
) | ||
|
||
@classmethod | ||
def from_task_args( | ||
cls, | ||
repoid: int, | ||
in_parallel: bool = False, | ||
is_final: bool = False, | ||
**kwargs, | ||
) -> ParallelProcessing: | ||
feature = ParallelFeature.load(repoid) | ||
|
||
if feature is ParallelFeature.SERIAL: | ||
return ParallelProcessing.SERIAL | ||
if feature is ParallelFeature.PARALLEL: | ||
return ParallelProcessing.PARALLEL | ||
|
||
if in_parallel: | ||
return ParallelProcessing.EXPERIMENT_PARALLEL | ||
if is_final: | ||
return ParallelProcessing.EXPERIMENT_SERIAL | ||
return ParallelProcessing.SERIAL |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.