Skip to content

Commit

Permalink
add the graphcapture
Browse files Browse the repository at this point in the history
  • Loading branch information
lambda7xx committed Feb 3, 2024
1 parent 1043f1d commit 57a86d1
Show file tree
Hide file tree
Showing 5 changed files with 502 additions and 493 deletions.
1 change: 1 addition & 0 deletions include/flexflow/ops/fused.h
Original file line number Diff line number Diff line change
Expand Up @@ -101,6 +101,7 @@ class FusedOp : public Op {
Op *operators[MAX_NUM_FUSED_OPERATORS];
FusedOpMeta fused_meta[MAX_NUM_WORKERS];
int numOperators;
bool graphCaptured;
};

}; // namespace FlexFlow
Expand Down
2 changes: 2 additions & 0 deletions profile.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
# Profile the FlexFlow incremental-decoding binary under NVIDIA Nsight Systems.
# Tracing covers CUDA, NVTX, OS runtime, cuDNN and cuBLAS (-t) with CPU sampling (-s cpu);
# the report is written to TP4B4newLegion-lambda (-o) with -f true set.
# The workload runs meta-llama/Llama-2-7b-hf on 4 GPUs with tensor-parallelism degree 4 and --fusion.
# NOTE: Realm/Legion runtime flags use a single leading dash, so the utility-processor
# count is passed as `-ll:util` (previously `--ll:util`, unlike the other -ll: flags here).
# NOTE(review): the cache folder is a user-specific absolute path — adjust for your machine.
nsys profile -w true -t cuda,nvtx,osrt,cudnn,cublas -s cpu -o TP4B4newLegion-lambda -f true -x true \
./inference/incr_decoding/incr_decoding -ll:util 8 -ll:cpu 4 -ll:fsize 20000 -ll:zsize 30000 -llm-model meta-llama/Llama-2-7b-hf -cache-folder /home/xiaoxias/weights --fusion -ll:gpu 4 -prompt ../inference/prompt/chatgpt.json -tensor-parallelism-degree 4
3 changes: 3 additions & 0 deletions run.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@


# Run the Hugging Face model download helper for meta-llama/Llama-2-7b-hf,
# using /home/xiaoxias/weights as the cache folder.
# NOTE(review): the cache folder is a user-specific absolute path — adjust for your machine.
python3 ./inference/utils/download_hf_model.py \
  meta-llama/Llama-2-7b-hf \
  --cache-folder /home/xiaoxias/weights
1 change: 1 addition & 0 deletions src/ops/fused.cc
Original file line number Diff line number Diff line change
Expand Up @@ -53,6 +53,7 @@ FusedOp::FusedOp(FFModel &model, Op *op)
0 /*weights*/,
0 /*outputs*/) {
numInputs = 0;
graphCaptured = false;
for (int i = 0; i < op->numInputs; i++) {
bool found = false;
// we also need to check region duplicate for the first op in a fused op
Expand Down
Loading

0 comments on commit 57a86d1

Please sign in to comment.