From a7ef50085610c394e55cda02e8bf517f81d0d8c7 Mon Sep 17 00:00:00 2001 From: lambda7xx Date: Thu, 8 Feb 2024 22:10:37 -0500 Subject: [PATCH] fix the header file --- deps/legion | 2 +- deps/nccl | 2 +- include/flexflow/ops/fused.h | 12 ++++++++++++ llama.sh | 1 + src/ops/fused.cu | 14 ++------------ 5 files changed, 17 insertions(+), 14 deletions(-) create mode 100644 llama.sh diff --git a/deps/legion b/deps/legion index 15b23cf0d..626b55689 160000 --- a/deps/legion +++ b/deps/legion @@ -1 +1 @@ -Subproject commit 15b23cf0d95f186297f05c76611ddd3e2cbbe9f9 +Subproject commit 626b55689c77848b246e1da19678c7ad58899f0c diff --git a/deps/nccl b/deps/nccl index 399656269..6e24ef4e1 160000 --- a/deps/nccl +++ b/deps/nccl @@ -1 +1 @@ -Subproject commit 399656269027c1818fc999ccf8ec4dd838cec50d +Subproject commit 6e24ef4e1f1eac9f104d115ef65429f179924ee7 diff --git a/include/flexflow/ops/fused.h b/include/flexflow/ops/fused.h index dd80cf2f0..af2f26a39 100644 --- a/include/flexflow/ops/fused.h +++ b/include/flexflow/ops/fused.h @@ -6,6 +6,18 @@ namespace FlexFlow { +// declare Legion names +using Legion::Context; +using Legion::coord_t; +using Legion::Domain; +using Legion::Future; +using Legion::LogicalPartition; +using Legion::LogicalRegion; +using Legion::Memory; +using Legion::PhysicalRegion; +using Legion::Runtime; +using Legion::Task; + class FusedOp; class FusedOpMeta { public: diff --git a/llama.sh b/llama.sh new file mode 100644 index 000000000..dd3beed71 --- /dev/null +++ b/llama.sh @@ -0,0 +1 @@ +./build/inference/incr_decoding/incr_decoding --ll:util 8 -ll:cpu 4 -ll:fsize 20000 -ll:zsize 30000 -llm-model meta-llama/Llama-2-7b-hf -cache-folder /home/xiaoxias/weights --fusion -ll:gpu 4 -prompt /home/xiaoxias/cudagraph/inference/prompt/chatgpt.json -tensor-parallelism-degree 4 > llama2.log 2>&1 diff --git a/src/ops/fused.cu b/src/ops/fused.cu index 88c301bae..488c9e00c 100644 --- a/src/ops/fused.cu +++ b/src/ops/fused.cu @@ -47,17 +47,6 @@ #include 
"flexflow/ffconst_utils.h" namespace FlexFlow { -// declare Legion names -using Legion::Context; -using Legion::coord_t; -using Legion::Domain; -using Legion::Future; -using Legion::LogicalPartition; -using Legion::LogicalRegion; -using Legion::Memory; -using Legion::PhysicalRegion; -using Legion::Runtime; -using Legion::Task; OpMeta *FusedOp::init_task(Task const *task, std::vector<PhysicalRegion> const &regions, @@ -1127,7 +1116,7 @@ __host__ void FusedOp::capture_graph(Task const *task, output_accessors_to_save.push_back(output_accessor[i + ooff]); } assert(task->index_point.get_dim() == 1); - int shard_id = task->index_point.point_data[0]; + shard_id = task->index_point.point_data[0]; FusedOp::save_inference_tensors_to_file(metas->meta[op], shard_id, bc, @@ -1176,6 +1165,7 @@ __host__ void bc->num_active_tokens(), bc->num_generation_tokens > 0); int scenario = 0; + int shard_id = task->index_point.point_data[0]; auto it = metas->graph_collections.find(graph_params); if(it != metas->graph_collections.end()) { instance = it->second;