Skip to content

Commit e321062

Browse files
committed
fix
1 parent fa981e9 commit e321062

File tree

3 files changed

+12
-13
lines changed

3 files changed

+12
-13
lines changed

scripts/run_all_textgen_benchmark_breakdown.sh

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -9,12 +9,12 @@
99
./scripts/run_textgen_benchmark_breakdown.sh santacoder bigcode/gpt_bigcode-santacoder 256 2040 11 1
1010

1111
# Large model
12-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 1 8190 11 0
13-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 8 8190 11 0
14-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 32 8190 11 0
15-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 256 8190 11 0 # OOM?
12+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 1 8190 11 0
13+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 8 8190 11 0
14+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 32 8190 11 0
15+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 256 8190 11 0 # OOM?
1616

17-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 1 8190 29 1 1
18-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 8 8190 29 1 1
19-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 32 8190 29 1 1
20-
./scripts/run_textgen_benchmark_breakdown.sh large_model ./data/bigcode_large-model 256 8190 29 1 1 # OOM?
17+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 1 8190 29 1 1
18+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 8 8190 29 1 1
19+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 32 8190 29 1 1
20+
./scripts/run_textgen_benchmark_breakdown.sh starcoder ./data/bigcode_large-model 256 8190 29 1 1 # OOM?

scripts/run_textgen_benchmark_breakdown.sh

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -12,12 +12,11 @@ TOKEN_STEP=${5:-5}
1212
STEP_ID=${6:-""}
1313
CYCLES=${7:-10}
1414

15-
SAVE_DIR=data/benchmarks/v4
16-
#BATCH_SIZES="1 2 4 8 16 24 32 48 64 96 128 160 224 256"
15+
SAVE_DIR=data/benchmarks/v5
1716
RUN="python3 -m src.main --pipeline_class=TG_Pipeline --max_log_outputs=0 --dtype=float16 --device=cuda --custom_generate --breakdown_latency --ignore_oom --no_fast_init "
1817

1918

20-
IMPL=("flash" "causal" "vector" "bigcode" "bigcode2")
19+
IMPL=("flash" "causal" "vector" "bigcode" "bigcode2" "bigcode3")
2120

2221

2322
STEP=("" "--no_cache")
@@ -38,7 +37,7 @@ run () { # run(step, runtime, attn)
3837
fi
3938
}
4039

41-
for impl in {0..4}
40+
for impl in {0..5}
4241
do
4342
if [ "${STEP_ID}" -eq "0" ]
4443
then

src/pipeline.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -491,7 +491,7 @@ def __init__(self, **kwargs):
491491
if self.device != torch.device("cuda:0"):
492492
raise ValueError(f"Textgen does not support device {self.device}")
493493

494-
self.config = self.model.model.transformer.config
494+
self.config = getattr(self.model, "config", None) or self.model.model.transformer.config
495495

496496
def _get_config(
497497
self,

0 commit comments

Comments
 (0)