Skip to content

Commit c29cebf

Browse files
authored
Deprecate model_api examples (#2999)
Signed-off-by: Superjomn <[email protected]>
1 parent 11f9ecb commit c29cebf

File tree

8 files changed: 0 additions and 340 deletions.

examples/model_api/README.md

-67
This file was deleted.

examples/model_api/llama.py

-67
This file was deleted.

examples/model_api/llama_multi_gpu.py

-97
This file was deleted.

examples/model_api/llama_quantize.py

-77
This file was deleted.

tests/integration/defs/test_e2e.py

-27
Original file line number | Diff line number | Diff line change
@@ -1223,22 +1223,6 @@ def test_openai_multinodes_chat_tp8pp2(llm_root, llm_venv):
12231223
])
12241224

12251225

1226-
@pytest.mark.skip_less_device_memory(40000)
1227-
def test_model_api_examples(llm_root, llm_venv, engine_dir):
1228-
example_root = Path(llm_root) / "examples" / "model_api"
1229-
llm_venv.run_cmd([
1230-
str(example_root / "llama.py"), "--engine_dir",
1231-
f"{engine_dir}/model_api", "--hf_model_dir",
1232-
f"{llm_models_root()}/llama-models/llama-7b-hf"
1233-
])
1234-
1235-
llm_venv.run_cmd([
1236-
str(example_root / "llama_quantize.py"), "--cache_dir",
1237-
f"{engine_dir}/model_api_quantized", "--hf_model_dir",
1238-
f"{llm_models_root()}/llama-models/llama-7b-hf"
1239-
])
1240-
1241-
12421226
def test_build_time_benchmark_sanity(llm_root, llm_venv):
12431227
temp = tempfile.TemporaryDirectory()
12441228
llm_venv.run_cmd([
@@ -1248,17 +1232,6 @@ def test_build_time_benchmark_sanity(llm_root, llm_venv):
12481232
])
12491233

12501234

1251-
@pytest.mark.skip_less_device(2)
1252-
@pytest.mark.skip_less_device_memory(40000)
1253-
def test_model_api_examples_tp2(llm_root, llm_venv, engine_dir):
1254-
example_root = Path(llm_root) / "examples" / "model_api"
1255-
llm_venv.run_cmd([
1256-
str(example_root / "llama_multi_gpu.py"), "--engine_dir",
1257-
f"{engine_dir}/model_api_tp2", "--hf_model_dir",
1258-
f"{llm_models_root()}/llama-models/llama-7b-hf"
1259-
])
1260-
1261-
12621235
### LLMAPI examples
12631236
def _run_llmapi_example(llm_root, engine_dir, llm_venv, script_name: str,
12641237
*args):

tests/integration/test_lists/test-db/l0_a10.yml

-1
Original file line number | Diff line number | Diff line change
@@ -125,7 +125,6 @@ l0_a10:
125125
- test_e2e.py::test_benchmark_sanity[t5_base]
126126
- examples/test_openai.py::test_llm_openai_triton_1gpu
127127
- examples/test_openai.py::test_llm_openai_triton_plugingen_1gpu
128-
- test_e2e.py::test_model_api_examples # check with Tao can we remove it
129128
- test_e2e.py::test_build_time_benchmark_sanity
130129
- examples/test_whisper.py::test_llm_whisper_general[large-v3-enable_gemm_plugin-enable_attention_plugin-disable_weight_only-float16-nb:1-use_python_runtime]
131130
- examples/test_whisper.py::test_llm_whisper_general[large-v3-disable_gemm_plugin-enable_attention_plugin-disable_weight_only-float16-nb:1-use_python_runtime] # 4 mins

tests/integration/test_lists/test-db/l0_h100.yml

-1
Original file line number | Diff line number | Diff line change
@@ -152,5 +152,4 @@ l0_h100:
152152
- test_e2e.py::test_benchmark_sanity_enable_fp8[llama_7b] # 55.77s H100 only
153153
- test_e2e.py::test_benchmark_sanity_enable_fp8[gpt_350m] # 34.07s H100 only
154154
- unittest/bindings # 8 mins on H100
155-
- test_e2e.py::test_model_api_examples
156155
- test_e2e.py::test_build_time_benchmark_sanity

tests/integration/test_lists/waives.txt

-3
Original file line number | Diff line number | Diff line change
@@ -62,7 +62,6 @@ examples/test_multimodal.py::test_llm_multimodal_general[video-neva-pp:1-tp:1-bf
6262
examples/test_gpt.py::test_llm_gpt2_next_prompt_tuning[use_cpp_session-tp1] SKIP (http://nvbugs/4985405)
6363
examples/test_gpt.py::test_llm_gpt2_next_prompt_tuning[use_py_session-tp1] SKIP (http://nvbugs/4985405)
6464
examples/test_gpt.py::test_llm_gpt2_next_prompt_tuning[use_py_session-tp2] SKIP (http://nvbugs/4985405)
65-
test_e2e.py::test_model_api_examples_tp2 SKIP (executor.py MGMN is broken, https://nvbugs/200490052)
6665
examples/test_gemma.py::test_llm_gemma_1gpu_summary[gemma-7b-it-flax-int8_kv_cache-bfloat16-8] SKIP (https://nvbugs/4979772)
6766
examples/test_nemotron.py::test_llm_nemotron_3_8b_1gpu[bfloat16-full_prec] SKIP (https://nvbugs/5000026)
6867
examples/test_nemotron.py::test_llm_nemotron_3_8b_1gpu[bfloat16-int4_awq] SKIP (https://nvbugs/5000026)
@@ -129,7 +128,6 @@ full:B200_PCIe/unittest/quantization SKIP (Disable for Blackwell)
129128
full:B200_PCIe/accuracy/test_accuracy.py::TestVicuna7B::test_medusa[] SKIP (Disable for Blackwell)
130129
full:B200_PCIe/accuracy/test_accuracy.py::TestVicuna7B::test_medusa[cuda_graph] SKIP (Disable for Blackwell)
131130
full:B200_PCIe/accuracy/test_accuracy.py::TestVicuna7B::test_lookahead SKIP (Disable for Blackwell)
132-
full:B200_PCIe/test_e2e.py::test_model_api_examples SKIP (Disable for Blackwell)
133131
full:B200_PCIe/unittest/attention/test_bert_attention.py SKIP (Disable for Blackwell)
134132
full:B200_PCIe/unittest/model/test_mamba.py SKIP (Disable for Blackwell)
135133
full:B200_PCIe/examples/test_phi.py::test_llm_phi_single_gpu_summary[Phi-3-mini-128k-instruct-bfloat16-enable_gemm_plugin-enable_attention_plugin-enable_fmha_with_fp32_acc-nb:1] SKIP (Disable for Blackwell)
@@ -246,7 +244,6 @@ full:B200/unittest/quantization SKIP (Disable for Blackwell)
246244
full:B200/accuracy/test_accuracy.py::TestVicuna7B::test_medusa[] SKIP (Disable for Blackwell)
247245
full:B200/accuracy/test_accuracy.py::TestVicuna7B::test_medusa[cuda_graph] SKIP (Disable for Blackwell)
248246
full:B200/accuracy/test_accuracy.py::TestVicuna7B::test_lookahead SKIP (Disable for Blackwell)
249-
full:B200/test_e2e.py::test_model_api_examples SKIP (Disable for Blackwell)
250247
full:B200/unittest/attention/test_bert_attention.py SKIP (Disable for Blackwell)
251248
full:B200/unittest/model/test_mamba.py SKIP (Disable for Blackwell)
252249
full:B200/examples/test_phi.py::test_llm_phi_single_gpu_summary[Phi-3-mini-128k-instruct-bfloat16-enable_gemm_plugin-enable_attention_plugin-enable_fmha_with_fp32_acc-nb:1] SKIP (Disable for Blackwell)

0 commit comments

Comments (0)