diff --git a/tests/e2e/vLLM/dklede/fp8_dynamic_per_token.yaml b/tests/e2e/vLLM/dklede/fp8_dynamic_per_token.yaml deleted file mode 100644 index b37bbde09..000000000 --- a/tests/e2e/vLLM/dklede/fp8_dynamic_per_token.yaml +++ /dev/null @@ -1,4 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: FP8_DYNAMIC \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/fp8_static_per_tensor.yaml b/tests/e2e/vLLM/dklede/fp8_static_per_tensor.yaml deleted file mode 100644 index 9d0e3c1a1..000000000 --- a/tests/e2e/vLLM/dklede/fp8_static_per_tensor.yaml +++ /dev/null @@ -1,6 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: FP8 -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/fp8_weight_only_channel.yaml b/tests/e2e/vLLM/dklede/fp8_weight_only_channel.yaml deleted file mode 100644 index 89f845279..000000000 --- a/tests/e2e/vLLM/dklede/fp8_weight_only_channel.yaml +++ /dev/null @@ -1,5 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -recipe: tests/e2e/vLLM/recipes/FP8/recipe_fp8_weight_only_channel.yaml -scheme: FP8A16_channel \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/fp8_weight_only_tensor.yaml b/tests/e2e/vLLM/dklede/fp8_weight_only_tensor.yaml deleted file mode 100644 index 1239287f2..000000000 --- a/tests/e2e/vLLM/dklede/fp8_weight_only_tensor.yaml +++ /dev/null @@ -1,5 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -recipe: tests/e2e/vLLM/recipes/FP8/recipe_fp8_weight_only_per_tensor.yaml -scheme: FP8A16_tensor \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/int8_channel_weight_static_per_tensor_act.yaml b/tests/e2e/vLLM/dklede/int8_channel_weight_static_per_tensor_act.yaml deleted file mode 100644 index ecdd84938..000000000 --- a/tests/e2e/vLLM/dklede/int8_channel_weight_static_per_tensor_act.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -recipe: tests/e2e/vLLM/recipes/INT8/recipe_int8_channel_weight_static_per_tensor_act.yaml -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -scheme: W8A8_channel_weight_static_per_tensor \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/int8_dynamic_per_token.yaml b/tests/e2e/vLLM/dklede/int8_dynamic_per_token.yaml deleted file mode 100644 index befa14beb..000000000 --- a/tests/e2e/vLLM/dklede/int8_dynamic_per_token.yaml +++ /dev/null @@ -1,6 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: W8A8 -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/int8_tensor_weight_static_per_tensor_act.yaml b/tests/e2e/vLLM/dklede/int8_tensor_weight_static_per_tensor_act.yaml deleted file mode 100644 index 4af8e65ad..000000000 --- a/tests/e2e/vLLM/dklede/int8_tensor_weight_static_per_tensor_act.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -recipe: tests/e2e/vLLM/recipes/INT8/recipe_int8_tensor_weight_static_per_tensor_act.yaml -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -scheme: W8A8_tensor_weight_static_per_tensor_act diff --git a/tests/e2e/vLLM/dklede/kv_cache_gptq_tinyllama.yaml b/tests/e2e/vLLM/dklede/kv_cache_gptq_tinyllama.yaml deleted file mode 100644 index 6dd112d3c..000000000 --- a/tests/e2e/vLLM/dklede/kv_cache_gptq_tinyllama.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -recipe: tests/e2e/vLLM/recipes/kv_cache/gptq.yaml -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -scheme: kv_cache_default_tinyllama \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w4a16_2of4_channel_quant.yaml b/tests/e2e/vLLM/dklede/w4a16_2of4_channel_quant.yaml deleted file mode 100644 index dafd24025..000000000 --- a/tests/e2e/vLLM/dklede/w4a16_2of4_channel_quant.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: W4A16_2of4_channel -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -recipe: tests/e2e/vLLM/recipes/WNA16_2of4/2of4_w4a16_recipe.yaml \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w4a16_2of4_grouped_quant.yaml b/tests/e2e/vLLM/dklede/w4a16_2of4_grouped_quant.yaml deleted file mode 100644 index 01135dd9d..000000000 --- a/tests/e2e/vLLM/dklede/w4a16_2of4_grouped_quant.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: W4A16_2of4 -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -recipe: tests/e2e/vLLM/recipes/WNA16_2of4/2of4_w4a16_group-128_recipe.yaml \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w4a16_actorder_group.yaml b/tests/e2e/vLLM/dklede/w4a16_actorder_group.yaml deleted file mode 100644 index bb02c51ef..000000000 --- a/tests/e2e/vLLM/dklede/w4a16_actorder_group.yaml +++ /dev/null @@ -1,9 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -recipe: tests/e2e/vLLM/recipes/actorder/recipe_w4a16_actorder_group.yaml -dataset_id: openai/gsm8k -dataset_config: main -dataset_split: train -scheme: W4A16_actorder_group -save_dir: TinyLlama-1.1B-Chat-v1.0-actorder-group \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w4a16_actorder_weight.yaml b/tests/e2e/vLLM/dklede/w4a16_actorder_weight.yaml deleted file mode 100644 index 318e4706e..000000000 --- a/tests/e2e/vLLM/dklede/w4a16_actorder_weight.yaml +++ /dev/null @@ -1,9 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -recipe: tests/e2e/vLLM/recipes/actorder/recipe_w4a16_actorder_weight.yaml -dataset_id: openai/gsm8k -dataset_config: main -dataset_split: train -scheme: W4A16_actorder_weight -save_dir: TinyLlama-1.1B-Chat-v1.0-actorder-weight \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w4a16_channel_quant.yaml b/tests/e2e/vLLM/dklede/w4a16_channel_quant.yaml deleted file mode 100644 index f08a64159..000000000 --- a/tests/e2e/vLLM/dklede/w4a16_channel_quant.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: W4A16_channel -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -recipe: tests/e2e/vLLM/recipes/WNA16/recipe_w4a16_channel_quant.yaml \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w4a16_grouped_quant.yaml b/tests/e2e/vLLM/dklede/w4a16_grouped_quant.yaml deleted file mode 100644 index 6a53963e0..000000000 --- a/tests/e2e/vLLM/dklede/w4a16_grouped_quant.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: W4A16 -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -quant_type: "GPTQ" \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w8a16_channel_quant.yaml b/tests/e2e/vLLM/dklede/w8a16_channel_quant.yaml deleted file mode 100644 index f9adbc506..000000000 --- a/tests/e2e/vLLM/dklede/w8a16_channel_quant.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: W8A16_channel -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -recipe: tests/e2e/vLLM/recipes/WNA16/recipe_w8a16_channel_quant.yaml \ No newline at end of file diff --git a/tests/e2e/vLLM/dklede/w8a16_grouped_quant.yaml b/tests/e2e/vLLM/dklede/w8a16_grouped_quant.yaml deleted file mode 100644 index 44fd79032..000000000 --- a/tests/e2e/vLLM/dklede/w8a16_grouped_quant.yaml +++ /dev/null @@ -1,7 +0,0 @@ -cadence: "nightly" -test_type: "regression" -model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 -scheme: W8A16 -dataset_id: HuggingFaceH4/ultrachat_200k -dataset_split: train_sft -quant_type: "GPTQ" \ No newline at end of file