diff --git a/language/llama3.1-8b/SUT_VLLM.py b/language/llama3.1-8b/SUT_VLLM.py index 94ee14abdd..a26118f7fe 100644 --- a/language/llama3.1-8b/SUT_VLLM.py +++ b/language/llama3.1-8b/SUT_VLLM.py @@ -1,3 +1,19 @@ +# Copyright 2025 The MLPerf Authors. All Rights Reserved. +# Copyright 2026 Arm Limited and affiliates. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================= + import asyncio import os import time @@ -49,9 +65,6 @@ def __init__( self.dtype = dtype self.tensor_parallel_size = tensor_parallel_size - if not torch.cuda.is_available(): - assert False, "torch gpu is not available, exiting..." - self.dataset_path = dataset_path self.data_object = Dataset( self.model_path,