// Import EETQ kernels
//
// 1dc29e9 9 months ago
//
// 837 Bytes

	/*
	* Copyright (c) 2022-2024, NVIDIA CORPORATION. All rights reserved.
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/
	#pragma once
	#include "common.h"

	namespace tensorrt_llm
	{
	namespace kernels
	{
	void weight_only_batched_gemv_launcher(const WeightOnlyParams& params, cudaStream_t stream);
	}
	} // namespace tensorrt_llm