Skip to content

Commit

Permalink
add license info
Browse files Browse the repository at this point in the history
  • Loading branch information
ZX-ModelCloud committed Jul 30, 2024
1 parent 2bdbe4f commit 4a571cc
Show file tree
Hide file tree
Showing 5 changed files with 13 additions and 12 deletions.
3 changes: 3 additions & 0 deletions gptqmodel/nn_modules/qlinear/qlinear_marlin_inference.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,6 @@
# License: GPTQModel/licenses/LICENSE.apache
# Adapted from vllm at https://github.com/vllm-project/vllm/blob/main/vllm/model_executor/layers/quantization/gptq_marlin.py

from typing import Any, Dict, List, Optional, Tuple

import gptqmodel_marlin_cuda_inference
Expand Down
3 changes: 3 additions & 0 deletions gptqmodel_ext/marlin_inference/marlin.cuh
Original file line number Diff line number Diff line change
@@ -1,3 +1,6 @@
// License: GPTQModel/licenses/LICENSE.apache
// Adapted from vllm at https://github.com/vllm-project/vllm/blob/main/csrc/quantization/gptq_marlin/marlin.cuh

#pragma once

#include <torch/all.h>
Expand Down
14 changes: 2 additions & 12 deletions gptqmodel_ext/marlin_inference/marlin_cuda_kernel.cu
Original file line number Diff line number Diff line change
Expand Up @@ -2,21 +2,11 @@
* Modified by Neural Magic
* Copyright (C) Marlin.2024 Elias Frantar
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* License: GPTQModel/licenses/LICENSE.apache
*/

/*
* Adapted from https://github.com/IST-DASLab/marlin
* Adapted from vllm at https://github.com/vllm-project/vllm/blob/main/csrc/quantization/gptq_marlin/gptq_marlin.cu
*/

#include "marlin.cuh"
Expand Down
2 changes: 2 additions & 0 deletions gptqmodel_ext/marlin_inference/marlin_dtypes.cuh
Original file line number Diff line number Diff line change
@@ -1,3 +1,5 @@
// License: GPTQModel/licenses/LICENSE.apache
// Adapted from vllm at https://github.com/vllm-project/vllm/blob/main/csrc/quantization/gptq_marlin/marlin_dtypes.cuh

#ifndef _data_types_cuh
#define _data_types_cuh
Expand Down
3 changes: 3 additions & 0 deletions gptqmodel_ext/marlin_inference/marlin_repack.cu
Original file line number Diff line number Diff line change
@@ -1,3 +1,6 @@
// License: GPTQModel/licenses/LICENSE.apache
// Adapted from vllm at https://github.com/vllm-project/vllm/blob/main/csrc/quantization/gptq_marlin/gptq_marlin_repack.cu

#include "marlin.cuh"

#if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 800
Expand Down

0 comments on commit 4a571cc

Please sign in to comment.