Skip to content

Commit

Permalink
separate lower-precision GEMM from the main files
Browse files Browse the repository at this point in the history
  • Loading branch information
airMeng committed Jun 18, 2024
1 parent a94e6ff commit a7614fa
Show file tree
Hide file tree
Showing 12 changed files with 8,659 additions and 8,054 deletions.
9,122 changes: 1,068 additions & 8,054 deletions ggml-sycl.cpp

Large diffs are not rendered by default.

5 changes: 5 additions & 0 deletions ggml-sycl/backend.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -14,5 +14,10 @@
#define GGML_SYCL_BACKEND_HPP

#include "common.hpp"
#include "convert.hpp"
#include "dequantize.hpp"
#include "dmmv.hpp"
#include "mmq.hpp"
#include "mmvq.hpp"

#endif // GGML_SYCL_BACKEND_HPP
544 changes: 544 additions & 0 deletions ggml-sycl/convert.cpp

Large diffs are not rendered by default.

27 changes: 27 additions & 0 deletions ggml-sycl/convert.hpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
//
// MIT license
// Copyright (C) 2024 Intel Corporation
// SPDX-License-Identifier: MIT
//

//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//

#ifndef GGML_SYCL_CONVERT_HPP
#define GGML_SYCL_CONVERT_HPP

#include "common.hpp"

// Function-pointer signature shared by the conversion routines: takes an
// untyped, read-only input pointer `x`, an output pointer `y` to elements of
// type T, an int `k`, and a `dpct::queue_ptr` named `stream`.
// NOTE(review): `k` is presumably the number of elements to convert and
// `stream` the queue the work is submitted to — confirm against convert.cpp.
template <typename T>
using to_t_sycl_t = void (*)(const void *__restrict__ x, T *__restrict__ y,
                             int k, dpct::queue_ptr stream);

// Concrete converter signatures for float and sycl::half output.
using to_fp32_sycl_t = to_t_sycl_t<float>;
using to_fp16_sycl_t = to_t_sycl_t<sycl::half>;

// Returns a to_fp16_sycl_t function pointer (sycl::half output) for the given
// ggml_type.
// NOTE(review): the result for a type with no converter is not visible from
// this header — presumably a null pointer; confirm against convert.cpp.
to_fp16_sycl_t ggml_get_to_fp16_sycl(ggml_type type);
// Returns a to_fp32_sycl_t function pointer (float output) for the given
// ggml_type; the same caveat about types with no converter applies.
to_fp32_sycl_t ggml_get_to_fp32_sycl(ggml_type type);

#endif // GGML_SYCL_CONVERT_HPP
Loading

0 comments on commit a7614fa

Please sign in to comment.