diff --git a/previews/PR63/.documenter-siteinfo.json b/previews/PR63/.documenter-siteinfo.json
index cb37dd1..167bf3e 100644
--- a/previews/PR63/.documenter-siteinfo.json
+++ b/previews/PR63/.documenter-siteinfo.json
@@ -1 +1 @@
-{"documenter":{"julia_version":"1.11.2","generation_timestamp":"2024-12-11T18:43:06","documenter_version":"1.8.0"}}
\ No newline at end of file
+{"documenter":{"julia_version":"1.11.2","generation_timestamp":"2024-12-11T19:32:24","documenter_version":"1.8.0"}}
\ No newline at end of file
diff --git a/previews/PR63/generic/index.html b/previews/PR63/generic/index.html
index 409a89b..40f47ef 100644
--- a/previews/PR63/generic/index.html
+++ b/previews/PR63/generic/index.html
@@ -1,5 +1,5 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Generic API · CUDSS.jl</title><meta name="title" content="Generic API · CUDSS.jl"/><meta property="og:title" content="Generic API · CUDSS.jl"/><meta property="twitter:title" content="Generic API · CUDSS.jl"/><meta name="description" content="Documentation for CUDSS.jl."/><meta property="og:description" content="Documentation for CUDSS.jl."/><meta property="twitter:description" content="Documentation for CUDSS.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><div class="docs-package-name"><span class="docs-autofit"><a href="../">CUDSS.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../">Home</a></li><li class="is-active"><a class="tocitem" href>Generic API</a><ul class="internal"><li><a class="tocitem" href="#LLᵀ-and-LLᴴ"><span>LLᵀ and LLᴴ</span></a></li><li><a class="tocitem" href="#LDLᵀ-and-LDLᴴ"><span>LDLᵀ and LDLᴴ</span></a></li><li><a class="tocitem" href="#LU"><span>LU</span></a></li></ul></li><li><a class="tocitem" href="../options/">Options</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li class="is-active"><a href>Generic API</a></li></ul><ul class="is-hidden-tablet"><li 
class="is-active"><a href>Generic API</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/exanauts/CUDSS.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/exanauts/CUDSS.jl/blob/main/docs/src/generic.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h2 id="LLᵀ-and-LLᴴ"><a class="docs-heading-anchor" href="#LLᵀ-and-LLᴴ">LLᵀ and LLᴴ</a><a id="LLᵀ-and-LLᴴ-1"></a><a class="docs-heading-anchor-permalink" href="#LLᵀ-and-LLᴴ" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.cholesky-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.cholesky-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.cholesky</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = cholesky(A::CuSparseMatrixCSR{T,Cint}; view::Char=&#39;F&#39;)</code></pre><p>Compute the LLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><strong>Input argument</strong></p><ul><li><code>A</code>: a sparse Hermitian positive definite matrix stored in the <code>CuSparseMatrixCSR</code> format.</li></ul><p><strong>Keyword argument</strong></p><p>*<code>view</code>: A character that specifies which triangle of the sparse matrix is provided. Possible options are <code>L</code> for the lower triangle, <code>U</code> for the upper triangle, and <code>F</code> for the full matrix.</p><p><strong>Output argument</strong></p><ul><li><code>solver</code>: Opaque structure <a href="../#CUDSS.CudssSolver"><code>CudssSolver</code></a> that stores the factors of the LLᴴ decomposition.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/generic.jl#L87-L104">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.cholesky!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.cholesky!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.cholesky!</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = cholesky!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU, reusing the symbolic factorization stored in <code>solver</code>. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/generic.jl#L119-L124">source</a></section></article><pre><code class="language-julia hljs">using CUDA, CUDA.CUSPARSE
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Generic API · CUDSS.jl</title><meta name="title" content="Generic API · CUDSS.jl"/><meta property="og:title" content="Generic API · CUDSS.jl"/><meta property="twitter:title" content="Generic API · CUDSS.jl"/><meta name="description" content="Documentation for CUDSS.jl."/><meta property="og:description" content="Documentation for CUDSS.jl."/><meta property="twitter:description" content="Documentation for CUDSS.jl."/><script data-outdated-warner src="../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL=".."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../assets/documenter.js"></script><script src="../search_index.js"></script><script src="../siteinfo.js"></script><script src="../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../assets/themeswap.js"></script></head><body><div id="documenter"><nav class="docs-sidebar"><div class="docs-package-name"><span class="docs-autofit"><a href="../">CUDSS.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../">Home</a></li><li class="is-active"><a class="tocitem" href>Generic API</a><ul class="internal"><li><a class="tocitem" href="#LLᵀ-and-LLᴴ"><span>LLᵀ and LLᴴ</span></a></li><li><a class="tocitem" href="#LDLᵀ-and-LDLᴴ"><span>LDLᵀ and LDLᴴ</span></a></li><li><a class="tocitem" href="#LU"><span>LU</span></a></li></ul></li><li><a class="tocitem" href="../options/">Options</a></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li class="is-active"><a href>Generic API</a></li></ul><ul class="is-hidden-tablet"><li 
class="is-active"><a href>Generic API</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/exanauts/CUDSS.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/exanauts/CUDSS.jl/blob/main/docs/src/generic.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h2 id="LLᵀ-and-LLᴴ"><a class="docs-heading-anchor" href="#LLᵀ-and-LLᴴ">LLᵀ and LLᴴ</a><a id="LLᵀ-and-LLᴴ-1"></a><a class="docs-heading-anchor-permalink" href="#LLᵀ-and-LLᴴ" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.cholesky-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.cholesky-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.cholesky</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = cholesky(A::CuSparseMatrixCSR{T,Cint}; view::Char=&#39;F&#39;)</code></pre><p>Compute the LLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><strong>Input argument</strong></p><ul><li><code>A</code>: a sparse Hermitian positive definite matrix stored in the <code>CuSparseMatrixCSR</code> format.</li></ul><p><strong>Keyword argument</strong></p><p>*<code>view</code>: A character that specifies which triangle of the sparse matrix is provided. Possible options are <code>L</code> for the lower triangle, <code>U</code> for the upper triangle, and <code>F</code> for the full matrix.</p><p><strong>Output argument</strong></p><ul><li><code>solver</code>: Opaque structure <a href="../#CUDSS.CudssSolver"><code>CudssSolver</code></a> that stores the factors of the LLᴴ decomposition.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/generic.jl#L87-L104">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.cholesky!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.cholesky!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.cholesky!</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = cholesky!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU, reusing the symbolic factorization stored in <code>solver</code>. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/generic.jl#L119-L124">source</a></section></article><pre><code class="language-julia hljs">using CUDA, CUDA.CUSPARSE
 using CUDSS
 using LinearAlgebra
 using SparseArrays
@@ -33,7 +33,7 @@
 
 R_gpu = C_gpu - ( CuSparseMatrixCSR(A_cpu) + Diagonal(d_gpu) ) * X_gpu
 norm(R_gpu)</code></pre><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>If we only store one triangle of <code>A_gpu</code>, we can also use the wrappers <code>Symmetric</code> and <code>Hermitian</code> instead of using the keyword argument <code>view</code> in <code>cholesky</code>. For real matrices, both wrappers are allowed but only <code>Hermitian</code> can be used for complex matrices.</p></div></div><pre><code class="language-julia hljs">H_gpu = Hermitian(A_gpu, :U)
-F = cholesky(H_gpu)</code></pre><h2 id="LDLᵀ-and-LDLᴴ"><a class="docs-heading-anchor" href="#LDLᵀ-and-LDLᴴ">LDLᵀ and LDLᴴ</a><a id="LDLᵀ-and-LDLᴴ-1"></a><a class="docs-heading-anchor-permalink" href="#LDLᵀ-and-LDLᴴ" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.ldlt-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.ldlt-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.ldlt</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = ldlt(A::CuSparseMatrixCSR{T,Cint}; view::Char=&#39;F&#39;)</code></pre><p>Compute the LDLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU. The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><strong>Input argument</strong></p><ul><li><code>A</code>: a sparse Hermitian matrix stored in the <code>CuSparseMatrixCSR</code> format.</li></ul><p><strong>Keyword argument</strong></p><p>*<code>view</code>: A character that specifies which triangle of the sparse matrix is provided. 
Possible options are <code>L</code> for the lower triangle, <code>U</code> for the upper triangle, and <code>F</code> for the full matrix.</p><p><strong>Output argument</strong></p><ul><li><code>solver</code>: Opaque structure <a href="../#CUDSS.CudssSolver"><code>CudssSolver</code></a> that stores the factors of the LDLᴴ decomposition.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/generic.jl#L40-L57">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.ldlt!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.ldlt!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.ldlt!</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = ldlt!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LDLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU, reusing the symbolic factorization stored in <code>solver</code>. The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/generic.jl#L72-L77">source</a></section></article><pre><code class="language-julia hljs">using CUDA, CUDA.CUSPARSE
+F = cholesky(H_gpu)</code></pre><h2 id="LDLᵀ-and-LDLᴴ"><a class="docs-heading-anchor" href="#LDLᵀ-and-LDLᴴ">LDLᵀ and LDLᴴ</a><a id="LDLᵀ-and-LDLᴴ-1"></a><a class="docs-heading-anchor-permalink" href="#LDLᵀ-and-LDLᴴ" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.ldlt-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.ldlt-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.ldlt</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = ldlt(A::CuSparseMatrixCSR{T,Cint}; view::Char=&#39;F&#39;)</code></pre><p>Compute the LDLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU. The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><strong>Input argument</strong></p><ul><li><code>A</code>: a sparse Hermitian matrix stored in the <code>CuSparseMatrixCSR</code> format.</li></ul><p><strong>Keyword argument</strong></p><p>*<code>view</code>: A character that specifies which triangle of the sparse matrix is provided. 
Possible options are <code>L</code> for the lower triangle, <code>U</code> for the upper triangle, and <code>F</code> for the full matrix.</p><p><strong>Output argument</strong></p><ul><li><code>solver</code>: Opaque structure <a href="../#CUDSS.CudssSolver"><code>CudssSolver</code></a> that stores the factors of the LDLᴴ decomposition.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/generic.jl#L40-L57">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.ldlt!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.ldlt!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.ldlt!</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = ldlt!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LDLᴴ factorization of a sparse matrix <code>A</code> on an NVIDIA GPU, reusing the symbolic factorization stored in <code>solver</code>. The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/generic.jl#L72-L77">source</a></section></article><pre><code class="language-julia hljs">using CUDA, CUDA.CUSPARSE
 using CUDSS
 using LinearAlgebra
 using SparseArrays
@@ -67,7 +67,7 @@
 
 R_gpu = C_gpu - ( CuSparseMatrixCSR(A_cpu) + Diagonal(d_gpu) ) * X_gpu
 norm(R_gpu)</code></pre><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>If we only store one triangle of <code>A_gpu</code>, we can also use the wrappers <code>Symmetric</code> and <code>Hermitian</code> instead of using the keyword argument <code>view</code> in <code>ldlt</code>. For real matrices, both wrappers are allowed but only <code>Hermitian</code> can be used for complex matrices.</p></div></div><pre><code class="language-julia hljs">S_gpu = Symmetric(A_gpu, :L)
-F = ldlt(S_gpu)</code></pre><h2 id="LU"><a class="docs-heading-anchor" href="#LU">LU</a><a id="LU-1"></a><a class="docs-heading-anchor-permalink" href="#LU" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.lu-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.lu-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.lu</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = lu(A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LU factorization of a sparse matrix <code>A</code> on an NVIDIA GPU. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><strong>Input argument</strong></p><ul><li><code>A</code>: a sparse square matrix stored in the <code>CuSparseMatrixCSR</code> format.</li></ul><p><strong>Output argument</strong></p><ul><li><code>solver</code>: an opaque structure <a href="../#CUDSS.CudssSolver"><code>CudssSolver</code></a> that stores the factors of the LU decomposition.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/generic.jl#L1-L14">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.lu!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.lu!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.lu!</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = lu!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LU factorization of a sparse matrix <code>A</code> on an NVIDIA GPU, reusing the symbolic factorization stored in <code>solver</code>. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/generic.jl#L25-L30">source</a></section></article><pre><code class="language-julia hljs">using CUDA, CUDA.CUSPARSE
+F = ldlt(S_gpu)</code></pre><h2 id="LU"><a class="docs-heading-anchor" href="#LU">LU</a><a id="LU-1"></a><a class="docs-heading-anchor-permalink" href="#LU" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.lu-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.lu-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.lu</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = lu(A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LU factorization of a sparse matrix <code>A</code> on an NVIDIA GPU. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><strong>Input argument</strong></p><ul><li><code>A</code>: a sparse square matrix stored in the <code>CuSparseMatrixCSR</code> format.</li></ul><p><strong>Output argument</strong></p><ul><li><code>solver</code>: an opaque structure <a href="../#CUDSS.CudssSolver"><code>CudssSolver</code></a> that stores the factors of the LU decomposition.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/generic.jl#L1-L14">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="LinearAlgebra.lu!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}" href="#LinearAlgebra.lu!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T&lt;:Union{Float32, Float64, ComplexF64, ComplexF32}"><code>LinearAlgebra.lu!</code></a> — <span class="docstring-category">Method</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = lu!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})</code></pre><p>Compute the LU factorization of a sparse matrix <code>A</code> on an NVIDIA GPU, reusing the symbolic factorization stored in <code>solver</code>. 
The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/generic.jl#L25-L30">source</a></section></article><pre><code class="language-julia hljs">using CUDA, CUDA.CUSPARSE
 using CUDSS
 using LinearAlgebra
 using SparseArrays
@@ -96,4 +96,4 @@
 ldiv!(x_gpu, F, c_gpu)
 
 r_gpu = c_gpu - A_gpu * x_gpu
-norm(r_gpu)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../">« Home</a><a class="docs-footer-nextpage" href="../options/">Options »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.8.0 on <span class="colophon-date" title="Wednesday 11 December 2024 18:43">Wednesday 11 December 2024</span>. Using Julia version 1.11.2.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+norm(r_gpu)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../">« Home</a><a class="docs-footer-nextpage" href="../options/">Options »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.8.0 on <span class="colophon-date" title="Wednesday 11 December 2024 19:32">Wednesday 11 December 2024</span>. Using Julia version 1.11.2.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/previews/PR63/index.html b/previews/PR63/index.html
index 1c88a7f..fab2955 100644
--- a/previews/PR63/index.html
+++ b/previews/PR63/index.html
@@ -3,16 +3,16 @@
 pkg&gt; add CUDSS
 pkg&gt; test CUDSS</code></pre><h2 id="Types"><a class="docs-heading-anchor" href="#Types">Types</a><a id="Types-1"></a><a class="docs-heading-anchor-permalink" href="#Types" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.CudssMatrix" href="#CUDSS.CudssMatrix"><code>CUDSS.CudssMatrix</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">matrix = CudssMatrix(v::CuVector{T})
 matrix = CudssMatrix(A::CuMatrix{T})
-matrix = CudssMatrix(A::CuSparseMatrixCSR{T,Cint}, struture::String, view::Char; index::Char=&#39;O&#39;)</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><code>CudssMatrix</code> is a wrapper for <code>CuVector</code>, <code>CuMatrix</code> and <code>CuSparseMatrixCSR</code>. <code>CudssMatrix</code> is used to pass matrix of the linear system, as well as solution and right-hand side.</p><p><code>structure</code> specifies the stucture for sparse matrices:</p><ul><li><code>&quot;G&quot;</code>: General matrix – LDU factorization;</li><li><code>&quot;S&quot;</code>: Real symmetric matrix – LDLᵀ factorization;</li><li><code>&quot;H&quot;</code>: Complex Hermitian matrix – LDLᴴ factorization;</li><li><code>&quot;SPD&quot;</code>: Symmetric positive-definite matrix – LLᵀ factorization;</li><li><code>&quot;HPD&quot;</code>: Hermitian positive-definite matrix – LLᴴ factorization.</li></ul><p><code>view</code> specifies matrix view for sparse matrices:</p><ul><li><code>&#39;L&#39;</code>: Lower-triangular matrix and all values above the main diagonal are ignored;</li><li><code>&#39;U&#39;</code>: Upper-triangular matrix and all values below the main diagonal are ignored;</li><li><code>&#39;F&#39;</code>: Full matrix.</li></ul><p><code>index</code> specifies indexing base for sparse matrix indices:</p><ul><li><code>&#39;Z&#39;</code>: 0-based indexing;</li><li><code>&#39;O&#39;</code>: 1-based indexing.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/helpers.jl#L6-L31">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.CudssConfig" href="#CUDSS.CudssConfig"><code>CUDSS.CudssConfig</code></a> — <span 
class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">config = CudssConfig()</code></pre><p><code>CudssConfig</code> stores configuration settings for the solver.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/helpers.jl#L127-L131">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.CudssData" href="#CUDSS.CudssData"><code>CUDSS.CudssData</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">data = CudssData()
-data = CudssData(cudss_handle::cudssHandle_t)</code></pre><p><code>CudssData</code> holds internal data (e.g., LU factors arrays).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/helpers.jl#L95-L100">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.CudssSolver" href="#CUDSS.CudssSolver"><code>CUDSS.CudssSolver</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = CudssSolver(A::CuSparseMatrixCSR{T,Cint}, structure::String, view::Char; index::Char=&#39;O&#39;)
-solver = CudssSolver(matrix::CudssMatrix{T}, config::CudssConfig, data::CudssData)</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><code>CudssSolver</code> contains all structures required to solve linear systems with cuDSS. One constructor of <code>CudssSolver</code> takes as input the same parameters as <a href="#CUDSS.CudssMatrix"><code>CudssMatrix</code></a>.</p><p><code>structure</code> specifies the stucture for sparse matrices:</p><ul><li><code>&quot;G&quot;</code>: General matrix – LDU factorization;</li><li><code>&quot;S&quot;</code>: Real symmetric matrix – LDLᵀ factorization;</li><li><code>&quot;H&quot;</code>: Complex Hermitian matrix – LDLᴴ factorization;</li><li><code>&quot;SPD&quot;</code>: Symmetric positive-definite matrix – LLᵀ factorization;</li><li><code>&quot;HPD&quot;</code>: Hermitian positive-definite matrix – LLᴴ factorization.</li></ul><p><code>view</code> specifies matrix view for sparse matrices:</p><ul><li><code>&#39;L&#39;</code>: Lower-triangular matrix and all values above the main diagonal are ignored;</li><li><code>&#39;U&#39;</code>: Upper-triangular matrix and all values below the main diagonal are ignored;</li><li><code>&#39;F&#39;</code>: Full matrix.</li></ul><p><code>index</code> specifies indexing base for sparse matrix indices:</p><ul><li><code>&#39;Z&#39;</code>: 0-based indexing;</li><li><code>&#39;O&#39;</code>: 1-based indexing.</li></ul><p><code>CudssSolver</code> can be also constructed from the three structures <code>CudssMatrix</code>, <code>CudssConfig</code> and <code>CudssData</code> if needed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/interfaces.jl#L3-L29">source</a></section></article><h2 id="Functions"><a class="docs-heading-anchor" href="#Functions">Functions</a><a id="Functions-1"></a><a 
class="docs-heading-anchor-permalink" href="#Functions" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.cudss_set" href="#CUDSS.cudss_set"><code>CUDSS.cudss_set</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">cudss_set(matrix::CudssMatrix{T}, v::CuVector{T})
+matrix = CudssMatrix(A::CuSparseMatrixCSR{T,Cint}, struture::String, view::Char; index::Char=&#39;O&#39;)</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><code>CudssMatrix</code> is a wrapper for <code>CuVector</code>, <code>CuMatrix</code> and <code>CuSparseMatrixCSR</code>. <code>CudssMatrix</code> is used to pass matrix of the linear system, as well as solution and right-hand side.</p><p><code>structure</code> specifies the stucture for sparse matrices:</p><ul><li><code>&quot;G&quot;</code>: General matrix – LDU factorization;</li><li><code>&quot;S&quot;</code>: Real symmetric matrix – LDLᵀ factorization;</li><li><code>&quot;H&quot;</code>: Complex Hermitian matrix – LDLᴴ factorization;</li><li><code>&quot;SPD&quot;</code>: Symmetric positive-definite matrix – LLᵀ factorization;</li><li><code>&quot;HPD&quot;</code>: Hermitian positive-definite matrix – LLᴴ factorization.</li></ul><p><code>view</code> specifies matrix view for sparse matrices:</p><ul><li><code>&#39;L&#39;</code>: Lower-triangular matrix and all values above the main diagonal are ignored;</li><li><code>&#39;U&#39;</code>: Upper-triangular matrix and all values below the main diagonal are ignored;</li><li><code>&#39;F&#39;</code>: Full matrix.</li></ul><p><code>index</code> specifies indexing base for sparse matrix indices:</p><ul><li><code>&#39;Z&#39;</code>: 0-based indexing;</li><li><code>&#39;O&#39;</code>: 1-based indexing.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/helpers.jl#L6-L31">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.CudssConfig" href="#CUDSS.CudssConfig"><code>CUDSS.CudssConfig</code></a> — <span 
class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">config = CudssConfig()</code></pre><p><code>CudssConfig</code> stores configuration settings for the solver.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/helpers.jl#L127-L131">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.CudssData" href="#CUDSS.CudssData"><code>CUDSS.CudssData</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">data = CudssData()
+data = CudssData(cudss_handle::cudssHandle_t)</code></pre><p><code>CudssData</code> holds internal data (e.g., LU factors arrays).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/helpers.jl#L95-L100">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.CudssSolver" href="#CUDSS.CudssSolver"><code>CUDSS.CudssSolver</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">solver = CudssSolver(A::CuSparseMatrixCSR{T,Cint}, structure::String, view::Char; index::Char=&#39;O&#39;)
+solver = CudssSolver(matrix::CudssMatrix{T}, config::CudssConfig, data::CudssData)</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p><code>CudssSolver</code> contains all structures required to solve linear systems with cuDSS. One constructor of <code>CudssSolver</code> takes as input the same parameters as <a href="#CUDSS.CudssMatrix"><code>CudssMatrix</code></a>.</p><p><code>structure</code> specifies the stucture for sparse matrices:</p><ul><li><code>&quot;G&quot;</code>: General matrix – LDU factorization;</li><li><code>&quot;S&quot;</code>: Real symmetric matrix – LDLᵀ factorization;</li><li><code>&quot;H&quot;</code>: Complex Hermitian matrix – LDLᴴ factorization;</li><li><code>&quot;SPD&quot;</code>: Symmetric positive-definite matrix – LLᵀ factorization;</li><li><code>&quot;HPD&quot;</code>: Hermitian positive-definite matrix – LLᴴ factorization.</li></ul><p><code>view</code> specifies matrix view for sparse matrices:</p><ul><li><code>&#39;L&#39;</code>: Lower-triangular matrix and all values above the main diagonal are ignored;</li><li><code>&#39;U&#39;</code>: Upper-triangular matrix and all values below the main diagonal are ignored;</li><li><code>&#39;F&#39;</code>: Full matrix.</li></ul><p><code>index</code> specifies indexing base for sparse matrix indices:</p><ul><li><code>&#39;Z&#39;</code>: 0-based indexing;</li><li><code>&#39;O&#39;</code>: 1-based indexing.</li></ul><p><code>CudssSolver</code> can be also constructed from the three structures <code>CudssMatrix</code>, <code>CudssConfig</code> and <code>CudssData</code> if needed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/interfaces.jl#L3-L29">source</a></section></article><h2 id="Functions"><a class="docs-heading-anchor" href="#Functions">Functions</a><a id="Functions-1"></a><a 
class="docs-heading-anchor-permalink" href="#Functions" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.cudss_set" href="#CUDSS.cudss_set"><code>CUDSS.cudss_set</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">cudss_set(matrix::CudssMatrix{T}, v::CuVector{T})
 cudss_set(matrix::CudssMatrix{T}, A::CuMatrix{T})
 cudss_set(matrix::CudssMatrix{T}, A::CuSparseMatrixCSR{T,Cint})
 cudss_set(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})
 cudss_set(solver::CudssSolver, parameter::String, value)
 cudss_set(config::CudssConfig, parameter::String, value)
-cudss_set(data::CudssData, parameter::String, value)</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p>The available configuration parameters are:</p><ul><li><code>&quot;reordering_alg&quot;</code>: Algorithm for the reordering phase (<code>&quot;default&quot;</code>, <code>&quot;algo1&quot;</code>, <code>&quot;algo2&quot;</code> or <code>&quot;algo3&quot;</code>);</li><li><code>&quot;factorization_alg&quot;</code>: Algorithm for the factorization phase (<code>&quot;default&quot;</code>, <code>&quot;algo1&quot;</code>, <code>&quot;algo2&quot;</code> or <code>&quot;algo3&quot;</code>);</li><li><code>&quot;solve_alg&quot;</code>: Algorithm for the solving phase (<code>&quot;default&quot;</code>, <code>&quot;algo1&quot;</code>, <code>&quot;algo2&quot;</code> or <code>&quot;algo3&quot;</code>);</li><li><code>&quot;matching_type&quot;</code>: Type of matching;</li><li><code>&quot;solve_mode&quot;</code>: Potential modificator on the system matrix (transpose or adjoint);</li><li><code>&quot;ir_n_steps&quot;</code>: Number of steps during the iterative refinement;</li><li><code>&quot;ir_tol&quot;</code>: Iterative refinement tolerance;</li><li><code>&quot;pivot_type&quot;</code>: Type of pivoting (<code>&#39;C&#39;</code>, <code>&#39;R&#39;</code> or <code>&#39;N&#39;</code>);</li><li><code>&quot;pivot_threshold&quot;</code>: Pivoting threshold which is used to determine if digonal element is subject to pivoting;</li><li><code>&quot;pivot_epsilon&quot;</code>: Pivoting epsilon, absolute value to replace singular diagonal elements;</li><li><code>&quot;max_lu_nnz&quot;</code>: Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;</li><li><code>&quot;hybrid_mode&quot;</code>: Memory mode – <code>0</code> (default = device-only) or <code>1</code> (hybrid = host/device);</li><li><code>&quot;hybrid_device_memory_limit&quot;</code>: User-defined 
device memory limit (number of bytes) for the hybrid memory mode;</li><li><code>&quot;use_cuda_register_memory&quot;</code>: A flag to enable (<code>1</code>) or disable (<code>0</code>) usage of <code>cudaHostRegister()</code> by the hybrid memory mode.</li></ul><p>The available data parameters are:</p><ul><li><code>&quot;user_perm&quot;</code>: User permutation to be used instead of running the reordering algorithms;</li><li><code>&quot;comm&quot;</code>: Communicator for Multi-GPU multi-node mode.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/interfaces.jl#L47-L77">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.cudss_get" href="#CUDSS.cudss_get"><code>CUDSS.cudss_get</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">value = cudss_get(solver::CudssSolver, parameter::String)
+cudss_set(data::CudssData, parameter::String, value)</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p>The available configuration parameters are:</p><ul><li><code>&quot;reordering_alg&quot;</code>: Algorithm for the reordering phase (<code>&quot;default&quot;</code>, <code>&quot;algo1&quot;</code>, <code>&quot;algo2&quot;</code> or <code>&quot;algo3&quot;</code>);</li><li><code>&quot;factorization_alg&quot;</code>: Algorithm for the factorization phase (<code>&quot;default&quot;</code>, <code>&quot;algo1&quot;</code>, <code>&quot;algo2&quot;</code> or <code>&quot;algo3&quot;</code>);</li><li><code>&quot;solve_alg&quot;</code>: Algorithm for the solving phase (<code>&quot;default&quot;</code>, <code>&quot;algo1&quot;</code>, <code>&quot;algo2&quot;</code> or <code>&quot;algo3&quot;</code>);</li><li><code>&quot;matching_type&quot;</code>: Type of matching;</li><li><code>&quot;solve_mode&quot;</code>: Potential modificator on the system matrix (transpose or adjoint);</li><li><code>&quot;ir_n_steps&quot;</code>: Number of steps during the iterative refinement;</li><li><code>&quot;ir_tol&quot;</code>: Iterative refinement tolerance;</li><li><code>&quot;pivot_type&quot;</code>: Type of pivoting (<code>&#39;C&#39;</code>, <code>&#39;R&#39;</code> or <code>&#39;N&#39;</code>);</li><li><code>&quot;pivot_threshold&quot;</code>: Pivoting threshold which is used to determine if digonal element is subject to pivoting;</li><li><code>&quot;pivot_epsilon&quot;</code>: Pivoting epsilon, absolute value to replace singular diagonal elements;</li><li><code>&quot;max_lu_nnz&quot;</code>: Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;</li><li><code>&quot;hybrid_mode&quot;</code>: Memory mode – <code>0</code> (default = device-only) or <code>1</code> (hybrid = host/device);</li><li><code>&quot;hybrid_device_memory_limit&quot;</code>: User-defined 
device memory limit (number of bytes) for the hybrid memory mode;</li><li><code>&quot;use_cuda_register_memory&quot;</code>: A flag to enable (<code>1</code>) or disable (<code>0</code>) usage of <code>cudaHostRegister()</code> by the hybrid memory mode.</li></ul><p>The available data parameters are:</p><ul><li><code>&quot;user_perm&quot;</code>: User permutation to be used instead of running the reordering algorithms;</li><li><code>&quot;comm&quot;</code>: Communicator for Multi-GPU multi-node mode.</li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/interfaces.jl#L47-L77">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.cudss_get" href="#CUDSS.cudss_get"><code>CUDSS.cudss_get</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">value = cudss_get(solver::CudssSolver, parameter::String)
 value = cudss_get(config::CudssConfig, parameter::String)
-value = cudss_get(data::CudssData, parameter::String)</code></pre><p>The available configuration parameters are:</p><ul><li><code>&quot;reordering_alg&quot;</code>: Algorithm for the reordering phase;</li><li><code>&quot;factorization_alg&quot;</code>: Algorithm for the factorization phase;</li><li><code>&quot;solve_alg&quot;</code>: Algorithm for the solving phase;</li><li><code>&quot;matching_type&quot;</code>: Type of matching;</li><li><code>&quot;solve_mode&quot;</code>: Potential modificator on the system matrix (transpose or adjoint);</li><li><code>&quot;ir_n_steps&quot;</code>: Number of steps during the iterative refinement;</li><li><code>&quot;ir_tol&quot;</code>: Iterative refinement tolerance;</li><li><code>&quot;pivot_type&quot;</code>: Type of pivoting;</li><li><code>&quot;pivot_threshold&quot;</code>: Pivoting threshold which is used to determine if digonal element is subject to pivoting;</li><li><code>&quot;pivot_epsilon&quot;</code>: Pivoting epsilon, absolute value to replace singular diagonal elements;</li><li><code>&quot;max_lu_nnz&quot;</code>: Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;</li><li><code>&quot;hybrid_mode&quot;</code>: Memory mode – <code>0</code> (default = device-only) or <code>1</code> (hybrid = host/device);</li><li><code>&quot;hybrid_device_memory_limit&quot;</code>: User-defined device memory limit (number of bytes) for the hybrid memory mode;</li><li><code>&quot;use_cuda_register_memory&quot;</code>: A flag to enable (<code>1</code>) or disable (<code>0</code>) usage of <code>cudaHostRegister()</code> by the hybrid memory mode.</li></ul><p>The available data parameters are:</p><ul><li><code>&quot;info&quot;</code>: Device-side error information;</li><li><code>&quot;lu_nnz&quot;</code>: Number of non-zero entries in LU factors;</li><li><code>&quot;npivots&quot;</code>: Number of pivots encountered during factorization;</li><li><code>&quot;inertia&quot;</code>: Tuple of positive and 
negative indices of inertia for symmetric and hermitian non positive-definite matrix types;</li><li><code>&quot;perm_reorder_row&quot;</code>: Reordering permutation for the rows;</li><li><code>&quot;perm_reorder_col&quot;</code>: Reordering permutation for the columns;</li><li><code>&quot;perm_row&quot;</code>: Final row permutation (which includes effects of both reordering and pivoting);</li><li><code>&quot;perm_col&quot;</code>: Final column permutation (which includes effects of both reordering and pivoting);</li><li><code>&quot;diag&quot;</code>: Diagonal of the factorized matrix;</li><li><code>&quot;hybrid_device_memory_min&quot;</code>: Minimal amount of device memory (number of bytes) required in the hybrid memory mode.</li></ul><p>The data parameters <code>&quot;info&quot;</code>, <code>&quot;lu_nnz&quot;</code>, <code>&quot;perm_reorder_row&quot;</code>, <code>&quot;perm_reorder_col&quot;</code> and <code>&quot;hybrid_device_memory_min&quot;</code> require the phase <code>&quot;analyse&quot;</code> performed by <a href="#CUDSS.cudss"><code>cudss</code></a>. The data parameters <code>&quot;npivots&quot;</code>, <code>&quot;inertia&quot;</code> and <code>&quot;diag&quot;</code> require the phases <code>&quot;analyse&quot;</code> and <code>&quot;factorization&quot;</code> performed by <a href="#CUDSS.cudss"><code>cudss</code></a>. 
The data parameters <code>&quot;perm_row&quot;</code> and <code>&quot;perm_col&quot;</code> are available but not yet functional.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/interfaces.jl#L122-L158">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.cudss" href="#CUDSS.cudss"><code>CUDSS.cudss</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">cudss(phase::String, solver::CudssSolver{T}, x::CuVector{T}, b::CuVector{T})
+value = cudss_get(data::CudssData, parameter::String)</code></pre><p>The available configuration parameters are:</p><ul><li><code>&quot;reordering_alg&quot;</code>: Algorithm for the reordering phase;</li><li><code>&quot;factorization_alg&quot;</code>: Algorithm for the factorization phase;</li><li><code>&quot;solve_alg&quot;</code>: Algorithm for the solving phase;</li><li><code>&quot;matching_type&quot;</code>: Type of matching;</li><li><code>&quot;solve_mode&quot;</code>: Potential modificator on the system matrix (transpose or adjoint);</li><li><code>&quot;ir_n_steps&quot;</code>: Number of steps during the iterative refinement;</li><li><code>&quot;ir_tol&quot;</code>: Iterative refinement tolerance;</li><li><code>&quot;pivot_type&quot;</code>: Type of pivoting;</li><li><code>&quot;pivot_threshold&quot;</code>: Pivoting threshold which is used to determine if digonal element is subject to pivoting;</li><li><code>&quot;pivot_epsilon&quot;</code>: Pivoting epsilon, absolute value to replace singular diagonal elements;</li><li><code>&quot;max_lu_nnz&quot;</code>: Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;</li><li><code>&quot;hybrid_mode&quot;</code>: Memory mode – <code>0</code> (default = device-only) or <code>1</code> (hybrid = host/device);</li><li><code>&quot;hybrid_device_memory_limit&quot;</code>: User-defined device memory limit (number of bytes) for the hybrid memory mode;</li><li><code>&quot;use_cuda_register_memory&quot;</code>: A flag to enable (<code>1</code>) or disable (<code>0</code>) usage of <code>cudaHostRegister()</code> by the hybrid memory mode.</li></ul><p>The available data parameters are:</p><ul><li><code>&quot;info&quot;</code>: Device-side error information;</li><li><code>&quot;lu_nnz&quot;</code>: Number of non-zero entries in LU factors;</li><li><code>&quot;npivots&quot;</code>: Number of pivots encountered during factorization;</li><li><code>&quot;inertia&quot;</code>: Tuple of positive and 
negative indices of inertia for symmetric and hermitian non positive-definite matrix types;</li><li><code>&quot;perm_reorder_row&quot;</code>: Reordering permutation for the rows;</li><li><code>&quot;perm_reorder_col&quot;</code>: Reordering permutation for the columns;</li><li><code>&quot;perm_row&quot;</code>: Final row permutation (which includes effects of both reordering and pivoting);</li><li><code>&quot;perm_col&quot;</code>: Final column permutation (which includes effects of both reordering and pivoting);</li><li><code>&quot;diag&quot;</code>: Diagonal of the factorized matrix;</li><li><code>&quot;hybrid_device_memory_min&quot;</code>: Minimal amount of device memory (number of bytes) required in the hybrid memory mode;</li><li><code>&quot;memory_estimates&quot;</code>: Memory estimates (in bytes) for host and device memory required for the chosen memory mode.</li></ul><p>The data parameters <code>&quot;info&quot;</code>, <code>&quot;lu_nnz&quot;</code>, <code>&quot;perm_reorder_row&quot;</code>, <code>&quot;perm_reorder_col&quot;</code>, <code>&quot;hybrid_device_memory_min&quot;</code> and <code>&quot;memory_estimates&quot;</code> require the phase <code>&quot;analyse&quot;</code> performed by <a href="#CUDSS.cudss"><code>cudss</code></a>. The data parameters <code>&quot;npivots&quot;</code>, <code>&quot;inertia&quot;</code> and <code>&quot;diag&quot;</code> require the phases <code>&quot;analyse&quot;</code> and <code>&quot;factorization&quot;</code> performed by <a href="#CUDSS.cudss"><code>cudss</code></a>. 
The data parameters <code>&quot;perm_row&quot;</code> and <code>&quot;perm_col&quot;</code> are available but not yet functional.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/interfaces.jl#L122-L159">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="CUDSS.cudss" href="#CUDSS.cudss"><code>CUDSS.cudss</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">cudss(phase::String, solver::CudssSolver{T}, x::CuVector{T}, b::CuVector{T})
 cudss(phase::String, solver::CudssSolver{T}, X::CuMatrix{T}, B::CuMatrix{T})
-cudss(phase::String, solver::CudssSolver{T}, X::CudssMatrix{T}, B::CudssMatrix{T})</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p>The available phases are <code>&quot;analysis&quot;</code>, <code>&quot;factorization&quot;</code>, <code>&quot;refactorization&quot;</code> and <code>&quot;solve&quot;</code>. The phases <code>&quot;solve_fwd&quot;</code>, <code>&quot;solve_diag&quot;</code> and <code>&quot;solve_bwd&quot;</code> are available but not yet functional.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/0ca1098ca6d2e5b0f26cd32983cf6e199b961635/src/interfaces.jl#L197-L206">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-nextpage" href="generic/">Generic API »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.8.0 on <span 
class="colophon-date" title="Wednesday 11 December 2024 18:43">Wednesday 11 December 2024</span>. Using Julia version 1.11.2.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+cudss(phase::String, solver::CudssSolver{T}, X::CudssMatrix{T}, B::CudssMatrix{T})</code></pre><p>The type <code>T</code> can be <code>Float32</code>, <code>Float64</code>, <code>ComplexF32</code> or <code>ComplexF64</code>.</p><p>The available phases are <code>&quot;analysis&quot;</code>, <code>&quot;factorization&quot;</code>, <code>&quot;refactorization&quot;</code> and <code>&quot;solve&quot;</code>. The phases <code>&quot;solve_fwd&quot;</code>, <code>&quot;solve_diag&quot;</code> and <code>&quot;solve_bwd&quot;</code> are available but not yet functional.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/exanauts/CUDSS.jl/blob/cc7ab6098ce589140400928e8f4c3904c45ac9a6/src/interfaces.jl#L198-L207">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-nextpage" href="generic/">Generic API »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.8.0 on <span 
class="colophon-date" title="Wednesday 11 December 2024 19:32">Wednesday 11 December 2024</span>. Using Julia version 1.11.2.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/previews/PR63/options/index.html b/previews/PR63/options/index.html
index 3611d33..f800a20 100644
--- a/previews/PR63/options/index.html
+++ b/previews/PR63/options/index.html
@@ -86,4 +86,4 @@
 cudss(&quot;solve&quot;, solver, x_gpu, b_gpu)
 
 r_gpu = b_gpu - CuSparseMatrixCSR(A_cpu) * x_gpu
-norm(r_gpu)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../generic/">« Generic API</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.8.0 on <span class="colophon-date" title="Wednesday 11 December 2024 18:43">Wednesday 11 December 2024</span>. Using Julia version 1.11.2.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+norm(r_gpu)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../generic/">« Generic API</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.8.0 on <span class="colophon-date" title="Wednesday 11 December 2024 19:32">Wednesday 11 December 2024</span>. Using Julia version 1.11.2.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/previews/PR63/search_index.js b/previews/PR63/search_index.js
index e0cbcc7..b5a298a 100644
--- a/previews/PR63/search_index.js
+++ b/previews/PR63/search_index.js
@@ -1,3 +1,3 @@
 var documenterSearchIndex = {"docs":
-[{"location":"options/#Iterative-refinement","page":"Options","title":"Iterative refinement","text":"","category":"section"},{"location":"options/","page":"Options","title":"Options","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nn = 100\np = 5\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu + I\nB_cpu = rand(T, n, p)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nB_gpu = CuMatrix(B_cpu)\nX_gpu = similar(B_gpu)\n\nsolver = CudssSolver(A_gpu, \"G\", 'F')\n\n# Perform one step of iterative refinement\nir = 1\ncudss_set(solver, \"ir_n_steps\", ir)\n\ncudss(\"analysis\", solver, X_gpu, B_gpu)\ncudss(\"factorization\", solver, X_gpu, B_gpu)\ncudss(\"solve\", solver, X_gpu, B_gpu)\n\nR_gpu = B_gpu - CuSparseMatrixCSR(A_cpu) * X_gpu\nnorm(R_gpu)","category":"page"},{"location":"options/#User-permutation","page":"Options","title":"User permutation","text":"","category":"section"},{"location":"options/","page":"Options","title":"Options","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\nusing AMD\n\nT = ComplexF64\nn = 100\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu' * A_cpu + I\nb_cpu = rand(T, n)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nb_gpu = CuVector(b_cpu)\nx_gpu = similar(b_gpu)\n\nsolver = CudssSolver(A_gpu, \"HPD\", 'F')\n\n# Provide a user permutation\npermutation = amd(A_cpu) |> Vector{Cint}\ncudss_set(solver, \"user_perm\", permutation)\n\ncudss(\"analysis\", solver, x_gpu, b_gpu)\ncudss(\"factorization\", solver, x_gpu, b_gpu)\ncudss(\"solve\", solver, x_gpu, b_gpu)\n\nr_gpu = b_gpu - CuSparseMatrixCSR(A_cpu) * x_gpu\nnorm(r_gpu)","category":"page"},{"location":"options/#Hybrid-mode","page":"Options","title":"Hybrid mode","text":"","category":"section"},{"location":"options/","page":"Options","title":"Options","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nn = 100\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu + A_cpu' + 
I\nb_cpu = rand(T, n)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nb_gpu = CuVector(b_cpu)\nx_gpu = similar(b_gpu)\n\nsolver = CudssSolver(A_gpu, \"S\", 'F')\n\n# Use the hybrid mode (host and device memory)\ncudss_set(solver, \"hybrid_mode\", 1)\n\ncudss(\"analysis\", solver, x_gpu, b_gpu)\n\n# Minimal amount of device memory required in the hybrid memory mode.\nnbytes_gpu = cudss_get(solver, \"hybrid_device_memory_min\")\n\n# Device memory limit for the hybrid memory mode.\n# Only use it if you don't want to rely on the internal default heuristic.\ncudss_set(solver, \"hybrid_device_memory_limit\", nbytes_gpu)\n\ncudss(\"factorization\", solver, x_gpu, b_gpu)\ncudss(\"solve\", solver, x_gpu, b_gpu)\n\nr_gpu = b_gpu - CuSparseMatrixCSR(A_cpu) * x_gpu\nnorm(r_gpu)","category":"page"},{"location":"#Home","page":"Home","title":"CUDSS.jl documentation","text":"","category":"section"},{"location":"#Overview","page":"Home","title":"Overview","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"CUDSS.jl is a Julia interface to the NVIDIA cuDSS library. NVIDIA cuDSS provides three factorizations (LDU, LDLᵀ, LLᵀ) for solving sparse linear systems on GPUs. 
For more details on using cuDSS, refer to the official cuDSS documentation.","category":"page"},{"location":"#Installation","page":"Home","title":"Installation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"julia> ]\npkg> add CUDSS\npkg> test CUDSS","category":"page"},{"location":"#Types","page":"Home","title":"Types","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"CudssMatrix\nCudssConfig\nCudssData\nCudssSolver","category":"page"},{"location":"#CUDSS.CudssMatrix","page":"Home","title":"CUDSS.CudssMatrix","text":"matrix = CudssMatrix(v::CuVector{T})\nmatrix = CudssMatrix(A::CuMatrix{T})\nmatrix = CudssMatrix(A::CuSparseMatrixCSR{T,Cint}, struture::String, view::Char; index::Char='O')\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nCudssMatrix is a wrapper for CuVector, CuMatrix and CuSparseMatrixCSR. CudssMatrix is used to pass matrix of the linear system, as well as solution and right-hand side.\n\nstructure specifies the stucture for sparse matrices:\n\n\"G\": General matrix – LDU factorization;\n\"S\": Real symmetric matrix – LDLᵀ factorization;\n\"H\": Complex Hermitian matrix – LDLᴴ factorization;\n\"SPD\": Symmetric positive-definite matrix – LLᵀ factorization;\n\"HPD\": Hermitian positive-definite matrix – LLᴴ factorization.\n\nview specifies matrix view for sparse matrices:\n\n'L': Lower-triangular matrix and all values above the main diagonal are ignored;\n'U': Upper-triangular matrix and all values below the main diagonal are ignored;\n'F': Full matrix.\n\nindex specifies indexing base for sparse matrix indices:\n\n'Z': 0-based indexing;\n'O': 1-based indexing.\n\n\n\n\n\n","category":"type"},{"location":"#CUDSS.CudssConfig","page":"Home","title":"CUDSS.CudssConfig","text":"config = CudssConfig()\n\nCudssConfig stores configuration settings for the 
solver.\n\n\n\n\n\n","category":"type"},{"location":"#CUDSS.CudssData","page":"Home","title":"CUDSS.CudssData","text":"data = CudssData()\ndata = CudssData(cudss_handle::cudssHandle_t)\n\nCudssData holds internal data (e.g., LU factors arrays).\n\n\n\n\n\n","category":"type"},{"location":"#CUDSS.CudssSolver","page":"Home","title":"CUDSS.CudssSolver","text":"solver = CudssSolver(A::CuSparseMatrixCSR{T,Cint}, structure::String, view::Char; index::Char='O')\nsolver = CudssSolver(matrix::CudssMatrix{T}, config::CudssConfig, data::CudssData)\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nCudssSolver contains all structures required to solve linear systems with cuDSS. One constructor of CudssSolver takes as input the same parameters as CudssMatrix.\n\nstructure specifies the stucture for sparse matrices:\n\n\"G\": General matrix – LDU factorization;\n\"S\": Real symmetric matrix – LDLᵀ factorization;\n\"H\": Complex Hermitian matrix – LDLᴴ factorization;\n\"SPD\": Symmetric positive-definite matrix – LLᵀ factorization;\n\"HPD\": Hermitian positive-definite matrix – LLᴴ factorization.\n\nview specifies matrix view for sparse matrices:\n\n'L': Lower-triangular matrix and all values above the main diagonal are ignored;\n'U': Upper-triangular matrix and all values below the main diagonal are ignored;\n'F': Full matrix.\n\nindex specifies indexing base for sparse matrix indices:\n\n'Z': 0-based indexing;\n'O': 1-based indexing.\n\nCudssSolver can be also constructed from the three structures CudssMatrix, CudssConfig and CudssData if needed.\n\n\n\n\n\n","category":"type"},{"location":"#Functions","page":"Home","title":"Functions","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"cudss_set\ncudss_get\ncudss","category":"page"},{"location":"#CUDSS.cudss_set","page":"Home","title":"CUDSS.cudss_set","text":"cudss_set(matrix::CudssMatrix{T}, v::CuVector{T})\ncudss_set(matrix::CudssMatrix{T}, 
A::CuMatrix{T})\ncudss_set(matrix::CudssMatrix{T}, A::CuSparseMatrixCSR{T,Cint})\ncudss_set(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\ncudss_set(solver::CudssSolver, parameter::String, value)\ncudss_set(config::CudssConfig, parameter::String, value)\ncudss_set(data::CudssData, parameter::String, value)\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nThe available configuration parameters are:\n\n\"reordering_alg\": Algorithm for the reordering phase (\"default\", \"algo1\", \"algo2\" or \"algo3\");\n\"factorization_alg\": Algorithm for the factorization phase (\"default\", \"algo1\", \"algo2\" or \"algo3\");\n\"solve_alg\": Algorithm for the solving phase (\"default\", \"algo1\", \"algo2\" or \"algo3\");\n\"matching_type\": Type of matching;\n\"solve_mode\": Potential modificator on the system matrix (transpose or adjoint);\n\"ir_n_steps\": Number of steps during the iterative refinement;\n\"ir_tol\": Iterative refinement tolerance;\n\"pivot_type\": Type of pivoting ('C', 'R' or 'N');\n\"pivot_threshold\": Pivoting threshold which is used to determine if digonal element is subject to pivoting;\n\"pivot_epsilon\": Pivoting epsilon, absolute value to replace singular diagonal elements;\n\"max_lu_nnz\": Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;\n\"hybrid_mode\": Memory mode – 0 (default = device-only) or 1 (hybrid = host/device);\n\"hybrid_device_memory_limit\": User-defined device memory limit (number of bytes) for the hybrid memory mode;\n\"use_cuda_register_memory\": A flag to enable (1) or disable (0) usage of cudaHostRegister() by the hybrid memory mode.\n\nThe available data parameters are:\n\n\"user_perm\": User permutation to be used instead of running the reordering algorithms;\n\"comm\": Communicator for Multi-GPU multi-node mode.\n\n\n\n\n\n","category":"function"},{"location":"#CUDSS.cudss_get","page":"Home","title":"CUDSS.cudss_get","text":"value = cudss_get(solver::CudssSolver, 
parameter::String)\nvalue = cudss_get(config::CudssConfig, parameter::String)\nvalue = cudss_get(data::CudssData, parameter::String)\n\nThe available configuration parameters are:\n\n\"reordering_alg\": Algorithm for the reordering phase;\n\"factorization_alg\": Algorithm for the factorization phase;\n\"solve_alg\": Algorithm for the solving phase;\n\"matching_type\": Type of matching;\n\"solve_mode\": Potential modificator on the system matrix (transpose or adjoint);\n\"ir_n_steps\": Number of steps during the iterative refinement;\n\"ir_tol\": Iterative refinement tolerance;\n\"pivot_type\": Type of pivoting;\n\"pivot_threshold\": Pivoting threshold which is used to determine if digonal element is subject to pivoting;\n\"pivot_epsilon\": Pivoting epsilon, absolute value to replace singular diagonal elements;\n\"max_lu_nnz\": Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;\n\"hybrid_mode\": Memory mode – 0 (default = device-only) or 1 (hybrid = host/device);\n\"hybrid_device_memory_limit\": User-defined device memory limit (number of bytes) for the hybrid memory mode;\n\"use_cuda_register_memory\": A flag to enable (1) or disable (0) usage of cudaHostRegister() by the hybrid memory mode.\n\nThe available data parameters are:\n\n\"info\": Device-side error information;\n\"lu_nnz\": Number of non-zero entries in LU factors;\n\"npivots\": Number of pivots encountered during factorization;\n\"inertia\": Tuple of positive and negative indices of inertia for symmetric and hermitian non positive-definite matrix types;\n\"perm_reorder_row\": Reordering permutation for the rows;\n\"perm_reorder_col\": Reordering permutation for the columns;\n\"perm_row\": Final row permutation (which includes effects of both reordering and pivoting);\n\"perm_col\": Final column permutation (which includes effects of both reordering and pivoting);\n\"diag\": Diagonal of the factorized matrix;\n\"hybrid_device_memory_min\": Minimal amount of device 
memory (number of bytes) required in the hybrid memory mode.\n\nThe data parameters \"info\", \"lu_nnz\", \"perm_reorder_row\", \"perm_reorder_col\" and \"hybrid_device_memory_min\" require the phase \"analyse\" performed by cudss. The data parameters \"npivots\", \"inertia\" and \"diag\" require the phases \"analyse\" and \"factorization\" performed by cudss. The data parameters \"perm_row\" and \"perm_col\" are available but not yet functional.\n\n\n\n\n\n","category":"function"},{"location":"#CUDSS.cudss","page":"Home","title":"CUDSS.cudss","text":"cudss(phase::String, solver::CudssSolver{T}, x::CuVector{T}, b::CuVector{T})\ncudss(phase::String, solver::CudssSolver{T}, X::CuMatrix{T}, B::CuMatrix{T})\ncudss(phase::String, solver::CudssSolver{T}, X::CudssMatrix{T}, B::CudssMatrix{T})\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nThe available phases are \"analysis\", \"factorization\", \"refactorization\" and \"solve\". The phases \"solve_fwd\", \"solve_diag\" and \"solve_bwd\" are available but not yet functional.\n\n\n\n\n\n","category":"function"},{"location":"generic/#LLᵀ-and-LLᴴ","page":"Generic API","title":"LLᵀ and LLᴴ","text":"","category":"section"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"    LinearAlgebra.cholesky(A::CuSparseMatrixCSR{T,Cint}; view::Char='F') where T <: LinearAlgebra.BlasFloat\n    LinearAlgebra.cholesky!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat","category":"page"},{"location":"generic/#LinearAlgebra.cholesky-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.cholesky","text":"solver = cholesky(A::CuSparseMatrixCSR{T,Cint}; view::Char='F')\n\nCompute the LLᴴ factorization of a sparse matrix A on an NVIDIA GPU. 
The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nInput argument\n\nA: a sparse Hermitian positive definite matrix stored in the CuSparseMatrixCSR format.\n\nKeyword argument\n\n*view: A character that specifies which triangle of the sparse matrix is provided. Possible options are L for the lower triangle, U for the upper triangle, and F for the full matrix.\n\nOutput argument\n\nsolver: Opaque structure CudssSolver that stores the factors of the LLᴴ decomposition.\n\n\n\n\n\n","category":"method"},{"location":"generic/#LinearAlgebra.cholesky!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.cholesky!","text":"solver = cholesky!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LLᴴ factorization of a sparse matrix A on an NVIDIA GPU, reusing the symbolic factorization stored in solver. The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\n\n\n\n\n","category":"method"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = ComplexF64\nR = real(T)\nn = 100\np = 5\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu * A_cpu' + I\nB_cpu = rand(T, n, p)\n\nA_gpu = CuSparseMatrixCSR(A_cpu |> triu)\nB_gpu = CuMatrix(B_cpu)\nX_gpu = similar(B_gpu)\n\nF = cholesky(A_gpu, view='U')\nX_gpu = F \\ B_gpu\n\nR_gpu = B_gpu - CuSparseMatrixCSR(A_cpu) * X_gpu\nnorm(R_gpu)\n\n# In-place LLᴴ\nd_gpu = rand(R, n) |> CuVector\nA_gpu = A_gpu + Diagonal(d_gpu)\ncholesky!(F, A_gpu)\n\nC_cpu = rand(T, n, p)\nC_gpu = CuMatrix(C_cpu)\nldiv!(X_gpu, F, C_gpu)\n\nR_gpu = C_gpu - ( CuSparseMatrixCSR(A_cpu) + Diagonal(d_gpu) ) * X_gpu\nnorm(R_gpu)","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"note: Note\nIf we only store one triangle of A_gpu, we can also use the wrappers Symmetric and 
Hermitian instead of using the keyword argument view in cholesky. For real matrices, both wrappers are allowed but only Hermitian can be used for complex matrices.","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"H_gpu = Hermitian(A_gpu, :U)\nF = cholesky(H_gpu)","category":"page"},{"location":"generic/#LDLᵀ-and-LDLᴴ","page":"Generic API","title":"LDLᵀ and LDLᴴ","text":"","category":"section"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"    LinearAlgebra.ldlt(A::CuSparseMatrixCSR{T,Cint}; view::Char='F') where T <: LinearAlgebra.BlasFloat\n    LinearAlgebra.ldlt!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat","category":"page"},{"location":"generic/#LinearAlgebra.ldlt-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.ldlt","text":"solver = ldlt(A::CuSparseMatrixCSR{T,Cint}; view::Char='F')\n\nCompute the LDLᴴ factorization of a sparse matrix A on an NVIDIA GPU. The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nInput argument\n\nA: a sparse Hermitian matrix stored in the CuSparseMatrixCSR format.\n\nKeyword argument\n\n*view: A character that specifies which triangle of the sparse matrix is provided. 
Possible options are L for the lower triangle, U for the upper triangle, and F for the full matrix.\n\nOutput argument\n\nsolver: Opaque structure CudssSolver that stores the factors of the LDLᴴ decomposition.\n\n\n\n\n\n","category":"method"},{"location":"generic/#LinearAlgebra.ldlt!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.ldlt!","text":"solver = ldlt!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LDLᴴ factorization of a sparse matrix A on an NVIDIA GPU, reusing the symbolic factorization stored in solver. The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\n\n\n\n\n","category":"method"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nR = real(T)\nn = 100\np = 5\nA_cpu = sprand(T, n, n, 0.05) + I\nA_cpu = A_cpu + A_cpu'\nB_cpu = rand(T, n, p)\n\nA_gpu = CuSparseMatrixCSR(A_cpu |> tril)\nB_gpu = CuMatrix(B_cpu)\nX_gpu = similar(B_gpu)\n\nF = ldlt(A_gpu, view='L')\nX_gpu = F \\ B_gpu\n\nR_gpu = B_gpu - CuSparseMatrixCSR(A_cpu) * X_gpu\nnorm(R_gpu)\n\n# In-place LDLᵀ\nd_gpu = rand(R, n) |> CuVector\nA_gpu = A_gpu + Diagonal(d_gpu)\nldlt!(F, A_gpu)\n\nC_cpu = rand(T, n, p)\nC_gpu = CuMatrix(C_cpu)\nldiv!(X_gpu, F, C_gpu)\n\nR_gpu = C_gpu - ( CuSparseMatrixCSR(A_cpu) + Diagonal(d_gpu) ) * X_gpu\nnorm(R_gpu)","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"note: Note\nIf we only store one triangle of A_gpu, we can also use the wrappers Symmetric and Hermitian instead of using the keyword argument view in ldlt. 
For real matrices, both wrappers are allowed but only Hermitian can be used for complex matrices.","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"S_gpu = Symmetric(A_gpu, :L)\nF = ldlt(S_gpu)","category":"page"},{"location":"generic/#LU","page":"Generic API","title":"LU","text":"","category":"section"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"    LinearAlgebra.lu(A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat\n    LinearAlgebra.lu!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat","category":"page"},{"location":"generic/#LinearAlgebra.lu-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.lu","text":"solver = lu(A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LU factorization of a sparse matrix A on an NVIDIA GPU. The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nInput argument\n\nA: a sparse square matrix stored in the CuSparseMatrixCSR format.\n\nOutput argument\n\nsolver: an opaque structure CudssSolver that stores the factors of the LU decomposition.\n\n\n\n\n\n","category":"method"},{"location":"generic/#LinearAlgebra.lu!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.lu!","text":"solver = lu!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LU factorization of a sparse matrix A on an NVIDIA GPU, reusing the symbolic factorization stored in solver. 
The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\n\n\n\n\n","category":"method"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nn = 100\nA_cpu = sprand(T, n, n, 0.05) + I\nb_cpu = rand(T, n)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nb_gpu = CuVector(b_cpu)\n\nF = lu(A_gpu)\nx_gpu = F \\ b_gpu\n\nr_gpu = b_gpu - A_gpu * x_gpu\nnorm(r_gpu)\n\n# In-place LU\nd_gpu = rand(T, n) |> CuVector\nA_gpu = A_gpu + Diagonal(d_gpu)\nlu!(F, A_gpu)\n\nc_cpu = rand(T, n)\nc_gpu = CuVector(c_cpu)\nldiv!(x_gpu, F, c_gpu)\n\nr_gpu = c_gpu - A_gpu * x_gpu\nnorm(r_gpu)","category":"page"}]
+[{"location":"options/#Iterative-refinement","page":"Options","title":"Iterative refinement","text":"","category":"section"},{"location":"options/","page":"Options","title":"Options","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nn = 100\np = 5\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu + I\nB_cpu = rand(T, n, p)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nB_gpu = CuMatrix(B_cpu)\nX_gpu = similar(B_gpu)\n\nsolver = CudssSolver(A_gpu, \"G\", 'F')\n\n# Perform one step of iterative refinement\nir = 1\ncudss_set(solver, \"ir_n_steps\", ir)\n\ncudss(\"analysis\", solver, X_gpu, B_gpu)\ncudss(\"factorization\", solver, X_gpu, B_gpu)\ncudss(\"solve\", solver, X_gpu, B_gpu)\n\nR_gpu = B_gpu - CuSparseMatrixCSR(A_cpu) * X_gpu\nnorm(R_gpu)","category":"page"},{"location":"options/#User-permutation","page":"Options","title":"User permutation","text":"","category":"section"},{"location":"options/","page":"Options","title":"Options","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\nusing AMD\n\nT = ComplexF64\nn = 100\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu' * A_cpu + I\nb_cpu = rand(T, n)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nb_gpu = CuVector(b_cpu)\nx_gpu = similar(b_gpu)\n\nsolver = CudssSolver(A_gpu, \"HPD\", 'F')\n\n# Provide a user permutation\npermutation = amd(A_cpu) |> Vector{Cint}\ncudss_set(solver, \"user_perm\", permutation)\n\ncudss(\"analysis\", solver, x_gpu, b_gpu)\ncudss(\"factorization\", solver, x_gpu, b_gpu)\ncudss(\"solve\", solver, x_gpu, b_gpu)\n\nr_gpu = b_gpu - CuSparseMatrixCSR(A_cpu) * x_gpu\nnorm(r_gpu)","category":"page"},{"location":"options/#Hybrid-mode","page":"Options","title":"Hybrid mode","text":"","category":"section"},{"location":"options/","page":"Options","title":"Options","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nn = 100\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu + A_cpu' + 
I\nb_cpu = rand(T, n)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nb_gpu = CuVector(b_cpu)\nx_gpu = similar(b_gpu)\n\nsolver = CudssSolver(A_gpu, \"S\", 'F')\n\n# Use the hybrid mode (host and device memory)\ncudss_set(solver, \"hybrid_mode\", 1)\n\ncudss(\"analysis\", solver, x_gpu, b_gpu)\n\n# Minimal amount of device memory required in the hybrid memory mode.\nnbytes_gpu = cudss_get(solver, \"hybrid_device_memory_min\")\n\n# Device memory limit for the hybrid memory mode.\n# Only use it if you don't want to rely on the internal default heuristic.\ncudss_set(solver, \"hybrid_device_memory_limit\", nbytes_gpu)\n\ncudss(\"factorization\", solver, x_gpu, b_gpu)\ncudss(\"solve\", solver, x_gpu, b_gpu)\n\nr_gpu = b_gpu - CuSparseMatrixCSR(A_cpu) * x_gpu\nnorm(r_gpu)","category":"page"},{"location":"#Home","page":"Home","title":"CUDSS.jl documentation","text":"","category":"section"},{"location":"#Overview","page":"Home","title":"Overview","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"CUDSS.jl is a Julia interface to the NVIDIA cuDSS library. NVIDIA cuDSS provides three factorizations (LDU, LDLᵀ, LLᵀ) for solving sparse linear systems on GPUs. 
For more details on using cuDSS, refer to the official cuDSS documentation.","category":"page"},{"location":"#Installation","page":"Home","title":"Installation","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"julia> ]\npkg> add CUDSS\npkg> test CUDSS","category":"page"},{"location":"#Types","page":"Home","title":"Types","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"CudssMatrix\nCudssConfig\nCudssData\nCudssSolver","category":"page"},{"location":"#CUDSS.CudssMatrix","page":"Home","title":"CUDSS.CudssMatrix","text":"matrix = CudssMatrix(v::CuVector{T})\nmatrix = CudssMatrix(A::CuMatrix{T})\nmatrix = CudssMatrix(A::CuSparseMatrixCSR{T,Cint}, struture::String, view::Char; index::Char='O')\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nCudssMatrix is a wrapper for CuVector, CuMatrix and CuSparseMatrixCSR. CudssMatrix is used to pass matrix of the linear system, as well as solution and right-hand side.\n\nstructure specifies the stucture for sparse matrices:\n\n\"G\": General matrix – LDU factorization;\n\"S\": Real symmetric matrix – LDLᵀ factorization;\n\"H\": Complex Hermitian matrix – LDLᴴ factorization;\n\"SPD\": Symmetric positive-definite matrix – LLᵀ factorization;\n\"HPD\": Hermitian positive-definite matrix – LLᴴ factorization.\n\nview specifies matrix view for sparse matrices:\n\n'L': Lower-triangular matrix and all values above the main diagonal are ignored;\n'U': Upper-triangular matrix and all values below the main diagonal are ignored;\n'F': Full matrix.\n\nindex specifies indexing base for sparse matrix indices:\n\n'Z': 0-based indexing;\n'O': 1-based indexing.\n\n\n\n\n\n","category":"type"},{"location":"#CUDSS.CudssConfig","page":"Home","title":"CUDSS.CudssConfig","text":"config = CudssConfig()\n\nCudssConfig stores configuration settings for the 
solver.\n\n\n\n\n\n","category":"type"},{"location":"#CUDSS.CudssData","page":"Home","title":"CUDSS.CudssData","text":"data = CudssData()\ndata = CudssData(cudss_handle::cudssHandle_t)\n\nCudssData holds internal data (e.g., LU factors arrays).\n\n\n\n\n\n","category":"type"},{"location":"#CUDSS.CudssSolver","page":"Home","title":"CUDSS.CudssSolver","text":"solver = CudssSolver(A::CuSparseMatrixCSR{T,Cint}, structure::String, view::Char; index::Char='O')\nsolver = CudssSolver(matrix::CudssMatrix{T}, config::CudssConfig, data::CudssData)\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nCudssSolver contains all structures required to solve linear systems with cuDSS. One constructor of CudssSolver takes as input the same parameters as CudssMatrix.\n\nstructure specifies the structure for sparse matrices:\n\n\"G\": General matrix – LDU factorization;\n\"S\": Real symmetric matrix – LDLᵀ factorization;\n\"H\": Complex Hermitian matrix – LDLᴴ factorization;\n\"SPD\": Symmetric positive-definite matrix – LLᵀ factorization;\n\"HPD\": Hermitian positive-definite matrix – LLᴴ factorization.\n\nview specifies matrix view for sparse matrices:\n\n'L': Lower-triangular matrix and all values above the main diagonal are ignored;\n'U': Upper-triangular matrix and all values below the main diagonal are ignored;\n'F': Full matrix.\n\nindex specifies indexing base for sparse matrix indices:\n\n'Z': 0-based indexing;\n'O': 1-based indexing.\n\nCudssSolver can also be constructed from the three structures CudssMatrix, CudssConfig and CudssData if needed.\n\n\n\n\n\n","category":"type"},{"location":"#Functions","page":"Home","title":"Functions","text":"","category":"section"},{"location":"","page":"Home","title":"Home","text":"cudss_set\ncudss_get\ncudss","category":"page"},{"location":"#CUDSS.cudss_set","page":"Home","title":"CUDSS.cudss_set","text":"cudss_set(matrix::CudssMatrix{T}, v::CuVector{T})\ncudss_set(matrix::CudssMatrix{T}, 
A::CuMatrix{T})\ncudss_set(matrix::CudssMatrix{T}, A::CuSparseMatrixCSR{T,Cint})\ncudss_set(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\ncudss_set(solver::CudssSolver, parameter::String, value)\ncudss_set(config::CudssConfig, parameter::String, value)\ncudss_set(data::CudssData, parameter::String, value)\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nThe available configuration parameters are:\n\n\"reordering_alg\": Algorithm for the reordering phase (\"default\", \"algo1\", \"algo2\" or \"algo3\");\n\"factorization_alg\": Algorithm for the factorization phase (\"default\", \"algo1\", \"algo2\" or \"algo3\");\n\"solve_alg\": Algorithm for the solving phase (\"default\", \"algo1\", \"algo2\" or \"algo3\");\n\"matching_type\": Type of matching;\n\"solve_mode\": Potential modifier on the system matrix (transpose or adjoint);\n\"ir_n_steps\": Number of steps during the iterative refinement;\n\"ir_tol\": Iterative refinement tolerance;\n\"pivot_type\": Type of pivoting ('C', 'R' or 'N');\n\"pivot_threshold\": Pivoting threshold which is used to determine if a diagonal element is subject to pivoting;\n\"pivot_epsilon\": Pivoting epsilon, absolute value to replace singular diagonal elements;\n\"max_lu_nnz\": Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;\n\"hybrid_mode\": Memory mode – 0 (default = device-only) or 1 (hybrid = host/device);\n\"hybrid_device_memory_limit\": User-defined device memory limit (number of bytes) for the hybrid memory mode;\n\"use_cuda_register_memory\": A flag to enable (1) or disable (0) usage of cudaHostRegister() by the hybrid memory mode.\n\nThe available data parameters are:\n\n\"user_perm\": User permutation to be used instead of running the reordering algorithms;\n\"comm\": Communicator for Multi-GPU multi-node mode.\n\n\n\n\n\n","category":"function"},{"location":"#CUDSS.cudss_get","page":"Home","title":"CUDSS.cudss_get","text":"value = cudss_get(solver::CudssSolver, 
parameter::String)\nvalue = cudss_get(config::CudssConfig, parameter::String)\nvalue = cudss_get(data::CudssData, parameter::String)\n\nThe available configuration parameters are:\n\n\"reordering_alg\": Algorithm for the reordering phase;\n\"factorization_alg\": Algorithm for the factorization phase;\n\"solve_alg\": Algorithm for the solving phase;\n\"matching_type\": Type of matching;\n\"solve_mode\": Potential modifier on the system matrix (transpose or adjoint);\n\"ir_n_steps\": Number of steps during the iterative refinement;\n\"ir_tol\": Iterative refinement tolerance;\n\"pivot_type\": Type of pivoting;\n\"pivot_threshold\": Pivoting threshold which is used to determine if a diagonal element is subject to pivoting;\n\"pivot_epsilon\": Pivoting epsilon, absolute value to replace singular diagonal elements;\n\"max_lu_nnz\": Upper limit on the number of nonzero entries in LU factors for non-symmetric matrices;\n\"hybrid_mode\": Memory mode – 0 (default = device-only) or 1 (hybrid = host/device);\n\"hybrid_device_memory_limit\": User-defined device memory limit (number of bytes) for the hybrid memory mode;\n\"use_cuda_register_memory\": A flag to enable (1) or disable (0) usage of cudaHostRegister() by the hybrid memory mode.\n\nThe available data parameters are:\n\n\"info\": Device-side error information;\n\"lu_nnz\": Number of non-zero entries in LU factors;\n\"npivots\": Number of pivots encountered during factorization;\n\"inertia\": Tuple of positive and negative indices of inertia for symmetric and Hermitian non positive-definite matrix types;\n\"perm_reorder_row\": Reordering permutation for the rows;\n\"perm_reorder_col\": Reordering permutation for the columns;\n\"perm_row\": Final row permutation (which includes effects of both reordering and pivoting);\n\"perm_col\": Final column permutation (which includes effects of both reordering and pivoting);\n\"diag\": Diagonal of the factorized matrix;\n\"hybrid_device_memory_min\": Minimal amount of device 
memory (number of bytes) required in the hybrid memory mode;\n\"memory_estimates\": Memory estimates (in bytes) for host and device memory required for the chosen memory mode.\n\nThe data parameters \"info\", \"lu_nnz\", \"perm_reorder_row\", \"perm_reorder_col\", \"hybrid_device_memory_min\" and \"memory_estimates\" require the phase \"analysis\" performed by cudss. The data parameters \"npivots\", \"inertia\" and \"diag\" require the phases \"analysis\" and \"factorization\" performed by cudss. The data parameters \"perm_row\" and \"perm_col\" are available but not yet functional.\n\n\n\n\n\n","category":"function"},{"location":"#CUDSS.cudss","page":"Home","title":"CUDSS.cudss","text":"cudss(phase::String, solver::CudssSolver{T}, x::CuVector{T}, b::CuVector{T})\ncudss(phase::String, solver::CudssSolver{T}, X::CuMatrix{T}, B::CuMatrix{T})\ncudss(phase::String, solver::CudssSolver{T}, X::CudssMatrix{T}, B::CudssMatrix{T})\n\nThe type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nThe available phases are \"analysis\", \"factorization\", \"refactorization\" and \"solve\". 
The phases \"solve_fwd\", \"solve_diag\" and \"solve_bwd\" are available but not yet functional.\n\n\n\n\n\n","category":"function"},{"location":"generic/#LLᵀ-and-LLᴴ","page":"Generic API","title":"LLᵀ and LLᴴ","text":"","category":"section"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"    LinearAlgebra.cholesky(A::CuSparseMatrixCSR{T,Cint}; view::Char='F') where T <: LinearAlgebra.BlasFloat\n    LinearAlgebra.cholesky!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat","category":"page"},{"location":"generic/#LinearAlgebra.cholesky-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.cholesky","text":"solver = cholesky(A::CuSparseMatrixCSR{T,Cint}; view::Char='F')\n\nCompute the LLᴴ factorization of a sparse matrix A on an NVIDIA GPU. The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nInput argument\n\nA: a sparse Hermitian positive definite matrix stored in the CuSparseMatrixCSR format.\n\nKeyword argument\n\nview: A character that specifies which triangle of the sparse matrix is provided. Possible options are L for the lower triangle, U for the upper triangle, and F for the full matrix.\n\nOutput argument\n\nsolver: Opaque structure CudssSolver that stores the factors of the LLᴴ decomposition.\n\n\n\n\n\n","category":"method"},{"location":"generic/#LinearAlgebra.cholesky!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.cholesky!","text":"solver = cholesky!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LLᴴ factorization of a sparse matrix A on an NVIDIA GPU, reusing the symbolic factorization stored in solver. 
The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\n\n\n\n\n","category":"method"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = ComplexF64\nR = real(T)\nn = 100\np = 5\nA_cpu = sprand(T, n, n, 0.01)\nA_cpu = A_cpu * A_cpu' + I\nB_cpu = rand(T, n, p)\n\nA_gpu = CuSparseMatrixCSR(A_cpu |> triu)\nB_gpu = CuMatrix(B_cpu)\nX_gpu = similar(B_gpu)\n\nF = cholesky(A_gpu, view='U')\nX_gpu = F \\ B_gpu\n\nR_gpu = B_gpu - CuSparseMatrixCSR(A_cpu) * X_gpu\nnorm(R_gpu)\n\n# In-place LLᴴ\nd_gpu = rand(R, n) |> CuVector\nA_gpu = A_gpu + Diagonal(d_gpu)\ncholesky!(F, A_gpu)\n\nC_cpu = rand(T, n, p)\nC_gpu = CuMatrix(C_cpu)\nldiv!(X_gpu, F, C_gpu)\n\nR_gpu = C_gpu - ( CuSparseMatrixCSR(A_cpu) + Diagonal(d_gpu) ) * X_gpu\nnorm(R_gpu)","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"note: Note\nIf we only store one triangle of A_gpu, we can also use the wrappers Symmetric and Hermitian instead of using the keyword argument view in cholesky. 
For real matrices, both wrappers are allowed but only Hermitian can be used for complex matrices.","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"H_gpu = Hermitian(A_gpu, :U)\nF = cholesky(H_gpu)","category":"page"},{"location":"generic/#LDLᵀ-and-LDLᴴ","page":"Generic API","title":"LDLᵀ and LDLᴴ","text":"","category":"section"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"    LinearAlgebra.ldlt(A::CuSparseMatrixCSR{T,Cint}; view::Char='F') where T <: LinearAlgebra.BlasFloat\n    LinearAlgebra.ldlt!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat","category":"page"},{"location":"generic/#LinearAlgebra.ldlt-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.ldlt","text":"solver = ldlt(A::CuSparseMatrixCSR{T,Cint}; view::Char='F')\n\nCompute the LDLᴴ factorization of a sparse matrix A on an NVIDIA GPU. The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nInput argument\n\nA: a sparse Hermitian matrix stored in the CuSparseMatrixCSR format.\n\nKeyword argument\n\nview: A character that specifies which triangle of the sparse matrix is provided. Possible options are L for the lower triangle, U for the upper triangle, and F for the full matrix.\n\nOutput argument\n\nsolver: Opaque structure CudssSolver that stores the factors of the LDLᴴ decomposition.\n\n\n\n\n\n","category":"method"},{"location":"generic/#LinearAlgebra.ldlt!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.ldlt!","text":"solver = ldlt!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LDLᴴ factorization of a sparse matrix A on an NVIDIA GPU, reusing the symbolic factorization stored in solver. 
The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\n\n\n\n\n","category":"method"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nR = real(T)\nn = 100\np = 5\nA_cpu = sprand(T, n, n, 0.05) + I\nA_cpu = A_cpu + A_cpu'\nB_cpu = rand(T, n, p)\n\nA_gpu = CuSparseMatrixCSR(A_cpu |> tril)\nB_gpu = CuMatrix(B_cpu)\nX_gpu = similar(B_gpu)\n\nF = ldlt(A_gpu, view='L')\nX_gpu = F \\ B_gpu\n\nR_gpu = B_gpu - CuSparseMatrixCSR(A_cpu) * X_gpu\nnorm(R_gpu)\n\n# In-place LDLᵀ\nd_gpu = rand(R, n) |> CuVector\nA_gpu = A_gpu + Diagonal(d_gpu)\nldlt!(F, A_gpu)\n\nC_cpu = rand(T, n, p)\nC_gpu = CuMatrix(C_cpu)\nldiv!(X_gpu, F, C_gpu)\n\nR_gpu = C_gpu - ( CuSparseMatrixCSR(A_cpu) + Diagonal(d_gpu) ) * X_gpu\nnorm(R_gpu)","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"note: Note\nIf we only store one triangle of A_gpu, we can also use the wrappers Symmetric and Hermitian instead of using the keyword argument view in ldlt. 
For real matrices, both wrappers are allowed but only Hermitian can be used for complex matrices.","category":"page"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"S_gpu = Symmetric(A_gpu, :L)\nF = ldlt(S_gpu)","category":"page"},{"location":"generic/#LU","page":"Generic API","title":"LU","text":"","category":"section"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"    LinearAlgebra.lu(A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat\n    LinearAlgebra.lu!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint}) where T <: LinearAlgebra.BlasFloat","category":"page"},{"location":"generic/#LinearAlgebra.lu-Union{Tuple{CuSparseMatrixCSR{T, Int32}}, Tuple{T}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.lu","text":"solver = lu(A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LU factorization of a sparse matrix A on an NVIDIA GPU. The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\nInput argument\n\nA: a sparse square matrix stored in the CuSparseMatrixCSR format.\n\nOutput argument\n\nsolver: an opaque structure CudssSolver that stores the factors of the LU decomposition.\n\n\n\n\n\n","category":"method"},{"location":"generic/#LinearAlgebra.lu!-Union{Tuple{T}, Tuple{CudssSolver{T}, CuSparseMatrixCSR{T, Int32}}} where T<:Union{Float32, Float64, ComplexF64, ComplexF32}","page":"Generic API","title":"LinearAlgebra.lu!","text":"solver = lu!(solver::CudssSolver{T}, A::CuSparseMatrixCSR{T,Cint})\n\nCompute the LU factorization of a sparse matrix A on an NVIDIA GPU, reusing the symbolic factorization stored in solver. 
The type T can be Float32, Float64, ComplexF32 or ComplexF64.\n\n\n\n\n\n","category":"method"},{"location":"generic/","page":"Generic API","title":"Generic API","text":"using CUDA, CUDA.CUSPARSE\nusing CUDSS\nusing LinearAlgebra\nusing SparseArrays\n\nT = Float64\nn = 100\nA_cpu = sprand(T, n, n, 0.05) + I\nb_cpu = rand(T, n)\n\nA_gpu = CuSparseMatrixCSR(A_cpu)\nb_gpu = CuVector(b_cpu)\n\nF = lu(A_gpu)\nx_gpu = F \\ b_gpu\n\nr_gpu = b_gpu - A_gpu * x_gpu\nnorm(r_gpu)\n\n# In-place LU\nd_gpu = rand(T, n) |> CuVector\nA_gpu = A_gpu + Diagonal(d_gpu)\nlu!(F, A_gpu)\n\nc_cpu = rand(T, n)\nc_gpu = CuVector(c_cpu)\nldiv!(x_gpu, F, c_gpu)\n\nr_gpu = c_gpu - A_gpu * x_gpu\nnorm(r_gpu)","category":"page"}]
 }