Graphite Version 3
An experimental 3D geometry processing program
Loading...
Searching...
No Matches
nl_blas.h
Go to the documentation of this file.
1/*
2 * Copyright (c) 2000-2022 Inria
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * * Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 * * Redistributions in binary form must reproduce the above copyright notice,
11 * this list of conditions and the following disclaimer in the documentation
12 * and/or other materials provided with the distribution.
13 * * Neither the name of the ALICE Project-Team nor the names of its
14 * contributors may be used to endorse or promote products derived from this
15 * software without specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
21 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
27 * POSSIBILITY OF SUCH DAMAGE.
28 *
29 * Contact: Bruno Levy
30 *
31 * https://www.inria.fr/fr/bruno-levy
32 *
33 * Inria,
34 * Domaine de Voluceau,
35 * 78150 Le Chesnay - Rocquencourt
36 * FRANCE
37 *
38 */
39
40#include "nl_private.h"
41
48#ifndef OPENNL_BLAS_H
49#define OPENNL_BLAS_H
50
51#ifdef __cplusplus
52extern "C" {
53#endif
54
58 struct NLBlas;
59
63 typedef struct NLBlas* NLBlas_t;
64
69 typedef enum {
70 NoTranspose=0, Transpose=1, ConjugateTranspose=2
72
77 typedef enum {
78 UpperTriangle=0, LowerTriangle=1
80
85 typedef enum {
86 UnitTriangular=0, NotUnitTriangular=1
88
94 typedef enum {
95 NL_HOST_MEMORY, NL_DEVICE_MEMORY
97
107 typedef void* (*FUNPTR_malloc)(
108 NLBlas_t blas, NLmemoryType type, size_t size
109 );
110
120 typedef void (*FUNPTR_free)(
121 NLBlas_t blas, NLmemoryType type, size_t size, void* ptr
122 );
123
135 typedef void (*FUNPTR_memcpy)(
136 NLBlas_t blas,
137 void* to, NLmemoryType to_type,
138 void* from, NLmemoryType from_type,
139 size_t size
140 );
141
151 typedef void (*FUNPTR_memset)(
152 NLBlas_t blas,
153 void* to, NLmemoryType to_type,
154 int c, size_t size
155 );
156
169 typedef void (*FUNPTR_dcopy)(
170 NLBlas_t blas, int n, const double *x, int incx, double *y, int incy
171 );
172
182 typedef void (*FUNPTR_dscal)(
183 NLBlas_t blas, int n, double a, double *x, int incx
184 );
185
186
199 typedef double (*FUNPTR_ddot)(
200 NLBlas_t blas,
201 int n, const double *x, int incx, const double *y, int incy
202 );
203
213 typedef double (*FUNPTR_dnrm2)(
214 NLBlas_t blas, int n, const double *x, int incx
215 );
216
230 typedef void (*FUNPTR_daxpy)(
231 NLBlas_t blas, int n,
232 double a, const double *x, int incx, double *y, int incy
233 );
234
235
244 typedef void (*FUNPTR_dmul)(
245 NLBlas_t blas, int n,
246 const double* x, const double* y, double* z
247 );
248
285 typedef void (*FUNPTR_dgemv)(
286 NLBlas_t blas, MatrixTranspose trans, int m, int n, double alpha,
287 const double *A, int ldA, const double *x, int incx,
288 double beta, double *y, int incy
289 );
290
291
333 typedef void (*FUNPTR_dtpsv)(
334 NLBlas_t blas, MatrixTriangle uplo, MatrixTranspose trans,
335 MatrixUnitTriangular diag, int n, const double *AP,
336 double *x, int incx
337 );
338
339
340
345 typedef void (*FUNPTR_show_stats)(NLBlas_t blas);
346
351 typedef void (*FUNPTR_reset_stats)(NLBlas_t blas);
352
353 struct NLBlas {
354 FUNPTR_malloc Malloc;
355 FUNPTR_free Free;
356 FUNPTR_memcpy Memcpy;
357 FUNPTR_memset Memset;
358
359 FUNPTR_dcopy Dcopy;
360 FUNPTR_dscal Dscal;
361 FUNPTR_ddot Ddot;
362 FUNPTR_dnrm2 Dnrm2;
363 FUNPTR_daxpy Daxpy;
364 FUNPTR_dmul Dmul;
365 FUNPTR_dgemv Dgemv;
366 FUNPTR_dtpsv Dtpsv;
367
368 FUNPTR_reset_stats reset_stats;
369 FUNPTR_show_stats show_stats;
370
371 NLboolean has_unified_memory;
372 double start_time;
373 NLulong flops;
374 NLulong used_ram[2];
375 NLulong max_used_ram[2];
376
377 /*
378 * Used for stats of the linear solver
379 * (a bit ugly, should not be here, but
380 * more convenient for now...)
381 */
382 double sq_rnorm;
383 double sq_bnorm;
384
385 double aux_time;
386 };
387
396
401 NLAPI void NLAPIENTRY nlBlasResetStats(NLBlas_t blas);
402
407 NLAPI void NLAPIENTRY nlBlasShowStats(NLBlas_t blas);
408
415 NLAPI double NLAPIENTRY nlBlasGFlops(NLBlas_t blas);
416
425 NLAPI NLulong NLAPIENTRY nlBlasUsedRam(NLBlas_t blas, NLmemoryType type);
426
435 NLAPI NLulong NLAPIENTRY nlBlasMaxUsedRam(NLBlas_t blas, NLmemoryType type);
436
442 NLAPI NLBlas_t NLAPIENTRY nlHostBlas(void);
443
450#define NL_NEW_VECTOR(blas, memtype, dim) \
451 (double*)blas->Malloc(blas,memtype,(size_t)(dim)*sizeof(double))
452
460#define NL_DELETE_VECTOR(blas, memtype, dim, ptr) \
461 blas->Free(blas,memtype,(size_t)(dim)*sizeof(double),ptr)
462
463/******************************************************************************/
464
465#ifdef __cplusplus
466}
467#endif
468
469#endif
uint64_t NLulong
A 8-bytes unsigned integer.
Definition nl.h:273
unsigned char NLboolean
A truth value (NL_TRUE or NL_FALSE).
Definition nl.h:221
void(* FUNPTR_dscal)(NLBlas_t blas, int n, double a, double *x, int incx)
Scales a vector.
Definition nl_blas.h:182
MatrixTriangle
Specifies which triangular part of a matrix should be used.
Definition nl_blas.h:77
MatrixTranspose
Specifies whether matrix should be transposed.
Definition nl_blas.h:69
NLAPI void NLAPIENTRY nlBlasResetStats(NLBlas_t blas)
Resets the statistics associated with a BLAS context.
void(* FUNPTR_memcpy)(NLBlas_t blas, void *to, NLmemoryType to_type, void *from, NLmemoryType from_type, size_t size)
Copies a bloc of memory.
Definition nl_blas.h:135
void(* FUNPTR_daxpy)(NLBlas_t blas, int n, double a, const double *x, int incx, double *y, int incy)
Computes a linear combination of two vectors.
Definition nl_blas.h:230
MatrixUnitTriangular
Specifies which triangular part of a matrix should be used.
Definition nl_blas.h:85
void *(* FUNPTR_malloc)(NLBlas_t blas, NLmemoryType type, size_t size)
Allocates memory in host or in device.
Definition nl_blas.h:107
NLAPI NLulong NLAPIENTRY nlBlasMaxUsedRam(NLBlas_t blas, NLmemoryType type)
Gets the high mark of used amount of memory computed since creation of the BLAS abstaction layer or s...
struct NLBlas * NLBlas_t
A handle to a BLAS abstraction layer.
Definition nl_blas.h:63
void(* FUNPTR_dtpsv)(NLBlas_t blas, MatrixTriangle uplo, MatrixTranspose trans, MatrixUnitTriangular diag, int n, const double *AP, double *x, int incx)
Solves a linear system.
Definition nl_blas.h:333
NLAPI NLulong NLAPIENTRY nlBlasUsedRam(NLBlas_t blas, NLmemoryType type)
Gets the currently used amount of memory computed since creation of the BLAS abstaction layer or sinc...
NLAPI void NLAPIENTRY nlBlasShowStats(NLBlas_t blas)
Displays the statistics associated with a BLAS context.
void(* FUNPTR_dcopy)(NLBlas_t blas, int n, const double *x, int incx, double *y, int incy)
Copies a vector.
Definition nl_blas.h:169
double(* FUNPTR_dnrm2)(NLBlas_t blas, int n, const double *x, int incx)
Computes the norm of a vector.
Definition nl_blas.h:213
void(* FUNPTR_reset_stats)(NLBlas_t blas)
Resets the statistics associated with a BLAS context.
Definition nl_blas.h:351
void(* FUNPTR_free)(NLBlas_t blas, NLmemoryType type, size_t size, void *ptr)
Frees memory from host or from device.
Definition nl_blas.h:120
NLmemoryType
Specifies on which type of memory a function should be applied.
Definition nl_blas.h:94
NLAPI NLboolean NLAPIENTRY nlBlasHasUnifiedMemory(NLBlas_t blas)
Tests whether BLAS device uses the same address space as the CPU.
NLAPI NLBlas_t NLAPIENTRY nlHostBlas(void)
Gets a pointer to the BLAS abstraction layer for BLAS operation on the host CPU.
double(* FUNPTR_ddot)(NLBlas_t blas, int n, const double *x, int incx, const double *y, int incy)
Computes the dot product between two vectors.
Definition nl_blas.h:199
NLAPI double NLAPIENTRY nlBlasGFlops(NLBlas_t blas)
Gets the number of floating point operations per seconds computed since creation of the BLAS abstacti...
void(* FUNPTR_show_stats)(NLBlas_t blas)
Displays the statistics associated with a BLAS context.
Definition nl_blas.h:345
void(* FUNPTR_dgemv)(NLBlas_t blas, MatrixTranspose trans, int m, int n, double alpha, const double *A, int ldA, const double *x, int incx, double beta, double *y, int incy)
Computes a matrix-vector product.
Definition nl_blas.h:285
void(* FUNPTR_memset)(NLBlas_t blas, void *to, NLmemoryType to_type, int c, size_t size)
Sets a bloc of memory.
Definition nl_blas.h:151
void(* FUNPTR_dmul)(NLBlas_t blas, int n, const double *x, const double *y, double *z)
Component-wise multiplication.
Definition nl_blas.h:244
Some macros and functions used internally by OpenNL.