Mentions légales du service
Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
Chameleon
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Package Registry
Container Registry
Operate
Environments
Terraform modules
Monitor
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
solverstack
Chameleon
Commits
2f9dd95a
Commit
2f9dd95a
authored
6 years ago
by
Mathieu Faverge
Browse files
Options
Downloads
Patches
Plain Diff
Small changes to fix documentation and/or code
parent
f343a4fa
No related branches found
Branches containing commit
No related tags found
Tags containing commit
1 merge request
!129
Fix #56 - Issue in CUDA_zparfb kernels for TT case
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
coreblas/compute/core_zparfb.c
+3
-2
3 additions, 2 deletions
coreblas/compute/core_zparfb.c
coreblas/compute/core_ztpmlqt.c
+8
-7
8 additions, 7 deletions
coreblas/compute/core_ztpmlqt.c
coreblas/compute/core_zttmlq.c
+11
-11
11 additions, 11 deletions
coreblas/compute/core_zttmlq.c
with
22 additions
and
20 deletions
coreblas/compute/core_zparfb.c
+
3
−
2
View file @
2f9dd95a
...
@@ -18,7 +18,7 @@
...
@@ -18,7 +18,7 @@
* @author Mathieu Faverge
* @author Mathieu Faverge
* @author Emmanuel Agullo
* @author Emmanuel Agullo
* @author Cedric Castagnede
* @author Cedric Castagnede
* @date 2011-06-14
* @date 2018-11-09
* @precisions normal z -> c d s
* @precisions normal z -> c d s
*
*
*/
*/
...
@@ -139,7 +139,8 @@
...
@@ -139,7 +139,8 @@
*/
*/
/* This kernel is never traced so return type on previous line for convert2eztrace.pl script */
/* This kernel is never traced so return type on previous line for convert2eztrace.pl script */
int
int
CORE_zparfb
(
cham_side_t
side
,
cham_trans_t
trans
,
cham_dir_t
direct
,
cham_store_t
storev
,
CORE_zparfb
(
cham_side_t
side
,
cham_trans_t
trans
,
cham_dir_t
direct
,
cham_store_t
storev
,
int
M1
,
int
N1
,
int
M2
,
int
N2
,
int
K
,
int
L
,
int
M1
,
int
N1
,
int
M2
,
int
N2
,
int
K
,
int
L
,
CHAMELEON_Complex64_t
*
A1
,
int
LDA1
,
CHAMELEON_Complex64_t
*
A1
,
int
LDA1
,
CHAMELEON_Complex64_t
*
A2
,
int
LDA2
,
CHAMELEON_Complex64_t
*
A2
,
int
LDA2
,
...
...
This diff is collapsed.
Click to expand it.
coreblas/compute/core_ztpmlqt.c
+
8
−
7
View file @
2f9dd95a
...
@@ -13,7 +13,7 @@
...
@@ -13,7 +13,7 @@
*
*
* @version 1.0.0
* @version 1.0.0
* @author Mathieu Faverge
* @author Mathieu Faverge
* @date 2016-12-15
* @date 2018-11-09
* @precisions normal z -> c d s
* @precisions normal z -> c d s
*
*
*/
*/
...
@@ -24,9 +24,11 @@
...
@@ -24,9 +24,11 @@
*
*
* @ingroup CORE_CHAMELEON_Complex64_t
* @ingroup CORE_CHAMELEON_Complex64_t
*
*
* CORE_ztpmlqt applies a complex orthogonal matrix Q obtained from a
* @brief Applies a complex orthogonal matrix Q.
* "triangular-pentagonal" complex block reflector H to a general complex matrix
*
* C, which consists of two blocks A and B.
* The matrix Q is obtained from a "triangular-pentagonal" complex block
* reflector H to a general complex matrix C, which consists of two blocks A and
* B.
*
*
*******************************************************************************
*******************************************************************************
*
*
...
@@ -128,9 +130,8 @@
...
@@ -128,9 +130,8 @@
*
*
*******************************************************************************
*******************************************************************************
*
*
* @return
* @retval CHAMELEON_SUCCESS successful exit
* \retval CHAMELEON_SUCCESS successful exit
* @retval <0 if -i, the i-th argument had an illegal value
* \retval <0 if -i, the i-th argument had an illegal value
*
*
*/
*/
...
...
This diff is collapsed.
Click to expand it.
coreblas/compute/core_zttmlq.c
+
11
−
11
View file @
2f9dd95a
...
@@ -19,7 +19,7 @@
...
@@ -19,7 +19,7 @@
* @author Mathieu Faverge
* @author Mathieu Faverge
* @author Emmanuel Agullo
* @author Emmanuel Agullo
* @author Cedric Castagnede
* @author Cedric Castagnede
* @date 2010-11-15
* @date 2018-11-09
* @precisions normal z -> c d s
* @precisions normal z -> c d s
*
*
*/
*/
...
@@ -127,9 +127,9 @@ int CORE_zttmlq(cham_side_t side, cham_trans_t trans,
...
@@ -127,9 +127,9 @@ int CORE_zttmlq(cham_side_t side, cham_trans_t trans,
const
CHAMELEON_Complex64_t
*
T
,
int
LDT
,
const
CHAMELEON_Complex64_t
*
T
,
int
LDT
,
CHAMELEON_Complex64_t
*
WORK
,
int
LDWORK
)
CHAMELEON_Complex64_t
*
WORK
,
int
LDWORK
)
{
{
int
i
,
i1
,
i3
,
l
;
int
i
,
i1
,
i3
;
int
NW
;
int
NW
;
int
kb
;
int
kb
,
l
;
int
ic
=
0
;
int
ic
=
0
;
int
jc
=
0
;
int
jc
=
0
;
int
mi1
=
M1
;
int
mi1
=
M1
;
...
@@ -205,11 +205,13 @@ int CORE_zttmlq(cham_side_t side, cham_trans_t trans,
...
@@ -205,11 +205,13 @@ int CORE_zttmlq(cham_side_t side, cham_trans_t trans,
}
}
/* Quick return */
/* Quick return */
if
((
M1
==
0
)
||
(
N1
==
0
)
||
(
M2
==
0
)
||
(
N2
==
0
)
||
(
K
==
0
)
||
(
IB
==
0
))
if
((
M1
==
0
)
||
(
N1
==
0
)
||
(
M2
==
0
)
||
(
N2
==
0
)
||
(
K
==
0
)
||
(
IB
==
0
))
{
return
CHAMELEON_SUCCESS
;
return
CHAMELEON_SUCCESS
;
}
if
(((
side
==
ChamLeft
)
&&
(
trans
==
ChamNoTrans
))
if
(
((
side
==
ChamLeft
)
&&
(
trans
==
ChamNoTrans
))
||
||
((
side
==
ChamRight
)
&&
(
trans
!=
ChamNoTrans
)))
{
((
side
==
ChamRight
)
&&
(
trans
!=
ChamNoTrans
))
)
{
i1
=
0
;
i1
=
0
;
i3
=
IB
;
i3
=
IB
;
}
}
...
@@ -248,13 +250,11 @@ int CORE_zttmlq(cham_side_t side, cham_trans_t trans,
...
@@ -248,13 +250,11 @@ int CORE_zttmlq(cham_side_t side, cham_trans_t trans,
CORE_zparfb
(
CORE_zparfb
(
side
,
trans
,
ChamDirForward
,
ChamRowwise
,
side
,
trans
,
ChamDirForward
,
ChamRowwise
,
mi1
,
ni1
,
mi2
,
ni2
,
kb
,
l
,
mi1
,
ni1
,
mi2
,
ni2
,
kb
,
l
,
&
A1
[
LDA1
*
jc
+
ic
]
,
LDA1
,
A1
+
LDA1
*
jc
+
ic
,
LDA1
,
A2
,
LDA2
,
A2
,
LDA2
,
&
V
[
i
]
,
LDV
,
V
+
i
,
LDV
,
&
T
[
LDT
*
i
]
,
LDT
,
T
+
LDT
*
i
,
LDT
,
WORK
,
LDWORK
);
WORK
,
LDWORK
);
}
}
return
CHAMELEON_SUCCESS
;
return
CHAMELEON_SUCCESS
;
}
}
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please register or sign in to comment