Skip to content

Commit

Permalink
Add an algorithm that does the O(N^5) work on the CPU but the other work on the GPU, which is slower
Browse files Browse the repository at this point in the history
  • Loading branch information
jeffhammond committed Oct 16, 2024
1 parent c562fc8 commit f3b5539
Showing 1 changed file with 9 additions and 1 deletion.
10 changes: 9 additions & 1 deletion src/tce/ccsd/ccsd_t2.F
Original file line number Diff line number Diff line change
Expand Up @@ -309,11 +309,19 @@ SUBROUTINE ccsd_t2(rtdb,d_f1,d_i0,d_t1,d_t2,d_v2,
CALL ccsd_t2_7_3(d_t2,k_t2_offset,d_v2,k_v2_offset,
& d_i1,k_i1_offset)
else if (ccsd_t2_7_alg.eq.2) then
! no GPU in 7_1_x yet - it just does transpose
CALL ccsd_t2_7_1_x(d_v2,k_v2_offset,
& d_i1,k_i1_offset,maxh,maxp)
CALL ccsd_t2_7_2_x(d_t1,k_t1_offset,d_v2,k_v2_offset,
& d_i1,k_i1_offset,maxh,maxp)
CALL ccsd_t2_7_3_x(d_t2,k_t2_offset,d_v2,k_v2_offset,
& d_i1,k_i1_offset,maxh,maxp)
else if (ccsd_t2_7_alg.eq.3) then
CALL ccsd_t2_7_1(d_v2,k_v2_offset,
& d_i1,k_i1_offset,maxh,maxp)
CALL ccsd_t2_7_2(d_t1,k_t1_offset,d_v2,k_v2_offset,
& d_i1,k_i1_offset,maxh,maxp)
CALL ccsd_t2_7_3_x(d_t2,k_t2_offset,d_v2,k_v2_offset,
& d_i1,k_i1_offset,maxh,maxp)
else
CALL errquit('ccsd_t2_7_alg',ccsd_t2_7_alg,INPUT_ERR)
Expand All @@ -322,7 +330,7 @@ SUBROUTINE ccsd_t2(rtdb,d_f1,d_i0,d_t1,d_t2,d_v2,
if (ccsd_t2_7_alg.eq.1) then
CALL ccsd_t2_7(d_t2,k_t2_offset,d_i1,k_i1_offset,
& d_i0,k_i0_offset)
else if (ccsd_t2_7_alg.eq.2) then
else if (ccsd_t2_7_alg.gt.1) then
CALL ccsd_t2_7_x(d_t2,k_t2_offset,d_i1,k_i1_offset,
& d_i0,k_i0_offset,maxh,maxp)
else
Expand Down

0 comments on commit f3b5539

Please sign in to comment.