Skip to content
This repository was archived by the owner on Apr 24, 2022. It is now read-only.

Commit e8451b3

Browse files
committed Aug 3, 2018
One last small GCN3 optimization
- This group of s_nops is a remnant of a previous implementation and serves no purpose other than to slow us down.
1 parent c3afc3d commit e8451b3

13 files changed

+4
-5
lines changed
 
-32 Bytes
Binary file not shown.
-32 Bytes
Binary file not shown.
-32 Bytes
Binary file not shown.
-32 Bytes
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
-32 Bytes
Binary file not shown.
-32 Bytes
Binary file not shown.
-32 Bytes
Binary file not shown.
-32 Bytes
Binary file not shown.
-32 Bytes
Binary file not shown.

‎libethash-cl/kernels/isa/GCN3_ethash_search.isa

+4-5
Original file line number | Diff line number | Diff line change
@@ -187,7 +187,6 @@
187187
s_load_dwordx8 header_content, header, 0x0
188188
s_waitcnt lgkmcnt(0)
189189

190-
.align 32
191190
v_mov_b32 state7, header_content[7]
192191
v_mov_b32 state6, header_content[6]
193192
v_mov_b32 state5, header_content[5]
@@ -642,7 +641,7 @@
642641

643642
s_movk_i32 mix_index, 0x0
644643

645-
.align 32
644+
.align 32
646645
.mix_loop_\mix_id:
647646
s_bfe_u32 scalar_temp0, mix_index, 0x20003
648647
v_and_b32 temp0, 0xfc, local_id
@@ -791,7 +790,7 @@
791790
s_movk_i32 keccak_round, 0x0
792791
s_branch .keccak_loop
793792

794-
.align 32
793+
.align 32
795794
.test:
796795
/* increment hash count */
797796
v_cmp_eq_u32 vcc, 0, local_id
@@ -855,8 +854,8 @@
855854
s_waitcnt vmcnt(0) & lgkmcnt(0)
856855

857856
s_mov_b64 exec, s[46:47]
858-
s_endpgm
857+
s_endpgm
859858

860-
.align 32
859+
.align 32
861860
fastexit:
862861
s_endpgm

0 commit comments

Comments
 (0)
This repository has been archived.