@@ -308,20 +308,20 @@ function matmulsplitn!(C::AbstractStridedPointer{T}, A, B, α, β, ::StaticInt{M
308
308
_nspawn = Mblocks * Nblocks
309
309
Mbsize_Mrem, Mbsize_ = promote (Mbsize + W, Mbsize)
310
310
Nbsize_Nrem, Nbsize_ = promote (Nbsize + One (), Nbsize)
311
- (tnum, tuu) = Polyester . initial_state (threads)
311
+ (tnum, tuu) = PolyesterWeave . initial_state (threads)
312
312
let _A = A, _B = B, _C = C, n = 0 , Nrc = Nblocks - Nrem, Mrc = Mblocks - Mrem, __Mblocks = Mblocks - One ()
313
313
while true
314
314
nsize = ifelse (Nblocks > Nrc, Nbsize_Nrem, Nbsize_); Nblocks -= 1
315
315
let _A = _A, _C = _C, __Mblocks = __Mblocks
316
316
while __Mblocks != 0
317
317
msize = ifelse (__Mblocks ≥ Mrc, Mbsize_Mrem, Mbsize_); __Mblocks -= 1
318
- (tnum, tuu) = Polyester . iter (tnum, tuu)
318
+ (tnum, tuu) = PolyesterWeave . iter (tnum, tuu)
319
319
launch_thread_mul! (_C, _A, _B, α, β, msize, K, nsize, tnum, Val {PACK} ())
320
320
_A = gesp (_A, (msize, Zero ()))
321
321
_C = gesp (_C, (msize, Zero ()))
322
322
end
323
323
if Nblocks != 0
324
- (tnum, tuu) = Polyester . iter (tnum, tuu)
324
+ (tnum, tuu) = PolyesterWeave . iter (tnum, tuu)
325
325
launch_thread_mul! (_C, _A, _B, α, β, Mremfinal, K, nsize, tnum, Val {PACK} ())
326
326
else
327
327
call_loopmul! (_C, _A, _B, α, β, Mremfinal, K, nsize, Val {PACK} ())
@@ -360,8 +360,8 @@ function __matmul!(
360
360
clamp (div_fast (M * N, StaticInt {256} () * W), 0 , _nthread- 1 )
361
361
end
362
362
# nkern = cld_fast(M * N, MᵣW * Nᵣ)
363
- threads, torelease = Polyester . __request_threads (_nrequest % UInt32, Polyester . worker_pointer ())
364
- # _threads, _torelease = Polyester .request_threads(Threads.threadid()%UInt32, _nrequest)
363
+ threads, torelease = PolyesterWeave . __request_threads (_nrequest % UInt32, PolyesterWeave . worker_pointer ())
364
+ # _threads, _torelease = PolyesterWeave .request_threads(Threads.threadid()%UInt32, _nrequest)
365
365
366
366
nrequest = threads. i
367
367
iszero (nrequest) && @goto SINGLETHREAD
@@ -388,7 +388,7 @@ function __matmul!(
388
388
else # TODO : Allow splitting along `N` for `matmul_pack_A_and_B!`
389
389
matmul_pack_A_and_B! (C, A, B, α, β, M, K, N, threads, W₁Default (), W₂Default (), R₁Default (), R₂Default ())
390
390
end
391
- Polyester . free_threads! (torelease)
391
+ PolyesterWeave . free_threads! (torelease)
392
392
nothing
393
393
end
394
394
@@ -398,9 +398,9 @@ function waitonmultasks(threads, nthread)
398
398
# for (_,tid) ∈ threads
399
399
# wait(tid)
400
400
# end
401
- (tnum, tuu) = Polyester . initial_state (threads)
401
+ (tnum, tuu) = PolyesterWeave . initial_state (threads)
402
402
for _ ∈ CloseOpen (One (), nthread)
403
- (tnum, tuu) = Polyester . iter (tnum, tuu)
403
+ (tnum, tuu) = PolyesterWeave . iter (tnum, tuu)
404
404
wait (tnum)
405
405
end
406
406
end
@@ -423,13 +423,13 @@ function matmul_pack_A_and_B!(
423
423
end
424
424
Mblock_Mrem, Mblock_ = promote (Mbsize + W, Mbsize)
425
425
u_to_spawn = _to_spawn % UInt
426
- (tnum, tuu) = Polyester . initial_state (threads)
426
+ (tnum, tuu) = PolyesterWeave . initial_state (threads)
427
427
bc = _use_bcache ()
428
428
bc_ptr = Base. unsafe_convert (typeof (pointer (C)), pointer (bc))
429
429
last_id = _to_spawn - One ()
430
430
for m ∈ CloseOpen (last_id) # ...thus the fact that `CloseOpen()` iterates at least once is okay.
431
431
Mblock = ifelse (m < Mrem, Mblock_Mrem, Mblock_)
432
- (tnum, tuu) = Polyester . iter (tnum, tuu)
432
+ (tnum, tuu) = PolyesterWeave . iter (tnum, tuu)
433
433
launch_thread_mul! (C, A, B, α, β, Mblock, K, N, p, bc_ptr, tnum, m % UInt, u_to_spawn, StaticFloat64 {W₁} (),StaticFloat64 {W₂} (),StaticFloat64 {R₁} (),StaticFloat64 {R₂} ())
434
434
A = gesp (A, (Mblock, Zero ()))
435
435
C = gesp (C, (Mblock, Zero ()))
0 commit comments