wassname
|
fa7bd34b36
|
act grousp
|
2025-03-14 16:43:00 +08:00 |
|
wassname
|
9d63a74fc6
|
try stacking acts
|
2025-03-14 16:18:04 +08:00 |
|
wassname
|
9f21a00862
|
also trim logits as it's large
|
2025-03-12 16:53:11 +08:00 |
|
wassname
|
6fed0032f2
|
change default
|
2025-03-12 15:30:33 +08:00 |
|
wassname
|
756b653913
|
handle 0d tensors like loss
|
2025-03-12 14:06:40 +08:00 |
|
wassname
|
237b8217d5
|
simplify
|
2025-03-12 13:56:09 +08:00 |
|
wassname
|
bcd47da026
|
tidy
|
2025-03-12 13:55:47 +08:00 |
|
wassname
|
72e20deba3
|
tidy and fix token slice
|
2025-03-12 13:55:43 +08:00 |
|
wassname
|
116ab04050
|
tweaks to prevent OOM
|
2025-03-12 13:32:00 +08:00 |
|
wassname
|
20a117b9fb
|
wip
|
2025-03-12 12:04:36 +08:00 |
|
wassname
|
0ebb049529
|
add __init__
|
2025-03-12 12:04:29 +08:00 |
|
wassname
|
ec863d5d14
|
res
|
2025-02-17 20:40:57 +08:00 |
|
wassname
|
5ac406ebd5
|
supressed seems better
|
2025-02-16 19:28:34 +08:00 |
|
wassname
|
66bc0be046
|
working, a little
|
2025-02-16 15:36:43 +08:00 |
|
wassname
|
c7984ffc0c
|
works... just
|
2025-02-16 13:32:37 +08:00 |
|
wassname
|
ec5bcd5dee
|
tidy
|
2025-02-16 11:50:46 +08:00 |
|
wassname
|
eaeb99cc1a
|
wip
|
2025-02-16 11:50:20 +08:00 |
|
wassname
|
eeca873ca6
|
wip
|
2025-02-16 11:49:53 +08:00 |
|
wassname
|
5f5e2973ab
|
wip
|
2025-02-16 11:24:31 +08:00 |
|
wassname
|
0d6560e8dd
|
wip
|
2025-02-16 11:23:30 +08:00 |
|
wassname
|
bd10c2ef8c
|
readme
|
2025-02-16 11:04:30 +08:00 |
|
wassname
|
f0311c022f
|
another example
|
2025-02-16 09:56:23 +08:00 |
|
wassname
|
2f82c4bdec
|
wip
|
2025-02-16 09:41:13 +08:00 |
|
wassname
|
8a61bfeba0
|
parquet
|
2025-02-15 22:03:52 +08:00 |
|
wassname
|
0e18875b25
|
comments
|
2025-02-15 21:21:36 +08:00 |
|
wassname
|
f186243fe1
|
working
|
2025-02-15 21:15:15 +08:00 |
|
wassname
|
691d290c47
|
init
|
2025-02-15 19:30:09 +08:00 |
|