-
Notifications
You must be signed in to change notification settings - Fork 0
/
type.d2
91 lines (79 loc) · 2.21 KB
/
type.d2
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
placeholder: {
grid-columns: 1
# Container holding the PackedOn16Bytes<T> class box and the four class boxes
# its edges point to.
PackedOn16BytesWrapper: {
  PackedOn16Bytes\<T\>.shape: class

  # One edge per target box; each edge label gives the value of T.
  PackedOn16Bytes\<T\> -> PackedFloat: T: float
  PackedOn16Bytes\<T\> -> PackedFloat\': T: float
  PackedOn16Bytes\<T\> -> PackedHalf: T: half
  PackedOn16Bytes\<T\> -> PackedHalf\': T: half

  # T = float: the primed box lists the `unpacked` member, the plain box the
  # `packed` one. Presumably two views of the same storage — confirm against
  # the code being diagrammed.
  PackedFloat: {
    shape: class
    int4: packed
  }
  PackedFloat\': {
    shape: class
    float: unpacked\[4\]
  }

  # T = half: same pairing as above, with half2 elements in the unpacked box.
  PackedHalf: {
    shape: class
    int4: packed
  }
  PackedHalf\': {
    shape: class
    half2: unpacked\[4\]
  }

  # The container itself is drawn with zero opacity.
  style.opacity: 0
}
# Container holding the AllReduceParams and AllReduceFusionParams class boxes
# and the edge between them.
ParamsWrapper: {
  # Declared with `key: {` like every other shape in this file.
  AllReduceParams: {
    shape: class
    size_t: elts_total, elts_per_rank, elts_per_block
    # The escaped trailing ' presumably keeps this key distinct from the
    # `size_t` row above so both rows survive — verify in the rendered output.
    size_t\': local_rank
    void\*: peer_comm_buffer_ptrs\[MAX_RANKS_PER_NODE\]
    void\*\': local_output_buffer_ptr
    const void\*: local_input_buffer_ptr
    AllReduceFusionParams: fusion_params
    deserialize(int64_t\* buffer, size_t tpSize, size_t tpRank): AllReduceParams
  }

  # Dashed black edge labelled `fusion_params`, matching the class row of the
  # same name in AllReduceParams.
  AllReduceParams -> AllReduceFusionParams: fusion_params {
    style: {
      stroke: black
      stroke-dash: 6
    }
  }

  AllReduceFusionParams: {
    shape: class
    # `bias_buffer` is GEMM bias.
    const void\*: bias_buffer, residual_buffer
    # RMSNorm
    int: hidden_size
    const void\*\': weight_buffer
    float: eps
    void\*: intermediate_buffer
  }

  # The container itself is drawn with zero opacity.
  style.opacity: 0
}
# Container holding the three enum tables; each enum is drawn as an sql_table
# whose rows are `NAME: value`.
EnumWrapper: {
  AllReduceStrategyType: {
    shape: sql_table
    NCCL: 0
    ONESHOT: 1
    TWOSHOT: 2
    AUTO: 3
  }

  # Declared with `key: {` like the two sibling tables.
  AllReduceStrategyConfig: {
    shape: sql_table
    USE_MEMCPY: 1
    # NOTE(review): RESIDUAL_RMS_NORM is also a member of AllReduceFusionOp
    # below (value 1). Confirm this row names the right enumerator for
    # AllReduceStrategyConfig.
    RESIDUAL_RMS_NORM: 2
  }

  AllReduceFusionOp: {
    shape: sql_table
    NONE: 0
    RESIDUAL_RMS_NORM: 1
  }

  # The container itself is drawn with zero opacity.
  style.opacity: 0
}
}
placeholder.style.opacity: 0