@@ -12,36 +12,36 @@ static EBPF_INLINE int cuda_correlation(struct pt_regs *ctx)
1212 return 0 ;
1313 }
1414
15- u32 cudaId = 0 ;
15+ u32 cuda_id = 0 ;
1616 int err ;
1717
1818#if defined(__aarch64__ )
1919 // ARM64: Arguments: 4@[sp, 36]
2020 u64 sp = ctx -> sp ;
21- err = bpf_probe_read_user (& cudaId , sizeof (cudaId ), (void * )(sp + 36 ));
21+ err = bpf_probe_read_user (& cuda_id , sizeof (cuda_id ), (void * )(sp + 36 ));
2222#else
2323 // AMD64: Arguments: 4@-36(%rbp)
2424 u64 rbp = ctx -> bp ;
25- err = bpf_probe_read_user (& cudaId , sizeof (cudaId ), (void * )rbp - 36 );
25+ err = bpf_probe_read_user (& cuda_id , sizeof (cuda_id ), (void * )rbp - 36 );
2626#endif
2727
2828 if (err )
2929 return err ;
30- DEBUG_PRINT ("cuda_correlation_probe: correlationId =%u" , cudaId );
30+ DEBUG_PRINT ("cuda_correlation_probe: correlation_id =%u" , cuda_id );
3131
3232 u64 ts = bpf_ktime_get_ns ();
33- return collect_trace (ctx , TRACE_CUDA_LAUNCH , pid , tid , ts , 0 , cudaId );
33+ return collect_trace (ctx , TRACE_CUDA_LAUNCH , pid , tid , ts , 0 , cuda_id );
3434}
3535
// Timing record sent to user space through the cuda_timing_events perf output
// by cuda_kernel_exec and cuda_graph_exec.
//   pid            - upper 32 bits of the probe's pid_tgid value
//   correlation_id - low 32 bits of the 64-bit correlation value read from the probe
//   start, end     - timestamps taken from the probe arguments
//                    (presumably nanoseconds; the probes compute duration_ns = end - start)
//   device_id      - device id taken from the probe arguments
//   stream_id      - high 32 bits of the 64-bit correlation value
//   graph_id       - 0 when sent by cuda_kernel_exec, the probe's graph id argument
//                    when sent by cuda_graph_exec
//   kernel_name    - user-space string copied by cuda_kernel_exec ("err" when the read
//                    fails); not assigned in the visible part of cuda_graph_exec
3636struct kernel_timing {
3737 u32 pid ;
3838 u32 correlation_id ;
3939 u64 start ;
4040 u64 end ;
41- u32 deviceId ;
42- u32 streamId ;
43- u32 graphId ;
44- char kernelName [128 ];
41+ u32 device_id ;
42+ u32 stream_id ;
43+ u32 graph_id ;
44+ char kernel_name [128 ];
4545};
4646
4747bpf_map_def SEC ("maps" ) cuda_timing_events = {
@@ -51,7 +51,7 @@ bpf_map_def SEC("maps") cuda_timing_events = {
5151 .max_entries = 0 ,
5252};
5353
54- // uint64_t start, uint64_t end, uint32_t correlationId , uint32_t deviceId , const char *kernelName
54+ // uint64_t start, uint64_t end, uint32_t correlation_id, uint32_t device_id, const char *kernel_name
5555// AMD64 Arguments: 8@%rax 8@%rdx 8@-40(%rbp) 4@%ecx 8@%rsi
5656// ARM64 Arguments: 8@x1 8@x2 8@[sp, 112] 4@x3 8@x0
5757static EBPF_INLINE int cuda_kernel_exec (struct pt_regs * ctx )
@@ -60,8 +60,8 @@ static EBPF_INLINE int cuda_kernel_exec(struct pt_regs *ctx)
6060 u32 pid = pid_tgid >> 32 ;
6161
6262 u64 start , end ;
63- u64 correlationId = 0 ;
64- u32 deviceId ;
63+ u64 correlation_id = 0 ;
64+ u32 device_id ;
6565 const char * name ;
6666 int err ;
6767
@@ -70,28 +70,28 @@ static EBPF_INLINE int cuda_kernel_exec(struct pt_regs *ctx)
7070 start = PT_REGS_PARM2 (ctx ); // x1
7171 end = PT_REGS_PARM3 (ctx ); // x2
7272 u64 sp = ctx -> sp ;
73- err = bpf_probe_read_user (& correlationId , sizeof (correlationId ), (void * )(sp + 112 ));
73+ err = bpf_probe_read_user (& correlation_id , sizeof (correlation_id ), (void * )(sp + 112 ));
7474 if (err ) {
75- correlationId = 0 ;
75+ correlation_id = 0 ;
7676 }
77- deviceId = PT_REGS_PARM4 (ctx ); // x3
78- name = (const char * )PT_REGS_PARM1 (ctx ); // x0
77+ device_id = PT_REGS_PARM4 (ctx ); // x3
78+ name = (const char * )PT_REGS_PARM1 (ctx ); // x0
7979#else
8080 // AMD64: 8@%rax 8@%rdx 8@-40(%rbp) 4@%ecx 8@%rsi
8181 start = ctx -> ax ;
8282 end = ctx -> dx ;
8383 u64 rbp = ctx -> bp ;
84- err = bpf_probe_read_user (& correlationId , sizeof (correlationId ), (void * )rbp - 40 );
84+ err = bpf_probe_read_user (& correlation_id , sizeof (correlation_id ), (void * )rbp - 40 );
8585 if (err ) {
86- correlationId = 0 ;
86+ correlation_id = 0 ;
8787 }
88- deviceId = ctx -> cx ;
89- name = (const char * )ctx -> si ;
88+ device_id = ctx -> cx ;
89+ name = (const char * )ctx -> si ;
9090#endif
9191
92- u32 cuda_id = correlationId & 0xFFFFFFFF ;
93- u32 devId = deviceId ;
94- u32 streamId = (correlationId >> 32 ) & 0xFFFFFFFF ;
92+ u32 cuda_id = correlation_id & 0xFFFFFFFF ;
93+ u32 dev_id = device_id ;
94+ u32 stream_id = (correlation_id >> 32 ) & 0xFFFFFFFF ;
9595 u64 duration_ns = end - start ;
9696
9797 DEBUG_PRINT (
@@ -103,27 +103,29 @@ static EBPF_INLINE int cuda_kernel_exec(struct pt_regs *ctx)
103103 .correlation_id = cuda_id ,
104104 .start = start ,
105105 .end = end ,
106- .deviceId = devId ,
107- .streamId = streamId ,
108- .graphId = 0 ,
106+ .device_id = dev_id ,
107+ .stream_id = stream_id ,
108+ .graph_id = 0 ,
109109 };
110110
111111 // copy name into timing.kernel_name
112- int chars = bpf_probe_read_user_str ((char * )& timing .kernelName , sizeof (timing .kernelName ), name );
112+ int chars =
113+ bpf_probe_read_user_str ((char * )& timing .kernel_name , sizeof (timing .kernel_name ), name );
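113115 // a failed read (chars <= 0) gets a sentinel value; note that an empty string returns 1 (its NUL) and does not take this branch -- TODO confirm how graph launches report their name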
114115 if (chars <= 0 ) {
115116 // error reading string
116- timing .kernelName [0 ] = '\1' ;
117- timing .kernelName [1 ] = '\2' ;
118- timing .kernelName [2 ] = '\3' ;
117+ timing .kernel_name [0 ] = 'e' ;
118+ timing .kernel_name [1 ] = 'r' ;
119+ timing .kernel_name [2 ] = 'r' ;
120+ timing .kernel_name [3 ] = '\0' ;
119121 }
120122
121123 bpf_perf_event_output (ctx , & cuda_timing_events , BPF_F_CURRENT_CPU , & timing , sizeof (timing ));
122124
123125 return 0 ;
124126}
125127
126- // uint64_t start, uint64_t end, uint32_t correlationId , uint32_t deviceId , uint32_t graphId
128+ // uint64_t start, uint64_t end, uint32_t correlation_id , uint32_t device_id , uint32_t graph_id
127129// AMD64 Arguments: 8@%rax 8@%rdx 8@-64(%rbp) 4@%ecx 4@%esi
128130// ARM64 Arguments: 8@x1 8@x2 8@[sp, 88] 4@x3 4@x0
129131static EBPF_INLINE int cuda_graph_exec (struct pt_regs * ctx )
@@ -132,51 +134,54 @@ static EBPF_INLINE int cuda_graph_exec(struct pt_regs *ctx)
132134 u32 pid = pid_tgid >> 32 ;
133135
134136 u64 start , end ;
135- u64 correlationId = 0 ;
136- u32 deviceId , graphId ;
137+ u64 correlation_id = 0 ;
138+ u32 device_id , graph_id ;
137139 int err ;
138140
139141#if defined(__aarch64__ )
140142 // ARM64: 8@x1 8@x2 8@[sp, 88] 4@x3 4@x0
141143 start = PT_REGS_PARM2 (ctx ); // x1
142144 end = PT_REGS_PARM3 (ctx ); // x2
143145 u64 sp = ctx -> sp ;
144- err = bpf_probe_read_user (& correlationId , sizeof (correlationId ), (void * )(sp + 88 ));
146+ err = bpf_probe_read_user (& correlation_id , sizeof (correlation_id ), (void * )(sp + 88 ));
145147 if (err ) {
146- correlationId = 0 ;
148+ correlation_id = 0 ;
147149 }
148- deviceId = PT_REGS_PARM4 (ctx ); // x3
149- graphId = PT_REGS_PARM1 (ctx ); // x0
150+ device_id = PT_REGS_PARM4 (ctx ); // x3
151+ graph_id = PT_REGS_PARM1 (ctx ); // x0
150152#else
151153 // AMD64: 8@%rax 8@%rdx 8@-64(%rbp) 4@%ecx 4@%esi
152154 start = ctx -> ax ;
153155 end = ctx -> dx ;
154156 u64 rbp = ctx -> bp ;
155- err = bpf_probe_read_user (& correlationId , sizeof (correlationId ), (void * )rbp - 64 );
157+ err = bpf_probe_read_user (& correlation_id , sizeof (correlation_id ), (void * )rbp - 64 );
156158 if (err ) {
157- correlationId = 0 ;
159+ correlation_id = 0 ;
158160 }
159- deviceId = ctx -> cx ;
160- graphId = ctx -> si ;
161+ device_id = ctx -> cx ;
162+ graph_id = ctx -> si ;
161163#endif
162164
163- u32 cuda_id = correlationId & 0xFFFFFFFF ;
164- u32 devId = deviceId ;
165- u32 streamId = (correlationId >> 32 ) & 0xFFFFFFFF ;
165+ u32 cuda_id = correlation_id & 0xFFFFFFFF ;
166+ u32 dev_id = device_id ;
167+ u32 stream_id = (correlation_id >> 32 ) & 0xFFFFFFFF ;
166168 u64 duration_ns = end - start ;
167169
168170 DEBUG_PRINT (
169- "cuda_graph_exec: kernel_id=%u, duration_ns=%llu graph_id=%u\n" , cuda_id , duration_ns , graphId );
171+ "cuda_graph_exec: kernel_id=%u, duration_ns=%llu graph_id=%u\n" ,
172+ cuda_id ,
173+ duration_ns ,
174+ graph_id );
170175
171176 // Send the actual timing data from the function parameters
172177 struct kernel_timing timing = {
173178 .pid = pid ,
174179 .correlation_id = cuda_id ,
175180 .start = start ,
176181 .end = end ,
177- .deviceId = devId ,
178- .streamId = streamId ,
179- .graphId = graphId ,
182+ .device_id = dev_id ,
183+ .stream_id = stream_id ,
184+ .graph_id = graph_id ,
180185 };
181186
182187 bpf_perf_event_output (ctx , & cuda_timing_events , BPF_F_CURRENT_CPU , & timing , sizeof (timing ));
0 commit comments