-
-
Notifications
You must be signed in to change notification settings - Fork 308
Open
Description
Greetings. It seems the project has been abandoned? I hope it hasn't.
Anyway, I am getting an error:
nvrtc: error: invalid value for --gpu-architecture (-arch)
` //actual loading
auto * input0 = reinterpret_cast<const scalar_t*>(data[0+1]) + block_work_size * idx;
#pragma unroll
for (int i = 0; i<loop_size; i++){
const auto vec0 = load_vector<vec_size>(input0, thread_idx);
#pragma unroll
for (int j=0; j < vec_size; j++){
arg0[vec_size * i + j] = vec0.val[j];
}
thread_idx += num_threads;
}
#pragma unroll
for (int j = 0; j < thread_work_size; j++) {
out0[j] = abs_kernel<std::complex<float>>(arg0[j] );
}
using vec_t_output = aligned_vector<std::complex<float>, vec_size>;
vec_t_output* to_0 = reinterpret_cast<vec_t_output*>(data[0]) + block_work_size / vec_size * idx;
int thread_idx = threadIdx.x;
#pragma unroll
for (int i = 0; i<loop_size; i++){
vec_t_output v;
#pragma unroll
for (int j=0; j<vec_size; j++){
v.val[j] = out0[vec_size * i + j];
}
to_0[thread_idx] = v;
thread_idx += num_threads;
}
}
}
nvrtc: error: invalid value for --gpu-architecture (-arch)`
It seems the code can't work with an RTX 5070.
Does anyone know how to solve it?
Metadata
Metadata
Assignees
Labels
No labels