CARVIEW |
Select Language
HTTP/2 200
date: Wed, 23 Jul 2025 05:52:27 GMT
content-type: text/html; charset=utf-8
vary: X-PJAX, X-PJAX-Container, Turbo-Visit, Turbo-Frame, X-Requested-With,Accept-Encoding, Accept, X-Requested-With
x-robots-tag: none
etag: W/"4f6a492d49d0037b4c0d4c0ce4e3a30e"
cache-control: max-age=0, private, must-revalidate
strict-transport-security: max-age=31536000; includeSubdomains; preload
x-frame-options: deny
x-content-type-options: nosniff
x-xss-protection: 0
referrer-policy: no-referrer-when-downgrade
content-security-policy: default-src 'none'; base-uri 'self'; child-src github.githubassets.com github.com/assets-cdn/worker/ github.com/assets/ gist.github.com/assets-cdn/worker/; connect-src 'self' uploads.github.com www.githubstatus.com collector.github.com raw.githubusercontent.com api.github.com github-cloud.s3.amazonaws.com github-production-repository-file-5c1aeb.s3.amazonaws.com github-production-upload-manifest-file-7fdce7.s3.amazonaws.com github-production-user-asset-6210df.s3.amazonaws.com *.rel.tunnels.api.visualstudio.com wss://*.rel.tunnels.api.visualstudio.com objects-origin.githubusercontent.com copilot-proxy.githubusercontent.com proxy.individual.githubcopilot.com proxy.business.githubcopilot.com proxy.enterprise.githubcopilot.com *.actions.githubusercontent.com wss://*.actions.githubusercontent.com productionresultssa0.blob.core.windows.net/ productionresultssa1.blob.core.windows.net/ productionresultssa2.blob.core.windows.net/ productionresultssa3.blob.core.windows.net/ productionresultssa4.blob.core.windows.net/ productionresultssa5.blob.core.windows.net/ productionresultssa6.blob.core.windows.net/ productionresultssa7.blob.core.windows.net/ productionresultssa8.blob.core.windows.net/ productionresultssa9.blob.core.windows.net/ productionresultssa10.blob.core.windows.net/ productionresultssa11.blob.core.windows.net/ productionresultssa12.blob.core.windows.net/ productionresultssa13.blob.core.windows.net/ productionresultssa14.blob.core.windows.net/ productionresultssa15.blob.core.windows.net/ productionresultssa16.blob.core.windows.net/ productionresultssa17.blob.core.windows.net/ productionresultssa18.blob.core.windows.net/ productionresultssa19.blob.core.windows.net/ github-production-repository-image-32fea6.s3.amazonaws.com github-production-release-asset-2e65be.s3.amazonaws.com insights.github.com wss://alive.github.com api.githubcopilot.com api.individual.githubcopilot.com api.business.githubcopilot.com api.enterprise.githubcopilot.com; 
font-src github.githubassets.com; form-action 'self' github.com gist.github.com copilot-workspace.githubnext.com objects-origin.githubusercontent.com; frame-ancestors 'none'; frame-src viewscreen.githubusercontent.com notebooks.githubusercontent.com; img-src 'self' data: blob: github.githubassets.com media.githubusercontent.com camo.githubusercontent.com identicons.github.com avatars.githubusercontent.com private-avatars.githubusercontent.com github-cloud.s3.amazonaws.com objects.githubusercontent.com release-assets.githubusercontent.com secured-user-images.githubusercontent.com/ user-images.githubusercontent.com/ private-user-images.githubusercontent.com opengraph.githubassets.com copilotprodattachments.blob.core.windows.net/github-production-copilot-attachments/ github-production-user-asset-6210df.s3.amazonaws.com customer-stories-feed.github.com spotlights-feed.github.com objects-origin.githubusercontent.com *.githubusercontent.com; manifest-src 'self'; media-src github.com user-images.githubusercontent.com/ secured-user-images.githubusercontent.com/ private-user-images.githubusercontent.com github-production-user-asset-6210df.s3.amazonaws.com gist.github.com; script-src github.githubassets.com; style-src 'unsafe-inline' github.githubassets.com; upgrade-insecure-requests; worker-src github.githubassets.com github.com/assets-cdn/worker/ github.com/assets/ gist.github.com/assets-cdn/worker/
server: github.com
content-encoding: gzip
accept-ranges: bytes
set-cookie: _gh_sess=l9iRv1q9YxgNn36Om7v0jxqeNjOitr5taS25ghkMlpYFh7V1pWcYbitgakG6kSY%2FdBFBJFKnA542noDRRxxPFH9qsrqZZ%2BIE3O%2FN8GYPVuQw2WvNR5syrP4ItPm4gdLhbl0TKjoMz7rzuwZzmQdAem5nZSthN%2BLa5gRpg%2BYCZF8tnGSSm%2F8GSOZ4di%2FjYAnLep9La1ucboUe9Wh5STyO%2FKEAvpxu7yIEWTKeI015yzpZrnnFqNopmeaxCU5aLpjduOY79PEsxFxy9dANoLLRjg%3D%3D--WV8YeHIzWG3l23EV--HUUr0vP8%2F%2BiPsdbZY2r87g%3D%3D; Path=/; HttpOnly; Secure; SameSite=Lax
set-cookie: _octo=GH1.1.1501823471.1753249946; Path=/; Domain=github.com; Expires=Thu, 23 Jul 2026 05:52:26 GMT; Secure; SameSite=Lax
set-cookie: logged_in=no; Path=/; Domain=github.com; Expires=Thu, 23 Jul 2026 05:52:26 GMT; HttpOnly; Secure; SameSite=Lax
x-github-request-id: B9C0:261FF2:476E8F:5E20FA:6880789A
Optimisation Guide · kaanolgu/bfs-sycl-fpga Wiki · GitHub
Skip to content
Navigation Menu
{{ message }}
-
Notifications
You must be signed in to change notification settings - Fork 0
Optimisation Guide
kaanolgu edited this page Aug 3, 2023
·
1 revision
This page accompanies the paper (DOI coming soon) and showcases the code optimisations that were made and their effect on the performance metrics. All test results were obtained with the RMAT-19-32 dataset using 4 compute units.
// Old code
// Reads the pair of adjacent entries usm_nodes_start[idx] and
// usm_nodes_start[idx + 1] through the same base pointer.
unsigned int nodes_start = usm_nodes_start[idx];
unsigned int nodes_end = usm_nodes_start[idx +1 ];
// New code with split device pointers
// Two separate device_ptr wrappers are built over the same array: one based
// at (usm_nodes_start + offset) and one based one element further on, so
// that both values are then read with the same index `idx`.
// NOTE(review): device_ptr is presumably sycl::ext::intel::device_ptr — confirm.
// NOTE(review): unlike the old code, these reads are shifted by `offset`.
device_ptr<unsigned int> DevicePtr_start(usm_nodes_start+offset);
device_ptr<unsigned int> DevicePtr_end(usm_nodes_start + 1+offset);
unsigned int nodes_start = DevicePtr_start[idx];
unsigned int nodes_end = DevicePtr_end[idx];
Vector version - execution time : 0.10s Single version - execution time : 0.08s
// Vector code
// The three dependency events are first collected into a std::vector<event>,
// which is then passed to single_task as its dependency list.
std::vector<event> e_vec;
e_vec.push_back(e1);
e_vec.push_back(e2);
e_vec.push_back(e3);
auto e =q.single_task<class Task>( e_vec, [=](){
...
// Separate Events
// The same three events are passed directly as a braced list, without
// building a named vector beforehand.
auto e =q.single_task<class Task>( {e1,e2,e3}, [=]() {
...
Throughput : parallel_for > singletask > NDrange
// Single-task variant: one kernel invocation walks every node index from 0 to
// no_of_nodes - 1 and resets each non-zero entry of usm_updating_mask to 0.
// NOTE(review): [[intel::kernel_args_restrict]] is understood to promise that
// the kernel's pointer arguments do not alias — confirm against the Intel docs.
q.single_task<class SingleTask>( [=]() [[intel::kernel_args_restrict]] {
// Ask the compiler to unroll the loop below by a factor of 16.
#pragma unroll 16
for(int tid =0; tid < no_of_nodes; tid++){
unsigned int condition = usm_updating_mask[tid];
// Only write back when the entry is set.
if(condition){
usm_updating_mask[tid]=0;
}
}
});
// Range-based parallel_for variant: launched over no_of_nodes work-items, each
// of which resets its own entry of usm_updating_mask to 0 when it is non-zero.
// The kernel lambda receives the work-item index as `tid`; a SYCL parallel_for
// kernel must take this index parameter (the parameterless form leaves `tid`
// undeclared and does not compile).
q.parallel_for<class ParallelFor>(no_of_nodes, [=](id<1> tid) [[intel::kernel_args_restrict]] {
    unsigned int condition = usm_updating_mask[tid];
    // Only write back when the entry is set.
    if (condition) {
        usm_updating_mask[tid] = 0;
    }
});
// ND-range variant: the global size is no_of_nodes rounded up to a whole
// multiple of BLOCK_SIZE so that it divides evenly into work-groups.
int BLOCK_SIZE = 512;
int global_work_size = (no_of_nodes + BLOCK_SIZE - 1) / BLOCK_SIZE * BLOCK_SIZE;
range<1> gws (global_work_size);
range<1> lws (BLOCK_SIZE);
q.parallel_for<class NDRange>(nd_range<1>(gws, lws), [=] (nd_item<1> item) [[intel::kernel_args_restrict]] {
    int gid = item.get_global_id();
    // The rounded-up global size can exceed no_of_nodes, so the padding
    // work-items past the last node must do nothing.
    if (gid < no_of_nodes) {
        // Index with this work-item's global id (`gid`); no `tid` exists in
        // this kernel.
        unsigned int condition = usm_updating_mask[gid];
        if (condition) {
            usm_updating_mask[gid] = 0;
        }
    }
});
Clone this wiki locally
You can’t perform that action at this time.