
{  
   "types" : {
      "Bookmark" : {
         "pluralLabel" : "Bookmarks"
      },
      "Publication" : {
         "pluralLabel" : "Publications"
      },
      "GoldStandardPublication" : {
         "pluralLabel" : "GoldStandardPublications"
      },
      "GoldStandardBookmark" : {
         "pluralLabel" : "GoldStandardBookmarks"
      },
      "Tag" : {
         "pluralLabel" : "Tags"
      },
      "User" : {
         "pluralLabel" : "Users"
      },
      "Group" : {
         "pluralLabel" : "Groups"
      },
      "Sphere" : {
         "pluralLabel" : "Spheres"
      }
   },
   
   "properties" : {
      "count" : {
         "valueType" : "number"
      },
      "date" : {
         "valueType" : "date"
      },
      "changeDate" : {
         "valueType" : "date"
      },
      "url" : {
         "valueType" : "url"
      },
      "id" : {
         "valueType" : "url"
      },
      "tags" : {
         "valueType" : "item"
      },
      "user" : {
         "valueType" : "item"
      }      
   },
   
   "items" : [
   	  
      {
         "type" : "Publication",
         "id"   : "https://puma.ub.uni-stuttgart.de/bibtex/2e8ebd2f42b453167d2065725486828cb/ipvs-sgs",         
         "tags" : [
            "myown","Performance","CPU","Evaluation","SVM","SYCL","GPU","AISA","exc2075","aisa"
         ],
         
         "intraHash" : "e8ebd2f42b453167d2065725486828cb",
         "interHash" : "bfbc52cd98d241445f5051b284bf6ded",
         "label" : "Evaluation of SYCL\u2019s Different Data Parallel Kernels",
         "user" : "ipvs-sgs",
         "description" : "",
         "date" : "2024-09-30 13:17:58",
         "changeDate" : "2025-06-23 09:45:25",
         "count" : 10,
         "pub-type": "inproceedings",
         "booktitle": "Proceedings of the 12th International Workshop on OpenCL and SYCL","series": "IWOCL '24","publisher":"Association for Computing Machinery","address":"New York, NY, USA",
         "year": "2024", 
         "url": "https://doi.org/10.1145/3648115.3648130", 
         
         "author": [ 
            "Marcel Breyer","Alexander Van Craen","Dirk Pflüger"
         ],
         "authors": [
         	
            	{"first" : "Marcel",	"last" : "Breyer"},
            	{"first" : "Alexander",	"last" : "Van Craen"},
            	{"first" : "Dirk",	"last" : "Pflüger"}
         ],
         "pages": "1-4","abstract": "SYCL provides programmers with four, and in the case of AdaptiveCpp even five, ways for calling and writing a device kernel. This paper analyzes the performance of these diverse kernel invocation types for DPC++ and AdaptiveCpp as SYCL implementations on an NVIDIA A100 GPU, an AMD Instinct MI210 GPU, and a dual-socket AMD EPYC 9274F CPU. Using the example of a kernel matrix assembly, we show why the performance can differ by a factor of 100 in the worst case on the same hardware for the same problem using different SYCL implementations and kernel invocation types.",
         "isbn" : "9798400717901",
         
         "language" : "english",
         
         "numpages" : "4",
         
         "articleno" : "10",
         
         "location" : "Chicago, IL, USA",
         
         "doi" : "10.1145/3648115.3648130",
         
         "bibtexKey": "breyer2024evaluation"

      }
	  
   ]
}
