implementation: started transpiler section

2025-05-03 12:25:34 +02:00
parent e8e457eae9
commit 18d89e27ca
4 changed files with 68 additions and 13 deletions
--- a/package/src/Interpreter.jl
+++ b/package/src/Interpreter.jl
@@ -34,12 +34,10 @@ function interpret(expressions::Vector{Expr}, variables::Matrix{Float32}, parame
 	@inbounds for i in eachindex(exprs)
 		# TODO: Currently only the first expression gets evaluated. Either use a view on "cudaExprs" to determine the correct expression or extend cudaStepsize to include this information (this information was removed in a previous commit)
 		# If a "view" is used, then the ExpressionProcessing must be updated to always include the stop opcode at the end
-		kernel = @cuda launch=false fastmath=true interpret_expression(cudaExprs, cudaVars, cudaParams, cudaResults, cudaStepsize, i)
-		# config = launch_configuration(kernel.fun)
-		threads = min(variableCols, 128)
-		blocks = cld(variableCols, threads)
+		numThreads = min(variableCols, 128)
+		numBlocks = cld(variableCols, numThreads)

-		kernel(cudaExprs, cudaVars, cudaParams, cudaResults, cudaStepsize, i; threads, blocks)
+		@cuda threads=numThreads blocks=numBlocks fastmath=true interpret_expression(cudaExprs, cudaVars, cudaParams, cudaResults, cudaStepsize, i)
 	end

 	return cudaResults