@@ -636,15 +636,10 @@ def __call__(self, arg_id_to_arg) -> ArrayContainer:
636636 input_kwargs_for_loopy = _args_to_device_buffers (
637637 self .actx , self .input_id_to_name_in_program , arg_id_to_arg , fn_name )
638638
639- evt , out_dict = self .pytato_program (queue = self .actx .queue ,
639+ _evt , out_dict = self .pytato_program (queue = self .actx .queue ,
640640 allocator = self .actx .allocator ,
641641 ** input_kwargs_for_loopy )
642642
643- # FIXME Kernels (for now) allocate tons of memory in temporaries. If we
644- # race too far ahead with enqueuing, there is a distinct risk of
645- # running out of memory. This mitigates that risk a bit, for now.
646- evt .wait ()
647-
648643 def to_output_template (keys , _ ):
649644 name_in_program = self .output_id_to_name_in_program [keys ]
650645 return self .actx .thaw (to_tagged_cl_array (
@@ -680,15 +675,10 @@ def __call__(self, arg_id_to_arg) -> ArrayContainer:
680675 input_kwargs_for_loopy = _args_to_device_buffers (
681676 self .actx , self .input_id_to_name_in_program , arg_id_to_arg , fn_name )
682677
683- evt , out_dict = self .pytato_program (queue = self .actx .queue ,
678+ _evt , out_dict = self .pytato_program (queue = self .actx .queue ,
684679 allocator = self .actx .allocator ,
685680 ** input_kwargs_for_loopy )
686681
687- # FIXME Kernels (for now) allocate tons of memory in temporaries. If we
688- # race too far ahead with enqueuing, there is a distinct risk of
689- # running out of memory. This mitigates that risk a bit, for now.
690- evt .wait ()
691-
692682 return self .actx .thaw (to_tagged_cl_array (out_dict [self .output_name ],
693683 axes = get_cl_axes_from_pt_axes (
694684 self .output_axes ),
0 commit comments