Thank you! That makes 100% sense. Pandas does not know about Modin - it is the other way around.
I have taken your advice and managed to take an InputDataSet that was sent to a Modin DataFrame and convert it successfully back to a pandas DataFrame.
Do you perhaps know why I cannot apply a lambda function to my Modin DataFrame when I call this Python script via SQL?
- This works fine when run from a Jupyter notebook (dfModin["XXX"] = dfModin["XXX"].apply(lambda x: myfunc(x))), but when called via SQL it fails with the following error:
Msg 39019, Level 16, State 2, Line 5
An external script error occurred:
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\pandas\base.py", line 2638, in __getitem__
return self._getitem(key)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\pandas\dataframe.py", line 2371, in _getitem
return self._getitem_column(key)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\pandas\dataframe.py", line 1945, in _getitem_column
query_compiler=self._query_compiler.getitem_column_array([key])
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\backends\pandas\query_compiler.py", line 2157, in getitem_column_array
new_modin_frame = self._modin_frame.mask(col_indices=key)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\engines\base\frame\data.py", line 614, in mask
Msg 39019, Level 16, State 2, Line 5
An external script error occurred:
for row_idx, row_internal_indices in row_partitions_list.items()
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\engines\base\frame\data.py", line 616, in <listcomp>
or len(row_internal_indices) > 0
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\engines\base\frame\data.py", line 612, in <listcomp>
or len(col_internal_indices) > 0
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\engines\dask\pandas_on_dask\frame\partition.py", line 99, in mask
lambda df: pandas.DataFrame(df.iloc[row_indices, col_indices])
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\modin\engines\dask\pandas_on_dask\frame\partition.py", line 88, in add_to_apply_calls
self.future, call_queue=self.call_queue + [[pkl.dumps(func), kwargs]]
Msg 39019, Level 16, State 2, Line 5
An external script error occurred:
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\cloudpickle\cloudpickle_fast.py", line 102, in dumps
cp.dump(obj)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\cloudpickle\cloudpickle_fast.py", line 563, in dump
return Pickler.dump(self, obj)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 437, in dump
self.save(obj)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 504, in save
f(self, obj) # Call unbound method with explicit self
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\cloudpickle\cloudpickle_fast.py", line 745, in save_function
*self._dynamic_function_reduce(obj), obj=obj
Msg 39019, Level 16, State 2, Line 5
An external script error occurred:
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\cloudpickle\cloudpickle_fast.py", line 682, in _save_reduce_pickle5
dictitems=dictitems, obj=obj
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 638, in save_reduce
save(args)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 504, in save
f(self, obj) # Call unbound method with explicit self
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 786, in save_tuple
save(element)
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 504, in save
f(self, obj) # Call unbound method with explicit self
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 771, in save_tuple
save(element)
Msg 39019, Level 16, State 2, Line 5
An external script error occurred:
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\pickle.py", line 504, in save
f(self, obj) # Call unbound method with explicit self
File "D:\Software\Microsoft SQL Server\MSSQL15.MSSQL02\PYTHON_SERVICES\lib\site-packages\dill\_dill.py", line 1119, in save_cell
f = obj.cell_contents
ValueError: Cell is empty
SqlSatelliteCall error: Error in execution. Check the output for more information.