
Comments (12)

onacrame avatar onacrame commented on May 14, 2024 1

Just one thing to note. It doesn't really impact me, since I'm using a small dataset, but when I use the KerasClassifier in the ensemble I can only get it to work with n_jobs=1. If I set it to -1, it fails.

from mlens.

flennerhag avatar flennerhag commented on May 14, 2024

Hi!

Looks like Keras models can't be deep-copied. I took a look at the code, and the use of deepcopy there is overly protective; it's a legacy of a previous version. I've pushed a branch in PR #98 that should solve this. It would be great if you could give it a try and confirm that it fixes the issue!
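The root cause is easy to reproduce without Keras at all: `copy.deepcopy` fails on any object whose state contains a lock, which is exactly what a compiled Keras/TensorFlow model carries internally. A minimal stdlib stand-in (the class name here is illustrative, not anything from Keras or mlens):

```python
import copy
import threading

class FakeKerasModel:
    """Stand-in for a compiled Keras model: its state holds an RLock
    (as TF session internals do), which cannot be pickled or deep-copied."""
    def __init__(self):
        self.graph_lock = threading.RLock()
        self.weights = [0.1, 0.2]

model = FakeKerasModel()
try:
    copy.deepcopy(model)
except TypeError as exc:
    # Same failure mode as the tracebacks in this thread; the exact
    # wording ("can't pickle _thread.RLock objects", "cannot pickle
    # '_thread.RLock' object") varies by Python version.
    print(type(exc).__name__)  # → TypeError
```

This is why any code path that deep-copies the fitted estimator, rather than re-instantiating it from its constructor parameters, breaks as soon as a Keras wrapper is in the ensemble.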


onacrame avatar onacrame commented on May 14, 2024

Hi and thanks for the prompt feedback. Fantastic package and looking forward to seeing it develop!

OK, so that did seem to work; however, if I use KerasClassifier as the meta estimator, I get the same error during the fit stage:

```
---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input> in <module>()
     16 ensemble.add_meta(KerasClassifier(build_fn=create_model2, epochs=20, batch_size=5), proba=True)
     17
---> 18 ensemble.fit(X[:294], y[:294],)
     19
     20

D:\Continuum\anaconda3\lib\site-packages\mlens\ensemble\base.py in fit(self, X, y, **kwargs)
    514         self._id_train.fit(X)
    515
--> 516         out = self._backend.fit(X, y, **kwargs)
    517         if out is not self._backend:
    518             # fit_transform

D:\Continuum\anaconda3\lib\site-packages\mlens\ensemble\base.py in fit(self, X, y, **kwargs)
    156         with ParallelProcessing(self.backend, self.n_jobs,
    157                                 max(self.verbose - 4, 0)) as manager:
--> 158             out = manager.stack(self, 'fit', X, y, **kwargs)
    159
    160         if self.verbose:

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\backend.py in stack(self, caller, job, X, y, path, return_preds, warm_start, split, **kwargs)
    671             job=job, X=X, y=y, path=path, warm_start=warm_start,
    672             return_preds=return_preds, split=split, stack=True)
--> 673         return self.process(caller=caller, out=out, **kwargs)
    674
    675     def process(self, caller, out, **kwargs):

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\backend.py in process(self, caller, out, **kwargs)
    716             self.job.clear()
    717
--> 718             self._partial_process(task, parallel, **kwargs)
    719
    720             if task.name in return_names:

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\backend.py in _partial_process(self, task, parallel, **kwargs)
    737             self._gen_prediction_array(task, self.job.job, self.threading)
    738
--> 739         task(self.job.args(**kwargs), parallel=parallel)
    740
    741         if not task.no_output and getattr(task, 'n_feature_prop', 0):

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\layer.py in __call__(self, args, parallel)
    157
    158         if job == 'fit':
--> 159             self.collect()
    160
    161         if self.verbose:

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\layer.py in collect(self, path)
    169             transformer.collect(path)
    170         for learner in self.learners:
--> 171             learner.collect(path)
    172
    173     def set_output_columns(self, X, y, job, n_left_concats=0):

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\learner.py in collect(self, path)
    652          learner_data,
    653          sublearner_files,
--> 654          sublearner_data) = self._collect(path)
    655
    656         self.clear()

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\learner.py in _collect(self, path)
    709         if self.only_all:
    710             # Sub learners are the same as the sub-learners
--> 711             sublearner_files, sublearner_data = replace(learner_files)
    712
    713         return learner_files, learner_data, sublearner_files, sublearner_data

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\_base_functions.py in replace(source_files)
     67 def replace(source_files):
     68     """Utility function to replace empty files list"""
---> 69     replace_files = [deepcopy(o) for o in source_files]
     70     for o in replace_files:
     71         o.name = o.name[:-1] + '0'

[... recursive deepcopy / _reconstruct / _deepcopy_dict frames in
    D:\Continuum\anaconda3\lib\copy.py elided ...]

D:\Continuum\anaconda3\lib\copy.py in deepcopy(x, memo, _nil)
    167     reductor = getattr(x, "__reduce_ex__", None)
    168     if reductor:
--> 169         rv = reductor(4)
    170     else:
    171         reductor = getattr(x, "__reduce__", None)

TypeError: can't pickle _thread.RLock objects
```


flennerhag avatar flennerhag commented on May 14, 2024

Oh, I missed a deepcopy call applied to the meta learner. I've fixed this in the PR branch; would you mind giving it another try?

And thanks, glad you like it! :)


onacrame avatar onacrame commented on May 14, 2024

Still getting an error message after making that change; see below.

```
Epoch 20/20
294/294 [==============================] - 0s 146us/step - loss: 0.5685

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input> in <module>()
     16 ensemble.add_meta(KerasClassifier(build_fn=create_model2, epochs=20, batch_size=5), proba=True)
     17
---> 18 ensemble.fit(X[:294], y[:294],)
     19
     20

D:\Continuum\anaconda3\lib\site-packages\mlens\ensemble\base.py in fit(self, X, y, **kwargs)
    514         self._id_train.fit(X)
    515
--> 516         out = self._backend.fit(X, y, **kwargs)
    517         if out is not self._backend:
    518             # fit_transform

[... same mlens frames as in the previous traceback: base.py ->
    backend.py (stack, process, _partial_process) ->
    layer.py (__call__, collect) -> learner.py (collect, _collect) ...]

D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\_base_functions.py in replace(source_files)
     67 def replace(source_files):
     68     """Utility function to replace empty files list"""
---> 69     # replace_files = [deepcopy(o) for o in source_files]
     70     replace_files = source_files.copy()
     71     for o in replace_files:

[... recursive deepcopy / _reconstruct / _deepcopy_dict frames in
    D:\Continuum\anaconda3\lib\copy.py elided ...]

D:\Continuum\anaconda3\lib\copy.py in deepcopy(x, memo, _nil)
    167     reductor = getattr(x, "__reduce_ex__", None)
    168     if reductor:
--> 169         rv = reductor(4)
    170     else:
    171         reductor = getattr(x, "__reduce__", None)

TypeError: can't pickle _thread.RLock objects
```


flennerhag avatar flennerhag commented on May 14, 2024

It looks like you haven't successfully installed the PR #98 branch of mlens: the error comes from the same line as before, and that line is fixed in the PR.

The key line in your traceback is 69 in the snippet below:

```
D:\Continuum\anaconda3\lib\site-packages\mlens\parallel\_base_functions.py in replace(source_files)
     67 def replace(source_files):
     68     """Utility function to replace empty files list"""
---> 69     # replace_files = [deepcopy(o) for o in source_files]
     70     replace_files = source_files.copy()
     71     for o in replace_files:
```

This is strange, because line 69 appears to be commented out and should not be executed at all. More to the point, in PR #98 this line does not even exist; in fact, the file the traceback is pointing to (mlens\parallel\_base_functions.py) doesn't exist in v2 at all.

It looks like you're not running the actual PR #98 branch, but something else. If you have your own version, you can simply remove the offending line. To install the PR, run:

```
pip uninstall mlens
git clone https://github.com/flennerhag/mlens; cd mlens
git fetch
git checkout deepcopy
pip install .
```


onacrame avatar onacrame commented on May 14, 2024

Great thanks that works!


flennerhag avatar flennerhag commented on May 14, 2024

That's likely because you are using multithreading / multiprocessing in the KerasClassifier (which was why you got the first error). Would you mind checking a few things:

  • first, can you turn multithreading / processing off in the classifier?

  • second, does it fail under both backend=threading and backend=multiprocessing?

  • third, if it fails under backend=multiprocessing, could you try using different start methods: i.e. at the top of your script, after the imports, add mlens.config.set_start_method(method) where method is one of 'fork', 'spawn', 'forkserver'.
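As a quick sanity check before trying the third point (plain stdlib, independent of mlens), you can list which start methods your platform actually supports:

```python
import multiprocessing as mp

# 'spawn' is available on every platform and is the only option on
# Windows; 'fork' and 'forkserver' are POSIX-only. mlens's
# mlens.config.set_start_method accepts the same names. 'spawn' starts
# a fresh interpreter per worker, which sidesteps state (such as locks)
# that cannot survive a fork.
methods = mp.get_all_start_methods()
print(methods)
```

On Windows this prints `['spawn']`, which is why 'fork' and 'forkserver' are not worth trying there.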


onacrame avatar onacrame commented on May 14, 2024

> That's likely because you are using multithreading / multiprocessing in the KerasClassifier (which was why you got the first error). Would you mind checking a few things:
>
> first, can you turn multithreading / processing off in the classifier?
>
> second, does it fail under both backend=threading and backend=multiprocessing?
>
> third, if it fails under backend=multiprocessing, could you try using different start methods: i.e. at the top of your script, after the imports, add mlens.config.set_start_method(method) where method is one of 'fork', 'spawn', 'forkserver'.

I had looked into whether Keras can be forced into single-threaded mode. I found some code to do that, but it did not work in my case.

keras-team/keras#4740
tensorflow/tensorflow#11066

This one goes into some issues with Keras and joblib
keras-team/keras#3181

I had been using the TensorFlow backend. I was able to solve the problem by switching to the CNTK backend (I've not tried Theano).

To answer your other questions: prior to switching to the CNTK backend, I tried your multiprocessing suggestions.

In the first instance, multiprocessing just seemed to hang in the preprocessing phase. I tried 'fork' and 'forkserver', but that did not help. I checked my Task Manager and there were some additional processes in the background, but they seemed to be using very little memory or CPU.

I tried the 'spawn' option next. That did get me past the preprocessing phase, but it hung when it got to the KerasClassifier model.

I should mention that I was able to use KerasClassifier with the TensorFlow backend and n_jobs=-1 in one circumstance: when it was the only model in a layer. A KerasClassifier as a sole layer would run just fine, but once other models were in that layer it failed.

Anyway, I think the short-term solution for anyone with this same issue is to switch the Keras backend, since the TensorFlow backend creates these problems.
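For anyone hitting the same wall: switching the Keras backend doesn't require code changes; it's standard Keras configuration (the script name below is a placeholder):

```shell
# One-off: select the backend for a single run via environment variable
KERAS_BACKEND=cntk python ensemble_script.py

# Or persistently: edit ~/.keras/keras.json and set
#   "backend": "cntk"
```

Keras prints the active backend ("Using CNTK backend", etc.) on import, so it's easy to confirm which one is in play.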

This is my script by the way. This was just a simple example I was testing this package with to get a feel for how it works using the Pima Indians data.

```python
from sklearn.ensemble import GradientBoostingClassifier
from sklearn.preprocessing import MinMaxScaler
import pandas as pd
import numpy as np
from mlens.ensemble import SuperLearner
from sklearn.linear_model import LogisticRegression
from keras.wrappers.scikit_learn import KerasClassifier
from keras.models import Sequential
from keras.layers import Dense
import mlens

mlens.config.set_start_method('spawn')

data = pd.read_csv('d:/PimaIndians.csv')

X = data.drop('test', axis=1).values
y = data['test'].values

seed = 2017
np.random.seed(seed)

def create_model(optimizer='adam', init='uniform'):
    # create model
    model = Sequential()
    model.add(Dense(16, input_dim=4, kernel_initializer=init, activation='relu'))
    model.add(Dense(8, kernel_initializer=init, activation='relu'))
    model.add(Dense(1, kernel_initializer=init, activation='sigmoid'))
    # Compile model
    model.compile(loss='binary_crossentropy', optimizer=optimizer)
    return model

ensemble = SuperLearner(random_state=seed, verbose=10, n_jobs=-1, backend='multiprocessing')

# Build the first layer
ensemble.add([GradientBoostingClassifier(random_state=seed), LogisticRegression()],
             preprocessing=MinMaxScaler(), proba=True)

# Build the second layer
ensemble.add([KerasClassifier(build_fn=create_model, epochs=5, batch_size=10),
              LogisticRegression(penalty='l1'), LogisticRegression(penalty='l2')],
             preprocessing=MinMaxScaler(), proba=True)

# Attach the final meta estimator
ensemble.add_meta([LogisticRegression(penalty='l1')], proba=True)

ensemble.fit(X[:294], y[:294])
```

By the way, I noticed that when I do include a neural network in the ensemble, with, for example, two models feeding into it from the preceding layer, its expected input dimension is 4. Do you know why that is?

E.g.
Layer1: RandomForest, Logistic Regression
Layer2: Neural Network

I would have expected the input dimension for the neural network to be 2 rather than 4. I'm always using probabilities via the proba keyword. Is Layer 1 sending both the predicted class and the probability downstream, or is it sending both class probabilities for a given sample (e.g. 95% and 5%)?

Is there a way to see the predictions of the individual layers?


flennerhag avatar flennerhag commented on May 14, 2024

That’s super helpful, thanks! I think TF has its own process manager, and two chefs don’t make a good soup. It’s weird that it works when it’s the only model in the layer, though; that makes me think it’s the other models that hang because of TF, and not the KerasClassifier itself.


flennerhag avatar flennerhag commented on May 14, 2024

And as for your other question, the input dim is n_models * n_classes. If you use subsembles, it is additionally multiplied by the number of partitions. It’s a bit redundant to feed in all n_classes, but fixing it is not a priority.
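The width rule above can be written down as a one-liner (an illustrative helper, not part of the mlens API):

```python
def layer_output_width(n_models: int, n_classes: int, n_partitions: int = 1) -> int:
    """Columns a layer emits with proba=True: one column per class per
    model, multiplied by the number of partitions when using subsembles."""
    return n_models * n_classes * n_partitions

# The example from this thread: two models on a binary problem feed
# the next layer's network 2 * 2 = 4 input features.
print(layer_output_width(2, 2))  # → 4
```

So the network sees both class probabilities from each upstream model, which is why the input dimension is 4 rather than 2.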

And yes, you can see the predictions of a layer by specifying the return_preds argument in the fit or predict call. Set it to a list to get multiple layers at a time.


onacrame avatar onacrame commented on May 14, 2024

Gotcha, thanks!

