UnicodeEncodeError: 'ascii' codec can't encode characters in position 18-23: ordinal not in range(128)
UnicodeEncodeError: 'ascii' codec can't encode characters in position 18-23: ordinal not in range(128)
我试图拟合模型,但出现了一个奇怪的错误
所以,我有 Win10(64),Python 3.7
这是我的代码:
clf = LogisticRegression(solver='saga')
param_grid = {
'C': np.arange(1, 5),
'penalty': ['l1', 'l2'],
}
search = GridSearchCV(clf, param_grid, n_jobs=-1, cv=5, refit=True, scoring='accuracy')
search.fit(feature_matrix, labels)
这是回溯:
---------------------------------------------------------------------------
UnicodeEncodeError Traceback (most recent call last)
<ipython-input-13-93a1aa3c1ec2> in <module>
12
13
---> 14 search.fit(feature_matrix, labels)
15
C:\Anaconda3\lib\site-packages\sklearn\utils\validation.py in inner_f(*args, **kwargs)
71 FutureWarning)
72 kwargs.update({k: arg for k, arg in zip(sig.parameters, args)})
---> 73 return f(**kwargs)
74 return inner_f
75
C:\Anaconda3\lib\site-packages\sklearn\model_selection\_search.py in fit(self, X, y, groups, **fit_params)
693 verbose=self.verbose)
694 results = {}
--> 695 with parallel:
696 all_candidate_params = []
697 all_out = []
C:\Anaconda3\lib\site-packages\joblib\parallel.py in __enter__(self)
709 def __enter__(self):
710 self._managed_backend = True
--> 711 self._initialize_backend()
712 return self
713
C:\Anaconda3\lib\site-packages\joblib\parallel.py in _initialize_backend(self)
720 try:
721 n_jobs = self._backend.configure(n_jobs=self.n_jobs, parallel=self,
--> 722 **self._backend_args)
723 if self.timeout is not None and not self._backend.supports_timeout:
724 warnings.warn(
C:\Anaconda3\lib\site-packages\joblib\_parallel_backends.py in configure(self, n_jobs, parallel, prefer, require, idle_worker_timeout, **memmappingexecutor_args)
495 n_jobs, timeout=idle_worker_timeout,
496 env=self._prepare_worker_env(n_jobs=n_jobs),
--> 497 context_id=parallel._id, **memmappingexecutor_args)
498 self.parallel = parallel
499 return n_jobs
C:\Anaconda3\lib\site-packages\joblib\executor.py in get_memmapping_executor(n_jobs, **kwargs)
18
19 def get_memmapping_executor(n_jobs, **kwargs):
---> 20 return MemmappingExecutor.get_memmapping_executor(n_jobs, **kwargs)
21
22
C:\Anaconda3\lib\site-packages\joblib\executor.py in get_memmapping_executor(cls, n_jobs, timeout, initializer, initargs, env, temp_folder, context_id, **backend_args)
40 _executor_args = executor_args
41
---> 42 manager = TemporaryResourcesManager(temp_folder)
43
44 # reducers access the temporary folder in which to store temporary
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in __init__(self, temp_folder_root, context_id)
529 # exposes exposes too many low-level details.
530 context_id = uuid4().hex
--> 531 self.set_current_context(context_id)
532
533 def set_current_context(self, context_id):
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in set_current_context(self, context_id)
533 def set_current_context(self, context_id):
534 self._current_context_id = context_id
--> 535 self.register_new_context(context_id)
536
537 def register_new_context(self, context_id):
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in register_new_context(self, context_id)
558 new_folder_name, self._temp_folder_root
559 )
--> 560 self.register_folder_finalizer(new_folder_path, context_id)
561 self._cached_temp_folders[context_id] = new_folder_path
562
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in register_folder_finalizer(self, pool_subfolder, context_id)
588 # semaphores and pipes
589 pool_module_name = whichmodule(delete_folder, 'delete_folder')
--> 590 resource_tracker.register(pool_subfolder, "folder")
591
592 def _cleanup():
C:\Anaconda3\lib\site-packages\joblib\externals\loky\backend\resource_tracker.py in register(self, name, rtype)
189 '''Register a named resource, and increment its refcount.'''
190 self.ensure_running()
--> 191 self._send('REGISTER', name, rtype)
192
193 def unregister(self, name, rtype):
C:\Anaconda3\lib\site-packages\joblib\externals\loky\backend\resource_tracker.py in _send(self, cmd, name, rtype)
202
203 def _send(self, cmd, name, rtype):
--> 204 msg = '{0}:{1}:{2}\n'.format(cmd, name, rtype).encode('ascii')
205 if len(name) > 512:
206 # posix guarantees that writes to a pipe of less than PIPE_BUF
UnicodeEncodeError: 'ascii' codec can't encode characters in position 18-23: ordinal not in range(128)
我试图通过剪切 .encode('ascii') 来修复 _send,但它对我没有帮助。它会生成另一个错误(需要一个类似字节的对象,而不是 'str'),其中包含来自上面回溯的变量 msg
我正在寻找有关此的建议。非常感谢。
尝试使用 utf-8
编码。
msg = '{0}:{1}:{2}\n'.format(cmd, name, rtype).encode('utf-8')
这些消息通常意味着您正在尝试将 Unicode strings
与 8-bit strings
混合,或者正在尝试将 Unicode 字符串写入仅处理 ASCII
的输出文件或设备.
执行此操作时,Python 通常会假定 8 位字符串仅包含 ASCII 数据,如果不是这样,则会引发错误。
在输入时避免这种情况的最佳方法是 convert all incoming strings to Unicode
,以 Unicode 进行处理,然后在输出时转换回编码字节字符串。
我试图拟合模型,但出现了一个奇怪的错误 所以,我有 Win10(64),Python 3.7 这是我的代码:
clf = LogisticRegression(solver='saga')
param_grid = {
'C': np.arange(1, 5),
'penalty': ['l1', 'l2'],
}
search = GridSearchCV(clf, param_grid, n_jobs=-1, cv=5, refit=True, scoring='accuracy')
search.fit(feature_matrix, labels)
这是回溯:
---------------------------------------------------------------------------
UnicodeEncodeError Traceback (most recent call last)
<ipython-input-13-93a1aa3c1ec2> in <module>
12
13
---> 14 search.fit(feature_matrix, labels)
15
C:\Anaconda3\lib\site-packages\sklearn\utils\validation.py in inner_f(*args, **kwargs)
71 FutureWarning)
72 kwargs.update({k: arg for k, arg in zip(sig.parameters, args)})
---> 73 return f(**kwargs)
74 return inner_f
75
C:\Anaconda3\lib\site-packages\sklearn\model_selection\_search.py in fit(self, X, y, groups, **fit_params)
693 verbose=self.verbose)
694 results = {}
--> 695 with parallel:
696 all_candidate_params = []
697 all_out = []
C:\Anaconda3\lib\site-packages\joblib\parallel.py in __enter__(self)
709 def __enter__(self):
710 self._managed_backend = True
--> 711 self._initialize_backend()
712 return self
713
C:\Anaconda3\lib\site-packages\joblib\parallel.py in _initialize_backend(self)
720 try:
721 n_jobs = self._backend.configure(n_jobs=self.n_jobs, parallel=self,
--> 722 **self._backend_args)
723 if self.timeout is not None and not self._backend.supports_timeout:
724 warnings.warn(
C:\Anaconda3\lib\site-packages\joblib\_parallel_backends.py in configure(self, n_jobs, parallel, prefer, require, idle_worker_timeout, **memmappingexecutor_args)
495 n_jobs, timeout=idle_worker_timeout,
496 env=self._prepare_worker_env(n_jobs=n_jobs),
--> 497 context_id=parallel._id, **memmappingexecutor_args)
498 self.parallel = parallel
499 return n_jobs
C:\Anaconda3\lib\site-packages\joblib\executor.py in get_memmapping_executor(n_jobs, **kwargs)
18
19 def get_memmapping_executor(n_jobs, **kwargs):
---> 20 return MemmappingExecutor.get_memmapping_executor(n_jobs, **kwargs)
21
22
C:\Anaconda3\lib\site-packages\joblib\executor.py in get_memmapping_executor(cls, n_jobs, timeout, initializer, initargs, env, temp_folder, context_id, **backend_args)
40 _executor_args = executor_args
41
---> 42 manager = TemporaryResourcesManager(temp_folder)
43
44 # reducers access the temporary folder in which to store temporary
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in __init__(self, temp_folder_root, context_id)
529 # exposes exposes too many low-level details.
530 context_id = uuid4().hex
--> 531 self.set_current_context(context_id)
532
533 def set_current_context(self, context_id):
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in set_current_context(self, context_id)
533 def set_current_context(self, context_id):
534 self._current_context_id = context_id
--> 535 self.register_new_context(context_id)
536
537 def register_new_context(self, context_id):
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in register_new_context(self, context_id)
558 new_folder_name, self._temp_folder_root
559 )
--> 560 self.register_folder_finalizer(new_folder_path, context_id)
561 self._cached_temp_folders[context_id] = new_folder_path
562
C:\Anaconda3\lib\site-packages\joblib\_memmapping_reducer.py in register_folder_finalizer(self, pool_subfolder, context_id)
588 # semaphores and pipes
589 pool_module_name = whichmodule(delete_folder, 'delete_folder')
--> 590 resource_tracker.register(pool_subfolder, "folder")
591
592 def _cleanup():
C:\Anaconda3\lib\site-packages\joblib\externals\loky\backend\resource_tracker.py in register(self, name, rtype)
189 '''Register a named resource, and increment its refcount.'''
190 self.ensure_running()
--> 191 self._send('REGISTER', name, rtype)
192
193 def unregister(self, name, rtype):
C:\Anaconda3\lib\site-packages\joblib\externals\loky\backend\resource_tracker.py in _send(self, cmd, name, rtype)
202
203 def _send(self, cmd, name, rtype):
--> 204 msg = '{0}:{1}:{2}\n'.format(cmd, name, rtype).encode('ascii')
205 if len(name) > 512:
206 # posix guarantees that writes to a pipe of less than PIPE_BUF
UnicodeEncodeError: 'ascii' codec can't encode characters in position 18-23: ordinal not in range(128)
我试图通过剪切 .encode('ascii') 来修复 _send,但它对我没有帮助。它会生成另一个错误(需要一个类似字节的对象,而不是 'str'),其中包含来自上面回溯的变量 msg 我正在寻找有关此的建议。非常感谢。
尝试使用 utf-8
编码。
msg = '{0}:{1}:{2}\n'.format(cmd, name, rtype).encode('utf-8')
这些消息通常意味着您正在尝试将 Unicode strings
与 8-bit strings
混合,或者正在尝试将 Unicode 字符串写入仅处理 ASCII
的输出文件或设备.
执行此操作时,Python 通常会假定 8 位字符串仅包含 ASCII 数据,如果不是这样,则会引发错误。
在输入时避免这种情况的最佳方法是 convert all incoming strings to Unicode
,以 Unicode 进行处理,然后在输出时转换回编码字节字符串。