Open
Description
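On Windows, a UnicodeEncodeError is raised when using split_wiki, because the output file is opened with `.open('w')` and no explicit encoding, so the platform default codec (cp1252) is used and cannot encode characters such as '\u0103':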
----> 1 dest = split_wiki(path,lang)
~\projects\forks\course-nlp\nlputils.py in split_wiki(path, lang, encoding)
46 if f: f.close()
47 f = (dest/f'{title}.txt').open('w')
---> 48 else: f.write(l)
49 f.close()
50 return dest
~\AppData\Local\Continuum\anaconda3\envs\fastai-v1-py37\lib\encodings\cp1252.py in encode(self, input, final)
17 class IncrementalEncoder(codecs.IncrementalEncoder):
18 def encode(self, input, final=False):
---> 19 return codecs.charmap_encode(input,self.errors,encoding_table)[0]
20
21 class IncrementalDecoder(codecs.IncrementalDecoder):
UnicodeEncodeError: 'charmap' codec can't encode character '\u0103' in position 21: character maps to <undefined>
Metadata
Metadata
Assignees
Labels
No labels