I tried this as well, and again I ran into the very same error…
EDIT: I transferred all the code from the Jupyter Notebook into a plain .py
script and ran the relevant part again, and I now receive a different error message. I'm not sure, though, whether this helps to get closer to the issue:
Using custom data configuration default-8f1dcd17d8b8834c
Reusing dataset text (C:\Users\s_scho53\.cache\huggingface\datasets\text\default-8f1dcd17d8b8834c\0.0.0\e16f44aa1b321ece1f87b07977cc5d70be93d69b20486d6dacd62e12cf25c9a5)
Token indices sequence length is longer than the specified maximum sequence length for this model (4078 > 512). Running this sequence through the model will result in indexing errors
Using custom data configuration default-8f1dcd17d8b8834c
Reusing dataset text (C:\Users\s_scho53\.cache\huggingface\datasets\text\default-8f1dcd17d8b8834c\0.0.0\e16f44aa1b321ece1f87b07977cc5d70be93d69b20486d6dacd62e12cf25c9a5)
Using custom data configuration default-8f1dcd17d8b8834c
Reusing dataset text (C:\Users\s_scho53\.cache\huggingface\datasets\text\default-8f1dcd17d8b8834c\0.0.0\e16f44aa1b321ece1f87b07977cc5d70be93d69b20486d6dacd62e12cf25c9a5)
Token indices sequence length is longer than the specified maximum sequence length for this model (4078 > 512). Running this sequence through the model will result in indexing errors
Token indices sequence length is longer than the specified maximum sequence length for this model (4078 > 512). Running this sequence through the model will result in indexing errors
Traceback (most recent call last):
File "<string>", line 1, in <module>
Traceback (most recent call last):
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 116, in spawn_main
File "<string>", line 1, in <module>
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 116, in spawn_main
exitcode = _main(fd, parent_sentinel)
exitcode = _main(fd, parent_sentinel)
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 125, in _main
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 125, in _main
prepare(preparation_data)
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 236, in prepare
prepare(preparation_data)
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 236, in prepare
_fixup_main_from_path(data['init_main_from_path'])
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 287, in _fixup_main_from_path
_fixup_main_from_path(data['init_main_from_path'])
main_content = runpy.run_path(main_path, File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 287, in _fixup_main_from_path
File "C:\Python\lib\runpy.py", line 265, in run_path
main_content = runpy.run_path(main_path,
File "C:\Python\lib\runpy.py", line 265, in run_path
return _run_module_code(code, init_globals, run_name, return _run_module_code(code, init_globals, run_name,
File "C:\Python\lib\runpy.py", line 97, in _run_module_code
File "C:\Python\lib\runpy.py", line 97, in _run_module_code
_run_code(code, mod_globals, init_globals,_run_code(code, mod_globals, init_globals,
File "C:\Python\lib\runpy.py", line 87, in _run_code
File "C:\Python\lib\runpy.py", line 87, in _run_code
exec(code, run_globals)exec(code, run_globals)
File "c:\Users\s_scho53\Desktop\L09_Desktop\_FiLMo\Untitled-1.py", line 41, in <module>
File "c:\Users\s_scho53\Desktop\L09_Desktop\_FiLMo\Untitled-1.py", line 41, in <module>
datasets = datasets.map(datasets = datasets.map(
File "C:\Python\lib\site-packages\datasets\dataset_dict.py", line 432, in map
File "C:\Python\lib\site-packages\datasets\dataset_dict.py", line 432, in map
{{
File "C:\Python\lib\site-packages\datasets\dataset_dict.py", line 433, in <dictcomp>
File "C:\Python\lib\site-packages\datasets\dataset_dict.py", line 433, in <dictcomp>
k: dataset.map(
File "C:\Python\lib\site-packages\datasets\arrow_dataset.py", line 1452, in map
k: dataset.map(
File "C:\Python\lib\site-packages\datasets\arrow_dataset.py", line 1452, in map
with Pool(num_proc, initargs=(RLock(),), initializer=tqdm.set_lock) as pool:with Pool(num_proc, initargs=(RLock(),), initializer=tqdm.set_lock) as pool:
File "C:\Python\lib\site-packages\multiprocess\context.py", line 119, in Pool
File "C:\Python\lib\site-packages\multiprocess\context.py", line 119, in Pool
return Pool(processes, initializer, initargs, maxtasksperchild,return Pool(processes, initializer, initargs, maxtasksperchild,
File "C:\Python\lib\site-packages\multiprocess\pool.py", line 212, in __init__
File "C:\Python\lib\site-packages\multiprocess\pool.py", line 212, in __init__
self._repopulate_pool()self._repopulate_pool()
File "C:\Python\lib\site-packages\multiprocess\pool.py", line 303, in _repopulate_pool
File "C:\Python\lib\site-packages\multiprocess\pool.py", line 303, in _repopulate_pool
return self._repopulate_pool_static(self._ctx, self.Process,
return self._repopulate_pool_static(self._ctx, self.Process, File "C:\Python\lib\site-packages\multiprocess\pool.py", line 326, in _repopulate_pool_static
File "C:\Python\lib\site-packages\multiprocess\pool.py", line 326, in _repopulate_pool_static
w.start()
File "C:\Python\lib\site-packages\multiprocess\process.py", line 121, in start
w.start()
File "C:\Python\lib\site-packages\multiprocess\process.py", line 121, in start
self._popen = self._Popen(self)
File "C:\Python\lib\site-packages\multiprocess\context.py", line 327, in _Popen
self._popen = self._Popen(self)
File "C:\Python\lib\site-packages\multiprocess\context.py", line 327, in _Popen
return Popen(process_obj)
File "C:\Python\lib\site-packages\multiprocess\popen_spawn_win32.py", line 45, in __init__
return Popen(process_obj)
File "C:\Python\lib\site-packages\multiprocess\popen_spawn_win32.py", line 45, in __init__
prep_data = spawn.get_preparation_data(process_obj._name)
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 154, in get_preparation_data
prep_data = spawn.get_preparation_data(process_obj._name)
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 154, in get_preparation_data
_check_not_importing_main()
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 134, in _check_not_importing_main
_check_not_importing_main()
File "C:\Python\lib\site-packages\multiprocess\spawn.py", line 134, in _check_not_importing_main
raise RuntimeError('''
RuntimeError: raise RuntimeError('''
An attempt has been made to start a new process before the
current process has finished its bootstrapping phase.
This probably means that you are not using fork to start your
child processes and you have forgotten to use the proper idiom
in the main module:
if __name__ == '__main__':
freeze_support()
...
The "freeze_support()" line can be omitted if the program
is not going to be frozen to produce an executable.
RuntimeError:
An attempt has been made to start a new process before the
current process has finished its bootstrapping phase.
This probably means that you are not using fork to start your
child processes and you have forgotten to use the proper idiom
in the main module:
if __name__ == '__main__':
freeze_support()
...
The "freeze_support()" line can be omitted if the program
is not going to be frozen to produce an executable.