|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
"""Utilities to handle file locking in `datasets`.""" |
|
|
|
import os |
|
|
|
from filelock import FileLock as FileLock_ |
|
from filelock import UnixFileLock |
|
from filelock import __version__ as _filelock_version |
|
from packaging import version |
|
|
|
|
|
class FileLock(FileLock_): |
|
""" |
|
A `filelock.FileLock` initializer that handles long paths. |
|
It also uses the current umask for lock files. |
|
""" |
|
|
|
MAX_FILENAME_LENGTH = 255 |
|
|
|
def __init__(self, lock_file, *args, **kwargs): |
|
|
|
|
|
if "mode" not in kwargs and version.parse(_filelock_version) >= version.parse("3.10.0"): |
|
umask = os.umask(0o666) |
|
os.umask(umask) |
|
kwargs["mode"] = 0o666 & ~umask |
|
lock_file = self.hash_filename_if_too_long(lock_file) |
|
super().__init__(lock_file, *args, **kwargs) |
|
|
|
@classmethod |
|
def hash_filename_if_too_long(cls, path: str) -> str: |
|
path = os.path.abspath(os.path.expanduser(path)) |
|
filename = os.path.basename(path) |
|
max_filename_length = cls.MAX_FILENAME_LENGTH |
|
if issubclass(cls, UnixFileLock): |
|
max_filename_length = min(max_filename_length, os.statvfs(os.path.dirname(path)).f_namemax) |
|
if len(filename) > max_filename_length: |
|
dirname = os.path.dirname(path) |
|
hashed_filename = str(hash(filename)) |
|
new_filename = ( |
|
filename[: max_filename_length - len(hashed_filename) - 8] + "..." + hashed_filename + ".lock" |
|
) |
|
return os.path.join(dirname, new_filename) |
|
else: |
|
return path |
|
|