mirror of
https://github.com/LmeSzinc/AzurLaneAutoScript.git
synced 2025-04-04 04:01:20 +08:00
Upd: [ALAS] atomic_failure_cleanup
This commit is contained in:
parent
19db66157e
commit
7a782138b6
259
deploy/atomic.py
259
deploy/atomic.py
@ -5,8 +5,13 @@ import string
|
||||
import time
|
||||
from typing import Union
|
||||
|
||||
# Max attempt if another process is reading/writing, effective only on Windows
|
||||
WINDOWS_MAX_ATTEMPT = 5
|
||||
# Base time to wait between retries (seconds)
|
||||
WINDOWS_RETRY_DELAY = 0.05
|
||||
|
||||
def random_id(length=6):
|
||||
|
||||
def random_id(length: int = 6) -> str:
|
||||
"""
|
||||
Args:
|
||||
length (int): 6 random letter (62^6 combinations) would be enough
|
||||
@ -17,11 +22,44 @@ def random_id(length=6):
|
||||
return ''.join(random.sample(string.ascii_letters + string.digits, length))
|
||||
|
||||
|
||||
def is_tmp_file(filename: str) -> bool:
|
||||
"""
|
||||
Check if a filename is tmp file
|
||||
"""
|
||||
# Check suffix first to reduce regex calls
|
||||
if not filename.endswith('.tmp'):
|
||||
return False
|
||||
# Check temp file format
|
||||
res = re.match(r'.*\.[a-zA-Z0-9]{6,}\.tmp$', filename)
|
||||
if not res:
|
||||
return False
|
||||
return True
|
||||
|
||||
|
||||
def to_tmp_file(filename: str) -> str:
|
||||
"""
|
||||
Convert a filename or directory name to tmp
|
||||
"""
|
||||
suffix = random_id(6)
|
||||
return f'{filename}.{suffix}.tmp'
|
||||
|
||||
|
||||
def windows_attempt_delay(attempt: int) -> float:
|
||||
"""
|
||||
Exponential Backoff if file is in use on Windows
|
||||
|
||||
Args:
|
||||
attempt: Current attempt, starting from 0
|
||||
|
||||
Returns:
|
||||
float: Seconds to wait
|
||||
"""
|
||||
return 2 ** attempt * WINDOWS_RETRY_DELAY
|
||||
|
||||
|
||||
def atomic_write(
|
||||
file: str,
|
||||
data: Union[str, bytes],
|
||||
max_attempt=5,
|
||||
retry_delay=0.05,
|
||||
):
|
||||
"""
|
||||
Atomic file write with minimal IO operation
|
||||
@ -33,12 +71,8 @@ def atomic_write(
|
||||
Args:
|
||||
file:
|
||||
data:
|
||||
max_attempt: Max attempt if another process is reading,
|
||||
effective only on Windows
|
||||
retry_delay: Base time to wait between retries (seconds)
|
||||
"""
|
||||
suffix = random_id(6)
|
||||
temp = f'{file}.{suffix}.tmp'
|
||||
temp = to_tmp_file(file)
|
||||
if isinstance(data, str):
|
||||
mode = 'w'
|
||||
encoding = 'utf-8'
|
||||
@ -74,9 +108,7 @@ def atomic_write(
|
||||
if os.name == 'nt':
|
||||
# PermissionError on Windows if another process is reading
|
||||
last_error = None
|
||||
if max_attempt < 1:
|
||||
max_attempt = 1
|
||||
for trial in range(max_attempt):
|
||||
for attempt in range(WINDOWS_MAX_ATTEMPT):
|
||||
try:
|
||||
# Atomic operation
|
||||
os.replace(temp, file)
|
||||
@ -84,7 +116,111 @@ def atomic_write(
|
||||
return
|
||||
except PermissionError as e:
|
||||
last_error = e
|
||||
delay = 2 ** trial * retry_delay
|
||||
delay = windows_attempt_delay(attempt)
|
||||
time.sleep(delay)
|
||||
continue
|
||||
except Exception as e:
|
||||
last_error = e
|
||||
break
|
||||
else:
|
||||
# Linux and Mac allow existing reading
|
||||
try:
|
||||
# Atomic operation
|
||||
os.replace(temp, file)
|
||||
# success
|
||||
return
|
||||
except Exception as e:
|
||||
last_error = e
|
||||
|
||||
# Clean up temp file on failure
|
||||
try:
|
||||
os.unlink(temp)
|
||||
except:
|
||||
pass
|
||||
if last_error is not None:
|
||||
raise last_error from None
|
||||
|
||||
|
||||
def atomic_stream_write(
|
||||
file: str,
|
||||
data_generator,
|
||||
):
|
||||
"""
|
||||
Atomic file write with streaming data support.
|
||||
Handles cases where file might be read by another process.
|
||||
os.replace() is an atomic operation among all OS,
|
||||
we write to temp file then do os.replace()
|
||||
|
||||
Only creates a file if the generator yields at least one data chunk.
|
||||
Automatically determines write mode based on the type of first chunk.
|
||||
|
||||
Args:
|
||||
file: Target file path
|
||||
data_generator: An iterable that yields data chunks (str or bytes)
|
||||
"""
|
||||
# Convert generator to iterator to ensure we can peek at first chunk
|
||||
data_iter = iter(data_generator)
|
||||
|
||||
# Try to get the first chunk
|
||||
try:
|
||||
first_chunk = next(data_iter)
|
||||
except StopIteration:
|
||||
# Generator is empty, no file will be created
|
||||
return
|
||||
|
||||
# Create temp file path
|
||||
temp = to_tmp_file(file)
|
||||
|
||||
# Determine mode, encoding and newline from first chunk
|
||||
if isinstance(first_chunk, str):
|
||||
mode = 'w'
|
||||
encoding = 'utf-8'
|
||||
newline = ''
|
||||
elif isinstance(first_chunk, bytes):
|
||||
mode = 'wb'
|
||||
encoding = None
|
||||
newline = None
|
||||
else:
|
||||
# Default to text mode for other types
|
||||
mode = 'w'
|
||||
encoding = 'utf-8'
|
||||
newline = ''
|
||||
|
||||
try:
|
||||
# Write temp file
|
||||
with open(temp, mode=mode, encoding=encoding, newline=newline) as f:
|
||||
f.write(first_chunk)
|
||||
for chunk in data_iter:
|
||||
f.write(chunk)
|
||||
# Ensure data flush to disk
|
||||
f.flush()
|
||||
os.fsync(f.fileno())
|
||||
except FileNotFoundError:
|
||||
# Create parent directory
|
||||
directory = os.path.dirname(file)
|
||||
if directory:
|
||||
os.makedirs(directory, exist_ok=True)
|
||||
# Write again
|
||||
with open(temp, mode=mode, encoding=encoding, newline=newline) as f:
|
||||
f.write(first_chunk)
|
||||
for chunk in data_iter:
|
||||
f.write(chunk)
|
||||
# Ensure data flush to disk
|
||||
f.flush()
|
||||
os.fsync(f.fileno())
|
||||
|
||||
last_error = None
|
||||
if os.name == 'nt':
|
||||
# PermissionError on Windows if another process is reading
|
||||
for attempt in range(WINDOWS_MAX_ATTEMPT):
|
||||
try:
|
||||
# Atomic operation
|
||||
os.replace(temp, file)
|
||||
# success
|
||||
return
|
||||
except PermissionError as e:
|
||||
last_error = e
|
||||
delay = windows_attempt_delay(attempt)
|
||||
time.sleep(delay)
|
||||
continue
|
||||
except Exception as e:
|
||||
@ -113,8 +249,6 @@ def atomic_read(
|
||||
file: str,
|
||||
mode: str = 'r',
|
||||
errors: str = 'strict',
|
||||
max_attempt=5,
|
||||
retry_delay=0.05,
|
||||
):
|
||||
"""
|
||||
Atomic file read with minimal IO operation
|
||||
@ -124,9 +258,6 @@ def atomic_read(
|
||||
file:
|
||||
mode: 'r' or 'rb'
|
||||
errors: 'strict', 'ignore', 'replace' and any other errors mode in open()
|
||||
max_attempt: Max attempt if another process is reading,
|
||||
effective only on Windows
|
||||
retry_delay: Base time to wait between retries (seconds)
|
||||
|
||||
Returns:
|
||||
str if mode is 'r'
|
||||
@ -141,9 +272,7 @@ def atomic_read(
|
||||
if os.name == 'nt':
|
||||
# PermissionError on Windows if another process is replacing
|
||||
last_error = None
|
||||
if max_attempt < 1:
|
||||
max_attempt = 1
|
||||
for trial in range(max_attempt):
|
||||
for attempt in range(WINDOWS_MAX_ATTEMPT):
|
||||
try:
|
||||
with open(file, mode=mode, encoding=encoding, errors=errors) as f:
|
||||
# success
|
||||
@ -152,12 +281,9 @@ def atomic_read(
|
||||
return ''
|
||||
except PermissionError as e:
|
||||
last_error = e
|
||||
delay = 2 ** trial * retry_delay
|
||||
delay = windows_attempt_delay(attempt)
|
||||
time.sleep(delay)
|
||||
continue
|
||||
except Exception as e:
|
||||
last_error = e
|
||||
break
|
||||
if last_error is not None:
|
||||
raise last_error from None
|
||||
else:
|
||||
@ -170,7 +296,39 @@ def atomic_read(
|
||||
return ''
|
||||
|
||||
|
||||
def atomic_failure_cleanup(path: str):
|
||||
def atomic_remove(file: str):
|
||||
"""
|
||||
Atomic file remove
|
||||
|
||||
Args:
|
||||
file:
|
||||
"""
|
||||
if os.name == 'nt':
|
||||
# PermissionError on Windows if another process is replacing
|
||||
last_error = None
|
||||
for attempt in range(WINDOWS_MAX_ATTEMPT):
|
||||
try:
|
||||
os.unlink(file)
|
||||
except FileNotFoundError:
|
||||
return
|
||||
except PermissionError as e:
|
||||
last_error = e
|
||||
delay = windows_attempt_delay(attempt)
|
||||
time.sleep(delay)
|
||||
continue
|
||||
if last_error is not None:
|
||||
raise last_error from None
|
||||
else:
|
||||
# Linux and Mac allow deleting while another process is reading
|
||||
# The directory entry is removed but the storage allocated to the file is not made available
|
||||
# until the original file is no longer in use.
|
||||
try:
|
||||
os.unlink(file)
|
||||
except FileNotFoundError:
|
||||
return
|
||||
|
||||
|
||||
def atomic_failure_cleanup(directory: str, recursive: bool = False):
|
||||
"""
|
||||
Cleanup remaining temp file under given path.
|
||||
In most cases there should be no remaining temp files unless write process get interrupted.
|
||||
@ -178,24 +336,33 @@ def atomic_failure_cleanup(path: str):
|
||||
This method should only be called at startup
|
||||
to avoid deleting temp files that another process is writing.
|
||||
"""
|
||||
with os.scandir(path) as entries:
|
||||
for entry in entries:
|
||||
if not entry.is_file():
|
||||
continue
|
||||
# Check suffix first to reduce regex calls
|
||||
name = entry.name
|
||||
if not name.endswith('.tmp'):
|
||||
continue
|
||||
# Check temp file format
|
||||
res = re.match(r'.*\.[a-zA-Z0-9]{6,}\.tmp$', name)
|
||||
if not res:
|
||||
continue
|
||||
# Delete temp file
|
||||
file = f'{path}{os.sep}{name}'
|
||||
try:
|
||||
os.unlink(file)
|
||||
except PermissionError:
|
||||
# Another process is reading/writing
|
||||
pass
|
||||
except:
|
||||
pass
|
||||
try:
|
||||
with os.scandir(directory) as entries:
|
||||
for entry in entries:
|
||||
if is_tmp_file(entry.name):
|
||||
# Delete temp file or directory
|
||||
if entry.is_dir(follow_symlinks=False):
|
||||
import shutil
|
||||
shutil.rmtree(entry.path, ignore_errors=True)
|
||||
else:
|
||||
try:
|
||||
os.unlink(entry.path)
|
||||
except PermissionError:
|
||||
# Another process is reading/writing
|
||||
pass
|
||||
except FileNotFoundError:
|
||||
# Another process removed current file while iterating
|
||||
pass
|
||||
except:
|
||||
pass
|
||||
else:
|
||||
if entry.is_dir(follow_symlinks=False):
|
||||
# Normal directory
|
||||
if recursive:
|
||||
atomic_failure_cleanup(entry.path, recursive=True)
|
||||
# Normal file
|
||||
# else:
|
||||
# pass
|
||||
except FileNotFoundError:
|
||||
# directory to clean up does not exist, no need to clean up
|
||||
pass
|
||||
|
Loading…
x
Reference in New Issue
Block a user