You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							58 lines
						
					
					
						
							1.9 KiB
						
					
					
				
			
		
		
	
	
							58 lines
						
					
					
						
							1.9 KiB
						
					
					
				import io
 | 
						|
import os
 | 
						|
import tempfile
 | 
						|
import contextlib
 | 
						|
import zstandard as zstd
 | 
						|
 | 
						|
LOG_COMPRESSION_LEVEL = 10 # little benefit up to level 15. level ~17 is a small step change
 | 
						|
 | 
						|
 | 
						|
class CallbackReader:
 | 
						|
  """Wraps a file, but overrides the read method to also
 | 
						|
  call a callback function with the number of bytes read so far."""
 | 
						|
  def __init__(self, f, callback, *args):
 | 
						|
    self.f = f
 | 
						|
    self.callback = callback
 | 
						|
    self.cb_args = args
 | 
						|
    self.total_read = 0
 | 
						|
 | 
						|
  def __getattr__(self, attr):
 | 
						|
    return getattr(self.f, attr)
 | 
						|
 | 
						|
  def read(self, *args, **kwargs):
 | 
						|
    chunk = self.f.read(*args, **kwargs)
 | 
						|
    self.total_read += len(chunk)
 | 
						|
    self.callback(*self.cb_args, self.total_read)
 | 
						|
    return chunk
 | 
						|
 | 
						|
 | 
						|
@contextlib.contextmanager
 | 
						|
def atomic_write_in_dir(path: str, mode: str = 'w', buffering: int = -1, encoding: str = None, newline: str = None,
 | 
						|
                        overwrite: bool = False):
 | 
						|
  """Write to a file atomically using a temporary file in the same directory as the destination file."""
 | 
						|
  dir_name = os.path.dirname(path)
 | 
						|
 | 
						|
  if not overwrite and os.path.exists(path):
 | 
						|
    raise FileExistsError(f"File '{path}' already exists. To overwrite it, set 'overwrite' to True.")
 | 
						|
 | 
						|
  with tempfile.NamedTemporaryFile(mode=mode, buffering=buffering, encoding=encoding, newline=newline, dir=dir_name, delete=False) as tmp_file:
 | 
						|
    yield tmp_file
 | 
						|
    tmp_file_name = tmp_file.name
 | 
						|
  os.replace(tmp_file_name, path)
 | 
						|
 | 
						|
 | 
						|
def get_upload_stream(filepath: str, should_compress: bool) -> tuple[io.BufferedIOBase, int]:
 | 
						|
  if not should_compress:
 | 
						|
    file_size = os.path.getsize(filepath)
 | 
						|
    file_stream = open(filepath, "rb")
 | 
						|
    return file_stream, file_size
 | 
						|
 | 
						|
  # Compress the file on the fly
 | 
						|
  compressed_stream = io.BytesIO()
 | 
						|
  compressor = zstd.ZstdCompressor(level=LOG_COMPRESSION_LEVEL)
 | 
						|
 | 
						|
  with open(filepath, "rb") as f:
 | 
						|
    compressor.copy_stream(f, compressed_stream)
 | 
						|
    compressed_size = compressed_stream.tell()
 | 
						|
    compressed_stream.seek(0)
 | 
						|
    return compressed_stream, compressed_size
 | 
						|
 |