class FtpTarget(_Target): """Represents a synchronization target on an FTP server. Attributes: path (str): Current working directory on FTP server. ftp (FTP): Instance of ftplib.FTP. host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): """ DEFAULT_BLOCKSIZE = 8 * 1024 # ftplib uses 8k chunks by default MAX_SPOOL_MEM = 100 * 1024 # keep open_readable() buffer in memory if smaller than 100kB def __init__(self, path, host, port=0, username=None, password=None, tls=False, timeout=None, extra_opts=None): """Create FTP target with host, initial path, optional credentials and options. Args: path (str): root path on FTP server, relative to *host* host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): tls (bool): encrypt the connection using TLS (Python 2.7/3.2+) timeout (int): the timeout to set against the ftp socket (seconds) extra_opts (dict): """ path = path or "/" super(FtpTarget, self).__init__(path, extra_opts) if tls: try: self.ftp = ftplib.FTP_TLS() except AttributeError: write("Python 2.7/3.2+ required for FTPS (TLS).") raise else: self.ftp = ftplib.FTP() self.ftp.set_debuglevel(self.get_option("ftp_debug", 0)) self.host = host self.port = port or 0 self.username = username self.password = password self.tls = tls self.timeout = timeout #: dict: written to ftp target root folder before synchronization starts. #: set to False, if write failed. Default: None self.lock_data = None self.is_unix = None self.time_zone_ofs = None self.clock_ofs = None self.ftp_socket_connected = False self.support_set_time = False def __str__(self): return "<{} + {}>".format( self.get_base_name(), relpath_url(self.cur_dir or "/", self.root_dir)) def get_base_name(self): scheme = "ftps" if self.tls else "ftp" return "{}://{}{}".format(scheme, self.host, self.root_dir) def open(self): assert not self.ftp_socket_connected super(FtpTarget, self).open() options = self.get_options_dict() no_prompt = self.get_option("no_prompt", True) store_password = self.get_option("store_password", False) self.ftp.set_debuglevel(self.get_option("ftp_debug", 0)) # Optionally use FTP active mode (default: PASV) (issue #21) force_active = self.get_option("ftp_active", False) self.ftp.set_pasv(not force_active) if self.timeout: self.ftp.connect(self.host, self.port, self.timeout) else: # Py2.7 uses -999 as default for `timeout`, Py3 uses None self.ftp.connect(self.host, self.port) self.ftp_socket_connected = True if self.username is None or self.password is None: creds = get_credentials_for_url(self.host, options, force_user=self.username) if creds: self.username, self.password = creds while True: try: # Login (as 'anonymous' if self.username is undefined): self.ftp.login(self.username, self.password) if self.get_option("verbose", 3) >= 4: write("Login as '{}'.".format( self.username if self.username else "anonymous")) break except ftplib.error_perm as e: # If credentials were passed, but authentication fails, prompt # for new password if not e.args[0].startswith("530"): raise # error other then '530 Login incorrect' write_error("Could not login to {}@{}: {}".format( self.username, self.host, e)) if no_prompt or not self.username: raise creds = prompt_for_password(self.host, self.username) self.username, self.password = creds # Continue while-loop if self.tls: # Upgrade data connection to TLS. self.ftp.prot_p() try: self.ftp.cwd(self.root_dir) except ftplib.error_perm as e: # If credentials were passed, but authentication fails, prompt # for new password if not e.args[0].startswith("550"): raise # error other then 550 No such directory' write_error( "Could not change directory to {} ({}): missing permissions?". format(self.root_dir, e)) pwd = self.ftp.pwd() if pwd != self.root_dir: raise RuntimeError( "Unable to navigate to working directory {!r} (now at {!r})". format(self.root_dir, pwd)) self.cur_dir = pwd # self.ftp_initialized = True # Successfully authenticated: store password if store_password: save_password(self.host, self.username, self.password) # TODO: case sensitivity? # resp = self.ftp.sendcmd("system") # self.is_unix = "unix" in resp.lower() # not necessarily true, better check with r/w tests self._lock() return def close(self): if self.lock_data: self._unlock(closing=True) if self.ftp_socket_connected: try: self.ftp.quit() except (CompatConnectionError, EOFError) as e: write_error("ftp.quit() failed: {}".format(e)) self.ftp_socket_connected = False super(FtpTarget, self).close() def _lock(self, break_existing=False): """Write a special file to the target root folder.""" # write("_lock") data = {"lock_time": time.time(), "lock_holder": None} try: assert self.cur_dir == self.root_dir self.write_text(DirMetadata.LOCK_FILE_NAME, json.dumps(data)) self.lock_data = data except Exception as e: errmsg = "{}".format(e) write_error("Could not write lock file: {}".format(errmsg)) if errmsg.startswith("550") and self.ftp.passiveserver: try: self.ftp.makepasv() except Exception: write_error( "The server probably requires FTP Active mode. " "Try passing the --ftp-active option.") # Set to False, so we don't try to remove later self.lock_data = False def _unlock(self, closing=False): """Remove lock file to the target root folder. """ # write("_unlock", closing) try: if self.cur_dir != self.root_dir: if closing: write( "Changing to ftp root folder to remove lock file: {}". format(self.root_dir)) self.cwd(self.root_dir) else: write_error( "Could not remove lock file, because CWD != ftp root: {}" .format(self.cur_dir)) return if self.lock_data is False: if self.get_option("verbose", 3) >= 4: write("Skip remove lock file (was not written).") else: # direct delete, without updating metadata or checking for target access: self.ftp.delete(DirMetadata.LOCK_FILE_NAME) # self.remove_file(DirMetadata.LOCK_FILE_NAME) self.lock_data = None except Exception as e: write_error("Could not remove lock file: {}".format(e)) raise def _probe_lock_file(self, reported_mtime): """Called by get_dir""" delta = reported_mtime - self.lock_data["lock_time"] if self.get_option("verbose", 3) >= 4: write("Server time offset: {0:.2f} seconds".format(delta)) def get_id(self): return self.host + self.root_dir def cwd(self, dir_name): path = normpath_url(join_url(self.cur_dir, dir_name)) if not path.startswith(self.root_dir): # paranoic check to prevent that our sync tool goes berserk raise RuntimeError("Tried to navigate outside root %r: %r" % (self.root_dir, path)) self.ftp.cwd(dir_name) self.cur_dir = path self.cur_dir_meta = None return self.cur_dir def pwd(self): return self.ftp.pwd() def mkdir(self, dir_name): self.check_write(dir_name) self.ftp.mkd(dir_name) def _rmdir_impl(self, dir_name, keep_root_folder=False, predicate=None): # FTP does not support deletion of non-empty directories. self.check_write(dir_name) names = [] nlst_res = self.ftp.nlst(dir_name) # write("rmdir(%s): %s" % (dir_name, nlst_res)) for name in nlst_res: if "/" in name: name = os.path.basename(name) if name in (".", ".."): continue if predicate and not predicate(name): continue names.append(name) if len(names) > 0: self.ftp.cwd(dir_name) try: for name in names: try: # try to delete this as a file self.ftp.delete(name) except ftplib.all_errors as _e: write( " ftp.delete({}) failed: {}, trying rmdir()...". format(name, _e)) # assume <name> is a folder self.rmdir(name) finally: if dir_name != ".": self.ftp.cwd("..") # write("ftp.rmd(%s)..." % (dir_name, )) if not keep_root_folder: self.ftp.rmd(dir_name) return def rmdir(self, dir_name): return self._rmdir_impl(dir_name) def get_dir(self): entry_list = [] entry_map = {} local_res = { "has_meta": False } # pass local variables outside func scope def _addline(line): data, _, name = line.partition("; ") res_type = size = mtime = unique = None fields = data.split(";") # http://tools.ietf.org/html/rfc3659#page-23 # "Size" / "Modify" / "Create" / "Type" / "Unique" / "Perm" / "Lang" # / "Media-Type" / "CharSet" / os-depend-fact / local-fact for field in fields: field_name, _, field_value = field.partition("=") field_name = field_name.lower() if field_name == "type": res_type = field_value elif field_name in ("sizd", "size"): size = int(field_value) elif field_name == "modify": # Use calendar.timegm() instead of time.mktime(), because # the date was returned as UTC if "." in field_value: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S.%f")) else: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S")) elif field_name == "unique": unique = field_value entry = None if res_type == "dir": entry = DirectoryEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type == "file": if name == DirMetadata.META_FILE_NAME: # the meta-data file is silently ignored local_res["has_meta"] = True elif name == DirMetadata.LOCK_FILE_NAME and self.cur_dir == self.root_dir: # this is the root lock file. compare reported mtime with # local upload time self._probe_lock_file(mtime) else: entry = FileEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type in ("cdir", "pdir"): pass else: raise NotImplementedError( "MLSD returned unsupported type: {!r}".format(res_type)) if entry: entry_map[name] = entry entry_list.append(entry) try: self.ftp.retrlines("MLSD", _addline) except ftplib.error_perm as e: # write_error("The FTP server responded with {}".format(e)) # raises error_perm "500 Unknown command" if command is not supported if "500" in str(e.args): raise RuntimeError( "The FTP server does not support the 'MLSD' command.") raise # load stored meta data if present self.cur_dir_meta = DirMetadata(self) if local_res["has_meta"]: try: self.cur_dir_meta.read() except IncompatibleMetadataVersion: raise # this should end the script (user should pass --migrate) except Exception as e: write_error("Could not read meta info {}: {}".format( self.cur_dir_meta, e)) meta_files = self.cur_dir_meta.list # Adjust file mtime from meta-data if present missing = [] for n in meta_files: meta = meta_files[n] if n in entry_map: # We have a meta-data entry for this resource upload_time = meta.get("u", 0) if (entry_map[n].size == meta.get("s") and FileEntry._eps_compare(entry_map[n].mtime, upload_time) <= 0): # Use meta-data mtime instead of the one reported by FTP server entry_map[n].meta = meta entry_map[n].mtime = meta["m"] # entry_map[n].dt_modified = datetime.fromtimestamp(meta["m"]) else: # Discard stored meta-data if # 1. the the mtime reported by the FTP server is later # than the stored upload time (which indicates # that the file was modified directly on the server) # or # 2. the reported files size is different than the # size we stored in the meta-data if self.get_option("verbose", 3) >= 5: write( ("META: Removing outdated meta entry {}\n" + " modified after upload ({} > {}), or\n" " cur. size ({}) != meta size ({})" ).format(n, time.ctime(entry_map[n].mtime), time.ctime(upload_time), entry_map[n].size, meta.get("s"))) missing.append(n) else: # File is stored in meta-data, but no longer exists on FTP server # write("META: Removing missing meta entry %s" % n) missing.append(n) # Remove missing or invalid files from cur_dir_meta for n in missing: self.cur_dir_meta.remove(n) return entry_list def open_readable(self, name): """Open cur_dir/name for reading. Note: we read everything into a buffer that supports .read(). Args: name (str): file name, located in self.curdir Returns: file-like (must support read() method) """ # print("FTP open_readable({})".format(name)) out = SpooledTemporaryFile(max_size=self.MAX_SPOOL_MEM, mode="w+b") self.ftp.retrbinary("RETR {}".format(name), out.write, FtpTarget.DEFAULT_BLOCKSIZE) out.seek(0) return out def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): """Write file-like `fp_src` to cur_dir/name. Args: name (str): file name, located in self.curdir fp_src (file-like): must support read() method blocksize (int, optional): callback (function, optional): Called like `func(buf)` for every written chunk """ self.check_write(name) # print("FTP write_file({})".format(name), blocksize) self.ftp.storbinary("STOR {}".format(name), fp_src, blocksize, callback) # TODO: check result def copy_to_file(self, name, fp_dest, callback=None): """Write cur_dir/name to file-like `fp_dest`. Args: name (str): file name, located in self.curdir fp_dest (file-like): must support write() method callback (function, optional): Called like `func(buf)` for every written chunk """ def _write_to_file(data): # print("_write_to_file() {} bytes.".format(len(data))) fp_dest.write(data) if callback: callback(data) self.ftp.retrbinary("RETR {}".format(name), _write_to_file, FtpTarget.DEFAULT_BLOCKSIZE) def remove_file(self, name): """Remove cur_dir/name.""" self.check_write(name) # self.cur_dir_meta.remove(name) self.ftp.delete(name) self.remove_sync_info(name) def set_mtime(self, name, mtime, size): self.check_write(name) # write("META set_mtime(%s): %s" % (name, time.ctime(mtime))) # We cannot set the mtime on FTP servers, so we store this as additional # meta data in the same directory # TODO: try "SITE UTIME", "MDTM (set version)", or "SRFT" command self.cur_dir_meta.set_mtime(name, mtime, size)
class FtpTarget(_Target): """Represents a synchronization target on a FTP server. Attributes: path (str): Current working directory on FTP server. ftp (FTP): Instance of ftplib.FTP. host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): """ def __init__(self, path, host, port=0, username=None, password=None, tls=False, timeout=None, extra_opts=None): """Create FTP target with host, initial path, optional credentials and options. Args: path (str): root path on FTP server, relative to *host* host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): tls (bool): encrypt the connection using TLS (Python 2.7/3.2+) timeout (int): the timeout to set against the ftp socket (seconds) extra_opts (dict): """ path = path or "/" super(FtpTarget, self).__init__(path, extra_opts) if tls: try: self.ftp = ftplib.FTP_TLS() except AttributeError: print("Python 2.7/3.2+ required for FTPS (TLS).") raise else: self.ftp = ftplib.FTP() self.ftp.debug(self.get_option("ftp_debug", 0)) self.host = host self.port = port or 0 self.username = username self.password = password self.tls = tls self.timeout = timeout self.lock_data = None self.is_unix = None self.time_zone_ofs = None self.clock_ofs = None self.ftp_socket_connected = False self.connected = False self.support_set_time = False # if connect: # self.open() def __str__(self): return "<%s + %s>" % (self.get_base_name(), relpath_url(self.cur_dir, self.root_dir)) def get_base_name(self): scheme = "ftps" if self.tls else "ftp" return "%s://%s%s" % (scheme, self.host, self.root_dir) def open(self): assert not self.connected no_prompt = self.get_option("no_prompt", True) store_password = self.get_option("store_password", False) if self.timeout: self.ftp.connect(self.host, self.port, self.timeout) else: # Py2.7 uses -999 as default for `timeout`, Py3 uses None self.ftp.connect(self.host, self.port) self.ftp_socket_connected = True if self.username is None or self.password is None: creds = get_credentials_for_url(self.host, allow_prompt=not no_prompt) if creds: self.username, self.password = creds try: # Login (as 'anonymous' if self.username is undefined): self.ftp.login(self.username, self.password) except error_perm as e: # If credentials were passed, but authentication fails, prompt # for new password if not e.args[0].startswith("530"): raise # error other then '530 Login incorrect' print(e) if not no_prompt: self.user, self.password = prompt_for_password( self.host, self.username) self.ftp.login(self.username, self.password) if self.tls: # Upgrade data connection to TLS. self.ftp.prot_p() try: self.ftp.cwd(self.root_dir) except error_perm as e: # If credentials were passed, but authentication fails, prompt # for new password if not e.args[0].startswith("550"): raise # error other then 550 No such directory' print( "Could not change directory to %s (%s): missing permissions?" % (self.root_dir, e)) pwd = self.ftp.pwd() if pwd != self.root_dir: raise RuntimeError( "Unable to navigate to working directory %r (now at %r)" % (self.root_dir, pwd)) self.cur_dir = pwd self.connected = True # Successfully authenticated: store password if store_password: save_password(self.host, self.username, self.password) # TODO: case sensitivity? # resp = self.ftp.sendcmd("system") # self.is_unix = "unix" in resp.lower() # not necessarily true, better check with read/write tests self._lock() return def close(self): if self.connected: self._unlock(closing=True) if self.ftp_socket_connected: self.ftp.quit() self.ftp_socket_connected = False self.connected = False def _lock(self, break_existing=False): """Write a special file to the target root folder.""" data = {"lock_time": time.time(), "lock_holder": None} try: assert self.cur_dir == self.root_dir self.write_text(DirMetadata.LOCK_FILE_NAME, json.dumps(data)) self.lock_data = data except Exception as e: print("Could not write lock file: %s" % e, file=sys.stderr) def _unlock(self, closing=False): """Remove lock file to the target root folder. """ try: if self.cur_dir != self.root_dir: if closing: print( "Changing to ftp root folder to remove lock file: {}". format(self.root_dir)) self.cwd(self.root_dir) else: print( "Could not remove lock file, because CWD != ftp root: {}" .format(self.cur_dir), file=sys.stderr) return # direct delete, without updating metadata or checking for target access: self.ftp.delete(DirMetadata.LOCK_FILE_NAME) # self.remove_file(DirMetadata.LOCK_FILE_NAME) self.lock_data = None except Exception as e: print("Could not remove lock file: %s" % e, file=sys.stderr) raise def _probe_lock_file(self, reported_mtime): """Called by get_dir""" delta = reported_mtime - self.lock_data["lock_time"] if self.get_option("verbose", 2) >= 2: print("Server time offset: {0:.2f} seconds".format(delta)) def get_id(self): return self.host + self.root_dir def cwd(self, dir_name): path = normpath_url(join_url(self.cur_dir, dir_name)) if not path.startswith(self.root_dir): # paranoic check to prevent that our sync tool goes berserk raise RuntimeError("Tried to navigate outside root %r: %r" % (self.root_dir, path)) self.ftp.cwd(dir_name) self.cur_dir = path self.cur_dir_meta = None return self.cur_dir def pwd(self): return self.ftp.pwd() def mkdir(self, dir_name): self.check_write(dir_name) self.ftp.mkd(dir_name) def _rmdir_impl(self, dir_name, keep_root_folder=False, predicate=None): # FTP does not support deletion of non-empty directories. # print("rmdir(%s)" % dir_name) self.check_write(dir_name) names = self.ftp.nlst(dir_name) # print("rmdir(%s): %s" % (dir_name, names)) # Skip ftp.cwd(), if dir is empty names = [n for n in names if n not in (".", "..")] if predicate: names = [n for n in names if predicate(n)] if len(names) > 0: self.ftp.cwd(dir_name) try: for name in names: try: # try to delete this as a file self.ftp.delete(name) except ftplib.all_errors as _e: # print(" ftp.delete(%s) failed: %s, trying rmdir()..." % (name, _e)) # assume <name> is a folder self.rmdir(name) finally: if dir_name != ".": self.ftp.cwd("..") # print("ftp.rmd(%s)..." % (dir_name, )) if not keep_root_folder: self.ftp.rmd(dir_name) return def rmdir(self, dir_name): return self._rmdir_impl(dir_name) def get_dir(self): entry_list = [] entry_map = {} local_res = { "has_meta": False } # pass local variables outside func scope def _addline(line): data, _, name = line.partition("; ") res_type = size = mtime = unique = None fields = data.split(";") # http://tools.ietf.org/html/rfc3659#page-23 # "Size" / "Modify" / "Create" / "Type" / "Unique" / "Perm" / "Lang" # / "Media-Type" / "CharSet" / os-depend-fact / local-fact for field in fields: field_name, _, field_value = field.partition("=") field_name = field_name.lower() if field_name == "type": res_type = field_value elif field_name in ("sizd", "size"): size = int(field_value) elif field_name == "modify": # Use calendar.timegm() instead of time.mktime(), because # the date was returned as UTC if "." in field_value: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S.%f")) else: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S")) # print("MLSD modify: ", field_value, "mtime", mtime, "ctime", time.ctime(mtime)) elif field_name == "unique": unique = field_value entry = None if res_type == "dir": entry = DirectoryEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type == "file": if name == DirMetadata.META_FILE_NAME: # the meta-data file is silently ignored local_res["has_meta"] = True elif name == DirMetadata.LOCK_FILE_NAME and self.cur_dir == self.root_dir: # this is the root lock file. compare reported mtime with # local upload time self._probe_lock_file(mtime) elif not name in (DirMetadata.DEBUG_META_FILE_NAME, ): entry = FileEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type in ("cdir", "pdir"): pass else: raise NotImplementedError( "MLSD returned unsupported type: {!r}".format(res_type)) if entry: entry_map[name] = entry entry_list.append(entry) try: self.ftp.retrlines("MLSD", _addline) except error_perm as e: # print("The FTP server responded with {}".format(e), file=sys.stderr) # raises error_perm "500 Unknown command" if command is not supported if "500" in str(e.args): raise RuntimeError( "The FTP server does not support the 'MLSD' command.") raise # load stored meta data if present self.cur_dir_meta = DirMetadata(self) if local_res["has_meta"]: try: self.cur_dir_meta.read() except Exception as e: print("Could not read meta info {}: {}".format( self.cur_dir_meta, e), file=sys.stderr) meta_files = self.cur_dir_meta.list # Adjust file mtime from meta-data if present missing = [] for n in meta_files: meta = meta_files[n] if n in entry_map: # We have a meta-data entry for this resource upload_time = meta.get("u", 0) if (entry_map[n].size == meta.get("s") and FileEntry._eps_compare(entry_map[n].mtime, upload_time) <= 0): # Use meta-data mtime instead of the one reported by FTP server entry_map[n].meta = meta entry_map[n].mtime = meta["m"] entry_map[n].dt_modified = datetime.fromtimestamp( meta["m"]) else: # Discard stored meta-data if # 1. the the mtime reported by the FTP server is later # than the stored upload time (which indicates # that the file was modified directly on the server) # or # 2. the reported files size is different than the # size we stored in the meta-data if self.get_option("verbose", 2) >= 3: print(("META: Removing outdated meta entry %s\n" + " modified after upload (%s > %s)") % (n, time.ctime(entry_map[n].mtime), time.ctime(upload_time))) missing.append(n) else: # File is stored in meta-data, but no longer exists on FTP server # print("META: Removing missing meta entry %s" % n) missing.append(n) # Remove missing or invalid files from cur_dir_meta for n in missing: self.cur_dir_meta.remove(n) return entry_list def open_readable(self, name): """Open cur_dir/name for reading.""" out = io.BytesIO() self.ftp.retrbinary("RETR %s" % name, out.write) out.flush() out.seek(0) return out def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): self.check_write(name) self.ftp.storbinary("STOR %s" % name, fp_src, blocksize, callback) # TODO: check result def remove_file(self, name): """Remove cur_dir/name.""" self.check_write(name) # self.cur_dir_meta.remove(name) self.ftp.delete(name) self.remove_sync_info(name) def set_mtime(self, name, mtime, size): self.check_write(name) # print("META set_mtime(%s): %s" % (name, time.ctime(mtime))) # We cannot set the mtime on FTP servers, so we store this as additional # meta data in the same directory # TODO: try "SITE UTIME", "MDTM (set version)", or "SRFT" command self.cur_dir_meta.set_mtime(name, mtime, size)
class _Target(object): def __init__(self, root_dir, extra_opts): if root_dir != "/": root_dir = root_dir.rstrip("/") self.root_dir = root_dir self.extra_opts = extra_opts or {} self.readonly = False self.dry_run = False self.host = None self.synchronizer = None # Set by BaseSynchronizer.__init__() self.peer = None self.cur_dir = None self.connected = False self.save_mode = True self.case_sensitive = None # TODO: don't know yet self.time_ofs = None # TODO: see _probe_lock_file() self.support_set_time = None # Derived class knows self.cur_dir_meta = DirMetadata(self) self.meta_stack = [] def __del__(self): # TODO: http://pydev.blogspot.de/2015/01/creating-safe-cyclic-reference.html self.close() def get_base_name(self): return "%s" % self.root_dir def is_local(self): return self.synchronizer.local is self def is_unbund(self): return self.synchronizer is None def get_option(self, key, default=None): """Return option from synchronizer (possibly overridden by target extra_opts).""" if self.synchronizer: return self.extra_opts.get( key, self.synchronizer.options.get(key, default)) return self.extra_opts.get(key, default) def open(self): self.connected = True def close(self): self.connected = False def check_write(self, name): """Raise exception if writing cur_dir/name is not allowed.""" if self.readonly and name not in (DirMetadata.META_FILE_NAME, DirMetadata.LOCK_FILE_NAME): raise RuntimeError("target is read-only: %s + %s / " % (self, name)) def get_id(self): return self.root_dir def get_sync_info(self, name, key=None): """Get mtime/size when this target's current dir was last synchronized with remote.""" peer_target = self.peer if self.is_local(): info = self.cur_dir_meta.dir["peer_sync"].get(peer_target.get_id()) else: info = peer_target.cur_dir_meta.dir["peer_sync"].get(self.get_id()) if name is not None: info = info.get(name) if info else None if info and key: info = info.get(key) return info def cwd(self, dir_name): raise NotImplementedError def push_meta(self): self.meta_stack.append(self.cur_dir_meta) self.cur_dir_meta = None def pop_meta(self): self.cur_dir_meta = self.meta_stack.pop() def flush_meta(self): """Write additional meta information for current directory.""" if self.cur_dir_meta: self.cur_dir_meta.flush() def pwd(self, dir_name): raise NotImplementedError def mkdir(self, dir_name): raise NotImplementedError def rmdir(self, dir_name): """Remove cur_dir/name.""" raise NotImplementedError def get_dir(self): """Return a list of _Resource entries.""" raise NotImplementedError def walk(self, pred=None): """Iterate over all target entries recursively.""" for entry in self.get_dir(): if pred and pred(entry) is False: continue yield entry if isinstance(entry, DirectoryEntry): self.cwd(entry.name) for e in self.walk(pred): yield e self.cwd("..") return def open_readable(self, name): """Return file-like object opened in binary mode for cur_dir/name.""" raise NotImplementedError def read_text(self, name): """Read text string from cur_dir/name using open_readable().""" with self.open_readable(name) as fp: res = fp.read() # StringIO or file object # try: # res = fp.getvalue() # StringIO returned by FtpTarget # except AttributeError: # res = fp.read() # file object returned by FsTarget res = res.decode("utf8") return res def write_file(self, name, fp_src, blocksize=8192, callback=None): """Write binary data from file-like to cur_dir/name.""" raise NotImplementedError def write_text(self, name, s): """Write string data to cur_dir/name using write_file().""" buf = io.BytesIO(to_binary(s)) self.write_file(name, buf) def remove_file(self, name): """Remove cur_dir/name.""" raise NotImplementedError def set_mtime(self, name, mtime, size): raise NotImplementedError def set_sync_info(self, name, mtime, size): """Store mtime/size when this resource was last synchronized with remote.""" if not self.is_local(): return self.peer.set_sync_info(name, mtime, size) return self.cur_dir_meta.set_sync_info(name, mtime, size) def remove_sync_info(self, name): if not self.is_local(): return self.peer.remove_sync_info(name) if self.cur_dir_meta: return self.cur_dir_meta.remove(name) # print("%s.remove_sync_info(%s): nothing to do" % (self, name)) return
class FTPTarget(_Target): """Represents a synchronization target on an FTP server. Attributes: path (str): Current working directory on FTP server. ftp (FTP): Instance of ftplib.FTP. host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): """ DEFAULT_BLOCKSIZE = 8 * 1024 # ftplib uses 8k chunks by default MAX_SPOOL_MEM = ( 100 * 1024 ) # keep open_readable() buffer in memory if smaller than 100kB def __init__( self, path, host, port=0, username=None, password=None, tls=False, timeout=None, extra_opts=None, ): """Create FTP target with host, initial path, optional credentials and options. Args: path (str): root path on FTP server, relative to *host* host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): tls (bool): encrypt the connection using TLS (Python 2.7/3.2+) timeout (int): the timeout to set against the ftp socket (seconds) extra_opts (dict): """ self.encoding = _get_encoding_opt(None, extra_opts, "utf-8") # path = self.to_unicode(path) path = path or "/" assert is_native(path) super(FTPTarget, self).__init__(path, extra_opts) if tls: try: self.ftp = ftplib.FTP_TLS() except AttributeError: write("Python 2.7/3.2+ required for FTPS (TLS).") raise else: self.ftp = ftplib.FTP() self.ftp.set_debuglevel(self.get_option("ftp_debug", 0)) self.host = host self.port = port or 0 self.username = username self.password = password self.tls = tls self.timeout = timeout #: dict: written to ftp target root folder before synchronization starts. #: set to False, if write failed. Default: None self.lock_data = None self.lock_write_time = None self.feat_response = None self.syst_response = None self.is_unix = None #: True if server reports FEAT UTF8 self.support_utf8 = None #: Time difference between <local upload time> and the mtime that the server reports afterwards. #: The value is added to the 'u' time stored in meta data. #: (This is only a rough estimation, derived from the lock-file.) self.server_time_ofs = None self.ftp_socket_connected = False self.support_set_time = False # #: Optionally define an encoding for this server # encoding = self.get_option("encoding", "utf-8") # self.encoding = codecs.lookup(encoding).name # return def __str__(self): return "<{} + {}>".format( self.get_base_name(), relpath_url(self.cur_dir or "/", self.root_dir)) def get_base_name(self): scheme = "ftps" if self.tls else "ftp" return "{}://{}{}".format(scheme, self.host, self.root_dir) def open(self): assert not self.ftp_socket_connected super(FTPTarget, self).open() options = self.get_options_dict() no_prompt = self.get_option("no_prompt", True) store_password = self.get_option("store_password", False) verbose = self.get_option("verbose", 3) self.ftp.set_debuglevel(self.get_option("ftp_debug", 0)) # Optionally use FTP active mode (default: PASV) (issue #21) force_active = self.get_option("ftp_active", False) self.ftp.set_pasv(not force_active) self.ftp.connect(self.host, self.port, self.timeout) # if self.timeout: # self.ftp.connect(self.host, self.port, self.timeout) # else: # # Py2.7 uses -999 as default for `timeout`, Py3 uses None # self.ftp.connect(self.host, self.port) self.ftp_socket_connected = True if self.username is None or self.password is None: creds = get_credentials_for_url(self.host, options, force_user=self.username) if creds: self.username, self.password = creds while True: try: # Login (as 'anonymous' if self.username is undefined): self.ftp.login(self.username, self.password) if verbose >= 4: write("Login as '{}'.".format( self.username if self.username else "anonymous")) break except ftplib.error_perm as e: # If credentials were passed, but authentication fails, prompt # for new password if not e.args[0].startswith("530"): raise # error other then '530 Login incorrect' write_error("Could not login to {}@{}: {}".format( self.username, self.host, e)) if no_prompt or not self.username: raise creds = prompt_for_password(self.host, self.username) self.username, self.password = creds # Continue while-loop if self.tls: # Upgrade data connection to TLS. self.ftp.prot_p() try: self.syst_response = self.ftp.sendcmd("SYST") if verbose >= 5: write("SYST: '{}'.".format( self.syst_response.replace("\n", " "))) # self.is_unix = "unix" in resp.lower() # not necessarily true, better check with r/w tests # TODO: case sensitivity? except Exception as e: write("SYST command failed: '{}'".format(e)) try: self.feat_response = self.ftp.sendcmd("FEAT") self.support_utf8 = "UTF8" in self.feat_response if verbose >= 5: write("FEAT: '{}'.".format( self.feat_response.replace("\n", " "))) except Exception as e: write("FEAT command failed: '{}'".format(e)) if self.encoding == "utf-8": if not self.support_utf8 and verbose >= 4: write( "Server does not list utf-8 as supported feature (using it anyway).", warning=True, ) try: # Announce our wish to use UTF-8 to the server as proposed here: # See https://tools.ietf.org/html/draft-ietf-ftpext-utf-8-option-00 # Note: this RFC is inactive, expired, and failed on Strato self.ftp.sendcmd("OPTS UTF-8") if verbose >= 4: write("Sent 'OPTS UTF-8'.") except Exception as e: if verbose >= 4: write("Could not send 'OPTS UTF-8': '{}'".format(e), warning=True) try: # Announce our wish to use UTF-8 to the server as proposed here: # See https://tools.ietf.org/html/rfc2389 # https://www.cerberusftp.com/phpBB3/viewtopic.php?t=2608 # Note: this was accepted on Strato self.ftp.sendcmd("OPTS UTF8 ON") if verbose >= 4: write("Sent 'OPTS UTF8 ON'.") except Exception as e: write("Could not send 'OPTS UTF8 ON': '{}'".format(e), warning=True) if hasattr(self.ftp, "encoding"): # Python 3 encodes using latin-1 by default(!) # (In Python 2 ftp.encoding does not exist, but ascii is used) if self.encoding != codecs.lookup(self.ftp.encoding).name: write("Setting FTP encoding to {} (was {}).".format( self.encoding, self.ftp.encoding)) self.ftp.encoding = self.encoding try: self.ftp.cwd(self.root_dir) except ftplib.error_perm as e: if not e.args[0].startswith("550"): raise # error other then 550 No such directory' write_error( "Could not change directory to {} ({}): missing permissions?". format(self.root_dir, e)) pwd = self.pwd() # pwd = self.to_unicode(pwd) if pwd != self.root_dir: raise RuntimeError( "Unable to navigate to working directory {!r} (now at {!r})". format(self.root_dir, pwd)) self.cur_dir = pwd # self.ftp_initialized = True # Successfully authenticated: store password if store_password: save_password(self.host, self.username, self.password) self._lock() return def close(self): if self.lock_data: self._unlock(closing=True) if self.ftp_socket_connected: try: self.ftp.quit() except (ConnectionError, EOFError) as e: write_error("ftp.quit() failed: {}".format(e)) self.ftp_socket_connected = False super(FTPTarget, self).close() def _lock(self, break_existing=False): """Write a special file to the target root folder.""" # write("_lock") data = {"lock_time": time.time(), "lock_holder": None} try: assert self.cur_dir == self.root_dir self.write_text(DirMetadata.LOCK_FILE_NAME, json.dumps(data)) self.lock_data = data self.lock_write_time = time.time() except Exception as e: errmsg = "{}".format(e) write_error("Could not write lock file: {}".format(errmsg)) if errmsg.startswith("550") and self.ftp.passiveserver: try: self.ftp.makepasv() except Exception: write_error( "The server probably requires FTP Active mode. " "Try passing the --ftp-active option.") # Set to False, so we don't try to remove later self.lock_data = False def _unlock(self, closing=False): """Remove lock file to the target root folder.""" # write("_unlock", closing) try: if self.cur_dir != self.root_dir: if closing: write( "Changing to ftp root folder to remove lock file: {}". format(self.root_dir)) self.cwd(self.root_dir) else: write_error( "Could not remove lock file, because CWD != ftp root: {}" .format(self.cur_dir)) return if self.lock_data is False: if self.get_option("verbose", 3) >= 4: write("Skip remove lock file (was not written).") else: # direct delete, without updating metadata or checking for target access: try: self.ftp.delete(DirMetadata.LOCK_FILE_NAME) # self.remove_file(DirMetadata.LOCK_FILE_NAME) except Exception as e: # I have seen '226 Closing data connection' responses here, # probably when a previous command threw another error. # However here, 2xx response should be Ok(?): # A 226 reply code is sent by the server before closing the # data connection after successfully processing the previous client command if e.args[0][:3] == "226": write_error( "Ignoring 226 response for ftp.delete() lockfile") else: raise self.lock_data = None except Exception as e: write_error("Could not remove lock file: {}".format(e)) raise def _probe_lock_file(self, reported_mtime): """Called by get_dir""" delta = reported_mtime - self.lock_data["lock_time"] # delta2 = reported_mtime - self.lock_write_time self.server_time_ofs = delta if self.get_option("verbose", 3) >= 4: write("Server time offset: {:.2f} seconds.".format(delta)) # write("Server time offset2: {:.2f} seconds.".format(delta2)) def get_id(self): return self.host + self.root_dir def cwd(self, dir_name): assert is_native(dir_name) path = normpath_url(join_url(self.cur_dir, dir_name)) if not path.startswith(self.root_dir): # paranoic check to prevent that our sync tool goes berserk raise RuntimeError( "Tried to navigate outside root {!r}: {!r}".format( self.root_dir, path)) self.ftp.cwd(dir_name) self.cur_dir = path self.cur_dir_meta = None return self.cur_dir def pwd(self): """Return current working dir as native `str` (uses fallback-encoding).""" pwd = self._ftp_pwd() if pwd != "/": # #38 pwd = pwd.rstrip("/") return pwd def mkdir(self, dir_name): assert is_native(dir_name) self.check_write(dir_name) self.ftp.mkd(dir_name) def _rmdir_impl(self, dir_name, keep_root_folder=False, predicate=None): # FTP does not support deletion of non-empty directories. assert is_native(dir_name) self.check_write(dir_name) names = [] nlst_res = self._ftp_nlst(dir_name) # nlst_res = self.ftp.nlst(dir_name) # write("rmdir(%s): %s" % (dir_name, nlst_res)) for name in nlst_res: # name = self.re_encode_to_native(name) if "/" in name: name = os.path.basename(name) if name in (".", ".."): continue if predicate and not predicate(name): continue names.append(name) if len(names) > 0: self.ftp.cwd(dir_name) try: for name in names: try: # try to delete this as a file self.ftp.delete(name) except ftplib.all_errors as _e: write( " ftp.delete({}) failed: {}, trying rmdir()...". format(name, _e)) # assume <name> is a folder self.rmdir(name) finally: if dir_name != ".": self.ftp.cwd("..") # write("ftp.rmd(%s)..." % (dir_name, )) if not keep_root_folder: self.ftp.rmd(dir_name) return def rmdir(self, dir_name): return self._rmdir_impl(dir_name) def get_dir(self): entry_list = [] entry_map = {} local_var = { "has_meta": False } # pass local variables outside func scope encoding = self.encoding def _addline(status, line): # _ftp_retrlines_native() made sure that we always get `str` type lines assert status in (0, 1, 2) assert is_native(line) data, _, name = line.partition("; ") # print(status, name, u_name) if status == 1: write( "WARNING: File name seems not to be {}; re-encoded from CP-1252:" .format(encoding), name, ) elif status == 2: write_error("File name is neither UTF-8 nor CP-1252 encoded:", name) res_type = size = mtime = unique = None fields = data.split(";") # https://tools.ietf.org/html/rfc3659#page-23 # "Size" / "Modify" / "Create" / "Type" / "Unique" / "Perm" / "Lang" # / "Media-Type" / "CharSet" / os-depend-fact / local-fact for field in fields: field_name, _, field_value = field.partition("=") field_name = field_name.lower() if field_name == "type": res_type = field_value elif field_name in ("sizd", "size"): size = int(field_value) elif field_name == "modify": # Use calendar.timegm() instead of time.mktime(), because # the date was returned as UTC if "." in field_value: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S.%f")) else: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S")) elif field_name == "unique": unique = field_value entry = None if res_type == "dir": entry = DirectoryEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type == "file": if name == DirMetadata.META_FILE_NAME: # the meta-data file is silently ignored local_var["has_meta"] = True elif (name == DirMetadata.LOCK_FILE_NAME and self.cur_dir == self.root_dir): # this is the root lock file. compare reported mtime with # local upload time self._probe_lock_file(mtime) else: entry = FileEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type in ("cdir", "pdir"): pass else: write_error("Could not parse '{}'".format(line)) raise NotImplementedError( "MLSD returned unsupported type: {!r}".format(res_type)) if entry: entry_map[name] = entry entry_list.append(entry) try: # We use a custom wrapper here, so we can implement a codding fall back: self._ftp_retrlines_native("MLSD", _addline, encoding) # self.ftp.retrlines("MLSD", _addline) except ftplib.error_perm as e: # write_error("The FTP server responded with {}".format(e)) # raises error_perm "500 Unknown command" if command is not supported if "500" in str(e.args): raise RuntimeError( "The FTP server does not support the 'MLSD' command.") raise # load stored meta data if present self.cur_dir_meta = DirMetadata(self) if local_var["has_meta"]: try: self.cur_dir_meta.read() except IncompatibleMetadataVersion: raise # this should end the script (user should pass --migrate) except Exception as e: write_error("Could not read meta info {}: {}".format( self.cur_dir_meta, e)) meta_files = self.cur_dir_meta.list # Adjust file mtime from meta-data if present missing = [] for n in meta_files: meta = meta_files[n] if n in entry_map: # We have a meta-data entry for this resource upload_time = meta.get("u", 0) # Discard stored meta-data if # 1. the reported files size is different than the # size we stored in the meta-data # or # 2. the the mtime reported by the FTP server is later # than the stored upload time (which indicates # that the file was modified directly on the server) if entry_map[n].size != meta.get("s"): if self.get_option("verbose", 3) >= 5: write( "Removing meta entry {} (size changed from {} to {})." .format(n, entry_map[n].size, meta.get("s"))) missing.append(n) elif (entry_map[n].mtime - upload_time) > self.mtime_compare_eps: if self.get_option("verbose", 3) >= 5: write("Removing meta entry {} (modified {} > {}).". format( n, time.ctime(entry_map[n].mtime), time.ctime(upload_time), )) missing.append(n) else: # Use meta-data mtime instead of the one reported by FTP server entry_map[n].meta = meta entry_map[n].mtime = meta["m"] else: # File is stored in meta-data, but no longer exists on FTP server # write("META: Removing missing meta entry %s" % n) missing.append(n) # Remove missing or invalid files from cur_dir_meta for n in missing: self.cur_dir_meta.remove(n) return entry_list def open_readable(self, name): """Open cur_dir/name for reading. Note: we read everything into a buffer that supports .read(). Args: name (str): file name, located in self.curdir Returns: file-like (must support read() method) """ # print("FTP open_readable({})".format(name)) assert is_native(name) out = SpooledTemporaryFile(max_size=self.MAX_SPOOL_MEM, mode="w+b") self.ftp.retrbinary("RETR {}".format(name), out.write, FTPTarget.DEFAULT_BLOCKSIZE) out.seek(0) return out def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): """Write file-like `fp_src` to cur_dir/name. Args: name (str): file name, located in self.curdir fp_src (file-like): must support read() method blocksize (int, optional): callback (function, optional): Called like `func(buf)` for every written chunk """ # print("FTP write_file({})".format(name), blocksize) assert is_native(name) self.check_write(name) self.ftp.storbinary("STOR {}".format(name), fp_src, blocksize, callback) # TODO: check result def copy_to_file(self, name, fp_dest, callback=None): """Write cur_dir/name to file-like `fp_dest`. Args: name (str): file name, located in self.curdir fp_dest (file-like): must support write() method callback (function, optional): Called like `func(buf)` for every written chunk """ assert is_native(name) def _write_to_file(data): # print("_write_to_file() {} bytes.".format(len(data))) fp_dest.write(data) if callback: callback(data) self.ftp.retrbinary("RETR {}".format(name), _write_to_file, FTPTarget.DEFAULT_BLOCKSIZE) def remove_file(self, name): """Remove cur_dir/name.""" assert is_native(name) self.check_write(name) # self.cur_dir_meta.remove(name) self.ftp.delete(name) self.remove_sync_info(name) def set_mtime(self, name, mtime, size): assert is_native(name) self.check_write(name) # write("META set_mtime(%s): %s" % (name, time.ctime(mtime))) # We cannot set the mtime on FTP servers, so we store this as additional # meta data in the same directory # TODO: try "SITE UTIME", "MDTM (set version)", or "SRFT" command self.cur_dir_meta.set_mtime(name, mtime, size) def _ftp_pwd(self): """Variant of `self.ftp.pwd()` that supports encoding-fallback. Returns: Current working directory as native string. """ try: return self.ftp.pwd() except UnicodeEncodeError: if self.ftp.encoding != "utf-8": raise # should not happen, since Py2 does not try to encode # TODO: this is NOT THREAD-SAFE! prev_encoding = self.ftp.encoding try: write("ftp.pwd() failed with utf-8: trying Cp1252...", warning=True) return self.ftp.pwd() finally: self.ftp.encoding = prev_encoding def _ftp_nlst(self, dir_name): """Variant of `self.ftp.nlst()` that supports encoding-fallback.""" assert is_native(dir_name) lines = [] def _add_line(status, line): lines.append(line) cmd = "NLST " + dir_name self._ftp_retrlines_native(cmd, _add_line, self.encoding) # print(cmd, lines) return lines def _ftp_retrlines_native(self, command, callback, encoding): """A re-implementation of ftp.retrlines that returns lines as native `str`. This is needed on Python 3, where `ftp.retrlines()` returns unicode `str` by decoding the incoming command response using `ftp.encoding`. This would fail for the whole request if a single line of the MLSD listing cannot be decoded. FTPTarget wants to fall back to Cp1252 if UTF-8 fails for a single line, so we need to process the raw original binary input lines. On Python 2, the response is already bytes, but we try to decode in order to check validity and optionally re-encode from Cp1252. Args: command (str): A valid FTP command like 'NLST', 'MLSD', ... callback (function): Called for every line with these args: status (int): 0:ok 1:fallback used, 2:decode failed line (str): result line decoded using `encoding`. If `encoding` is 'utf-8', a fallback to cp1252 is accepted. encoding (str): Coding that is used to convert the FTP response to `str`. Returns: None """ LF = b"\n" # noqa N806 buffer = b"" # needed to access buffer accross function scope local_var = {"buffer": buffer} fallback_enc = "cp1252" if encoding == "utf-8" else None def _on_read_line(line): # Line is a byte string # print(" line ", line) status = 2 # fault line_decoded = None try: line_decoded = line.decode(encoding) status = 0 # successfully decoded except UnicodeDecodeError: if fallback_enc: try: line_decoded = line.decode(fallback_enc) status = 1 # used fallback encoding except UnicodeDecodeError: raise # if compat.PY2: # # line is a native binary `str`. # if status == 1: # # We used a fallback: re-encode # callback(status, line_decoded.encode(encoding)) # else: # callback(status, line) # else: # line_decoded is a native text `str`. callback(status, line_decoded) # on_read_line = _on_read_line_py2 if compat.PY2 else _on_read_line_py3 def _on_read_chunk(chunk): buffer = local_var["buffer"] # Normalize line endings chunk = chunk.replace(b"\r\n", LF) chunk = chunk.replace(b"\r", LF) chunk = buffer + chunk try: # print("Add chunk ", chunk, "to buffer", buffer) while True: item, chunk = chunk.split(LF, 1) _on_read_line(item) # + LF) except ValueError: pass # print("Rest chunk", chunk) local_var["buffer"] = chunk self.ftp.retrbinary(command, _on_read_chunk) if buffer: _on_read_line(buffer) return
class _Target: """Base class for :class:`FsTarget`, :class:`FTPTarget`, etc.""" DEFAULT_BLOCKSIZE = 16 * 1024 # shutil.copyobj() uses 16k blocks by default def __init__(self, root_dir, extra_opts): # All internal paths should use unicode. # (We cannot convert here, since we don't know the target encoding.) assert is_native(root_dir) if root_dir != "/": root_dir = root_dir.rstrip("/") # This target is not thread safe self._rlock = threading.RLock() #: The target's top-level folder self.root_dir = root_dir self.extra_opts = extra_opts or {} self.readonly = False self.dry_run = False self.host = None self.synchronizer = None # Set by BaseSynchronizer.__init__() self.peer = None self.cur_dir = None self.connected = False self.save_mode = True self.case_sensitive = None # TODO: don't know yet #: Time difference between <local upload time> and the mtime that the server reports afterwards. #: The value is added to the 'u' time stored in meta data. #: (This is only a rough estimation, derived from the lock-file.) self.server_time_ofs = None #: Maximum allowed difference between a reported mtime and the last known update time, #: before we classify the entry as 'modified externally' self.mtime_compare_eps = FileEntry.EPS_TIME self.cur_dir_meta = DirMetadata(self) self.meta_stack = [] # Optionally define an encoding for this target, but don't override # derived class's setting if not hasattr(self, "encoding"): #: Assumed encoding for this target. Used to decode binary paths. self.encoding = _get_encoding_opt(None, extra_opts, None) return def __del__(self): # TODO: http://pydev.blogspot.de/2015/01/creating-safe-cyclic-reference.html if self.connected: self.close() # def __enter__(self): # self.open() # return self # def __exit__(self, exc_type, exc_value, traceback): # self.close() def get_base_name(self): return "{}".format(self.root_dir) def is_local(self): return self.synchronizer.local is self def is_unbound(self): return self.synchronizer is None def get_options_dict(self): """Return options from synchronizer (possibly overridden by own extra_opts).""" d = self.synchronizer.options if self.synchronizer else {} d.update(self.extra_opts) return d def get_option(self, key, default=None): """Return option from synchronizer (possibly overridden by target extra_opts).""" if self.synchronizer: return self.extra_opts.get( key, self.synchronizer.options.get(key, default)) return self.extra_opts.get(key, default) def open(self): if self.connected: raise RuntimeError("Target already open: {}. ".format(self)) # Not thread safe (issue #20) if not self._rlock.acquire(False): raise RuntimeError("Could not acquire _Target lock on open") self.connected = True def close(self): if not self.connected: return if self.get_option("verbose", 3) >= 5: write("Closing target {}.".format(self)) self.connected = False self.readonly = False # issue #20 self._rlock.release() def check_write(self, name): """Raise exception if writing cur_dir/name is not allowed.""" assert is_native(name) if self.readonly and name not in ( DirMetadata.META_FILE_NAME, DirMetadata.LOCK_FILE_NAME, ): raise RuntimeError("Target is read-only: {} + {} / ".format( self, name)) def get_id(self): return self.root_dir def get_sync_info(self, name, key=None): """Get mtime/size when this target's current dir was last synchronized with remote.""" peer_target = self.peer if self.is_local(): info = self.cur_dir_meta.dir["peer_sync"].get(peer_target.get_id()) else: info = peer_target.cur_dir_meta.dir["peer_sync"].get(self.get_id()) if name is not None: info = info.get(name) if info else None if info and key: info = info.get(key) return info def cwd(self, dir_name): raise NotImplementedError @contextlib.contextmanager def enter_subdir(self, name): """Temporarily changes the working directory to `name`. Examples: with target.enter_subdir(folder): ... """ self.cwd(name) yield self.cwd("..") def push_meta(self): self.meta_stack.append(self.cur_dir_meta) self.cur_dir_meta = None def pop_meta(self): self.cur_dir_meta = self.meta_stack.pop() def flush_meta(self): """Write additional meta information for current directory.""" if self.cur_dir_meta: self.cur_dir_meta.flush() def pwd(self, dir_name): raise NotImplementedError def mkdir(self, dir_name): raise NotImplementedError def rmdir(self, dir_name): """Remove cur_dir/name.""" raise NotImplementedError def get_dir(self): """Return a list of _Resource entries.""" raise NotImplementedError def walk(self, pred=None, recursive=True): """Iterate over all target entries recursively. Args: pred (function, optional): Callback(:class:`ftpsync.resources._Resource`) should return `False` to ignore entry. Default: `None`. recursive (bool, optional): Pass `False` to generate top level entries only. Default: `True`. Yields: :class:`ftpsync.resources._Resource` """ for entry in self.get_dir(): if pred and pred(entry) is False: continue yield entry if recursive: if isinstance(entry, DirectoryEntry): self.cwd(entry.name) for e in self.walk(pred): yield e self.cwd("..") return def walk_tree(self, sort=True, files=False, pred=None, _prefixes=None): """Iterate over target hierarchy, depth-first, adding a connector prefix. This iterator walks the tree nodes, but slightly delays the output, in order to add information if a node is the *last* sibling. This information is then used to create pretty tree connector prefixes. Args: sort (bool): files (bool): pred (function, optional): Callback(:class:`ftpsync.resources._Resource`) should return `False` to ignore entry. Default: `None`. Yields: 3-tuple ( :class:`ftpsync.resources._Resource`, is_last_sibling, prefix, ) A +- a | +- 1 | | `- 1.1 | `- 2 | `- 2.1 `- b +- 1 | `- 1.1 ` 2 """ # List of parent's `is_last` flags: if _prefixes is None: _prefixes = [] def _yield_entry(entry, is_last): path = "".join([" " if last else " | " for last in _prefixes]) path += " `- " if is_last else " +- " yield path, entry if entry.is_dir(): with self.enter_subdir(entry.name): _prefixes.append(is_last) yield from self.walk_tree(sort, files, pred, _prefixes) _prefixes.pop() return dir_list = self.get_dir() if not files: dir_list = [entry for entry in dir_list if entry.is_dir()] if sort: # Sort by name, files first dir_list.sort( key=lambda entry: (entry.is_dir(), entry.name.lower())) prev_entry = None for next_entry in dir_list: if pred and pred(next_entry) is False: continue # Skip first entry if prev_entry is None: prev_entry = next_entry continue # Yield entry (this is never the last sibling) yield from _yield_entry(prev_entry, False) prev_entry = next_entry # Finally yield the last sibling if prev_entry: yield from _yield_entry(prev_entry, True) return def open_readable(self, name): """Return file-like object opened in binary mode for cur_dir/name.""" raise NotImplementedError def open_writable(self, name): """Return file-like object opened in binary mode for cur_dir/name.""" raise NotImplementedError def read_text(self, name): """Read text string from cur_dir/name using open_readable().""" with self.open_readable(name) as fp: res = fp.read() # StringIO or file object # try: # res = fp.getvalue() # StringIO returned by FTPTarget # except AttributeError: # res = fp.read() # file object returned by FsTarget res = res.decode("utf-8") return res def copy_to_file(self, name, fp_dest, callback=None): """Write cur_dir/name to file-like `fp_dest`. Args: name (str): file name, located in self.curdir fp_dest (file-like): must support write() method callback (function, optional): Called like `func(buf)` for every written chunk """ raise NotImplementedError def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): """Write binary data from file-like to cur_dir/name.""" raise NotImplementedError def write_text(self, name, s): """Write string data to cur_dir/name using write_file().""" buf = io.BytesIO(to_bytes(s)) self.write_file(name, buf) def remove_file(self, name): """Remove cur_dir/name.""" raise NotImplementedError def set_mtime(self, name, mtime, size): raise NotImplementedError def set_sync_info(self, name, mtime, size): """Store mtime/size when this resource was last synchronized with remote.""" if not self.is_local(): return self.peer.set_sync_info(name, mtime, size) return self.cur_dir_meta.set_sync_info(name, mtime, size) def remove_sync_info(self, name): if not self.is_local(): return self.peer.remove_sync_info(name) if self.cur_dir_meta: return self.cur_dir_meta.remove(name) # write("%s.remove_sync_info(%s): nothing to do" % (self, name)) return
class FtpTarget(_Target): """Represents a synchronization target on an FTP server. Attributes: path (str): Current working directory on FTP server. ftp (FTP): Instance of ftplib.FTP. host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): """ DEFAULT_BLOCKSIZE = 8 * 1024 # ftplib uses 8k chunks by default MAX_SPOOL_MEM = ( 100 * 1024 ) # keep open_readable() buffer in memory if smaller than 100kB def __init__( self, path, host, port=0, username=None, password=None, tls=False, timeout=None, extra_opts=None, ): """Create FTP target with host, initial path, optional credentials and options. Args: path (str): root path on FTP server, relative to *host* host (str): hostname of FTP server port (int): FTP port (defaults to 21) username (str): password (str): tls (bool): encrypt the connection using TLS (Python 2.7/3.2+) timeout (int): the timeout to set against the ftp socket (seconds) extra_opts (dict): """ self.encoding = _get_encoding_opt(None, extra_opts, "utf-8") # path = self.to_unicode(path) path = path or "/" assert compat.is_native(path) super(FtpTarget, self).__init__(path, extra_opts) if tls: try: self.ftp = ftplib.FTP_TLS() except AttributeError: write("Python 2.7/3.2+ required for FTPS (TLS).") raise else: self.ftp = ftplib.FTP() self.ftp.set_debuglevel(self.get_option("ftp_debug", 0)) self.host = host self.port = port or 0 self.username = username self.password = password self.tls = tls self.timeout = timeout #: dict: written to ftp target root folder before synchronization starts. #: set to False, if write failed. Default: None self.lock_data = None self.lock_write_time = None self.feat_response = None self.syst_response = None self.is_unix = None #: True if server reports FEAT UTF8 self.support_utf8 = None #: Time difference between <local upload time> and the mtime that the server reports afterwards. #: The value is added to the 'u' time stored in meta data. #: (This is only a rough estimation, derived from the lock-file.) self.server_time_ofs = None self.ftp_socket_connected = False self.support_set_time = False # #: Optionally define an encoding for this server # encoding = self.get_option("encoding", "utf-8") # self.encoding = codecs.lookup(encoding).name # return def __str__(self): return "<{} + {}>".format( self.get_base_name(), relpath_url(self.cur_dir or "/", self.root_dir) ) def get_base_name(self): scheme = "ftps" if self.tls else "ftp" return "{}://{}{}".format(scheme, self.host, self.root_dir) def open(self): assert not self.ftp_socket_connected super(FtpTarget, self).open() options = self.get_options_dict() no_prompt = self.get_option("no_prompt", True) store_password = self.get_option("store_password", False) verbose = self.get_option("verbose", 3) self.ftp.set_debuglevel(self.get_option("ftp_debug", 0)) # Optionally use FTP active mode (default: PASV) (issue #21) force_active = self.get_option("ftp_active", False) self.ftp.set_pasv(not force_active) if self.timeout: self.ftp.connect(self.host, self.port, self.timeout) else: # Py2.7 uses -999 as default for `timeout`, Py3 uses None self.ftp.connect(self.host, self.port) self.ftp_socket_connected = True if self.username is None or self.password is None: creds = get_credentials_for_url( self.host, options, force_user=self.username ) if creds: self.username, self.password = creds while True: try: # Login (as 'anonymous' if self.username is undefined): self.ftp.login(self.username, self.password) if verbose >= 4: write( "Login as '{}'.".format( self.username if self.username else "anonymous" ) ) break except ftplib.error_perm as e: # If credentials were passed, but authentication fails, prompt # for new password if not e.args[0].startswith("530"): raise # error other then '530 Login incorrect' write_error( "Could not login to {}@{}: {}".format(self.username, self.host, e) ) if no_prompt or not self.username: raise creds = prompt_for_password(self.host, self.username) self.username, self.password = creds # Continue while-loop if self.tls: # Upgrade data connection to TLS. self.ftp.prot_p() try: self.syst_response = self.ftp.sendcmd("SYST") if verbose >= 5: write("SYST: '{}'.".format(self.syst_response.replace("\n", " "))) # self.is_unix = "unix" in resp.lower() # not necessarily true, better check with r/w tests # TODO: case sensitivity? except Exception as e: write("SYST command failed: '{}'".format(e)) try: self.feat_response = self.ftp.sendcmd("FEAT") self.support_utf8 = "UTF8" in self.feat_response if verbose >= 5: write("FEAT: '{}'.".format(self.feat_response.replace("\n", " "))) except Exception as e: write("FEAT command failed: '{}'".format(e)) if self.encoding == "utf-8": if not self.support_utf8 and verbose >= 4: write( "Server does not list utf-8 as supported feature (using it anyway).", warning=True, ) try: # Announce our wish to use UTF-8 to the server as proposed here: # See https://tools.ietf.org/html/draft-ietf-ftpext-utf-8-option-00 # Note: this RFC is inactive, expired, and failed on Strato self.ftp.sendcmd("OPTS UTF-8") if verbose >= 4: write("Sent 'OPTS UTF-8'.") except Exception as e: if verbose >= 4: write("Could not send 'OPTS UTF-8': '{}'".format(e), warning=True) try: # Announce our wish to use UTF-8 to the server as proposed here: # See https://tools.ietf.org/html/rfc2389 # https://www.cerberusftp.com/phpBB3/viewtopic.php?t=2608 # Note: this was accepted on Strato self.ftp.sendcmd("OPTS UTF8 ON") if verbose >= 4: write("Sent 'OPTS UTF8 ON'.") except Exception as e: write("Could not send 'OPTS UTF8 ON': '{}'".format(e), warning=True) if hasattr(self.ftp, "encoding"): # Python 3 encodes using latin-1 by default(!) # (In Python 2 ftp.encoding does not exist, but ascii is used) if self.encoding != codecs.lookup(self.ftp.encoding).name: write( "Setting FTP encoding to {} (was {}).".format( self.encoding, self.ftp.encoding ) ) self.ftp.encoding = self.encoding try: self.ftp.cwd(self.root_dir) except ftplib.error_perm as e: if not e.args[0].startswith("550"): raise # error other then 550 No such directory' write_error( "Could not change directory to {} ({}): missing permissions?".format( self.root_dir, e ) ) pwd = self.pwd() # pwd = self.to_unicode(pwd) if pwd != self.root_dir: raise RuntimeError( "Unable to navigate to working directory {!r} (now at {!r})".format( self.root_dir, pwd ) ) self.cur_dir = pwd # self.ftp_initialized = True # Successfully authenticated: store password if store_password: save_password(self.host, self.username, self.password) self._lock() return def close(self): if self.lock_data: self._unlock(closing=True) if self.ftp_socket_connected: try: self.ftp.quit() except (CompatConnectionError, EOFError) as e: write_error("ftp.quit() failed: {}".format(e)) self.ftp_socket_connected = False super(FtpTarget, self).close() def _lock(self, break_existing=False): """Write a special file to the target root folder.""" # write("_lock") data = {"lock_time": time.time(), "lock_holder": None} try: assert self.cur_dir == self.root_dir self.write_text(DirMetadata.LOCK_FILE_NAME, json.dumps(data)) self.lock_data = data self.lock_write_time = time.time() except Exception as e: errmsg = "{}".format(e) write_error("Could not write lock file: {}".format(errmsg)) if errmsg.startswith("550") and self.ftp.passiveserver: try: self.ftp.makepasv() except Exception: write_error( "The server probably requires FTP Active mode. " "Try passing the --ftp-active option." ) # Set to False, so we don't try to remove later self.lock_data = False def _unlock(self, closing=False): """Remove lock file to the target root folder. """ # write("_unlock", closing) try: if self.cur_dir != self.root_dir: if closing: write( "Changing to ftp root folder to remove lock file: {}".format( self.root_dir ) ) self.cwd(self.root_dir) else: write_error( "Could not remove lock file, because CWD != ftp root: {}".format( self.cur_dir ) ) return if self.lock_data is False: if self.get_option("verbose", 3) >= 4: write("Skip remove lock file (was not written).") else: # direct delete, without updating metadata or checking for target access: try: self.ftp.delete(DirMetadata.LOCK_FILE_NAME) # self.remove_file(DirMetadata.LOCK_FILE_NAME) except Exception as e: # I have seen '226 Closing data connection' responses here, # probably when a previous command threw another error. # However here, 2xx response should be Ok(?): # A 226 reply code is sent by the server before closing the # data connection after successfully processing the previous client command if e.args[0][:3] == "226": write_error("Ignoring 226 response for ftp.delete() lockfile") else: raise self.lock_data = None except Exception as e: write_error("Could not remove lock file: {}".format(e)) raise def _probe_lock_file(self, reported_mtime): """Called by get_dir""" delta = reported_mtime - self.lock_data["lock_time"] # delta2 = reported_mtime - self.lock_write_time self.server_time_ofs = delta if self.get_option("verbose", 3) >= 4: write("Server time offset: {:.2f} seconds.".format(delta)) # write("Server time offset2: {:.2f} seconds.".format(delta2)) def get_id(self): return self.host + self.root_dir def cwd(self, dir_name): assert compat.is_native(dir_name) path = normpath_url(join_url(self.cur_dir, dir_name)) if not path.startswith(self.root_dir): # paranoic check to prevent that our sync tool goes berserk raise RuntimeError( "Tried to navigate outside root %r: %r" % (self.root_dir, path) ) self.ftp.cwd(dir_name) self.cur_dir = path self.cur_dir_meta = None return self.cur_dir def pwd(self): """Return current working dir as native `str` (uses fallback-encoding).""" return self._ftp_pwd() # return self.ftp.pwd() def mkdir(self, dir_name): assert compat.is_native(dir_name) self.check_write(dir_name) self.ftp.mkd(dir_name) def _rmdir_impl(self, dir_name, keep_root_folder=False, predicate=None): # FTP does not support deletion of non-empty directories. assert compat.is_native(dir_name) self.check_write(dir_name) names = [] nlst_res = self._ftp_nlst(dir_name) # nlst_res = self.ftp.nlst(dir_name) # write("rmdir(%s): %s" % (dir_name, nlst_res)) for name in nlst_res: # name = self.re_encode_to_native(name) if "/" in name: name = os.path.basename(name) if name in (".", ".."): continue if predicate and not predicate(name): continue names.append(name) if len(names) > 0: self.ftp.cwd(dir_name) try: for name in names: try: # try to delete this as a file self.ftp.delete(name) except ftplib.all_errors as _e: write( " ftp.delete({}) failed: {}, trying rmdir()...".format( name, _e ) ) # assume <name> is a folder self.rmdir(name) finally: if dir_name != ".": self.ftp.cwd("..") # write("ftp.rmd(%s)..." % (dir_name, )) if not keep_root_folder: self.ftp.rmd(dir_name) return def rmdir(self, dir_name): return self._rmdir_impl(dir_name) def get_dir(self): entry_list = [] entry_map = {} local_var = {"has_meta": False} # pass local variables outside func scope encoding = self.encoding def _addline(status, line): # _ftp_retrlines_native() made sure that we always get `str` type lines assert status in (0, 1, 2) assert compat.is_native(line) data, _, name = line.partition("; ") # print(status, name, u_name) if status == 1: write( "WARNING: File name seems not to be {}; re-encoded from CP-1252:".format( encoding ), name, ) elif status == 2: write_error("File name is neither UTF-8 nor CP-1252 encoded:", name) res_type = size = mtime = unique = None fields = data.split(";") # https://tools.ietf.org/html/rfc3659#page-23 # "Size" / "Modify" / "Create" / "Type" / "Unique" / "Perm" / "Lang" # / "Media-Type" / "CharSet" / os-depend-fact / local-fact for field in fields: field_name, _, field_value = field.partition("=") field_name = field_name.lower() if field_name == "type": res_type = field_value elif field_name in ("sizd", "size"): size = int(field_value) elif field_name == "modify": # Use calendar.timegm() instead of time.mktime(), because # the date was returned as UTC if "." in field_value: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S.%f") ) else: mtime = calendar.timegm( time.strptime(field_value, "%Y%m%d%H%M%S") ) elif field_name == "unique": unique = field_value entry = None if res_type == "dir": entry = DirectoryEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type == "file": if name == DirMetadata.META_FILE_NAME: # the meta-data file is silently ignored local_var["has_meta"] = True elif ( name == DirMetadata.LOCK_FILE_NAME and self.cur_dir == self.root_dir ): # this is the root lock file. compare reported mtime with # local upload time self._probe_lock_file(mtime) else: entry = FileEntry(self, self.cur_dir, name, size, mtime, unique) elif res_type in ("cdir", "pdir"): pass else: write_error("Could not parse '{}'".format(line)) raise NotImplementedError( "MLSD returned unsupported type: {!r}".format(res_type) ) if entry: entry_map[name] = entry entry_list.append(entry) try: # We use a custom wrapper here, so we can implement a codding fall back: self._ftp_retrlines_native("MLSD", _addline, encoding) # self.ftp.retrlines("MLSD", _addline) except ftplib.error_perm as e: # write_error("The FTP server responded with {}".format(e)) # raises error_perm "500 Unknown command" if command is not supported if "500" in str(e.args): raise RuntimeError( "The FTP server does not support the 'MLSD' command." ) raise # load stored meta data if present self.cur_dir_meta = DirMetadata(self) if local_var["has_meta"]: try: self.cur_dir_meta.read() except IncompatibleMetadataVersion: raise # this should end the script (user should pass --migrate) except Exception as e: write_error( "Could not read meta info {}: {}".format(self.cur_dir_meta, e) ) meta_files = self.cur_dir_meta.list # Adjust file mtime from meta-data if present missing = [] for n in meta_files: meta = meta_files[n] if n in entry_map: # We have a meta-data entry for this resource upload_time = meta.get("u", 0) # Discard stored meta-data if # 1. the reported files size is different than the # size we stored in the meta-data # or # 2. the the mtime reported by the FTP server is later # than the stored upload time (which indicates # that the file was modified directly on the server) if entry_map[n].size != meta.get("s"): if self.get_option("verbose", 3) >= 5: write( "Removing meta entry {} (size changed from {} to {}).".format( n, entry_map[n].size, meta.get("s") ) ) missing.append(n) elif (entry_map[n].mtime - upload_time) > self.mtime_compare_eps: if self.get_option("verbose", 3) >= 5: write( "Removing meta entry {} (modified {} > {}).".format( n, time.ctime(entry_map[n].mtime), time.ctime(upload_time), ) ) missing.append(n) else: # Use meta-data mtime instead of the one reported by FTP server entry_map[n].meta = meta entry_map[n].mtime = meta["m"] else: # File is stored in meta-data, but no longer exists on FTP server # write("META: Removing missing meta entry %s" % n) missing.append(n) # Remove missing or invalid files from cur_dir_meta for n in missing: self.cur_dir_meta.remove(n) return entry_list def open_readable(self, name): """Open cur_dir/name for reading. Note: we read everything into a buffer that supports .read(). Args: name (str): file name, located in self.curdir Returns: file-like (must support read() method) """ # print("FTP open_readable({})".format(name)) assert compat.is_native(name) out = SpooledTemporaryFile(max_size=self.MAX_SPOOL_MEM, mode="w+b") self.ftp.retrbinary( "RETR {}".format(name), out.write, FtpTarget.DEFAULT_BLOCKSIZE ) out.seek(0) return out def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): """Write file-like `fp_src` to cur_dir/name. Args: name (str): file name, located in self.curdir fp_src (file-like): must support read() method blocksize (int, optional): callback (function, optional): Called like `func(buf)` for every written chunk """ # print("FTP write_file({})".format(name), blocksize) assert compat.is_native(name) self.check_write(name) self.ftp.storbinary("STOR {}".format(name), fp_src, blocksize, callback) # TODO: check result def copy_to_file(self, name, fp_dest, callback=None): """Write cur_dir/name to file-like `fp_dest`. Args: name (str): file name, located in self.curdir fp_dest (file-like): must support write() method callback (function, optional): Called like `func(buf)` for every written chunk """ assert compat.is_native(name) def _write_to_file(data): # print("_write_to_file() {} bytes.".format(len(data))) fp_dest.write(data) if callback: callback(data) self.ftp.retrbinary( "RETR {}".format(name), _write_to_file, FtpTarget.DEFAULT_BLOCKSIZE ) def remove_file(self, name): """Remove cur_dir/name.""" assert compat.is_native(name) self.check_write(name) # self.cur_dir_meta.remove(name) self.ftp.delete(name) self.remove_sync_info(name) def set_mtime(self, name, mtime, size): assert compat.is_native(name) self.check_write(name) # write("META set_mtime(%s): %s" % (name, time.ctime(mtime))) # We cannot set the mtime on FTP servers, so we store this as additional # meta data in the same directory # TODO: try "SITE UTIME", "MDTM (set version)", or "SRFT" command self.cur_dir_meta.set_mtime(name, mtime, size) def _ftp_pwd(self): """Variant of `self.ftp.pwd()` that supports encoding-fallback. Returns: Current working directory as native string. """ try: return self.ftp.pwd() except UnicodeEncodeError: if compat.PY2 or self.ftp.encoding != "utf-8": raise # should not happen, since Py2 does not try to encode # TODO: this is NOT THREAD-SAFE! prev_encoding = self.ftp.encoding try: write("ftp.pwd() failed with utf-8: trying Cp1252...", warning=True) return self.ftp.pwd() finally: self.ftp.encoding = prev_encoding def _ftp_nlst(self, dir_name): """Variant of `self.ftp.nlst()` that supports encoding-fallback.""" assert compat.is_native(dir_name) lines = [] def _add_line(status, line): lines.append(line) cmd = "NLST " + dir_name self._ftp_retrlines_native(cmd, _add_line, self.encoding) # print(cmd, lines) return lines def _ftp_retrlines_native(self, command, callback, encoding): """A re-implementation of ftp.retrlines that returns lines as native `str`. This is needed on Python 3, where `ftp.retrlines()` returns unicode `str` by decoding the incoming command response using `ftp.encoding`. This would fail for the whole request if a single line of the MLSD listing cannot be decoded. FtpTarget wants to fall back to Cp1252 if UTF-8 fails for a single line, so we need to process the raw original binary input lines. On Python 2, the response is already bytes, but we try to decode in order to check validity and optionally re-encode from Cp1252. Args: command (str): A valid FTP command like 'NLST', 'MLSD', ... callback (function): Called for every line with these args: status (int): 0:ok 1:fallback used, 2:decode failed line (str): result line decoded using `encoding`. If `encoding` is 'utf-8', a fallback to cp1252 is accepted. encoding (str): Coding that is used to convert the FTP response to `str`. Returns: None """ LF = b"\n" buffer = b"" # needed to access buffer accross function scope local_var = {"buffer": buffer} fallback_enc = "cp1252" if encoding == "utf-8" else None def _on_read_line(line): # Line is a byte string # print(" line ", line) status = 2 # fault line_decoded = None try: line_decoded = line.decode(encoding) status = 0 # successfully decoded except UnicodeDecodeError: if fallback_enc: try: line_decoded = line.decode(fallback_enc) status = 1 # used fallback encoding except UnicodeDecodeError: raise if compat.PY2: # line is a native binary `str`. if status == 1: # We used a fallback: re-encode callback(status, line_decoded.encode(encoding)) else: callback(status, line) else: # line_decoded is a native text `str`. callback(status, line_decoded) # on_read_line = _on_read_line_py2 if compat.PY2 else _on_read_line_py3 def _on_read_chunk(chunk): buffer = local_var["buffer"] # Normalize line endings chunk = chunk.replace(b"\r\n", LF) chunk = chunk.replace(b"\r", LF) chunk = buffer + chunk try: # print("Add chunk ", chunk, "to buffer", buffer) while True: item, chunk = chunk.split(LF, 1) _on_read_line(item) # + LF) except ValueError: pass # print("Rest chunk", chunk) local_var["buffer"] = chunk self.ftp.retrbinary(command, _on_read_chunk) if buffer: _on_read_line(buffer) return
class _Target(object): """Base class for :class:`FsTarget`, :class:`FtpTarget`, etc.""" DEFAULT_BLOCKSIZE = 16 * 1024 # shutil.copyobj() uses 16k blocks by default def __init__(self, root_dir, extra_opts): # All internal paths should use unicode. # (We cannot convert here, since we don't know the target encoding.) assert compat.is_native(root_dir) if root_dir != "/": root_dir = root_dir.rstrip("/") # This target is not thread safe self._rlock = threading.RLock() #: The target's top-level folder self.root_dir = root_dir self.extra_opts = extra_opts or {} self.readonly = False self.dry_run = False self.host = None self.synchronizer = None # Set by BaseSynchronizer.__init__() self.peer = None self.cur_dir = None self.connected = False self.save_mode = True self.case_sensitive = None # TODO: don't know yet #: Time difference between <local upload time> and the mtime that the server reports afterwards. #: The value is added to the 'u' time stored in meta data. #: (This is only a rough estimation, derived from the lock-file.) self.server_time_ofs = None #: Maximum allowed difference between a reported mtime and the last known update time, #: before we classify the entry as 'modified externally' self.mtime_compare_eps = FileEntry.EPS_TIME self.cur_dir_meta = DirMetadata(self) self.meta_stack = [] # Optionally define an encoding for this target, but don't override # derived class's setting if not hasattr(self, "encoding"): #: Assumed encoding for this target. Used to decode binary paths. self.encoding = _get_encoding_opt(None, extra_opts, None) return def __del__(self): # TODO: http://pydev.blogspot.de/2015/01/creating-safe-cyclic-reference.html self.close() # def __enter__(self): # self.open() # return self # def __exit__(self, exc_type, exc_value, traceback): # self.close() def get_base_name(self): return "{}".format(self.root_dir) def is_local(self): return self.synchronizer.local is self def is_unbound(self): return self.synchronizer is None # def to_bytes(self, s): # """Convert `s` to bytes, using this target's encoding (does nothing if `s` is already bytes).""" # return compat.to_bytes(s, self.encoding) # def to_unicode(self, s): # """Convert `s` to unicode, using this target's encoding (does nothing if `s` is already unic).""" # return compat.to_unicode(s, self.encoding) # def to_native(self, s): # """Convert `s` to native, using this target's encoding (does nothing if `s` is already native).""" # return compat.to_native(s, self.encoding) # def re_encode_to_native(self, s): # """Return `s` in `str` format, assuming target.encoding. # On Python 2 return a binary `str`: # Encode unicode to UTF-8 binary str # Re-encode binary str from self.encoding to UTF-8 # On Python 3 return unicode `str`: # Leave unicode unmodified # Decode binary str using self.encoding # """ # if compat.PY2: # if isinstance(s, unicode): # noqa # s = s.encode("utf-8") # elif self.encoding != "utf-8": # s = s.decode(self.encoding) # s = s.encode("utf-8") # elif not isinstance(s, str): # s = s.decode(self.encoding) # return s def get_options_dict(self): """Return options from synchronizer (possibly overridden by own extra_opts).""" d = self.synchronizer.options if self.synchronizer else {} d.update(self.extra_opts) return d def get_option(self, key, default=None): """Return option from synchronizer (possibly overridden by target extra_opts).""" if self.synchronizer: return self.extra_opts.get( key, self.synchronizer.options.get(key, default)) return self.extra_opts.get(key, default) def open(self): if self.connected: raise RuntimeError("Target already open: {}. ".format(self)) # Not thread safe (issue #20) if not self._rlock.acquire(False): raise RuntimeError("Could not acquire _Target lock on open") self.connected = True def close(self): if not self.connected: return if self.get_option("verbose", 3) >= 5: write("Closing target {}.".format(self)) self.connected = False self.readonly = False # issue #20 self._rlock.release() def check_write(self, name): """Raise exception if writing cur_dir/name is not allowed.""" assert compat.is_native(name) if self.readonly and name not in ( DirMetadata.META_FILE_NAME, DirMetadata.LOCK_FILE_NAME, ): raise RuntimeError("Target is read-only: {} + {} / ".format( self, name)) def get_id(self): return self.root_dir def get_sync_info(self, name, key=None): """Get mtime/size when this target's current dir was last synchronized with remote.""" peer_target = self.peer if self.is_local(): info = self.cur_dir_meta.dir["peer_sync"].get(peer_target.get_id()) else: info = peer_target.cur_dir_meta.dir["peer_sync"].get(self.get_id()) if name is not None: info = info.get(name) if info else None if info and key: info = info.get(key) return info def cwd(self, dir_name): raise NotImplementedError def push_meta(self): self.meta_stack.append(self.cur_dir_meta) self.cur_dir_meta = None def pop_meta(self): self.cur_dir_meta = self.meta_stack.pop() def flush_meta(self): """Write additional meta information for current directory.""" if self.cur_dir_meta: self.cur_dir_meta.flush() def pwd(self, dir_name): raise NotImplementedError def mkdir(self, dir_name): raise NotImplementedError def rmdir(self, dir_name): """Remove cur_dir/name.""" raise NotImplementedError def get_dir(self): """Return a list of _Resource entries.""" raise NotImplementedError def walk(self, pred=None, recursive=True): """Iterate over all target entries recursively. Args: pred (function, optional): Callback(:class:`ftpsync.resources._Resource`) should return `False` to ignore entry. Default: `None`. recursive (bool, optional): Pass `False` to generate top level entries only. Default: `True`. Yields: :class:`ftpsync.resources._Resource` """ for entry in self.get_dir(): if pred and pred(entry) is False: continue yield entry if recursive: if isinstance(entry, DirectoryEntry): self.cwd(entry.name) for e in self.walk(pred): yield e self.cwd("..") return def open_readable(self, name): """Return file-like object opened in binary mode for cur_dir/name.""" raise NotImplementedError def open_writable(self, name): """Return file-like object opened in binary mode for cur_dir/name.""" raise NotImplementedError def read_text(self, name): """Read text string from cur_dir/name using open_readable().""" with self.open_readable(name) as fp: res = fp.read() # StringIO or file object # try: # res = fp.getvalue() # StringIO returned by FtpTarget # except AttributeError: # res = fp.read() # file object returned by FsTarget res = res.decode("utf-8") return res def copy_to_file(self, name, fp_dest, callback=None): """Write cur_dir/name to file-like `fp_dest`. Args: name (str): file name, located in self.curdir fp_dest (file-like): must support write() method callback (function, optional): Called like `func(buf)` for every written chunk """ raise NotImplementedError def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): """Write binary data from file-like to cur_dir/name.""" raise NotImplementedError def write_text(self, name, s): """Write string data to cur_dir/name using write_file().""" buf = io.BytesIO(compat.to_bytes(s)) self.write_file(name, buf) def remove_file(self, name): """Remove cur_dir/name.""" raise NotImplementedError def set_mtime(self, name, mtime, size): raise NotImplementedError def set_sync_info(self, name, mtime, size): """Store mtime/size when this resource was last synchronized with remote.""" if not self.is_local(): return self.peer.set_sync_info(name, mtime, size) return self.cur_dir_meta.set_sync_info(name, mtime, size) def remove_sync_info(self, name): if not self.is_local(): return self.peer.remove_sync_info(name) if self.cur_dir_meta: return self.cur_dir_meta.remove(name) # write("%s.remove_sync_info(%s): nothing to do" % (self, name)) return
class _Target(object): """Base class for :class:`FsTarget`, :class:`FtpTarget`, etc.""" DEFAULT_BLOCKSIZE = 16 * 1024 # shutil.copyobj() uses 16k blocks by default def __init__(self, root_dir, extra_opts): if root_dir != "/": root_dir = root_dir.rstrip("/") # This target is not thread safe self._rlock = threading.RLock() #: self.root_dir = root_dir self.extra_opts = extra_opts or {} self.readonly = False self.dry_run = False self.host = None self.synchronizer = None # Set by BaseSynchronizer.__init__() self.peer = None self.cur_dir = None self.connected = False self.save_mode = True self.case_sensitive = None # TODO: don't know yet self.time_ofs = None # TODO: see _probe_lock_file() self.support_set_time = None # Derived class knows self.cur_dir_meta = DirMetadata(self) self.meta_stack = [] def __del__(self): # TODO: http://pydev.blogspot.de/2015/01/creating-safe-cyclic-reference.html self.close() # def __enter__(self): # self.open() # return self # # def __exit__(self, exc_type, exc_value, traceback): # self.close() def get_base_name(self): return "{}".format(self.root_dir) def is_local(self): return self.synchronizer.local is self def is_unbound(self): return self.synchronizer is None def get_options_dict(self): """Return options from synchronizer (possibly overridden by own extra_opts).""" d = self.synchronizer.options if self.synchronizer else {} d.update(self.extra_opts) return d def get_option(self, key, default=None): """Return option from synchronizer (possibly overridden by target extra_opts).""" if self.synchronizer: return self.extra_opts.get( key, self.synchronizer.options.get(key, default)) return self.extra_opts.get(key, default) def open(self): if self.connected: raise RuntimeError("Target already open: {}. ".format(self)) # Not thread safe (issue #20) if not self._rlock.acquire(False): raise RuntimeError("Could not acquire _Target lock on open") self.connected = True def close(self): if not self.connected: return if self.get_option("verbose", 3) >= 5: write("Closing target {}.".format(self)) self.connected = False self.readonly = False # issue #20 self._rlock.release() def check_write(self, name): """Raise exception if writing cur_dir/name is not allowed.""" if self.readonly and name not in (DirMetadata.META_FILE_NAME, DirMetadata.LOCK_FILE_NAME): raise RuntimeError("Target is read-only: {} + {} / ".format( self, name)) def get_id(self): return self.root_dir def get_sync_info(self, name, key=None): """Get mtime/size when this target's current dir was last synchronized with remote.""" peer_target = self.peer if self.is_local(): info = self.cur_dir_meta.dir["peer_sync"].get(peer_target.get_id()) else: info = peer_target.cur_dir_meta.dir["peer_sync"].get(self.get_id()) if name is not None: info = info.get(name) if info else None if info and key: info = info.get(key) return info def cwd(self, dir_name): raise NotImplementedError def push_meta(self): self.meta_stack.append(self.cur_dir_meta) self.cur_dir_meta = None def pop_meta(self): self.cur_dir_meta = self.meta_stack.pop() def flush_meta(self): """Write additional meta information for current directory.""" if self.cur_dir_meta: self.cur_dir_meta.flush() def pwd(self, dir_name): raise NotImplementedError def mkdir(self, dir_name): raise NotImplementedError def rmdir(self, dir_name): """Remove cur_dir/name.""" raise NotImplementedError def get_dir(self): """Return a list of _Resource entries.""" raise NotImplementedError def walk(self, pred=None, recursive=True): """Iterate over all target entries recursively. Args: pred (function, optional): Callback(:class:`ftpsync.resources._Resource`) should return `False` to ignore entry. Default: `None`. recursive (bool, optional): Pass `False` to generate top level entries only. Default: `True`. Yields: :class:`ftpsync.resources._Resource` """ for entry in self.get_dir(): if pred and pred(entry) is False: continue yield entry if recursive: if isinstance(entry, DirectoryEntry): self.cwd(entry.name) for e in self.walk(pred): yield e self.cwd("..") return def open_readable(self, name): """Return file-like object opened in binary mode for cur_dir/name.""" raise NotImplementedError def open_writable(self, name): """Return file-like object opened in binary mode for cur_dir/name.""" raise NotImplementedError def read_text(self, name): """Read text string from cur_dir/name using open_readable().""" with self.open_readable(name) as fp: res = fp.read() # StringIO or file object # try: # res = fp.getvalue() # StringIO returned by FtpTarget # except AttributeError: # res = fp.read() # file object returned by FsTarget res = res.decode("utf8") return res def copy_to_file(self, name, fp_dest, callback=None): """Write cur_dir/name to file-like `fp_dest`. Args: name (str): file name, located in self.curdir fp_dest (file-like): must support write() method callback (function, optional): Called like `func(buf)` for every written chunk """ def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): """Write binary data from file-like to cur_dir/name.""" raise NotImplementedError def write_text(self, name, s): """Write string data to cur_dir/name using write_file().""" buf = io.BytesIO(compat.to_bytes(s)) self.write_file(name, buf) def remove_file(self, name): """Remove cur_dir/name.""" raise NotImplementedError def set_mtime(self, name, mtime, size): raise NotImplementedError def set_sync_info(self, name, mtime, size): """Store mtime/size when this resource was last synchronized with remote.""" if not self.is_local(): return self.peer.set_sync_info(name, mtime, size) return self.cur_dir_meta.set_sync_info(name, mtime, size) def remove_sync_info(self, name): if not self.is_local(): return self.peer.remove_sync_info(name) if self.cur_dir_meta: return self.cur_dir_meta.remove(name) # write("%s.remove_sync_info(%s): nothing to do" % (self, name)) return
class SFTPTarget(_Target): """Represents a synchronization target on an SFTP server. Attributes: path (str): Current working directory on SFTP server. sftp (pysftp.Connection): Instance of pysftp.Connection. host (str): hostname of SFTP server port (int): SFTP port (defaults to 22) username (str): password (str): """ DEFAULT_BLOCKSIZE = 8 * 1024 # ftplib uses 8k chunks by default MAX_SPOOL_MEM = ( 100 * 1024 ) # keep open_readable() buffer in memory if smaller than 100kB def __init__( self, path, host, port=22, username=None, password=None, timeout=None, extra_opts=None, ): """Create SFTP target with host, initial path, optional credentials and options. Args: path (str): root path on SFTP server, relative to *host* host (str): hostname of SFTP server port (int): SFTP port (defaults to 22) username (str): password (str): timeout (int): the timeout to set against the ftp socket (seconds) extra_opts (dict): """ self.encoding = _get_encoding_opt(None, extra_opts, "utf-8") # path = self.to_unicode(path) path = path or "/" assert is_native(path) super(SFTPTarget, self).__init__(path, extra_opts) self.sftp = None self.host = host self.port = port or 22 self.username = username self.password = password self.timeout = timeout #: dict: written to ftp target root folder before synchronization starts. #: set to False, if write failed. Default: None self.lock_data = None self.lock_write_time = None #: Time difference between <local upload time> and the mtime that the #: server reports afterwards. #: The value is added to the 'u' time stored in meta data. #: (This is only a rough estimation, derived from the lock-file.) self.server_time_ofs = None self.ftp_socket_connected = False # self.support_set_time = False # #: Optionally define an encoding for this server # encoding = self.get_option("encoding", "utf-8") # self.encoding = codecs.lookup(encoding).name return def __str__(self): return "<{} + {}>".format( self.get_base_name(), relpath_url(self.cur_dir or "/", self.root_dir) ) def get_base_name(self): scheme = "sftp" return "{}://{}{}".format(scheme, self.host, self.root_dir) def open(self): assert not self.ftp_socket_connected super(SFTPTarget, self).open() options = self.get_options_dict() no_prompt = self.get_option("no_prompt", True) store_password = self.get_option("store_password", False) verbose = self.get_option("verbose", 3) verify_host_keys = not self.get_option("no_verify_host_keys", False) if self.get_option("ftp_active", False): raise RuntimeError("SFTP does not have active/passive mode.") if verbose <= 3: logging.getLogger("paramiko.transport").setLevel(logging.WARNING) write("Connecting {}:*** to sftp://{}".format(self.username, self.host)) cnopts = pysftp.CnOpts() cnopts.log = self.get_option("ftp_debug", False) if not verify_host_keys: cnopts.hostkeys = None if self.username is None or self.password is None: creds = get_credentials_for_url( self.host, options, force_user=self.username ) if creds: self.username, self.password = creds assert self.sftp is None while True: try: self.sftp = pysftp.Connection( self.host, username=self.username, password=self.password, port=self.port, cnopts=cnopts, ) break except paramiko.ssh_exception.AuthenticationException as e: write_error( "Could not login to {}@{}: {}".format(self.username, self.host, e) ) if no_prompt or not self.username: raise creds = prompt_for_password(self.host, self.username) self.username, self.password = creds # Continue while-loop except paramiko.ssh_exception.SSHException as e: write_error( "{exc}: Try `ssh-keyscan HOST` to add it " "(or pass `--no-verify-host-keys` if you don't care about security).".format( exc=e ) ) raise if verbose >= 4: write( "Login as '{}'.".format(self.username if self.username else "anonymous") ) if self.sftp.logfile: write("Logging to {}".format(self.sftp.logfile)) self.sftp.timeout = self.timeout self.ftp_socket_connected = True try: self.sftp.cwd(self.root_dir) except IOError as e: # if not e.args[0].startswith("550"): # raise # error other then 550 No such directory' write_error( "Could not change directory to {} ({}): missing permissions?".format( self.root_dir, e ) ) pwd = self.pwd() # pwd = self.to_unicode(pwd) if pwd != self.root_dir: raise RuntimeError( "Unable to navigate to working directory {!r} (now at {!r})".format( self.root_dir, pwd ) ) self.cur_dir = pwd # self.ftp_initialized = True # Successfully authenticated: store password if store_password: save_password(self.host, self.username, self.password) self._lock() return def close(self): if self.lock_data: self._unlock(closing=True) if self.ftp_socket_connected: try: self.sftp.close() except (ConnectionError, EOFError) as e: write_error("sftp.close() failed: {}".format(e)) self.ftp_socket_connected = False super(SFTPTarget, self).close() def _lock(self, break_existing=False): """Write a special file to the target root folder.""" # write("_lock") data = {"lock_time": time.time(), "lock_holder": None} try: assert self.cur_dir == self.root_dir self.write_text(DirMetadata.LOCK_FILE_NAME, json.dumps(data)) self.lock_data = data self.lock_write_time = time.time() except Exception as e: write_error("Could not write lock file: {}".format(e)) # Set to False, so we don't try to remove later self.lock_data = False def _unlock(self, closing=False): """Remove lock file to the target root folder.""" # write("_unlock", closing) try: if self.cur_dir != self.root_dir: if closing: write( "Changing to ftp root folder to remove lock file: {}".format( self.root_dir ) ) self.cwd(self.root_dir) else: write_error( "Could not remove lock file, because CWD != ftp root: {}".format( self.cur_dir ) ) return if self.lock_data is False: if self.get_option("verbose", 3) >= 4: write("Skip remove lock file (was not written).") else: # direct delete, without updating metadata or checking for target access: self.sftp.remove(DirMetadata.LOCK_FILE_NAME) # self.remove_file(DirMetadata.LOCK_FILE_NAME) self.lock_data = None except Exception as e: write_error("Could not remove lock file: {}".format(e)) raise def _probe_lock_file(self, reported_mtime): """Called by get_dir""" delta = reported_mtime - self.lock_data["lock_time"] # delta2 = reported_mtime - self.lock_write_time self.server_time_ofs = delta if self.get_option("verbose", 3) >= 4: write("Server time offset: {:.2f} seconds.".format(delta)) # write("Server time offset2: {:.2f} seconds.".format(delta2)) def get_id(self): return self.host + self.root_dir def cwd(self, dir_name): assert is_native(dir_name) path = normpath_url(join_url(self.cur_dir, dir_name)) if not path.startswith(self.root_dir): # paranoic check to prevent that our sync tool goes berserk raise RuntimeError( "Tried to navigate outside root {!r}: {!r}".format(self.root_dir, path) ) self.sftp.cwd(dir_name) self.cur_dir = path self.cur_dir_meta = None return self.cur_dir def pwd(self): """Return current working dir as native `str` (uses fallback-encoding).""" pwd = self.sftp.pwd if pwd != "/": # #38 pwd = pwd.rstrip("/") return pwd def mkdir(self, dir_name): assert is_native(dir_name) self.check_write(dir_name) self.sftp.mkdir(dir_name) def rmdir(self, dir_name): self.check_write(dir_name) return self.sftp.rmdir(dir_name) _paramiko_py3compat_u = paramiko.py3compat.u @staticmethod def _paramiko_py3compat_u_wrapper(s, encoding="utf8"): try: return SFTPTarget._paramiko_py3compat_u(s, encoding) except UnicodeDecodeError: write_error( "Failed to decode {} using {}. Trying cp1252...".format(s, encoding) ) s = s.decode("cp1252") return s def get_dir(self): # Fallback to cp1252 if utf8 fails with patch("paramiko.message.u", SFTPTarget._paramiko_py3compat_u_wrapper): res = self._get_dir_impl() return res def _get_dir_impl(self): entry_list = [] entry_map = {} has_meta = False attr_list = self.sftp.listdir_attr() for de in attr_list: is_dir = stat.S_ISDIR(de.st_mode) name = de.filename entry = None if is_dir: if name not in (".", ".."): entry = DirectoryEntry( self, self.cur_dir, name, de.st_size, de.st_mtime, unique=None ) elif name == DirMetadata.META_FILE_NAME: # the meta-data file is silently ignored has_meta = True elif name == DirMetadata.LOCK_FILE_NAME and self.cur_dir == self.root_dir: # this is the root lock file. Compare reported mtime with # local upload time self._probe_lock_file(de.st_mtime) else: entry = FileEntry( self, self.cur_dir, name, de.st_size, de.st_mtime, unique=None ) if entry: entry_map[name] = entry entry_list.append(entry) # load stored meta data if present self.cur_dir_meta = DirMetadata(self) if has_meta: try: self.cur_dir_meta.read() except IncompatibleMetadataVersion: raise # this should end the script (user should pass --migrate) except Exception as e: write_error( "Could not read meta info {}: {}".format(self.cur_dir_meta, e) ) meta_files = self.cur_dir_meta.list # Adjust file mtime from meta-data if present missing = [] for n in meta_files: meta = meta_files[n] if n in entry_map: # We have a meta-data entry for this resource upload_time = meta.get("u", 0) # Discard stored meta-data if # 1. the reported files size is different than the # size we stored in the meta-data # or # 2. the the mtime reported by the SFTP server is later # than the stored upload time (which indicates # that the file was modified directly on the server) if entry_map[n].size != meta.get("s"): if self.get_option("verbose", 3) >= 5: write( "Removing meta entry {} (size changed from {} to {}).".format( n, entry_map[n].size, meta.get("s") ) ) missing.append(n) elif (entry_map[n].mtime - upload_time) > self.mtime_compare_eps: if self.get_option("verbose", 3) >= 5: write( "Removing meta entry {} (modified {} > {}).".format( n, time.ctime(entry_map[n].mtime), time.ctime(upload_time), ) ) missing.append(n) else: # Use meta-data mtime instead of the one reported by SFTP server entry_map[n].meta = meta entry_map[n].mtime = meta["m"] else: # File is stored in meta-data, but no longer exists on SFTP server # write("META: Removing missing meta entry %s" % n) missing.append(n) # Remove missing or invalid files from cur_dir_meta for n in missing: self.cur_dir_meta.remove(n) # print("entry_list", entry_list) return entry_list def open_readable(self, name): """Open cur_dir/name for reading. Note: we read everything into a buffer that supports .read(). Args: name (str): file name, located in self.curdir Returns: file-like (must support read() method) """ # print("SFTP open_readable({})".format(name)) assert is_native(name) # TODO: use sftp.open() instead? out = SpooledTemporaryFile(max_size=self.MAX_SPOOL_MEM, mode="w+b") self.sftp.getfo(name, out) out.seek(0) return out def write_file(self, name, fp_src, blocksize=DEFAULT_BLOCKSIZE, callback=None): """Write file-like `fp_src` to cur_dir/name. Args: name (str): file name, located in self.curdir fp_src (file-like): must support read() method blocksize (int, optional): callback (function, optional): Called like `func(buf)` for every written chunk """ # print("SFTP write_file({})".format(name), blocksize) assert is_native(name) self.check_write(name) self.sftp.putfo(fp_src, name) # , callback) # TODO: check result def copy_to_file(self, name, fp_dest, callback=None): """Write cur_dir/name to file-like `fp_dest`. Args: name (str): file name, located in self.curdir fp_dest (file-like): must support write() method callback (function, optional): Called like `func(buf)` for every written chunk """ assert is_native(name) self.sftp.getfo(name, fp_dest) def remove_file(self, name): """Remove cur_dir/name.""" assert is_native(name) self.check_write(name) # self.cur_dir_meta.remove(name) self.sftp.remove(name) self.remove_sync_info(name) def set_mtime(self, name, mtime, size): assert is_native(name) self.check_write(name) # write("META set_mtime(%s): %s" % (name, time.ctime(mtime))) # We cannot set the mtime on SFTP servers, so we store this as additional # meta data in the same directory # TODO: try "SITE UTIME", "MDTM (set version)", or "SRFT" command self.cur_dir_meta.set_mtime(name, mtime, size)