Mercurial > hg
changeset 50477:4cbdfab6f812
store: lazily get file size on demand for the fncache case
We don't have the information in the first place, so we can avoid querying the
file system unconditionally for use cases that don't need it.
This change requires the StoreFile class to be passed a vfs to retrieve the
file_size if needed.
In the non-fncache case, we already have the information from file system
walking, so we keep it and use it.
author | Pierre-Yves David <pierre-yves.david@octobus.net> |
---|---|
date | Mon, 15 May 2023 08:58:01 +0200 |
parents | 2b2284cf949b |
children | 1c0244a8cdaf |
files | mercurial/store.py mercurial/streamclone.py mercurial/verify.py |
diffstat | 3 files changed, 25 insertions(+), 19 deletions(-) [+] |
line wrap: on
line diff
--- a/mercurial/store.py Mon May 15 08:57:45 2023 +0200 +++ b/mercurial/store.py Mon May 15 08:58:01 2023 +0200 @@ -520,9 +520,17 @@ """a file matching an entry""" unencoded_path = attr.ib() - file_size = attr.ib() + _file_size = attr.ib(default=False) is_volatile = attr.ib(default=False) + def file_size(self, vfs): + if self._file_size is not None: + return self._file_size + try: + return vfs.stat(self.unencoded_path).st_size + except FileNotFoundError: + return 0 + class basicstore: '''base class for local repository stores''' @@ -900,16 +908,12 @@ # However the fncache might contains such file added by # previous version of Mercurial. continue - try: - yield RevlogStoreEntry( - unencoded_path=f, - revlog_type=FILEFLAGS_FILELOG, - is_revlog_main=bool(t & FILEFLAGS_REVLOG_MAIN), - is_volatile=bool(t & FILEFLAGS_VOLATILE), - file_size=self.getsize(ef), - ) - except FileNotFoundError: - pass + yield RevlogStoreEntry( + unencoded_path=f, + revlog_type=FILEFLAGS_FILELOG, + is_revlog_main=bool(t & FILEFLAGS_REVLOG_MAIN), + is_volatile=bool(t & FILEFLAGS_VOLATILE), + ) def copylist(self): d = (
--- a/mercurial/streamclone.py Mon May 15 08:57:45 2023 +0200 +++ b/mercurial/streamclone.py Mon May 15 08:58:01 2023 +0200 @@ -271,9 +271,10 @@ repo.ui.debug(b'scanning\n') for entry in _walkstreamfiles(repo): for f in entry.files(): - if f.file_size: - entries.append((f.unencoded_path, f.file_size)) - total_bytes += f.file_size + file_size = f.file_size(repo.store.vfs) + if file_size: + entries.append((f.unencoded_path, file_size)) + total_bytes += file_size _test_sync_point_walk_1(repo) _test_sync_point_walk_2(repo) @@ -680,12 +681,13 @@ for entry in _walkstreamfiles(repo, matcher): for f in entry.files(): - if f.file_size: + file_size = f.file_size(repo.store.vfs) + if file_size: ft = _fileappend if f.is_volatile: ft = _filefull - entries.append((_srcstore, f.unencoded_path, ft, f.file_size)) - totalfilesize += f.file_size + entries.append((_srcstore, f.unencoded_path, ft, file_size)) + totalfilesize += file_size for name in _walkstreamfullstorefiles(repo): if repo.svfs.exists(name): totalfilesize += repo.svfs.lstat(name).st_size
--- a/mercurial/verify.py Mon May 15 08:57:45 2023 +0200 +++ b/mercurial/verify.py Mon May 15 08:58:01 2023 +0200 @@ -410,7 +410,7 @@ for entry in repo.store.datafiles(undecodable=undecodable): for file_ in entry.files(): f = file_.unencoded_path - size = file_.file_size + size = file_.file_size(repo.store.vfs) if (size > 0 or not revlogv1) and f.startswith(b'meta/'): storefiles.add(_normpath(f)) subdirs.add(os.path.dirname(f)) @@ -477,7 +477,7 @@ undecodable = [] for entry in repo.store.datafiles(undecodable=undecodable): for file_ in entry.files(): - size = file_.file_size + size = file_.file_size(repo.store.vfs) f = file_.unencoded_path if (size > 0 or not revlogv1) and f.startswith(b'data/'): storefiles.add(_normpath(f))