in src/huggingface_hub/hf_file_system.py [0:0]
def info(self, path: str, refresh: bool = False, revision: Optional[str] = None, **kwargs) -> Dict[str, Any]:
"""
Get information about a file or directory.
For more details, refer to [fsspec documentation](https://filesystem-spec.readthedocs.io/en/latest/api.html#fsspec.spec.AbstractFileSystem.info).
<Tip warning={true}>
Note: When possible, use `HfApi.get_paths_info()` or `HfApi.repo_info()` for better performance.
</Tip>
Args:
path (`str`):
Path to get info for.
refresh (`bool`, *optional*):
If True, bypass the cache and fetch the latest data. Defaults to False.
revision (`str`, *optional*):
The git revision to get info from.
Returns:
`Dict[str, Any]`: Dictionary containing file information (type, size, commit info, etc.).
"""
resolved_path = self.resolve_path(path, revision=revision)
path = resolved_path.unresolve()
expand_info = kwargs.get(
"expand_info", True
) # don't expose it as a parameter in the public API to follow the spec
if not resolved_path.path_in_repo:
# Path is the root directory
out = {
"name": path,
"size": 0,
"type": "directory",
}
if expand_info:
last_commit = self._api.list_repo_commits(
resolved_path.repo_id, repo_type=resolved_path.repo_type, revision=resolved_path.revision
)[-1]
out = {
**out,
"tree_id": None, # TODO: tree_id of the root directory?
"last_commit": LastCommitInfo(
oid=last_commit.commit_id, title=last_commit.title, date=last_commit.created_at
),
}
else:
out = None
parent_path = self._parent(path)
if not expand_info and parent_path not in self.dircache:
# Fill the cache with cheap call
self.ls(parent_path, expand_info=False)
if parent_path in self.dircache:
# Check if the path is in the cache
out1 = [o for o in self.dircache[parent_path] if o["name"] == path]
if not out1:
_raise_file_not_found(path, None)
out = out1[0]
if refresh or out is None or (expand_info and out and out["last_commit"] is None):
paths_info = self._api.get_paths_info(
resolved_path.repo_id,
resolved_path.path_in_repo,
expand=expand_info,
revision=resolved_path.revision,
repo_type=resolved_path.repo_type,
)
if not paths_info:
_raise_file_not_found(path, None)
path_info = paths_info[0]
root_path = HfFileSystemResolvedPath(
resolved_path.repo_type,
resolved_path.repo_id,
resolved_path.revision,
path_in_repo="",
_raw_revision=resolved_path._raw_revision,
).unresolve()
if isinstance(path_info, RepoFile):
out = {
"name": root_path + "/" + path_info.path,
"size": path_info.size,
"type": "file",
"blob_id": path_info.blob_id,
"lfs": path_info.lfs,
"last_commit": path_info.last_commit,
"security": path_info.security,
}
else:
out = {
"name": root_path + "/" + path_info.path,
"size": 0,
"type": "directory",
"tree_id": path_info.tree_id,
"last_commit": path_info.last_commit,
}
if not expand_info:
out = {k: out[k] for k in ["name", "size", "type"]}
assert out is not None
return out