Skip to content

Commit

Permalink
fixup! [wip] Add tests and documentation for IPFS, TODO: SMB, DropBox…
Browse files Browse the repository at this point in the history
…, Hf
  • Loading branch information
mxmlnkn committed Oct 12, 2024
1 parent 3ee588b commit b198491
Show file tree
Hide file tree
Showing 4 changed files with 73 additions and 8 deletions.
20 changes: 14 additions & 6 deletions core/ratarmountcore/FSSpecMountSource.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,11 @@
except ImportError:
fsspec = None # type: ignore

try:
from webdav4.fsspec import WebdavFileSystem
except ImportError:
WebdavFileSystem = None # type: ignore


class FSSpecMountSource(MountSource):
"""
Expand Down Expand Up @@ -71,12 +76,14 @@ def __init__(self, urlOrFS, prefix: Optional[str] = None, **options) -> None:

# The fsspec filesystems are not uniform! http:// expects the arguments to isdir with prefixed
# protocol while other filesystem implementations are fine with only the path.
# https://github.com/ray-project/ray/issues/26423#issuecomment-1179561181
self._isHTTP = isinstance(self.fileSystem, fsspec.implementations.http.HTTPFileSystem)
# - https://github.com/ray-project/ray/issues/26423#issuecomment-1179561181
# - https://github.com/fsspec/filesystem_spec/issues/1713
# - https://github.com/skshetry/webdav4/issues/198
self._pathsRequireQuoting = isinstance(self.fileSystem, (fsspec.implementations.http.HTTPFileSystem, WebdavFileSystem))
self.prefix = prefix.rstrip("/") if prefix and prefix.strip("/") and self.fileSystem.isdir(prefix) else ""

def _getPath(self, path: str) -> str:
if self._isHTTP:
if self._pathsRequireQuoting:
path = urllib.parse.quote(path)
if self.prefix:
if not path or path == "/":
Expand Down Expand Up @@ -110,9 +117,10 @@ def _convertToFileInfo(entry, path) -> FileInfo:
# They kinda work only like hardlinks.
# https://github.com/fsspec/filesystem_spec/issues/1679
# https://github.com/fsspec/filesystem_spec/issues/1680
size = entry.get('size', 0)
return FileInfo(
# fmt: off
size = entry.get('size', 0),
size = size if size else 0,
mtime = FSSpecMountSource._getModificationTime(entry),
mode = FSSpecMountSource._getMode(entry),
linkname = "",
Expand Down Expand Up @@ -181,7 +189,7 @@ def _listDir(self, path: str, onlyMode: bool) -> Optional[Union[Iterable[str], D
)
for entry in result
}
if self._isHTTP:
if self._pathsRequireQuoting:
return {
urllib.parse.unquote(name): info for name, info in result.items() if not name.startswith(('?', '#'))
}
Expand Down Expand Up @@ -214,7 +222,7 @@ def _getFileInfoHTTP(self, path: str) -> Optional[FileInfo]:

@overrides(MountSource)
def getFileInfo(self, path: str, fileVersion: int = 0) -> Optional[FileInfo]:
if self._isHTTP:
if isinstance(self.fileSystem, fsspec.implementations.http.HTTPFileSystem):
return self._getFileInfoHTTP(path)

path = self._getPath(path)
Expand Down
28 changes: 28 additions & 0 deletions core/ratarmountcore/factory.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
# pylint: disable=no-member,abstract-method
# Disable pylint errors. See https://github.com/fsspec/filesystem_spec/issues/1678

import http
import os
import stat
import sys
Expand Down Expand Up @@ -255,6 +256,33 @@ def tryOpenURL(url, printDebug: int) -> Union[MountSource, IO[bytes], str]:
with warnings.catch_warnings():
warnings.simplefilter("ignore")
fileSystem, path = fsspec.url_to_fs(url)
elif protocol == 'webdav':
# This needs special handling because we need to decide between HTTP and HTTPS and because of:
# https://github.com/skshetry/webdav4/issues/197
try:
from webdav4.fsspec import WebdavFileSystem
except ImportError:
raise RatarmountError("Install the webdav4 Python package to mount webdav://.")

splitAtSlash = splitURI[1].split('/', 1)
if len(splitAtSlash) == 2:
baseURL, path = splitAtSlash
else:
baseURL = splitURI[1]
path = ""

def checkForHTTPS(url):
try:
connection = http.client.HTTPSConnection(url, timeout=2)
connection.request("HEAD", "/")
return bool(connection.getresponse())
except Exception as exception:
if printDebug >= 3:
print("[Info] Determined WebDAV URL to not use HTTP instead HTTPS because of:", exception)
return False

transportProtocol = "https" if checkForHTTPS(baseURL) else "http"
fileSystem = WebdavFileSystem(f"{transportProtocol}://{baseURL}")
else:
fileSystem, path = fsspec.url_to_fs(url)

Expand Down
2 changes: 2 additions & 0 deletions tests/requirements-tests.txt
Original file line number Diff line number Diff line change
Expand Up @@ -26,3 +26,5 @@ pyminizip
pyopenssl>=23
rangehttpserver
boto3
wsgidav
cheroot
31 changes: 29 additions & 2 deletions tests/runtests.sh
Original file line number Diff line number Diff line change
Expand Up @@ -2115,7 +2115,7 @@ checkURLProtocolS3()

weedFolder=$( mktemp -d --suffix .test.ratarmount )
TMP_FILES_TO_CLEANUP+=( "$weedFolder" )
./weed server -dir="$weedFolder" -s3 -s3.port "$port" -idleTimeout=30 -ip 127.0.0.1 2>weed.log &
./weed server -dir="$weedFolder" -s3 -s3.port "$port" -idleTimeout=30 -ip 127.0.0.1 &
pid=$!

# Wait for port to open
Expand Down Expand Up @@ -2222,9 +2222,11 @@ checkURLProtocolIPFS()
ipfs=kubo/ipfs
fi

local pid=
$ipfs init --profile server
if ! pgrep ipfs; then
$ipfs daemon &
pid=$!
sleep 5
fi

Expand All @@ -2240,6 +2242,31 @@ checkURLProtocolIPFS()
d3b07384d113edec49eaa6238ad5ff00 || returnError "$LINENO" 'Failed to read from IPFS'
checkFileInTARForeground "ipfs://QmZwm9gKZaayGWqYtMgj6cd4JaNK1Yp2ChYZhXrERGq4Gi" single-file.tar \
1a28538854d1884e4415cb9bfb7a2ad8 || returnError "$LINENO" 'Failed to read from IPFS'

if [[ -n "$pid" ]]; then kill "$pid"; fi
}


checkURLProtocolWebDAV()
{
if ! pip show wsgidav &>/dev/null; then
echoerr "Skipping WebDAV test because wsigdav package is not installed."
return 0
fi

local port=8047
# BEWARE OF LOOP MOUNTS when testing locally!
# It will time out, when trying to expose PWD via WebDAV while mounting into PWD/mounted.
wsgidav --host=127.0.0.1 --port=8047 --root="$PWD" --auth=anonymous &
local pid=$!
sleep 5

checkFileInTARForeground "webdav://127.0.0.1:$port/single-file.tar" bar \
d3b07384d113edec49eaa6238ad5ff00 || returnError "$LINENO" 'Failed to read from WebDAV server'
checkFileInTARForeground "webdav://127.0.0.1:$port" single-file.tar \
1a28538854d1884e4415cb9bfb7a2ad8 || returnError "$LINENO" 'Failed to read from WebDAV server'

kill "$pid"
}


Expand All @@ -2259,7 +2286,7 @@ checkRemoteSupport()
checkURLProtocolSSH || returnError 'Failed ssh:// check'

checkURLProtocolSamba || returnError 'Failed smb:// check'
# TODO Add and test IPFS
checkURLProtocolWebDAV || returnError 'Failed webdav:// check'
# TODO look for other fsspec implementations in an automated manner
}

Expand Down

0 comments on commit b198491

Please sign in to comment.