partyfuse: also support mounting nginx, iis
these additional parsers are not included in the sfx-embedded copy of partyfuse.py; grab it from github when necessary
This commit is contained in:
		
							parent
							
								
									f1646b96ca
								
							
						
					
					
						commit
						c81e898435
					
				| @ -1885,6 +1885,7 @@ interact with copyparty using non-browser clients | ||||
| 
 | ||||
| * FUSE: mount a copyparty server as a local filesystem | ||||
|   * cross-platform python client available in [./bin/](bin/) | ||||
|   * able to mount nginx and iis directory listings too, not just copyparty | ||||
|   * can be downloaded from copyparty: controlpanel -> connect -> [partyfuse.py](http://127.0.0.1:3923/.cpr/a/partyfuse.py) | ||||
|   * [rclone](https://rclone.org/) as client can give ~5x performance, see [./docs/rclone.md](docs/rclone.md) | ||||
| 
 | ||||
| @ -1924,7 +1925,7 @@ alternatively, some alternatives roughly sorted by speed (unreproducible benchma | ||||
| 
 | ||||
| * [rclone-webdav](./docs/rclone.md) (25s), read/WRITE (rclone v1.63 or later) | ||||
| * [rclone-http](./docs/rclone.md) (26s), read-only | ||||
| * [partyfuse.py](./bin/#partyfusepy) (35s), read-only | ||||
| * [partyfuse.py](./bin/#partyfusepy) (26s), read-only | ||||
| * [rclone-ftp](./docs/rclone.md) (47s), read/WRITE | ||||
| * davfs2 (103s), read/WRITE | ||||
| * [win10-webdav](#webdav-server) (138s), read/WRITE | ||||
|  | ||||
| @ -15,22 +15,18 @@ produces a chronological list of all uploads by collecting info from up2k databa | ||||
| # [`partyfuse.py`](partyfuse.py) | ||||
| * mount a copyparty server as a local filesystem (read-only) | ||||
| * **supports Windows!** -- expect `194 MiB/s` sequential read | ||||
| * **supports Linux** -- expect `117 MiB/s` sequential read | ||||
| * **supports Linux** -- expect `600 MiB/s` sequential read | ||||
| * **supports macos** -- expect `85 MiB/s` sequential read | ||||
| 
 | ||||
| filecache is default-on for windows and macos; | ||||
| * macos readsize is 64kB, so speed ~32 MiB/s without the cache | ||||
| * windows readsize varies by software; explorer=1M, pv=32k | ||||
| 
 | ||||
| note that copyparty should run with `-ed` to enable dotfiles (hidden otherwise) | ||||
| 
 | ||||
| also consider using [../docs/rclone.md](../docs/rclone.md) instead for 5x performance | ||||
| and consider using [../docs/rclone.md](../docs/rclone.md) instead; usually a bit faster, especially on windows | ||||
| 
 | ||||
| 
 | ||||
| ## to run this on windows: | ||||
| * install [winfsp](https://github.com/billziss-gh/winfsp/releases/latest) and [python 3](https://www.python.org/downloads/) | ||||
|   * [x] add python 3.x to PATH (it asks during install) | ||||
| * `python -m pip install --user fusepy` | ||||
| * `python -m pip install --user fusepy` (or grab a copy of `fuse.py` from the `connect` page on your copyparty, and keep it in the same folder) | ||||
| * `python ./partyfuse.py n: http://192.168.1.69:3923/` | ||||
| 
 | ||||
| 10% faster in [msys2](https://www.msys2.org/), 700% faster if debug prints are enabled: | ||||
|  | ||||
							
								
								
									
										218
									
								
								bin/partyfuse.py
									
									
									
									
									
								
							
							
						
						
									
										218
									
								
								bin/partyfuse.py
									
									
									
									
									
								
							| @ -6,6 +6,8 @@ __copyright__ = 2019 | ||||
| __license__ = "MIT" | ||||
| __url__ = "https://github.com/9001/copyparty/" | ||||
| 
 | ||||
| S_VERSION = "2.0" | ||||
| S_BUILD_DT = "2024-10-01" | ||||
| 
 | ||||
| """ | ||||
| mount a copyparty server (local or remote) as a filesystem | ||||
| @ -19,7 +21,7 @@ usage: | ||||
|   python partyfuse.py http://192.168.1.69:3923/  ./music | ||||
| 
 | ||||
| dependencies: | ||||
|   python3 -m pip install --user fusepy | ||||
|   python3 -m pip install --user fusepy  # or grab it from the connect page | ||||
|   + on Linux: sudo apk add fuse | ||||
|   + on Macos: https://osxfuse.github.io/ | ||||
|   + on Windows: https://github.com/billziss-gh/winfsp/releases/latest | ||||
| @ -59,6 +61,11 @@ WINDOWS = sys.platform == "win32" | ||||
| MACOS = platform.system() == "Darwin" | ||||
| UTC = timezone.utc | ||||
| 
 | ||||
| # !rm.yes> | ||||
| MON3S = "Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec" | ||||
| MON3 = {b:a for a,b in enumerate(MON3S.split(), 1)} | ||||
| # !rm.no> | ||||
| 
 | ||||
| 
 | ||||
| def print(*args, **kwargs): | ||||
|     try: | ||||
| @ -104,12 +111,11 @@ except: | ||||
| 
 | ||||
| 
 | ||||
| def termsafe(txt): | ||||
|     enc = sys.stdout.encoding | ||||
|     try: | ||||
|         return txt.encode(sys.stdout.encoding, "backslashreplace").decode( | ||||
|             sys.stdout.encoding | ||||
|         ) | ||||
|         return txt.encode(enc, "backslashreplace").decode(enc) | ||||
|     except: | ||||
|         return txt.encode(sys.stdout.encoding, "replace").decode(sys.stdout.encoding) | ||||
|         return txt.encode(enc, "replace").decode(enc) | ||||
| 
 | ||||
| 
 | ||||
| def threadless_log(fmt, *a): | ||||
| @ -156,20 +162,10 @@ good_bad = {} | ||||
| def enwin(txt): | ||||
|     return "".join([bad_good.get(x, x) for x in txt]) | ||||
| 
 | ||||
|     for bad, good in bad_good.items(): | ||||
|         txt = txt.replace(bad, good) | ||||
| 
 | ||||
|     return txt | ||||
| 
 | ||||
| 
 | ||||
| def dewin(txt): | ||||
|     return "".join([good_bad.get(x, x) for x in txt]) | ||||
| 
 | ||||
|     for bad, good in bad_good.items(): | ||||
|         txt = txt.replace(good, bad) | ||||
| 
 | ||||
|     return txt | ||||
| 
 | ||||
| 
 | ||||
| class RecentLog(object): | ||||
|     def __init__(self, ar): | ||||
| @ -258,10 +254,14 @@ class CacheNode(object): | ||||
| 
 | ||||
| class Gateway(object): | ||||
|     def __init__(self, ar): | ||||
|         self.base_url = ar.base_url | ||||
|         zs = ar.base_url | ||||
|         if "://" not in zs: | ||||
|             zs = "http://" + zs | ||||
| 
 | ||||
|         self.base_url = zs | ||||
|         self.password = ar.a | ||||
| 
 | ||||
|         ui = urllib.parse.urlparse(self.base_url) | ||||
|         ui = urllib.parse.urlparse(zs) | ||||
|         self.web_root = ui.path.strip("/") | ||||
|         self.SRS = "/%s/" % (self.web_root,) if self.web_root else "/" | ||||
|         try: | ||||
| @ -289,6 +289,41 @@ class Gateway(object): | ||||
| 
 | ||||
|         self.conns = {} | ||||
| 
 | ||||
|         self.fsuf = "?raw" | ||||
|         self.dsuf = "?ls<&dots" | ||||
| 
 | ||||
|         # !rm.yes> | ||||
|         if not ar.html: | ||||
|             self.parse_html = None | ||||
| 
 | ||||
|         elif ar.html == "cpp": | ||||
|             self.parse_html = self.parse_cpp | ||||
|             self.dsuf = "?lt&dots" | ||||
|             self.re_row = re.compile( | ||||
|                 r'^<tr><td>(-|DIR|<a [^<]+</a>)</td><td><a[^>]* href="([^"]+)"[^>]*>([^<]+)</a></td><td>([^<]+)</td><td>.*</td><td>([^<]+)</td></tr>$' | ||||
|             ) | ||||
| 
 | ||||
|         elif ar.html == "nginx": | ||||
|             self.parse_html = self.parse_nginx | ||||
|             self.fsuf = "" | ||||
|             self.dsuf = "" | ||||
|             self.re_row = re.compile( | ||||
|                 r'^<a href="([^"]+)">([^<]+)</a> *([0-9]{2})-([A-Z][a-z]{2})-([0-9]{4}) ([0-9]{2}:[0-9]{2}) *(-|[0-9]+)\r?$' | ||||
|             ) | ||||
| 
 | ||||
|         elif ar.html == "iis": | ||||
|             self.parse_html = self.parse_iis | ||||
|             self.fsuf = "" | ||||
|             self.dsuf = "" | ||||
|             self.re_2nl = re.compile(br"<br>|</pre>") | ||||
|             self.re_row = re.compile( | ||||
|                 r'^ *([0-9]{1,2})/([0-9]{1,2})/([0-9]{4}) {1,2}([0-9]{1,2}:[0-9]{2}) ([AP]M) +(<dir>|[0-9]+) <A HREF="([^"]+)">([^<>]+)</A>$' | ||||
|             ) | ||||
| 
 | ||||
|         else: | ||||
|             raise Exception("unknown HTML dialect: [%s]" % (ar.html,)) | ||||
|         # !rm.no> | ||||
| 
 | ||||
|     def quotep(self, path): | ||||
|         path = path.encode("wtf-8") | ||||
|         return quote(path, safe="/") | ||||
| @ -353,7 +388,7 @@ class Gateway(object): | ||||
|             path = dewin(path) | ||||
| 
 | ||||
|         zs = "%s%s/" if path else "%s%s" | ||||
|         web_path = self.quotep(zs % (self.SRS, path)) + "?ls<&dots" | ||||
|         web_path = self.quotep(zs % (self.SRS, path)) + self.dsuf | ||||
|         r = self.sendreq("GET", web_path, {}) | ||||
|         if r.status != 200: | ||||
|             self.closeconn() | ||||
| @ -381,8 +416,7 @@ class Gateway(object): | ||||
|         if bad_good: | ||||
|             path = dewin(path) | ||||
| 
 | ||||
|         zs = "%s%s/" if path else "%s%s" | ||||
|         web_path = self.quotep(zs % (self.SRS, path)) + "?raw" | ||||
|         web_path = self.quotep("%s%s" % (self.SRS, path)) + self.fsuf | ||||
|         hdr_range = "bytes=%d-%d" % (ofs1, ofs2 - 1) | ||||
| 
 | ||||
|         t = "DL %4.0fK\033[36m%9d-%-9d\033[0m%r" | ||||
| @ -421,12 +455,15 @@ class Gateway(object): | ||||
|         return ret | ||||
| 
 | ||||
|     # !rm.yes> | ||||
|     def parse_html(self, sck): | ||||
|     #################################################################### | ||||
|     #################################################################### | ||||
| 
 | ||||
|     def parse_cpp(self, sck): | ||||
|         # https://a.ocv.me/pub/ | ||||
| 
 | ||||
|         ret = {} | ||||
|         rem = b"" | ||||
|         ptn = re.compile( | ||||
|             r'^<tr><td>(-|DIR|<a [^<]+</a>)</td><td><a[^>]* href="([^"]+)"[^>]*>([^<]+)</a></td><td>([^<]+)</td><td>.*</td><td>([^<]+)</td></tr>$' | ||||
|         ) | ||||
|         ptn = self.re_row | ||||
| 
 | ||||
|         while True: | ||||
|             buf = sck.read(1024 * 32) | ||||
| @ -459,7 +496,7 @@ class Gateway(object): | ||||
|                     sz = int(fsize) | ||||
|                     ts = calendar.timegm(time.strptime(fdate, "%Y-%m-%d %H:%M:%S")) | ||||
|                 except: | ||||
|                     info("bad HTML or OS [%r] [%r]", fdate, fsize) | ||||
|                     info("bad HTML or OS %r %r\n%r", fdate, fsize, line) | ||||
|                     # python cannot strptime(1959-01-01) on windows | ||||
| 
 | ||||
|                 if ftype != "DIR" and "zip=crc" not in ftype: | ||||
| @ -468,9 +505,112 @@ class Gateway(object): | ||||
|                     ret[fname] = self.stat_dir(ts, sz) | ||||
| 
 | ||||
|         return ret | ||||
| 
 | ||||
|     def parse_nginx(self, sck): | ||||
|         # https://ocv.me/stuff/  "06-Feb-2015 15:43" | ||||
| 
 | ||||
|         ret = {} | ||||
|         rem = b"" | ||||
|         re_row = self.re_row | ||||
| 
 | ||||
|         while True: | ||||
|             buf = sck.read(1024 * 32) | ||||
|             if not buf: | ||||
|                 break | ||||
| 
 | ||||
|             buf = rem + buf | ||||
|             rem = b"" | ||||
|             idx = buf.rfind(b"\n") | ||||
|             if idx >= 0: | ||||
|                 rem = buf[idx + 1 :] | ||||
|                 buf = buf[:idx] | ||||
| 
 | ||||
|             fdate = "" | ||||
|             lines = buf.decode("utf-8").split("\n") | ||||
|             for line in lines: | ||||
|                 m = re_row.match(line) | ||||
|                 if not m: | ||||
|                     continue | ||||
| 
 | ||||
|                 furl, fname, day, smon, year, hm, fsize = m.groups() | ||||
|                 fname = furl.rstrip("/").split("/")[-1] | ||||
|                 fname = unquote(fname) | ||||
|                 fname = fname.decode("wtf-8") | ||||
|                 if bad_good: | ||||
|                     fname = enwin(fname) | ||||
| 
 | ||||
|                 sz = 1 | ||||
|                 ts = 60 * 60 * 24 * 2 | ||||
|                 try: | ||||
|                     fdate = "%s-%02d-%s %s" % (year, MON3[smon], day, hm) | ||||
|                     ts = calendar.timegm(time.strptime(fdate, "%Y-%m-%d %H:%M")) | ||||
|                     sz = -1 if fsize == "-" else int(fsize) | ||||
|                 except: | ||||
|                     info("bad HTML or OS %r %r\n%r", fdate, fsize, line) | ||||
| 
 | ||||
|                 if sz == -1: | ||||
|                     ret[fname] = self.stat_dir(ts, 4096) | ||||
|                 else: | ||||
|                     ret[fname] = self.stat_file(ts, sz) | ||||
| 
 | ||||
|         return ret | ||||
| 
 | ||||
|     def parse_iis(self, sck): | ||||
|         # https://nedlasting.miljodirektoratet.no/miljodata/  " 9/28/2024  5:24 AM" | ||||
|         # https://grandcanyon.usgs.gov/photos/Foodbase/CISP/  " 6/29/2012  3:12 PM" | ||||
| 
 | ||||
|         ret = {} | ||||
|         rem = b"" | ||||
|         re_row = self.re_row | ||||
|         re_2nl = self.re_2nl | ||||
| 
 | ||||
|         while True: | ||||
|             buf = sck.read(1024 * 32) | ||||
|             if not buf: | ||||
|                 break | ||||
| 
 | ||||
|             buf = rem + buf | ||||
|             rem = b"" | ||||
|             buf = re_2nl.sub(b"\n", buf) | ||||
|             idx = buf.rfind(b"\n") | ||||
|             if idx >= 0: | ||||
|                 rem = buf[idx + 1 :] | ||||
|                 buf = buf[:idx] | ||||
| 
 | ||||
|             lines = buf.decode("utf-8").split("\n") | ||||
|             for line in lines: | ||||
|                 m = re_row.match(line) | ||||
|                 if not m: | ||||
|                     continue | ||||
| 
 | ||||
|                 mon, day, year, hm, xm, fsize, furl, fname = m.groups() | ||||
|                 fname = furl.rstrip("/").split("/")[-1] | ||||
|                 fname = unquote(fname) | ||||
|                 fname = fname.decode("wtf-8") | ||||
|                 if bad_good: | ||||
|                     fname = enwin(fname) | ||||
| 
 | ||||
|                 sz = 1 | ||||
|                 ts = 60 * 60 * 24 * 2 | ||||
|                 fdate = "%s-%s-%s %s %s" % (year, mon, day, hm, xm) | ||||
|                 try: | ||||
|                     ts = calendar.timegm(time.strptime(fdate, "%Y-%m-%d %H:%M %p")) | ||||
|                     sz = -1 if fsize == "<dir>" else int(fsize) | ||||
|                 except: | ||||
|                     info("bad HTML or OS %r %r\n%r", fdate, fsize, line) | ||||
| 
 | ||||
|                 if sz == -1: | ||||
|                     ret[fname] = self.stat_dir(ts, 4096) | ||||
|                 else: | ||||
|                     ret[fname] = self.stat_file(ts, sz) | ||||
| 
 | ||||
|         return ret | ||||
| 
 | ||||
|     #################################################################### | ||||
|     #################################################################### | ||||
|     # !rm.no> | ||||
| 
 | ||||
|     def stat_dir(self, ts, sz=4096): | ||||
|     def stat_dir(self, ts, sz): | ||||
|         return { | ||||
|             "st_mode": stat.S_IFDIR | 0o555, | ||||
|             "st_uid": 1000, | ||||
| @ -497,8 +637,6 @@ class Gateway(object): | ||||
| 
 | ||||
| class CPPF(Operations): | ||||
|     def __init__(self, ar): | ||||
|         self.use_ns = True | ||||
| 
 | ||||
|         self.gw = Gateway(ar) | ||||
|         self.junk_fh_ctr = 3 | ||||
|         self.t_dircache = ar.cds | ||||
| @ -839,17 +977,17 @@ class CPPF(Operations): | ||||
|             path = enwin(path)  # windows occasionally decodes f0xx to xx | ||||
| 
 | ||||
|         path = path.strip("/") | ||||
|         if not path: | ||||
|             ret = self.gw.stat_dir(time.time(), 4096) | ||||
|             dbg("/=%r", ret) | ||||
|             return ret | ||||
| 
 | ||||
|         try: | ||||
|             dirpath, fname = path.rsplit("/", 1) | ||||
|         except: | ||||
|             dirpath = "" | ||||
|             fname = path | ||||
| 
 | ||||
|         if not path: | ||||
|             ret = self.gw.stat_dir(time.time()) | ||||
|             dbg("=%r", ret) | ||||
|             return ret | ||||
| 
 | ||||
|         cn = self.get_cached_dir(dirpath) | ||||
|         if cn: | ||||
|             dents = cn.data | ||||
| @ -858,7 +996,9 @@ class CPPF(Operations): | ||||
|             dents = self._readdir(dirpath) | ||||
| 
 | ||||
|         try: | ||||
|             return dents[fname] | ||||
|             ret = dents[fname] | ||||
|             dbg("s=%r", ret) | ||||
|             return ret | ||||
|         except: | ||||
|             pass | ||||
| 
 | ||||
| @ -974,6 +1114,11 @@ def main(): | ||||
|     global info, dbg, is_dbg | ||||
|     time.strptime("19970815", "%Y%m%d")  # python#7980 | ||||
| 
 | ||||
|     ver = "{0}, v{1}".format(S_BUILD_DT, S_VERSION) | ||||
|     if "--version" in sys.argv: | ||||
|         print("partyfuse", ver) | ||||
|         return | ||||
| 
 | ||||
|     # filecache helps for reads that are ~64k or smaller; | ||||
|     #   windows likes to use 4k and 64k so cache is important, | ||||
|     #   linux generally does 128k so the cache is still nice, | ||||
| @ -996,6 +1141,7 @@ def main(): | ||||
| 
 | ||||
|     ap = argparse.ArgumentParser( | ||||
|         formatter_class=TheArgparseFormatter, | ||||
|         description="mount a copyparty server as a local filesystem -- " + ver, | ||||
|         epilog="example:" + ex_pre + ex_pre.join(examples), | ||||
|     ) | ||||
|     # fmt: off | ||||
| @ -1003,6 +1149,10 @@ def main(): | ||||
|     ap.add_argument("local_path", type=str, help=where + " to mount it on") | ||||
|     ap.add_argument("-a", metavar="PASSWORD", help="password or $filepath") | ||||
| 
 | ||||
|     # !rm.yes> | ||||
|     ap.add_argument("--html", metavar="TYPE", default="", help="which HTML parser to use; cpp, nginx, iis") | ||||
|     # !rm.no> | ||||
| 
 | ||||
|     ap2 = ap.add_argument_group("https/TLS") | ||||
|     ap2.add_argument("-te", metavar="PEMFILE", help="certificate to expect/verify") | ||||
|     ap2.add_argument("-td", action="store_true", help="disable certificate check") | ||||
|  | ||||
| @ -167,7 +167,7 @@ RUN     mv /z/fusepy-3.0.1/fuse.py /z/dist/f1 \ | ||||
|         && python3 /z/uncomment.py f1 \ | ||||
|         && sed -ri '/self.__critical_exception = e/d' f1 \ | ||||
|         && awk '/^log =/{s=0} !s; /^from traceback im/{s=1;print"from functools import partial";print"basestring = str"}' <f1 >f2 \ | ||||
|         && awk '/LoggingMixIn:/{exit} /Time as floating/{s=3}--s<0' <f2 >f1 \ | ||||
|         && awk '/LoggingMixIn:/{exit} --s<0;/self.use_ns = getattr/{s=7}' <f2 >f1 \ | ||||
|         && awk "/if _machine =/{s=0} /'(mips|ppc|ppc64)'/{s=1} !s" <f1 >f2 \ | ||||
|         && rm f1 && mv f2 fuse.py | ||||
| 
 | ||||
|  | ||||
		Loading…
	
		Reference in New Issue
	
	Block a user
	 ed
						ed