mirror of
				https://github.com/9001/copyparty.git
				synced 2025-10-31 04:32:20 -06:00 
			
		
		
		
	
		
			
				
	
	
		
			306 lines
		
	
	
		
			8.5 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable file
		
	
	
	
	
			
		
		
	
	
			306 lines
		
	
	
		
			8.5 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable file
		
	
	
	
	
| #!/usr/bin/env python3
 | |
| 
 | |
| import os
 | |
| import sys
 | |
| import time
 | |
| import shutil
 | |
| import sqlite3
 | |
| import argparse
 | |
| 
 | |
| DB_VER1 = 3
 | |
| DB_VER2 = 6
 | |
| 
 | |
| BY_PATH = None
 | |
| NC = None
 | |
| 
 | |
| 
 | |
| def die(msg):
 | |
|     print("\033[31m\n" + msg + "\n\033[0m")
 | |
|     sys.exit(1)
 | |
| 
 | |
| 
 | |
| def read_ver(db):
 | |
|     for tab in ["ki", "kv"]:
 | |
|         try:
 | |
|             c = db.execute(r"select v from {} where k = 'sver'".format(tab))
 | |
|         except:
 | |
|             continue
 | |
| 
 | |
|         rows = c.fetchall()
 | |
|         if rows:
 | |
|             return int(rows[0][0])
 | |
| 
 | |
|     return "corrupt"
 | |
| 
 | |
| 
 | |
| def ls(db):
 | |
|     nfiles = next(db.execute("select count(w) from up"))[0]
 | |
|     ntags = next(db.execute("select count(w) from mt"))[0]
 | |
|     print(f"{nfiles} files")
 | |
|     print(f"{ntags} tags\n")
 | |
| 
 | |
|     print("number of occurrences for each tag,")
 | |
|     print(" 'x' = file has no tags")
 | |
|     print(" 't:mtp' = the mtp flag (file not mtp processed yet)")
 | |
|     print()
 | |
|     for k, nk in db.execute("select k, count(k) from mt group by k order by k"):
 | |
|         print(f"{nk:9} {k}")
 | |
| 
 | |
| 
 | |
| def compare(n1, d1, n2, d2, verbose):
 | |
|     nt = next(d1.execute("select count(w) from up"))[0]
 | |
|     n = 0
 | |
|     miss = 0
 | |
|     for w1, rd, fn in d1.execute("select w, rd, fn from up"):
 | |
|         n += 1
 | |
|         if n % 25_000 == 0:
 | |
|             m = f"\033[36mchecked {n:,} of {nt:,} files in {n1} against {n2}\033[0m"
 | |
|             print(m)
 | |
| 
 | |
|         if rd.split("/", 1)[0] == ".hist":
 | |
|             continue
 | |
| 
 | |
|         if BY_PATH:
 | |
|             q = "select w from up where rd = ? and fn = ?"
 | |
|             hit = d2.execute(q, (rd, fn)).fetchone()
 | |
|         else:
 | |
|             q = "select w from up where substr(w,1,16) = ? and +w = ?"
 | |
|             hit = d2.execute(q, (w1[:16], w1)).fetchone()
 | |
| 
 | |
|         if not hit:
 | |
|             miss += 1
 | |
|             if verbose:
 | |
|                 print(f"file in {n1} missing in {n2}: [{w1}] {rd}/{fn}")
 | |
| 
 | |
|     print(f" {miss} files in {n1} missing in {n2}\n")
 | |
| 
 | |
|     nt = next(d1.execute("select count(w) from mt"))[0]
 | |
|     n = 0
 | |
|     miss = {}
 | |
|     nmiss = 0
 | |
|     for w1s, k, v in d1.execute("select * from mt"):
 | |
| 
 | |
|         n += 1
 | |
|         if n % 100_000 == 0:
 | |
|             m = f"\033[36mchecked {n:,} of {nt:,} tags in {n1} against {n2}, so far {nmiss} missing tags\033[0m"
 | |
|             print(m)
 | |
| 
 | |
|         q = "select w, rd, fn from up where substr(w,1,16) = ?"
 | |
|         w1, rd, fn = d1.execute(q, (w1s,)).fetchone()
 | |
|         if rd.split("/", 1)[0] == ".hist":
 | |
|             continue
 | |
| 
 | |
|         if BY_PATH:
 | |
|             q = "select w from up where rd = ? and fn = ?"
 | |
|             w2 = d2.execute(q, (rd, fn)).fetchone()
 | |
|         else:
 | |
|             q = "select w from up where substr(w,1,16) = ? and +w = ?"
 | |
|             w2 = d2.execute(q, (w1s, w1)).fetchone()
 | |
| 
 | |
|         if w2:
 | |
|             w2 = w2[0]
 | |
| 
 | |
|         v2 = None
 | |
|         if w2:
 | |
|             v2 = d2.execute(
 | |
|                 "select v from mt where w = ? and +k = ?", (w2[:16], k)
 | |
|             ).fetchone()
 | |
|             if v2:
 | |
|                 v2 = v2[0]
 | |
| 
 | |
|         # if v != v2 and v2 and k in [".bpm", "key"] and n2 == "src":
 | |
|         #    print(f"{w} [{rd}/{fn}] {k} = [{v}] / [{v2}]")
 | |
| 
 | |
|         if v2 is not None:
 | |
|             if k.startswith("."):
 | |
|                 try:
 | |
|                     diff = abs(float(v) - float(v2))
 | |
|                     if diff > float(v) / 0.9:
 | |
|                         v2 = None
 | |
|                     else:
 | |
|                         v2 = v
 | |
|                 except:
 | |
|                     pass
 | |
| 
 | |
|             if v != v2:
 | |
|                 v2 = None
 | |
| 
 | |
|         if v2 is None:
 | |
|             nmiss += 1
 | |
|             try:
 | |
|                 miss[k] += 1
 | |
|             except:
 | |
|                 miss[k] = 1
 | |
| 
 | |
|             if verbose:
 | |
|                 print(f"missing in {n2}: [{w1}] [{rd}/{fn}] {k} = {v}")
 | |
| 
 | |
|     for k, v in sorted(miss.items()):
 | |
|         if v:
 | |
|             print(f"{n1} has {v:7} more {k:<7} tags than {n2}")
 | |
| 
 | |
|     print(f"in total, {nmiss} missing tags in {n2}\n")
 | |
| 
 | |
| 
 | |
| def copy_mtp(d1, d2, tag, rm):
 | |
|     nt = next(d1.execute("select count(w) from mt where k = ?", (tag,)))[0]
 | |
|     n = 0
 | |
|     ncopy = 0
 | |
|     nskip = 0
 | |
|     for w1s, k, v in d1.execute("select * from mt where k = ?", (tag,)):
 | |
|         n += 1
 | |
|         if n % 25_000 == 0:
 | |
|             m = f"\033[36m{n:,} of {nt:,} tags checked, so far {ncopy} copied, {nskip} skipped\033[0m"
 | |
|             print(m)
 | |
| 
 | |
|         q = "select w, rd, fn from up where substr(w,1,16) = ?"
 | |
|         w1, rd, fn = d1.execute(q, (w1s,)).fetchone()
 | |
|         if rd.split("/", 1)[0] == ".hist":
 | |
|             continue
 | |
| 
 | |
|         if BY_PATH:
 | |
|             q = "select w from up where rd = ? and fn = ?"
 | |
|             w2 = d2.execute(q, (rd, fn)).fetchone()
 | |
|         else:
 | |
|             q = "select w from up where substr(w,1,16) = ? and +w = ?"
 | |
|             w2 = d2.execute(q, (w1s, w1)).fetchone()
 | |
| 
 | |
|         if not w2:
 | |
|             continue
 | |
| 
 | |
|         w2s = w2[0][:16]
 | |
|         hit = d2.execute("select v from mt where w = ? and +k = ?", (w2s, k)).fetchone()
 | |
|         if hit:
 | |
|             hit = hit[0]
 | |
| 
 | |
|         if hit != v:
 | |
|             if NC and hit is not None:
 | |
|                 nskip += 1
 | |
|                 continue
 | |
| 
 | |
|             ncopy += 1
 | |
|             if hit is not None:
 | |
|                 d2.execute("delete from mt where w = ? and +k = ?", (w2s, k))
 | |
| 
 | |
|             d2.execute("insert into mt values (?,?,?)", (w2s, k, v))
 | |
|             if rm:
 | |
|                 d2.execute("delete from mt where w = ? and +k = 't:mtp'", (w2s,))
 | |
| 
 | |
|     d2.commit()
 | |
|     print(f"copied {ncopy} {tag} tags over, skipped {nskip}")
 | |
| 
 | |
| 
 | |
| def examples():
 | |
|     print(
 | |
|         """
 | |
| # clearing the journal
 | |
| ./dbtool.py up2k.db
 | |
| 
 | |
| # copy tags ".bpm" and "key" from old.db to up2k.db, and remove the mtp flag from matching files (so copyparty won't run any mtps on it)
 | |
| ./dbtool.py -ls up2k.db
 | |
| ./dbtool.py -src old.db up2k.db -cmp
 | |
| ./dbtool.py -src old.v3 up2k.db -rm-mtp-flag -copy key
 | |
| ./dbtool.py -src old.v3 up2k.db -rm-mtp-flag -copy .bpm -vac
 | |
| 
 | |
| """
 | |
|     )
 | |
| 
 | |
| 
 | |
| def main():
 | |
|     global NC, BY_PATH  # pylint: disable=global-statement
 | |
|     os.system("")
 | |
|     print()
 | |
| 
 | |
|     ap = argparse.ArgumentParser()
 | |
|     ap.add_argument("db", help="database to work on")
 | |
|     ap.add_argument("-h2", action="store_true", help="show examples")
 | |
|     ap.add_argument("-src", metavar="DB", type=str, help="database to copy from")
 | |
| 
 | |
|     ap2 = ap.add_argument_group("informational / read-only stuff")
 | |
|     ap2.add_argument("-v", action="store_true", help="verbose")
 | |
|     ap2.add_argument("-ls", action="store_true", help="list summary for db")
 | |
|     ap2.add_argument("-cmp", action="store_true", help="compare databases")
 | |
| 
 | |
|     ap2 = ap.add_argument_group("options which modify target db")
 | |
|     ap2.add_argument("-copy", metavar="TAG", type=str, help="mtp tag to copy over")
 | |
|     ap2.add_argument(
 | |
|         "-rm-mtp-flag",
 | |
|         action="store_true",
 | |
|         help="when an mtp tag is copied over, also mark that file as done, so copyparty won't run any mtps on those files",
 | |
|     )
 | |
|     ap2.add_argument("-vac", action="store_true", help="optimize DB")
 | |
| 
 | |
|     ap2 = ap.add_argument_group("behavior modifiers")
 | |
|     ap2.add_argument(
 | |
|         "-nc",
 | |
|         action="store_true",
 | |
|         help="no-clobber; don't replace/overwrite existing tags",
 | |
|     )
 | |
|     ap2.add_argument(
 | |
|         "-by-path",
 | |
|         action="store_true",
 | |
|         help="match files based on location rather than warks (content-hash), use this if the databases have different wark salts",
 | |
|     )
 | |
| 
 | |
|     ar = ap.parse_args()
 | |
|     if ar.h2:
 | |
|         examples()
 | |
|         return
 | |
| 
 | |
|     NC = ar.nc
 | |
|     BY_PATH = ar.by_path
 | |
| 
 | |
|     for v in [ar.db, ar.src]:
 | |
|         if v and not os.path.exists(v):
 | |
|             die("database must exist")
 | |
| 
 | |
|     db = sqlite3.connect(ar.db)
 | |
|     ds = sqlite3.connect(ar.src) if ar.src else None
 | |
| 
 | |
|     # revert journals
 | |
|     for d, p in [[db, ar.db], [ds, ar.src]]:
 | |
|         if not d:
 | |
|             continue
 | |
| 
 | |
|         pj = "{}-journal".format(p)
 | |
|         if not os.path.exists(pj):
 | |
|             continue
 | |
| 
 | |
|         d.execute("create table foo (bar int)")
 | |
|         d.execute("drop table foo")
 | |
| 
 | |
|     if ar.copy:
 | |
|         db.close()
 | |
|         shutil.copy2(ar.db, "{}.bak.dbtool.{:x}".format(ar.db, int(time.time())))
 | |
|         db = sqlite3.connect(ar.db)
 | |
| 
 | |
|     for d, n in [[ds, "src"], [db, "dst"]]:
 | |
|         if not d:
 | |
|             continue
 | |
| 
 | |
|         ver = read_ver(d)
 | |
|         if ver == "corrupt":
 | |
|             die("{} database appears to be corrupt, sorry")
 | |
| 
 | |
|         iver = int(ver)
 | |
|         if iver < DB_VER1 or iver > DB_VER2:
 | |
|             m = f"{n} db is version {ver}, this tool only supports versions between {DB_VER1} and {DB_VER2}, please upgrade it with copyparty first"
 | |
|             die(m)
 | |
| 
 | |
|     if ar.ls:
 | |
|         ls(db)
 | |
| 
 | |
|     if ar.cmp:
 | |
|         if not ds:
 | |
|             die("need src db to compare against")
 | |
| 
 | |
|         compare("src", ds, "dst", db, ar.v)
 | |
|         compare("dst", db, "src", ds, ar.v)
 | |
| 
 | |
|     if ar.copy:
 | |
|         copy_mtp(ds, db, ar.copy, ar.rm_mtp_flag)
 | |
| 
 | |
| 
 | |
| if __name__ == "__main__":
 | |
|     main()
 |