#!/usr/bin/python3 import ast,hashlib,os,random,re,secrets,shutil,subprocess,sys,tempfile from uuid import uuid4 import sqlite3 as sql from base64 import b64encode,b64decode from Cryptodome.Cipher import AES ROOT_DIR=os.getcwd() # The directory where all directories and files of the index are located INDEX_FILE=ROOT_DIR+"/index.db" # The database file LINUX_APP_STARTER="xdg-open" # The command which opens the files in the default application ENCRYPT=True # True or False; Whether the default is to encrypt the file or to save it as a plain file class database(): def __init__(self,filepath = INDEX_FILE): self.connection=None self.crsr=None if not os.path.exists(filepath) : self.create_database(filepath) else: self.connection = sql.connect(filepath) self.crsr = self.connection.cursor() def add_index(self,vallist,collist=""): collist=self.collist if not collist else collist # compile the options into a command for the SQLite database colstring=",".join(collist) valstring='"{}"'.format('","'.join(vallist)) self.crsr.execute("""INSERT INTO {table} ({cols}) VALUES ({vals}); """.format(table=self.name,cols=colstring,vals=valstring)) self.connection.commit() def create_database(self, filepath): # create the database and tables self.connection = sql.connect(filepath) self.crsr = self.connection.cursor() sqlcommand = """CREATE TABLE FILES( FILE TEXT PRIMARY KEY NOT NULL, HASH TEXT NOT NULL, TITLE TEXT , SOURCE TEXT , CATEGORY TEXT NOT NULL, TAGS TEXT , CONTENT TEXT ); """ self.crsr.execute(sqlcommand) sqlcommand = """CREATE TABLE CATEGORY( NAME TEXT PRIMARY KEY NOT NULL, ALIAS TEXT ); """ self.crsr.execute(sqlcommand) sqlcommand = """CREATE TABLE TAGS( NAME TEXT PRIMARY KEY NOT NULL, ALIAS TEXT ); """ self.crsr.execute(sqlcommand) sqlcommand = """CREATE TABLE ENCRYPTION( NAME TEXT PRIMARY KEY NOT NULL, CIPHER TEXT NOT NULL, PASSWORD TEXT ); """ self.crsr.execute(sqlcommand) def delete_index(self,typ,item): self.crsr.execute("DELETE FROM {} WHERE {}='{}'".format(self.name,typ,item)) self.connection.commit() return True def get_col(self,column = "*"): # get the column of some table. If no options given, return all columns self.crsr.execute("SELECT {} FROM {}".format(column,self.name)) tres=self.crsr.fetchall() res=[] for i in tres: res.append(i) # if the table is empty, return "". if not res: res="" return res def get_item(self,column,where,specific=False): tres=[] if column == "*": for col in self.collist: temp_list=[] if specific: self.crsr.execute("SELECT * FROM {} WHERE {}='{}'".format(self.name,col,where)) else: self.crsr.execute("SELECT * FROM {} WHERE {} GLOB '*{}*'".format(self.name,col,where)) temp_list=self.crsr.fetchall() if temp_list: for i in temp_list: if not i in tres: tres.append(i) else: if specific: self.crsr.execute("SELECT * FROM {} WHERE {}='{}'".format(self.name,column,where)) else: self.crsr.execute("SELECT * FROM {} WHERE {} GLOB '*{}*'".format(self.name,column,where)) tres=self.crsr.fetchall() n=0 res=[] for i in tres: if not i in res: res.append(i) # if the table is empty, return "". if not res: return [""] return res def select_index(self,sel_list,quiet=False): if quiet == "strict": return sel_list if sel_list: res=[] if len(sel_list) > 1: n=0 print("Found several matches:") for tup in sel_list: temp_list=[] for j in tup: temp_list.append(j) print("Match [{}]".format(n)) if self.name == "FILES": print("\tTitle:\t ",temp_list[2]) name=ctb.get_alias(temp_list[4]) if name != "": category=name else: category=temp_list[4] print("\tCategory:",category) tags_list=[] for tag in temp_list[5].split(","): name=ttb.get_alias(tag) if name != "": tag=name tags_list.append(tag) print("\tTags:\t ",",".join(tags_list)) else: print("\tName:\t ",temp_list[0]) print("\tAlias:\t ",temp_list[1]) print("\tDescription: ",temp_list[2]) n+=1 eingabe=input("Enter number(s) (0-{}; '*' for all entries): ".format(n-1)) if not eingabe: return [""] num_list=[] if re.match('[*]',eingabe): for i in range(0,n): num_list.append(i) else: num_list=eingabe.split(' ') nminus=0 for i in num_list: if int(i) >= n: print("The number {} is too big!".format(i)) nminus+=1 continue res.append(sel_list[int(i)]) if not quiet: print("\nFinal match{}:".format("es" if len(num_list)-nminus > 1 else "")) else: if sel_list[0] == "": if not quiet == "strict": print("No matching entry found!") return [""] res=sel_list if not quiet == "strict": print("\nMatch found!") return res return 1 def sql_compare_list(self,typ,firstlist,secondlist,specific=False): if isinstance(firstlist, str): firstlist=firstlist.split(" ") if firstlist: n=0 temp_list=[] if not secondlist: n=0 for i in self.get_col(typ): aliases=[] if i == "" and self.name == "FILES": print("NO ENTRIES IN THE INDEX!") return "" # get aliases for the checks, but only for unspecific search! if self.name == "FILES": if typ == "*": for tag in i[5].split(","): aliases.append(ttb.get_alias(tag)) aliases.append(ctb.get_alias(i[4])) elif typ == "TAGS": for tag in i[0].split(","): aliases.append(ttb.get_alias(tag)) elif typ == "CATEGORY": aliases.append(ctb.get_alias(i[0])) istr=" ".join(i).lower() + " " + " ".join(aliases).lower() success=0 for j in firstlist: j=j.lower() if specific: for part in i: part=part.lower() if j == part: if not success == -1: success=1 if success == 0: success=-1 else: if j in istr: if not success == -1: success=1 else: success=-1 if success > 0: if typ == "*": temp_list.append(self.get_item("*",i[0],specific)[0]) else: for k in self.get_item(typ,i[0],specific): if not k in temp_list: temp_list.append(k) n+=1 else: if not secondlist[0] == "": for i in secondlist: for j in firstlist: if j in i: temp_list.append(secondlist[n]) n+=1 else: return secondlist if not temp_list: return [""] return temp_list return secondlist def update_index(self,typ,update,where,val): self.crsr.execute("UPDATE {} SET {}='{}' WHERE {}='{}'".format(self.name,typ,update,where,val)) self.connection.commit() return True class enctable(database): # https://www.thesecuritybuddy.com/cryptography-and-python/aes-encryption-and-decryption-using-pycryptodome-module-in-python/ def __init__(self, filepath = INDEX_FILE): self.name="ENCRYPTION" self.collist=["NAME","CIPHER","PASSWORD"] super().__init__(filepath) def derive_key_and_iv(self, password, salt, key_length, iv_length): #derive key and IV from password and salt. d = d_i = b'' while len(d) < key_length + iv_length: #d_i = hashlib.md5(d_i + str.encode(password) + salt).digest() #obtain the md5 hash value d_i = hashlib.md5(d_i + password + salt).digest() #obtain the md5 hash value d += d_i return d[:key_length], d[key_length:key_length+iv_length] def encrypt(self, in_file, out_filepath, password="", key_length=32): print("Encrypting...") in_file=open(in_file,"rb") out_uuid=out_filepath.split("/")[-1].split(".")[0] out_file=open(f"{out_filepath}","wb") bs = AES.block_size #16 bytes if not password: password = os.urandom(bs*random.randint(1,4)) if self.get_item("NAME", out_uuid)[0] == "": self.add_index([out_uuid.split(".")[0],"AES",b64encode(password).decode()]) else: password_list=self.get_item("NAME", in_uuid.split(".")[0]) if password_list[0] != "": if len(password_list) == 1: password=b64decode(password_list[0][2].encode()) else: print("ERROR: MULTIPLE PASSWORD ENTRIES FOUND!") return False #print("ERROR: ENTRY FOR UUID {} ALREADY EXISTS!".format(out_uuid)) #return False salt = os.urandom(bs) #return a string of random bytes key, iv = self.derive_key_and_iv(password, salt, key_length, bs) cipher = AES.new(key, AES.MODE_CBC, iv) out_file.write(salt) finished = False while not finished: chunk = in_file.read(1024 * bs) if len(chunk) == 0 or len(chunk) % bs != 0:#final block/chunk is padded before encryption padding_length = (bs - len(chunk) % bs) or bs chunk += str.encode(padding_length * chr(padding_length)) finished = True out_file.write(cipher.encrypt(chunk)) out_file.close() in_file.close() def is_encrypted(self, uuid): if self.get_item("NAME", uuid)[0] != "": return True return False def decrypt(self, in_filepath, out_file=None, password="", key_length=32): print("Decrypting...") in_file=open(f"{in_filepath}","rb") # open the encrypted file in_uuid=in_filepath.split("/")[-1] if not out_file: out_temp=tempfile.mkstemp(prefix="image-index-") filepath=out_temp[1] out_file=open(filepath,"wb") #out_file=temp_file else: filepath=out_file out_file=open(out_file,"wb") if not password: password_list=self.get_item("NAME", in_uuid.split(".")[0]) if password_list[0] != "": if len(password_list) == 1: password=b64decode(password_list[0][2].encode()) else: print("ERROR: MULTIPLE PASSWORD ENTRIES FOUND!") return False else: print("ERROR: NO PASSWORD FOUND FOR DECRYPTION!") return False bs = AES.block_size salt = in_file.read(bs) key, iv = self.derive_key_and_iv(password, salt, key_length, bs) cipher = AES.new(key, AES.MODE_CBC, iv) next_chunk = '' finished = False while not finished: chunk, next_chunk = next_chunk, cipher.decrypt(in_file.read(1024 * bs)) if len(next_chunk) == 0: padding_length = chunk[-1] chunk = chunk[:-padding_length] finished = True out_file.write(bytes(x for x in chunk)) out_file.close() in_file.close() return filepath def delete_index(self, uuid): super().delete_index("NAME", uuid) print("UUID",uuid) return True class metatable(database): def __init__(self,typ,filepath = INDEX_FILE): self.name=typ.upper() self.collist=["NAME","ALIAS"] super().__init__(filepath) def add_index(self,val,alias,randhex=None): if not randhex: randhex=get_randhex() if self.name == "TAGS" or bencrypt: val=get_randhex(8) else: val=re.sub('[ ,?!/\\:!*"<>|]', '', val) super().add_index([val[:8] + "-" + randhex,alias]) def check_index(self,typ): res=[] for i in tb.get_col(typ): success=0 for j in self.get_col("NAME"): if j[0].split(".")[0] in i[0]: success=1 if not i[0] in res and success == 0: res.append(i[0]) return res def get_alias(self,arg): if not arg: return "" selection=self.search_index(arg,"strict") item=selection[0] if item[0] != "": alias=item[1] else: alias = "" return alias def get_name(self,arg): if not arg: return "" selection=self.search_index(arg,"strict") item=selection[0] if not item: name="" else: name=item[0] return name def search_index(self,args,quiet=True): selection=[] selection=self.sql_compare_list("*", [args], selection,True) if selection[0] == "": slist=args.split(" ") selection=self.sql_compare_list("*", slist, [],False) if len(selection) > 1: print("Please enter a more specific search query!") return "" selection=self.select_index(selection,quiet) return selection def update_index(self, typ, update, where, val): selection=self.search_index(update,"strict") if selection[0] != "" and len(selection) >= 1: print("One entry is already called {}!".format(update)) return False else: super().update_index(typ, update, where, val) return True class filestable(database): def __init__(self,filepath = INDEX_FILE): self.name="FILES" self.collist=["FILE","HASH","TITLE","SOURCE","CATEGORY","TAGS","CONTENT"] super().__init__(filepath) def add_index(self,filepath,category="default",title="",source="",tags="",content=""): filehash=self.get_hash(filepath) # make hash of file before copy if filehash in str(self.get_col("HASH")): print("This file already has an entry!") return False n=0 # get the name of the category from the meta table if not category: category="default" name=ctb.get_name(category) if name: category=name else: ctb.add_index(category.lower(),category) category=ctb.get_name(category) # get the name of the tags from the meta table tags_list=[] for tag in tags.split(','): name=ttb.get_name(tag) if name != "": tag=name else: ttb.add_index(tag.lower(),tag) tags_list.append(ttb.get_name(tag)) tags=",".join(tags_list) fileext=os.path.splitext(filepath)[-1] fileuuid=str(uuid4()) filename=fileuuid+fileext if not os.path.exists("{}/{}".format(ROOT_DIR,category)): os.makedirs("{}/{}".format(ROOT_DIR,category)) # try to copy the file, return if error. try: if bencrypt: etb.encrypt(filepath, f"{ROOT_DIR}/{category}/{fileuuid}.enc") else: shutil.copy(filepath,f"{ROOT_DIR}/{category}/{filename}") except Exception as e: print(e) print("COULDN'T COPY FILE TO DESTINATION!") return False vallist=[filename,filehash,title,source,category,tags,content] super().add_index(vallist) return True def check_index(self): hash_list=[] path_list=[] enc_num=0 for i in self.get_col(): filename=i[0] fileuuid=filename.split(".")[0] category=i[4] filehash1=i[1] if etb.is_encrypted(fileuuid): enc_num+=1 filename=f"{fileuuid}.enc" filepath="{}/{}/{}".format(ROOT_DIR,category,filename) if not os.path.exists(filepath): path_list.append(i) if etb.is_encrypted(fileuuid): continue try: filehash2=self.get_hash(filepath) if not filehash1 == filehash2: hash_list.append(i) except Exception: path_list.append(i) print(f"Encrypted files: {enc_num}; hashes not checked.") return hash_list,path_list def delete_index(self,sel_list): item_list=self.get_item(self.collist[1],sel_list[1]) if len(item_list) == 1: item=item_list[0] category=item[4] filename=item[0] fileuuid=os.path.splitext(filename)[0] super().delete_index(self.collist[1],sel_list[1]) etb.delete_index(fileuuid) return True def replace_file(self,in_filepath,item): filehash=self.get_hash(in_filepath) category=item[4] filename=item[0] if filehash in str(self.get_col("HASH")): print("This file already has an entry!") return False fileuuid=os.path.splitext(filename)[-1] out_filepath=f"{ROOT_DIR}/{category}/{filename}" out_encpath=f"{ROOT_DIR}/{category}/{fileuuid}.enc" try: if etb.is_encrypted(fileuuid): etb.encrypt(in_filepath, out_encpath) else: shutil.copy(in_filepath, out_filepath) except Exception as e: print("ERROR:",e) return False super().update_index("HASH", filehash, self.collist[0], filename) return True def update_index(self,typ,update,sel_list,omnipotent=False): typ=typ.upper() if typ in ["FILE","HASH"] and not omnipotent: print("This type can't be changed!") return False category=sel_list[4] filehash=sel_list[1] filename=sel_list[0] fileuuid=sel_list[0].split(".")[0] if typ in ["CATEGORY"]: # get alias of category name=ctb.get_name(update) if name != "": update=name else: ctb.add_index(update.lower(),update) update=ctb.get_name(update) if not os.path.exists("{}/{}".format(ROOT_DIR,update)): os.makedirs("{}/{}".format(ROOT_DIR,update)) if etb.is_encrypted(fileuuid): filename=f"{fileuuid}.enc" shutil.move("{}/{}/{}".format(ROOT_DIR,category,filename), "{}/{}/{}".format(ROOT_DIR,update,filename)) if typ in ["TAGS"]: tags_list=[] if update[0][0] == "+": for tag in sel_list[5].split(","): tags_list.append(tag) for tag in update[1:].split(","): name=ttb.get_name(tag) if name == "": ttb.add_index(tag.lower(), tag) name=ttb.get_name(tag) tags_list.append(name) elif update[0][0] == "-": for tag in sel_list[5].split(","): success=0 for i in update[1:].split(","): name=ttb.get_name(i) if name == "": ttb.add_index(tag.lower(), tag) name=ttb.get_name(tag) if name == tag: success = -1 if success >= 0: tags_list.append(tag) else: for tag in update.split(","): name=ttb.get_name(tag) if name != "": tags_list.append(name) else: ttb.add_index(tag.lower(), tag) tags_list.append(ttb.get_name(tag)) update=",".join(tags_list) super().update_index(typ, update, "HASH", filehash) def get_hash(self,filepath): # https://www.quickprogrammingtips.com/python/how-to-calculate-md5-hash-of-a-file-in-python.html md5_hash = hashlib.md5() # hash selected file in chunks of 4KiB, read the link above if you ask why. with open(filepath,"rb") as f: for byte_block in iter(lambda: f.read(4096),b""): md5_hash.update(byte_block) f.close() return str(md5_hash.hexdigest()) def search_index(self,args,quiet=False): snext="all" shash=[] alle=[] category=[] sfile=[] content=[] source=[] title=[] tags=[] for arg in args: arg=arg.lower() if re.match('^[-]\w{1}$', arg): if arg == "-h": snext="hash" elif arg == "-a": # technically unneeded because of else at the end snext="all" elif arg == "-c": snext="category" elif arg == "-f": snext="file" elif arg == "-i": # Inhalt snext="content" elif arg == "-s": snext="source" elif arg == "-t": snext="title" elif arg == "-g": # Gruppe snext="tags" else: snext="all" continue if snext == "hash": shash.append(arg) elif snext == "all": alle.append(arg) elif snext == "category": name=ctb.get_name(arg) if name != "": arg=name category.append(arg) elif snext == "file": sfile.append(arg) elif snext == "content": content.append(arg) elif snext == "source": source.append(arg) elif snext == "title": title.append(arg) elif snext == "tags": '''if "," in arg: for tag in arg.split(","): name=ttb.get_name(arg) if name != "": arg=name tags.append(arg) else: name=ttb.get_name(arg) print("name",name) if name != "": arg=name''' tags.append(arg) else: alle.append(arg) # search for the right items selection=[] selection=self.sql_compare_list("*",alle,selection) selection=self.sql_compare_list("HASH",shash,selection) selection=self.sql_compare_list("CATEGORY",category,selection) selection=self.sql_compare_list("FILE",sfile,selection) selection=self.sql_compare_list("CONTENT",content,selection) selection=self.sql_compare_list("SOURCE",source,selection) selection=self.sql_compare_list("TITLE",title,selection) selection=self.sql_compare_list("TAGS",tags,selection) return self.select_index(selection,quiet) def get_randhex(count=5): randhex="" for i in range(count): randhex+=random.choice("0123456789abcdef") return randhex def add(args): if len(args) >= 6: tb.add_index(args[0],args[1],args[2],args[3],args[4],args[5]) return n=0 for i in ["Filepath","Category","Title","Source","Tags","Content"]: i=i.title() try: print("{}: {}".format(i,args[n])) except Exception: extra="" if i == "Tags": extra=" (Separate with ',')" eingabe = input("{}{}: ".format(i,extra)) if i in ["Category"] and not eingabe: print("{} set to 'default'".format(i)) eingabe="default" args.append(eingabe) if i in ["Filepath"]: filehash=tb.get_hash(args[n]) if filehash in str(tb.get_col("HASH")): print("This file already exists!") return False if not args[n]: print("{} must not be empty!".format(i)) return False else: if not os.path.isfile(args[n]): print(" The file '{}' doesn't exist or is not a file!".format(args[n])) return False n+=1 success=tb.add_index(args[0],args[1],args[2],args[3],args[4],args[5]) if success: print("Added '{}'!".format(args[2])) def copy(args): if len(args) == 0: out_filepath=input() sel_list=search([]) elif len(args) == 1: out_filepath=args[0] sel_list=search([]) else: out_filepath=args[0] sel_list=search(args[1:]) for item in sel_list: filename=item[0] out_fileext=os.path.splitext(filename)[-1] title=item[2] category=item[4] fileuuid=os.path.splitext(filename)[0] extra="" if os.path.exists(out_filepath): if os.path.isfile(out_filepath): if re.match('[nN].*', input(f"The file on path {out_filepath} already exists!\nDo you want to overwrite it? [Y/n] ")): return False if os.path.isdir(out_filepath): print("found DIRECTORY") extra=f"/{title}{out_fileext}" if etb.is_encrypted(fileuuid): etb.decrypt(f"{ROOT_DIR}/{category}/{fileuuid}.enc",f"{out_filepath}{extra}") else: shutil.copy(f"{ROOT_DIR}/{category}/{filename}", f"{out_filepath}{extra}") print(f"Copied '{title}' to {out_filepath}!") def check(args): success=0 hash_list,temp_list=tb.check_index() path_list=[] hashcheck=pathcheck=True verbose=False for arg in args: if arg == "-v": verbose=True elif arg == "-f": hashcheck=False elif arg == "-h": pathcheck=False if hash_list: print("{} file{} faulty!".format(len(hash_list),"s are" if len(hash_list) > 1 else " is")) success=-1 if verbose: for tup in hash_list: print("Title: ",tup[2]) print("\tCategory:",tup[4]) print("\tFilename:",tup[0]) for i in temp_list: if not i in path_list: path_list.append(i) if path_list: print("{} file{} missing!".format(len(path_list),"s are" if len(path_list) > 1 else " is")) success=-1 if verbose: for tup in path_list: print("Title: ",tup[2]) print("\tCategory:",tup[4]) print("\tFilename:",tup[0]) if success >= 0: print("Everything is good!") if hash_list and hashcheck: eingabe=input("Do you want to remove the faulty files? [y/N]: ") if re.match('[yY]',eingabe): print("Removing faulty files...") repair(hash_list) if path_list and pathcheck: eingabe=input("Do you want to remove the orphaned entries? [Y/n]: ") if not re.match('[nN]',eingabe): print("Removing orphaned entries...") repair(path_list) def delete(args): selection=search(args,True) for sel in selection: if sel[0] != "": try: category=sel[4] filename=sel[0] fileuuid=os.path.splitext(filename)[0] if etb.is_encrypted(fileuuid): filename=f"{fileuuid}.enc" os.remove("{}/{}/{}".format(ROOT_DIR,category,filename)) except Exception as e: print(e) print("Couldn't delete a file!") return 1 tb.delete_index(sel) print("Deleted '{}'!".format(sel[2])) def help(args): syntax=False for arg in args: if not syntax and not re.match('[mM]',arg): print("SYNTAX: image-index