toto10's picture
Upload folder using huggingface_hub (#1)
34097e9
raw
history blame
25.1 kB
import hashlib
import json
import os
import sqlite3
from modules import scripts
from PIL import Image
version = 6
path_recorder_file = os.path.join(scripts.basedir(), "path_recorder.txt")
aes_cache_file = os.path.join(scripts.basedir(), "aes_scores.json")
exif_cache_file = os.path.join(scripts.basedir(), "exif_data.json")
ranking_file = os.path.join(scripts.basedir(), "ranking.json")
archive = os.path.join(scripts.basedir(), "archive")
db_file = os.path.join(scripts.basedir(), "wib.sqlite3")
np = "Negative prompt: "
st = "Steps: "
timeout = 30
def create_filehash(cursor):
cursor.execute('''
CREATE TABLE IF NOT EXISTS filehash (
file TEXT PRIMARY KEY,
hash TEXT,
created TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
updated TIMESTAMP DEFAULT CURRENT_TIMESTAMP
)
''')
cursor.execute('''
CREATE TRIGGER filehash_tr
AFTER UPDATE ON filehash
BEGIN
UPDATE filehash SET updated = CURRENT_TIMESTAMP WHERE file = OLD.file;
END;
''')
return
def create_work_files(cursor):
cursor.execute('''
CREATE TABLE IF NOT EXISTS work_files (
file TEXT PRIMARY KEY
)
''')
return
def create_db(cursor):
cursor.execute('''
CREATE TABLE IF NOT EXISTS db_data (
key TEXT PRIMARY KEY,
value TEXT
)
''')
cursor.execute('''
CREATE TABLE IF NOT EXISTS path_recorder (
path TEXT PRIMARY KEY,
depth INT,
path_display TEXT,
created TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
updated TIMESTAMP DEFAULT CURRENT_TIMESTAMP
)
''')
cursor.execute('''
CREATE TRIGGER path_recorder_tr
AFTER UPDATE ON path_recorder
BEGIN
UPDATE path_recorder SET updated = CURRENT_TIMESTAMP WHERE path = OLD.path;
END;
''')
cursor.execute('''
CREATE TABLE IF NOT EXISTS exif_data (
file TEXT,
key TEXT,
value TEXT,
created TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
updated TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
PRIMARY KEY (file, key)
)
''')
cursor.execute('''
CREATE INDEX IF NOT EXISTS exif_data_key ON exif_data (key)
''')
cursor.execute('''
CREATE TRIGGER exif_data_tr
AFTER UPDATE ON exif_data
BEGIN
UPDATE exif_data SET updated = CURRENT_TIMESTAMP WHERE file = OLD.file AND key = OLD.key;
END;
''')
cursor.execute('''
CREATE TABLE IF NOT EXISTS ranking (
file TEXT PRIMARY KEY,
name TEXT,
ranking TEXT,
created TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
updated TIMESTAMP DEFAULT CURRENT_TIMESTAMP
)
''')
cursor.execute('''
CREATE INDEX IF NOT EXISTS ranking_name ON ranking (name)
''')
cursor.execute('''
CREATE TRIGGER ranking_tr
AFTER UPDATE ON ranking
BEGIN
UPDATE ranking SET updated = CURRENT_TIMESTAMP WHERE file = OLD.file;
END;
''')
create_filehash(cursor)
create_work_files(cursor)
return
def migrate_path_recorder(cursor):
if os.path.exists(path_recorder_file):
try:
with open(path_recorder_file) as f:
# json-version
path_recorder = json.load(f)
for path, values in path_recorder.items():
path = os.path.realpath(path)
depth = values["depth"]
path_display = f"{path} [{depth}]"
cursor.execute('''
INSERT INTO path_recorder (path, depth, path_display)
VALUES (?, ?, ?)
''', (path, depth, path_display))
except json.JSONDecodeError:
with open(path_recorder_file) as f:
# old txt-version
path = f.readline().rstrip("\n")
while len(path) > 0:
path = os.path.realpath(path)
cursor.execute('''
INSERT INTO path_recorder (path, depth, path_display)
VALUES (?, ?, ?)
''', (path, 0, f"{path} [0]"))
path = f.readline().rstrip("\n")
return
def update_exif_data(cursor, file, info):
prompt = "0"
negative_prompt = "0"
key_values = "0: 0"
if info != "0":
info_list = info.split("\n")
prompt = ""
negative_prompt = ""
key_values = ""
for info_item in info_list:
if info_item.startswith(st):
key_values = info_item
elif info_item.startswith(np):
negative_prompt = info_item.replace(np, "")
else:
if prompt == "":
prompt = info_item
else:
# multiline prompts
prompt = f"{prompt}\n{info_item}"
if key_values != "":
key_value_pairs = []
key_value = ""
quote_open = False
for char in key_values + ",":
key_value += char
if char == '"':
quote_open = not quote_open
if char == "," and not quote_open:
try:
k, v = key_value.strip(" ,").split(": ")
except ValueError:
k = key_value.strip(" ,").split(": ")[0]
v = ""
key_value_pairs.append((k, v))
key_value = ""
try:
cursor.execute('''
INSERT INTO exif_data (file, key, value)
VALUES (?, ?, ?)
''', (file, "prompt", prompt))
except sqlite3.IntegrityError:
# Duplicate, delete all "file" entries and try again
cursor.execute('''
DELETE FROM exif_data
WHERE file = ?
''', (file,))
cursor.execute('''
INSERT INTO exif_data (file, key, value)
VALUES (?, ?, ?)
''', (file, "prompt", prompt))
cursor.execute('''
INSERT INTO exif_data (file, key, value)
VALUES (?, ?, ?)
''', (file, "negative_prompt", negative_prompt))
for (key, value) in key_value_pairs:
try:
cursor.execute('''
INSERT INTO exif_data (file, key, value)
VALUES (?, ?, ?)
''', (file, key, value))
except sqlite3.IntegrityError:
pass
return
def migrate_exif_data(cursor):
if os.path.exists(exif_cache_file):
with open(exif_cache_file, 'r') as file:
exif_cache = json.load(file)
for file, info in exif_cache.items():
file = os.path.realpath(file)
update_exif_data(cursor, file, info)
return
def migrate_ranking(cursor):
if os.path.exists(ranking_file):
with open(ranking_file, 'r') as file:
ranking = json.load(file)
for file, info in ranking.items():
if info != "None":
file = os.path.realpath(file)
name = os.path.basename(file)
cursor.execute('''
INSERT INTO ranking (file, name, ranking)
VALUES (?, ?, ?)
''', (file, name, info))
return
def get_hash(file):
# Get filehash without exif info
try:
image = Image.open(file)
except Exception as e:
print(e)
hash = hashlib.sha512(image.tobytes()).hexdigest()
image.close()
return hash
def migrate_filehash(cursor, version):
if version <= "4":
create_filehash(cursor)
cursor.execute('''
SELECT file
FROM ranking
''')
for (file,) in cursor.fetchall():
if os.path.exists(file):
hash = get_hash(file)
cursor.execute('''
INSERT INTO filehash (file, hash)
VALUES (?, ?)
''', (file, hash))
return
def migrate_work_files(cursor):
create_work_files(cursor)
return
def update_db_data(cursor, key, value):
cursor.execute('''
INSERT OR REPLACE
INTO db_data (key, value)
VALUES (?, ?)
''', (key, value))
return
def get_version():
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
SELECT value
FROM db_data
WHERE key = 'version'
''',)
db_version = cursor.fetchone()
return db_version
def migrate_path_recorder_dirs(cursor):
cursor.execute('''
SELECT path, path_display
FROM path_recorder
''')
for (path, path_display) in cursor.fetchall():
real_path = os.path.realpath(path)
if path != real_path:
update_from = path
update_to = real_path
try:
cursor.execute('''
UPDATE path_recorder
SET path = ?,
path_display = ? || SUBSTR(path_display, LENGTH(?) + 1)
WHERE path = ?
''', (update_to, update_to, update_from, update_from))
except sqlite3.IntegrityError as e:
# these are double keys, because the same file can be in the db with different path notations
(e_msg,) = e.args
if e_msg.startswith("UNIQUE constraint"):
cursor.execute('''
DELETE FROM path_recorder
WHERE path = ?
''', (update_from,))
else:
raise
return
def migrate_exif_data_dirs(cursor):
cursor.execute('''
SELECT file
FROM exif_data
''')
for (filepath,) in cursor.fetchall():
(path, file) = os.path.split(filepath)
real_path = os.path.realpath(path)
if path != real_path:
update_from = filepath
update_to = os.path.join(real_path, file)
try:
cursor.execute('''
UPDATE exif_data
SET file = ?
WHERE file = ?
''', (update_to, update_from))
except sqlite3.IntegrityError as e:
# these are double keys, because the same file can be in the db with different path notations
(e_msg,) = e.args
if e_msg.startswith("UNIQUE constraint"):
cursor.execute('''
DELETE FROM exif_data
WHERE file = ?
''', (update_from,))
else:
raise
return
def migrate_ranking_dirs(cursor, db_version):
if db_version == "1":
cursor.execute('''
ALTER TABLE ranking
ADD COLUMN name TEXT
''')
cursor.execute('''
CREATE INDEX IF NOT EXISTS ranking_name ON ranking (name)
''')
cursor.execute('''
SELECT file, ranking
FROM ranking
''')
for (filepath, ranking) in cursor.fetchall():
if filepath == "" or ranking == "None":
cursor.execute('''
DELETE FROM ranking
WHERE file = ?
''', (filepath,))
else:
(path, file) = os.path.split(filepath)
real_path = os.path.realpath(path)
name = file
update_from = filepath
update_to = os.path.join(real_path, file)
try:
cursor.execute('''
UPDATE ranking
SET file = ?,
name = ?
WHERE file = ?
''', (update_to, name, update_from))
except sqlite3.IntegrityError as e:
# these are double keys, because the same file can be in the db with different path notations
(e_msg,) = e.args
if e_msg.startswith("UNIQUE constraint"):
cursor.execute('''
DELETE FROM ranking
WHERE file = ?
''', (update_from,))
else:
raise
return
def check():
if not os.path.exists(db_file):
conn, cursor = transaction_begin()
print("Image Browser: Creating database")
create_db(cursor)
update_db_data(cursor, "version", version)
migrate_path_recorder(cursor)
migrate_exif_data(cursor)
migrate_ranking(cursor)
migrate_filehash(cursor, str(version))
transaction_end(conn, cursor)
print("Image Browser: Database created")
db_version = get_version()
conn, cursor = transaction_begin()
if db_version[0] <= "2":
# version 1 database had mixed path notations, changed them all to abspath
# version 2 database still had mixed path notations, because of windows short name, changed them all to realpath
print(f"Image Browser: Upgrading database from version {db_version[0]} to version {version}")
migrate_path_recorder_dirs(cursor)
migrate_exif_data_dirs(cursor)
migrate_ranking_dirs(cursor, db_version[0])
if db_version[0] <= "4":
migrate_filehash(cursor, db_version[0])
if db_version[0] <= "5":
migrate_work_files(cursor)
update_db_data(cursor, "version", version)
print(f"Image Browser: Database upgraded from version {db_version[0]} to version {version}")
transaction_end(conn, cursor)
return version
def load_path_recorder():
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
SELECT path, depth, path_display
FROM path_recorder
''')
path_recorder = {path: {"depth": depth, "path_display": path_display} for path, depth, path_display in cursor.fetchall()}
return path_recorder
def select_ranking(file):
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
SELECT ranking
FROM ranking
WHERE file = ?
''', (file,))
ranking_value = cursor.fetchone()
if ranking_value is None:
return_ranking = "None"
else:
(return_ranking,) = ranking_value
return return_ranking
def update_ranking(file, ranking):
name = os.path.basename(file)
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
if ranking == "None":
cursor.execute('''
DELETE FROM ranking
WHERE file = ?
''', (file,))
else:
cursor.execute('''
INSERT OR REPLACE
INTO ranking (file, name, ranking)
VALUES (?, ?, ?)
''', (file, name, ranking))
hash = get_hash(file)
cursor.execute('''
INSERT OR REPLACE
INTO filehash (file, hash)
VALUES (?, ?)
''', (file, hash))
return
def select_image_reward_score(cursor, file):
cursor.execute('''
SELECT value
FROM exif_data
WHERE file = ?
AND key = 'ImageRewardScore'
''', (file,))
image_reward_score = cursor.fetchone()
if image_reward_score is None:
return_image_reward_score = None
else:
(return_image_reward_score,) = image_reward_score
cursor.execute('''
SELECT value
FROM exif_data
WHERE file = ?
AND key = 'prompt'
''', (file,))
image_reward_prompt = cursor.fetchone()
if image_reward_prompt is None:
return_image_reward_prompt = None
else:
(return_image_reward_prompt,) = image_reward_prompt
return return_image_reward_score, return_image_reward_prompt
def update_image_reward_score(cursor, file, image_reward_score):
cursor.execute('''
INSERT OR REPLACE
INTO exif_data (file, key, value)
VALUES (?, ?, ?)
''', (file, "ImageRewardScore", image_reward_score))
return
def update_path_recorder(path, depth, path_display):
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
INSERT OR REPLACE
INTO path_recorder (path, depth, path_display)
VALUES (?, ?, ?)
''', (path, depth, path_display))
return
def update_path_recorder(path, depth, path_display):
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
INSERT OR REPLACE
INTO path_recorder (path, depth, path_display)
VALUES (?, ?, ?)
''', (path, depth, path_display))
return
def delete_path_recorder(path):
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
DELETE FROM path_recorder
WHERE path = ?
''', (path,))
return
def update_path_recorder_mult(cursor, update_from, update_to):
cursor.execute('''
UPDATE path_recorder
SET path = ?,
path_display = ? || SUBSTR(path_display, LENGTH(?) + 1)
WHERE path = ?
''', (update_to, update_to, update_from, update_from))
return
def update_exif_data_mult(cursor, update_from, update_to):
update_from = update_from + os.path.sep
update_to = update_to + os.path.sep
cursor.execute('''
UPDATE exif_data
SET file = ? || SUBSTR(file, LENGTH(?) + 1)
WHERE file like ? || '%'
''', (update_to, update_from, update_from))
return
def update_ranking_mult(cursor, update_from, update_to):
update_from = update_from + os.path.sep
update_to = update_to + os.path.sep
cursor.execute('''
UPDATE ranking
SET file = ? || SUBSTR(file, LENGTH(?) + 1)
WHERE file like ? || '%'
''', (update_to, update_from, update_from))
return
def delete_exif_0(cursor):
cursor.execute('''
DELETE FROM exif_data
WHERE file IN (
SELECT file FROM exif_data a
WHERE value = '0'
GROUP BY file
HAVING COUNT(*) = (SELECT COUNT(*) FROM exif_data WHERE file = a.file)
)
''')
return
def get_ranking_by_file(cursor, file):
cursor.execute('''
SELECT ranking
FROM ranking
WHERE file = ?
''', (file,))
ranking_value = cursor.fetchone()
return ranking_value
def get_ranking_by_name(cursor, name):
cursor.execute('''
SELECT file, ranking
FROM ranking
WHERE name = ?
''', (name,))
ranking_value = cursor.fetchone()
if ranking_value is not None:
(file, _) = ranking_value
cursor.execute('''
SELECT hash
FROM filehash
WHERE file = ?
''', (file,))
hash_value = cursor.fetchone()
else:
hash_value = None
return ranking_value, hash_value
def insert_ranking(cursor, file, ranking, hash):
name = os.path.basename(file)
cursor.execute('''
INSERT INTO ranking (file, name, ranking)
VALUES (?, ?, ?)
''', (file, name, ranking))
cursor.execute('''
INSERT OR REPLACE
INTO filehash (file, hash)
VALUES (?, ?)
''', (file, hash))
return
def replace_ranking(cursor, file, alternate_file, hash):
name = os.path.basename(file)
cursor.execute('''
UPDATE ranking
SET file = ?
WHERE file = ?
''', (file, alternate_file))
cursor.execute('''
INSERT OR REPLACE
INTO filehash (file, hash)
VALUES (?, ?)
''', (file, hash))
return
def transaction_begin():
conn = sqlite3.connect(db_file, timeout=timeout)
conn.isolation_level = None
cursor = conn.cursor()
cursor.execute("BEGIN")
return conn, cursor
def transaction_end(conn, cursor):
cursor.execute("COMMIT")
conn.close()
return
def update_exif_data_by_key(cursor, file, key, value):
cursor.execute('''
INSERT OR REPLACE
INTO exif_data (file, key, value)
VALUES (?, ?, ?)
''', (file, key, value))
return
def select_prompts(file):
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
SELECT key, value
FROM exif_data
WHERE file = ?
AND KEY in ('prompt', 'negative_prompt')
''', (file,))
rows = cursor.fetchall()
prompt = ""
neg_prompt = ""
for row in rows:
(key, value) = row
if key == 'prompt':
prompt = value
elif key == 'negative_prompt':
neg_prompt = value
return prompt, neg_prompt
def load_exif_data(exif_cache):
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
SELECT file, group_concat(
case when key = 'prompt' or key = 'negative_prompt' then key || ': ' || value || '\n'
else key || ': ' || value
end, ', ') AS string
FROM (
SELECT *
FROM exif_data
ORDER BY
CASE WHEN key = 'prompt' THEN 0
WHEN key = 'negative_prompt' THEN 1
ELSE 2 END,
key
)
GROUP BY file
''')
rows = cursor.fetchall()
for row in rows:
exif_cache[row[0]] = row[1]
return exif_cache
def load_exif_data_by_key(cache, key1, key2):
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
SELECT file, value
FROM exif_data
WHERE key IN (?, ?)
''', (key1, key2))
rows = cursor.fetchall()
for row in rows:
cache[row[0]] = row[1]
return cache
def get_exif_dirs():
with sqlite3.connect(db_file, timeout=timeout) as conn:
cursor = conn.cursor()
cursor.execute('''
SELECT file
FROM exif_data
''')
rows = cursor.fetchall()
dirs = {}
for row in rows:
dir = os.path.dirname(row[0])
dirs[dir] = dir
return dirs
def fill_work_files(cursor, fileinfos):
filenames = [x[0] for x in fileinfos]
cursor.execute('''
DELETE
FROM work_files
''')
sql = '''
INSERT INTO work_files (file)
VALUES (?)
'''
cursor.executemany(sql, [(x,) for x in filenames])
return
def filter_aes(cursor, fileinfos, aes_filter_min_num, aes_filter_max_num, score_type):
if score_type == "aesthetic_score":
key = "aesthetic_score"
else:
key = "ImageRewardScore"
cursor.execute('''
DELETE
FROM work_files
WHERE file not in (
SELECT file
FROM exif_data b
WHERE file = b.file
AND b.key = ?
AND CAST(b.value AS REAL) between ? and ?
)
''', (key, aes_filter_min_num, aes_filter_max_num))
cursor.execute('''
SELECT file
FROM work_files
''')
rows = cursor.fetchall()
fileinfos_dict = {pair[0]: pair[1] for pair in fileinfos}
fileinfos_new = []
for (file,) in rows:
if fileinfos_dict.get(file) is not None:
fileinfos_new.append((file, fileinfos_dict[file]))
return fileinfos_new
def filter_ranking(cursor, fileinfos, ranking_filter, ranking_filter_min_num, ranking_filter_max_num):
if ranking_filter == "None":
cursor.execute('''
DELETE
FROM work_files
WHERE file IN (
SELECT file
FROM ranking b
WHERE file = b.file
)
''')
elif ranking_filter == "Min-max":
cursor.execute('''
DELETE
FROM work_files
WHERE file NOT IN (
SELECT file
FROM ranking b
WHERE file = b.file
AND b.ranking BETWEEN ? AND ?
)
''', (ranking_filter_min_num, ranking_filter_max_num))
else:
cursor.execute('''
DELETE
FROM work_files
WHERE file NOT IN (
SELECT file
FROM ranking b
WHERE file = b.file
AND b.ranking = ?
)
''', (ranking_filter,))
cursor.execute('''
SELECT file
FROM work_files
''')
rows = cursor.fetchall()
fileinfos_dict = {pair[0]: pair[1] for pair in fileinfos}
fileinfos_new = []
for (file,) in rows:
if fileinfos_dict.get(file) is not None:
fileinfos_new.append((file, fileinfos_dict[file]))
return fileinfos_new
def select_x_y(cursor, file):
cursor.execute('''
SELECT value
FROM exif_data
WHERE file = ?
AND key = 'Size'
''', (file,))
size_value = cursor.fetchone()
if size_value is None:
x = "?"
y = "?"
else:
(size,) = size_value
parts = size.split("x")
x = parts[0]
y = parts[1]
return x, y