import hashlib import os import subprocess import sys from pathlib import Path from pymongo import MongoClient def _execute_exiftool(img_file: str) -> dict: res = subprocess.run( ['exiftool', img_file], capture_output=True, text=True, ) exif_metadata = {} for line in res.stdout.splitlines(): parts = line.split(':', 1) exif_metadata[parts[0].strip().lower().replace(' ', '_')] = parts[1].strip() return exif_metadata if __name__ == '__main__': # Authenticate against MongoDB server mongo = MongoClient(os.environ['MONGO_URI']) database = mongo.exif_database collection = database.pictures pictures_metadata = [] for file in Path(sys.argv[1]).rglob("*.ARW"): filename = os.fsdecode(file) print(filename) picture_metadata = _execute_exiftool(filename) pictures_metadata.append(picture_metadata) # Append MongoDB identifier picture_metadata['_id'] = hashlib.sha1(filename.lower().encode('utf-8')).hexdigest() picture_metadata['path'] = sys.argv[1] # Insert into MongoDB collection.insert_many(pictures_metadata)