diff --git a/hydit/data_loader/csv2arrow.py b/hydit/data_loader/csv2arrow.py index 10518e2..b2e364c 100644 --- a/hydit/data_loader/csv2arrow.py +++ b/hydit/data_loader/csv2arrow.py @@ -19,7 +19,7 @@ def parse_data(data): with open(img_path, "rb") as fp: image = fp.read() - md5 = hashlib.md5(fp.read()).hexdigest() + md5 = hashlib.md5(image).hexdigest() with Image.open(img_path) as f: width, height = f.size @@ -85,4 +85,4 @@ def make_arrow(csv_root, dataset_root, start_id=0, end_id=-1): csv_root = sys.argv[1] output_arrow_data_path = sys.argv[2] pool = Pool(500) - make_arrow(csv_root, output_arrow_data_path) \ No newline at end of file + make_arrow(csv_root, output_arrow_data_path)