-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathimghash.cpp
178 lines (143 loc) · 4.78 KB
/
imghash.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
#include <cstdint>
#include <exception>
#include <fstream>
#include <iomanip>
#include <string>
#include <tuple>
#include <utility>

#include <boost/filesystem.hpp>
#include <cxxopts.hpp>
#include <spdlog/spdlog.h>
#include <indicators/progress_bar.hpp>
#include <indicators/cursor_control.hpp>

#include "dct_perceptual_hasher.hpp"
#include "hash_delimeter.hpp"
// Project namespace; presumably where PHash and DCTHasher (used unqualified
// below) are declared — TODO confirm against the project headers.
using namespace imgdupl;
// Concrete hasher type used by every function in this file. The meaning of the
// two template arguments is defined by DCTHasher itself, not here.
using Hasher = DCTHasher<50, 64 * 2>;
// Short alias for Boost.Filesystem.
namespace fs = boost::filesystem;
// Forward declarations of the helpers defined further down in this file.
// calc_image_hash is used by process_file before its definition appears.
std::pair<bool, PHash> calc_image_hash(const std::string& image_file, const Hasher& hasher);
void process_file(const fs::path& file, const Hasher& hasher, std::ofstream& result);
void process_directory(std::string directory, const Hasher& hasher, std::ofstream& result);
size_t get_files_count(std::string directory);
/// Writes a perceptual hash to a stream as its elements joined with ",".
///
/// @param out   stream to write to
/// @param phash hash whose elements are formatted and joined
/// @return      `out`, so that insertions can be chained
std::ostream&
operator<<(std::ostream& out, const PHash& phash)
{
    const auto joined = fmt::format("{}", fmt::join(phash, ","));
    return out << joined;
}
/// Hashes a single image and appends one "<hash>\t<path>" line to `result`.
///
/// When the hash cannot be computed nothing is written; the failure is
/// reported through spdlog instead.
///
/// @param file   path of the image to hash
/// @param hasher hasher forwarded to calc_image_hash
/// @param result output stream receiving the line
void
process_file(const fs::path& file, const Hasher& hasher, std::ofstream& result)
{
    const std::string image_path = file.string();

    bool ok = false;
    PHash hash;
    std::tie(ok, hash) = calc_image_hash(image_path, hasher);

    if (!ok) {
        spdlog::error("failed at '{}'", image_path);
        return;
    }

    // std::endl also flushes, so each finished line reaches the file right away.
    result << hash << '\t' << image_path << std::endl;
}
size_t
get_files_count(std::string directory)
{
size_t count = 0;
fs::path root(directory);
fs::recursive_directory_iterator cur_iter(root), end_iter;
for (; cur_iter != end_iter; ++cur_iter) {
if (fs::exists(cur_iter->path()) && fs::is_regular_file(cur_iter->path())) {
count++;
}
}
return count;
}
void
process_directory(std::string directory, const Hasher& hasher, std::ofstream& result)
{
auto total = get_files_count(directory);
if (total == 0) {
return;
}
// clang-format off
indicators::ProgressBar pb {
indicators::option::BarWidth {80},
indicators::option::Start {"["},
indicators::option::Fill {"="},
indicators::option::Lead {">"},
indicators::option::Remainder {" "},
indicators::option::End {"]"},
indicators::option::ForegroundColor {indicators::Color::white},
indicators::option::FontStyles {std::vector<indicators::FontStyle> {indicators::FontStyle::bold}},
indicators::option::MaxProgress{total}
};
// clang-format on
fs::path root(directory);
fs::recursive_directory_iterator cur_iter(root), end_iter;
for (size_t processed = 0; cur_iter != end_iter; ++cur_iter) {
const auto& file = cur_iter->path();
if (fs::exists(file) && fs::is_regular_file(file)) {
process_file(file, hasher, result);
processed++;
pb.set_option(indicators::option::PostfixText {
"Processing: " + std::to_string(processed) + "/" + std::to_string(total)});
pb.tick();
}
}
indicators::show_console_cursor(true);
}
std::pair<bool, PHash>
calc_image_hash(const std::string& image_file, const Hasher& hasher)
{
PHash phash;
bool status = true;
Magick::Image image;
try {
image.read(image_file.c_str());
image.trim();
} catch (Magick::Exception&) {
status = false;
goto end;
}
std::tie(status, phash) = hasher.hash(image);
end:
return std::make_pair(status, phash);
}
int
main(int argc, char** argv)
{
cxxopts::Options args(argv[0], "print clusters of perceptually similar images");
// clang-format off
args.add_options()
("h,help","show this help and exit")
("d,data", "path to a single image file or a directory with images", cxxopts::value<std::string>())
("r,result", "result file", cxxopts::value<std::string>())
;
// clang-format on
auto opts = args.parse(argc, argv);
if (opts.count("help")) {
fmt::print("{}\n", args.help());
return EXIT_SUCCESS;
}
if ((opts.count("data") == 0 && opts.count("d") == 0) || (opts.count("result") == 0 && opts.count("r") == 0)) {
spdlog::error("you have to specify --data and --result parameters. Run with --help for help.");
return EXIT_FAILURE;
}
Magick::InitializeMagick(nullptr);
std::ofstream result(opts["result"].as<std::string>().c_str());
if (result.fail()) {
spdlog::error("couldn't open file '{}' for writting!", opts["result"].as<std::string>());
return EXIT_FAILURE;
}
Hasher hasher;
auto path = opts["data"].as<std::string>();
if (fs::exists(path)) {
if (fs::is_regular_file(path)) {
process_file(path, hasher, result);
} else if (fs::is_directory(path)) {
process_directory(path, hasher, result);
}
} else {
spdlog::error("'{}' does not exist!\n", path);
return EXIT_FAILURE;
}
return EXIT_SUCCESS;
}