You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
604 lines
21 KiB
604 lines
21 KiB
// Copyright (C) 2024-2025 Simon Quigley <tsimonq2@ubuntu.com>
|
|
//
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU General Public License
|
|
// along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
#include "utilities.h"
|
|
|
|
#include "/usr/include/archive.h"
|
|
#include <archive_entry.h>
|
|
#include <fstream>
|
|
#include <iostream>
|
|
#include <filesystem>
|
|
#include <regex>
|
|
#include <zlib.h>
|
|
#include <curl/curl.h>
|
|
#include <sys/stat.h>
|
|
#include <sstream>
|
|
#include <random>
|
|
#include <ranges>
|
|
#include <format>
|
|
#include <unordered_set>
|
|
|
|
bool verbose = false;
|
|
|
|
// Define a semaphore with a maximum of 10 concurrent jobs
|
|
static std::counting_semaphore<10> sem(10);
|
|
|
|
// Job queue and synchronization primitives
|
|
static std::mutex queue_mutex;
|
|
static std::atomic<bool> daemon_running{false};
|
|
|
|
// Function to read the entire content of a file into a string
|
|
std::string read_file(const fs::path& file_path) {
|
|
std::ifstream in_file(file_path, std::ios::binary);
|
|
if (in_file) {
|
|
return std::string((std::istreambuf_iterator<char>(in_file)),
|
|
std::istreambuf_iterator<char>());
|
|
}
|
|
return "";
|
|
}
|
|
|
|
// Function to write a string into a file
|
|
void write_file(const fs::path& file_path, const std::string& content) {
|
|
std::ofstream out_file(file_path, std::ios::binary);
|
|
if (out_file) {
|
|
out_file << content;
|
|
}
|
|
}
|
|
|
|
// Function to perform in-place regex replace on a file
|
|
void regex_replace_in_file(const fs::path& file_path,
|
|
const std::string& pattern,
|
|
const std::string& replacement) {
|
|
std::string content = read_file(file_path);
|
|
content = std::regex_replace(content, std::regex(pattern), replacement);
|
|
write_file(file_path, content);
|
|
}
|
|
|
|
// Function to decompress gzipped files
|
|
std::string decompress_gzip(const fs::path& file_path) {
|
|
gzFile infile = gzopen(file_path.c_str(), "rb");
|
|
if (!infile) return "";
|
|
|
|
std::string decompressed_data;
|
|
char buffer[8192];
|
|
int num_read = 0;
|
|
while ((num_read = gzread(infile, buffer, sizeof(buffer))) > 0) {
|
|
decompressed_data.append(buffer, num_read);
|
|
}
|
|
gzclose(infile);
|
|
return decompressed_data;
|
|
}
|
|
|
|
// Helper function for libcurl write callback
|
|
size_t write_data(void* ptr, size_t size, size_t nmemb, void* stream) {
|
|
FILE* out = static_cast<FILE*>(stream);
|
|
return fwrite(ptr, size, nmemb, out);
|
|
}
|
|
|
|
// Function to download a file with timestamping using libcurl
|
|
void download_file_with_timestamping(const std::string& url,
|
|
const fs::path& output_path,
|
|
const fs::path& log_file_path,
|
|
std::mutex& log_mutex) {
|
|
CURL* curl;
|
|
CURLcode res;
|
|
FILE* fp;
|
|
curl = curl_easy_init();
|
|
if (curl) {
|
|
fs::path temp_file_path = output_path.string() + ".tmp";
|
|
fp = fopen(temp_file_path.c_str(), "wb");
|
|
|
|
if (!fp) {
|
|
std::cerr << "Failed to open file: " << temp_file_path << std::endl;
|
|
curl_easy_cleanup(curl);
|
|
return;
|
|
}
|
|
|
|
// Set curl options for downloading the file
|
|
curl_easy_setopt(curl, CURLOPT_URL, url.c_str());
|
|
curl_easy_setopt(curl, CURLOPT_WRITEFUNCTION, write_data);
|
|
curl_easy_setopt(curl, CURLOPT_WRITEDATA, fp);
|
|
|
|
// Timestamping: set If-Modified-Since header
|
|
struct stat file_info;
|
|
if (stat(output_path.c_str(), &file_info) == 0) {
|
|
// Set the time condition to If-Modified-Since
|
|
curl_easy_setopt(curl, CURLOPT_TIMECONDITION, CURL_TIMECOND_IFMODSINCE);
|
|
curl_easy_setopt(curl, CURLOPT_TIMEVALUE, file_info.st_mtime);
|
|
}
|
|
|
|
// Perform the file download
|
|
res = curl_easy_perform(curl);
|
|
|
|
// Get the HTTP response code
|
|
long response_code = 0;
|
|
curl_easy_getinfo(curl, CURLINFO_RESPONSE_CODE, &response_code);
|
|
|
|
fclose(fp);
|
|
curl_easy_cleanup(curl);
|
|
|
|
// Log the result and handle the downloaded file
|
|
{
|
|
std::lock_guard<std::mutex> lock(log_mutex);
|
|
std::ofstream log_file(log_file_path, std::ios::app);
|
|
if (res == CURLE_OK && (response_code == 200 || response_code == 201)) {
|
|
fs::rename(temp_file_path, output_path);
|
|
log_file << "Downloaded: " << url << std::endl;
|
|
} else if (response_code == 304) {
|
|
fs::remove(temp_file_path);
|
|
log_file << "Not Modified: " << url << std::endl;
|
|
} else {
|
|
fs::remove(temp_file_path);
|
|
log_file << "Failed to download: " << url << std::endl;
|
|
}
|
|
}
|
|
} else {
|
|
std::cerr << "Failed to initialize CURL." << std::endl;
|
|
}
|
|
}
|
|
|
|
std::filesystem::path create_temp_directory() {
|
|
auto temp_dir = std::filesystem::temp_directory_path() / generate_random_string(32);
|
|
std::filesystem::create_directory(temp_dir);
|
|
return temp_dir;
|
|
}
|
|
|
|
// Function to copy a directory recursively
|
|
void copy_directory(const fs::path& source, const fs::path& destination) {
|
|
if (!std::filesystem::exists(source) || !std::filesystem::is_directory(source)) {
|
|
throw std::runtime_error("Source directory does not exist or is not a directory: " + source.string());
|
|
}
|
|
|
|
// Create the destination directory
|
|
std::filesystem::create_directories(destination);
|
|
|
|
// Copy files and directories recursively
|
|
for (const auto& entry : std::filesystem::recursive_directory_iterator(source)) {
|
|
auto relative_path = std::filesystem::relative(entry.path(), source);
|
|
auto target_path = destination / relative_path;
|
|
|
|
try {
|
|
if (std::filesystem::is_directory(entry)) {
|
|
std::filesystem::create_directory(target_path);
|
|
} else if (std::filesystem::is_regular_file(entry)) {
|
|
std::filesystem::copy(entry, target_path, std::filesystem::copy_options::overwrite_existing);
|
|
}
|
|
} catch (...) {
|
|
continue;
|
|
}
|
|
}
|
|
}
|
|
|
|
// Function to generate a random string of given length
|
|
std::string generate_random_string(size_t length) {
|
|
const std::string chars =
|
|
"abcdefghijklmnopqrstuvwxyz"
|
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
|
|
"0123456789";
|
|
thread_local std::mt19937 rg{std::random_device{}()};
|
|
thread_local std::uniform_int_distribution<> pick(0, chars.size() - 1);
|
|
std::string s;
|
|
s.reserve(length);
|
|
while (length--)
|
|
s += chars[pick(rg)];
|
|
return s;
|
|
}
|
|
|
|
// Function to get current UTC time formatted as per the given format string
|
|
std::string get_current_utc_time(const std::string& format) {
|
|
auto now = std::chrono::system_clock::now();
|
|
std::time_t now_time = std::chrono::system_clock::to_time_t(now);
|
|
std::tm tm_utc;
|
|
gmtime_r(&now_time, &tm_utc);
|
|
char buf[64]; // Ensure sufficient buffer size for different formats
|
|
std::strftime(buf, sizeof(buf), format.c_str(), &tm_utc);
|
|
return std::string(buf);
|
|
}
|
|
|
|
// Function to convert filesystem time to time_t
|
|
std::time_t to_time_t(const fs::file_time_type& ftime) {
|
|
using namespace std::chrono;
|
|
// Convert to system_clock time_point
|
|
auto sctp = time_point_cast<system_clock::duration>(
|
|
ftime - fs::file_time_type::clock::now() + system_clock::now()
|
|
);
|
|
return system_clock::to_time_t(sctp);
|
|
}
|
|
|
|
std::vector<std::string> split_string(const std::string& input, const std::string& delimiter) {
|
|
std::vector<std::string> result;
|
|
size_t start = 0;
|
|
size_t end = 0;
|
|
|
|
while ((end = input.find(delimiter, start)) != std::string::npos) {
|
|
result.emplace_back(input.substr(start, end - start));
|
|
start = end + delimiter.length();
|
|
}
|
|
|
|
// Add the remaining part of the string
|
|
result.emplace_back(input.substr(start));
|
|
return result;
|
|
}
|
|
|
|
std::string remove_suffix(const std::string& input, const std::string& suffix) {
|
|
if (input.size() >= suffix.size() &&
|
|
input.compare(input.size() - suffix.size(), suffix.size(), suffix) == 0) {
|
|
return input.substr(0, input.size() - suffix.size());
|
|
}
|
|
return input; // Return the original string if the suffix doesn't exist
|
|
}
|
|
|
|
// Utility which basically does the following:
|
|
// "noble" (std::string) -> 2504 (int)
|
|
// The bool represents whether this codename is the development release
|
|
std::pair<int, bool> get_version_from_codename(const std::string& codename) {
|
|
std::ifstream file("/usr/share/distro-info/ubuntu.csv");
|
|
if (!file.is_open()) {
|
|
throw std::runtime_error("Failed to open file.");
|
|
}
|
|
|
|
std::string line;
|
|
// Skip the header line
|
|
std::getline(file, line);
|
|
|
|
std::string last_codename;
|
|
int version = 0;
|
|
|
|
while (std::getline(file, line)) {
|
|
std::istringstream iss(line);
|
|
std::string version_str, name, series;
|
|
std::getline(iss, version_str, ',');
|
|
std::getline(iss, name, ',');
|
|
std::getline(iss, series, ',');
|
|
|
|
if (series == codename) {
|
|
version_str.erase(std::remove(version_str.begin(), version_str.end(), '.'),
|
|
version_str.end());
|
|
version = std::stoi(version_str);
|
|
}
|
|
last_codename = series;
|
|
}
|
|
|
|
bool is_last = (codename == last_codename);
|
|
|
|
if (version == 0) {
|
|
throw std::runtime_error("Codename not found.");
|
|
}
|
|
|
|
return {version, is_last};
|
|
}
|
|
|
|
void ensure_git_inited() {
|
|
static std::once_flag git_init_flag;
|
|
std::call_once(git_init_flag, []() {
|
|
git_libgit2_init();
|
|
});
|
|
}
|
|
|
|
void run_task_every(std::stop_token _stop_token, int interval_minutes, std::function<void()> task) {
|
|
if (interval_minutes < 2) interval_minutes = 2;
|
|
std::this_thread::sleep_for(std::chrono::minutes(interval_minutes / 2));
|
|
|
|
while (!_stop_token.stop_requested()) {
|
|
task();
|
|
std::this_thread::sleep_for(std::chrono::minutes(interval_minutes));
|
|
}
|
|
}
|
|
|
|
// Logger function implementations
|
|
void log_info(const std::string &msg) {
|
|
std::cout << "[INFO] " << msg << "\n";
|
|
}
|
|
|
|
void log_warning(const std::string &msg) {
|
|
std::cerr << "[WARNING] " << msg << "\n";
|
|
}
|
|
|
|
void log_error(const std::string &msg) {
|
|
std::cerr << "[ERROR] " << msg << "\n";
|
|
}
|
|
|
|
void log_verbose(const std::string &msg) {
|
|
if (verbose) {
|
|
std::cout << "[VERBOSE] " << msg << "\n";
|
|
}
|
|
}
|
|
|
|
namespace fs = std::filesystem;
|
|
|
|
bool run_command(const std::vector<std::string> &cmd,
|
|
const std::optional<std::filesystem::path> &cwd,
|
|
bool show_output,
|
|
std::shared_ptr<Log> log) {
|
|
if (cmd.empty()) {
|
|
throw std::runtime_error("Command is empty");
|
|
}
|
|
|
|
QProcess process;
|
|
|
|
// Set the working directory if provided
|
|
if (cwd) {
|
|
process.setWorkingDirectory(QString::fromStdString(cwd->string()));
|
|
}
|
|
|
|
// Set up the environment (if needed)
|
|
QProcessEnvironment env = QProcessEnvironment::systemEnvironment();
|
|
process.setProcessEnvironment(env);
|
|
|
|
// Extract executable and arguments
|
|
QString program = QString::fromStdString(cmd[0]);
|
|
QStringList arguments;
|
|
for (size_t i = 1; i < cmd.size(); ++i) {
|
|
arguments << QString::fromStdString(cmd[i]);
|
|
}
|
|
|
|
// Start the command
|
|
process.start(program, arguments);
|
|
if (!process.waitForStarted()) {
|
|
throw std::runtime_error("Failed to start the command: " + program.toStdString());
|
|
}
|
|
|
|
// Stream output while the process is running
|
|
while (process.state() == QProcess::Running) {
|
|
if (process.waitForReadyRead()) {
|
|
QByteArray output = process.readAllStandardOutput();
|
|
QByteArray error = process.readAllStandardError();
|
|
|
|
if (log) {
|
|
log->append(output.toStdString());
|
|
log->append(error.toStdString());
|
|
}
|
|
|
|
if (show_output) {
|
|
std::cout << output.toStdString();
|
|
std::cerr << error.toStdString();
|
|
}
|
|
}
|
|
}
|
|
|
|
// Wait for the process to finish
|
|
process.waitForFinished();
|
|
|
|
// Capture return code and errors
|
|
if (process.exitStatus() != QProcess::NormalExit || process.exitCode() != 0) {
|
|
QByteArray error_output = process.readAllStandardError();
|
|
std::string error_message = "Command failed with exit code: " + std::to_string(process.exitCode());
|
|
if (!error_output.isEmpty()) {
|
|
error_message += "\nError Output: " + error_output.toStdString();
|
|
}
|
|
throw std::runtime_error(error_message);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
// Function to extract excluded files from a copyright file
|
|
std::vector<std::string> extract_files_excluded(const std::string& filepath) {
|
|
std::ifstream file(filepath);
|
|
if (!file.is_open()) {
|
|
throw std::runtime_error("Failed to open file: " + filepath);
|
|
}
|
|
|
|
std::vector<std::string> files_excluded;
|
|
std::string line;
|
|
std::regex files_excluded_pattern(R"(Files-Excluded:\s*(.*))");
|
|
bool in_files_excluded = false;
|
|
|
|
while (std::getline(file, line)) {
|
|
if (std::regex_match(line, files_excluded_pattern)) {
|
|
in_files_excluded = true;
|
|
std::smatch match;
|
|
if (std::regex_search(line, match, files_excluded_pattern) && match.size() > 1) {
|
|
files_excluded.emplace_back(match[1]);
|
|
}
|
|
} else if (in_files_excluded) {
|
|
if (!line.empty() && (line[0] == ' ' || line[0] == '\t')) {
|
|
files_excluded.emplace_back(line.substr(1));
|
|
} else {
|
|
break; // End of Files-Excluded block
|
|
}
|
|
}
|
|
}
|
|
|
|
return files_excluded;
|
|
}
|
|
|
|
// Function to create a tarball
|
|
void create_tarball(const std::string& tarballPath, const std::string& directory, const std::vector<std::string>& exclusions, std::shared_ptr<Log> log) {
|
|
log->append("Creating tarball: " + tarballPath);
|
|
|
|
struct archive* a = archive_write_new();
|
|
if (!a) {
|
|
throw std::runtime_error("Failed to create a new archive.");
|
|
}
|
|
|
|
if (archive_write_add_filter_gzip(a) != ARCHIVE_OK) {
|
|
std::string err = "Failed to add gzip filter: ";
|
|
err += archive_error_string(a);
|
|
archive_write_free(a);
|
|
throw std::runtime_error(err);
|
|
}
|
|
|
|
if (archive_write_set_format_pax_restricted(a) != ARCHIVE_OK) {
|
|
std::string err = "Failed to set format: ";
|
|
err += archive_error_string(a);
|
|
archive_write_free(a);
|
|
throw std::runtime_error(err);
|
|
}
|
|
|
|
if (archive_write_open_filename(a, tarballPath.c_str()) != ARCHIVE_OK) {
|
|
std::string err = "Could not open tarball for writing: ";
|
|
err += archive_error_string(a);
|
|
archive_write_free(a);
|
|
throw std::runtime_error(err);
|
|
}
|
|
|
|
// Initialize a set to track added relative paths to prevent duplication
|
|
std::unordered_set<std::string> added_paths;
|
|
|
|
// Iterate through the directory recursively without following symlinks
|
|
for (auto it = fs::recursive_directory_iterator(
|
|
directory,
|
|
fs::directory_options::skip_permission_denied);
|
|
it != fs::recursive_directory_iterator(); ++it) {
|
|
const auto& path = it->path();
|
|
std::error_code ec;
|
|
|
|
fs::path relative_path = fs::relative(path, directory, ec);
|
|
if (ec) {
|
|
log->append("Failed to compute relative path for: " + path.string() + " Error: " + ec.message());
|
|
continue;
|
|
}
|
|
|
|
// Normalize the relative path to avoid discrepancies
|
|
fs::path normalized_relative_path = relative_path.lexically_normal();
|
|
std::string relative_path_str = normalized_relative_path.string();
|
|
|
|
// Check if this path has already been added
|
|
if (!added_paths.insert(relative_path_str).second) {
|
|
log->append("Duplicate path detected and skipped: " + relative_path_str);
|
|
continue; // Skip adding this duplicate path
|
|
}
|
|
|
|
// Exclusion logic (if any exclusions are provided)
|
|
bool excluded = std::any_of(exclusions.begin(), exclusions.end(), [&relative_path_str](const std::string& exclusion) {
|
|
return relative_path_str.find(exclusion) != std::string::npos;
|
|
});
|
|
if (excluded) { continue; }
|
|
|
|
fs::file_status fstatus = it->symlink_status(ec);
|
|
if (ec) {
|
|
log->append("Failed to get file status for: " + path.string() + " Error: " + ec.message());
|
|
continue;
|
|
}
|
|
|
|
struct archive_entry* entry = archive_entry_new();
|
|
if (!entry) {
|
|
log->append("Failed to create archive entry for: " + path.string());
|
|
archive_write_free(a);
|
|
throw std::runtime_error("Failed to create archive entry.");
|
|
}
|
|
|
|
std::string entry_path = relative_path_str;
|
|
if (fs::is_directory(fstatus)) {
|
|
// Ensure the directory pathname ends with '/'
|
|
if (!entry_path.empty() && entry_path.back() != '/') {
|
|
entry_path += '/';
|
|
}
|
|
archive_entry_set_pathname(entry, entry_path.c_str());
|
|
} else {
|
|
archive_entry_set_pathname(entry, entry_path.c_str());
|
|
}
|
|
|
|
// Set file type, permissions, and size
|
|
if (fs::is_regular_file(fstatus)) {
|
|
// Regular file
|
|
uintmax_t filesize = fs::file_size(path, ec);
|
|
if (ec) {
|
|
log->append("Cannot get file size for: " + path.string() + " Error: " + ec.message());
|
|
archive_entry_free(entry);
|
|
continue;
|
|
}
|
|
archive_entry_set_size(entry, static_cast<off_t>(filesize));
|
|
archive_entry_set_filetype(entry, AE_IFREG);
|
|
archive_entry_set_perm(entry, static_cast<mode_t>(fstatus.permissions()));
|
|
}
|
|
else if (fs::is_symlink(fstatus)) {
|
|
fs::path target = fs::read_symlink(path, ec);
|
|
if (ec) {
|
|
log->append("Cannot read symlink for: " + path.string() + " Error: " + ec.message());
|
|
archive_entry_free(entry);
|
|
continue;
|
|
}
|
|
archive_entry_set_symlink(entry, target.c_str());
|
|
archive_entry_set_filetype(entry, AE_IFLNK);
|
|
archive_entry_set_perm(entry, static_cast<mode_t>(fstatus.permissions()));
|
|
}
|
|
else if (fs::is_directory(fstatus)) {
|
|
archive_entry_set_size(entry, 0);
|
|
archive_entry_set_filetype(entry, AE_IFDIR);
|
|
archive_entry_set_perm(entry, static_cast<mode_t>(fstatus.permissions()));
|
|
}
|
|
else {
|
|
log->append("Unsupported file type for: " + path.string());
|
|
archive_entry_free(entry);
|
|
continue;
|
|
}
|
|
|
|
// Retrieve and set the modification time
|
|
fs::file_time_type ftime = fs::last_write_time(path, ec);
|
|
std::time_t mtime;
|
|
if (ec) {
|
|
log->append("Failed to get last write time for: " + path.string() + " Error: " + ec.message());
|
|
// Obtain current UTC time as fallback
|
|
auto now = std::chrono::system_clock::now();
|
|
mtime = std::chrono::system_clock::to_time_t(now);
|
|
log->append("Setting default mtime (current UTC time) for: " + path.string());
|
|
} else {
|
|
mtime = to_time_t(ftime);
|
|
}
|
|
archive_entry_set_mtime(entry, mtime, 0);
|
|
|
|
if (archive_write_header(a, entry) != ARCHIVE_OK) {
|
|
log->append("Failed to write header for: " + path.string() + " Error: " + archive_error_string(a));
|
|
archive_entry_free(entry);
|
|
continue;
|
|
}
|
|
|
|
if (fs::is_regular_file(fstatus)) {
|
|
std::ifstream fileStream(path, std::ios::binary);
|
|
if (!fileStream) {
|
|
log->append("Failed to open file for reading: " + path.string());
|
|
archive_entry_free(entry);
|
|
continue;
|
|
}
|
|
|
|
const std::size_t bufferSize = 8192;
|
|
char buffer[bufferSize];
|
|
while (fileStream) {
|
|
fileStream.read(buffer, bufferSize);
|
|
std::streamsize bytesRead = fileStream.gcount();
|
|
if (bytesRead > 0) {
|
|
if (archive_write_data(a, buffer, static_cast<size_t>(bytesRead)) < 0) {
|
|
log->append("Failed to write data for: " + path.string() + " Error: " + archive_error_string(a));
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (fileStream.bad()) {
|
|
log->append("Error reading file: " + path.string());
|
|
}
|
|
}
|
|
|
|
archive_entry_free(entry);
|
|
}
|
|
|
|
if (archive_write_close(a) != ARCHIVE_OK) {
|
|
std::string err = "Failed to close archive: ";
|
|
err += archive_error_string(a);
|
|
archive_write_free(a);
|
|
throw std::runtime_error(err);
|
|
}
|
|
|
|
if (archive_write_free(a) != ARCHIVE_OK) {
|
|
std::string err = "Failed to free archive: ";
|
|
err += archive_error_string(a);
|
|
throw std::runtime_error(err);
|
|
}
|
|
|
|
log->append("Tarball created and compressed: " + tarballPath);
|
|
}
|