#include #include #include "shared.hh" #include "globals.hh" #include "eval.hh" #include "store-api.hh" #include "common-opts.hh" #include "get-drvs.hh" #include "fs-accessor.hh" #include "thread-pool.hh" #include "sqlite.hh" #include "download.hh" #include "compression.hh" #include #include using namespace nix; using json = nlohmann::json; static const char * cacheSchema = R"sql( create table if not exists StorePaths ( id integer primary key autoincrement not null, path text unique not null ); create table if not exists StorePathContents ( storePath integer not null, subPath text not null, type integer not null, fileSize integer, isExecutable integer, primary key (storePath, subPath), foreign key (storePath) references StorePaths(id) on delete cascade ); )sql"; static const char * programsSchema = R"sql( create table if not exists Programs ( name text not null, system text not null, package text not null, primary key (name, system, package) ); )sql"; void mainWrapped(int argc, char * * argv) { initNix(); initGC(); if (argc != 6) throw Error("usage: generate-programs-index CACHE-DB PROGRAMS-DB STORE-URI STORE-PATHS NIXPKGS-PATH"); Path cacheDbPath = argv[1]; Path programsDbPath = argv[2]; Path storePathsFile = argv[4]; Path nixpkgsPath = argv[5]; settings.readOnlyMode = true; settings.showTrace = true; auto localStore = openStore(); std::string binaryCacheUri = argv[3]; if (hasSuffix(binaryCacheUri, "/")) binaryCacheUri.pop_back(); auto binaryCache = openStoreAt(binaryCacheUri); struct CacheState { SQLite db; SQLiteStmt queryPath, insertPath, queryFiles, insertFile; }; Sync cacheState_; /* Get the allowed store paths to be included in the database. */ auto allowedPaths = tokenizeString(readFile(storePathsFile, true)); PathSet allowedPathsClosure; for (auto & path : allowedPaths) if (!allowedPathsClosure.count(path)) binaryCache->computeFSClosure(path, allowedPathsClosure); printMsg(lvlInfo, format("%d top-level paths, %d paths in closure") % allowedPaths.size() % allowedPathsClosure.size()); /* Initialise the cache database. */ { auto cacheState(cacheState_.lock()); cacheState->db = SQLite(cacheDbPath); cacheState->db.exec("pragma foreign_keys = 1"); cacheState->db.exec(cacheSchema); if (sqlite3_busy_timeout(cacheState->db, 60 * 60 * 1000) != SQLITE_OK) throwSQLiteError(cacheState->db, "setting timeout"); cacheState->queryPath.create(cacheState->db, "select id from StorePaths where path = ?"); cacheState->insertPath.create(cacheState->db, "insert or ignore into StorePaths(path) values (?)"); cacheState->queryFiles.create(cacheState->db, "select subPath, type, fileSize, isExecutable from StorePathContents where storePath = ?"); cacheState->insertFile.create(cacheState->db, "insert into StorePathContents(storePath, subPath, type, fileSize, isExecutable) values (?, ?, ?, ?, ?)"); } /* Initialise the programs database. */ struct ProgramsState { SQLite db; SQLiteStmt insertProgram; }; Sync programsState_; { auto programsState(programsState_.lock()); programsState->db = SQLite(programsDbPath); programsState->db.exec("pragma synchronous = off"); programsState->db.exec("pragma main.journal_mode = truncate"); programsState->db.exec(programsSchema); programsState->insertProgram.create(programsState->db, "insert or replace into Programs(name, system, package) values (?, ?, ?)"); } EvalState state({}, localStore); Value vRoot; state.eval(state.parseExprFromFile(resolveExprPath(nixpkgsPath)), vRoot); /* Get all derivations. */ DrvInfos packages; for (auto system : std::set{"x86_64-linux", "i686-linux"}) { auto args = state.allocBindings(2); Value * vConfig = state.allocValue(); state.mkAttrs(*vConfig, 0); args->push_back(Attr(state.symbols.create("config"), vConfig)); Value * vSystem = state.allocValue(); mkString(*vSystem, system); args->push_back(Attr(state.symbols.create("system"), vSystem)); args->sort(); getDerivations(state, vRoot, "", *args, packages, true); } /* For each store path, figure out the package with the shortest attribute name. E.g. "nix" is preferred over "nixStable". */ std::map packagesByPath; for (auto & package : packages) try { auto outputs = package.queryOutputs(true); for (auto & output : outputs) { if (!allowedPathsClosure.count(output.second)) continue; auto i = packagesByPath.find(output.second); if (i != packagesByPath.end() && (i->second->attrPath.size() < package.attrPath.size() || (i->second->attrPath.size() == package.attrPath.size() && i->second->attrPath < package.attrPath))) continue; packagesByPath[output.second] = &package; } } catch (AssertionError & e) { } catch (Error & e) { e.addPrefix(format("in package ā€˜%sā€™: ") % package.attrPath); throw; } /* Return the files in a store path, using a SQLite database to cache the results. */ auto getFiles = [&](const Path & storePath) { std::map files; /* Look up the path in the SQLite cache. */ { auto cacheState(cacheState_.lock()); auto useQueryPath(cacheState->queryPath.use()(storePath)); if (useQueryPath.next()) { auto id = useQueryPath.getInt(0); auto useQueryFiles(cacheState->queryFiles.use()(id)); while (useQueryFiles.next()) { files[useQueryFiles.getStr(0)] = FSAccessor::Stat{ (FSAccessor::Type) useQueryFiles.getInt(1), (uint64_t) useQueryFiles.getInt(2), useQueryFiles.getInt(3) != 0}; } return files; } } /* It's not in the cache, so get the .ls.xz file (which contains a JSON serialisation of the listing of the NAR contents) from the binary cache. */ auto now1 = std::chrono::steady_clock::now(); DownloadRequest req(binaryCacheUri + "/" + storePathToHash(storePath) + ".ls.xz"); req.showProgress = DownloadRequest::no; auto ls = json::parse(*decompress("xz", *getDownloader()->download(req).data)); if (ls.value("version", 0) != 1) throw Error("NAR index for ā€˜%sā€™ has an unsupported version", storePath); std::function recurse; recurse = [&](const std::string & relPath, json & v) { FSAccessor::Stat st; std::string type = v["type"]; if (type == "directory") { st.type = FSAccessor::Type::tDirectory; for (auto i = v["entries"].begin(); i != v["entries"].end(); ++i) { std::string name = i.key(); recurse(relPath.empty() ? name : relPath + "/" + name, i.value()); } } else if (type == "regular") { st.type = FSAccessor::Type::tRegular; st.fileSize = v["size"]; st.isExecutable = v.value("executable", false); } else if (type == "symlink") { st.type = FSAccessor::Type::tSymlink; } else return; files[relPath] = st; }; recurse("", ls.at("root")); /* Insert the store path into the database. */ { auto cacheState(cacheState_.lock()); SQLiteTxn txn(cacheState->db); if (cacheState->queryPath.use()(storePath).next()) return files; cacheState->insertPath.use()(storePath).exec(); uint64_t id = sqlite3_last_insert_rowid(cacheState->db); for (auto & x : files) { cacheState->insertFile.use() (id) (x.first) (x.second.type) (x.second.fileSize, x.second.type == FSAccessor::Type::tRegular) (x.second.isExecutable, x.second.type == FSAccessor::Type::tRegular) .exec(); } txn.commit(); } auto now2 = std::chrono::steady_clock::now(); printInfo("processed %s in %d ms", storePath, std::chrono::duration_cast(now2 - now1).count()); return files; }; /* Note: we don't index hidden files. */ std::regex isProgram("bin/([^.][^/]*)"); /* Process each store path. */ auto doPath = [&](const Path & storePath, DrvInfo * package) { try { auto files = getFiles(storePath); if (files.empty()) return; std::set programs; for (auto & file : files) { // FIXME: we assume that symlinks point to // programs. Should check that. if (file.second.type == FSAccessor::Type::tDirectory || (file.second.type == FSAccessor::Type::tRegular && !file.second.isExecutable)) continue; std::smatch match; if (std::regex_match(file.first, match, isProgram)) programs.insert(match[1]); } if (programs.empty()) return; { auto programsState(programsState_.lock()); SQLiteTxn txn(programsState->db); for (auto & program : programs) programsState->insertProgram.use()(program)(package->system)(package->attrPath).exec(); txn.commit(); } } catch (DownloadError & e) { printInfo("warning: no listing of %s (%s) in binary cache", package->attrPath, storePath); } }; /* Enqueue work items for each package. */ ThreadPool threadPool(16); for (auto & i : packagesByPath) threadPool.enqueue(std::bind(doPath, i.first, i.second)); threadPool.process(); } int main(int argc, char * * argv) { return handleExceptions(argv[0], [&]() { mainWrapped(argc, argv); }); }