DfsFsck.java
- /*
- * Copyright (C) 2017, Google Inc. and others
- *
- * This program and the accompanying materials are made available under the
- * terms of the Eclipse Distribution License v. 1.0 which is available at
- * https://www.eclipse.org/org/documents/edl-v10.php.
- *
- * SPDX-License-Identifier: BSD-3-Clause
- */
- package org.eclipse.jgit.internal.storage.dfs;
- import static java.nio.charset.StandardCharsets.UTF_8;
- import static org.eclipse.jgit.internal.storage.pack.PackExt.INDEX;
- import static org.eclipse.jgit.internal.storage.pack.PackExt.PACK;
- import java.io.FileNotFoundException;
- import java.io.IOException;
- import org.eclipse.jgit.errors.CorruptPackIndexException;
- import org.eclipse.jgit.errors.MissingObjectException;
- import org.eclipse.jgit.internal.JGitText;
- import org.eclipse.jgit.internal.fsck.FsckError;
- import org.eclipse.jgit.internal.fsck.FsckError.CorruptIndex;
- import org.eclipse.jgit.internal.fsck.FsckError.CorruptObject;
- import org.eclipse.jgit.internal.fsck.FsckPackParser;
- import org.eclipse.jgit.internal.storage.dfs.DfsObjDatabase.PackSource;
- import org.eclipse.jgit.internal.submodule.SubmoduleValidator;
- import org.eclipse.jgit.internal.submodule.SubmoduleValidator.SubmoduleValidationException;
- import org.eclipse.jgit.lib.AnyObjectId;
- import org.eclipse.jgit.lib.Constants;
- import org.eclipse.jgit.lib.GitmoduleEntry;
- import org.eclipse.jgit.lib.NullProgressMonitor;
- import org.eclipse.jgit.lib.ObjectChecker;
- import org.eclipse.jgit.lib.ObjectId;
- import org.eclipse.jgit.lib.ObjectLoader;
- import org.eclipse.jgit.lib.ProgressMonitor;
- import org.eclipse.jgit.lib.Ref;
- import org.eclipse.jgit.revwalk.ObjectWalk;
- import org.eclipse.jgit.revwalk.RevObject;
- /**
- * Verify the validity and connectivity of a DFS repository.
- */
- public class DfsFsck {
- private final DfsRepository repo;
- private final DfsObjDatabase objdb;
- private ObjectChecker objChecker = new ObjectChecker();
- private boolean connectivityOnly;
- /**
- * Initialize DFS fsck.
- *
- * @param repository
- * the dfs repository to check.
- */
- public DfsFsck(DfsRepository repository) {
- repo = repository;
- objdb = repo.getObjectDatabase();
- }
- /**
- * Verify the integrity and connectivity of all objects in the object
- * database.
- *
- * @param pm
- * callback to provide progress feedback during the check.
- * @return all errors about the repository.
- * @throws java.io.IOException
- * if encounters IO errors during the process.
- */
- public FsckError check(ProgressMonitor pm) throws IOException {
- if (pm == null) {
- pm = NullProgressMonitor.INSTANCE;
- }
- FsckError errors = new FsckError();
- if (!connectivityOnly) {
- objChecker.reset();
- checkPacks(pm, errors);
- }
- checkConnectivity(pm, errors);
- return errors;
- }
- private void checkPacks(ProgressMonitor pm, FsckError errors)
- throws IOException, FileNotFoundException {
- try (DfsReader ctx = objdb.newReader()) {
- for (DfsPackFile pack : objdb.getPacks()) {
- DfsPackDescription packDesc = pack.getPackDescription();
- if (packDesc.getPackSource()
- == PackSource.UNREACHABLE_GARBAGE) {
- continue;
- }
- try (ReadableChannel rc = objdb.openFile(packDesc, PACK)) {
- verifyPack(pm, errors, ctx, pack, rc);
- } catch (MissingObjectException e) {
- errors.getMissingObjects().add(e.getObjectId());
- } catch (CorruptPackIndexException e) {
- errors.getCorruptIndices().add(new CorruptIndex(
- pack.getPackDescription().getFileName(INDEX),
- e.getErrorType()));
- }
- }
- }
- checkGitModules(pm, errors);
- }
- private void verifyPack(ProgressMonitor pm, FsckError errors, DfsReader ctx,
- DfsPackFile pack, ReadableChannel ch)
- throws IOException, CorruptPackIndexException {
- FsckPackParser fpp = new FsckPackParser(objdb, ch);
- fpp.setObjectChecker(objChecker);
- fpp.overwriteObjectCount(pack.getPackDescription().getObjectCount());
- fpp.parse(pm);
- errors.getCorruptObjects().addAll(fpp.getCorruptObjects());
- fpp.verifyIndex(pack.getPackIndex(ctx));
- }
- private void checkGitModules(ProgressMonitor pm, FsckError errors)
- throws IOException {
- pm.beginTask(JGitText.get().validatingGitModules,
- objChecker.getGitsubmodules().size());
- for (GitmoduleEntry entry : objChecker.getGitsubmodules()) {
- AnyObjectId blobId = entry.getBlobId();
- ObjectLoader blob = objdb.open(blobId, Constants.OBJ_BLOB);
- try {
- SubmoduleValidator.assertValidGitModulesFile(
- new String(blob.getBytes(), UTF_8));
- } catch (SubmoduleValidationException e) {
- CorruptObject co = new FsckError.CorruptObject(
- blobId.toObjectId(), Constants.OBJ_BLOB,
- e.getFsckMessageId());
- errors.getCorruptObjects().add(co);
- }
- pm.update(1);
- }
- pm.endTask();
- }
- private void checkConnectivity(ProgressMonitor pm, FsckError errors)
- throws IOException {
- pm.beginTask(JGitText.get().countingObjects, ProgressMonitor.UNKNOWN);
- try (ObjectWalk ow = new ObjectWalk(repo)) {
- for (Ref r : repo.getRefDatabase().getRefs()) {
- ObjectId objectId = r.getObjectId();
- if (objectId == null) {
- // skip unborn branch
- continue;
- }
- RevObject tip;
- try {
- tip = ow.parseAny(objectId);
- if (r.getLeaf().getName().startsWith(Constants.R_HEADS)
- && tip.getType() != Constants.OBJ_COMMIT) {
- // heads should only point to a commit object
- errors.getNonCommitHeads().add(r.getLeaf().getName());
- }
- ow.markStart(tip);
- } catch (MissingObjectException e) {
- errors.getMissingObjects().add(e.getObjectId());
- continue;
- }
- }
- try {
- ow.checkConnectivity();
- } catch (MissingObjectException e) {
- errors.getMissingObjects().add(e.getObjectId());
- }
- }
- pm.endTask();
- }
- /**
- * Use a customized object checker instead of the default one. Caller can
- * specify a skip list to ignore some errors.
- *
- * It will be reset at the start of each {{@link #check(ProgressMonitor)}
- * call.
- *
- * @param objChecker
- * A customized object checker.
- */
- public void setObjectChecker(ObjectChecker objChecker) {
- this.objChecker = objChecker;
- }
- /**
- * Whether fsck should bypass object validity and integrity checks and only
- * check connectivity.
- *
- * @param connectivityOnly
- * whether fsck should bypass object validity and integrity
- * checks and only check connectivity. The default is
- * {@code false}, meaning to run all checks.
- */
- public void setConnectivityOnly(boolean connectivityOnly) {
- this.connectivityOnly = connectivityOnly;
- }
- }