Commit aa1e1a4f authored by hinoka@chromium.org's avatar hinoka@chromium.org

Have git cache bootstrap repo if repo is corrupt

We're seeing fetches fail in interesting ways:
running "git fetch -v --progress origin +refs/heads/*:refs/heads/*" in "/mnt/scratch0/b_used/build/slave/cache_dir/chrome--internal.googlesource.com-chrome-src--internal"
error: object file ./objects/a1/4bd89aa4cc7d7bbad7594cba0ae73e99dbb54c is empty
error: object file ./objects/a1/4bd89aa4cc7d7bbad7594cba0ae73e99dbb54c is empty
fatal: loose object a14bd89aa4cc7d7bbad7594cba0ae73e99dbb54c (stored in ./objects/a1/4bd89aa4cc7d7bbad7594cba0ae73e99dbb54c) is corrupt
fatal: The remote end hung up unexpectedly

And then the cache becomes corrupted.  This blows the cache away if this happens.

BUG=261741

Review URL: https://codereview.chromium.org/352543003

git-svn-id: svn://svn.chromium.org/chrome/trunk/tools/depot_tools@280123 0039d316-1c4b-4281-b951-d872f2087c98
parent 905312cc
...@@ -13,6 +13,7 @@ import os ...@@ -13,6 +13,7 @@ import os
import re import re
import tempfile import tempfile
import time import time
import shutil
import subprocess import subprocess
import sys import sys
import urlparse import urlparse
...@@ -25,6 +26,8 @@ import subcommand ...@@ -25,6 +26,8 @@ import subcommand
# Analogous to gc.autopacklimit git config. # Analogous to gc.autopacklimit git config.
GC_AUTOPACKLIMIT = 50 GC_AUTOPACKLIMIT = 50
GIT_CACHE_CORRUPT_MESSAGE = 'WARNING: The Git cache is corrupt.'
try: try:
# pylint: disable=E0602 # pylint: disable=E0602
WinErr = WindowsError WinErr = WindowsError
...@@ -35,6 +38,8 @@ except NameError: ...@@ -35,6 +38,8 @@ except NameError:
class LockError(Exception): class LockError(Exception):
pass pass
class RefsHeadsFailedToFetch(Exception):
pass
class Lockfile(object): class Lockfile(object):
"""Class to represent a cross-platform process-specific lockfile.""" """Class to represent a cross-platform process-specific lockfile."""
...@@ -248,7 +253,10 @@ class Mirror(object): ...@@ -248,7 +253,10 @@ class Mirror(object):
self.RunGit(['config', '--add', 'remote.origin.fetch', refspec], cwd=cwd) self.RunGit(['config', '--add', 'remote.origin.fetch', refspec], cwd=cwd)
def bootstrap_repo(self, directory): def bootstrap_repo(self, directory):
"""Bootstrap the repo from Google Stroage if possible.""" """Bootstrap the repo from Google Stroage if possible.
More apt-ly named bootstrap_repo_from_cloud_if_possible_else_do_nothing().
"""
python_fallback = False python_fallback = False
if sys.platform.startswith('win') and not self.FindExecutable('7z'): if sys.platform.startswith('win') and not self.FindExecutable('7z'):
...@@ -309,36 +317,17 @@ class Mirror(object): ...@@ -309,36 +317,17 @@ class Mirror(object):
def exists(self): def exists(self):
return os.path.isfile(os.path.join(self.mirror_path, 'config')) return os.path.isfile(os.path.join(self.mirror_path, 'config'))
def populate(self, depth=None, shallow=False, bootstrap=False, def _ensure_bootstrapped(self, depth, bootstrap, force=False):
verbose=False, ignore_lock=False):
assert self.GetCachePath()
if shallow and not depth:
depth = 10000
gclient_utils.safe_makedirs(self.GetCachePath())
v = []
if verbose:
v = ['-v', '--progress']
d = []
if depth:
d = ['--depth', str(depth)]
lockfile = Lockfile(self.mirror_path)
if not ignore_lock:
lockfile.lock()
try:
# Setup from scratch if the repo is new or is in a bad state.
tempdir = None tempdir = None
config_file = os.path.join(self.mirror_path, 'config') config_file = os.path.join(self.mirror_path, 'config')
pack_dir = os.path.join(self.mirror_path, 'objects', 'pack') pack_dir = os.path.join(self.mirror_path, 'objects', 'pack')
pack_files = [] pack_files = []
if os.path.isdir(pack_dir): if os.path.isdir(pack_dir):
pack_files = [f for f in os.listdir(pack_dir) if f.endswith('.pack')] pack_files = [f for f in os.listdir(pack_dir) if f.endswith('.pack')]
should_bootstrap = (not os.path.exists(config_file) or should_bootstrap = (force or
not os.path.exists(config_file) or
len(pack_files) > GC_AUTOPACKLIMIT) len(pack_files) > GC_AUTOPACKLIMIT)
if should_bootstrap: if should_bootstrap:
tempdir = tempfile.mkdtemp( tempdir = tempfile.mkdtemp(
...@@ -346,6 +335,13 @@ class Mirror(object): ...@@ -346,6 +335,13 @@ class Mirror(object):
bootstrapped = not depth and bootstrap and self.bootstrap_repo(tempdir) bootstrapped = not depth and bootstrap and self.bootstrap_repo(tempdir)
if bootstrapped: if bootstrapped:
# Bootstrap succeeded; delete previous cache, if any. # Bootstrap succeeded; delete previous cache, if any.
try:
# Try to move folder to tempdir if possible.
defunct_dir = tempfile.mkdtemp()
shutil.move(self.mirror_path, defunct_dir)
self.print('Moved defunct directory for repository %s from %s to %s'
% (self.url, self.mirror_path, defunct_dir))
except Exception:
gclient_utils.rmtree(self.mirror_path) gclient_utils.rmtree(self.mirror_path)
elif not os.path.exists(config_file): elif not os.path.exists(config_file):
# Bootstrap failed, no previous cache; start with a bare git dir. # Bootstrap failed, no previous cache; start with a bare git dir.
...@@ -362,22 +358,55 @@ class Mirror(object): ...@@ -362,22 +358,55 @@ class Mirror(object):
if depth and os.path.exists(os.path.join(self.mirror_path, 'shallow')): if depth and os.path.exists(os.path.join(self.mirror_path, 'shallow')):
logging.warn( logging.warn(
'Shallow fetch requested, but repo cache already exists.') 'Shallow fetch requested, but repo cache already exists.')
d = [] return tempdir
rundir = tempdir or self.mirror_path def _fetch(self, rundir, verbose, depth):
self.config(rundir) self.config(rundir)
v = []
d = []
if verbose:
v = ['-v', '--progress']
if depth:
d = ['--depth', str(depth)]
fetch_cmd = ['fetch'] + v + d + ['origin'] fetch_cmd = ['fetch'] + v + d + ['origin']
fetch_specs = subprocess.check_output( fetch_specs = subprocess.check_output(
[self.git_exe, 'config', '--get-all', 'remote.origin.fetch'], [self.git_exe, 'config', '--get-all', 'remote.origin.fetch'],
cwd=rundir).strip().splitlines() cwd=rundir).strip().splitlines()
for spec in fetch_specs: for spec in fetch_specs:
try: try:
self.print('Fetching %s' % spec)
self.RunGit(fetch_cmd + [spec], cwd=rundir, retry=True) self.RunGit(fetch_cmd + [spec], cwd=rundir, retry=True)
except subprocess.CalledProcessError: except subprocess.CalledProcessError:
if spec == '+refs/heads/*:refs/heads/*':
raise RefsHeadsFailedToFetch
logging.warn('Fetch of %s failed' % spec) logging.warn('Fetch of %s failed' % spec)
def populate(self, depth=None, shallow=False, bootstrap=False,
verbose=False, ignore_lock=False):
assert self.GetCachePath()
if shallow and not depth:
depth = 10000
gclient_utils.safe_makedirs(self.GetCachePath())
lockfile = Lockfile(self.mirror_path)
if not ignore_lock:
lockfile.lock()
tempdir = None
try:
tempdir = self._ensure_bootstrapped(depth, bootstrap)
rundir = tempdir or self.mirror_path
self._fetch(rundir, verbose, depth)
except RefsHeadsFailedToFetch:
# This is a major failure, we need to clean and force a bootstrap.
gclient_utils.rmtree(rundir)
self.print(GIT_CACHE_CORRUPT_MESSAGE)
tempdir = self._ensure_bootstrapped(depth, bootstrap, force=True)
assert tempdir
self._fetch(tempdir or self.mirror_path, verbose, depth)
finally:
if tempdir: if tempdir:
os.rename(tempdir, self.mirror_path) os.rename(tempdir, self.mirror_path)
finally:
if not ignore_lock: if not ignore_lock:
lockfile.unlock() lockfile.unlock()
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment