Merge branch 'stable-2.15' into stable-2.16

* stable-2.15:
  Bazel: Enable Error-Prone by default
  Parallelize account migration in schema 146 migration
  Fix _nextStepHandle not being assigned a value when scrolling
  Elasticsearch: Remove redundant handling of 'ignore_unmapped' property
  Elasticsearch: Fix support for V6 versions earlier than 6.7.*
  ElasticVersionTest: Add missing assertions on V6_7

Change-Id: Ib655c541a28e3a9a2197465a58e1eff12123c6a5
This commit is contained in:
David Pursehouse
2019-05-28 11:51:47 +09:00
9 changed files with 150 additions and 24 deletions

View File

@@ -14,6 +14,9 @@
package com.google.gerrit.server.schema;
import com.google.common.base.Stopwatch;
import com.google.common.collect.Iterables;
import com.google.common.collect.Sets;
import com.google.gerrit.reviewdb.client.Account;
import com.google.gerrit.reviewdb.client.RefNames;
import com.google.gerrit.reviewdb.server.ReviewDb;
@@ -24,21 +27,36 @@ import com.google.gwtorm.server.OrmException;
import com.google.inject.Inject;
import com.google.inject.Provider;
import java.io.IOException;
import java.io.UncheckedIOException;
import java.sql.ResultSet;
import java.sql.SQLException;
import java.sql.Statement;
import java.sql.Timestamp;
import java.text.ParseException;
import java.util.Date;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Set;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.locks.ReentrantLock;
import org.eclipse.jgit.internal.storage.file.FileRepository;
import org.eclipse.jgit.internal.storage.file.GC;
import org.eclipse.jgit.lib.CommitBuilder;
import org.eclipse.jgit.lib.Constants;
import org.eclipse.jgit.lib.ObjectId;
import org.eclipse.jgit.lib.ObjectInserter;
import org.eclipse.jgit.lib.PersonIdent;
import org.eclipse.jgit.lib.ProgressMonitor;
import org.eclipse.jgit.lib.Ref;
import org.eclipse.jgit.lib.RefUpdate;
import org.eclipse.jgit.lib.RefUpdate.Result;
import org.eclipse.jgit.lib.Repository;
import org.eclipse.jgit.lib.TextProgressMonitor;
import org.eclipse.jgit.revwalk.RevCommit;
import org.eclipse.jgit.revwalk.RevSort;
import org.eclipse.jgit.revwalk.RevWalk;
@@ -60,6 +78,10 @@ public class Schema_146 extends SchemaVersion {
private final GitRepositoryManager repoManager;
private final AllUsersName allUsersName;
private final PersonIdent serverIdent;
private AtomicInteger i = new AtomicInteger();
private Stopwatch sw = Stopwatch.createStarted();
ReentrantLock gcLock = new ReentrantLock();
private int size;
@Inject
Schema_146(
@@ -75,13 +97,41 @@ public class Schema_146 extends SchemaVersion {
@Override
protected void migrateData(ReviewDb db, UpdateUI ui) throws OrmException, SQLException {
ui.message("Migrating accounts");
Set<Entry<Account.Id, Timestamp>> accounts = scanAccounts(db, ui).entrySet();
gc(ui);
Set<List<Entry<Account.Id, Timestamp>>> batches =
Sets.newHashSet(Iterables.partition(accounts, 500));
ExecutorService pool = createExecutor(ui);
try {
batches.stream().forEach(batch -> pool.submit(() -> processBatch(batch, ui)));
pool.shutdown();
pool.awaitTermination(Long.MAX_VALUE, TimeUnit.DAYS);
} catch (InterruptedException e) {
throw new RuntimeException(e);
}
ui.message(
String.format("... (%.3f s) Migrated all %d accounts to schema 146", elapsed(), i.get()));
}
private ExecutorService createExecutor(UpdateUI ui) {
int threads;
try {
threads = Integer.parseInt(System.getProperty("threadcount"));
} catch (NumberFormatException e) {
threads = Runtime.getRuntime().availableProcessors();
}
ui.message(String.format("... using %d threads ...", threads));
return Executors.newFixedThreadPool(threads);
}
private void processBatch(List<Entry<Account.Id, Timestamp>> batch, UpdateUI ui) {
try (Repository repo = repoManager.openRepository(allUsersName);
RevWalk rw = new RevWalk(repo);
ObjectInserter oi = repo.newObjectInserter()) {
ObjectId emptyTree = emptyTree(oi);
int i = 0;
for (Map.Entry<Account.Id, Timestamp> e : scanAccounts(db).entrySet()) {
for (Map.Entry<Account.Id, Timestamp> e : batch) {
String refName = RefNames.refsUsers(e.getKey());
Ref ref = repo.exactRef(refName);
if (ref != null) {
@@ -89,14 +139,63 @@ public class Schema_146 extends SchemaVersion {
} else {
createUserBranch(repo, oi, emptyTree, e.getKey(), e.getValue());
}
i++;
if (i % 100 == 0) {
ui.message(String.format("... migrated %d users", i));
int count = i.incrementAndGet();
showProgress(ui, count);
if (count % 1000 == 0) {
gc(repo, true, ui);
}
}
ui.message(String.format("Migrated all %d users to schema 146", i));
} catch (IOException e) {
throw new OrmException("Failed to rewrite user branches.", e);
throw new UncheckedIOException(e);
}
}
private double elapsed() {
return sw.elapsed(TimeUnit.MILLISECONDS) / 1000d;
}
private void showProgress(UpdateUI ui, int count) {
if (count % 100 == 0) {
ui.message(
String.format(
"... (%.3f s) migrated %d%% (%d/%d) accounts",
elapsed(), Math.round(100.0 * count / size), count, size));
}
}
private void gc(UpdateUI ui) {
try (Repository repo = repoManager.openRepository(allUsersName)) {
gc(repo, false, ui);
} catch (IOException e) {
throw new UncheckedIOException(e);
}
}
private void gc(Repository repo, boolean refsOnly, UpdateUI ui) {
if (repo instanceof FileRepository && gcLock.tryLock()) {
ProgressMonitor pm = null;
try {
pm = new TextProgressMonitor();
FileRepository r = (FileRepository) repo;
GC gc = new GC(r);
gc.setProgressMonitor(pm);
pm.beginTask("gc", ProgressMonitor.UNKNOWN);
if (refsOnly) {
ui.message(String.format("... (%.3f s) pack refs", elapsed()));
gc.packRefs();
} else {
ui.message(String.format("... (%.3f s) gc --prune=now", elapsed()));
gc.setExpire(new Date());
gc.gc();
}
} catch (IOException | ParseException e) {
throw new RuntimeException(e);
} finally {
gcLock.unlock();
if (pm != null) {
pm.endTask();
}
}
}
}
@@ -189,13 +288,15 @@ public class Schema_146 extends SchemaVersion {
return oi.insert(Constants.OBJ_TREE, new byte[] {});
}
private Map<Account.Id, Timestamp> scanAccounts(ReviewDb db) throws SQLException {
private Map<Account.Id, Timestamp> scanAccounts(ReviewDb db, UpdateUI ui) throws SQLException {
ui.message(String.format("... (%.3f s) scan accounts", elapsed()));
try (Statement stmt = newStatement(db);
ResultSet rs = stmt.executeQuery("SELECT account_id, registered_on FROM accounts")) {
HashMap<Account.Id, Timestamp> m = new HashMap<>();
while (rs.next()) {
m.put(new Account.Id(rs.getInt(1)), rs.getTimestamp(2));
}
size = m.size();
return m;
}
}