You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

GC.java 50KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605
  1. /*
  2. * Copyright (C) 2012, Christian Halstrick <christian.halstrick@sap.com>
  3. * Copyright (C) 2011, Shawn O. Pearce <spearce@spearce.org>
  4. * and other copyright owners as documented in the project's IP log.
  5. *
  6. * This program and the accompanying materials are made available
  7. * under the terms of the Eclipse Distribution License v1.0 which
  8. * accompanies this distribution, is reproduced below, and is
  9. * available at http://www.eclipse.org/org/documents/edl-v10.php
  10. *
  11. * All rights reserved.
  12. *
  13. * Redistribution and use in source and binary forms, with or
  14. * without modification, are permitted provided that the following
  15. * conditions are met:
  16. *
  17. * - Redistributions of source code must retain the above copyright
  18. * notice, this list of conditions and the following disclaimer.
  19. *
  20. * - Redistributions in binary form must reproduce the above
  21. * copyright notice, this list of conditions and the following
  22. * disclaimer in the documentation and/or other materials provided
  23. * with the distribution.
  24. *
  25. * - Neither the name of the Eclipse Foundation, Inc. nor the
  26. * names of its contributors may be used to endorse or promote
  27. * products derived from this software without specific prior
  28. * written permission.
  29. *
  30. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  31. * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  32. * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  33. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  34. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  35. * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  36. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  37. * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  38. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  39. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  40. * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  41. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  42. * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  43. */
  44. package org.eclipse.jgit.internal.storage.file;
  45. import static org.eclipse.jgit.internal.storage.pack.PackExt.BITMAP_INDEX;
  46. import static org.eclipse.jgit.internal.storage.pack.PackExt.INDEX;
  47. import java.io.File;
  48. import java.io.FileOutputStream;
  49. import java.io.IOException;
  50. import java.io.OutputStream;
  51. import java.io.PrintWriter;
  52. import java.io.StringWriter;
  53. import java.nio.channels.Channels;
  54. import java.nio.channels.FileChannel;
  55. import java.nio.file.DirectoryNotEmptyException;
  56. import java.nio.file.DirectoryStream;
  57. import java.nio.file.Files;
  58. import java.nio.file.Path;
  59. import java.nio.file.StandardCopyOption;
  60. import java.text.MessageFormat;
  61. import java.text.ParseException;
  62. import java.time.Instant;
  63. import java.time.temporal.ChronoUnit;
  64. import java.util.ArrayList;
  65. import java.util.Collection;
  66. import java.util.Collections;
  67. import java.util.Comparator;
  68. import java.util.Date;
  69. import java.util.HashMap;
  70. import java.util.HashSet;
  71. import java.util.Iterator;
  72. import java.util.LinkedList;
  73. import java.util.List;
  74. import java.util.Map;
  75. import java.util.Objects;
  76. import java.util.Set;
  77. import java.util.TreeMap;
  78. import java.util.concurrent.Callable;
  79. import java.util.concurrent.ExecutorService;
  80. import java.util.regex.Pattern;
  81. import java.util.stream.Collectors;
  82. import java.util.stream.Stream;
  83. import org.eclipse.jgit.annotations.NonNull;
  84. import org.eclipse.jgit.dircache.DirCacheIterator;
  85. import org.eclipse.jgit.errors.CancelledException;
  86. import org.eclipse.jgit.errors.CorruptObjectException;
  87. import org.eclipse.jgit.errors.IncorrectObjectTypeException;
  88. import org.eclipse.jgit.errors.MissingObjectException;
  89. import org.eclipse.jgit.errors.NoWorkTreeException;
  90. import org.eclipse.jgit.internal.JGitText;
  91. import org.eclipse.jgit.internal.storage.pack.PackExt;
  92. import org.eclipse.jgit.internal.storage.pack.PackWriter;
  93. import org.eclipse.jgit.internal.storage.reftree.RefTreeNames;
  94. import org.eclipse.jgit.lib.ConfigConstants;
  95. import org.eclipse.jgit.lib.Constants;
  96. import org.eclipse.jgit.lib.FileMode;
  97. import org.eclipse.jgit.lib.NullProgressMonitor;
  98. import org.eclipse.jgit.lib.ObjectId;
  99. import org.eclipse.jgit.lib.ObjectIdSet;
  100. import org.eclipse.jgit.lib.ObjectLoader;
  101. import org.eclipse.jgit.lib.ObjectReader;
  102. import org.eclipse.jgit.lib.ProgressMonitor;
  103. import org.eclipse.jgit.lib.Ref;
  104. import org.eclipse.jgit.lib.Ref.Storage;
  105. import org.eclipse.jgit.lib.RefDatabase;
  106. import org.eclipse.jgit.lib.ReflogEntry;
  107. import org.eclipse.jgit.lib.ReflogReader;
  108. import org.eclipse.jgit.lib.internal.WorkQueue;
  109. import org.eclipse.jgit.revwalk.ObjectWalk;
  110. import org.eclipse.jgit.revwalk.RevObject;
  111. import org.eclipse.jgit.revwalk.RevWalk;
  112. import org.eclipse.jgit.storage.pack.PackConfig;
  113. import org.eclipse.jgit.treewalk.TreeWalk;
  114. import org.eclipse.jgit.treewalk.filter.TreeFilter;
  115. import org.eclipse.jgit.util.FileUtils;
  116. import org.eclipse.jgit.util.GitDateParser;
  117. import org.eclipse.jgit.util.SystemReader;
  118. import org.slf4j.Logger;
  119. import org.slf4j.LoggerFactory;
  120. /**
  121. * A garbage collector for git
  122. * {@link org.eclipse.jgit.internal.storage.file.FileRepository}. Instances of
  123. * this class are not thread-safe. Don't use the same instance from multiple
  124. * threads.
  125. *
  126. * This class started as a copy of DfsGarbageCollector from Shawn O. Pearce
  127. * adapted to FileRepositories.
  128. */
  129. public class GC {
  130. private final static Logger LOG = LoggerFactory
  131. .getLogger(GC.class);
  132. private static final String PRUNE_EXPIRE_DEFAULT = "2.weeks.ago"; //$NON-NLS-1$
  133. private static final String PRUNE_PACK_EXPIRE_DEFAULT = "1.hour.ago"; //$NON-NLS-1$
  134. private static final Pattern PATTERN_LOOSE_OBJECT = Pattern
  135. .compile("[0-9a-fA-F]{38}"); //$NON-NLS-1$
  136. private static final String PACK_EXT = "." + PackExt.PACK.getExtension();//$NON-NLS-1$
  137. private static final String BITMAP_EXT = "." //$NON-NLS-1$
  138. + PackExt.BITMAP_INDEX.getExtension();
  139. private static final String INDEX_EXT = "." + PackExt.INDEX.getExtension(); //$NON-NLS-1$
  140. private static final int DEFAULT_AUTOPACKLIMIT = 50;
  141. private static final int DEFAULT_AUTOLIMIT = 6700;
  142. private static volatile ExecutorService executor;
  143. /**
  144. * Set the executor for running auto-gc in the background. If no executor is
  145. * set JGit's own WorkQueue will be used.
  146. *
  147. * @param e
  148. * the executor to be used for running auto-gc
  149. * @since 4.8
  150. */
  151. public static void setExecutor(ExecutorService e) {
  152. executor = e;
  153. }
  154. private final FileRepository repo;
  155. private ProgressMonitor pm;
  156. private long expireAgeMillis = -1;
  157. private Date expire;
  158. private long packExpireAgeMillis = -1;
  159. private Date packExpire;
  160. private PackConfig pconfig = null;
  161. /**
  162. * the refs which existed during the last call to {@link #repack()}. This is
  163. * needed during {@link #prune(Set)} where we can optimize by looking at the
  164. * difference between the current refs and the refs which existed during
  165. * last {@link #repack()}.
  166. */
  167. private Collection<Ref> lastPackedRefs;
  168. /**
  169. * Holds the starting time of the last repack() execution. This is needed in
  170. * prune() to inspect only those reflog entries which have been added since
  171. * last repack().
  172. */
  173. private long lastRepackTime;
  174. /**
  175. * Whether gc should do automatic housekeeping
  176. */
  177. private boolean automatic;
  178. /**
  179. * Whether to run gc in a background thread
  180. */
  181. private boolean background;
  /**
   * Creates a new garbage collector with default values: no explicit
   * expiration is set, and progress is reported to
   * {@code NullProgressMonitor.INSTANCE}.
   *
   * @param repo
   *            the repo to work on
   */
  public GC(FileRepository repo) {
    this.pm = NullProgressMonitor.INSTANCE;
    this.repo = repo;
  }
  193. /**
  194. * Runs a garbage collector on a
  195. * {@link org.eclipse.jgit.internal.storage.file.FileRepository}. It will
  196. * <ul>
  197. * <li>pack loose references into packed-refs</li>
  198. * <li>repack all reachable objects into new pack files and delete the old
  199. * pack files</li>
  200. * <li>prune all loose objects which are now reachable by packs</li>
  201. * </ul>
  202. *
  203. * If {@link #setAuto(boolean)} was set to {@code true} {@code gc} will
  204. * first check whether any housekeeping is required; if not, it exits
  205. * without performing any work.
  206. *
  207. * If {@link #setBackground(boolean)} was set to {@code true}
  208. * {@code collectGarbage} will start the gc in the background, and then
  209. * return immediately. In this case, errors will not be reported except in
  210. * gc.log.
  211. *
  212. * @return the collection of
  213. * {@link org.eclipse.jgit.internal.storage.file.PackFile}'s which
  214. * are newly created
  215. * @throws java.io.IOException
  216. * @throws java.text.ParseException
  217. * If the configuration parameter "gc.pruneexpire" couldn't be
  218. * parsed
  219. */
  220. // TODO(ms): in 5.0 change signature and return Future<Collection<PackFile>>
  221. public Collection<PackFile> gc() throws IOException, ParseException {
  222. if (!background) {
  223. return doGc();
  224. }
  225. final GcLog gcLog = new GcLog(repo);
  226. if (!gcLog.lock()) {
  227. // there is already a background gc running
  228. return Collections.emptyList();
  229. }
  230. Callable<Collection<PackFile>> gcTask = () -> {
  231. try {
  232. Collection<PackFile> newPacks = doGc();
  233. if (automatic && tooManyLooseObjects()) {
  234. String message = JGitText.get().gcTooManyUnpruned;
  235. gcLog.write(message);
  236. gcLog.commit();
  237. }
  238. return newPacks;
  239. } catch (IOException | ParseException e) {
  240. try {
  241. gcLog.write(e.getMessage());
  242. StringWriter sw = new StringWriter();
  243. e.printStackTrace(new PrintWriter(sw));
  244. gcLog.write(sw.toString());
  245. gcLog.commit();
  246. } catch (IOException e2) {
  247. e2.addSuppressed(e);
  248. LOG.error(e2.getMessage(), e2);
  249. }
  250. } finally {
  251. gcLog.unlock();
  252. }
  253. return Collections.emptyList();
  254. };
  255. // TODO(ms): in 5.0 change signature and return the Future
  256. executor().submit(gcTask);
  257. return Collections.emptyList();
  258. }
  259. private ExecutorService executor() {
  260. return (executor != null) ? executor : WorkQueue.getExecutor();
  261. }
  262. private Collection<PackFile> doGc() throws IOException, ParseException {
  263. if (automatic && !needGc()) {
  264. return Collections.emptyList();
  265. }
  266. pm.start(6 /* tasks */);
  267. packRefs();
  268. // TODO: implement reflog_expire(pm, repo);
  269. Collection<PackFile> newPacks = repack();
  270. prune(Collections.<ObjectId> emptySet());
  271. // TODO: implement rerere_gc(pm);
  272. return newPacks;
  273. }
  274. /**
  275. * Loosen objects in a pack file which are not also in the newly-created
  276. * pack files.
  277. *
  278. * @param inserter
  279. * @param reader
  280. * @param pack
  281. * @param existing
  282. * @throws IOException
  283. */
  284. private void loosen(ObjectDirectoryInserter inserter, ObjectReader reader, PackFile pack, HashSet<ObjectId> existing)
  285. throws IOException {
  286. for (PackIndex.MutableEntry entry : pack) {
  287. ObjectId oid = entry.toObjectId();
  288. if (existing.contains(oid)) {
  289. continue;
  290. }
  291. existing.add(oid);
  292. ObjectLoader loader = reader.open(oid);
  293. inserter.insert(loader.getType(),
  294. loader.getSize(),
  295. loader.openStream(),
  296. true /* create this object even though it's a duplicate */);
  297. }
  298. }
  299. /**
  300. * Delete old pack files. What is 'old' is defined by specifying a set of
  301. * old pack files and a set of new pack files. Each pack file contained in
  302. * old pack files but not contained in new pack files will be deleted. If
  303. * preserveOldPacks is set, keep a copy of the pack file in the preserve
  304. * directory. If an expirationDate is set then pack files which are younger
  305. * than the expirationDate will not be deleted nor preserved.
  306. * <p>
  307. * If we're not immediately expiring loose objects, loosen any objects
  308. * in the old pack files which aren't in the new pack files.
  309. *
  310. * @param oldPacks
  311. * @param newPacks
  312. * @throws ParseException
  313. * @throws IOException
  314. */
  315. private void deleteOldPacks(Collection<PackFile> oldPacks,
  316. Collection<PackFile> newPacks) throws ParseException, IOException {
  317. HashSet<ObjectId> ids = new HashSet<>();
  318. for (PackFile pack : newPacks) {
  319. for (PackIndex.MutableEntry entry : pack) {
  320. ids.add(entry.toObjectId());
  321. }
  322. }
  323. ObjectReader reader = repo.newObjectReader();
  324. ObjectDirectory dir = repo.getObjectDatabase();
  325. ObjectDirectoryInserter inserter = dir.newInserter();
  326. boolean shouldLoosen = !"now".equals(getPruneExpireStr()) && //$NON-NLS-1$
  327. getExpireDate() < Long.MAX_VALUE;
  328. prunePreserved();
  329. long packExpireDate = getPackExpireDate();
  330. oldPackLoop: for (PackFile oldPack : oldPacks) {
  331. checkCancelled();
  332. String oldName = oldPack.getPackName();
  333. // check whether an old pack file is also among the list of new
  334. // pack files. Then we must not delete it.
  335. for (PackFile newPack : newPacks)
  336. if (oldName.equals(newPack.getPackName()))
  337. continue oldPackLoop;
  338. if (!oldPack.shouldBeKept()
  339. && repo.getFS().lastModified(
  340. oldPack.getPackFile()) < packExpireDate) {
  341. oldPack.close();
  342. if (shouldLoosen) {
  343. loosen(inserter, reader, oldPack, ids);
  344. }
  345. prunePack(oldName);
  346. }
  347. }
  348. // close the complete object database. That's my only chance to force
  349. // rescanning and to detect that certain pack files are now deleted.
  350. repo.getObjectDatabase().close();
  351. }
  352. /**
  353. * Deletes old pack file, unless 'preserve-oldpacks' is set, in which case it
  354. * moves the pack file to the preserved directory
  355. *
  356. * @param packFile
  357. * @param packName
  358. * @param ext
  359. * @param deleteOptions
  360. * @throws IOException
  361. */
  362. private void removeOldPack(File packFile, String packName, PackExt ext,
  363. int deleteOptions) throws IOException {
  364. if (pconfig != null && pconfig.isPreserveOldPacks()) {
  365. File oldPackDir = repo.getObjectDatabase().getPreservedDirectory();
  366. FileUtils.mkdir(oldPackDir, true);
  367. String oldPackName = "pack-" + packName + ".old-" + ext.getExtension(); //$NON-NLS-1$ //$NON-NLS-2$
  368. File oldPackFile = new File(oldPackDir, oldPackName);
  369. FileUtils.rename(packFile, oldPackFile);
  370. } else {
  371. FileUtils.delete(packFile, deleteOptions);
  372. }
  373. }
  374. /**
  375. * Delete the preserved directory including all pack files within
  376. */
  377. private void prunePreserved() {
  378. if (pconfig != null && pconfig.isPrunePreserved()) {
  379. try {
  380. FileUtils.delete(repo.getObjectDatabase().getPreservedDirectory(),
  381. FileUtils.RECURSIVE | FileUtils.RETRY | FileUtils.SKIP_MISSING);
  382. } catch (IOException e) {
  383. // Deletion of the preserved pack files failed. Silently return.
  384. }
  385. }
  386. }
  387. /**
  388. * Delete files associated with a single pack file. First try to delete the
  389. * ".pack" file because on some platforms the ".pack" file may be locked and
  390. * can't be deleted. In such a case it is better to detect this early and
  391. * give up on deleting files for this packfile. Otherwise we may delete the
  392. * ".index" file and when failing to delete the ".pack" file we are left
  393. * with a ".pack" file without a ".index" file.
  394. *
  395. * @param packName
  396. */
  397. private void prunePack(String packName) {
  398. PackExt[] extensions = PackExt.values();
  399. try {
  400. // Delete the .pack file first and if this fails give up on deleting
  401. // the other files
  402. int deleteOptions = FileUtils.RETRY | FileUtils.SKIP_MISSING;
  403. for (PackExt ext : extensions)
  404. if (PackExt.PACK.equals(ext)) {
  405. File f = nameFor(packName, "." + ext.getExtension()); //$NON-NLS-1$
  406. removeOldPack(f, packName, ext, deleteOptions);
  407. break;
  408. }
  409. // The .pack file has been deleted. Delete as many as the other
  410. // files as you can.
  411. deleteOptions |= FileUtils.IGNORE_ERRORS;
  412. for (PackExt ext : extensions) {
  413. if (!PackExt.PACK.equals(ext)) {
  414. File f = nameFor(packName, "." + ext.getExtension()); //$NON-NLS-1$
  415. removeOldPack(f, packName, ext, deleteOptions);
  416. }
  417. }
  418. } catch (IOException e) {
  419. // Deletion of the .pack file failed. Silently return.
  420. }
  421. }
  422. /**
  423. * Like "git prune-packed" this method tries to prune all loose objects
  424. * which can be found in packs. If certain objects can't be pruned (e.g.
  425. * because the filesystem delete operation fails) this is silently ignored.
  426. *
  427. * @throws java.io.IOException
  428. */
  429. public void prunePacked() throws IOException {
  430. ObjectDirectory objdb = repo.getObjectDatabase();
  431. Collection<PackFile> packs = objdb.getPacks();
  432. File objects = repo.getObjectsDirectory();
  433. String[] fanout = objects.list();
  434. if (fanout != null && fanout.length > 0) {
  435. pm.beginTask(JGitText.get().pruneLoosePackedObjects, fanout.length);
  436. try {
  437. for (String d : fanout) {
  438. checkCancelled();
  439. pm.update(1);
  440. if (d.length() != 2)
  441. continue;
  442. String[] entries = new File(objects, d).list();
  443. if (entries == null)
  444. continue;
  445. for (String e : entries) {
  446. checkCancelled();
  447. if (e.length() != Constants.OBJECT_ID_STRING_LENGTH - 2)
  448. continue;
  449. ObjectId id;
  450. try {
  451. id = ObjectId.fromString(d + e);
  452. } catch (IllegalArgumentException notAnObject) {
  453. // ignoring the file that does not represent loose
  454. // object
  455. continue;
  456. }
  457. boolean found = false;
  458. for (PackFile p : packs) {
  459. checkCancelled();
  460. if (p.hasObject(id)) {
  461. found = true;
  462. break;
  463. }
  464. }
  465. if (found)
  466. FileUtils.delete(objdb.fileFor(id), FileUtils.RETRY
  467. | FileUtils.SKIP_MISSING
  468. | FileUtils.IGNORE_ERRORS);
  469. }
  470. }
  471. } finally {
  472. pm.endTask();
  473. }
  474. }
  475. }
  476. /**
  477. * Like "git prune" this method tries to prune all loose objects which are
  478. * unreferenced. If certain objects can't be pruned (e.g. because the
  479. * filesystem delete operation fails) this is silently ignored.
  480. *
  481. * @param objectsToKeep
  482. * a set of objects which should explicitly not be pruned
  483. * @throws java.io.IOException
  484. * @throws java.text.ParseException
  485. * If the configuration parameter "gc.pruneexpire" couldn't be
  486. * parsed
  487. */
  488. public void prune(Set<ObjectId> objectsToKeep) throws IOException,
  489. ParseException {
  490. long expireDate = getExpireDate();
  491. // Collect all loose objects which are old enough, not referenced from
  492. // the index and not in objectsToKeep
  493. Map<ObjectId, File> deletionCandidates = new HashMap<>();
  494. Set<ObjectId> indexObjects = null;
  495. File objects = repo.getObjectsDirectory();
  496. String[] fanout = objects.list();
  497. if (fanout == null || fanout.length == 0) {
  498. return;
  499. }
  500. pm.beginTask(JGitText.get().pruneLooseUnreferencedObjects,
  501. fanout.length);
  502. try {
  503. for (String d : fanout) {
  504. checkCancelled();
  505. pm.update(1);
  506. if (d.length() != 2)
  507. continue;
  508. File dir = new File(objects, d);
  509. File[] entries = dir.listFiles();
  510. if (entries == null || entries.length == 0) {
  511. FileUtils.delete(dir, FileUtils.IGNORE_ERRORS);
  512. continue;
  513. }
  514. for (File f : entries) {
  515. checkCancelled();
  516. String fName = f.getName();
  517. if (fName.length() != Constants.OBJECT_ID_STRING_LENGTH - 2)
  518. continue;
  519. if (repo.getFS().lastModified(f) >= expireDate)
  520. continue;
  521. try {
  522. ObjectId id = ObjectId.fromString(d + fName);
  523. if (objectsToKeep.contains(id))
  524. continue;
  525. if (indexObjects == null)
  526. indexObjects = listNonHEADIndexObjects();
  527. if (indexObjects.contains(id))
  528. continue;
  529. deletionCandidates.put(id, f);
  530. } catch (IllegalArgumentException notAnObject) {
  531. // ignoring the file that does not represent loose
  532. // object
  533. continue;
  534. }
  535. }
  536. }
  537. } finally {
  538. pm.endTask();
  539. }
  540. if (deletionCandidates.isEmpty()) {
  541. return;
  542. }
  543. checkCancelled();
  544. // From the set of current refs remove all those which have been handled
  545. // during last repack(). Only those refs will survive which have been
  546. // added or modified since the last repack. Only these can save existing
  547. // loose refs from being pruned.
  548. Collection<Ref> newRefs;
  549. if (lastPackedRefs == null || lastPackedRefs.isEmpty())
  550. newRefs = getAllRefs();
  551. else {
  552. Map<String, Ref> last = new HashMap<>();
  553. for (Ref r : lastPackedRefs) {
  554. last.put(r.getName(), r);
  555. }
  556. newRefs = new ArrayList<>();
  557. for (Ref r : getAllRefs()) {
  558. Ref old = last.get(r.getName());
  559. if (!equals(r, old)) {
  560. newRefs.add(r);
  561. }
  562. }
  563. }
  564. if (!newRefs.isEmpty()) {
  565. // There are new/modified refs! Check which loose objects are now
  566. // referenced by these modified refs (or their reflogentries).
  567. // Remove these loose objects
  568. // from the deletionCandidates. When the last candidate is removed
  569. // leave this method.
  570. ObjectWalk w = new ObjectWalk(repo);
  571. try {
  572. for (Ref cr : newRefs) {
  573. checkCancelled();
  574. w.markStart(w.parseAny(cr.getObjectId()));
  575. }
  576. if (lastPackedRefs != null)
  577. for (Ref lpr : lastPackedRefs) {
  578. w.markUninteresting(w.parseAny(lpr.getObjectId()));
  579. }
  580. removeReferenced(deletionCandidates, w);
  581. } finally {
  582. w.dispose();
  583. }
  584. }
  585. if (deletionCandidates.isEmpty())
  586. return;
  587. // Since we have not left the method yet there are still
  588. // deletionCandidates. Last chance for these objects not to be pruned is
  589. // that they are referenced by reflog entries. Even refs which currently
  590. // point to the same object as during last repack() may have
  591. // additional reflog entries not handled during last repack()
  592. ObjectWalk w = new ObjectWalk(repo);
  593. try {
  594. for (Ref ar : getAllRefs())
  595. for (ObjectId id : listRefLogObjects(ar, lastRepackTime)) {
  596. checkCancelled();
  597. w.markStart(w.parseAny(id));
  598. }
  599. if (lastPackedRefs != null)
  600. for (Ref lpr : lastPackedRefs) {
  601. checkCancelled();
  602. w.markUninteresting(w.parseAny(lpr.getObjectId()));
  603. }
  604. removeReferenced(deletionCandidates, w);
  605. } finally {
  606. w.dispose();
  607. }
  608. if (deletionCandidates.isEmpty())
  609. return;
  610. checkCancelled();
  611. // delete all candidates which have survived: these are unreferenced
  612. // loose objects. Make a last check, though, to avoid deleting objects
  613. // that could have been referenced while the candidates list was being
  614. // built (by an incoming push, for example).
  615. Set<File> touchedFanout = new HashSet<>();
  616. for (File f : deletionCandidates.values()) {
  617. if (f.lastModified() < expireDate) {
  618. f.delete();
  619. touchedFanout.add(f.getParentFile());
  620. }
  621. }
  622. for (File f : touchedFanout) {
  623. FileUtils.delete(f,
  624. FileUtils.EMPTY_DIRECTORIES_ONLY | FileUtils.IGNORE_ERRORS);
  625. }
  626. repo.getObjectDatabase().close();
  627. }
  628. private long getExpireDate() throws ParseException {
  629. long expireDate = Long.MAX_VALUE;
  630. if (expire == null && expireAgeMillis == -1) {
  631. String pruneExpireStr = getPruneExpireStr();
  632. if (pruneExpireStr == null)
  633. pruneExpireStr = PRUNE_EXPIRE_DEFAULT;
  634. expire = GitDateParser.parse(pruneExpireStr, null, SystemReader
  635. .getInstance().getLocale());
  636. expireAgeMillis = -1;
  637. }
  638. if (expire != null)
  639. expireDate = expire.getTime();
  640. if (expireAgeMillis != -1)
  641. expireDate = System.currentTimeMillis() - expireAgeMillis;
  642. return expireDate;
  643. }
  644. private String getPruneExpireStr() {
  645. return repo.getConfig().getString(
  646. ConfigConstants.CONFIG_GC_SECTION, null,
  647. ConfigConstants.CONFIG_KEY_PRUNEEXPIRE);
  648. }
  649. private long getPackExpireDate() throws ParseException {
  650. long packExpireDate = Long.MAX_VALUE;
  651. if (packExpire == null && packExpireAgeMillis == -1) {
  652. String prunePackExpireStr = repo.getConfig().getString(
  653. ConfigConstants.CONFIG_GC_SECTION, null,
  654. ConfigConstants.CONFIG_KEY_PRUNEPACKEXPIRE);
  655. if (prunePackExpireStr == null)
  656. prunePackExpireStr = PRUNE_PACK_EXPIRE_DEFAULT;
  657. packExpire = GitDateParser.parse(prunePackExpireStr, null,
  658. SystemReader.getInstance().getLocale());
  659. packExpireAgeMillis = -1;
  660. }
  661. if (packExpire != null)
  662. packExpireDate = packExpire.getTime();
  663. if (packExpireAgeMillis != -1)
  664. packExpireDate = System.currentTimeMillis() - packExpireAgeMillis;
  665. return packExpireDate;
  666. }
  667. /**
  668. * Remove all entries from a map which key is the id of an object referenced
  669. * by the given ObjectWalk
  670. *
  671. * @param id2File
  672. * @param w
  673. * @throws MissingObjectException
  674. * @throws IncorrectObjectTypeException
  675. * @throws IOException
  676. */
  677. private void removeReferenced(Map<ObjectId, File> id2File,
  678. ObjectWalk w) throws MissingObjectException,
  679. IncorrectObjectTypeException, IOException {
  680. RevObject ro = w.next();
  681. while (ro != null) {
  682. checkCancelled();
  683. if (id2File.remove(ro.getId()) != null)
  684. if (id2File.isEmpty())
  685. return;
  686. ro = w.next();
  687. }
  688. ro = w.nextObject();
  689. while (ro != null) {
  690. checkCancelled();
  691. if (id2File.remove(ro.getId()) != null)
  692. if (id2File.isEmpty())
  693. return;
  694. ro = w.nextObject();
  695. }
  696. }
  697. private static boolean equals(Ref r1, Ref r2) {
  698. if (r1 == null || r2 == null)
  699. return false;
  700. if (r1.isSymbolic()) {
  701. if (!r2.isSymbolic())
  702. return false;
  703. return r1.getTarget().getName().equals(r2.getTarget().getName());
  704. } else {
  705. if (r2.isSymbolic()) {
  706. return false;
  707. }
  708. return Objects.equals(r1.getObjectId(), r2.getObjectId());
  709. }
  710. }
  711. /**
  712. * Packs all non-symbolic, loose refs into packed-refs.
  713. *
  714. * @throws java.io.IOException
  715. */
  716. public void packRefs() throws IOException {
  717. Collection<Ref> refs = repo.getRefDatabase().getRefs(Constants.R_REFS).values();
  718. List<String> refsToBePacked = new ArrayList<>(refs.size());
  719. pm.beginTask(JGitText.get().packRefs, refs.size());
  720. try {
  721. for (Ref ref : refs) {
  722. checkCancelled();
  723. if (!ref.isSymbolic() && ref.getStorage().isLoose())
  724. refsToBePacked.add(ref.getName());
  725. pm.update(1);
  726. }
  727. ((RefDirectory) repo.getRefDatabase()).pack(refsToBePacked);
  728. } finally {
  729. pm.endTask();
  730. }
  731. }
  732. /**
  733. * Packs all objects which reachable from any of the heads into one pack
  734. * file. Additionally all objects which are not reachable from any head but
  735. * which are reachable from any of the other refs (e.g. tags), special refs
  736. * (e.g. FETCH_HEAD) or index are packed into a separate pack file. Objects
  737. * included in pack files which have a .keep file associated are never
  738. * repacked. All old pack files which existed before are deleted.
  739. *
  740. * @return a collection of the newly created pack files
  741. * @throws java.io.IOException
  742. * when during reading of refs, index, packfiles, objects,
  743. * reflog-entries or during writing to the packfiles
  744. * {@link java.io.IOException} occurs
  745. */
  746. public Collection<PackFile> repack() throws IOException {
  747. Collection<PackFile> toBeDeleted = repo.getObjectDatabase().getPacks();
  748. long time = System.currentTimeMillis();
  749. Collection<Ref> refsBefore = getAllRefs();
  750. Set<ObjectId> allHeadsAndTags = new HashSet<>();
  751. Set<ObjectId> allHeads = new HashSet<>();
  752. Set<ObjectId> allTags = new HashSet<>();
  753. Set<ObjectId> nonHeads = new HashSet<>();
  754. Set<ObjectId> txnHeads = new HashSet<>();
  755. Set<ObjectId> tagTargets = new HashSet<>();
  756. Set<ObjectId> indexObjects = listNonHEADIndexObjects();
  757. RefDatabase refdb = repo.getRefDatabase();
  758. for (Ref ref : refsBefore) {
  759. checkCancelled();
  760. nonHeads.addAll(listRefLogObjects(ref, 0));
  761. if (ref.isSymbolic() || ref.getObjectId() == null) {
  762. continue;
  763. }
  764. if (isHead(ref)) {
  765. allHeads.add(ref.getObjectId());
  766. } else if (isTag(ref)) {
  767. allTags.add(ref.getObjectId());
  768. } else if (RefTreeNames.isRefTree(refdb, ref.getName())) {
  769. txnHeads.add(ref.getObjectId());
  770. } else {
  771. nonHeads.add(ref.getObjectId());
  772. }
  773. if (ref.getPeeledObjectId() != null) {
  774. tagTargets.add(ref.getPeeledObjectId());
  775. }
  776. }
  777. List<ObjectIdSet> excluded = new LinkedList<>();
  778. for (final PackFile f : repo.getObjectDatabase().getPacks()) {
  779. checkCancelled();
  780. if (f.shouldBeKept())
  781. excluded.add(f.getIndex());
  782. }
  783. // Don't exclude tags that are also branch tips
  784. allTags.removeAll(allHeads);
  785. allHeadsAndTags.addAll(allHeads);
  786. allHeadsAndTags.addAll(allTags);
  787. // Hoist all branch tips and tags earlier in the pack file
  788. tagTargets.addAll(allHeadsAndTags);
  789. nonHeads.addAll(indexObjects);
  790. // Combine the GC_REST objects into the GC pack if requested
  791. if (pconfig != null && pconfig.getSinglePack()) {
  792. allHeadsAndTags.addAll(nonHeads);
  793. nonHeads.clear();
  794. }
  795. List<PackFile> ret = new ArrayList<>(2);
  796. PackFile heads = null;
  797. if (!allHeadsAndTags.isEmpty()) {
  798. heads = writePack(allHeadsAndTags, PackWriter.NONE, allTags,
  799. tagTargets, excluded);
  800. if (heads != null) {
  801. ret.add(heads);
  802. excluded.add(0, heads.getIndex());
  803. }
  804. }
  805. if (!nonHeads.isEmpty()) {
  806. PackFile rest = writePack(nonHeads, allHeadsAndTags, PackWriter.NONE,
  807. tagTargets, excluded);
  808. if (rest != null)
  809. ret.add(rest);
  810. }
  811. if (!txnHeads.isEmpty()) {
  812. PackFile txn = writePack(txnHeads, PackWriter.NONE, PackWriter.NONE,
  813. null, excluded);
  814. if (txn != null)
  815. ret.add(txn);
  816. }
  817. try {
  818. deleteOldPacks(toBeDeleted, ret);
  819. } catch (ParseException e) {
  820. // TODO: the exception has to be wrapped into an IOException because
  821. // throwing the ParseException directly would break the API, instead
  822. // we should throw a ConfigInvalidException
  823. throw new IOException(e);
  824. }
  825. prunePacked();
  826. deleteEmptyRefsFolders();
  827. deleteOrphans();
  828. deleteTempPacksIdx();
  829. lastPackedRefs = refsBefore;
  830. lastRepackTime = time;
  831. return ret;
  832. }
  833. private static boolean isHead(Ref ref) {
  834. return ref.getName().startsWith(Constants.R_HEADS);
  835. }
  836. private static boolean isTag(Ref ref) {
  837. return ref.getName().startsWith(Constants.R_TAGS);
  838. }
  839. private void deleteEmptyRefsFolders() throws IOException {
  840. Path refs = repo.getDirectory().toPath().resolve(Constants.R_REFS);
  841. // Avoid deleting a folder that was created after the threshold so that concurrent
  842. // operations trying to create a reference are not impacted
  843. Instant threshold = Instant.now().minus(30, ChronoUnit.SECONDS);
  844. try (Stream<Path> entries = Files.list(refs)) {
  845. Iterator<Path> iterator = entries.iterator();
  846. while (iterator.hasNext()) {
  847. try (Stream<Path> s = Files.list(iterator.next())) {
  848. s.filter(path -> canBeSafelyDeleted(path, threshold)).forEach(this::deleteDir);
  849. }
  850. }
  851. }
  852. }
  853. private boolean canBeSafelyDeleted(Path path, Instant threshold) {
  854. try {
  855. return Files.getLastModifiedTime(path).toInstant().isBefore(threshold);
  856. }
  857. catch (IOException e) {
  858. LOG.warn(MessageFormat.format(
  859. JGitText.get().cannotAccessLastModifiedForSafeDeletion,
  860. path), e);
  861. return false;
  862. }
  863. }
  864. private void deleteDir(Path dir) {
  865. try (Stream<Path> dirs = Files.walk(dir)) {
  866. dirs.filter(this::isDirectory).sorted(Comparator.reverseOrder())
  867. .forEach(this::delete);
  868. } catch (IOException e) {
  869. LOG.error(e.getMessage(), e);
  870. }
  871. }
  872. private boolean isDirectory(Path p) {
  873. return p.toFile().isDirectory();
  874. }
  875. private void delete(Path d) {
  876. try {
  877. Files.delete(d);
  878. } catch (DirectoryNotEmptyException e) {
  879. // Don't log
  880. } catch (IOException e) {
  881. LOG.error(MessageFormat.format(JGitText.get().cannotDeleteFile, d),
  882. e);
  883. }
  884. }
  885. /**
  886. * Deletes orphans
  887. * <p>
  888. * A file is considered an orphan if it is either a "bitmap" or an index
  889. * file, and its corresponding pack file is missing in the list.
  890. * </p>
  891. */
  892. private void deleteOrphans() {
  893. Path packDir = repo.getObjectDatabase().getPackDirectory().toPath();
  894. List<String> fileNames = null;
  895. try (Stream<Path> files = Files.list(packDir)) {
  896. fileNames = files.map(path -> path.getFileName().toString())
  897. .filter(name -> {
  898. return (name.endsWith(PACK_EXT)
  899. || name.endsWith(BITMAP_EXT)
  900. || name.endsWith(INDEX_EXT));
  901. }).sorted(Collections.reverseOrder())
  902. .collect(Collectors.toList());
  903. } catch (IOException e1) {
  904. // ignore
  905. }
  906. if (fileNames == null) {
  907. return;
  908. }
  909. String base = null;
  910. for (String n : fileNames) {
  911. if (n.endsWith(PACK_EXT)) {
  912. base = n.substring(0, n.lastIndexOf('.'));
  913. } else {
  914. if (base == null || !n.startsWith(base)) {
  915. try {
  916. Files.delete(FileUtils.toPath(new File(packDir.toFile(), n)));
  917. } catch (IOException e) {
  918. LOG.error(e.getMessage(), e);
  919. }
  920. }
  921. }
  922. }
  923. }
  924. private void deleteTempPacksIdx() {
  925. Path packDir = repo.getObjectDatabase().getPackDirectory().toPath();
  926. Instant threshold = Instant.now().minus(1, ChronoUnit.DAYS);
  927. try (DirectoryStream<Path> stream =
  928. Files.newDirectoryStream(packDir, "gc_*_tmp")) { //$NON-NLS-1$
  929. stream.forEach(t -> {
  930. try {
  931. Instant lastModified = Files.getLastModifiedTime(t)
  932. .toInstant();
  933. if (lastModified.isBefore(threshold)) {
  934. Files.deleteIfExists(t);
  935. }
  936. } catch (IOException e) {
  937. LOG.error(e.getMessage(), e);
  938. }
  939. });
  940. } catch (IOException e) {
  941. LOG.error(e.getMessage(), e);
  942. }
  943. }
  944. /**
  945. * @param ref
  946. * the ref which log should be inspected
  947. * @param minTime only reflog entries not older then this time are processed
  948. * @return the {@link ObjectId}s contained in the reflog
  949. * @throws IOException
  950. */
  951. private Set<ObjectId> listRefLogObjects(Ref ref, long minTime) throws IOException {
  952. ReflogReader reflogReader = repo.getReflogReader(ref.getName());
  953. if (reflogReader == null) {
  954. return Collections.emptySet();
  955. }
  956. List<ReflogEntry> rlEntries = reflogReader
  957. .getReverseEntries();
  958. if (rlEntries == null || rlEntries.isEmpty())
  959. return Collections.<ObjectId> emptySet();
  960. Set<ObjectId> ret = new HashSet<>();
  961. for (ReflogEntry e : rlEntries) {
  962. if (e.getWho().getWhen().getTime() < minTime)
  963. break;
  964. ObjectId newId = e.getNewId();
  965. if (newId != null && !ObjectId.zeroId().equals(newId))
  966. ret.add(newId);
  967. ObjectId oldId = e.getOldId();
  968. if (oldId != null && !ObjectId.zeroId().equals(oldId))
  969. ret.add(oldId);
  970. }
  971. return ret;
  972. }
  973. /**
  974. * Returns a collection of all refs and additional refs.
  975. *
  976. * Additional refs which don't start with "refs/" are not returned because
  977. * they should not save objects from being garbage collected. Examples for
  978. * such references are ORIG_HEAD, MERGE_HEAD, FETCH_HEAD and
  979. * CHERRY_PICK_HEAD.
  980. *
  981. * @return a collection of refs pointing to live objects.
  982. * @throws IOException
  983. */
  984. private Collection<Ref> getAllRefs() throws IOException {
  985. RefDatabase refdb = repo.getRefDatabase();
  986. Collection<Ref> refs = refdb.getRefs(RefDatabase.ALL).values();
  987. List<Ref> addl = refdb.getAdditionalRefs();
  988. if (!addl.isEmpty()) {
  989. List<Ref> all = new ArrayList<>(refs.size() + addl.size());
  990. all.addAll(refs);
  991. // add additional refs which start with refs/
  992. for (Ref r : addl) {
  993. checkCancelled();
  994. if (r.getName().startsWith(Constants.R_REFS)) {
  995. all.add(r);
  996. }
  997. }
  998. return all;
  999. }
  1000. return refs;
  1001. }
  1002. /**
  1003. * Return a list of those objects in the index which differ from whats in
  1004. * HEAD
  1005. *
  1006. * @return a set of ObjectIds of changed objects in the index
  1007. * @throws IOException
  1008. * @throws CorruptObjectException
  1009. * @throws NoWorkTreeException
  1010. */
  1011. private Set<ObjectId> listNonHEADIndexObjects()
  1012. throws CorruptObjectException, IOException {
  1013. if (repo.isBare()) {
  1014. return Collections.emptySet();
  1015. }
  1016. try (TreeWalk treeWalk = new TreeWalk(repo)) {
  1017. treeWalk.addTree(new DirCacheIterator(repo.readDirCache()));
  1018. ObjectId headID = repo.resolve(Constants.HEAD);
  1019. if (headID != null) {
  1020. try (RevWalk revWalk = new RevWalk(repo)) {
  1021. treeWalk.addTree(revWalk.parseTree(headID));
  1022. }
  1023. }
  1024. treeWalk.setFilter(TreeFilter.ANY_DIFF);
  1025. treeWalk.setRecursive(true);
  1026. Set<ObjectId> ret = new HashSet<>();
  1027. while (treeWalk.next()) {
  1028. checkCancelled();
  1029. ObjectId objectId = treeWalk.getObjectId(0);
  1030. switch (treeWalk.getRawMode(0) & FileMode.TYPE_MASK) {
  1031. case FileMode.TYPE_MISSING:
  1032. case FileMode.TYPE_GITLINK:
  1033. continue;
  1034. case FileMode.TYPE_TREE:
  1035. case FileMode.TYPE_FILE:
  1036. case FileMode.TYPE_SYMLINK:
  1037. ret.add(objectId);
  1038. continue;
  1039. default:
  1040. throw new IOException(MessageFormat.format(
  1041. JGitText.get().corruptObjectInvalidMode3,
  1042. String.format("%o", //$NON-NLS-1$
  1043. Integer.valueOf(treeWalk.getRawMode(0))),
  1044. (objectId == null) ? "null" : objectId.name(), //$NON-NLS-1$
  1045. treeWalk.getPathString(), //
  1046. repo.getIndexFile()));
  1047. }
  1048. }
  1049. return ret;
  1050. }
  1051. }
  1052. private PackFile writePack(@NonNull Set<? extends ObjectId> want,
  1053. @NonNull Set<? extends ObjectId> have, @NonNull Set<ObjectId> tags,
  1054. Set<ObjectId> tagTargets, List<ObjectIdSet> excludeObjects)
  1055. throws IOException {
  1056. checkCancelled();
  1057. File tmpPack = null;
  1058. Map<PackExt, File> tmpExts = new TreeMap<>(
  1059. new Comparator<PackExt>() {
  1060. @Override
  1061. public int compare(PackExt o1, PackExt o2) {
  1062. // INDEX entries must be returned last, so the pack
  1063. // scanner does pick up the new pack until all the
  1064. // PackExt entries have been written.
  1065. if (o1 == o2)
  1066. return 0;
  1067. if (o1 == PackExt.INDEX)
  1068. return 1;
  1069. if (o2 == PackExt.INDEX)
  1070. return -1;
  1071. return Integer.signum(o1.hashCode() - o2.hashCode());
  1072. }
  1073. });
  1074. try (PackWriter pw = new PackWriter(
  1075. (pconfig == null) ? new PackConfig(repo) : pconfig,
  1076. repo.newObjectReader())) {
  1077. // prepare the PackWriter
  1078. pw.setDeltaBaseAsOffset(true);
  1079. pw.setReuseDeltaCommits(false);
  1080. if (tagTargets != null) {
  1081. pw.setTagTargets(tagTargets);
  1082. }
  1083. if (excludeObjects != null)
  1084. for (ObjectIdSet idx : excludeObjects)
  1085. pw.excludeObjects(idx);
  1086. pw.preparePack(pm, want, have, PackWriter.NONE, tags);
  1087. if (pw.getObjectCount() == 0)
  1088. return null;
  1089. checkCancelled();
  1090. // create temporary files
  1091. String id = pw.computeName().getName();
  1092. File packdir = repo.getObjectDatabase().getPackDirectory();
  1093. tmpPack = File.createTempFile("gc_", ".pack_tmp", packdir); //$NON-NLS-1$ //$NON-NLS-2$
  1094. final String tmpBase = tmpPack.getName()
  1095. .substring(0, tmpPack.getName().lastIndexOf('.'));
  1096. File tmpIdx = new File(packdir, tmpBase + ".idx_tmp"); //$NON-NLS-1$
  1097. tmpExts.put(INDEX, tmpIdx);
  1098. if (!tmpIdx.createNewFile())
  1099. throw new IOException(MessageFormat.format(
  1100. JGitText.get().cannotCreateIndexfile, tmpIdx.getPath()));
  1101. // write the packfile
  1102. FileOutputStream fos = new FileOutputStream(tmpPack);
  1103. FileChannel channel = fos.getChannel();
  1104. OutputStream channelStream = Channels.newOutputStream(channel);
  1105. try {
  1106. pw.writePack(pm, pm, channelStream);
  1107. } finally {
  1108. channel.force(true);
  1109. channelStream.close();
  1110. fos.close();
  1111. }
  1112. // write the packindex
  1113. fos = new FileOutputStream(tmpIdx);
  1114. FileChannel idxChannel = fos.getChannel();
  1115. OutputStream idxStream = Channels.newOutputStream(idxChannel);
  1116. try {
  1117. pw.writeIndex(idxStream);
  1118. } finally {
  1119. idxChannel.force(true);
  1120. idxStream.close();
  1121. fos.close();
  1122. }
  1123. if (pw.prepareBitmapIndex(pm)) {
  1124. File tmpBitmapIdx = new File(packdir, tmpBase + ".bitmap_tmp"); //$NON-NLS-1$
  1125. tmpExts.put(BITMAP_INDEX, tmpBitmapIdx);
  1126. if (!tmpBitmapIdx.createNewFile())
  1127. throw new IOException(MessageFormat.format(
  1128. JGitText.get().cannotCreateIndexfile,
  1129. tmpBitmapIdx.getPath()));
  1130. fos = new FileOutputStream(tmpBitmapIdx);
  1131. idxChannel = fos.getChannel();
  1132. idxStream = Channels.newOutputStream(idxChannel);
  1133. try {
  1134. pw.writeBitmapIndex(idxStream);
  1135. } finally {
  1136. idxChannel.force(true);
  1137. idxStream.close();
  1138. fos.close();
  1139. }
  1140. }
  1141. // rename the temporary files to real files
  1142. File realPack = nameFor(id, ".pack"); //$NON-NLS-1$
  1143. repo.getObjectDatabase().closeAllPackHandles(realPack);
  1144. tmpPack.setReadOnly();
  1145. FileUtils.rename(tmpPack, realPack, StandardCopyOption.ATOMIC_MOVE);
  1146. for (Map.Entry<PackExt, File> tmpEntry : tmpExts.entrySet()) {
  1147. File tmpExt = tmpEntry.getValue();
  1148. tmpExt.setReadOnly();
  1149. File realExt = nameFor(id,
  1150. "." + tmpEntry.getKey().getExtension()); //$NON-NLS-1$
  1151. try {
  1152. FileUtils.rename(tmpExt, realExt,
  1153. StandardCopyOption.ATOMIC_MOVE);
  1154. } catch (IOException e) {
  1155. File newExt = new File(realExt.getParentFile(),
  1156. realExt.getName() + ".new"); //$NON-NLS-1$
  1157. try {
  1158. FileUtils.rename(tmpExt, newExt,
  1159. StandardCopyOption.ATOMIC_MOVE);
  1160. } catch (IOException e2) {
  1161. newExt = tmpExt;
  1162. e = e2;
  1163. }
  1164. throw new IOException(MessageFormat.format(
  1165. JGitText.get().panicCantRenameIndexFile, newExt,
  1166. realExt), e);
  1167. }
  1168. }
  1169. return repo.getObjectDatabase().openPack(realPack);
  1170. } finally {
  1171. if (tmpPack != null && tmpPack.exists())
  1172. tmpPack.delete();
  1173. for (File tmpExt : tmpExts.values()) {
  1174. if (tmpExt.exists())
  1175. tmpExt.delete();
  1176. }
  1177. }
  1178. }
  1179. private File nameFor(String name, String ext) {
  1180. File packdir = repo.getObjectDatabase().getPackDirectory();
  1181. return new File(packdir, "pack-" + name + ext); //$NON-NLS-1$
  1182. }
  1183. private void checkCancelled() throws CancelledException {
  1184. if (pm.isCancelled() || Thread.currentThread().isInterrupted()) {
  1185. throw new CancelledException(JGitText.get().operationCanceled);
  1186. }
  1187. }
  1188. /**
  1189. * A class holding statistical data for a FileRepository regarding how many
  1190. * objects are stored as loose or packed objects
  1191. */
  1192. public static class RepoStatistics {
  1193. /**
  1194. * The number of objects stored in pack files. If the same object is
  1195. * stored in multiple pack files then it is counted as often as it
  1196. * occurs in pack files.
  1197. */
  1198. public long numberOfPackedObjects;
  1199. /**
  1200. * The number of pack files
  1201. */
  1202. public long numberOfPackFiles;
  1203. /**
  1204. * The number of objects stored as loose objects.
  1205. */
  1206. public long numberOfLooseObjects;
  1207. /**
  1208. * The sum of the sizes of all files used to persist loose objects.
  1209. */
  1210. public long sizeOfLooseObjects;
  1211. /**
  1212. * The sum of the sizes of all pack files.
  1213. */
  1214. public long sizeOfPackedObjects;
  1215. /**
  1216. * The number of loose refs.
  1217. */
  1218. public long numberOfLooseRefs;
  1219. /**
  1220. * The number of refs stored in pack files.
  1221. */
  1222. public long numberOfPackedRefs;
  1223. /**
  1224. * The number of bitmaps in the bitmap indices.
  1225. */
  1226. public long numberOfBitmaps;
  1227. @Override
  1228. public String toString() {
  1229. final StringBuilder b = new StringBuilder();
  1230. b.append("numberOfPackedObjects=").append(numberOfPackedObjects); //$NON-NLS-1$
  1231. b.append(", numberOfPackFiles=").append(numberOfPackFiles); //$NON-NLS-1$
  1232. b.append(", numberOfLooseObjects=").append(numberOfLooseObjects); //$NON-NLS-1$
  1233. b.append(", numberOfLooseRefs=").append(numberOfLooseRefs); //$NON-NLS-1$
  1234. b.append(", numberOfPackedRefs=").append(numberOfPackedRefs); //$NON-NLS-1$
  1235. b.append(", sizeOfLooseObjects=").append(sizeOfLooseObjects); //$NON-NLS-1$
  1236. b.append(", sizeOfPackedObjects=").append(sizeOfPackedObjects); //$NON-NLS-1$
  1237. b.append(", numberOfBitmaps=").append(numberOfBitmaps); //$NON-NLS-1$
  1238. return b.toString();
  1239. }
  1240. }
  1241. /**
  1242. * Returns information about objects and pack files for a FileRepository.
  1243. *
  1244. * @return information about objects and pack files for a FileRepository
  1245. * @throws java.io.IOException
  1246. */
  1247. public RepoStatistics getStatistics() throws IOException {
  1248. RepoStatistics ret = new RepoStatistics();
  1249. Collection<PackFile> packs = repo.getObjectDatabase().getPacks();
  1250. for (PackFile f : packs) {
  1251. ret.numberOfPackedObjects += f.getIndex().getObjectCount();
  1252. ret.numberOfPackFiles++;
  1253. ret.sizeOfPackedObjects += f.getPackFile().length();
  1254. if (f.getBitmapIndex() != null)
  1255. ret.numberOfBitmaps += f.getBitmapIndex().getBitmapCount();
  1256. }
  1257. File objDir = repo.getObjectsDirectory();
  1258. String[] fanout = objDir.list();
  1259. if (fanout != null && fanout.length > 0) {
  1260. for (String d : fanout) {
  1261. if (d.length() != 2)
  1262. continue;
  1263. File[] entries = new File(objDir, d).listFiles();
  1264. if (entries == null)
  1265. continue;
  1266. for (File f : entries) {
  1267. if (f.getName().length() != Constants.OBJECT_ID_STRING_LENGTH - 2)
  1268. continue;
  1269. ret.numberOfLooseObjects++;
  1270. ret.sizeOfLooseObjects += f.length();
  1271. }
  1272. }
  1273. }
  1274. RefDatabase refDb = repo.getRefDatabase();
  1275. for (Ref r : refDb.getRefs(RefDatabase.ALL).values()) {
  1276. Storage storage = r.getStorage();
  1277. if (storage == Storage.LOOSE || storage == Storage.LOOSE_PACKED)
  1278. ret.numberOfLooseRefs++;
  1279. if (storage == Storage.PACKED || storage == Storage.LOOSE_PACKED)
  1280. ret.numberOfPackedRefs++;
  1281. }
  1282. return ret;
  1283. }
  1284. /**
  1285. * Set the progress monitor used for garbage collection methods.
  1286. *
  1287. * @param pm a {@link org.eclipse.jgit.lib.ProgressMonitor} object.
  1288. * @return this
  1289. */
  1290. public GC setProgressMonitor(ProgressMonitor pm) {
  1291. this.pm = (pm == null) ? NullProgressMonitor.INSTANCE : pm;
  1292. return this;
  1293. }
  1294. /**
  1295. * During gc() or prune() each unreferenced, loose object which has been
  1296. * created or modified in the last <code>expireAgeMillis</code> milliseconds
  1297. * will not be pruned. Only older objects may be pruned. If set to 0 then
  1298. * every object is a candidate for pruning.
  1299. *
  1300. * @param expireAgeMillis
  1301. * minimal age of objects to be pruned in milliseconds.
  1302. */
  1303. public void setExpireAgeMillis(long expireAgeMillis) {
  1304. this.expireAgeMillis = expireAgeMillis;
  1305. expire = null;
  1306. }
  1307. /**
  1308. * During gc() or prune() packfiles which are created or modified in the
  1309. * last <code>packExpireAgeMillis</code> milliseconds will not be deleted.
  1310. * Only older packfiles may be deleted. If set to 0 then every packfile is a
  1311. * candidate for deletion.
  1312. *
  1313. * @param packExpireAgeMillis
  1314. * minimal age of packfiles to be deleted in milliseconds.
  1315. */
  1316. public void setPackExpireAgeMillis(long packExpireAgeMillis) {
  1317. this.packExpireAgeMillis = packExpireAgeMillis;
  1318. expire = null;
  1319. }
  1320. /**
  1321. * Set the PackConfig used when (re-)writing packfiles. This allows to
  1322. * influence how packs are written and to implement something similar to
  1323. * "git gc --aggressive"
  1324. *
  1325. * @param pconfig
  1326. * the {@link org.eclipse.jgit.storage.pack.PackConfig} used when
  1327. * writing packs
  1328. */
  1329. public void setPackConfig(PackConfig pconfig) {
  1330. this.pconfig = pconfig;
  1331. }
  1332. /**
  1333. * During gc() or prune() each unreferenced, loose object which has been
  1334. * created or modified after or at <code>expire</code> will not be pruned.
  1335. * Only older objects may be pruned. If set to null then every object is a
  1336. * candidate for pruning.
  1337. *
  1338. * @param expire
  1339. * instant in time which defines object expiration
  1340. * objects with modification time before this instant are expired
  1341. * objects with modification time newer or equal to this instant
  1342. * are not expired
  1343. */
  1344. public void setExpire(Date expire) {
  1345. this.expire = expire;
  1346. expireAgeMillis = -1;
  1347. }
  1348. /**
  1349. * During gc() or prune() packfiles which are created or modified after or
  1350. * at <code>packExpire</code> will not be deleted. Only older packfiles may
  1351. * be deleted. If set to null then every packfile is a candidate for
  1352. * deletion.
  1353. *
  1354. * @param packExpire
  1355. * instant in time which defines packfile expiration
  1356. */
  1357. public void setPackExpire(Date packExpire) {
  1358. this.packExpire = packExpire;
  1359. packExpireAgeMillis = -1;
  1360. }
  1361. /**
  1362. * Set the {@code gc --auto} option.
  1363. *
  1364. * With this option, gc checks whether any housekeeping is required; if not,
  1365. * it exits without performing any work. Some JGit commands run
  1366. * {@code gc --auto} after performing operations that could create many
  1367. * loose objects.
  1368. * <p>
  1369. * Housekeeping is required if there are too many loose objects or too many
  1370. * packs in the repository. If the number of loose objects exceeds the value
  1371. * of the gc.auto option JGit GC consolidates all existing packs into a
  1372. * single pack (equivalent to {@code -A} option), whereas git-core would
  1373. * combine all loose objects into a single pack using {@code repack -d -l}.
  1374. * Setting the value of {@code gc.auto} to 0 disables automatic packing of
  1375. * loose objects.
  1376. * <p>
  1377. * If the number of packs exceeds the value of {@code gc.autoPackLimit},
  1378. * then existing packs (except those marked with a .keep file) are
  1379. * consolidated into a single pack by using the {@code -A} option of repack.
  1380. * Setting {@code gc.autoPackLimit} to 0 disables automatic consolidation of
  1381. * packs.
  1382. * <p>
  1383. * Like git the following jgit commands run auto gc:
  1384. * <ul>
  1385. * <li>fetch</li>
  1386. * <li>merge</li>
  1387. * <li>rebase</li>
  1388. * <li>receive-pack</li>
  1389. * </ul>
  1390. * The auto gc for receive-pack can be suppressed by setting the config
  1391. * option {@code receive.autogc = false}
  1392. *
  1393. * @param auto
  1394. * defines whether gc should do automatic housekeeping
  1395. */
  1396. public void setAuto(boolean auto) {
  1397. this.automatic = auto;
  1398. }
  1399. /**
  1400. * @param background
  1401. * whether to run the gc in a background thread.
  1402. */
  1403. void setBackground(boolean background) {
  1404. this.background = background;
  1405. }
  1406. private boolean needGc() {
  1407. if (tooManyPacks()) {
  1408. addRepackAllOption();
  1409. } else if (!tooManyLooseObjects()) {
  1410. return false;
  1411. }
  1412. // TODO run pre-auto-gc hook, if it fails return false
  1413. return true;
  1414. }
  /**
   * Placeholder called by {@code needGc()} when there are too many packs.
   * Currently does nothing.
   */
  private void addRepackAllOption() {
    // TODO: if JGit GC is enhanced to support repack's option -l this
    // method needs to be implemented
  }
  1419. /**
  1420. * @return {@code true} if number of packs > gc.autopacklimit (default 50)
  1421. */
  1422. boolean tooManyPacks() {
  1423. int autopacklimit = repo.getConfig().getInt(
  1424. ConfigConstants.CONFIG_GC_SECTION,
  1425. ConfigConstants.CONFIG_KEY_AUTOPACKLIMIT,
  1426. DEFAULT_AUTOPACKLIMIT);
  1427. if (autopacklimit <= 0) {
  1428. return false;
  1429. }
  1430. // JGit always creates two packfiles, one for the objects reachable from
  1431. // branches, and another one for the rest
  1432. return repo.getObjectDatabase().getPacks().size() > (autopacklimit + 1);
  1433. }
  1434. /**
  1435. * Quickly estimate number of loose objects, SHA1 is distributed evenly so
  1436. * counting objects in one directory (bucket 17) is sufficient
  1437. *
  1438. * @return {@code true} if number of loose objects > gc.auto (default 6700)
  1439. */
  1440. boolean tooManyLooseObjects() {
  1441. int auto = getLooseObjectLimit();
  1442. if (auto <= 0) {
  1443. return false;
  1444. }
  1445. int n = 0;
  1446. int threshold = (auto + 255) / 256;
  1447. Path dir = repo.getObjectsDirectory().toPath().resolve("17"); //$NON-NLS-1$
  1448. if (!Files.exists(dir)) {
  1449. return false;
  1450. }
  1451. try (DirectoryStream<Path> stream = Files.newDirectoryStream(dir,
  1452. new DirectoryStream.Filter<Path>() {
  1453. @Override
  1454. public boolean accept(Path file) throws IOException {
  1455. Path fileName = file.getFileName();
  1456. return Files.isRegularFile(file) && fileName != null
  1457. && PATTERN_LOOSE_OBJECT
  1458. .matcher(fileName.toString()).matches();
  1459. }
  1460. })) {
  1461. for (Iterator<Path> iter = stream.iterator(); iter.hasNext();
  1462. iter.next()) {
  1463. if (++n > threshold) {
  1464. return true;
  1465. }
  1466. }
  1467. } catch (IOException e) {
  1468. LOG.error(e.getMessage(), e);
  1469. }
  1470. return false;
  1471. }
  1472. private int getLooseObjectLimit() {
  1473. return repo.getConfig().getInt(ConfigConstants.CONFIG_GC_SECTION,
  1474. ConfigConstants.CONFIG_KEY_AUTO, DEFAULT_AUTOLIMIT);
  1475. }
  1476. }