#!/usr/bin/perl -w
# Copyright (C) 2018 all contributors
# License: AGPL-3.0+
use strict;
use warnings;
use Getopt::Long qw(:config gnu_getopt no_ignore_case auto_abbrev);
use PublicInbox::MIME;
use PublicInbox::InboxWritable;
use PublicInbox::Config;
use PublicInbox::V2Writable;
use PublicInbox::Import;
use PublicInbox::Spawn qw(spawn);
use Cwd 'abs_path';
use File::Copy 'cp'; # preserves permissions:
# Command-line handling: optional switches followed by two positional
# arguments, the existing v1 inbox directory and the v2 destination.
my $usage = "Usage: public-inbox-convert OLD NEW\n";
my $jobs; # --jobs/-j N, passed to V2Writable->init_inbox
my $index = 1; # --no-index skips the index_sync step at the end
my %opts = (
	'--jobs|j=i' => \$jobs,
	'--index!' => \$index,
);

# Parse @ARGV exactly once.  GetOptions strips a "--" terminator on the
# first pass, so parsing a second time would treat dash-prefixed
# positional arguments that followed it as (unknown) options.
GetOptions(%opts) or die "bad command-line args\n$usage";

my $old_dir = shift or die $usage;
my $new_dir = shift or die $usage;

# never write into an existing directory; the source must already exist
die "$new_dir exists\n" if -d $new_dir;
die "$old_dir not a directory\n" unless -d $old_dir;
# Find the v1 inbox in the user's configuration (falling back to a
# placeholder inbox when it is not configured), refuse anything that is
# not v1, and derive the v2 inbox description from the v1 one.
my $config = eval { PublicInbox::Config->new };
$old_dir = abs_path($old_dir);
my $old;
if ($config) {
	$config->each_inbox(sub {
		my ($ibx) = @_;
		# abs_path returns undef when a path cannot be resolved;
		# skip such inboxes rather than comparing undef with eq
		my $dir = $ibx->{mainrepo};
		$dir = abs_path($dir) if defined $dir;
		$old = $ibx if defined $dir && $dir eq $old_dir;
	});
}
unless ($old) {
	warn "W: $old_dir not configured in " .
		PublicInbox::Config::default_file() . "\n";
	$old = {
		mainrepo => $old_dir,
		name => 'ignored',
		address => [ 'old@example.com' ],
	};
	$old = PublicInbox::Inbox->new($old);
}
$old = PublicInbox::InboxWritable->new($old);
if (($old->{version} || 1) >= 2) {
	die "Only conversion from v1 inboxes is supported\n";
}

# the new inbox starts as a shallow copy of the old one's fields
my $new = { %$old };
$new->{mainrepo} = abs_path($new_dir);
# an undef mainrepo would make later "$new->{mainrepo}/..." paths
# resolve relative to the filesystem root, so stop here instead
defined $new->{mainrepo} or die "cannot resolve $new_dir: $!\n";
$new->{version} = 2;
$new = PublicInbox::InboxWritable->new($new);
my $v2w; # assigned inside the with_umask callback
$old->umask_prepare;
# Make $dst refer to the same content as $src: hard-link when possible,
# otherwise copy with File::Copy::cp.  A failed link is reported with a
# warning unless the failure was EXDEV.  Dies if the copy fails too.
sub link_or_copy ($$) {
	my ($from_path, $to_path) = @_;
	return if link($from_path, $to_path);
	unless ($!{EXDEV}) {
		warn "link $from_path, $to_path failed: $!, trying cp\n";
	}
	cp($from_path, $to_path) or die "cp $from_path, $to_path failed: $!\n";
}
# Create the v2 inbox and carry per-repository files over from the v1
# inbox, all inside the old inbox's with_umask wrapper.
$old->with_umask(sub {
	my $old_cfg = "$old->{mainrepo}/config";
	# GIT_CONFIG points at the v1 config only while this sub runs
	local $ENV{GIT_CONFIG} = $old_cfg;
	my $new_cfg = "$new->{mainrepo}/all.git/config";
	$v2w = PublicInbox::V2Writable->new($new, 1);
	$v2w->init_inbox($jobs);

	# drop any config already at $new_cfg (presumably written by
	# init_inbox) so the v1 config can be linked into its place
	unlink $new_cfg;
	link_or_copy($old_cfg, $new_cfg);

	# back up each altid database that exists in the old inbox to
	# the filename the new inbox's AltId object reports
	if (my $alt = $new->{altid}) {
		require PublicInbox::AltId;
		foreach my $spec (@$alt) {
			my $src = PublicInbox::AltId->new($old, $spec, 0);
			$src->mm_alt or next;
			my $dst = PublicInbox::AltId->new($new, $spec, 1);
			$dst = $dst->{filename};
			$src->mm_alt->{dbh}->sqlite_backup_to_file($dst);
		}
	}

	my $desc = "$old->{mainrepo}/description";
	link_or_copy($desc, "$new->{mainrepo}/description") if -e $desc;

	# cloneurl is deliberately left behind; only tell the user about it.
	# A plain string is used rather than a here-doc with an empty
	# terminator, which would need a blank line to end it.
	my $clone = "$old->{mainrepo}/cloneurl";
	if (-e $clone) {
		warn "$clone may not be valid after migrating to v2, not copying\n";
	}
});
# Stream "git fast-export" output of the v1 inbox into the v2 importer,
# rewriting the file-change lines of every commit on the way.
my $state = '';
my ($prev, $from); # last two "from" marks seen; recorded but not read here
my $head = $old->{ref_head} || 'HEAD';
my ($rd, $pid) = $old->git->popen(qw(fast-export --use-done-feature), $head);
$v2w->idx_init;
my $im = $v2w->importer;
my ($r, $w) = $im->gfi_start;
my $h = '[0-9a-f]';
my %D; # path (40 hex digits, slash removed) => mark of the blob stored there
my $purged = 0; # true once "deleteall" was written for the current commit
while (<$rd>) {
	if ($_ eq "blob\n") {
		$state = 'blob';
	} elsif (/^commit /) {
		$state = 'commit';
		$purged = 0;
	} elsif (/^data (\d+)/) {
		# forward the header, then exactly $len payload bytes without
		# interpreting them as stream commands
		my $len = $1;
		$w->print($_) or $im->wfail;
		while ($len) {
			my $n = read($rd, my $tmp, $len);
			# undef is an I/O error, 0 is EOF; only the former
			# leaves a meaningful $!
			defined $n or die "read: $!";
			$n or die "read: unexpected EOF, $len bytes missing\n";
			warn "$n != $len\n" if $n != $len;
			$len -= $n;
			$w->print($tmp) or $im->wfail;
		}
		next;
	} elsif ($state eq 'commit') {
		# Before the first file change of each commit, clear the tree.
		# The pattern has no /x flag, so it must not contain padding
		# spaces around "|"; the letters are the fast-import
		# file-change commands followed by a space.
		if (m/^(?:[MDCRN] |deleteall$)/) {
			if (!$purged) {
				$purged = 1;
				$w->print("deleteall\n") or $im->wfail;
			}
		}
		if (m{^M 100644 :(\d+) (${h}{2})/(${h}{38})}o) {
			# remember which blob mark was added at this path
			my ($mark, $path) = ($1, $2 . $3);
			$D{$path} = $mark;
			$w->print("M 100644 :$mark $path\n") or $im->wfail;
			next;
		}
		if (m{^D (${h}{2})/(${h}{38})}o) {
			# a v1 deletion becomes a file named "d" which holds
			# the blob that was originally added at that path
			my $path = $1 . $2;
			my $mark = delete $D{$path};
			defined $mark or die "undeleted path: $path\n";
			$w->print("M 100644 :$mark d\n") or $im->wfail;
			next;
		}
		if (m{^from (:\d+)}) {
			$prev = $from;
			$from = $1;
			# no next
		}
	}
	last if $_ eq "done\n";
	$w->print($_) or $im->wfail;
}
$w = $r = undef;
close $rd or die "close fast-export: $!\n";
# waitpid returns -1 (a true value) on failure, so compare with the pid
waitpid($pid, 0) == $pid or die "waitpid failed: $!\n";
$? == 0 or die "fast-export failed: $?\n";
# Back up the old inbox's msgmap database, when $old->mm returns one,
# to msgmap.sqlite3 inside the new inbox directory.
my $mm = $old->mm;
if ($mm) {
	my $msgmap_copy = "$new_dir/msgmap.sqlite3";
	$mm->{dbh}->sqlite_backup_to_file($msgmap_copy);
}

# Always call done once; when indexing is enabled (the default, turned
# off by --no-index) follow it with index_sync and a second done.
my @steps = ('done');
push @steps, qw(index_sync done) if $index;
foreach my $step (@steps) {
	$v2w->$step;
}