* [PATCH] mbox: stream entire thread, regardless of size
@ 2015-08-21 23:31 Eric Wong
0 siblings, 0 replies; only message in thread
From: Eric Wong @ 2015-08-21 23:31 UTC (permalink / raw)
To: meta
Since mbox is usually downloaded, support fetching infinitely large
responses via streaming.
---
lib/PublicInbox/Mbox.pm | 46 +++++++++++++++++++++++++++++-----------------
lib/PublicInbox/Search.pm | 2 +-
2 files changed, 30 insertions(+), 18 deletions(-)
diff --git a/lib/PublicInbox/Mbox.pm b/lib/PublicInbox/Mbox.pm
index 2ec5065..fc9df1a 100644
--- a/lib/PublicInbox/Mbox.pm
+++ b/lib/PublicInbox/Mbox.pm
@@ -9,27 +9,14 @@ use Fcntl qw(SEEK_SET);
sub thread_mbox {
my ($ctx, $srch) = @_;
- my $mid = mid_compressed($ctx->{mid});
- my $res = $srch->get_thread($mid);
- my $msgs = delete $res->{msgs};
- require PublicInbox::GitCatFile;
- require Email::Simple;
- my $git = PublicInbox::GitCatFile->new($ctx->{git_dir});
-
sub {
- my ($res) = @_; # Plack callback
- my $w = $res->([200, [ 'Content-Type' => 'text/plain' ] ]);
- while (defined(my $smsg = shift @$msgs)) {
- my $msg = eval {
- my $path = 'HEAD:' . mid2path($smsg->mid);
- Email::Simple->new($git->cat_file($path));
- };
- emit($w, $msg) if $msg;
- }
+ my ($response) = @_; # Plack callback
+ my $w = $response->([200, ['Content-Type' => 'text/plain']]);
+ emit_mbox($w, $ctx, $srch);
}
}
-sub emit {
+sub emit_msg {
my ($fh, $simple) = @_; # Email::Simple object
# drop potentially confusing headers, ssoma already should've dropped
@@ -52,4 +39,29 @@ sub emit {
$fh->write($buf);
}
+sub emit_mbox {
+ my ($fh, $ctx, $srch) = @_;
+
+ require PublicInbox::GitCatFile;
+ require Email::Simple;
+ my $mid = mid_compressed($ctx->{mid});
+ my $git = PublicInbox::GitCatFile->new($ctx->{git_dir});
+ my %opts = (offset => 0);
+ my $nr;
+ do {
+ my $res = $srch->get_thread($mid, \%opts);
+ my $msgs = $res->{msgs};
+ $nr = scalar @$msgs;
+ while (defined(my $smsg = shift @$msgs)) {
+ my $msg = eval {
+ my $p = 'HEAD:'.mid2path($smsg->mid);
+ Email::Simple->new($git->cat_file($p));
+ };
+ emit_msg($fh, $msg) if $msg;
+ }
+
+ $opts{offset} += $nr;
+ } while ($nr > 0);
+}
+
1;
diff --git a/lib/PublicInbox/Search.pm b/lib/PublicInbox/Search.pm
index f004050..f1ff3a4 100644
--- a/lib/PublicInbox/Search.pm
+++ b/lib/PublicInbox/Search.pm
@@ -247,7 +247,7 @@ sub get_thread {
my $qtid = $qp->parse_query('thread:'.$smsg->thread_id);
my $qsub = $qp->parse_query('path:'.mid_compressed($smsg->path));
my $query = Search::Xapian::Query->new(OP_OR, $qtid, $qsub);
- $self->do_enquire($query);
+ $self->do_enquire($query, $opts);
}
# private subs below
--
EW
^ permalink raw reply related [flat|nested] only message in thread
only message in thread, other threads:[~2015-08-21 23:31 UTC | newest]
Thread overview: (only message) (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2015-08-21 23:31 [PATCH] mbox: stream entire thread, regardless of size Eric Wong
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).