1 7d6d378a 2022-08-24 op #!/usr/bin/env perl
3 1bcb9899 2022-08-29 op # mkindex was written by Omar Polo <op@openbsd.org> and is placed in
4 1bcb9899 2022-08-29 op # the public domain. The author hereby disclaims copyright to this
7 7d6d378a 2022-08-24 op use open ":std", ":encoding(UTF-8)";
12 270695a3 2022-08-30 op use File::Temp qw(tempfile);
14 38232a0a 2023-05-07 op use SMArc qw(parse san urlencode initpage endpage index_header
15 789a106a 2023-05-05 op search thread_header threntry);
17 7d6d378a 2022-08-24 op my $outdir = $ENV{'OUTDIR'};
18 7d6d378a 2022-08-24 op die 'Set $OUTDIR' unless defined $outdir;
20 28ebc168 2022-08-24 op my $tfh; # thread file handle
21 28ebc168 2022-08-24 op my $pfh; # page file handle
27 584d65d8 2022-08-24 op my $threads_seen = 0;
29 584d65d8 2022-08-24 op my $last_level = 0;
31 debcbab2 2022-09-13 op my $last_date;
32 debcbab2 2022-09-13 op my $last_from;
33 debcbab2 2022-09-13 op my $last_subj;
35 c5dff871 2022-08-29 op my $threads = 0;
36 c5dff871 2022-08-29 op my $threads_per_page = 100;
39 d40f4fe2 2022-08-26 op my ($a, $b) = @_;
40 d40f4fe2 2022-08-26 op return $a unless defined $b;
41 d40f4fe2 2022-08-26 op return $a gt $b ? $a : $b;
45 d40f4fe2 2022-08-26 op my ($a, $b) = @_;
46 d40f4fe2 2022-08-26 op return $a unless defined $b;
47 d40f4fe2 2022-08-26 op return $a lt $b ? $a : $b;
50 28ebc168 2022-08-24 op sub pagename {
51 28ebc168 2022-08-24 op my $i = shift;
52 1913b2fb 2022-08-26 op return $i == 1 && "index.html" || "$i.html";
56 ebad21b1 2022-08-26 op say $pfh '</ul></div>';
58 d40f4fe2 2022-08-26 op push @pages, "$from_day - $to_day";
61 28ebc168 2022-08-24 op sub nextfile {
62 ebad21b1 2022-08-26 op endfile if defined $pfh;
66 38232a0a 2023-05-07 op ($pfh, $path) = tempfile "/tmp/smarc.index.XXXXXXXXXX";
67 b031debf 2023-03-29 op binmode($pfh, ':utf8');
68 270695a3 2022-08-30 op push @files, $path;
69 ebad21b1 2022-08-26 op say $pfh "<div class='thread'><ul>";
73 43c49583 2022-08-27 op my ($pfh, $n) = @_;
74 43c49583 2022-08-27 op my ($first, $last) = (pagename(1), pagename($page));
75 6fde8229 2022-08-26 op my ($next, $prev) = (pagename($n+1), pagename($n-1));
77 2eb655f1 2022-08-27 op say $pfh "<nav>";
78 1913b2fb 2022-08-26 op say $pfh "<a href='$first'>First</a>" if $n > 2;
79 1913b2fb 2022-08-26 op say $pfh "<a href='$prev'>Prev</a>" if $n > 1;
80 6fde8229 2022-08-26 op say $pfh "<a href='$next'>Next</a>" if $n < $page;
81 6fde8229 2022-08-26 op say $pfh "<a href='$last'>Last</a>" if $n < $page - 1;
82 6fde8229 2022-08-26 op say $pfh "</nav>";
85 6fde8229 2022-08-26 op sub copyfrom {
86 6fde8229 2022-08-26 op my ($path, $fh) = @_;
88 6fde8229 2022-08-26 op # there are probably faster ways to do this like File::Copy,
89 6fde8229 2022-08-26 op # but it bypasses the bufio cache...
90 6fde8229 2022-08-26 op open(my $pfh, '<', $path) or die "can't open $path: $!";
91 890362cd 2022-08-30 op print $fh $_ while <$pfh>;
94 add05cb0 2022-08-27 op sub renderpages {
97 1913b2fb 2022-08-26 op for (my $i = 1; $i <= $page; $i++) {
98 66e1cf97 2022-08-27 op my $name = pagename($i);
99 270695a3 2022-08-30 op my $path = shift @files;
100 66e1cf97 2022-08-27 op my $dest = "$outdir/$name";
102 6fde8229 2022-08-26 op open(my $pfh, '>', $dest)
103 6fde8229 2022-08-26 op or die "can't open $dest for writing: $!";
105 39c49919 2023-05-05 op my $title = "page $i";
106 d40f4fe2 2022-08-26 op my $subtitle = $pages[$i-1];
108 9ec6c848 2022-08-27 op initpage($pfh, $title);
109 9ec6c848 2022-08-27 op index_header $pfh, $i, $subtitle;
110 9ec6c848 2022-08-27 op say $pfh "<main>";
112 43c49583 2022-08-27 op nav $pfh, $i if $page > 1;
114 6fde8229 2022-08-26 op copyfrom($path, $pfh);
115 43c49583 2022-08-27 op nav $pfh, $i if $page > 1;
117 e773a9f0 2022-08-24 op say $pfh "</main>";
118 e773a9f0 2022-08-24 op endpage($pfh);
121 8d17053d 2022-08-26 op unlink $path;
125 eefeacb7 2022-08-27 op sub endthread {
126 eefeacb7 2022-08-27 op say $tfh "</ul></li>" x $last_level;
127 c13d576c 2022-08-27 op say $tfh "</ul>\n</div>\n";
128 eefeacb7 2022-08-27 op endpage($tfh);
131 eefeacb7 2022-08-27 op $last_level = 0;
134 7d6d378a 2022-08-24 op sub nextthread {
135 eefeacb7 2022-08-27 op endthread if defined $tfh;
136 7d6d378a 2022-08-24 op my ($mid, $subj) = @_;
137 7d6d378a 2022-08-24 op my $dest = "$outdir/thread/$mid.html";
138 7d6d378a 2022-08-24 op open($tfh, '>', $dest) or die "can't open $dest: $!";
139 7d6d378a 2022-08-24 op initpage($tfh, $subj);
140 8f7a9a46 2023-04-04 op thread_header $tfh, ["Thread: $subj"];
141 c13d576c 2022-08-27 op print $tfh "<div class='thread'><ul class='mails'>\n";
144 debcbab2 2022-09-13 op sub index_entry {
145 debcbab2 2022-09-13 op my ($fh, $mid, $date, $from, $subj) = @_;
147 bd3babdf 2023-04-02 op # synthetic mail hash
151 bd3babdf 2023-04-02 op date => $date,
152 bd3babdf 2023-04-02 op from => $from,
153 bd3babdf 2023-04-02 op subj => $subj,
156 bd3babdf 2023-04-02 op threntry $fh, "thread", 0, 0, $mail;
159 1d565e04 2023-05-06 op if (`uname` =~ "OpenBSD") {
160 1d565e04 2023-05-06 op use OpenBSD::Pledge;
161 1d565e04 2023-05-06 op use OpenBSD::Unveil;
163 1d565e04 2023-05-06 op unveil($outdir, "rwc") or die "unveil $outdir: $!";
165 1d565e04 2023-05-06 op # can't use tmppath because File::Temp checks wether /tmp exists.
166 1d565e04 2023-05-06 op unveil("/tmp", "rwc") or die "unveil /tmp: $!";
168 1d565e04 2023-05-06 op # fattr for File::Temp
169 1d565e04 2023-05-06 op pledge("stdio rpath wpath cpath fattr") or die "pledge: $!";
175 6b36ff28 2023-04-01 op my $mail = parse $_;
177 bbdbef1a 2023-04-01 op if ($mail->{level} == 0) {
178 bbdbef1a 2023-04-01 op nextthread $mail->{mid}, $mail->{subj};
181 c5dff871 2022-08-29 op if ($threads > $threads_per_page) {
183 c5dff871 2022-08-29 op $threads = 0;
184 d40f4fe2 2022-08-26 op $to_day = undef;
185 d40f4fe2 2022-08-26 op $from_day = undef;
188 bbdbef1a 2023-04-01 op my $day = $mail->{date} =~ s/ .*//r;
189 a0b4d4b3 2022-08-27 op $to_day = mins $day, $to_day;
190 a0b4d4b3 2022-08-27 op $from_day = maxs $day, $from_day;
193 bd3babdf 2023-04-02 op $last_level = threntry $tfh, "mail", 0, $last_level, $mail;
194 584d65d8 2022-08-24 op $threads_seen = 1;
196 debcbab2 2022-09-13 op index_entry $pfh, $last_tid, $last_date, $last_from, $last_subj
197 bbdbef1a 2023-04-01 op if defined $last_tid && $mail->{level} == 0;
199 257d7c99 2022-10-04 op # `gt' on dates works because the format used allow for
200 257d7c99 2022-10-04 op # lexicographic comparisons.
201 bbdbef1a 2023-04-01 op if ($mail->{level} == 0 || $mail->{date} gt $last_date) {
202 bbdbef1a 2023-04-01 op $last_date = $mail->{date};
203 bbdbef1a 2023-04-01 op $last_from = $mail->{from};
206 bbdbef1a 2023-04-01 op if ($mail->{level} == 0) {
207 bbdbef1a 2023-04-01 op $last_tid = $mail->{mid};
208 bbdbef1a 2023-04-01 op $last_subj = $mail->{subj};
212 debcbab2 2022-09-13 op index_entry $pfh, $last_tid, $last_date, $last_from, $last_subj
213 debcbab2 2022-09-13 op if defined $last_tid;
216 ebad21b1 2022-08-26 op endthread if $threads_seen;