interpret/src/journal.re.c

259 lines
8.2 KiB
C
Raw Normal View History

/** @license 2022 Neil Edelman, distributed under the terms of the
[GNU General Public License 3](https://opensource.org/licenses/GPL-3.0).
Reading all journal entries yyyy-mm-dd in yyyy/mm/dd.txt to a tree.
[re2c](https://re2c.org/) is a convince (and fast) for "looks like" functions,
telling the recursion to go into a directory.
2023-02-02 01:05:55 -05:00
@std GNU, C11, assumes reverse order unions. */
#include "../src/journal.h"
2022-12-27 02:31:08 -05:00
#include <inttypes.h> /* C99 */
#include <limits.h>
2022-12-27 23:45:57 -05:00
#include <stdio.h>
2022-12-27 02:31:08 -05:00
#include <assert.h>
2022-12-27 23:45:57 -05:00
#include <stdlib.h>
#include <unistd.h> /* chdir (POSIX) */
#include <sys/types.h> /* mode_t (POSIX) */
#include <sys/stat.h> /* umask (POSIX) */
#include <dirent.h> /* opendir readdir closedir */
/* Day tree-map from date to pointer; is backed by a huge array of text. */
2022-12-29 02:54:59 -05:00
void date32_to_string(const union date32 d, char (*const a)[12]) {
2022-12-27 23:45:57 -05:00
sprintf(*a, "%" PRIu32 "-%2.2" PRIu32 "-%2.2" PRIu32,
2022-12-28 12:34:19 -05:00
d.year % 10000, d.month % 100, d.day % 100);
2022-12-27 02:31:08 -05:00
}
2022-12-27 23:45:57 -05:00
static int day_compare(const union date32 a, const union date32 b)
2022-12-27 02:31:08 -05:00
{ return a.u32 > b.u32; }
2023-02-02 01:23:35 -05:00
static void day_to_string(const union date32 d, const char *const*const entry,
2022-12-27 23:45:57 -05:00
char (*const a)[12]) { (void)entry; date32_to_string(d, a); }
#define TREE_NAME day
2022-12-27 02:31:08 -05:00
#define TREE_KEY union date32
2023-02-02 01:23:35 -05:00
#define TREE_VALUE const char *
#define TREE_COMPARE
#define TREE_TO_STRING
#define TREE_BODY
2022-12-27 02:31:08 -05:00
#include "../src/tree.h"
/* Temporary filename arrangement in directory; private. */
2022-12-28 03:03:55 -05:00
#if INT_MAX >= 100000000000
#error int_to_string requires truncation on this compiler.
#endif
static void int_to_string(const int *const n, char (*const a)[12])
{ sprintf(*a, "%d", *n); }
#define ARRAY_NAME int
#define ARRAY_TYPE int
#define ARRAY_TO_STRING
#include "../src/array.h"
2023-04-21 23:11:57 -04:00
/** Comparator of `a`, `b`. */
2022-12-28 03:03:55 -05:00
static int int_cmp(const int *const a, const int *const b)
{ return (*b < *a) - (*a < *b); }
2023-04-21 23:11:57 -04:00
/** For `qsort`. */
2022-12-28 03:03:55 -05:00
static int void_int_cmp(const void *const a, const void *const b)
{ return int_cmp(a, b); }
2022-12-27 02:31:08 -05:00
/*!re2c
re2c:yyfill:enable = 0;
re2c:define:YYCTYPE = char;
*/
/** "-"? [1-9][0-9]*$, within the range of `INT_MAX`. */
static int looks_like_year(const char *const a, int *const year) {
const char *YYCURSOR = a, *YYMARKER = a, *s0;
/*!stags:re2c format = 'const char *@@;\n'; */
assert(a && year);
/*!re2c /**/
@s0 ("-"? [1-9][0-9]* | "0") "\x00" {
int sign = 1, mag;
if(*s0 == '-') { sign = -1; s0++; }
for(mag = 0; *s0 != '\0'; s0++) {
int d = *s0 - '0';
if((INT_MAX - d) / 10 < mag) return 0;
mag = mag * 10 + d;
}
*year = sign * mag;
return 1;
}
* { return 0; }
*/
}
/** 1 <= [0-1][0-9]$ <= 12 */
static unsigned looks_like_month(const char *const a) {
const char *YYCURSOR = a, *YYMARKER = a, *s0;
/*!stags:re2c format = 'const char *@@;\n'; */
(void)yyt1;
assert(a);
/*!re2c /**/
@s0 [0-1][0-9] "\x00" {
unsigned val = 10u * (unsigned)(s0[0] - '0') + (unsigned)(s0[1] - '0');
return val < 1 || val > 12 ? 0 : val;
}
* { return 0; }
*/
}
/** 1 <= [0-3][0-9].txt$ <= 31 */
static unsigned looks_like_day(const char *const a) {
const char *YYCURSOR = a, *YYMARKER = a, *s0;
/*!stags:re2c format = 'const char *@@;\n'; */
(void)yyt1;
assert(a);
/*!re2c /**/
@s0 [0-3][0-9] ".txt\x00" {
unsigned val = 10u * (unsigned)(s0[0] - '0') + (unsigned)(s0[1] - '0');
return val < 1 || val > 31 ? 0 : val;
}
* { return 0; }
*/
}
2023-02-17 17:06:21 -05:00
/** Erases memory allocation for `j`. */
2022-12-27 23:45:57 -05:00
void journal_(struct journal *const j) {
2022-12-28 03:03:55 -05:00
if(!j) return;
day_tree_(&j->days);
text_(&j->backing);
2022-12-27 23:45:57 -05:00
}
2023-04-19 18:11:44 -04:00
/** @return A completed journal out of `dir_journal`. Any reading errors and
`errno` will be set, it will be idle. */
2023-04-19 18:11:44 -04:00
struct journal journal(const char *const dir_journal) {
2022-12-27 23:45:57 -05:00
struct journal j = {0};
char *intent = 0;
DIR *dir = 0;
2022-12-28 03:03:55 -05:00
struct dirent *de = 0;
2022-12-27 23:45:57 -05:00
struct int_array years = int_array(), months = int_array(),
days = int_array();
2022-12-28 03:03:55 -05:00
int *y = 0, *y_end, *m = 0, *m_end, *d = 0, *d_end;
2022-12-29 02:54:59 -05:00
struct day_tree_iterator it;
2023-02-02 01:05:55 -05:00
union { const char **text; uintptr_t *offset; } v;
2023-04-19 18:11:44 -04:00
char cwd[256];
int is_dir_journal = 0;
2022-12-27 23:45:57 -05:00
/* Get the years list as directories matching a year. */
2023-04-19 18:11:44 -04:00
if(!getcwd(cwd, sizeof cwd) || chdir(dir_journal) == -1) goto catch;
is_dir_journal = 1;
if(!(dir = opendir("."))) goto catch;
2022-12-27 23:45:57 -05:00
while((de = readdir(dir))) {
struct stat st;
int year, *p;
2022-12-28 03:03:55 -05:00
if(!looks_like_year(de->d_name, &year)) continue;
2022-12-27 23:45:57 -05:00
if(stat(de->d_name, &st)) goto catch;
if(!S_ISDIR(st.st_mode)) continue;
if(!(p = int_array_new(&years))) goto catch;
*p = year;
}
2022-12-28 03:03:55 -05:00
if(closedir(dir)) { dir = 0; goto catch; } dir = 0;
2023-02-02 21:53:59 -05:00
/* Sort the years. */
2022-12-27 23:45:57 -05:00
qsort(years.data, years.size, sizeof *years.data, &void_int_cmp);
fprintf(stderr, "Years in <<%s>>: %s.\n",
2022-12-28 03:03:55 -05:00
dir_journal, int_array_to_string(&years));
2022-12-27 23:45:57 -05:00
/* Go though each year. */
for(y = years.data, y_end = y + years.size; y < y_end; y++) {
char fn[64];
sprintf(fn, "%d", *y);
/* Get the months as directories. */
if(chdir(fn) == -1 || !(dir = opendir("."))) goto catch;
while((de = readdir(dir))) {
struct stat st;
int month, *p;
2022-12-28 03:03:55 -05:00
if(!(month = (int)looks_like_month(de->d_name))) continue;
2022-12-27 23:45:57 -05:00
if(stat(de->d_name, &st)) goto catch;
if(!S_ISDIR(st.st_mode)) continue;
if(!(p = int_array_new(&months))) goto catch;
*p = month;
}
2022-12-28 03:03:55 -05:00
if(closedir(dir)) { dir = 0; goto catch; } dir = 0;
2022-12-27 23:45:57 -05:00
qsort(months.data, months.size, sizeof *months.data, &void_int_cmp);
2022-12-28 12:34:19 -05:00
fprintf(stderr, "Months in <<%s>>: %s.\n",
2022-12-27 23:45:57 -05:00
fn, int_array_to_string(&months));
/* Go though each month. */
for(m = months.data, m_end = m + months.size; m < m_end; m++) {
sprintf(fn, "%.2d", *m);
/* Get the days as files. */
if(chdir(fn) == -1 || !(dir = opendir("."))) goto catch;
while((de = readdir(dir))) {
struct stat st;
int day, *p;
2022-12-28 03:03:55 -05:00
if(!(day = (int)looks_like_day(de->d_name))) continue;
2022-12-27 23:45:57 -05:00
if(stat(de->d_name, &st)) goto catch;
if(S_ISDIR(st.st_mode)) continue;
if(!(p = int_array_new(&days))) goto catch;
*p = day;
}
2022-12-28 03:03:55 -05:00
if(closedir(dir)) { dir = 0; goto catch; } dir = 0;
2022-12-27 23:45:57 -05:00
qsort(days.data, days.size, sizeof *days.data, &void_int_cmp);
2023-02-17 17:06:21 -05:00
/*fprintf(stderr, "Days in <<%s>>: %s.\n",
fn, int_array_to_string(&days)); <- Too much spam. */
2022-12-27 23:45:57 -05:00
for(d = days.data, d_end = d + days.size; d < d_end; d++) {
2022-12-28 03:03:55 -05:00
const union date32 d32 = { .year = (uint32_t)*y,
.month = (uint32_t)*m, .day = (uint32_t)*d };
char *contents = 0;
sprintf(fn, "%.2d.txt", *d); /* Reconstruct. */
2022-12-28 12:34:19 -05:00
if(!(contents = text_append_file(&j.backing, fn))) goto catch;
2023-04-26 03:59:14 -04:00
switch(day_tree_bulk_assign(&j.days, d32, &v.text)) {
2022-12-28 12:34:19 -05:00
case TREE_PRESENT: intent = "not unique", errno = EDOM; /*sic*/
case TREE_ERROR: goto catch;
2022-12-28 03:03:55 -05:00
case TREE_ABSENT: break; /* Expected. */
2022-12-27 23:45:57 -05:00
}
2023-02-02 21:53:59 -05:00
/* Because it's in a flat array, the pointers are not stable
while we are loading it, and we need to store the offsets. */
*v.offset = (uintptr_t)(contents - j.backing.data);
2022-12-27 23:45:57 -05:00
}
2022-12-28 03:03:55 -05:00
d = 0, int_array_clear(&days);
2022-12-27 23:45:57 -05:00
if(chdir("..") == -1) goto catch;
}
2022-12-28 03:03:55 -05:00
m = 0, int_array_clear(&months);
2022-12-27 23:45:57 -05:00
if(chdir("..") == -1) goto catch;
}
2023-04-19 18:11:44 -04:00
if(chdir("../..") == -1 || !day_tree_bulk_finish(&j.days)) goto catch;
/* Structure is now stable because we aren't going to move it;
2023-02-02 21:53:59 -05:00
convert all of offsets back to pointers. */
it = day_tree_iterator(&j.days);
2023-04-21 23:11:57 -04:00
while(day_tree_next(&it))
v.text = day_tree_value(&it), *v.text = j.backing.data + *v.offset;
2022-12-27 23:45:57 -05:00
goto finally;
catch:
2022-12-28 12:34:19 -05:00
fprintf(stderr, "On date: %s/%d-%.2d-%.2d.\n",
2023-02-17 17:06:21 -05:00
dir_journal, y ? *y : 0, m ? *m : 0, d ? *d : 0);
2023-02-02 21:53:59 -05:00
if(intent) fprintf(stderr, "(%s)\n", intent);
2022-12-28 12:34:19 -05:00
recatch:
2023-02-02 01:23:35 -05:00
journal_(&j);
2022-12-27 23:45:57 -05:00
finally:
2022-12-29 13:10:41 -05:00
if(dir) { if(closedir(dir)) { dir = 0; goto recatch; } dir = 0; }
2023-04-19 18:11:44 -04:00
if(is_dir_journal) {
if(chdir(cwd) == -1) { is_dir_journal = 0; goto recatch; }
is_dir_journal = 0;
}
int_array_(&years), int_array_(&months), int_array_(&days); /* Temporary. */
2022-12-28 03:03:55 -05:00
return j;
2022-12-27 23:45:57 -05:00
}
2022-12-27 02:31:08 -05:00
2022-12-28 12:34:19 -05:00
/** @return `j` read in some data? */
int journal_is_empty(const struct journal *const j) {
return !j || !j->days.root.node || !j->backing.data;
}
2022-12-28 03:03:55 -05:00
2022-12-28 12:34:19 -05:00
/** @return `j` as a string. */
2022-12-28 03:03:55 -05:00
const char *journal_to_string(const struct journal *const j)
{ return day_tree_to_string(&j->days); }
2022-12-29 02:54:59 -05:00
struct journal_iterator journal_iterator(struct journal *const j) {
2022-12-29 02:54:59 -05:00
struct journal_iterator it;
it._ = day_tree_iterator(&j->days);
2022-12-29 02:54:59 -05:00
return it;
}
int journal_next(struct journal_iterator *const it,
2023-02-02 01:05:55 -05:00
union date32 *const k, const char **v) {
assert(it && k && v);
if(!day_tree_next(&it->_)) return 0;
*k = day_tree_key(&it->_);
*v = *day_tree_value(&it->_);
2023-02-02 01:05:55 -05:00
return 1;
2022-12-29 02:54:59 -05:00
}