
281 lines
8.8 KiB
Raw Normal View History

2023-03-12 23:48:29 +00:00
/** @license 2022 Neil Edelman, distributed under the terms of the
[MIT License](https://opensource.org/licenses/MIT).
2023-04-01 01:54:45 +00:00
Scan journal entries for score. */
2023-03-12 23:48:29 +00:00
2023-04-01 01:54:45 +00:00
#if 0
2023-03-12 23:48:29 +00:00
#include <inttypes.h> /* C99 */
#include <limits.h>
2023-04-01 01:54:45 +00:00
#include "../src/journal.h"
2023-04-07 03:21:38 +00:00
#include "../src/scores.h"
2023-04-01 01:54:45 +00:00
#include <stdio.h>
#include <assert.h>
/* One array. */
/** Writes a short, null-terminated preview of the name of `s` into `z`.
 At most `sizeof *z - 1` (11) bytes of the range `[name.a, name.b)` are
 copied; an empty or null name gives the empty string.
 @param[s] The score whose name is printed.
 @param[z] Destination buffer of 12 bytes. */
static void scorelist_to_string(const struct score *const s,
	char (*const z)[12]) {
	const char *from = s->name.a;
	char *to = *z;
	size_t n = 0;
	/* Clamp by length rather than forming `name.a + 11`: that pointer may
	 lie outside the name's storage, or be based on a null pointer. */
	if(from && s->name.b > from) n = (size_t)(s->name.b - from);
	if(n > sizeof *z - 1) n = sizeof *z - 1;
	while(n--) *(to++) = *(from++);
	*to = '\0';
}
#define ARRAY_NAME scorelist
#define ARRAY_TYPE struct score
#define ARRAY_BODY
#include "../src/array.h"
/* Tree mapping from date-line to indices. */
/** Formats one entry of the date-line tree for printing by writing the date
 carried in the key `line` into `a` with `date32_to_string`.
 @param[line] The key of the entry.
 @param[u] The mapped index; not used in the output.
 @param[a] Destination buffer of 12 bytes. */
static void score_to_string(const union line64 line, const size_t *const u,
	char (*const a)[12]) {
	(void)u;
	/* NOTE(review): the first argument was missing from this call.
	 `line.date` assumes the `union date32` member of `union line64` is named
	 `date` -- confirm against journal.h. */
	date32_to_string(line.date, a);
}
/** Comparison used for keys of the date-line tree, on the combined 64-bit
 value of the key.
 @return Non-zero if `a` is strictly greater than `b`, otherwise zero. */
static int score_compare(const union line64 a, const union line64 b)
{
	const int a_is_greater = a.u64 > b.u64;
	return a_is_greater;
}
#define TREE_NAME score
#define TREE_KEY union line64
#define TREE_VALUE size_t
#define TREE_DEFAULT 0
#define TREE_BODY
#include "../src/tree.h"
2023-03-12 23:48:29 +00:00
2023-04-01 03:15:02 +00:00
static int scan(union date32 date, const char *const buffer,
struct scores *const scores) {
2023-04-07 03:21:38 +00:00
const char *YYCURSOR, *YYMARKER, *yyt1, *yyt2, *s0, *s1;
2023-03-12 23:48:29 +00:00
enum YYCONDTYPE condition = yycline;
size_t line = 1;
char datestr[12] = {0};
const char *why = "unexpected";
2023-04-07 03:21:38 +00:00
struct score *score = 0;
2023-04-01 03:15:02 +00:00
assert(buffer && scores);
2023-03-12 23:48:29 +00:00
YYCURSOR = YYMARKER = yyt1 = buffer;
/*!re2c /**/
re2c:define:YYCTYPE = char;
re2c:yyfill:enable = 0;
re2c:define:YYGETCONDITION = "condition";
re2c:define:YYSETCONDITION = "condition = @@;";
re2c:define:YYGETCONDITION:naked = 1;
re2c:define:YYSETCONDITION:naked = 1;
ws = [ \t];
2023-04-07 03:21:38 +00:00
glyph = [^\x00-\x20\x7f]; // [^\x00\n\t ] + all weird
semitext = glyph \ ";";
2023-03-12 23:48:29 +00:00
natural = [1-9][0-9]*;
2023-04-07 03:21:38 +00:00
uint = [0-9]+;
2023-03-12 23:48:29 +00:00
keyword = [A-Za-z0-9][A-Za-z0-9_-]*;
2023-04-07 03:21:38 +00:00
date = natural "-" [0-1][0-9] "-" [0-3][0-9];
2023-03-12 23:48:29 +00:00
for( ; ; ) { /*!re2c /**/
/* Default ignore. */
<skip> [^\n\x00] { continue; }
<skip> "\x00" { why = "no newline at end of file"; goto catch; }
<line> "\x00" { return 1; }
<line, skip> "\n" => line { line++; continue; }
<line> * :=> skip
<line> "::" / [^:] :=> score
2023-04-07 03:21:38 +00:00
<score> * { why = "score unrecognized"; goto catch; }
/* Already there. Use the map to get the index from the keyword and
then stick a marker in the tree with that index. */
2023-04-01 01:54:45 +00:00
<score> @s0 keyword @s1 / "\n" => skip { also_add_to_tree: {
2023-03-12 23:48:29 +00:00
const struct pair keyword = pair(s0, s1);
2023-04-01 03:15:02 +00:00
const union line64 key = { { (uint32_t)line, date } };
2023-04-07 03:21:38 +00:00
size_t idx, *pidx;
2023-03-12 23:48:29 +00:00
if(line > UINT32_MAX)
{ errno = ERANGE; why = "too many lines of text"; goto catch; }
2023-04-07 03:21:38 +00:00
if(!(idx = pair_map_table_get(&scores->map, keyword)))
2023-03-12 23:48:29 +00:00
{ why = "keyword not introduced"; goto catch; }
2023-04-08 00:39:13 +00:00
if(scores->[idx].last.u32 >= date.u32)
{ why = "duplicate key in same day"; goto catch; }
scores->[idx].last.u32 = date.u32;
switch(score_tree_bulk_try(&scores->dates, key, &pidx)) {
case TREE_PRESENT: assert(0); why = "duplicate key"; /* _Sic_. */
2023-03-12 23:48:29 +00:00
case TREE_ERROR: goto catch;
2023-04-07 03:21:38 +00:00
case TREE_ABSENT: *pidx = idx; break;
2023-03-12 23:48:29 +00:00
2023-04-08 02:57:19 +00:00
/*date32_to_string(date, &datestr);
fprintf(stderr, "%s: <%.*s>\n", datestr, (int)(s1 - s0), s0);*/
2023-03-12 23:48:29 +00:00
} }
2023-04-07 03:21:38 +00:00
/* New score. */
<score> @s0 keyword @s1 ":" => score_name {
2023-03-12 23:48:29 +00:00
size_t *idx;
2023-04-07 03:21:38 +00:00
switch(pair_map_table_assign(&scores->map, pair(s0, s1), &idx)) {
2023-03-12 23:48:29 +00:00
case TABLE_PRESENT: errno = EDOM; why = "new keyword already used";
2023-04-07 03:21:38 +00:00
case TABLE_ERROR: goto catch; /* _Sic_. */
case TABLE_ABSENT: *idx = 0; break;
2023-03-12 23:48:29 +00:00
2023-04-01 03:15:02 +00:00
if(!(score = scorelist_array_new(&scores->list))) goto catch;
*idx = (size_t)(score - scores->;
2023-04-08 02:57:19 +00:00
/*struct pair key, name; union date32 date, last; unsigned edges;*/
2023-04-01 03:15:02 +00:00
score->key.a = s0, score->key.b = s1;
score->name.a = 0, score->name.b = 0;
2023-04-08 00:39:13 +00:00
score->date.u32 = score->last.u32 = 0;
2023-04-18 02:46:52 +00:00
score->edges = 0, score->tempscore = 0;
2023-03-12 23:48:29 +00:00
date32_to_string(date, &datestr);
2023-04-07 03:21:38 +00:00
fprintf(stderr, "%s: new score <%.*s> stored in list at %zu.\n",
2023-03-12 23:48:29 +00:00
datestr, (int)(s1 - s0), s0, *idx);
goto also_add_to_tree;
2023-04-07 03:21:38 +00:00
<score_name> * { why = "name unrecognized"; goto catch; }
<score_date> * { why = "date unrecognized"; goto catch; }
<score_edges> * { why = "edges unrecognized"; goto catch; }
<score_name> ws* @s0 semitext+ (" " semitext+)* @s1 /* ws* */ ";"
=> score_date {
score->name.a = s0, score->name.b = s1;
<score_date> ws* "~"? @s0 date ws* ";" => score_edges {
if(!pair_to_date(s0, &score->date)) goto catch;
<score_edges> ws* "~"? @s0 uint @s1 ws* / "\n" => skip {
if(!pair_to_natural(s0, s1, &score->edges)) goto catch;
score = 0; /* Done. */
2023-03-12 23:48:29 +00:00
*/ }
assert(0); /* Never gets here. */
if(!errno) errno = EILSEQ;
date32_to_string(date, &datestr);
2023-04-07 03:21:38 +00:00
fprintf(stderr, "%s line %zu: %s.\n", datestr, line, why);
2023-03-12 23:48:29 +00:00
return 0;
2023-04-01 03:15:02 +00:00
void scores_(struct scores *const s) {
if(!s) return;
struct scores scores(struct journal *const j) {
struct scores s
= { scorelist_array(), pair_map_table(), score_tree() };
struct journal_iterator it;
union date32 k;
const char *v;
{ /* Null is the first item for convenience, (TABLE_DEFAULT). */
struct score *nul;
if(!(nul = scorelist_array_new(&s.list))) goto catch;
nul->key.a = nul->key.b = nul->name.a = nul->name.b = 0;
nul->date.u32 = 0;
nul->edges = 0;
it = journal_iterator(j);
while(journal_next(&it, &k, &v)) if(!scan(k, v, &s)) goto catch;
fprintf(stderr, "List of scores: %s.\n"
"Mapped to indices: %s.\n"
"Date-line tree: %s.\n", scorelist_array_to_string(&s.list),
pair_map_table_to_string(&, score_tree_to_string(&s.dates));
goto finally;
return s;
/** @return One if `s` is null or its date tree has no root node, otherwise
 zero. */
int scores_is_empty(const struct scores *const s)
{
	if(!s) return 1;
	return !s->dates.root.node;
}
2023-04-07 03:21:38 +00:00
2023-04-08 02:57:19 +00:00
/** @param[s] Must be non-null; this is asserted.
 @return The string produced by `scorelist_array_to_string` for the score
 list of `s`. */
const char *scores_to_string(const struct scores *const s)
{
	assert(s);
	return scorelist_array_to_string(&s->list);
}
2023-04-08 00:39:13 +00:00
#include <stdlib.h>
2023-04-07 03:21:38 +00:00
int main(void) {
2023-04-08 02:57:19 +00:00
const char *fail = 0;
struct journal jrnl = {0};
struct scores scrs = {0};
errno = 0;
jrnl = journal();
fprintf(stderr, "Journal: %s.\n", journal_to_string(&jrnl));
if(journal_is_empty(&jrnl)) { fail = "journal failed to load"; goto catch; }
scrs = scores(&jrnl);
fprintf(stderr, "Scores: %s.\n", scores_to_string(&scrs));
if(scores_is_empty(&scrs)) { fail = "scores failed to parse"; goto catch; }
struct score_tree_iterator it = score_tree_iterator(&scrs.dates);
union line64 line;
struct score *score;
2023-04-18 02:46:52 +00:00
/* Set score to zero to verify count with paper journal. */
for(size_t i = 0; i < scrs.list.size; i++)[i].tempscore = 0;
2023-04-08 02:57:19 +00:00
printf("set terminal pngcairo dashed transparent truecolor"
" size 840, 480 fontscale 1\n"
"set output \"score.png\"\n");
printf("$Data <<EOD\n"
2023-04-18 02:54:08 +00:00
"# date, key, key score\n");
2023-04-08 02:57:19 +00:00
while(score_tree_next(&it)) {
line = score_tree_key(&it);
score = + *score_tree_value(&it);
char datestr[12];
date32_to_string(, &datestr);
2023-04-18 02:46:52 +00:00
printf("%s, %.*s, %u\n", datestr,
(int)(score->key.b - score->key.a), score->key.a, score->tempscore);
2023-04-08 02:57:19 +00:00
"# theozh\n"
"# get a unique list from datablock\n"
"addToList(list,col) = list.( strstrt(list,'\"'.strcol(col).'\"') \\\n"
" > 0 ? '' : ' \"'.strcol(col).'\"')\n"
"Uniqs = ''\n"
"stats $Data u (Uniqs=addToList(Uniqs,2)) nooutput\n"
"Uniq(i) = word(Uniqs,i)\n"
"getIndex(s) = sum [_i=1:words(Uniqs)] s eq word(Uniqs,_i) ? _i : 0\n"
/*"stats $Data u 3 nooutput\n"
"cumsum = STATS_sum\n"
"stats $Data u 4 nooutput\n"
"setsum = STATS_sum\n"
"myTimeFmt = \"%%Y-%%m-%%d\"\n"
"set format x myTimeFmt timedate\n"
"set xtics format myTimeFmt rotate by -30\n"
"set ylabel \"happiness CDF (days)\"\n"
"set grid\n"
"set key out reverse Left noautotitle\n"
"set style fill solid 0.5\n"
"unset border\n"
"set autoscale xfix # max? hack: can't get x to extend further\n"
/*"set label sprintf(\"%%u cumulative words (duplicate verses counted)\","
" cumsum) center at graph 0.5, first cumsum*100/%zu offset 0,0.5\n"
"set label sprintf(\"%%u unique KJV verse words memorized\", setsum) "
"center at graph 0.5, first setsum*100/%zu offset 0,0.5\n"
"plot \\\n"
" total=0 $Data u"
" (timecolumn(1,myTimeFmt)):(total=total+1) \\\n"
" w steps lc \"black\" dt 1 lw 1, \\\n"
" total=0 '' u \\\n"
" (timecolumn(1,myTimeFmt)): \\\n"
" (total=total+1,total/2.): \\\n"
" (43200): \\\n"
" (total/2.): \\\n"
" (getIndex(strcol(2))) w boxxy lc var lw 1, \\\n"
" for [i=1:words(Uniqs)] keyentry w boxxy lc i ti Uniq(i)\n");
2023-04-07 10:54:38 +00:00
goto finally;
2023-04-08 02:57:19 +00:00
2023-04-07 10:54:38 +00:00
2023-04-08 02:57:19 +00:00
if(!fail) fail = "score";
2023-04-07 10:54:38 +00:00
2023-04-08 02:57:19 +00:00
2023-04-07 03:21:38 +00:00