-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcore-attr.c
666 lines (606 loc) · 14.4 KB
/
core-attr.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
/*
* Copyright Neil Brown ©2015-2021 <[email protected]>
* May be distributed under terms of GPLv2 - see file:COPYING
*
* Attributes.
*
* Attributes are attached to text in buffers and to marks and probably
* other things.
* They are simply name=value pairs, stored as strings though direct
* conversion to numbers and Bools is provided.
* Values must be "small". The name and value together must be less than
* 512 bytes, and there is probably some padding in there. If you get
* even close to this limit you are doing something wrong.
* Larger strings need to be stored elsewhere with some sort of indirect.
* (Hmmm.. this excludes file names - is that a good idea?)
*
* Attributes are stored in a list sorted by attribute name. Strings
* of digits in the name sort like the number they represent, so "6hello"
* comes before "10world". When such a number compares against a single
* non-digit character the char comes first.
*
* Attributes for text are stored in one list for a section of text.
* Each attribute is prefixed by the offset where the attribute applies.
*
* The offsets are really byte offsets - the text is utf-8.
*
* When attributes are stored on non-text objects they don't have
* a number prefix.
*
*/
#include <stdlib.h>
#include <malloc.h>
#include <string.h>
#include <ctype.h>
#include "core.h"
struct attrset {
unsigned short size, /* space allocated */
len; /* space used */
struct attrset *next;
char attrs[0];
};
/* NOTE: this MAX is the largest sized allocation which
* can be shared by multiple attrs. The size is the sum
* of keys and values including nul terminator.
* If an attr is larger, it gets an attrset all of its own.
*/
#if defined(TEST_ATTR_ADD_DEL)
#define MAX_ATTR_SIZE (64 - sizeof(struct attrset))
#else
#define MAX_ATTR_SIZE (512 - sizeof(struct attrset))
#endif
static struct attrset *safe newattr(struct attrset *old, int size)
{
struct attrset *set = realloc(old, sizeof(struct attrset) + size);
set->size = size;
if (old == NULL) {
set->len = 0;
set->next = NULL;
}
return set;
}
/* attr_cmp just deals with bytes and ASCII digits, so it is
* not aware for wchars
*/
static int getcmptok(const char **ap safe)
{
const char *a safe;
char c;
int i;
if (!*ap)
/* FIXME smatch should handle "char * safe *ap safe" */
return 0;
a = *ap;
c = *a++;
if (!isdigit(c)) {
*ap = a;
return c;
}
i = c - '0';
while (isdigit(*a)) {
c = *a++;
i = i*10 + (c - '0');
}
*ap = a;
return i+256;
}
/* Compare 'a' and 'b' treating strings of digits as numbers.
* If bnum >= 0, it is used as a leading number on 'b'.
*/
static int attr_cmp(const char *a safe, const char *b safe, int bnum)
{
while (*a && (*b || bnum >= 0)) {
int ai, bi;
ai = getcmptok(&a);
if (bnum >= 0) {
bi = bnum + 256;
bnum = -1;
if (*a == ' ')
a++;
} else
bi = getcmptok(&b);
if (ai < bi)
return -1;
if (ai > bi)
return 1;
}
if (*a)
return 1;
if (*b)
return -1;
return 0;
}
#ifdef TEST_ATTR_CMP
#include <stdlib.h>
#include <stdio.h>
struct {const char *a, *b; int result;} test[] = {
{ "hello", "there", -1},
{ "6hello", "10world", -1},
{ "0005six", "5six", 0},
{ "ab56", "abc", 1},
};
int main(int argc, char *argv[])
{
int i;
int rv = 0;
for (i = 0; i < sizeof(test)/sizeof(test[0]); i++) {
if (attr_cmp(test[i].a, test[i].b, -1) == test[i].result)
printf("%s <-> %s = %d OK\n",
test[i].a, test[i].b, test[i].result);
else {
printf("%s <-> %s = %d, not %d\n",
test[i].a, test[i].b, attr_cmp(test[i].a,
test[i].b, -1),
test[i].result);
rv = 1;
}
}
exit(rv);
}
#endif
static int _attr_find(struct attrset ***setpp safe, const char *key safe,
int *offsetp safe, int keynum)
{
struct attrset **setp safe;
struct attrset *set;
int i;
if (!*setpp)
/* FIXME smatch should check this */
return -1;
setp = *setpp;
set = *setp;
if (!set)
return -1;
*offsetp = 0;
while (set->next &&
attr_cmp(set->next->attrs, key, keynum) <= 0) {
setp = &set->next;
set = *setp;
}
*setpp = setp;
for (i = 0; i < set->len; ) {
int cmp = attr_cmp(set->attrs + i, key, keynum);
if (cmp >= 0) {
*offsetp = i;
*setpp = setp;
return cmp;
}
i += strlen(set->attrs + i) + 1;
i += strlen(set->attrs + i) + 1;
}
*offsetp = i;
return 1;
}
static void do_del(struct attrset * *setp safe, int offset)
{
int len;
struct attrset *set;
set = safe_cast *setp;
len = strlen(set->attrs + offset) + 1;
len += strlen(set->attrs + offset + len) + 1;
memmove(set->attrs + offset,
set->attrs + offset + len,
set->len - (offset + len));
set->len -= len;
if (set->len == 0) {
*setp = set->next;
free(set);
}
}
bool attr_del(struct attrset * *setp safe, const char *key safe)
{
int offset = 0;
int cmp;
cmp = _attr_find(&setp, key, &offset, -1);
if (cmp)
/* Not found */
return False;
do_del(setp, offset);
return True;
}
void attr_del_all(struct attrset * *setp safe, const char *key safe,
int low, int high)
{
int offset = 0;
/* Delete all attrs 'key' with keynum from 'low' to 'high' */
while (low <= high) {
struct attrset *set;
int n;
int cmp = _attr_find(&setp, key, &offset, low);
if (cmp < 0)
/* Nothing more to find */
return;
low += 1;
if (cmp == 0) {
/* Found, better delete */
do_del(setp, offset);
continue;
}
/* found something higher, possibly update 'low'
* to skip over gaps.
*/
set = *setp;
if (!set || offset >= set->len)
continue;
n = atoi(set->attrs + offset);
if (n > low)
low = n;
}
}
char *attr_get_str(struct attrset *set, const char *key safe, int keynum)
{
struct attrset **setp = &set;
int offset = 0;
int cmp = _attr_find(&setp, key, &offset, keynum);
if (cmp != 0 || !*setp)
return NULL;
set = *setp;
offset += strlen(set->attrs + offset) + 1;
return set->attrs + offset;
}
char *attr_find(struct attrset *set, const char *key safe)
{
return attr_get_str(set, key, -1);
}
const char *attr_get_next_key(struct attrset *set, const char *key safe,
int keynum, const char **valp safe)
{
struct attrset **setp = &set;
int offset = 0;
int cmp = _attr_find(&setp, key, &offset, keynum);
const char *val;
if (cmp < 0)
return NULL;
set = safe_cast *setp;
if (cmp == 0) {
/* Skip the matching key, then value */
offset += strlen(set->attrs + offset) + 1;
offset += strlen(set->attrs + offset) + 1;
}
if (offset >= set->len) {
set = set->next;
offset = 0;
}
if (!set)
return NULL;
key = set->attrs + offset;
val = key + strlen(key) + 1;
if (keynum >= 0) {
int kn = getcmptok(&key);
if (kn != keynum + 256)
return NULL;
if (*key == ' ')
key += 1;
}
*valp = val;
return key;
}
int attr_set_str_key(struct attrset **setp safe,
const char *key safe, const char *val,
int keynum)
{
int offset = 0;
int cmp;
struct attrset *set;
unsigned int len, keylen, vallen;
char nkey[22];
int nkeylen = 0;
cmp = _attr_find(&setp, key, &offset, keynum);
if (cmp == 0)
/* Remove old value */
do_del(setp, offset);
if (!val)
return cmp;
set = *setp;
if (keynum >= 0) {
snprintf(nkey, sizeof(nkey), "%d ", keynum);
nkeylen = strlen(nkey);
} else
nkey[0] = 0;
keylen = strlen(key);
vallen = strlen(val);
len = nkeylen + keylen + 1 + vallen + 1;
while (set == NULL || set->len + len > set->size) {
/* Need to re-alloc or alloc new */
if (!set || (offset == 0 && len + set->len > MAX_ATTR_SIZE)) {
/* Create a new set - which may exceed MAX_ATTR_SIZE */
struct attrset *new = newattr(NULL, len);
new->next = set;
*setp = new;
set = new;
} else if (set->len + len <= MAX_ATTR_SIZE) {
/* Just make this block bigger */
set = newattr(set, set->len + len);
*setp = set;
} else if (offset + len <= MAX_ATTR_SIZE) {
/* split following entries in separate block */
struct attrset *new = newattr(NULL, set->len - offset);
new->next = set->next;
set->next = new;
new->len = set->len - offset;
set->len = offset;
memcpy(new->attrs, set->attrs + offset,
new->len);
} else if (offset == set->len) {
/* Need to add after here */
setp = &set->next;
set = *setp;
offset = 0;
} else {
/* offset must be > 0.
* Split off following entries and try again there.
*/
struct attrset *new = newattr(NULL,
set->len - offset);
new->next = set->next;
set->next = new;
new->len = set->len - offset;
set->len = offset;
memcpy(new->attrs, set->attrs + offset,
new->len);
setp = &set->next;
set = new;
offset = 0;
}
}
memmove(set->attrs + offset + len, set->attrs + offset,
set->len - offset);
memcpy(set->attrs + offset, nkey, nkeylen);
memcpy(set->attrs + offset + nkeylen, key, keylen + 1);
memcpy(set->attrs + offset + nkeylen + keylen + 1, val, vallen + 1);
set->len += len;
return cmp;
}
int attr_set_str(struct attrset **setp safe,
const char *key safe, const char *val)
{
return attr_set_str_key(setp, key, val, -1);
}
#if defined(TEST_ATTR_ADD_DEL) || defined(TEST_ATTR_TRIM)
void attr_dump(struct attrset *set)
{
printf("DUMP ATTRS:\n");
while (set) {
int i;
printf(" %d of %d:\n", set->len, set->size);
for (i = 0; i < set->len; ) {
printf(" %3d: \"%s\"", i, set->attrs + i);
i += strlen(set->attrs+i) + 1;
printf(" -> \"%s\"\n", set->attrs + i);
i += strlen(set->attrs+i) + 1;
}
set = set->next;
}
printf("END DUMP\n");
}
#endif
#ifdef TEST_ATTR_ADD_DEL
enum act { Add, Remove, Find };
struct action {
enum act act;
char *key;
char *val;
} actions[] = {
{ Add, "Hello", "world"},
{ Add, "05 Foo", "Bar" },
{ Add, "1 Bold", "off" },
{ Add, "9 Underline", "on" },
{ Remove, "Hello", NULL },
{ Find, "5 Foo", "Bar" },
{ Add, "20 Thing", "Stuff" },
{ Add, "01 Bold", "on" },
{ Add, "1 StrikeThrough", "no" },
{ Add, "2 StrikeThrough", "no" },
{ Find, "1 StrikeThrough", "no" },
{ Find, "5 Foo", "Bar" },
{ Add, "1 Nextthing", "nonono" },
};
int main(int argc, char *argv[])
{
int i;
int rv = 0;
struct attrset *set = NULL;
for (i = 0; i < sizeof(actions)/sizeof(actions[0]); i++) {
struct action *a = &actions[i];
char *v;
switch(a->act) {
case Add:
attr_set_str(&set, a->key, a->val); continue;
case Remove:
if (!attr_del(&set, a->key)) {
printf("Action %d: Remove %s: failed\n",
i, a->key);
rv = 1;
break;
}
continue;
case Find:
v = attr_find(set, a->key);
if (!v || strcmp(v, a->val) != 0) {
printf("Action %d: Find %s: Found %s\n",
i, a->key, v);
rv = 1;
break;
}
continue;
}
break;
}
attr_dump(set);
exit(rv);
}
#endif
/* Have versions that take and return numbers, '-1' for 'not found' */
int attr_find_int(struct attrset *set, const char *key safe)
{
const char *val = attr_find(set, key);
unsigned long rv;
char *end;
if (!val)
return -1;
rv = strtoul(val, &end, 10);
if (!end || end == val || *end)
return -1;
return rv;
}
int attr_set_int(struct attrset **setp safe, const char *key safe, int val)
{
/* 3 digits per bytes, +1 for sign and +1 for trailing nul */
char sval[sizeof(int)*3+2];
snprintf(sval, sizeof(sval), "%d", val);
return attr_set_str(setp, key, sval);
}
#ifdef TEST_ATTR_INT
int main(int argc, char *argv[])
{
struct attrset *set = NULL;
attr_set_int(&set, "One", 1);
attr_set_int(&set, "Twelve", 12);
attr_set_int(&set, "Four", 4);
if (attr_find_int(set, "One") +
attr_find_int(set, "Twelve") +
attr_find_int(set, "Four")
!= 17) {
printf("Didn't find One, Twelve, Four\n");
exit(2);
}
if (attr_find_int(set, "Three") != -1) {
printf("Surprisingly found Three\n");
exit(2);
}
exit(0);
}
#endif
void attr_free(struct attrset **setp safe)
{
struct attrset *set = *setp;
*setp = NULL;
while (set) {
struct attrset *next = set->next;
free(set);
set = next;
}
}
/*
* When attributes are attached to a section of text,
* we might want to split the text and so split the attributes.
* So:
* 1- 'trim' all attributes beyond a given key
* 2- copy attributes, subtracting some number from the offset.
* At offset '0', an empty value deletes the key.
*/
void attr_trim(struct attrset **setp safe, int nkey)
{
int offset;
struct attrset *set;
_attr_find(&setp, "", &offset, nkey);
set = *setp;
if (!set)
return;
set->len = offset;
if (offset)
setp = &set->next;
attr_free(setp);
}
/* make a copy of 'set', keeping only attributes from 'nkey'
* onwards.
*/
struct attrset *attr_copy_tail(struct attrset *set, int nkey)
{
struct attrset *newset = NULL;
for (; set ; set = set->next) {
int i;
for (i = 0; i < set->len; ) {
char *k, *v;
int n;
k = set->attrs + i;
i += strlen(k) + 1;
v = set->attrs + i;
i += strlen(v) + 1;
n = atoi(k);
if (n < nkey)
continue;
while (*k && *k != ' ')
k++;
if (*k == ' ')
k++;
attr_set_str_key(&newset, k, v, n);
}
}
return newset;
}
/* make a copy of 'set' */
struct attrset *attr_copy(struct attrset *set)
{
struct attrset *newset, **ep = &newset;
for (; set ; set = set->next) {
struct attrset *n = newattr(NULL, set->size);
memcpy(n->attrs, set->attrs, set->len);
n->len = set->len;
*ep = n;
ep = &n->next;
}
*ep = NULL;
return newset;
}
/* Collect the attributes in effect at a given pos and return
* a new set with the new alternate numeric prefix, or nothing if '-1'
*/
struct attrset *attr_collect(struct attrset *set, unsigned int pos,
int prefix)
{
struct attrset *newset = NULL;
char kbuf[512];
for (; set ; set = set->next) {
int i;
for (i = 0; i < set->len; ) {
char *k, *v, *e;
unsigned long n;
k = set->attrs + i;
i += strlen(k) + 1;
v = set->attrs + i;
i += strlen(v) + 1;
n = strtoul(k, &e, 10);
if (n > pos)
goto done;
/* FIXME shouldn't need to test 'e' */
while (e && *e == ' ')
e++;
if (prefix >= 0) {
snprintf(kbuf, 512, "%d %s", prefix, e);
e = kbuf;
}
if (*v == '\0')
v = NULL;
if (!e) e = "FIXME";
attr_set_str(&newset, e, v);
}
}
done:
return newset;
}
#ifdef TEST_ATTR_TRIM
char *keys[] = {
"1 Bold", "2 Bold", "5 Bold", "10 Bold",
"0 Colour", "3 Colour", "08 Colour", "12 Colour",
"2 Invis", "4 Invis", "6 Invis", "9 Invis",
};
int main(int argc, char *argv[])
{
int i;
struct attrset *set = NULL;
struct attrset *newset, *new2;
for (i = 0; i < sizeof(keys)/sizeof(keys[0]); i++)
attr_set_str(&set, keys[i], keys[i], -1);
newset = attr_copy_tail(set, 5);
attr_trim(&set, 5);
new2 = attr_collect(newset, 9, 4);
attr_dump(set);
attr_dump(newset);
attr_dump(new2);
exit(0);
}
#endif
/*
* Iterator for set.
*/