1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
|
# Some useful helpers for dealing with strings.
# result:boolean <- string-equal a:address:array:character, b:address:array:character
# Replies 1 when both strings have the same length and the same character at
# every index, 0 otherwise. Emits one trace line before each comparison phase.
recipe string-equal [
  default-space:address:array:location <- new location:type, 30:literal
  lhs:address:array:character <- next-ingredient
  lhs-len:number <- length lhs:address:array:character/deref
  rhs:address:array:character <- next-ingredient
  rhs-len:number <- length rhs:address:array:character/deref
  # phase 1: strings of different lengths can never match
  {
    trace [string-equal], [comparing lengths]
    same-length?:boolean <- equal lhs-len:number, rhs-len:number
    break-if same-length?:boolean
    reply 0:literal
  }
  # phase 2: walk both strings in lockstep, bailing out at the first mismatch
  trace [string-equal], [comparing characters]
  pos:number <- copy 0:literal
  {
    # until pos reaches the shared length
    exhausted?:boolean <- greater-or-equal pos:number, lhs-len:number
    break-if exhausted?:boolean
    lhs-char:character <- index lhs:address:array:character/deref, pos:number
    rhs-char:character <- index rhs:address:array:character/deref, pos:number
    {
      same-char?:boolean <- equal lhs-char:character, rhs-char:character
      break-if same-char?:boolean
      reply 0:literal
    }
    pos:number <- add pos:number, 1:literal
    loop
  }
  # every position matched
  reply 1:literal
]
# A string compared against itself, via the same address, is equal.
scenario string-equal-reflexive [
  run [
    default-space:address:array:location <- new location:type, 30:literal
    s:address:array:character <- new [abc]
    3:boolean/raw <- string-equal s:address:array:character, s:address:array:character
  ]
  memory-should-contain [
    3 <- 1  # s == s for any s
  ]
]
# Two separately allocated strings with the same contents are equal.
scenario string-equal-identical [
  run [
    default-space:address:array:location <- new location:type, 30:literal
    first:address:array:character <- new [abc]
    second:address:array:character <- new [abc]
    3:boolean/raw <- string-equal first:address:array:character, second:address:array:character
  ]
  memory-should-contain [
    3 <- 1  # abc == abc
  ]
]
# Strings of different lengths are unequal, and the length check alone decides
# it: the character-comparison phase must never be traced.
scenario string-equal-distinct-lengths [
  run [
    default-space:address:array:location <- new location:type, 30:literal
    shorter:address:array:character <- new [abc]
    longer:address:array:character <- new [abcd]
    3:boolean/raw <- string-equal shorter:address:array:character, longer:address:array:character
  ]
  memory-should-contain [
    3 <- 0  # abc != abcd
  ]
  trace-should-contain [
    string-equal: comparing lengths
  ]
  trace-should-not-contain [
    string-equal: comparing characters
  ]
]
# The empty string is unequal to a non-empty one.
scenario string-equal-with-empty [
  run [
    default-space:address:array:location <- new location:type, 30:literal
    empty:address:array:character <- new []
    non-empty:address:array:character <- new [abcd]
    3:boolean/raw <- string-equal empty:address:array:character, non-empty:address:array:character
  ]
  memory-should-contain [
    3 <- 0  # "" != abcd
  ]
]
# Strings of equal length that differ in one character are unequal.
scenario string-equal-common-lengths-but-distinct [
  run [
    default-space:address:array:location <- new location:type, 30:literal
    first:address:array:character <- new [abc]
    second:address:array:character <- new [abd]
    3:boolean/raw <- string-equal first:address:array:character, second:address:array:character
  ]
  memory-should-contain [
    3 <- 0  # abc != abd
  ]
]
# A new type to help incrementally construct strings.
# 'length' is the number of characters appended so far: init-buffer starts it
# at zero and buffer-append increments it.
# 'data' is the backing character array; its own array length is the capacity
# that buffer-full? compares 'length' against.
container buffer [
length:number
data:address:array:character
]
# result:address:buffer <- init-buffer capacity:number
# Allocates a buffer that holds no characters yet and whose backing array has
# room for 'capacity' characters.
recipe init-buffer [
  default-space:address:array:location <- new location:type, 30:literal
  capacity:number <- next-ingredient
  result:address:buffer <- new buffer:type
  # nothing has been appended yet
  count:address:number <- get-address result:address:buffer/deref, length:offset
  count:address:number/deref <- copy 0:literal
  # backing array sized to the requested capacity
  storage:address:address:array:character <- get-address result:address:buffer/deref, data:offset
  storage:address:address:array:character/deref <- new character:type, capacity:number
  reply result:address:buffer
]
# in:address:buffer <- grow-buffer in:address:buffer
# Replaces the buffer's backing array with one of twice the capacity and copies
# the old contents across. A buffer whose capacity is zero grows to capacity 1,
# since doubling zero would leave it unable to hold anything.
recipe grow-buffer [
  default-space:address:array:location <- new location:type, 30:literal
  in:address:buffer <- next-ingredient
  # double buffer size
  x:address:address:array:character <- get-address in:address:buffer/deref, data:offset
  oldlen:number <- length x:address:address:array:character/deref/deref
  newlen:number <- multiply oldlen:number, 2:literal
  {
    # twice zero is still zero; always make room for at least one character
    break-if newlen:number
    newlen:number <- copy 1:literal
  }
  # keep hold of the old array before overwriting the data field
  olddata:address:array:character <- copy x:address:address:array:character/deref
  x:address:address:array:character/deref <- new character:type, newlen:number
  # copy old contents
  i:number <- copy 0:literal
  {
    # while i < oldlen
    done?:boolean <- greater-or-equal i:number, oldlen:number
    break-if done?:boolean
    # new-data at i = old-data at i
    src:character <- index olddata:address:array:character/deref, i:number
    dest:address:character <- index-address x:address:address:array:character/deref/deref, i:number
    dest:address:character/deref <- copy src:character
    i:number <- add i:number, 1:literal
    loop
  }
  reply in:address:buffer
]
# result:boolean <- buffer-full? in:address:buffer
# True when the number of characters stored has reached the length of the
# backing array.
recipe buffer-full? [
  default-space:address:array:location <- new location:type, 30:literal
  buf:address:buffer <- next-ingredient
  used:number <- get buf:address:buffer/deref, length:offset
  storage:address:array:character <- get buf:address:buffer/deref, data:offset
  room:number <- length storage:address:array:character/deref
  no-room-left?:boolean <- greater-or-equal used:number, room:number
  reply no-room-left?:boolean
]
# in:address:buffer <- buffer-append in:address:buffer, c:character
# Stores c in the first unused slot of the buffer, growing the buffer first if
# it is already full, and replies the same buffer.
recipe buffer-append [
  default-space:address:array:location <- new location:type, 30:literal
  in:address:buffer <- next-ingredient
  new-char:character <- next-ingredient
  # make room first if every slot is taken
  {
    no-room?:boolean <- buffer-full? in:address:buffer
    break-unless no-room?:boolean
    in:address:buffer <- grow-buffer in:address:buffer
  }
  # fetch the backing array only after any growth, because growing replaces it
  storage:address:array:character <- get in:address:buffer/deref, data:offset
  used:address:number <- get-address in:address:buffer/deref, length:offset
  # write into the first unused slot, then count it as used
  slot:address:character <- index-address storage:address:array:character/deref, used:address:number/deref
  slot:address:character/deref <- copy new-char:character
  used:address:number/deref <- add used:address:number/deref, 1:literal
  reply in:address:buffer/same-as-ingredient:0
]
# Fills a 3-character buffer exactly, checks that its backing array was not
# replaced, then appends a fourth character and checks that the backing array
# was replaced by one of twice the capacity holding the same contents.
scenario buffer-append-works [
  run [
    default-space:address:array:location <- new location:type, 30:literal
    buf:address:buffer <- init-buffer 3:literal
    data-at-start:address:array:character <- get buf:address:buffer/deref, data:offset
    buf:address:buffer <- buffer-append buf:address:buffer, 97:literal  # 'a'
    buf:address:buffer <- buffer-append buf:address:buffer, 98:literal  # 'b'
    buf:address:buffer <- buffer-append buf:address:buffer, 99:literal  # 'c'
    data-when-full:address:array:character <- get buf:address:buffer/deref, data:offset
    1:boolean/raw <- equal data-at-start:address:array:character, data-when-full:address:array:character
    2:array:character/raw <- copy data-when-full:address:array:character/deref
    +buffer-filled
    buf:address:buffer <- buffer-append buf:address:buffer, 100:literal  # 'd'
    data-after-growth:address:array:character <- get buf:address:buffer/deref, data:offset
    10:boolean/raw <- equal data-at-start:address:array:character, data-after-growth:address:array:character
    11:number/raw <- get buf:address:buffer/deref, length:offset
    12:array:character/raw <- copy data-after-growth:address:array:character/deref
  ]
  memory-should-contain [
    # snapshot taken before +buffer-filled
    1 <- 1   # backing array is still the original one
    2 <- 3   # its size
    3 <- 97  # its contents
    4 <- 98
    5 <- 99
    # snapshot taken at the end
    10 <- 0   # backing array has been replaced
    11 <- 4   # characters stored
    12 <- 6   # capacity has doubled
    13 <- 97  # contents carried over, plus the new character
    14 <- 98
    15 <- 99
    16 <- 100
    17 <- 0   # unused slots
    18 <- 0
  ]
]
# result:address:array:character <- integer-to-decimal-string n:number
# Replies a newly allocated string holding the base-10 digits of n, preceded by
# '-' when n is below zero.
recipe integer-to-decimal-string [
  default-space:address:array:location <- new location:type, 30:literal
  value:number <- next-ingredient
  # zero never enters the digit loop below, so answer it directly
  {
    break-if value:number
    result:address:array:character <- new [0]
    reply result:address:array:character
  }
  # note the sign, then work on the magnitude
  minus?:boolean <- copy 0:literal
  {
    below-zero?:boolean <- lesser-than value:number, 0:literal
    break-unless below-zero?:boolean
    minus?:boolean <- copy 1:literal
    value:number <- multiply value:number, -1:literal
  }
  # peel off digits, least significant first, into a scratch buffer
  ascii-zero:number <- copy 48:literal  # '0'
  scratch:address:buffer <- init-buffer 30:literal
  {
    exhausted?:boolean <- equal value:number, 0:literal
    break-if exhausted?:boolean
    value:number, digit:number <- divide-with-remainder value:number, 10:literal
    digit-char:character <- add ascii-zero:number, digit:number
    scratch:address:buffer <- buffer-append scratch:address:buffer, digit-char:character
    loop
  }
  # the sign is appended last because the buffer is reversed below
  {
    break-unless minus?:boolean
    scratch:address:buffer <- buffer-append scratch:address:buffer, 45:literal  # '-'
  }
  # copy the scratch buffer back to front into a string of exactly the right size
  count:number <- get scratch:address:buffer/deref, length:offset
  chars:address:array:character <- get scratch:address:buffer/deref, data:offset
  result:address:array:character <- new character:type, count:number
  from:number <- subtract count:number, 1:literal
  to:number <- copy 0:literal
  {
    # while from >= 0
    copied-all?:boolean <- lesser-than from:number, 0:literal
    break-if copied-all?:boolean
    # result at to = scratch at from
    ch:character <- index chars:address:array:character/deref, from:number
    slot:address:character <- index-address result:address:array:character/deref, to:number
    slot:address:character/deref <- copy ch:character
    # --from
    from:number <- subtract from:number, 1:literal
    # ++to
    to:number <- add to:number, 1:literal
    loop
  }
  reply result:address:array:character
]
# Zero converts to the one-character string 0.
scenario integer-to-decimal-digit-zero [
run [
1:address:array:character/raw <- integer-to-decimal-string 0:literal
# copy the string itself to location 2 onward so its contents can be checked
2:array:character/raw <- copy 1:address:array:character/deref/raw
]
memory-should-contain [
2:string <- [0]
]
]
# A multi-digit positive number converts with its digits in reading order.
scenario integer-to-decimal-digit-positive [
run [
1:address:array:character/raw <- integer-to-decimal-string 234:literal
# copy the string itself to location 2 onward so its contents can be checked
2:array:character/raw <- copy 1:address:array:character/deref/raw
]
memory-should-contain [
2:string <- [234]
]
]
# A negative number converts to a minus sign followed by its digits.
scenario integer-to-decimal-digit-negative [
run [
1:address:array:character/raw <- integer-to-decimal-string -1:literal
# copy the string itself to location 2 onward so its contents can be checked
2:array:character/raw <- copy 1:address:array:character/deref/raw
]
memory-should-contain [
# location 2 holds the array length, followed by one location per character
2 <- 2
3 <- 45 # '-'
4 <- 49 # '1'
]
]
# result:address:array:character <- string-append a:address:array:character, b:address:array:character
# Replies a newly allocated string holding the characters of a followed by the
# characters of b. Neither ingredient is modified.
recipe string-append [
  default-space:address:array:location <- new location:type, 30:literal
  # result = new character array of size first.length + second.length
  first:address:array:character <- next-ingredient
  first-len:number <- length first:address:array:character/deref
  second:address:array:character <- next-ingredient
  second-len:number <- length second:address:array:character/deref
  total-len:number <- add first-len:number, second-len:number
  result:address:array:character <- new character:type, total-len:number
  # write-pos runs across both copy loops; read-pos restarts for each source
  write-pos:number <- copy 0:literal
  # copy first into result
  read-pos:number <- copy 0:literal
  {
    # while read-pos < first.length
    first-done?:boolean <- greater-or-equal read-pos:number, first-len:number
    break-if first-done?:boolean
    # result at write-pos = first at read-pos
    slot:address:character <- index-address result:address:array:character/deref, write-pos:number
    ch:character <- index first:address:array:character/deref, read-pos:number
    slot:address:character/deref <- copy ch:character
    # advance both positions
    read-pos:number <- add read-pos:number, 1:literal
    write-pos:number <- add write-pos:number, 1:literal
    loop
  }
  # copy second into result, continuing where the first copy stopped
  read-pos:number <- copy 0:literal
  {
    # while read-pos < second.length
    second-done?:boolean <- greater-or-equal read-pos:number, second-len:number
    break-if second-done?:boolean
    # result at write-pos = second at read-pos
    slot:address:character <- index-address result:address:array:character/deref, write-pos:number
    ch:character <- index second:address:array:character/deref, read-pos:number
    slot:address:character/deref <- copy ch:character
    # advance both positions
    read-pos:number <- add read-pos:number, 1:literal
    write-pos:number <- add write-pos:number, 1:literal
    loop
  }
  reply result:address:array:character
]
# Appending two strings yields their characters back to back, including the
# comma and the leading space inside the literals.
scenario string-append-1 [
run [
1:address:array:character/raw <- new [hello,]
2:address:array:character/raw <- new [ world!]
3:address:array:character/raw <- string-append 1:address:array:character/raw, 2:address:array:character/raw
# copy the result string to location 4 onward so its contents can be checked
4:array:character/raw <- copy 3:address:array:character/raw/deref
]
memory-should-contain [
4:string <- [hello, world!]
]
]
# replace underscores in first with remaining args
# result:address:array:character <- interpolate template:address:array:character, ...
#
# Each '_' in the template is replaced, left to right, by the next string
# ingredient. The ingredients are walked twice: once to size the result and
# once to fill it. Any template text left over once the ingredients run out is
# copied through unchanged.
recipe interpolate [
  default-space:address:array:location <- new location:type, 60:literal
  template:address:array:character <- next-ingredient
  # pass 1: compute result-len, space to allocate for result
  tem-len:number <- length template:address:array:character/deref
  result-len:number <- copy tem-len:number
  {
    # while arg received
    a:address:array:character, arg-received?:boolean <- next-ingredient
    break-unless arg-received?:boolean
    # result-len = result-len + arg.length - 1 for the underscore being replaced
    a-len:number <- length a:address:array:character/deref
    result-len:number <- add result-len:number, a-len:number
    result-len:number <- subtract result-len:number, 1:literal
    loop
  }
  # pass 2 starts over from the first ingredient
  rewind-ingredients
  _ <- next-ingredient  # skip template
  # result = new character array of size result-len
  result:address:array:character <- new character:type, result-len:number
  # repeatedly copy sections of template and 'holes' into result
  result-idx:number <- copy 0:literal
  i:number <- copy 0:literal
  {
    # while arg received
    a:address:array:character, arg-received?:boolean <- next-ingredient
    break-unless arg-received?:boolean
    # a-len still holds the length of the last arg seen in pass 1;
    # refresh it so that the copy below stays within the bounds of this arg
    a-len:number <- length a:address:array:character/deref
    # copy template into result until '_'
    {
      # while i < template.length
      tem-done?:boolean <- greater-or-equal i:number, tem-len:number
      break-if tem-done?:boolean, +done:label
      # while template at i is not '_'
      in:character <- index template:address:array:character/deref, i:number
      underscore?:boolean <- equal in:character, 95:literal  # '_'
      break-if underscore?:boolean
      # result at result-idx = template at i
      out:address:character <- index-address result:address:array:character/deref, result-idx:number
      out:address:character/deref <- copy in:character
      # ++i
      i:number <- add i:number, 1:literal
      # ++result-idx
      result-idx:number <- add result-idx:number, 1:literal
      loop
    }
    # copy 'a' into result
    j:number <- copy 0:literal
    {
      # while j < a.length
      arg-done?:boolean <- greater-or-equal j:number, a-len:number
      break-if arg-done?:boolean
      # result at result-idx = a at j
      in:character <- index a:address:array:character/deref, j:number
      out:address:character <- index-address result:address:array:character/deref, result-idx:number
      out:address:character/deref <- copy in:character
      # ++j
      j:number <- add j:number, 1:literal
      # ++result-idx
      result-idx:number <- add result-idx:number, 1:literal
      loop
    }
    # skip '_' in template
    i:number <- add i:number, 1:literal
    loop  # interpolate next arg
  }
  +done
  # done with holes; copy rest of template directly into result
  {
    # while i < template.length
    tem-done?:boolean <- greater-or-equal i:number, tem-len:number
    break-if tem-done?:boolean
    # result at result-idx = template at i
    in:character <- index template:address:array:character/deref, i:number
    out:address:character <- index-address result:address:array:character/deref, result-idx:number
    out:address:character/deref <- copy in:character
    # ++i
    i:number <- add i:number, 1:literal
    # ++result-idx
    result-idx:number <- add result-idx:number, 1:literal
    loop
  }
  reply result:address:array:character
]
# A single underscore at the end of the template is replaced by the argument.
scenario interpolate-works [
#? dump run #? 1
run [
1:address:array:character/raw <- new [abc _]
2:address:array:character/raw <- new [def]
3:address:array:character/raw <- interpolate 1:address:array:character/raw, 2:address:array:character/raw
# copy the result string to location 4 onward so its contents can be checked
4:array:character/raw <- copy 3:address:array:character/raw/deref
]
memory-should-contain [
4:string <- [abc def]
]
]
# An underscore at the very start of the template is replaced, and nothing is
# written past the end of the result.
scenario interpolate-at-start [
run [
1:address:array:character/raw <- new [_, hello!]
2:address:array:character/raw <- new [abc]
3:address:array:character/raw <- interpolate 1:address:array:character/raw, 2:address:array:character/raw
# copy the result string to location 4 onward so its contents can be checked
4:array:character/raw <- copy 3:address:array:character/raw/deref
]
memory-should-contain [
4:string <- [abc, hello!]
# location 4 holds the length and 5 through 15 the 11 characters, so 16 is the
# first location after the copied string
16 <- 0 # out of bounds
]
]
# An underscore as the last character of the template is replaced.
scenario interpolate-at-end [
run [
1:address:array:character/raw <- new [hello, _]
2:address:array:character/raw <- new [abc]
3:address:array:character/raw <- interpolate 1:address:array:character/raw, 2:address:array:character/raw
# copy the result string to location 4 onward so its contents can be checked
4:array:character/raw <- copy 3:address:array:character/raw/deref
]
memory-should-contain [
4:string <- [hello, abc]
]
]
# result:boolean <- space? c:character
# Replies true when c equals one of the whitespace code points listed below.
# The code points are tested one at a time, jumping to the reply as soon as one
# matches.
recipe space? [
  default-space:address:array:location <- new location:type, 30:literal
  c:character <- next-ingredient
  # most common cases first
  result:boolean <- equal c:character, 32:literal/space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 10:literal/newline
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 9:literal/tab
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 13:literal/carriage-return
  jump-if result:boolean, +reply:label
  # remaining uncommon cases in sorted order
  # http://unicode.org code-points in unicode-set Z and Pattern_White_Space
  result:boolean <- equal c:character, 11:literal/ctrl-k
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 12:literal/ctrl-l
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 133:literal/ctrl-0085
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 160:literal/no-break-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 5760:literal/ogham-space-mark
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8192:literal/en-quad
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8193:literal/em-quad
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8194:literal/en-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8195:literal/em-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8196:literal/three-per-em-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8197:literal/four-per-em-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8198:literal/six-per-em-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8199:literal/figure-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8200:literal/punctuation-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8201:literal/thin-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8202:literal/hair-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8206:literal/left-to-right
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8207:literal/right-to-left
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8232:literal/line-separator
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8233:literal/paragraph-separator
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8239:literal/narrow-no-break-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 8287:literal/medium-mathematical-space
  jump-if result:boolean, +reply:label
  result:boolean <- equal c:character, 12288:literal/ideographic-space
  # no jump needed after the last test: control falls through to the reply
  # with result holding the outcome of that final comparison
  +reply
  reply result:boolean
]
# result:address:array:character <- trim s:address:array:character
# Replies a newly allocated copy of s without the whitespace, as judged by
# space?, at either end. An empty or all-whitespace s yields an empty string.
# s itself is not modified.
recipe trim [
  default-space:address:array:location <- new location:type, 30:literal
  s:address:array:character <- next-ingredient
  len:number <- length s:address:array:character/deref
  # left trim: compute start
  start:number <- copy 0:literal
  {
    {
      # running off the end means there is nothing but whitespace
      at-end?:boolean <- greater-or-equal start:number, len:number
      break-unless at-end?:boolean
      result:address:array:character <- new character:type, 0:literal
      reply result:address:array:character
    }
    curr:character <- index s:address:array:character/deref, start:number
    whitespace?:boolean <- space? curr:character
    break-unless whitespace?:boolean
    start:number <- add start:number, 1:literal
    loop
  }
  # right trim: compute end
  end:number <- subtract len:number, 1:literal
  {
    # the character at start is known to be non-whitespace, so end may meet
    # start, as it does when only one character survives, but never pass it
    not-before-start?:boolean <- greater-or-equal end:number, start:number
    assert not-before-start?:boolean, [end ran up against start]
    curr:character <- index s:address:array:character/deref, end:number
    whitespace?:boolean <- space? curr:character
    break-unless whitespace?:boolean
    end:number <- subtract end:number, 1:literal
    loop
  }
  # result = new character array of size end+1 - start
  new-len:number <- subtract end:number, start:number
  new-len:number <- add new-len:number, 1:literal
  result:address:array:character <- new character:type, new-len:number
  # i = start, j = 0
  i:number <- copy start:number
  j:number <- copy 0:literal
  {
    # while i <= end
    done?:boolean <- greater-than i:number, end:number
    break-if done?:boolean
    # result at j = s at i
    src:character <- index s:address:array:character/deref, i:number
    dest:address:character <- index-address result:address:array:character/deref, j:number
    dest:address:character/deref <- copy src:character
    # ++i, ++j
    i:number <- add i:number, 1:literal
    j:number <- add j:number, 1:literal
    loop
  }
  reply result:address:array:character
]
# A string with no whitespace at either end comes back with the same contents.
scenario trim-unmodified [
run [
1:address:array:character <- new [abc]
2:address:array:character <- trim 1:address:array:character
# copy the result string to location 3 onward so its contents can be checked
3:array:character <- copy 2:address:array:character/deref
]
memory-should-contain [
3:string <- [abc]
]
]
# Whitespace before the first non-whitespace character is dropped.
scenario trim-left [
run [
1:address:array:character <- new [ abc]
2:address:array:character <- trim 1:address:array:character
# copy the result string to location 3 onward so its contents can be checked
3:array:character <- copy 2:address:array:character/deref
]
memory-should-contain [
3:string <- [abc]
]
]
# Whitespace after the last non-whitespace character is dropped.
scenario trim-right [
run [
1:address:array:character <- new [abc ]
2:address:array:character <- trim 1:address:array:character
# copy the result string to location 3 onward so its contents can be checked
3:array:character <- copy 2:address:array:character/deref
]
memory-should-contain [
3:string <- [abc]
]
]
# Whitespace is dropped from both ends in a single call.
scenario trim-left-right [
run [
1:address:array:character <- new [ abc ]
2:address:array:character <- trim 1:address:array:character
# copy the result string to location 3 onward so its contents can be checked
3:array:character <- copy 2:address:array:character/deref
]
memory-should-contain [
3:string <- [abc]
]
]
# Whitespace other than plain spaces is trimmed too: the literal below spans
# two lines, so it ends in a newline.
# NOTE(review): the scenario name suggests the leading whitespace is meant to
# be a tab; confirm that the literal still contains one.
scenario trim-newline-tab [
run [
1:address:array:character <- new [ abc
]
2:address:array:character <- trim 1:address:array:character
# copy the result string to location 3 onward so its contents can be checked
3:array:character <- copy 2:address:array:character/deref
]
memory-should-contain [
3:string <- [abc]
]
]
|