1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
|
# See https://www.rfc-editor.org/rfc/rfc1524
import osproc
import streams
import strutils
import types/url
import types/opt
import utils/twtstr
import chakasu/charset
type
  # Parser state: the input stream plus a single character of push-back.
  MailcapParser = object
    stream: Stream
    hasbuf: bool # true while `buf` holds a character given to `reconsume`
    buf: char

  # Flag fields an entry may carry. The string value of each member is the
  # field name as it is spelled in a mailcap file.
  MailcapFlags* = enum
    NEEDSTERMINAL = "needsterminal"
    COPIOUSOUTPUT = "copiousoutput"
    HTMLOUTPUT = "x-htmloutput" # from w3m

  # One parsed mailcap line.
  MailcapEntry* = object
    mt*: string # main type: the part of the type field before '/'
    subt*: string # subtype: the part of the type field after '/'
    cmd*: string # command template (the field after the type field)
    flags*: set[MailcapFlags]
    nametemplate*: string # value of the "nametemplate" field, if any
    edit*: string # value of the "edit" field, if any
    test*: string # value of the "test" field, if any

  # A parsed mailcap file: its entries in file order.
  Mailcap* = seq[MailcapEntry]
# A mailcap holding a single entry whose type and subtype are both the
# wildcard "*" and whose command passes the quoted file name to xdg-open.
const DefaultMailcap* = @[
  MailcapEntry(mt: "*", subt: "*", cmd: "xdg-open '%s'")
]
proc has(state: MailcapParser): bool {.inline.} =
  ## Returns true while `consume` can still yield a character: either one
  ## was pushed back with `reconsume`, or the underlying stream has not
  ## reached its end.
  ##
  ## The push-back slot must be checked too; otherwise a character that was
  ## reconsumed just as the stream ran dry would never be read again.
  return state.hasbuf or not state.stream.atEnd
proc consume(state: var MailcapParser): char =
  ## Returns the next input character. A character previously handed to
  ## `reconsume` takes priority (and the push-back slot is cleared);
  ## otherwise one character is read from the stream.
  if not state.hasbuf:
    return state.stream.readChar()
  state.hasbuf = false
  return state.buf
proc reconsume(state: var MailcapParser, c: char) =
  ## Pushes `c` back so that the next `consume` call returns it. Only one
  ## character is kept; a second call overwrites the first.
  state.hasbuf = true
  state.buf = c
proc skipBlanks(state: var MailcapParser, c: var char): bool =
  ## Consumes characters until one is found that is not blank, stores it in
  ## `c` and returns true. A newline is not treated as blank here. Returns
  ## false if the input runs out first; `c` then holds the last character
  ## read, if any.
  result = false
  while state.has():
    c = state.consume()
    # Same test as `c notin AsciiWhitespace - {'\n'}`.
    if c == '\n' or c notin AsciiWhitespace:
      return true
proc skipBlanks(state: var MailcapParser) =
  ## Skips blanks and leaves the first non-blank character (a newline
  ## counts as non-blank) to be returned by the next `consume`.
  var next: char
  let found = state.skipBlanks(next)
  if found:
    state.reconsume(next)
proc skipLine(state: var MailcapParser) =
  ## Discards input up to and including the next newline, or up to the end
  ## of the input if no newline follows.
  while state.has():
    if state.consume() == '\n':
      return
proc consumeTypeField(state: var MailcapParser): Result[string, string] =
  ## Reads the leading "type/subtype" field of an entry, together with the
  ## semicolon that ends it, and returns it lowercased (still including the
  ## '/'). Returns an error message if a disallowed character appears, the
  ## input ends right after the type part, or no semicolon follows the
  ## subtype.
  var field = ""
  # Main type: everything up to and including the slash.
  while state.has():
    let ch = state.consume()
    if ch == '/':
      field &= ch
      break
    if ch notin AsciiAlphaNumeric + {'-', '*'}:
      return err("Invalid character encountered in type field")
    field &= ch.toLowerAscii()
  if not state.has():
    return err("Missing subtype")
  # Subtype: runs until whitespace or a semicolon, which is pushed back so
  # that the delimiter check below sees it.
  while state.has():
    let ch = state.consume()
    if ch in AsciiWhitespace + {';'}:
      state.reconsume(ch)
      break
    if ch notin AsciiAlphaNumeric + {'-', '.', '*', '_', '+'}:
      return err("Invalid character encountered in subtype field")
    field &= ch.toLowerAscii()
  var delim: char
  if not (state.skipBlanks(delim) and delim == ';'):
    return err("Semicolon not found")
  return ok(field)
proc consumeCommand(state: var MailcapParser): Result[string, string] =
  ## Reads a command up to, but not including, the next unescaped ';' or
  ## newline; that delimiter is pushed back for the caller. A backslash is
  ## dropped and the character after it is taken literally. Unescaped
  ## carriage returns are skipped. Any other unescaped character outside
  ## `Ascii - Controls` yields an error.
  state.skipBlanks()
  var command = ""
  var escaped = false
  while state.has():
    let ch = state.consume()
    if escaped:
      # Character following a backslash: accept it unconditionally.
      escaped = false
      command &= ch
      continue
    case ch
    of '\r':
      discard
    of ';', '\n':
      state.reconsume(ch)
      return ok(command)
    of '\\':
      escaped = true
    else:
      if ch notin Ascii - Controls:
        return err("Invalid character encountered in command")
      command &= ch
  return ok(command)
# Classification of a field key: either one of the three keys that take a
# "=value" part, or none of them.
type NamedField = enum
  NO_NAMED_FIELD
  NAMED_FIELD_TEST
  NAMED_FIELD_NAMETEMPLATE
  NAMED_FIELD_EDIT
proc parseFieldKey(entry: var MailcapEntry, k: string): NamedField =
  ## Interprets the field key `k`. Flag keys are recorded in `entry.flags`
  ## and yield NO_NAMED_FIELD; "test", "nametemplate" and "edit" yield the
  ## matching NamedField so the caller can store their value. Any other key
  ## is ignored and yields NO_NAMED_FIELD.
  result = NO_NAMED_FIELD
  case k
  of "test":
    result = NAMED_FIELD_TEST
  of "nametemplate":
    result = NAMED_FIELD_NAMETEMPLATE
  of "edit":
    result = NAMED_FIELD_EDIT
  of "needsterminal":
    entry.flags.incl(NEEDSTERMINAL)
  of "copiousoutput":
    entry.flags.incl(COPIOUSOUTPUT)
  of "x-htmloutput":
    entry.flags.incl(HTMLOUTPUT)
  else:
    discard
proc consumeField(state: var MailcapParser, entry: var MailcapEntry):
    Result[bool, string] =
  ## Reads one optional field ("flag" or "key=value") of the current entry
  ## and applies it to `entry`.
  ##
  ## Returns ok(true) if the field was terminated by ';' (another field
  ## follows), ok(false) if the line or the input ended, and an error
  ## message if a control character appears in the key or if a key that
  ## needs a value ("test", "nametemplate", "edit") has none.
  state.skipBlanks()
  if not state.has():
    return ok(false)
  var buf = ""
  while state.has():
    let c = state.consume()
    case c
    of ';', '\n':
      if parseFieldKey(entry, buf) != NO_NAMED_FIELD:
        return err("Expected command")
      return ok(c == ';')
    of '\r':
      continue
    of '=':
      let f = parseFieldKey(entry, buf)
      let cmd = ?state.consumeCommand()
      case f
      of NO_NAMED_FIELD:
        discard
      of NAMED_FIELD_TEST:
        entry.test = cmd
      of NAMED_FIELD_NAMETEMPLATE:
        entry.nametemplate = cmd
      of NAMED_FIELD_EDIT:
        entry.edit = cmd
      # consumeCommand pushed back the delimiter it stopped at (if any).
      return ok(state.consume() == ';')
    else:
      if c in Controls:
        return err("Invalid character encountered in field")
      buf &= c
  # The input ended in the middle of a key (e.g. the last line has no
  # trailing newline). Treat this like an end of line so that the key is
  # still applied, rather than falling through with it dropped and an
  # unset result.
  if parseFieldKey(entry, buf) != NO_NAMED_FIELD:
    return err("Expected command")
  return ok(false)
proc parseMailcap*(stream: Stream): Result[Mailcap, string] =
  ## Parses mailcap text from `stream` and returns its entries in file
  ## order, or the first error message produced while parsing a line.
  ##
  ## Lines whose first character is '#' are skipped, as are lines that hold
  ## nothing but blanks.
  var parser = MailcapParser(stream: stream)
  var entries: Mailcap
  while not stream.atEnd():
    let first = parser.consume()
    if first == '#':
      parser.skipLine()
      continue
    parser.reconsume(first)
    parser.skipBlanks()
    let lead = parser.consume()
    if lead in {'\n', '\r'}:
      continue # empty line
    parser.reconsume(lead)
    let fullType = ?parser.consumeTypeField()
    let mainType = fullType.until('/') #TODO this could be more efficient
    let command = ?parser.consumeCommand()
    var entry = MailcapEntry(
      mt: mainType,
      subt: fullType[mainType.len + 1 .. ^1],
      cmd: command
    )
    # consumeCommand pushed back the delimiter it stopped at; a semicolon
    # means optional fields follow.
    if parser.consume() == ';':
      while ?parser.consumeField(entry):
        discard
    entries.add(entry)
  return ok(entries)
# Mostly based on w3m's mailcap quote/unquote
# States of the scanner in unquoteCommand. STATE_NORMAL must stay first: a
# default-initialised UnquoteState variable starts in it.
type UnquoteState = enum
  STATE_NORMAL
  STATE_QUOTED
  STATE_PERC
  STATE_ATTR
  STATE_ATTR_QUOTED
  STATE_DOLLAR
# Pairs an unquoted command with a `canpipe` flag.
type UnquoteResult* = object
  canpipe*: bool
  cmd*: string
# Shell quoting context at some position in a command: outside quotes,
# inside double quotes, or inside single quotes.
type QuoteState = enum
  QS_NORMAL
  QS_DQUOTED
  QS_SQUOTED
proc quoteFile(file: string, qs: QuoteState): string =
  ## Escapes `file` so that it can be inserted into a shell command at a
  ## position whose quoting context is `qs`.
  ##
  ## * `$`, backquote, `"` and backslash get a backslash unless inside
  ##   single quotes.
  ## * A single quote becomes `'\''` inside single quotes, gets a backslash
  ##   outside quotes, and is left alone inside double quotes.
  ## * `_`, `.`, `:` and `/` are never escaped.
  ## * Any other character not in AsciiAlpha gets a backslash outside
  ##   quotes only.
  result = ""
  for ch in file:
    if ch in {'$', '`', '"', '\\'}:
      if qs != QS_SQUOTED:
        result &= '\\'
    elif ch == '\'':
      case qs
      of QS_SQUOTED:
        # Close the quote and emit an escaped quote; appending `ch` below
        # re-opens the quote.
        result &= "'\\'"
      of QS_NORMAL:
        result &= '\\'
      of QS_DQUOTED:
        discard
    elif ch notin {'_', '.', ':', '/'}:
      if qs == QS_NORMAL and ch notin AsciiAlpha:
        result &= '\\'
    result &= ch
proc unquoteCommand*(ecmd, contentType, outpath: string, url: URL,
    charset: Charset, canpipe: var bool): string =
  ## Expands the %-sequences of the mailcap command template `ecmd` and
  ## returns the resulting shell command. Every inserted value is escaped
  ## with `quoteFile` for the quoting context it lands in.
  ##
  ## * `%%` inserts a literal percent sign.
  ## * `%s` inserts `outpath` and sets `canpipe` to false.
  ## * `%t` inserts `contentType` up to its first ';'.
  ## * `%u` inserts `$url` (extension).
  ## * `%{name}` inserts the content type parameter `name`; `%{charset}`
  ##   inserts `$charset` instead.
  ## * Any other character after `%` is dropped.
  ## * A backslash is dropped and the character after it is copied as is.
  ##
  ## `canpipe` is only ever set to false here; callers initialise it.
  var cmd = ""
  var attrname = ""
  var state: UnquoteState
  var qss = @[QS_NORMAL] # quote state stack; never empty (len >= 1)
  template qs: var QuoteState = qss[^1]
  for c in ecmd:
    case state
    of STATE_QUOTED:
      cmd &= c
      state = STATE_NORMAL
    of STATE_ATTR_QUOTED:
      attrname &= c.toLowerAscii()
      state = STATE_ATTR
    of STATE_NORMAL, STATE_DOLLAR:
      let prev_dollar = state == STATE_DOLLAR
      state = STATE_NORMAL
      case c
      of '%':
        state = STATE_PERC
      of '\\':
        state = STATE_QUOTED
      of '\'':
        if qs == QS_SQUOTED:
          qs = QS_NORMAL
        else:
          qs = QS_SQUOTED
        cmd &= c
      of '"':
        if qs == QS_DQUOTED:
          qs = QS_NORMAL
        else:
          qs = QS_DQUOTED
        cmd &= c
      of '$':
        if qs != QS_SQUOTED:
          state = STATE_DOLLAR
        cmd &= c
      of '(':
        # "$(" opens a command substitution with its own quoting context.
        if prev_dollar:
          qss.add(QS_NORMAL)
        cmd &= c
      of ')':
        if qs != QS_SQUOTED:
          if qss.len > 1:
            qss.setLen(qss.len - 1)
          else:
            # mismatched parens; probably an invalid shell command...
            qss[0] = QS_NORMAL
        cmd &= c
      else:
        cmd &= c
    of STATE_PERC:
      if c == '%':
        cmd &= c
      elif c == 's':
        cmd &= quoteFile(outpath, qs)
        canpipe = false
      elif c == 't':
        cmd &= quoteFile(contentType.until(';'), qs)
      elif c == 'u': # extension
        cmd &= quoteFile($url, qs)
      elif c == '{':
        state = STATE_ATTR
        continue # skip the reset to STATE_NORMAL below
      state = STATE_NORMAL
    of STATE_ATTR:
      if c == '}':
        if attrname == "charset":
          cmd &= quoteFile($charset, qs)
        else:
          #TODO this is broken, because content-type is stripped of ; fields
          let kvs = contentType.after(';').toLowerAscii()
          var i = kvs.find(attrname)
          var s = ""
          if i != -1 and kvs.len > i + attrname.len and
              kvs[i + attrname.len] == '=':
            i = skipBlanks(kvs, i + attrname.len + 1)
            var q = false
            for j in i ..< kvs.len:
              if q:
                # Escaped character: take it literally, then end the
                # escape so later delimiters are recognised again.
                s &= kvs[j]
                q = false
              elif kvs[j] == '\\':
                q = true
              elif kvs[j] == ';' or kvs[j] in AsciiWhitespace:
                break
              else:
                s &= kvs[j]
          cmd &= quoteFile(s, qs)
        # The closing brace ends the attribute in both branches: clear the
        # name and resume normal scanning, otherwise the rest of the
        # command would be swallowed into `attrname`.
        attrname = ""
        state = STATE_NORMAL
      elif c == '\\':
        state = STATE_ATTR_QUOTED
      else:
        # Lowercased like the escaped path above; the name is compared
        # against lowercased text.
        attrname &= c.toLowerAscii()
  return cmd
proc unquoteCommand*(ecmd, contentType, outpath: string, url: URL,
    charset: Charset): string =
  ## Convenience overload for callers that have no use for the `canpipe`
  ## output: expands `ecmd` exactly like the six-argument version and
  ## discards the flag.
  var ignored = false
  result = unquoteCommand(ecmd, contentType, outpath, url, charset, ignored)
proc getMailcapEntry*(mailcap: Mailcap, mimeType, outpath: string,
    url: URL, charset: Charset): ptr MailcapEntry =
  ## Returns a pointer to the first entry of `mailcap` that applies to
  ## `mimeType`, or nil if there is none or `mimeType` has no subtype.
  ##
  ## An entry applies when its type and subtype each equal the
  ## corresponding part of `mimeType` or are the wildcard "*", and, if it
  ## has a `test` command, that command (unquoted and run with execCmd)
  ## exits with status 0.
  ##
  ## NOTE(review): the pointer is taken from the loop variable with
  ## unsafeAddr; presumably it aliases the element stored in `mailcap`, so
  ## the caller must keep `mailcap` alive and unmodified while using it --
  ## confirm.
  let mainType = mimeType.until('/')
  if mimeType.len <= mainType.len + 1:
    return nil
  let subType = mimeType[mainType.len + 1 .. ^1]
  for entry in mailcap:
    let typeMatches = entry.mt == "*" or entry.mt == mainType
    let subtypeMatches = entry.subt == "*" or entry.subt == subType
    if not (typeMatches and subtypeMatches):
      continue
    if entry.test != "":
      var canpipe = true
      let testCmd = unquoteCommand(entry.test, mimeType, outpath, url,
        charset, canpipe)
      #TODO TODO TODO if not canpipe ...
      if execCmd(testCmd) != 0:
        continue
    return unsafeAddr entry
  return nil
|