Nimitai is a compile-time parser generator for binary data. It transforms JSON objects into parsing procedures.
Each input object should describe a binary format according to Kaitai Struct conventions.
Exported symbol | Production |
---|---|
macro injectParser(spec: static[JsonNode]) |
static library (compile time code embedding) |
proc createDynlib(spec: JsonNode, path: string) |
dynamic library |
proc outputModule(spec: JsonNode): string |
nim module (source code) |
The project is stalled indefinitely because Kaitai Struct semantics are not idiomatic for Nim and therefore it is not worth the effort (there are better native solutions; see binaryparse)
Being ubiquitous and easily parsable, JSON is a great base format, and there is even a CT parser in Nim stdlib. However, writing in JSON is not appealing at all. Luckily there are a couple of nice JSON superset, and nimitai can work in conjuction with any CT parser that outputs JsonNode
. The end-goal is to use nimitai alongside a YAML compiler in order to leverage the excellent Kaitai Struct IDE. Sadly, we don't have one that works at compile-time yet. The plan is to refactor NimYAML. Nevertheless, nimitai can progress independently.
Pluggable spec-as-compiler: Instead of being an external compiler, nimitai is a CT library which means you don't have to mess with makefiles or similar mechanisms - everything is done within the language. The moment you tweak your spec, your project that links to it has a brand new compiler! No scripts needed at all.
buffered_struct.nim (...)
import json, nimitai, nimitai/runtime
injectParser(parseJson(readFile"buffered_struct.json"))
buffered_struct.json
{
"meta": {
"id": "buffered_struct",
"endian": "le"
},
"seq": [
{
"id": "len1",
"type": "u4"
},
{
"id": "block1",
"type": "block",
"size": "len1"
},
{
"id": "len2",
"type": "u4"
},
{
"id": "block2",
"type": "block",
"size": "len2"
},
{
"id": "finisher",
"type": "u4"
}
],
"types": {
"block": {
"seq": [
{
"id": "number1",
"type": "u4"
},
{
"id": "number2",
"type": "u4"
}
]
}
}
}
generated code
type
Buffered_struct* = ref object of KaitaiStruct
parent*: KaitaiStruct
len1*: uint32
block1*: Buffered_structBlock
block1Io: KaitaiStream
block1Raw: seq[byte]
len2*: uint32
block2*: Buffered_structBlock
block2Io: KaitaiStream
block2Raw: seq[byte]
finisher*: uint32
Buffered_structBlock* = ref object of KaitaiStruct
parent*: Buffered_struct
number1*: uint32
number2*: uint32
proc read*(_: typedesc[Buffered_structBlock]; io: KaitaiStream;
root: KaitaiStruct; parent: Buffered_struct): Buffered_structBlock
proc read*(_: typedesc[Buffered_struct]; io: KaitaiStream; root: KaitaiStruct;
parent: KaitaiStruct): Buffered_struct
proc read*(_: typedesc[Buffered_structBlock]; io: KaitaiStream;
root: KaitaiStruct; parent: Buffered_struct): Buffered_structBlock =
template this(): untyped =
result
this = Buffered_structBlock(io: io, parent: parent)
this.root = if root == nil: this else: root
this.number1 = readu4le(this.io)
this.number2 = readu4le(this.io)
proc read*(_: typedesc[Buffered_struct]; io: KaitaiStream; root: KaitaiStruct;
parent: KaitaiStruct): Buffered_struct =
template this(): untyped =
result
this = Buffered_struct(io: io, parent: parent)
this.root = if root == nil: this else: root
this.len1 = readu4le(this.io)
this.block1Raw = readBytes(this.io, int(this.len1))
this.block1Io = newKaitaiStream(this.block1Raw)
this.block1 = Buffered_structBlock.read(this.block1io, this.root, this)
this.len2 = readu4le(this.io)
this.block2Raw = readBytes(this.io, int(this.len2))
this.block2Io = newKaitaiStream(this.block2Raw)
this.block2 = Buffered_structBlock.read(this.block2io, this.root, this)
this.finisher = readu4le(this.io)
proc fromFile*(_: typedesc[Buffered_structBlock]; filename: string): Buffered_structBlock =
read(Buffered_structBlock, newKaitaiFileStream(filename), nil, nil)
proc fromFile*(_: typedesc[Buffered_struct]; filename: string): Buffered_struct =
read(Buffered_struct, newKaitaiFileStream(filename), nil, nil)
(...) buffered_struct.nim
let x = BufferedStruct.fromFile("buffered_struct.bin")
echo "Block1, number1: " & toHex(x.block1.number1.int64, 2)
echo "Block1, number2: " & toHex(x.block1.number2.int64, 2)
echo "Block2, number1: " & toHex(x.block2.number1.int64, 2)
echo "Block2, number2: " & toHex(x.block2.number2.int64, 2)
buffered_struct.bin (hex view)
10 00 00 00 42 00 00 00 43 00 00 00 ff ff ff ff
ff ff ff ff 08 00 00 00 44 00 00 00 45 00 00 00
ee 00 00 00
output:
Block1, number1: 42
Block1, number2: 43
Block2, number1: 44
Block2, number2: 45