mirror of
git://jb55.com/damus
synced 2024-09-30 00:40:45 +00:00
ndb: fix iterators, pack id tags, more tests
This commit is contained in:
parent
1a33d639ed
commit
e34351ca37
@ -75,6 +75,7 @@
|
||||
4C285C8A2838B985008A31F1 /* ProfilePictureSelector.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4C285C892838B985008A31F1 /* ProfilePictureSelector.swift */; };
|
||||
4C285C8C28398BC7008A31F1 /* Keys.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4C285C8B28398BC6008A31F1 /* Keys.swift */; };
|
||||
4C285C8E28399BFE008A31F1 /* SaveKeysView.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4C285C8D28399BFD008A31F1 /* SaveKeysView.swift */; };
|
||||
4C28A4122A6D03D200C1A7A5 /* ReferencedId.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4C28A4112A6D03D200C1A7A5 /* ReferencedId.swift */; };
|
||||
4C2CDDF7299D4A5E00879FD5 /* Debouncer.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4C2CDDF6299D4A5E00879FD5 /* Debouncer.swift */; };
|
||||
4C30AC7229A5677A00E2BD5A /* NotificationsView.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4C30AC7129A5677A00E2BD5A /* NotificationsView.swift */; };
|
||||
4C30AC7429A5680900E2BD5A /* EventGroupView.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4C30AC7329A5680900E2BD5A /* EventGroupView.swift */; };
|
||||
@ -527,6 +528,7 @@
|
||||
4C285C892838B985008A31F1 /* ProfilePictureSelector.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = ProfilePictureSelector.swift; sourceTree = "<group>"; };
|
||||
4C285C8B28398BC6008A31F1 /* Keys.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = Keys.swift; sourceTree = "<group>"; };
|
||||
4C285C8D28399BFD008A31F1 /* SaveKeysView.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = SaveKeysView.swift; sourceTree = "<group>"; };
|
||||
4C28A4112A6D03D200C1A7A5 /* ReferencedId.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = ReferencedId.swift; sourceTree = "<group>"; };
|
||||
4C2CDDF6299D4A5E00879FD5 /* Debouncer.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = Debouncer.swift; sourceTree = "<group>"; };
|
||||
4C30AC7129A5677A00E2BD5A /* NotificationsView.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = NotificationsView.swift; sourceTree = "<group>"; };
|
||||
4C30AC7329A5680900E2BD5A /* EventGroupView.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = EventGroupView.swift; sourceTree = "<group>"; };
|
||||
@ -1215,6 +1217,7 @@
|
||||
4C3BEFD32819DE8F00B3DE84 /* NostrKind.swift */,
|
||||
4C363A8F28247A1D006E126D /* NostrLink.swift */,
|
||||
50088DA029E8271A008A1FDF /* WebSocket.swift */,
|
||||
4C28A4112A6D03D200C1A7A5 /* ReferencedId.swift */,
|
||||
);
|
||||
path = Nostr;
|
||||
sourceTree = "<group>";
|
||||
@ -1919,6 +1922,7 @@
|
||||
4C363AA228296A7E006E126D /* SearchView.swift in Sources */,
|
||||
4CC7AAED297F0B9E00430951 /* Highlight.swift in Sources */,
|
||||
4CA927652A290F1A0098A105 /* TimeDot.swift in Sources */,
|
||||
4C28A4122A6D03D200C1A7A5 /* ReferencedId.swift in Sources */,
|
||||
4CC6193A29DC777C006A86D1 /* RelayBootstrap.swift in Sources */,
|
||||
4C285C8A2838B985008A31F1 /* ProfilePictureSelector.swift in Sources */,
|
||||
4CFD502F2A2DA45800A229DB /* MediaView.swift in Sources */,
|
||||
|
@ -20,32 +20,6 @@ enum ValidationResult: Decodable {
|
||||
case bad_sig
|
||||
}
|
||||
|
||||
struct ReferencedId: Identifiable, Hashable, Equatable {
|
||||
let ref_id: String
|
||||
let relay_id: String?
|
||||
let key: String
|
||||
|
||||
var id: String {
|
||||
return ref_id
|
||||
}
|
||||
|
||||
static func q(_ id: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: id, relay_id: relay_id, key: "q")
|
||||
}
|
||||
|
||||
static func e(_ id: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: id, relay_id: relay_id, key: "e")
|
||||
}
|
||||
|
||||
static func p(_ pk: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: pk, relay_id: relay_id, key: "p")
|
||||
}
|
||||
|
||||
static func t(_ hashtag: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: hashtag, relay_id: relay_id, key: "t")
|
||||
}
|
||||
}
|
||||
|
||||
class NostrEvent: Codable, Identifiable, CustomStringConvertible, Equatable, Hashable, Comparable {
|
||||
// TODO: memory mapped db events
|
||||
/*
|
||||
|
69
damus/Nostr/ReferencedId.swift
Normal file
69
damus/Nostr/ReferencedId.swift
Normal file
@ -0,0 +1,69 @@
|
||||
//
|
||||
// ReferencedId.swift
|
||||
// damus
|
||||
//
|
||||
// Created by William Casarin on 2023-07-22.
|
||||
//
|
||||
|
||||
import Foundation
|
||||
|
||||
struct Reference {
|
||||
let key: AsciiCharacter
|
||||
let id: NdbTagElem
|
||||
|
||||
func to_referenced_id() -> ReferencedId {
|
||||
ReferencedId(ref_id: id.string(), relay_id: nil, key: key.string)
|
||||
}
|
||||
}
|
||||
|
||||
struct References: Sequence, IteratorProtocol {
|
||||
let note: NdbNote
|
||||
var tags: TagsIterator
|
||||
|
||||
mutating func next() -> Reference? {
|
||||
while let tag = tags.next() {
|
||||
guard let key = tag[0], key.count == 1,
|
||||
let id = tag[1], id.is_id
|
||||
else { continue }
|
||||
|
||||
for c in key {
|
||||
guard let a = AsciiCharacter(c) else { break }
|
||||
return Reference(key: a, id: id)
|
||||
}
|
||||
}
|
||||
|
||||
return nil
|
||||
}
|
||||
|
||||
init(note: NdbNote) {
|
||||
self.note = note
|
||||
self.tags = note.tags().makeIterator()
|
||||
}
|
||||
}
|
||||
|
||||
struct ReferencedId: Identifiable, Hashable, Equatable {
|
||||
let ref_id: String
|
||||
let relay_id: String?
|
||||
let key: String
|
||||
|
||||
var id: String {
|
||||
return ref_id
|
||||
}
|
||||
|
||||
static func q(_ id: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: id, relay_id: relay_id, key: "q")
|
||||
}
|
||||
|
||||
static func e(_ id: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: id, relay_id: relay_id, key: "e")
|
||||
}
|
||||
|
||||
static func p(_ pk: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: pk, relay_id: relay_id, key: "p")
|
||||
}
|
||||
|
||||
static func t(_ hashtag: String, relay_id: String? = nil) -> ReferencedId {
|
||||
return ReferencedId(ref_id: hashtag, relay_id: relay_id, key: "t")
|
||||
}
|
||||
}
|
||||
|
@ -7,18 +7,42 @@
|
||||
|
||||
import Foundation
|
||||
|
||||
struct NdbNote {
|
||||
// we can have owned notes, but we can also have lmdb virtual-memory mapped notes so its optional
|
||||
private var owned: Data?
|
||||
let note: UnsafeMutablePointer<ndb_note>
|
||||
|
||||
init(note: UnsafeMutablePointer<ndb_note>, data: Data?) {
|
||||
self.note = note
|
||||
self.owned = data
|
||||
struct NdbStr {
|
||||
let note: NdbNote
|
||||
let str: UnsafePointer<CChar>
|
||||
}
|
||||
|
||||
struct NdbId {
|
||||
let note: NdbNote
|
||||
let id: Data
|
||||
}
|
||||
|
||||
enum NdbData {
|
||||
case id(NdbId)
|
||||
case str(NdbStr)
|
||||
|
||||
init(note: NdbNote, str: ndb_str) {
|
||||
guard str.flag == NDB_PACKED_ID else {
|
||||
self = .str(NdbStr(note: note, str: str.str))
|
||||
return
|
||||
}
|
||||
|
||||
var owned_size: Int? {
|
||||
return owned?.count
|
||||
let buffer = UnsafeBufferPointer(start: str.id, count: 32)
|
||||
self = .id(NdbId(note: note, id: Data(buffer: buffer)))
|
||||
}
|
||||
}
|
||||
|
||||
class NdbNote {
|
||||
// we can have owned notes, but we can also have lmdb virtual-memory mapped notes so its optional
|
||||
private let owned: Bool
|
||||
let count: Int
|
||||
let note: UnsafeMutablePointer<ndb_note>
|
||||
|
||||
init(note: UnsafeMutablePointer<ndb_note>, owned_size: Int?) {
|
||||
self.note = note
|
||||
self.owned = owned_size != nil
|
||||
self.count = owned_size ?? 0
|
||||
}
|
||||
|
||||
var content: String {
|
||||
@ -33,10 +57,12 @@ struct NdbNote {
|
||||
ndb_note_content_length(note)
|
||||
}
|
||||
|
||||
/// These are unsafe if working on owned data and if this outlives the NdbNote
|
||||
var id: Data {
|
||||
Data(buffer: UnsafeBufferPointer(start: ndb_note_id(note), count: 32))
|
||||
}
|
||||
|
||||
/// Make a copy if this outlives the note and the note has owned data!
|
||||
var pubkey: Data {
|
||||
Data(buffer: UnsafeBufferPointer(start: ndb_note_pubkey(note), count: 32))
|
||||
}
|
||||
@ -53,21 +79,30 @@ struct NdbNote {
|
||||
return .init(note: self)
|
||||
}
|
||||
|
||||
deinit {
|
||||
if self.owned {
|
||||
free(note)
|
||||
}
|
||||
}
|
||||
|
||||
static func owned_from_json(json: String, bufsize: Int = 2 << 18) -> NdbNote? {
|
||||
var data = Data(capacity: bufsize)
|
||||
let data = malloc(bufsize)
|
||||
guard var json_cstr = json.cString(using: .utf8) else { return nil }
|
||||
|
||||
var note: UnsafeMutablePointer<ndb_note>?
|
||||
|
||||
let len = data.withUnsafeMutableBytes { (bytes: UnsafeMutableRawBufferPointer) in
|
||||
return ndb_note_from_json(&json_cstr, Int32(json_cstr.count), ¬e, bytes.baseAddress, Int32(bufsize))
|
||||
let len = ndb_note_from_json(&json_cstr, Int32(json_cstr.count), ¬e, data, Int32(bufsize))
|
||||
|
||||
if len == 0 {
|
||||
free(data)
|
||||
return nil
|
||||
}
|
||||
|
||||
guard let note else { return nil }
|
||||
|
||||
// Create new Data with just the valid bytes
|
||||
let smol_data = Data(bytes: ¬e.pointee, count: Int(len))
|
||||
return NdbNote(note: note, data: smol_data)
|
||||
guard let note_data = realloc(data, Int(len)) else { return nil }
|
||||
|
||||
let new_note = note_data.assumingMemoryBound(to: ndb_note.self)
|
||||
return NdbNote(note: new_note, owned_size: Int(len))
|
||||
}
|
||||
}
|
||||
|
||||
@ -99,20 +134,35 @@ extension NdbNote {
|
||||
return parse_note_content_ndb(note: self)
|
||||
}
|
||||
|
||||
/*
|
||||
|
||||
func get_inner_event(cache: EventCache) -> NostrEvent? {
|
||||
guard self.known_kind == .boost else {
|
||||
return nil
|
||||
}
|
||||
|
||||
if self.content == "", let ref = self.referenced_ids.first {
|
||||
return cache.lookup(ref.ref_id)
|
||||
// TODO: raw id cache lookups
|
||||
let id = ref.id.string()
|
||||
return cache.lookup(id)
|
||||
}
|
||||
|
||||
return self.inner_event
|
||||
// TODO: how to handle inner events?
|
||||
return nil
|
||||
//return self.inner_event
|
||||
}
|
||||
|
||||
// TODO: References iterator
|
||||
public var referenced_ids: LazyFilterSequence<References> {
|
||||
References(note: self).lazy
|
||||
.filter() { ref in ref.key == "e" }
|
||||
}
|
||||
|
||||
public var referenced_pubkeys: LazyFilterSequence<References> {
|
||||
References(note: self).lazy
|
||||
.filter() { ref in ref.key == "p" }
|
||||
}
|
||||
|
||||
/*
|
||||
|
||||
func event_refs(_ privkey: String?) -> [EventRef] {
|
||||
if let rs = _event_refs {
|
||||
return rs
|
||||
@ -122,7 +172,6 @@ extension NdbNote {
|
||||
return refs
|
||||
}
|
||||
|
||||
|
||||
func decrypted(privkey: String?) -> String? {
|
||||
if let decrypted_content = decrypted_content {
|
||||
return decrypted_content
|
||||
@ -272,3 +321,9 @@ extension NdbNote {
|
||||
}
|
||||
*/
|
||||
}
|
||||
|
||||
extension LazyFilterSequence {
|
||||
var first: Element? {
|
||||
self.first(where: { _ in true })
|
||||
}
|
||||
}
|
||||
|
@ -7,9 +7,33 @@
|
||||
|
||||
import Foundation
|
||||
|
||||
struct NdbTagElem {
|
||||
private let note: NdbNote
|
||||
private let tag: UnsafeMutablePointer<ndb_tag>
|
||||
struct NdbStrIter: IteratorProtocol {
|
||||
typealias Element = CChar
|
||||
|
||||
var ind: Int
|
||||
let str: ndb_str
|
||||
let tag: NdbTagElem // stored for lifetime reasons
|
||||
|
||||
mutating func next() -> CChar? {
|
||||
let c = str.str[ind]
|
||||
if (c != 0) {
|
||||
ind += 1
|
||||
return c
|
||||
}
|
||||
|
||||
return nil
|
||||
}
|
||||
|
||||
init(tag: NdbTagElem) {
|
||||
self.str = ndb_tag_str(tag.note.note, tag.tag, tag.index)
|
||||
self.ind = 0
|
||||
self.tag = tag
|
||||
}
|
||||
}
|
||||
|
||||
struct NdbTagElem: Sequence {
|
||||
let note: NdbNote
|
||||
let tag: UnsafeMutablePointer<ndb_tag>
|
||||
let index: Int32
|
||||
|
||||
init(note: NdbNote, tag: UnsafeMutablePointer<ndb_tag>, index: Int32) {
|
||||
@ -18,12 +42,44 @@ struct NdbTagElem {
|
||||
self.index = index
|
||||
}
|
||||
|
||||
var is_id: Bool {
|
||||
return ndb_tag_str(note.note, tag, index).flag == NDB_PACKED_ID
|
||||
}
|
||||
|
||||
var count: Int {
|
||||
let r = ndb_tag_str(note.note, tag, index)
|
||||
if r.flag == NDB_PACKED_ID {
|
||||
return 32
|
||||
} else {
|
||||
return strlen(r.str)
|
||||
}
|
||||
}
|
||||
|
||||
func matches_char(_ c: AsciiCharacter) -> Bool {
|
||||
return ndb_tag_matches_char(note.note, tag, index, c.cchar) == 1
|
||||
}
|
||||
|
||||
func data() -> NdbData {
|
||||
let s = ndb_tag_str(note.note, tag, index)
|
||||
return NdbData(note: note, str: s)
|
||||
}
|
||||
|
||||
func id() -> Data? {
|
||||
guard case .id(let id) = self.data() else { return nil }
|
||||
return id.id
|
||||
}
|
||||
|
||||
func string() -> String {
|
||||
return String(cString: ndb_tag_str(note.note, tag, index), encoding: .utf8) ?? ""
|
||||
switch self.data() {
|
||||
case .id(let id):
|
||||
return hex_encode(id.id)
|
||||
case .str(let s):
|
||||
return String(cString: s.str, encoding: .utf8) ?? ""
|
||||
}
|
||||
}
|
||||
|
||||
func makeIterator() -> NdbStrIter {
|
||||
return NdbStrIter(tag: self)
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -16,9 +16,7 @@ struct TagSequence: Sequence {
|
||||
}
|
||||
|
||||
subscript(index: Int) -> NdbTagElem? {
|
||||
if index >= tag.pointee.count {
|
||||
return nil
|
||||
}
|
||||
guard index < count else { return nil }
|
||||
|
||||
return NdbTagElem(note: note, tag: tag, index: Int32(index))
|
||||
}
|
||||
@ -40,14 +38,6 @@ struct TagIterator: IteratorProtocol {
|
||||
return el
|
||||
}
|
||||
|
||||
subscript(index: Int) -> NdbTagElem? {
|
||||
if index >= tag.pointee.count {
|
||||
return nil
|
||||
}
|
||||
|
||||
return NdbTagElem(note: note, tag: tag, index: Int32(index))
|
||||
}
|
||||
|
||||
var index: Int32
|
||||
let note: NdbNote
|
||||
var tag: UnsafeMutablePointer<ndb_tag>
|
||||
@ -62,10 +52,3 @@ struct TagIterator: IteratorProtocol {
|
||||
self.index = 0
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
func ndb_maybe_pointee<T>(_ p: UnsafeMutablePointer<T>!) -> T? {
|
||||
guard p != nil else { return nil }
|
||||
return p.pointee
|
||||
}
|
||||
|
||||
|
@ -15,24 +15,22 @@ struct TagsIterator: IteratorProtocol {
|
||||
var note: NdbNote
|
||||
|
||||
mutating func next() -> TagSequence? {
|
||||
guard !done else { return nil }
|
||||
guard ndb_tags_iterate_next(&self.iter) == 1 else {
|
||||
done = true
|
||||
return nil
|
||||
}
|
||||
|
||||
let tag_seq = TagSequence(note: note, tag: self.iter.tag)
|
||||
|
||||
let ok = ndb_tags_iterate_next(&self.iter)
|
||||
done = ok == 0
|
||||
|
||||
return tag_seq
|
||||
return TagSequence(note: note, tag: self.iter.tag)
|
||||
}
|
||||
|
||||
var count: UInt16 {
|
||||
return iter.tag.pointee.count
|
||||
return note.note.pointee.tags.count
|
||||
}
|
||||
|
||||
init(note: NdbNote) {
|
||||
self.iter = ndb_iterator()
|
||||
let res = ndb_tags_iterate_start(note.note, &self.iter)
|
||||
self.done = res == 0
|
||||
ndb_tags_iterate_start(note.note, &self.iter)
|
||||
self.done = false
|
||||
self.note = note
|
||||
}
|
||||
}
|
||||
@ -44,6 +42,9 @@ struct TagsSequence: Sequence {
|
||||
note.note.pointee.tags.count
|
||||
}
|
||||
|
||||
// no O(1) indexing on top-level tag lists unfortunately :(
|
||||
// bit it's very fast to iterate over each tag since the number of tags
|
||||
// are stored and the elements are fixed size.
|
||||
subscript(index: Int) -> Iterator.Element? {
|
||||
var i = 0
|
||||
for element in self {
|
||||
|
@ -28,25 +28,74 @@ final class NdbTests: XCTestCase {
|
||||
XCTAssertEqual(hex_encode(note.id), id)
|
||||
XCTAssertEqual(hex_encode(note.pubkey), pubkey)
|
||||
|
||||
XCTAssertEqual(note.owned_size, 59062)
|
||||
XCTAssertEqual(note.count, 34058)
|
||||
XCTAssertEqual(note.kind, 3)
|
||||
XCTAssertEqual(note.created_at, 1689904312)
|
||||
XCTAssertEqual(note.tags().reduce(0, { sum, _ in sum + 1 }), 786)
|
||||
|
||||
let expected_count: UInt16 = 786
|
||||
XCTAssertEqual(note.tags().count, expected_count)
|
||||
XCTAssertEqual(note.tags().reduce(0, { sum, _ in sum + 1 }), expected_count)
|
||||
|
||||
var count = 0
|
||||
var tags = 0
|
||||
var total_count_stored = 0
|
||||
var total_count_iter = 0
|
||||
//let tags = note.tags()
|
||||
for tag in note.tags() {
|
||||
total_count_stored += Int(tag.count)
|
||||
|
||||
if tags == 0 || tags == 1 || tags == 2 {
|
||||
XCTAssertEqual(tag.count, 3)
|
||||
}
|
||||
|
||||
if tags == 6 {
|
||||
XCTAssertEqual(tag.count, 2)
|
||||
}
|
||||
|
||||
if tags == 7 {
|
||||
XCTAssertEqual(tag[2]?.string(), "wss://nostr-pub.wellorder.net")
|
||||
}
|
||||
|
||||
for elem in tag {
|
||||
print("test_ndb_iterator \(elem.string())")
|
||||
}
|
||||
print("tag[\(tags)][\(elem.index)]")
|
||||
total_count_iter += 1
|
||||
}
|
||||
|
||||
tags += 1
|
||||
}
|
||||
|
||||
func testPerformanceExample() throws {
|
||||
XCTAssertEqual(tags, 786)
|
||||
XCTAssertEqual(total_count_stored, total_count_iter)
|
||||
}
|
||||
|
||||
func test_decode_perf() throws {
|
||||
// This is an example of a performance test case.
|
||||
self.measure {
|
||||
// Put the code you want to measure the time of here.
|
||||
_ = NdbNote.owned_from_json(json: test_contact_list_json)
|
||||
}
|
||||
}
|
||||
|
||||
func test_iteration_perf() throws {
|
||||
guard let note = NdbNote.owned_from_json(json: test_contact_list_json) else {
|
||||
XCTAssert(false)
|
||||
return
|
||||
}
|
||||
|
||||
var count = 0
|
||||
for tag in note.tags() {
|
||||
for elem in tag {
|
||||
print("iter_elem \(elem.string())")
|
||||
/*
|
||||
for _ in elem {
|
||||
count += 1
|
||||
}
|
||||
*/
|
||||
}
|
||||
count += 1
|
||||
}
|
||||
|
||||
XCTAssertEqual(count, 786)
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
|
@ -57,24 +57,6 @@ int ndb_builder_new(struct ndb_builder *builder, unsigned char *buf,
|
||||
return 1;
|
||||
}
|
||||
|
||||
/// Check for small strings to pack
|
||||
static inline int ndb_builder_try_compact_str(struct ndb_builder *builder,
|
||||
const char *str, int len,
|
||||
union packed_str *pstr)
|
||||
{
|
||||
if (len == 0) {
|
||||
*pstr = ndb_char_to_packed_str(0);
|
||||
return 1;
|
||||
} else if (len == 1) {
|
||||
*pstr = ndb_char_to_packed_str(str[0]);
|
||||
return 1;
|
||||
} else if (len == 2) {
|
||||
*pstr = ndb_chars_to_packed_str(str[0], str[1]);
|
||||
return 1;
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
||||
static inline int ndb_json_parser_init(struct ndb_json_parser *p,
|
||||
@ -146,7 +128,7 @@ struct ndb_note * ndb_builder_note(struct ndb_builder *builder)
|
||||
/// builder phase just for this purpose.
|
||||
static inline int ndb_builder_find_str(struct ndb_builder *builder,
|
||||
const char *str, int len,
|
||||
union packed_str *pstr)
|
||||
union ndb_packed_str *pstr)
|
||||
{
|
||||
// find existing matching string to avoid duplicate strings
|
||||
int indices = cursor_count(&builder->str_indices, sizeof(uint32_t));
|
||||
@ -165,7 +147,7 @@ static inline int ndb_builder_find_str(struct ndb_builder *builder,
|
||||
}
|
||||
|
||||
static int ndb_builder_push_str(struct ndb_builder *builder, const char *str,
|
||||
int len, union packed_str *pstr)
|
||||
int len, union ndb_packed_str *pstr)
|
||||
{
|
||||
uint32_t loc;
|
||||
|
||||
@ -185,9 +167,52 @@ static int ndb_builder_push_str(struct ndb_builder *builder, const char *str,
|
||||
return 1;
|
||||
}
|
||||
|
||||
static int ndb_builder_push_packed_id(struct ndb_builder *builder,
|
||||
unsigned char *id,
|
||||
union ndb_packed_str *pstr)
|
||||
{
|
||||
if (ndb_builder_find_str(builder, (const char*)id, 32, pstr)) {
|
||||
pstr->packed.flag = NDB_PACKED_ID;
|
||||
return 1;
|
||||
}
|
||||
|
||||
if (ndb_builder_push_str(builder, (const char*)id, 32, pstr)) {
|
||||
pstr->packed.flag = NDB_PACKED_ID;
|
||||
return 1;
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
||||
/// Check for small strings to pack
|
||||
static inline int ndb_builder_try_compact_str(struct ndb_builder *builder,
|
||||
const char *str, int len,
|
||||
union ndb_packed_str *pstr,
|
||||
int pack_ids)
|
||||
{
|
||||
unsigned char id_buf[32];
|
||||
|
||||
if (len == 0) {
|
||||
*pstr = ndb_char_to_packed_str(0);
|
||||
return 1;
|
||||
} else if (len == 1) {
|
||||
*pstr = ndb_char_to_packed_str(str[0]);
|
||||
return 1;
|
||||
} else if (len == 2) {
|
||||
*pstr = ndb_chars_to_packed_str(str[0], str[1]);
|
||||
return 1;
|
||||
} else if (pack_ids && len == 64 && hex_decode(str, 64, id_buf, 32)) {
|
||||
return ndb_builder_push_packed_id(builder, id_buf, pstr);
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
||||
static int ndb_builder_push_unpacked_str(struct ndb_builder *builder,
|
||||
const char *str, int len,
|
||||
union packed_str *pstr)
|
||||
union ndb_packed_str *pstr)
|
||||
{
|
||||
if (ndb_builder_find_str(builder, str, len, pstr))
|
||||
return 1;
|
||||
@ -196,9 +221,9 @@ static int ndb_builder_push_unpacked_str(struct ndb_builder *builder,
|
||||
}
|
||||
|
||||
int ndb_builder_make_str(struct ndb_builder *builder, const char *str, int len,
|
||||
union packed_str *pstr)
|
||||
union ndb_packed_str *pstr, int pack_ids)
|
||||
{
|
||||
if (ndb_builder_try_compact_str(builder, str, len, pstr))
|
||||
if (ndb_builder_try_compact_str(builder, str, len, pstr, pack_ids))
|
||||
return 1;
|
||||
|
||||
return ndb_builder_push_unpacked_str(builder, str, len, pstr);
|
||||
@ -207,8 +232,10 @@ int ndb_builder_make_str(struct ndb_builder *builder, const char *str, int len,
|
||||
int ndb_builder_set_content(struct ndb_builder *builder, const char *content,
|
||||
int len)
|
||||
{
|
||||
int pack_ids = 0;
|
||||
builder->note->content_length = len;
|
||||
return ndb_builder_make_str(builder, content, len, &builder->note->content);
|
||||
return ndb_builder_make_str(builder, content, len,
|
||||
&builder->note->content, pack_ids);
|
||||
}
|
||||
|
||||
|
||||
@ -228,7 +255,7 @@ static inline int toksize(jsmntok_t *tok)
|
||||
}
|
||||
|
||||
static int ndb_builder_finalize_tag(struct ndb_builder *builder,
|
||||
union packed_str offset)
|
||||
union ndb_packed_str offset)
|
||||
{
|
||||
if (!cursor_push_u32(&builder->note_cur, offset.offset))
|
||||
return 0;
|
||||
@ -239,8 +266,8 @@ static int ndb_builder_finalize_tag(struct ndb_builder *builder,
|
||||
/// Unescape and push json strings
|
||||
static int ndb_builder_make_json_str(struct ndb_builder *builder,
|
||||
const char *str, int len,
|
||||
union packed_str *pstr,
|
||||
int *written)
|
||||
union ndb_packed_str *pstr,
|
||||
int *written, int pack_ids)
|
||||
{
|
||||
// let's not care about de-duping these. we should just unescape
|
||||
// in-place directly into the strings table.
|
||||
@ -249,7 +276,7 @@ static int ndb_builder_make_json_str(struct ndb_builder *builder,
|
||||
unsigned char *builder_start;
|
||||
|
||||
// always try compact strings first
|
||||
if (ndb_builder_try_compact_str(builder, str, len, pstr))
|
||||
if (ndb_builder_try_compact_str(builder, str, len, pstr, pack_ids))
|
||||
return 1;
|
||||
|
||||
end = str + len;
|
||||
@ -327,8 +354,9 @@ static int ndb_builder_make_json_str(struct ndb_builder *builder,
|
||||
static int ndb_builder_push_json_tag(struct ndb_builder *builder,
|
||||
const char *str, int len)
|
||||
{
|
||||
union packed_str pstr;
|
||||
if (!ndb_builder_make_json_str(builder, str, len, &pstr, NULL))
|
||||
union ndb_packed_str pstr;
|
||||
int pack_ids = 1;
|
||||
if (!ndb_builder_make_json_str(builder, str, len, &pstr, NULL, pack_ids))
|
||||
return 0;
|
||||
return ndb_builder_finalize_tag(builder, pstr);
|
||||
}
|
||||
@ -474,13 +502,13 @@ int ndb_note_from_json(const char *json, int len, struct ndb_note **note,
|
||||
} else if (jsoneq(json, tok, tok_len, "content")) {
|
||||
// content
|
||||
tok = &parser.toks[i+1];
|
||||
union packed_str pstr;
|
||||
union ndb_packed_str pstr;
|
||||
tok_len = toksize(tok);
|
||||
int written;
|
||||
int written, pack_ids = 0;
|
||||
if (!ndb_builder_make_json_str(&parser.builder,
|
||||
json + tok->start,
|
||||
tok_len, &pstr,
|
||||
&written)) {
|
||||
&written, pack_ids)) {
|
||||
return 0;
|
||||
}
|
||||
parser.builder.note->content_length = written;
|
||||
@ -531,8 +559,9 @@ int ndb_builder_new_tag(struct ndb_builder *builder)
|
||||
inline int ndb_builder_push_tag_str(struct ndb_builder *builder,
|
||||
const char *str, int len)
|
||||
{
|
||||
union packed_str pstr;
|
||||
if (!ndb_builder_make_str(builder, str, len, &pstr))
|
||||
union ndb_packed_str pstr;
|
||||
int pack_ids = 1;
|
||||
if (!ndb_builder_make_str(builder, str, len, &pstr, pack_ids))
|
||||
return 0;
|
||||
return ndb_builder_finalize_tag(builder, pstr);
|
||||
}
|
||||
|
@ -4,25 +4,36 @@
|
||||
#include <inttypes.h>
|
||||
#include "cursor.h"
|
||||
|
||||
struct ndb_str {
|
||||
unsigned char flag;
|
||||
union {
|
||||
const char *str;
|
||||
unsigned char *id;
|
||||
};
|
||||
};
|
||||
|
||||
// these must be byte-aligned, they are directly accessing the serialized data
|
||||
// representation
|
||||
#pragma pack(push, 1)
|
||||
|
||||
union packed_str {
|
||||
uint32_t offset;
|
||||
/// We can store byte data in the string table, so
|
||||
#define NDB_PACKED_STR 0x1
|
||||
#define NDB_PACKED_ID 0x2
|
||||
|
||||
union ndb_packed_str {
|
||||
struct {
|
||||
char str[3];
|
||||
// we assume little endian everywhere. sorry not sorry.
|
||||
unsigned char flag;
|
||||
unsigned char flag; // NDB_PACKED_STR, etc
|
||||
} packed;
|
||||
|
||||
uint32_t offset;
|
||||
unsigned char bytes[4];
|
||||
};
|
||||
|
||||
struct ndb_tag {
|
||||
uint16_t count;
|
||||
union packed_str strs[0];
|
||||
union ndb_packed_str strs[0];
|
||||
};
|
||||
|
||||
struct ndb_tags {
|
||||
@ -41,9 +52,8 @@ struct ndb_note {
|
||||
uint32_t created_at;
|
||||
uint32_t kind;
|
||||
uint32_t content_length;
|
||||
union packed_str content;
|
||||
union ndb_packed_str content;
|
||||
uint32_t strings;
|
||||
uint32_t json;
|
||||
|
||||
// nothing can come after tags since it contains variadic data
|
||||
struct ndb_tags tags;
|
||||
@ -80,39 +90,39 @@ int ndb_builder_new_tag(struct ndb_builder *builder);
|
||||
int ndb_builder_push_tag_str(struct ndb_builder *builder, const char *str, int len);
|
||||
// BYE BUILDER
|
||||
|
||||
static inline int ndb_str_is_packed(union packed_str str)
|
||||
static inline struct ndb_str ndb_note_str(struct ndb_note *note,
|
||||
union ndb_packed_str *pstr)
|
||||
{
|
||||
return (str.offset >> 31) & 0x1;
|
||||
struct ndb_str str;
|
||||
str.flag = pstr->packed.flag;
|
||||
|
||||
if (str.flag == NDB_PACKED_STR) {
|
||||
str.str = pstr->packed.str;
|
||||
return str;
|
||||
}
|
||||
|
||||
str.str = ((const char *)note) + note->strings + (pstr->offset & 0xFFFFFF);
|
||||
return str;
|
||||
}
|
||||
|
||||
|
||||
static inline const char * ndb_note_str(struct ndb_note *note,
|
||||
union packed_str *str)
|
||||
{
|
||||
if (ndb_str_is_packed(*str))
|
||||
return str->packed.str;
|
||||
|
||||
return ((const char *)note) + note->strings + str->offset;
|
||||
}
|
||||
|
||||
static inline const char * ndb_tag_str(struct ndb_note *note,
|
||||
static inline struct ndb_str ndb_tag_str(struct ndb_note *note,
|
||||
struct ndb_tag *tag, int ind)
|
||||
{
|
||||
return ndb_note_str(note, &tag->strs[ind]);
|
||||
}
|
||||
|
||||
static int ndb_tag_matches_char(struct ndb_note *note,
|
||||
static inline int ndb_tag_matches_char(struct ndb_note *note,
|
||||
struct ndb_tag *tag, int ind, char c)
|
||||
{
|
||||
const char *str = ndb_tag_str(note, tag, ind);
|
||||
if (str[0] == '\0')
|
||||
struct ndb_str str = ndb_tag_str(note, tag, ind);
|
||||
if (str.str[0] == '\0')
|
||||
return 0;
|
||||
else if (str[0] == c)
|
||||
else if (str.str[0] == c)
|
||||
return 1;
|
||||
return 0;
|
||||
}
|
||||
|
||||
static inline const char * ndb_iter_tag_str(struct ndb_iterator *iter,
|
||||
static inline struct ndb_str ndb_iter_tag_str(struct ndb_iterator *iter,
|
||||
int ind)
|
||||
{
|
||||
return ndb_tag_str(iter->note, iter->tag, ind);
|
||||
@ -143,9 +153,9 @@ static inline uint32_t ndb_note_kind(struct ndb_note *note)
|
||||
return note->kind;
|
||||
}
|
||||
|
||||
static inline const char * ndb_note_content(struct ndb_note *note)
|
||||
static inline const char *ndb_note_content(struct ndb_note *note)
|
||||
{
|
||||
return ndb_note_str(note, ¬e->content);
|
||||
return ndb_note_str(note, ¬e->content).str;
|
||||
}
|
||||
|
||||
static inline uint32_t ndb_note_content_length(struct ndb_note *note)
|
||||
@ -161,55 +171,50 @@ static inline struct ndb_note * ndb_note_from_bytes(unsigned char *bytes)
|
||||
return note;
|
||||
}
|
||||
|
||||
static inline union packed_str ndb_offset_str(uint32_t offset)
|
||||
static inline union ndb_packed_str ndb_offset_str(uint32_t offset)
|
||||
{
|
||||
// ensure accidents like -1 don't corrupt our packed_str
|
||||
union packed_str str;
|
||||
str.offset = offset & 0x7FFFFFFF;
|
||||
union ndb_packed_str str;
|
||||
// most significant byte is reserved for ndb_packtype
|
||||
str.offset = offset & 0xFFFFFF;
|
||||
return str;
|
||||
}
|
||||
|
||||
static inline union packed_str ndb_char_to_packed_str(char c)
|
||||
static inline union ndb_packed_str ndb_char_to_packed_str(char c)
|
||||
{
|
||||
union packed_str str;
|
||||
str.packed.flag = 0xFF;
|
||||
union ndb_packed_str str;
|
||||
str.packed.flag = NDB_PACKED_STR;
|
||||
str.packed.str[0] = c;
|
||||
str.packed.str[1] = '\0';
|
||||
return str;
|
||||
}
|
||||
|
||||
static inline union packed_str ndb_chars_to_packed_str(char c1, char c2)
|
||||
static inline union ndb_packed_str ndb_chars_to_packed_str(char c1, char c2)
|
||||
{
|
||||
union packed_str str;
|
||||
str.packed.flag = 0xFF;
|
||||
union ndb_packed_str str;
|
||||
str.packed.flag = NDB_PACKED_STR;
|
||||
str.packed.str[0] = c1;
|
||||
str.packed.str[1] = c2;
|
||||
str.packed.str[2] = '\0';
|
||||
return str;
|
||||
}
|
||||
|
||||
static inline const char * ndb_note_tag_index(struct ndb_note *note,
|
||||
struct ndb_tag *tag, int index)
|
||||
{
|
||||
if (index >= tag->count) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
return ndb_note_str(note, &tag->strs[index]);
|
||||
}
|
||||
|
||||
static inline int ndb_tags_iterate_start(struct ndb_note *note,
|
||||
static inline void ndb_tags_iterate_start(struct ndb_note *note,
|
||||
struct ndb_iterator *iter)
|
||||
{
|
||||
iter->note = note;
|
||||
iter->tag = note->tags.tag;
|
||||
iter->index = 0;
|
||||
|
||||
return note->tags.count != 0 && iter->tag->count != 0;
|
||||
iter->tag = NULL;
|
||||
iter->index = -1;
|
||||
}
|
||||
|
||||
static inline int ndb_tags_iterate_next(struct ndb_iterator *iter)
|
||||
{
|
||||
if (iter->tag == NULL || iter->index == -1) {
|
||||
iter->tag = iter->note->tags.tag;
|
||||
iter->index = 0;
|
||||
return iter->note->tags.count != 0;
|
||||
}
|
||||
|
||||
struct ndb_tags *tags = &iter->note->tags;
|
||||
|
||||
if (++iter->index < tags->count) {
|
||||
|
Loading…
Reference in New Issue
Block a user