* Move nquads into quad. * Create cquads simplified parser in quad. * Move Triple (renamed Quad) to quad. Also made sure mongo actually implements BulkLoader.
221 lines
4.9 KiB
Go
221 lines
4.9 KiB
Go
// Copyright 2014 The Cayley Authors. All rights reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package leveldb
|
|
|
|
import (
|
|
"bytes"
|
|
"fmt"
|
|
"strings"
|
|
|
|
ldbit "github.com/syndtr/goleveldb/leveldb/iterator"
|
|
"github.com/syndtr/goleveldb/leveldb/opt"
|
|
|
|
"github.com/google/cayley/graph"
|
|
"github.com/google/cayley/graph/iterator"
|
|
"github.com/google/cayley/quad"
|
|
)
|
|
|
|
type Iterator struct {
|
|
iterator.Base
|
|
nextPrefix []byte
|
|
checkId []byte
|
|
dir quad.Direction
|
|
open bool
|
|
iter ldbit.Iterator
|
|
qs *TripleStore
|
|
ro *opt.ReadOptions
|
|
originalPrefix string
|
|
}
|
|
|
|
func NewIterator(prefix string, d quad.Direction, value graph.Value, qs *TripleStore) *Iterator {
|
|
var it Iterator
|
|
iterator.BaseInit(&it.Base)
|
|
it.checkId = value.([]byte)
|
|
it.dir = d
|
|
it.originalPrefix = prefix
|
|
it.nextPrefix = make([]byte, 0, 2+qs.hasher.Size())
|
|
it.nextPrefix = append(it.nextPrefix, []byte(prefix)...)
|
|
it.nextPrefix = append(it.nextPrefix, []byte(it.checkId[1:])...)
|
|
it.ro = &opt.ReadOptions{}
|
|
it.ro.DontFillCache = true
|
|
it.iter = qs.db.NewIterator(nil, it.ro)
|
|
it.open = true
|
|
it.qs = qs
|
|
ok := it.iter.Seek(it.nextPrefix)
|
|
if !ok {
|
|
it.open = false
|
|
it.iter.Release()
|
|
}
|
|
return &it
|
|
}
|
|
|
|
func (it *Iterator) Reset() {
|
|
if !it.open {
|
|
it.iter = it.qs.db.NewIterator(nil, it.ro)
|
|
it.open = true
|
|
}
|
|
ok := it.iter.Seek(it.nextPrefix)
|
|
if !ok {
|
|
it.open = false
|
|
it.iter.Release()
|
|
}
|
|
}
|
|
|
|
func (it *Iterator) Clone() graph.Iterator {
|
|
out := NewIterator(it.originalPrefix, it.dir, it.checkId, it.qs)
|
|
out.CopyTagsFrom(it)
|
|
return out
|
|
}
|
|
|
|
func (it *Iterator) Close() {
|
|
if it.open {
|
|
it.iter.Release()
|
|
it.open = false
|
|
}
|
|
}
|
|
|
|
func (it *Iterator) Next() (graph.Value, bool) {
|
|
if it.iter == nil {
|
|
it.Last = nil
|
|
return nil, false
|
|
}
|
|
if !it.open {
|
|
it.Last = nil
|
|
return nil, false
|
|
}
|
|
if !it.iter.Valid() {
|
|
it.Last = nil
|
|
it.Close()
|
|
return nil, false
|
|
}
|
|
if bytes.HasPrefix(it.iter.Key(), it.nextPrefix) {
|
|
out := make([]byte, len(it.iter.Key()))
|
|
copy(out, it.iter.Key())
|
|
it.Last = out
|
|
ok := it.iter.Next()
|
|
if !ok {
|
|
it.Close()
|
|
}
|
|
return out, true
|
|
}
|
|
it.Close()
|
|
it.Last = nil
|
|
return nil, false
|
|
}
|
|
|
|
func PositionOf(prefix []byte, d quad.Direction, qs *TripleStore) int {
|
|
if bytes.Equal(prefix, []byte("sp")) {
|
|
switch d {
|
|
case quad.Subject:
|
|
return 2
|
|
case quad.Predicate:
|
|
return qs.hasher.Size() + 2
|
|
case quad.Object:
|
|
return 2*qs.hasher.Size() + 2
|
|
case quad.Provenance:
|
|
return -1
|
|
}
|
|
}
|
|
if bytes.Equal(prefix, []byte("po")) {
|
|
switch d {
|
|
case quad.Subject:
|
|
return 2*qs.hasher.Size() + 2
|
|
case quad.Predicate:
|
|
return 2
|
|
case quad.Object:
|
|
return qs.hasher.Size() + 2
|
|
case quad.Provenance:
|
|
return -1
|
|
}
|
|
}
|
|
if bytes.Equal(prefix, []byte("os")) {
|
|
switch d {
|
|
case quad.Subject:
|
|
return qs.hasher.Size() + 2
|
|
case quad.Predicate:
|
|
return 2*qs.hasher.Size() + 2
|
|
case quad.Object:
|
|
return 2
|
|
case quad.Provenance:
|
|
return -1
|
|
}
|
|
}
|
|
if bytes.Equal(prefix, []byte("cp")) {
|
|
switch d {
|
|
case quad.Subject:
|
|
return 2*qs.hasher.Size() + 2
|
|
case quad.Predicate:
|
|
return qs.hasher.Size() + 2
|
|
case quad.Object:
|
|
return 3*qs.hasher.Size() + 2
|
|
case quad.Provenance:
|
|
return 2
|
|
}
|
|
}
|
|
panic("unreachable")
|
|
}
|
|
|
|
func (it *Iterator) Check(v graph.Value) bool {
|
|
val := v.([]byte)
|
|
if val[0] == 'z' {
|
|
return false
|
|
}
|
|
offset := PositionOf(val[0:2], it.dir, it.qs)
|
|
if offset != -1 {
|
|
if bytes.HasPrefix(val[offset:], it.checkId[1:]) {
|
|
return true
|
|
}
|
|
} else {
|
|
nameForDir := it.qs.Quad(v).Get(it.dir)
|
|
hashForDir := it.qs.ValueOf(nameForDir).([]byte)
|
|
if bytes.Equal(hashForDir, it.checkId) {
|
|
return true
|
|
}
|
|
}
|
|
return false
|
|
}
|
|
|
|
func (it *Iterator) Size() (int64, bool) {
|
|
return it.qs.SizeOf(it.checkId), true
|
|
}
|
|
|
|
func (it *Iterator) DebugString(indent int) string {
|
|
size, _ := it.Size()
|
|
return fmt.Sprintf("%s(%s %d tags: %v dir: %s size:%d %s)", strings.Repeat(" ", indent), it.Type(), it.UID(), it.Tags(), it.dir, size, it.qs.NameOf(it.checkId))
|
|
}
|
|
|
|
var levelDBType graph.Type
|
|
|
|
func init() {
|
|
levelDBType = graph.RegisterIterator("leveldb")
|
|
}
|
|
|
|
func Type() graph.Type { return levelDBType }
|
|
|
|
func (it *Iterator) Type() graph.Type { return levelDBType }
|
|
func (it *Iterator) Sorted() bool { return false }
|
|
|
|
func (it *Iterator) Optimize() (graph.Iterator, bool) {
|
|
return it, false
|
|
}
|
|
|
|
func (it *Iterator) Stats() graph.IteratorStats {
|
|
s, _ := it.Size()
|
|
return graph.IteratorStats{
|
|
CheckCost: 1,
|
|
NextCost: 2,
|
|
Size: s,
|
|
}
|
|
}
|