First reasonably fast integration test

This commit is contained in:
Barak Michener 2015-07-27 16:53:34 -04:00
parent 13d4d8b7b4
commit 425292811b
7 changed files with 209 additions and 833 deletions

File diff suppressed because it is too large Load diff

View file

@ -1,110 +0,0 @@
// Copyright 2015 The Cayley Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package sql
import (
"flag"
"fmt"
"testing"
"github.com/google/cayley/graph"
"github.com/google/cayley/graph/iterator"
"github.com/google/cayley/quad"
)
var dbpath = flag.String("dbpath", "", "Path to running DB")
// TestSimpleSQL builds a statement iterator on the object direction with no
// backing store and prints the two values buildQuery returns (presumably the
// SQL text and its arguments). It makes no assertions.
func TestSimpleSQL(t *testing.T) {
	stmt := NewStatementIterator(nil, quad.Object, "cool")
	query, args := stmt.buildQuery(false, nil)
	fmt.Println(query, args)
}
// Functional tests
// TestQuadIteration is a functional test that needs a database; it is skipped
// unless the -dbpath flag is set.
//
// It first drains an iterator over quads whose object is "Humphrey Bogart",
// printing each result. It then iterates quads whose subject is
// "/en/casablanca_1942", prints the generated query, and expects exactly 18
// results.
func TestQuadIteration(t *testing.T) {
	if *dbpath == "" {
		t.SkipNow()
	}
	db, err := newQuadStore(*dbpath, nil)
	if err != nil {
		t.Fatal(err)
	}
	it := NewStatementIterator(db.(*QuadStore), quad.Object, "Humphrey Bogart")
	for graph.Next(it) {
		fmt.Println(it.Result())
	}
	it = NewStatementIterator(db.(*QuadStore), quad.Subject, "/en/casablanca_1942")
	s, v := it.buildQuery(false, nil)
	fmt.Println(s, v)
	c := 0
	for graph.Next(it) {
		fmt.Println(it.Result())
		c++
	}
	if c != 18 {
		// The %d verb needs its operand; without it the message would print
		// "%!d(MISSING)" instead of the observed count.
		t.Errorf("Not enough results, got %d expected 18", c)
	}
}
// TestNodeIteration is a functional test that needs a database; it is skipped
// unless the -dbpath flag is set.
//
// It hand-assembles a node-typed StatementIterator constrained to the subject
// "/en/casablanca_1942" on table "t_4", prints the generated query, walks the
// results printing each value and its tags, and finally requires that the
// iterator contains "Casablanca".
func TestNodeIteration(t *testing.T) {
	if *dbpath == "" {
		t.SkipNow()
	}
	db, err := newQuadStore(*dbpath, nil)
	if err != nil {
		t.Fatal(err)
	}

	// The tag and the where clause both refer to the same table/direction pair.
	subjectOfT4 := tableDir{
		table: "t_4",
		dir:   quad.Subject,
	}
	it := &StatementIterator{
		uid:    iterator.NextUID(),
		qs:     db.(*QuadStore),
		stType: node,
		dir:    quad.Object,
		tags: []tag{
			{pair: subjectOfT4, t: "x"},
		},
		where: baseClause{
			pair:      subjectOfT4,
			strTarget: []string{"/en/casablanca_1942"},
		},
	}

	query, args := it.buildQuery(false, nil)
	it.Tagger().Add("id")
	fmt.Println(query, args)

	for graph.Next(it) {
		fmt.Println(it.Result())
		tagged := make(map[string]graph.Value)
		it.TagResults(tagged)
		for name, val := range tagged {
			fmt.Printf("%s: %v\n", name, val.(string))
		}
	}

	// Contains is evaluated before the second query is built and printed; the
	// verdict is only checked at the very end.
	found := it.Contains("Casablanca")
	query, args = it.buildQuery(true, "Casablanca")
	fmt.Println(query, args)
	it.Tagger().Add("id")
	if !found {
		t.Error("Didn't contain Casablanca")
	}
}

View file

@ -45,7 +45,6 @@ func intersectNode(a *SQLNodeIterator, b *SQLNodeIterator) (graph.Iterator, erro
qs: a.qs,
tableName: newTableName(),
linkIts: append(a.linkIts, b.linkIts...),
tagdirs: append(a.tagdirs, b.tagdirs...),
}
m.Tagger().CopyFrom(a)
m.Tagger().CopyFrom(b)
@ -59,6 +58,7 @@ func intersectLink(a *SQLLinkIterator, b *SQLLinkIterator) (graph.Iterator, erro
tableName: newTableName(),
nodeIts: append(a.nodeIts, b.nodeIts...),
constraints: append(a.constraints, b.constraints...),
tagdirs: append(a.tagdirs, b.tagdirs...),
}
m.Tagger().CopyFrom(a)
m.Tagger().CopyFrom(b)
@ -150,25 +150,24 @@ func (qs *QuadStore) optimizeLinksTo(it *iterator.LinksTo) (graph.Iterator, bool
}
newit.Tagger().CopyFrom(it)
return newit, true
//case graph.All:
//newit := &StatementIterator{
//uid: iterator.NextUID(),
//qs: qs,
//stType: link,
//size: qs.Size(),
//}
//for _, t := range primary.Tagger().Tags() {
//newit.tags = append(newit.tags, tag{
//pair: tableDir{"", it.Direction()},
//t: t,
//})
//}
//for k, v := range primary.Tagger().Fixed() {
//newit.tagger.AddFixed(k, v)
//}
//newit.tagger.CopyFrom(it)
case graph.All:
newit := &SQLLinkIterator{
uid: iterator.NextUID(),
qs: qs,
size: qs.Size(),
}
for _, t := range primary.Tagger().Tags() {
newit.tagdirs = append(newit.tagdirs, tagDir{
dir: it.Direction(),
tag: t,
})
}
for k, v := range primary.Tagger().Fixed() {
newit.tagger.AddFixed(k, v)
}
newit.tagger.CopyFrom(it)
//return newit, true
return newit, true
}
return it, false
}

View file

@ -45,11 +45,26 @@ type constraint struct {
}
type tagDir struct {
tag string
dir quad.Direction
tag string
dir quad.Direction
table string
justLocal bool
}
// Not to be stored in the iterator directly
table string
// String renders the tag as a SQL select-list entry of the form
// "<table>.<column> as <tag>". The column is chosen as follows:
//   - a concrete direction: the direction itself;
//   - quad.Any with justLocal set: the "__execd" column;
//   - quad.Any otherwise: a column named after the tag.
func (t tagDir) String() string {
	switch {
	case t.dir != quad.Any:
		return fmt.Sprintf("%s.%s as %s", t.table, t.dir, t.tag)
	case t.justLocal:
		return fmt.Sprintf("%s.__execd as %s", t.table, t.tag)
	default:
		return fmt.Sprintf("%s.%s as %s", t.table, t.tag, t.tag)
	}
}
// tableDef describes one entry of a FROM clause, rendered by the query
// builders as "<table> as <name>".
type tableDef struct {
	// table is the source expression: either the literal "quads" or a
	// parenthesized subquery. name is the alias it is selected under.
	table, name string
	// values holds the query arguments that belong to table when it is a
	// subquery; the builders place them ahead of the WHERE-clause arguments.
	values []string
}
type sqlItDir struct {
@ -58,8 +73,9 @@ type sqlItDir struct {
}
type sqlIterator interface {
buildSQL(next bool, val graph.Value) (string, []string)
sqlClone() sqlIterator
getTables() []string
getTables() []tableDef
getTags() []tagDir
buildWhere() (string, []string)
tableID() tagDir
@ -76,6 +92,7 @@ type SQLLinkIterator struct {
constraints []constraint
tableName string
size int64
tagdirs []tagDir
result map[string]string
resultIndex int
@ -111,7 +128,8 @@ func (l *SQLLinkIterator) Clone() graph.Iterator {
qs: l.qs,
tableName: l.tableName,
size: l.size,
constraints: make([]constraint, 0, len(l.constraints)),
constraints: make([]constraint, len(l.constraints)),
tagdirs: make([]tagDir, len(l.tagdirs)),
}
for _, i := range l.nodeIts {
m.nodeIts = append(m.nodeIts, sqlItDir{
@ -120,6 +138,7 @@ func (l *SQLLinkIterator) Clone() graph.Iterator {
})
}
copy(m.constraints, l.constraints)
copy(m.tagdirs, l.tagdirs)
m.tagger.CopyFrom(l)
return m
}
@ -187,6 +206,9 @@ func (l *SQLLinkIterator) Size() (int64, bool) {
}
if len(l.constraints) > 0 {
l.size = l.qs.sizeForIterator(false, l.constraints[0].dir, l.constraints[0].vals[0])
} else if len(l.nodeIts) > 1 {
subsize, _ := l.nodeIts[0].it.(*SQLNodeIterator).Size()
return subsize * 20, false
} else {
return l.qs.Size(), false
}
@ -216,11 +238,31 @@ func (l *SQLLinkIterator) Type() graph.Type {
return sqlLinkType
}
// preFilter reports whether v can be rejected without querying the database.
// It returns true as soon as one constraint lists no value equal to the
// quad's value in that constraint's direction, and false when every
// constraint is satisfied (or there are no constraints).
//
// v is asserted to be a quad.Quad once per constraint, so a non-quad value
// panics only when at least one constraint exists.
func (l *SQLLinkIterator) preFilter(v graph.Value) bool {
nextConstraint:
	for _, want := range l.constraints {
		got := v.(quad.Quad).Get(want.dir)
		for _, allowed := range want.vals {
			if allowed == got {
				continue nextConstraint
			}
		}
		// No permitted value matched this direction.
		return true
	}
	return false
}
func (l *SQLLinkIterator) Contains(v graph.Value) bool {
var err error
//if it.preFilter(v) {
//return false
//}
if l.preFilter(v) {
return false
}
if len(l.nodeIts) == 0 {
return true
}
err = l.makeCursor(false, v)
if err != nil {
glog.Errorf("Couldn't make query: %v", err)
@ -288,8 +330,8 @@ func (l *SQLLinkIterator) buildResult(i int) {
}
}
func (l *SQLLinkIterator) getTables() []string {
out := []string{l.tableName}
func (l *SQLLinkIterator) getTables() []tableDef {
out := []tableDef{tableDef{table: "quads", name: l.tableName}}
for _, i := range l.nodeIts {
out = append(out, i.it.getTables()...)
}
@ -305,6 +347,14 @@ func (l *SQLLinkIterator) getTags() []tagDir {
tag: tag,
})
}
for _, tag := range l.tagdirs {
out = append(out, tagDir{
dir: tag.dir,
table: l.tableName,
tag: tag.tag,
})
}
for _, i := range l.nodeIts {
out = append(out, i.it.getTags()...)
}
@ -320,7 +370,11 @@ func (l *SQLLinkIterator) buildWhere() (string, []string) {
}
for _, i := range l.nodeIts {
t := i.it.tableID()
q = append(q, fmt.Sprintf("%s.%s = %s.%s", l.tableName, i.dir, t.table, t.dir))
dir := t.dir.String()
if t.dir == quad.Any {
dir = t.tag
}
q = append(q, fmt.Sprintf("%s.%s = %s.%s", l.tableName, i.dir, t.table, dir))
}
for _, i := range l.nodeIts {
s, v := i.it.buildWhere()
@ -339,7 +393,7 @@ func (l *SQLLinkIterator) tableID() tagDir {
}
func (l *SQLLinkIterator) buildSQL(next bool, val graph.Value) (string, []string) {
query := "SELECT "
query := "SELECT DISTINCT "
t := []string{
fmt.Sprintf("%s.subject", l.tableName),
fmt.Sprintf("%s.predicate", l.tableName),
@ -347,18 +401,21 @@ func (l *SQLLinkIterator) buildSQL(next bool, val graph.Value) (string, []string
fmt.Sprintf("%s.label", l.tableName),
}
for _, v := range l.getTags() {
t = append(t, fmt.Sprintf("%s.%s as %s", v.table, v.dir, v.tag))
t = append(t, v.String())
}
query += strings.Join(t, ", ")
query += " FROM "
t = []string{}
var values []string
for _, k := range l.getTables() {
t = append(t, fmt.Sprintf("quads as %s", k))
values = append(values, k.values...)
t = append(t, fmt.Sprintf("%s as %s", k.table, k.name))
}
query += strings.Join(t, ", ")
query += " WHERE "
constraint, values := l.buildWhere()
constraint, wherevalues := l.buildWhere()
values = append(values, wherevalues...)
if !next {
v := val.(quad.Quad)
if constraint != "" {

View file

@ -15,6 +15,7 @@
package sql
import (
"flag"
"fmt"
"testing"
@ -23,6 +24,8 @@ import (
"github.com/google/cayley/quad"
)
var dbpath = flag.String("dbpath", "", "Path to running DB")
func TestSQLLink(t *testing.T) {
it := NewSQLLinkIterator(nil, quad.Object, "cool")
s, v := it.buildSQL(true, nil)

View file

@ -18,6 +18,7 @@ import (
"database/sql"
"fmt"
"strings"
"sync/atomic"
"github.com/barakmich/glog"
"github.com/google/cayley/graph"
@ -26,9 +27,16 @@ import (
)
var sqlNodeType graph.Type
var sqlNodeTableID uint64
// init registers the "sqlnode" iterator type with the graph package, keeping
// the returned graph.Type in sqlNodeType, and sets the node table counter to
// zero.
func init() {
sqlNodeType = graph.RegisterIterator("sqlnode")
// Explicitly start the counter that newNodeTableName increments at zero.
atomic.StoreUint64(&sqlNodeTableID, 0)
}
// newNodeTableName returns a fresh table alias of the form "n_<id>", where
// id comes from atomically incrementing the package-level sqlNodeTableID
// counter.
func newNodeTableName() string {
	return fmt.Sprintf("n_%d", atomic.AddUint64(&sqlNodeTableID, 1))
}
type SQLNodeIterator struct {
@ -38,10 +46,10 @@ type SQLNodeIterator struct {
tableName string
err error
cursor *sql.Rows
linkIts []sqlItDir
size int64
tagdirs []tagDir
cursor *sql.Rows
linkIts []sqlItDir
nodetables []string
size int64
result map[string]string
resultIndex int
@ -67,7 +75,6 @@ func (n *SQLNodeIterator) Clone() graph.Iterator {
it: i.it.sqlClone(),
})
}
copy(n.tagdirs, m.tagdirs)
m.tagger.CopyFrom(n)
return m
}
@ -173,47 +180,106 @@ func (n *SQLNodeIterator) buildResult(i int) {
}
}
func (n *SQLNodeIterator) getTables() []string {
var out []string
for _, i := range n.linkIts {
out = append(out, i.it.getTables()...)
// makeNodeTableNames assigns one freshly generated node table alias per link
// iterator and stores them in n.nodetables. It does nothing when
// n.nodetables has already been set, so aliases stay stable across calls.
func (n *SQLNodeIterator) makeNodeTableNames() {
	if n.nodetables != nil {
		return
	}
	names := make([]string, len(n.linkIts))
	for idx := range names {
		names[idx] = newNodeTableName()
	}
	n.nodetables = names
}
func (n *SQLNodeIterator) getTables() []tableDef {
var out []tableDef
switch len(n.linkIts) {
case 0:
return []tableDef{tableDef{table: "quads", name: n.tableName}}
case 1:
out = n.linkIts[0].it.getTables()
default:
return n.buildSubqueries()
}
if len(out) == 0 {
out = append(out, n.tableName)
out = append(out, tableDef{table: "quads", name: n.tableName})
}
return out
}
// buildSubqueries returns one tableDef per link iterator. Each link is
// wrapped in a throwaway single-link SQLNodeIterator whose generated SQL
// becomes a parenthesized subquery, aliased with the matching entry of
// n.nodetables and carrying that subquery's arguments.
func (n *SQLNodeIterator) buildSubqueries() []tableDef {
	var defs []tableDef
	n.makeNodeTableNames()
	for idx, link := range n.linkIts {
		// TODO(barakmich): This is a dirty hack. The real implementation is to
		// separate SQL iterators to build a similar tree as we're doing here, and
		// have a single graph.Iterator 'caddy' structure around it.
		wrapper := &SQLNodeIterator{
			uid:       iterator.NextUID(),
			tableName: newTableName(),
			linkIts:   []sqlItDir{link},
		}
		sqlText, args := wrapper.buildSQL(true, nil)
		defs = append(defs, tableDef{
			// Drop the final character of the generated SQL before nesting it
			// (presumably the statement terminator).
			table:  fmt.Sprintf("\n(%s)", sqlText[:len(sqlText)-1]),
			name:   n.nodetables[idx],
			values: args,
		})
	}
	return defs
}
func (n *SQLNodeIterator) tableID() tagDir {
if len(n.linkIts) == 0 {
switch len(n.linkIts) {
case 0:
return tagDir{
table: n.tableName,
dir: quad.Any,
tag: "__execd",
}
case 1:
return tagDir{
table: n.linkIts[0].it.tableID().table,
dir: n.linkIts[0].dir,
tag: "__execd",
}
default:
n.makeNodeTableNames()
return tagDir{
table: n.nodetables[0],
dir: quad.Any,
tag: "__execd",
}
}
return tagDir{
table: n.linkIts[0].it.tableID().table,
dir: n.linkIts[0].dir,
}
}
func (n *SQLNodeIterator) getTags() []tagDir {
func (n *SQLNodeIterator) getLocalTags() []tagDir {
myTag := n.tableID()
var out []tagDir
for _, tag := range n.tagger.Tags() {
out = append(out, tagDir{
dir: myTag.dir,
table: myTag.table,
tag: tag,
dir: myTag.dir,
table: myTag.table,
tag: tag,
justLocal: true,
})
}
for _, tag := range n.tagdirs {
out = append(out, tagDir{
dir: tag.dir,
table: myTag.table,
tag: tag.tag,
})
return out
}
func (n *SQLNodeIterator) getTags() []tagDir {
out := n.getLocalTags()
if len(n.linkIts) > 1 {
n.makeNodeTableNames()
for i, it := range n.linkIts {
for _, v := range it.it.getTags() {
out = append(out, tagDir{
tag: v.tag,
dir: quad.Any,
table: n.nodetables[i],
})
}
}
return out
}
for _, i := range n.linkIts {
out = append(out, i.it.getTags()...)
@ -225,18 +291,15 @@ func (n *SQLNodeIterator) buildWhere() (string, []string) {
var q []string
var vals []string
if len(n.linkIts) > 1 {
baseTable := n.linkIts[0].it.tableID().table
baseDir := n.linkIts[0].dir
for _, i := range n.linkIts[1:] {
table := i.it.tableID().table
dir := i.dir
q = append(q, fmt.Sprintf("%s.%s = %s.%s", baseTable, baseDir, table, dir))
for _, tb := range n.nodetables[1:] {
q = append(q, fmt.Sprintf("%s.__execd = %s.__execd", n.nodetables[0], tb))
}
} else {
for _, i := range n.linkIts {
s, v := i.it.buildWhere()
q = append(q, s)
vals = append(vals, v...)
}
}
for _, i := range n.linkIts {
s, v := i.it.buildWhere()
q = append(q, s)
vals = append(vals, v...)
}
query := strings.Join(q, " AND ")
return query, vals
@ -244,21 +307,26 @@ func (n *SQLNodeIterator) buildWhere() (string, []string) {
func (n *SQLNodeIterator) buildSQL(next bool, val graph.Value) (string, []string) {
topData := n.tableID()
query := "SELECT "
tags := []tagDir{topData}
tags = append(tags, n.getTags()...)
query := "SELECT DISTINCT "
var t []string
t = append(t, fmt.Sprintf("%s.%s as __execd", topData.table, topData.dir))
for _, v := range n.getTags() {
t = append(t, fmt.Sprintf("%s.%s as %s", v.table, v.dir, v.tag))
for _, v := range tags {
t = append(t, v.String())
}
query += strings.Join(t, ", ")
query += " FROM "
t = []string{}
var values []string
for _, k := range n.getTables() {
t = append(t, fmt.Sprintf("quads as %s", k))
values = append(values, k.values...)
t = append(t, fmt.Sprintf("%s as %s", k.table, k.name))
}
query += strings.Join(t, ", ")
query += " WHERE "
constraint, values := n.buildWhere()
constraint, wherevalues := n.buildWhere()
values = append(values, wherevalues...)
if !next {
v := val.(string)
@ -368,6 +436,7 @@ func (n *SQLNodeIterator) makeCursor(next bool, value graph.Value) error {
cursor, err := n.qs.db.Query(q, ivalues...)
if err != nil {
glog.Errorf("Couldn't get cursor from SQL database: %v", err)
glog.Errorf("Query: %v", q)
cursor = nil
return err
}