First reasonably fast integration test

This commit is contained in:
Barak Michener 2015-07-27 16:53:34 -04:00
parent 13d4d8b7b4
commit 425292811b
7 changed files with 209 additions and 833 deletions

File diff suppressed because it is too large Load diff

View file

@ -1,110 +0,0 @@
// Copyright 2015 The Cayley Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package sql
import (
"flag"
"fmt"
"testing"
"github.com/google/cayley/graph"
"github.com/google/cayley/graph/iterator"
"github.com/google/cayley/quad"
)
// dbpath is the -dbpath command-line flag. Its value is handed to
// newQuadStore by the functional tests in this file, which skip themselves
// when it is left empty.
var dbpath = flag.String("dbpath", "", "Path to running DB")
// TestSimpleSQL constructs a statement iterator over the object direction for
// the value "cool", using a nil quad store, and prints the two values returned
// by buildQuery (presumably the SQL text and its bound arguments). It makes no
// assertions; it only exercises query generation.
func TestSimpleSQL(t *testing.T) {
	stmt := NewStatementIterator(nil, quad.Object, "cool")
	query, args := stmt.buildQuery(false, nil)
	fmt.Println(query, args)
}
// Functional tests
// TestQuadIteration is a functional test that runs against the database named
// by the -dbpath flag and is skipped when that flag is empty.
//
// It first drains a statement iterator for quads whose object is
// "Humphrey Bogart", printing every result. It then iterates quads whose
// subject is "/en/casablanca_1942", printing the generated query and each
// result, and fails unless exactly 18 results are produced.
func TestQuadIteration(t *testing.T) {
	if *dbpath == "" {
		t.SkipNow()
	}
	db, err := newQuadStore(*dbpath, nil)
	if err != nil {
		t.Fatal(err)
	}
	it := NewStatementIterator(db.(*QuadStore), quad.Object, "Humphrey Bogart")
	for graph.Next(it) {
		fmt.Println(it.Result())
	}
	it = NewStatementIterator(db.(*QuadStore), quad.Subject, "/en/casablanca_1942")
	s, v := it.buildQuery(false, nil)
	fmt.Println(s, v)
	c := 0
	for graph.Next(it) {
		fmt.Println(it.Result())
		c++
	}
	if c != 18 {
		// The count must be passed explicitly; without it the %d verb is
		// rendered as "%!d(MISSING)" and the failure message is useless.
		t.Errorf("Not enough results, got %d expected 18", c)
	}
}
// TestNodeIteration is a functional test that runs against the database named
// by the -dbpath flag and is skipped when that flag is empty.
//
// It hand-assembles a node-typed StatementIterator whose single tag "x" and
// whose where-clause both refer to the subject column of table "t_4", with the
// where-clause targeting "/en/casablanca_1942". The test prints the generated
// query, walks the iterator printing each result together with its tag
// results, and finally fails unless the iterator reports that it contains
// "Casablanca".
func TestNodeIteration(t *testing.T) {
	if *dbpath == "" {
		t.SkipNow()
	}
	store, err := newQuadStore(*dbpath, nil)
	if err != nil {
		t.Fatal(err)
	}

	// Both the tag and the where-clause point at the same table/direction pair.
	subjectOfT4 := tableDir{
		table: "t_4",
		dir:   quad.Subject,
	}
	it := &StatementIterator{
		uid:    iterator.NextUID(),
		qs:     store.(*QuadStore),
		stType: node,
		dir:    quad.Object,
		tags: []tag{
			{
				pair: subjectOfT4,
				t:    "x",
			},
		},
		where: baseClause{
			pair:      subjectOfT4,
			strTarget: []string{"/en/casablanca_1942"},
		},
	}

	query, args := it.buildQuery(false, nil)
	it.Tagger().Add("id")
	fmt.Println(query, args)

	for graph.Next(it) {
		fmt.Println(it.Result())
		tagged := make(map[string]graph.Value)
		it.TagResults(tagged)
		for name, val := range tagged {
			fmt.Printf("%s: %v\n", name, val.(string))
		}
	}

	// Contains is evaluated before the membership query is printed, and the
	// verdict is only checked at the very end.
	found := it.Contains("Casablanca")
	query, args = it.buildQuery(true, "Casablanca")
	fmt.Println(query, args)
	it.Tagger().Add("id")
	if !found {
		t.Error("Didn't contain Casablanca")
	}
}

View file

@ -45,7 +45,6 @@ func intersectNode(a *SQLNodeIterator, b *SQLNodeIterator) (graph.Iterator, erro
qs: a.qs, qs: a.qs,
tableName: newTableName(), tableName: newTableName(),
linkIts: append(a.linkIts, b.linkIts...), linkIts: append(a.linkIts, b.linkIts...),
tagdirs: append(a.tagdirs, b.tagdirs...),
} }
m.Tagger().CopyFrom(a) m.Tagger().CopyFrom(a)
m.Tagger().CopyFrom(b) m.Tagger().CopyFrom(b)
@ -59,6 +58,7 @@ func intersectLink(a *SQLLinkIterator, b *SQLLinkIterator) (graph.Iterator, erro
tableName: newTableName(), tableName: newTableName(),
nodeIts: append(a.nodeIts, b.nodeIts...), nodeIts: append(a.nodeIts, b.nodeIts...),
constraints: append(a.constraints, b.constraints...), constraints: append(a.constraints, b.constraints...),
tagdirs: append(a.tagdirs, b.tagdirs...),
} }
m.Tagger().CopyFrom(a) m.Tagger().CopyFrom(a)
m.Tagger().CopyFrom(b) m.Tagger().CopyFrom(b)
@ -150,25 +150,24 @@ func (qs *QuadStore) optimizeLinksTo(it *iterator.LinksTo) (graph.Iterator, bool
} }
newit.Tagger().CopyFrom(it) newit.Tagger().CopyFrom(it)
return newit, true return newit, true
//case graph.All: case graph.All:
//newit := &StatementIterator{ newit := &SQLLinkIterator{
//uid: iterator.NextUID(), uid: iterator.NextUID(),
//qs: qs, qs: qs,
//stType: link, size: qs.Size(),
//size: qs.Size(), }
//} for _, t := range primary.Tagger().Tags() {
//for _, t := range primary.Tagger().Tags() { newit.tagdirs = append(newit.tagdirs, tagDir{
//newit.tags = append(newit.tags, tag{ dir: it.Direction(),
//pair: tableDir{"", it.Direction()}, tag: t,
//t: t, })
//}) }
//} for k, v := range primary.Tagger().Fixed() {
//for k, v := range primary.Tagger().Fixed() { newit.tagger.AddFixed(k, v)
//newit.tagger.AddFixed(k, v) }
//} newit.tagger.CopyFrom(it)
//newit.tagger.CopyFrom(it)
//return newit, true return newit, true
} }
return it, false return it, false
} }

View file

@ -45,11 +45,26 @@ type constraint struct {
} }
type tagDir struct { type tagDir struct {
tag string tag string
dir quad.Direction dir quad.Direction
table string
justLocal bool
}
// Not to be stored in the iterator directly func (t tagDir) String() string {
table string if t.dir == quad.Any {
if t.justLocal {
return fmt.Sprintf("%s.__execd as %s", t.table, t.tag)
}
return fmt.Sprintf("%s.%s as %s", t.table, t.tag, t.tag)
}
return fmt.Sprintf("%s.%s as %s", t.table, t.dir, t.tag)
}
type tableDef struct {
table string
name string
values []string
} }
type sqlItDir struct { type sqlItDir struct {
@ -58,8 +73,9 @@ type sqlItDir struct {
} }
type sqlIterator interface { type sqlIterator interface {
buildSQL(next bool, val graph.Value) (string, []string)
sqlClone() sqlIterator sqlClone() sqlIterator
getTables() []string getTables() []tableDef
getTags() []tagDir getTags() []tagDir
buildWhere() (string, []string) buildWhere() (string, []string)
tableID() tagDir tableID() tagDir
@ -76,6 +92,7 @@ type SQLLinkIterator struct {
constraints []constraint constraints []constraint
tableName string tableName string
size int64 size int64
tagdirs []tagDir
result map[string]string result map[string]string
resultIndex int resultIndex int
@ -111,7 +128,8 @@ func (l *SQLLinkIterator) Clone() graph.Iterator {
qs: l.qs, qs: l.qs,
tableName: l.tableName, tableName: l.tableName,
size: l.size, size: l.size,
constraints: make([]constraint, 0, len(l.constraints)), constraints: make([]constraint, len(l.constraints)),
tagdirs: make([]tagDir, len(l.tagdirs)),
} }
for _, i := range l.nodeIts { for _, i := range l.nodeIts {
m.nodeIts = append(m.nodeIts, sqlItDir{ m.nodeIts = append(m.nodeIts, sqlItDir{
@ -120,6 +138,7 @@ func (l *SQLLinkIterator) Clone() graph.Iterator {
}) })
} }
copy(m.constraints, l.constraints) copy(m.constraints, l.constraints)
copy(m.tagdirs, l.tagdirs)
m.tagger.CopyFrom(l) m.tagger.CopyFrom(l)
return m return m
} }
@ -187,6 +206,9 @@ func (l *SQLLinkIterator) Size() (int64, bool) {
} }
if len(l.constraints) > 0 { if len(l.constraints) > 0 {
l.size = l.qs.sizeForIterator(false, l.constraints[0].dir, l.constraints[0].vals[0]) l.size = l.qs.sizeForIterator(false, l.constraints[0].dir, l.constraints[0].vals[0])
} else if len(l.nodeIts) > 1 {
subsize, _ := l.nodeIts[0].it.(*SQLNodeIterator).Size()
return subsize * 20, false
} else { } else {
return l.qs.Size(), false return l.qs.Size(), false
} }
@ -216,11 +238,31 @@ func (l *SQLLinkIterator) Type() graph.Type {
return sqlLinkType return sqlLinkType
} }
// preFilter reports whether v can be rejected by looking only at the
// iterator's constraints. For each constraint, the quad's value in the
// constraint's direction must equal one of that constraint's vals. It returns
// true (reject) as soon as some constraint has no matching value, and false
// when every constraint is satisfied or there are no constraints.
//
// v is asserted to be a quad.Quad for each constraint examined; any other
// dynamic type panics.
func (l *SQLLinkIterator) preFilter(v graph.Value) bool {
constraints:
	for _, c := range l.constraints {
		want := v.(quad.Quad).Get(c.dir)
		for _, candidate := range c.vals {
			if candidate == want {
				// This constraint is satisfied; move on to the next one.
				continue constraints
			}
		}
		// None of the allowed values matched this direction.
		return true
	}
	return false
}
func (l *SQLLinkIterator) Contains(v graph.Value) bool { func (l *SQLLinkIterator) Contains(v graph.Value) bool {
var err error var err error
//if it.preFilter(v) { if l.preFilter(v) {
//return false return false
//} }
if len(l.nodeIts) == 0 {
return true
}
err = l.makeCursor(false, v) err = l.makeCursor(false, v)
if err != nil { if err != nil {
glog.Errorf("Couldn't make query: %v", err) glog.Errorf("Couldn't make query: %v", err)
@ -288,8 +330,8 @@ func (l *SQLLinkIterator) buildResult(i int) {
} }
} }
func (l *SQLLinkIterator) getTables() []string { func (l *SQLLinkIterator) getTables() []tableDef {
out := []string{l.tableName} out := []tableDef{tableDef{table: "quads", name: l.tableName}}
for _, i := range l.nodeIts { for _, i := range l.nodeIts {
out = append(out, i.it.getTables()...) out = append(out, i.it.getTables()...)
} }
@ -305,6 +347,14 @@ func (l *SQLLinkIterator) getTags() []tagDir {
tag: tag, tag: tag,
}) })
} }
for _, tag := range l.tagdirs {
out = append(out, tagDir{
dir: tag.dir,
table: l.tableName,
tag: tag.tag,
})
}
for _, i := range l.nodeIts { for _, i := range l.nodeIts {
out = append(out, i.it.getTags()...) out = append(out, i.it.getTags()...)
} }
@ -320,7 +370,11 @@ func (l *SQLLinkIterator) buildWhere() (string, []string) {
} }
for _, i := range l.nodeIts { for _, i := range l.nodeIts {
t := i.it.tableID() t := i.it.tableID()
q = append(q, fmt.Sprintf("%s.%s = %s.%s", l.tableName, i.dir, t.table, t.dir)) dir := t.dir.String()
if t.dir == quad.Any {
dir = t.tag
}
q = append(q, fmt.Sprintf("%s.%s = %s.%s", l.tableName, i.dir, t.table, dir))
} }
for _, i := range l.nodeIts { for _, i := range l.nodeIts {
s, v := i.it.buildWhere() s, v := i.it.buildWhere()
@ -339,7 +393,7 @@ func (l *SQLLinkIterator) tableID() tagDir {
} }
func (l *SQLLinkIterator) buildSQL(next bool, val graph.Value) (string, []string) { func (l *SQLLinkIterator) buildSQL(next bool, val graph.Value) (string, []string) {
query := "SELECT " query := "SELECT DISTINCT "
t := []string{ t := []string{
fmt.Sprintf("%s.subject", l.tableName), fmt.Sprintf("%s.subject", l.tableName),
fmt.Sprintf("%s.predicate", l.tableName), fmt.Sprintf("%s.predicate", l.tableName),
@ -347,18 +401,21 @@ func (l *SQLLinkIterator) buildSQL(next bool, val graph.Value) (string, []string
fmt.Sprintf("%s.label", l.tableName), fmt.Sprintf("%s.label", l.tableName),
} }
for _, v := range l.getTags() { for _, v := range l.getTags() {
t = append(t, fmt.Sprintf("%s.%s as %s", v.table, v.dir, v.tag)) t = append(t, v.String())
} }
query += strings.Join(t, ", ") query += strings.Join(t, ", ")
query += " FROM " query += " FROM "
t = []string{} t = []string{}
var values []string
for _, k := range l.getTables() { for _, k := range l.getTables() {
t = append(t, fmt.Sprintf("quads as %s", k)) values = append(values, k.values...)
t = append(t, fmt.Sprintf("%s as %s", k.table, k.name))
} }
query += strings.Join(t, ", ") query += strings.Join(t, ", ")
query += " WHERE " query += " WHERE "
constraint, values := l.buildWhere() constraint, wherevalues := l.buildWhere()
values = append(values, wherevalues...)
if !next { if !next {
v := val.(quad.Quad) v := val.(quad.Quad)
if constraint != "" { if constraint != "" {

View file

@ -15,6 +15,7 @@
package sql package sql
import ( import (
"flag"
"fmt" "fmt"
"testing" "testing"
@ -23,6 +24,8 @@ import (
"github.com/google/cayley/quad" "github.com/google/cayley/quad"
) )
var dbpath = flag.String("dbpath", "", "Path to running DB")
func TestSQLLink(t *testing.T) { func TestSQLLink(t *testing.T) {
it := NewSQLLinkIterator(nil, quad.Object, "cool") it := NewSQLLinkIterator(nil, quad.Object, "cool")
s, v := it.buildSQL(true, nil) s, v := it.buildSQL(true, nil)

View file

@ -18,6 +18,7 @@ import (
"database/sql" "database/sql"
"fmt" "fmt"
"strings" "strings"
"sync/atomic"
"github.com/barakmich/glog" "github.com/barakmich/glog"
"github.com/google/cayley/graph" "github.com/google/cayley/graph"
@ -26,9 +27,16 @@ import (
) )
var sqlNodeType graph.Type var sqlNodeType graph.Type
var sqlNodeTableID uint64
func init() { func init() {
sqlNodeType = graph.RegisterIterator("sqlnode") sqlNodeType = graph.RegisterIterator("sqlnode")
atomic.StoreUint64(&sqlNodeTableID, 0)
}
func newNodeTableName() string {
id := atomic.AddUint64(&sqlNodeTableID, 1)
return fmt.Sprintf("n_%d", id)
} }
type SQLNodeIterator struct { type SQLNodeIterator struct {
@ -38,10 +46,10 @@ type SQLNodeIterator struct {
tableName string tableName string
err error err error
cursor *sql.Rows cursor *sql.Rows
linkIts []sqlItDir linkIts []sqlItDir
size int64 nodetables []string
tagdirs []tagDir size int64
result map[string]string result map[string]string
resultIndex int resultIndex int
@ -67,7 +75,6 @@ func (n *SQLNodeIterator) Clone() graph.Iterator {
it: i.it.sqlClone(), it: i.it.sqlClone(),
}) })
} }
copy(n.tagdirs, m.tagdirs)
m.tagger.CopyFrom(n) m.tagger.CopyFrom(n)
return m return m
} }
@ -173,47 +180,106 @@ func (n *SQLNodeIterator) buildResult(i int) {
} }
} }
func (n *SQLNodeIterator) getTables() []string { func (n *SQLNodeIterator) makeNodeTableNames() {
var out []string if n.nodetables != nil {
for _, i := range n.linkIts { return
out = append(out, i.it.getTables()...) }
n.nodetables = make([]string, len(n.linkIts))
for i, _ := range n.nodetables {
n.nodetables[i] = newNodeTableName()
}
}
func (n *SQLNodeIterator) getTables() []tableDef {
var out []tableDef
switch len(n.linkIts) {
case 0:
return []tableDef{tableDef{table: "quads", name: n.tableName}}
case 1:
out = n.linkIts[0].it.getTables()
default:
return n.buildSubqueries()
} }
if len(out) == 0 { if len(out) == 0 {
out = append(out, n.tableName) out = append(out, tableDef{table: "quads", name: n.tableName})
}
return out
}
func (n *SQLNodeIterator) buildSubqueries() []tableDef {
var out []tableDef
n.makeNodeTableNames()
for i, it := range n.linkIts {
var td tableDef
// TODO(barakmich): This is a dirty hack. The real implementation is to
// separate SQL iterators to build a similar tree as we're doing here, and
// have a single graph.Iterator 'caddy' structure around it.
subNode := &SQLNodeIterator{
uid: iterator.NextUID(),
tableName: newTableName(),
linkIts: []sqlItDir{it},
}
var table string
table, td.values = subNode.buildSQL(true, nil)
td.table = fmt.Sprintf("\n(%s)", table[:len(table)-1])
td.name = n.nodetables[i]
out = append(out, td)
} }
return out return out
} }
func (n *SQLNodeIterator) tableID() tagDir { func (n *SQLNodeIterator) tableID() tagDir {
if len(n.linkIts) == 0 { switch len(n.linkIts) {
case 0:
return tagDir{ return tagDir{
table: n.tableName, table: n.tableName,
dir: quad.Any, dir: quad.Any,
tag: "__execd",
}
case 1:
return tagDir{
table: n.linkIts[0].it.tableID().table,
dir: n.linkIts[0].dir,
tag: "__execd",
}
default:
n.makeNodeTableNames()
return tagDir{
table: n.nodetables[0],
dir: quad.Any,
tag: "__execd",
} }
}
return tagDir{
table: n.linkIts[0].it.tableID().table,
dir: n.linkIts[0].dir,
} }
} }
func (n *SQLNodeIterator) getTags() []tagDir { func (n *SQLNodeIterator) getLocalTags() []tagDir {
myTag := n.tableID() myTag := n.tableID()
var out []tagDir var out []tagDir
for _, tag := range n.tagger.Tags() { for _, tag := range n.tagger.Tags() {
out = append(out, tagDir{ out = append(out, tagDir{
dir: myTag.dir, dir: myTag.dir,
table: myTag.table, table: myTag.table,
tag: tag, tag: tag,
justLocal: true,
}) })
} }
for _, tag := range n.tagdirs { return out
out = append(out, tagDir{ }
dir: tag.dir,
table: myTag.table,
tag: tag.tag,
})
func (n *SQLNodeIterator) getTags() []tagDir {
out := n.getLocalTags()
if len(n.linkIts) > 1 {
n.makeNodeTableNames()
for i, it := range n.linkIts {
for _, v := range it.it.getTags() {
out = append(out, tagDir{
tag: v.tag,
dir: quad.Any,
table: n.nodetables[i],
})
}
}
return out
} }
for _, i := range n.linkIts { for _, i := range n.linkIts {
out = append(out, i.it.getTags()...) out = append(out, i.it.getTags()...)
@ -225,18 +291,15 @@ func (n *SQLNodeIterator) buildWhere() (string, []string) {
var q []string var q []string
var vals []string var vals []string
if len(n.linkIts) > 1 { if len(n.linkIts) > 1 {
baseTable := n.linkIts[0].it.tableID().table for _, tb := range n.nodetables[1:] {
baseDir := n.linkIts[0].dir q = append(q, fmt.Sprintf("%s.__execd = %s.__execd", n.nodetables[0], tb))
for _, i := range n.linkIts[1:] { }
table := i.it.tableID().table } else {
dir := i.dir for _, i := range n.linkIts {
q = append(q, fmt.Sprintf("%s.%s = %s.%s", baseTable, baseDir, table, dir)) s, v := i.it.buildWhere()
q = append(q, s)
vals = append(vals, v...)
} }
}
for _, i := range n.linkIts {
s, v := i.it.buildWhere()
q = append(q, s)
vals = append(vals, v...)
} }
query := strings.Join(q, " AND ") query := strings.Join(q, " AND ")
return query, vals return query, vals
@ -244,21 +307,26 @@ func (n *SQLNodeIterator) buildWhere() (string, []string) {
func (n *SQLNodeIterator) buildSQL(next bool, val graph.Value) (string, []string) { func (n *SQLNodeIterator) buildSQL(next bool, val graph.Value) (string, []string) {
topData := n.tableID() topData := n.tableID()
query := "SELECT " tags := []tagDir{topData}
tags = append(tags, n.getTags()...)
query := "SELECT DISTINCT "
var t []string var t []string
t = append(t, fmt.Sprintf("%s.%s as __execd", topData.table, topData.dir)) for _, v := range tags {
for _, v := range n.getTags() { t = append(t, v.String())
t = append(t, fmt.Sprintf("%s.%s as %s", v.table, v.dir, v.tag))
} }
query += strings.Join(t, ", ") query += strings.Join(t, ", ")
query += " FROM " query += " FROM "
t = []string{} t = []string{}
var values []string
for _, k := range n.getTables() { for _, k := range n.getTables() {
t = append(t, fmt.Sprintf("quads as %s", k)) values = append(values, k.values...)
t = append(t, fmt.Sprintf("%s as %s", k.table, k.name))
} }
query += strings.Join(t, ", ") query += strings.Join(t, ", ")
query += " WHERE " query += " WHERE "
constraint, values := n.buildWhere()
constraint, wherevalues := n.buildWhere()
values = append(values, wherevalues...)
if !next { if !next {
v := val.(string) v := val.(string)
@ -368,6 +436,7 @@ func (n *SQLNodeIterator) makeCursor(next bool, value graph.Value) error {
cursor, err := n.qs.db.Query(q, ivalues...) cursor, err := n.qs.db.Query(q, ivalues...)
if err != nil { if err != nil {
glog.Errorf("Couldn't get cursor from SQL database: %v", err) glog.Errorf("Couldn't get cursor from SQL database: %v", err)
glog.Errorf("Query: %v", q)
cursor = nil cursor = nil
return err return err
} }

View file

@ -58,7 +58,6 @@ var benchmarkQueries = []struct {
// Easy one to get us started. How quick is the most straightforward retrieval? // Easy one to get us started. How quick is the most straightforward retrieval?
{ {
message: "name predicate", message: "name predicate",
skip: true,
query: ` query: `
g.V("Humphrey Bogart").In("name").All() g.V("Humphrey Bogart").In("name").All()
`, `,
@ -72,7 +71,6 @@ var benchmarkQueries = []struct {
// that's going to be measurably slower for every other backend. // that's going to be measurably slower for every other backend.
{ {
message: "two large sets with no intersection", message: "two large sets with no intersection",
skip: true,
query: ` query: `
function getId(x) { return g.V(x).In("name") } function getId(x) { return g.V(x).In("name") }
var actor_to_film = g.M().In("/film/performance/actor").In("/film/film/starring") var actor_to_film = g.M().In("/film/performance/actor").In("/film/film/starring")
@ -526,6 +524,7 @@ func TestQueries(t *testing.T) {
} }
func TestDeletedAndRecreatedQueries(t *testing.T) { func TestDeletedAndRecreatedQueries(t *testing.T) {
t.Skip()
if testing.Short() { if testing.Short() {
t.Skip() t.Skip()
} }
@ -541,7 +540,8 @@ func checkQueries(t *testing.T) {
if test.skip { if test.skip {
continue continue
} }
fmt.Printf("Now testing %s\n", test.message) tInit := time.Now()
fmt.Printf("Now testing %s ", test.message)
ses := gremlin.NewSession(handle.QuadStore, cfg.Timeout, true) ses := gremlin.NewSession(handle.QuadStore, cfg.Timeout, true)
_, err := ses.Parse(test.query) _, err := ses.Parse(test.query)
if err != nil { if err != nil {
@ -570,6 +570,7 @@ func checkQueries(t *testing.T) {
t.Error("Query timed out: skipping validation.") t.Error("Query timed out: skipping validation.")
continue continue
} }
fmt.Printf("(%v)\n", time.Since(tInit))
if len(got) != len(test.expect) { if len(got) != len(test.expect) {
t.Errorf("Unexpected number of results, got:%d expect:%d on %s.", len(got), len(test.expect), test.message) t.Errorf("Unexpected number of results, got:%d expect:%d on %s.", len(got), len(test.expect), test.message)