sq/drivers/userdriver/xmlud/xmlimport_test.go
Neil O'Toole ad23d5c116
Auto-detect CSV headers (#188)
* wip: initial header detection

* wip: refactored csv driver

* wip: Fixes to kind.Detector

* typo

* Refactor pkg csv files

* Update to changelog

* workflow: now running codacy and codeql on cron, not on push/pr
2023-04-09 08:44:27 -06:00

125 lines
3.9 KiB
Go
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

package xmlud_test
import (
"bytes"
"testing"
"github.com/neilotoole/sq/libsq/core/stringz"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
"gopkg.in/yaml.v3"
"github.com/neilotoole/sq/cli/config"
"github.com/neilotoole/sq/drivers/userdriver/xmlud"
"github.com/neilotoole/sq/testh"
"github.com/neilotoole/sq/testh/proj"
"github.com/neilotoole/sq/testh/testsrc"
)
const (
driverRSS = "rss"
driverPpl = "ppl"
)
func TestImport_Ppl(t *testing.T) {
th := testh.New(t)
ext := &config.Ext{}
require.NoError(t, yaml.Unmarshal(proj.ReadFile(testsrc.PathDriverDefPpl), ext))
require.Equal(t, 1, len(ext.UserDrivers))
udDef := ext.UserDrivers[0]
require.Equal(t, driverPpl, udDef.Name)
require.Equal(t, xmlud.Genre, udDef.Genre)
scratchDB, err := th.Databases().OpenScratch(th.Context, "ppl")
require.NoError(t, err)
t.Cleanup(func() {
assert.NoError(t, scratchDB.Close())
})
data := proj.ReadFile("drivers/userdriver/xmlud/testdata/people.xml")
err = xmlud.Import(th.Context, udDef, bytes.NewReader(data), scratchDB)
require.NoError(t, err)
srcMeta, err := scratchDB.SourceMetadata(th.Context)
require.NoError(t, err)
require.Equal(t, 2, len(srcMeta.Tables))
require.Equal(t, "person", srcMeta.Tables[0].Name)
require.Equal(t, "skill", srcMeta.Tables[1].Name)
sink, err := th.QuerySQL(scratchDB.Source(), "SELECT * FROM person")
require.NoError(t, err)
require.Equal(t, 3, len(sink.Recs))
require.Equal(t, "Nikola", stringz.Val(sink.Recs[0][1]))
for i, rec := range sink.Recs {
// Verify that the primary id cols are sequential
require.Equal(t, int64(i+1), stringz.Val(rec[0]))
}
sink, err = th.QuerySQL(scratchDB.Source(), "SELECT * FROM skill")
require.NoError(t, err)
require.Equal(t, 6, len(sink.Recs))
require.Equal(t, "Electrifying", stringz.Val(sink.Recs[0][2]))
for i, rec := range sink.Recs {
// Verify that the primary id cols are sequential
require.Equal(t, int64(i+1), stringz.Val(rec[0]))
}
}
func TestImport_RSS(t *testing.T) {
th := testh.New(t)
ext := &config.Ext{}
require.NoError(t, yaml.Unmarshal(proj.ReadFile(testsrc.PathDriverDefRSS), ext))
require.Equal(t, 1, len(ext.UserDrivers))
udDef := ext.UserDrivers[0]
require.Equal(t, driverRSS, udDef.Name)
require.Equal(t, xmlud.Genre, udDef.Genre)
scratchDB, err := th.Databases().OpenScratch(th.Context, "rss")
require.NoError(t, err)
t.Cleanup(func() {
assert.NoError(t, scratchDB.Close())
})
data := proj.ReadFile("drivers/userdriver/xmlud/testdata/nytimes_local.rss.xml")
err = xmlud.Import(th.Context, udDef, bytes.NewReader(data), scratchDB)
require.NoError(t, err)
srcMeta, err := scratchDB.SourceMetadata(th.Context)
require.NoError(t, err)
require.Equal(t, 3, len(srcMeta.Tables))
require.Equal(t, "category", srcMeta.Tables[0].Name)
require.Equal(t, "channel", srcMeta.Tables[1].Name)
require.Equal(t, "item", srcMeta.Tables[2].Name)
sink, err := th.QuerySQL(scratchDB.Source(), "SELECT * FROM channel")
require.NoError(t, err)
require.Equal(t, 1, len(sink.Recs))
require.Equal(t, "NYT > World", stringz.Val(sink.Recs[0][1]))
for i, rec := range sink.Recs {
// Verify that the primary id cols are sequential
require.Equal(t, int64(i+1), stringz.Val(rec[0]))
}
sink, err = th.QuerySQL(scratchDB.Source(), "SELECT * FROM category")
require.NoError(t, err)
require.Equal(t, 251, len(sink.Recs))
require.EqualValues(t, "Extradition", stringz.Val(sink.Recs[0][2]))
for i, rec := range sink.Recs {
// Verify that the primary id cols are sequential
require.Equal(t, int64(i+1), stringz.Val(rec[0]))
}
sink, err = th.QuerySQL(scratchDB.Source(), "SELECT * FROM item")
require.NoError(t, err)
require.Equal(t, 45, len(sink.Recs))
require.EqualValues(t, "Trilobites: Fishing for Clues to Solve Namibias Fairy Circle Mystery",
stringz.Val(sink.Recs[17][4]))
for i, rec := range sink.Recs {
// Verify that the primary id cols are sequential
require.Equal(t, int64(i+1), stringz.Val(rec[0]))
}
}