2020-08-06 20:58:47 +03:00
|
|
|
package cli
|
|
|
|
|
|
|
|
import (
|
2022-12-25 07:04:18 +03:00
|
|
|
"bytes"
|
|
|
|
"context"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
"os"
|
2020-08-06 20:58:47 +03:00
|
|
|
"strings"
|
|
|
|
|
2022-12-25 07:04:18 +03:00
|
|
|
"github.com/neilotoole/sq/cli/output"
|
2020-08-06 20:58:47 +03:00
|
|
|
"github.com/spf13/cobra"
|
2022-12-25 07:04:18 +03:00
|
|
|
"golang.org/x/term"
|
2020-08-06 20:58:47 +03:00
|
|
|
|
|
|
|
"github.com/neilotoole/sq/drivers/sqlite3"
|
2020-08-23 13:42:15 +03:00
|
|
|
"github.com/neilotoole/sq/libsq/core/errz"
|
|
|
|
"github.com/neilotoole/sq/libsq/core/options"
|
|
|
|
"github.com/neilotoole/sq/libsq/core/stringz"
|
2020-08-06 20:58:47 +03:00
|
|
|
"github.com/neilotoole/sq/libsq/source"
|
|
|
|
)
|
|
|
|
|
2021-02-22 10:37:00 +03:00
|
|
|
func newSrcAddCmd() *cobra.Command {
|
2020-08-06 20:58:47 +03:00
|
|
|
cmd := &cobra.Command{
|
2023-04-16 01:28:51 +03:00
|
|
|
Use: "add [--handle @HANDLE] LOCATION",
|
|
|
|
RunE: execSrcAdd,
|
|
|
|
Args: cobra.ExactArgs(1),
|
2023-01-01 06:17:44 +03:00
|
|
|
Example: `
|
|
|
|
When adding a data source, LOCATION is the only required arg.
|
2020-08-06 20:58:47 +03:00
|
|
|
|
2023-04-16 01:28:51 +03:00
|
|
|
$ sq add ./actor.csv
|
|
|
|
@actor csv actor.csv
|
|
|
|
|
|
|
|
Note that sq generated the handle "@actor". But you can explicitly specify
|
|
|
|
a handle.
|
|
|
|
|
|
|
|
# Add a postgres source with handle "@sakila/pg"
|
|
|
|
$ sq add -h @sakila/pg 'postgres://user:pass@localhost/sakila'
|
2020-08-06 20:58:47 +03:00
|
|
|
|
2023-04-16 01:28:51 +03:00
|
|
|
This handle format "@sakila/pg" includes a group, "sakila". Using a group
|
|
|
|
is entirely optional: it is a way to organize sources. For example:
|
|
|
|
|
|
|
|
$ sq add -h @dev/pg 'postgres://user:pass@dev.db.example.com/sakila'
|
|
|
|
$ sq add -h @prod/pg 'postgres://user:pass@prod.db.acme.com/sakila'
|
|
|
|
|
|
|
|
The format of LOCATION is driver-specific, but is generally a DB connection
|
2023-03-19 07:58:00 +03:00
|
|
|
string, a file path, or a URL.
|
2020-08-06 20:58:47 +03:00
|
|
|
|
|
|
|
DRIVER://USER:PASS@HOST:PORT/DBNAME
|
|
|
|
/path/to/local/file.ext
|
|
|
|
https://sq.io/data/test1.xlsx
|
|
|
|
|
|
|
|
If flag --handle is omitted, sq will generate a handle based
|
|
|
|
on LOCATION and the source driver type.
|
|
|
|
|
2022-12-25 07:04:18 +03:00
|
|
|
It's a security hazard to expose the data source password via
|
|
|
|
the LOCATION string. If flag --password (-p) is set, sq prompt the
|
|
|
|
user for the password:
|
|
|
|
|
|
|
|
$ sq add 'postgres://user@localhost/sakila' -p
|
|
|
|
Password: ****
|
|
|
|
|
|
|
|
However, if there's input on stdin, sq will read the password from
|
|
|
|
there instead of prompting the user:
|
|
|
|
|
|
|
|
# Add a source, but read password from an environment variable
|
2023-03-12 07:21:05 +03:00
|
|
|
$ export PASSWD='open:;"_Ses@me'
|
|
|
|
$ sq add 'postgres://user@localhost/sakila' -p <<< $PASSWD
|
2020-08-06 20:58:47 +03:00
|
|
|
|
2022-12-25 07:04:18 +03:00
|
|
|
# Same as above, but instead read password from file
|
|
|
|
$ echo 'open:;"_Ses@me' > password.txt
|
|
|
|
$ sq add 'postgres://user@localhost/sakila' -p < password.txt
|
|
|
|
|
|
|
|
Flag --opts sets source-specific options. Generally, opts are relevant
|
2020-08-06 20:58:47 +03:00
|
|
|
to document source types (such as a CSV file). The most common
|
|
|
|
use is to specify that the document has a header row:
|
|
|
|
|
2021-02-22 10:37:00 +03:00
|
|
|
$ sq add actor.csv --opts=header=true
|
2020-08-06 20:58:47 +03:00
|
|
|
|
2022-12-25 07:04:18 +03:00
|
|
|
Use query string encoding for multiple options, e.g. "--opts a=b&x=y".
|
|
|
|
|
|
|
|
If flag --driver is omitted, sq will attempt to determine the
|
|
|
|
type from LOCATION via file suffix, content type, etc.. If the result
|
|
|
|
is ambiguous, explicitly specify the driver type.
|
|
|
|
|
|
|
|
$ sq add --driver=tsv ./mystery.data
|
2020-08-06 20:58:47 +03:00
|
|
|
|
2023-03-19 07:58:00 +03:00
|
|
|
Available source driver types can be listed via "sq driver ls". At a
|
2022-12-25 07:04:18 +03:00
|
|
|
minimum, the following drivers are bundled:
|
2020-08-06 20:58:47 +03:00
|
|
|
|
2021-02-22 10:37:00 +03:00
|
|
|
sqlite3 SQLite
|
|
|
|
postgres PostgreSQL
|
2022-12-25 07:04:18 +03:00
|
|
|
sqlserver Microsoft SQL Server / Azure SQL Edge
|
2021-02-22 10:37:00 +03:00
|
|
|
mysql MySQL
|
|
|
|
csv Comma-Separated Values
|
|
|
|
tsv Tab-Separated Values
|
|
|
|
json JSON
|
|
|
|
jsona JSON Array: LF-delimited JSON arrays
|
|
|
|
jsonl JSON Lines: LF-delimited JSON objects
|
2022-12-25 07:04:18 +03:00
|
|
|
xlsx Microsoft Excel XLSX
|
|
|
|
|
2023-03-19 07:58:00 +03:00
|
|
|
If there isn't already an active source, the newly added source becomes the
|
2023-04-16 01:28:51 +03:00
|
|
|
active source (but the active group does not change). Otherwise you can
|
|
|
|
use flag --active to make the new source active.
|
2023-03-19 07:58:00 +03:00
|
|
|
|
2022-12-25 07:04:18 +03:00
|
|
|
More examples:
|
|
|
|
|
|
|
|
# Add a source, but prompt user for password
|
|
|
|
$ sq add 'postgres://user@localhost/sakila' -p
|
|
|
|
Password: ****
|
|
|
|
|
|
|
|
# Explicitly set flags
|
|
|
|
$ sq add --handle=@sakila_pg --driver=postgres 'postgres://user:pass@localhost/sakila'
|
|
|
|
|
|
|
|
# Same as above, but with short flags
|
|
|
|
$ sq add -h @sakila_pg --d postgres 'postgres://user:pass@localhost/sakila'
|
|
|
|
|
|
|
|
# Add a SQL Server source; will have generated handle @sakila_mssql or similar
|
|
|
|
$ sq add 'sqlserver://user:pass@localhost?database=sakila'
|
2023-03-19 09:18:54 +03:00
|
|
|
|
|
|
|
# Add a sqlite db, and immediately make it the active source
|
2023-04-16 01:28:51 +03:00
|
|
|
$ sq add ./testdata/sqlite1.db --active
|
2022-12-25 07:04:18 +03:00
|
|
|
|
|
|
|
# Add an Excel spreadsheet, with options
|
|
|
|
$ sq add ./testdata/test1.xlsx --opts=header=true
|
|
|
|
|
|
|
|
# Add a CSV source, with options
|
|
|
|
$ sq add ./testdata/person.csv --opts=header=true
|
|
|
|
|
|
|
|
# Add a CSV source from a URL (will be downloaded)
|
2023-04-16 01:28:51 +03:00
|
|
|
$ sq add https://sq.io/testdata/actor.csv
|
|
|
|
|
|
|
|
# Add a source, and make it the active source (and group)
|
|
|
|
$ sq add ./actor.csv -h @csv/actor`,
|
|
|
|
Short: "Add data source",
|
|
|
|
Long: `Add data source specified by LOCATION, optionally identified by @HANDLE.`,
|
2020-08-06 20:58:47 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
cmd.Flags().StringP(flagDriver, flagDriverShort, "", flagDriverUsage)
|
2022-12-25 07:09:20 +03:00
|
|
|
panicOn(cmd.RegisterFlagCompletionFunc(flagDriver, completeDriverType))
|
2020-08-06 20:58:47 +03:00
|
|
|
cmd.Flags().StringP(flagSrcOptions, "", "", flagSrcOptionsUsage)
|
|
|
|
cmd.Flags().StringP(flagHandle, flagHandleShort, "", flagHandleUsage)
|
2022-12-25 07:04:18 +03:00
|
|
|
cmd.Flags().BoolP(flagPasswordPrompt, flagPasswordPromptShort, false, flagPasswordPromptUsage)
|
|
|
|
cmd.Flags().Bool(flagSkipVerify, false, flagSkipVerifyUsage)
|
2023-01-01 06:17:44 +03:00
|
|
|
cmd.Flags().BoolP(flagJSON, flagJSONShort, false, flagJSONUsage)
|
2023-03-19 09:18:54 +03:00
|
|
|
cmd.Flags().BoolP(flagAddActive, flagAddActiveShort, false, flagAddActiveUsage)
|
2021-02-22 10:37:00 +03:00
|
|
|
return cmd
|
2020-08-06 20:58:47 +03:00
|
|
|
}
|
|
|
|
|
2021-02-22 10:37:00 +03:00
|
|
|
func execSrcAdd(cmd *cobra.Command, args []string) error {
|
|
|
|
rc := RunContextFrom(cmd.Context())
|
2020-08-06 20:58:47 +03:00
|
|
|
cfg := rc.Config
|
2023-01-01 06:17:44 +03:00
|
|
|
|
2020-08-06 20:58:47 +03:00
|
|
|
loc := source.AbsLocation(strings.TrimSpace(args[0]))
|
|
|
|
var err error
|
|
|
|
var typ source.Type
|
2020-10-20 18:05:43 +03:00
|
|
|
|
2023-01-01 06:17:44 +03:00
|
|
|
if cmdFlagChanged(cmd, flagDriver) {
|
2020-08-06 20:58:47 +03:00
|
|
|
val, _ := cmd.Flags().GetString(flagDriver)
|
|
|
|
typ = source.Type(strings.TrimSpace(val))
|
|
|
|
} else {
|
2021-02-22 10:37:00 +03:00
|
|
|
typ, err = rc.files.Type(cmd.Context(), loc)
|
2020-08-06 20:58:47 +03:00
|
|
|
if err != nil {
|
2020-10-20 18:05:43 +03:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
if typ == source.TypeNone {
|
|
|
|
return errz.Errorf("unable to determine source type: use --driver flag")
|
2020-08-06 20:58:47 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-10-20 18:05:43 +03:00
|
|
|
if rc.registry.ProviderFor(typ) == nil {
|
2023-04-02 22:49:45 +03:00
|
|
|
return errz.Errorf("unsupported source type {%s}", typ)
|
2020-10-20 18:05:43 +03:00
|
|
|
}
|
|
|
|
|
2020-08-06 20:58:47 +03:00
|
|
|
var handle string
|
2023-01-01 06:17:44 +03:00
|
|
|
if cmdFlagChanged(cmd, flagHandle) {
|
2020-08-06 20:58:47 +03:00
|
|
|
handle, _ = cmd.Flags().GetString(flagHandle)
|
|
|
|
} else {
|
2023-04-16 01:28:51 +03:00
|
|
|
handle, err = source.SuggestHandle(rc.Config.Sources, typ, loc)
|
2020-08-06 20:58:47 +03:00
|
|
|
if err != nil {
|
|
|
|
return errz.Wrap(err, "unable to suggest a handle: use --handle flag")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if stringz.InSlice(source.ReservedHandles(), handle) {
|
|
|
|
return errz.Errorf("handle reserved for system use: %s", handle)
|
|
|
|
}
|
|
|
|
|
2023-04-16 01:28:51 +03:00
|
|
|
if err = source.ValidHandle(handle); err != nil {
|
2020-08-06 20:58:47 +03:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-04-16 01:28:51 +03:00
|
|
|
if cfg.Sources.IsExistingSource(handle) {
|
2020-08-06 20:58:47 +03:00
|
|
|
return errz.Errorf("source handle already exists: %s", handle)
|
|
|
|
}
|
|
|
|
|
|
|
|
var opts options.Options
|
2023-01-01 06:17:44 +03:00
|
|
|
if cmdFlagChanged(cmd, flagSrcOptions) {
|
2020-08-06 20:58:47 +03:00
|
|
|
val, _ := cmd.Flags().GetString(flagSrcOptions)
|
|
|
|
val = strings.TrimSpace(val)
|
|
|
|
if val != "" {
|
|
|
|
opts, err = options.ParseOptions(val)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if typ == sqlite3.Type {
|
2023-01-01 06:17:44 +03:00
|
|
|
// Special handling for SQLite, because it's a file-based DB.
|
|
|
|
loc, err = sqlite3.MungeLocation(loc)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2020-08-06 20:58:47 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-12-25 07:04:18 +03:00
|
|
|
// If the -p flag is set, sq looks for password input on stdin,
|
|
|
|
// or sq prompts the user.
|
|
|
|
if cmdFlagTrue(cmd, flagPasswordPrompt) {
|
2022-12-25 07:09:20 +03:00
|
|
|
var passwd []byte
|
|
|
|
passwd, err = readPassword(cmd.Context(), rc.Stdin, rc.Out, rc.writers.fm)
|
2022-12-25 07:04:18 +03:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
loc, err = source.LocationWithPassword(loc, string(passwd))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-08 06:06:56 +03:00
|
|
|
src, err := newSource(rc.Log, rc.registry, typ, handle, loc, opts)
|
2020-08-06 20:58:47 +03:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
err = cfg.Sources.Add(src)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-03-19 09:18:54 +03:00
|
|
|
if cfg.Sources.Active() == nil || cmdFlagTrue(cmd, flagAddActive) {
|
|
|
|
// If no current active data source, use this one, OR if
|
|
|
|
// flagAddActive is true.
|
2023-04-16 01:28:51 +03:00
|
|
|
if _, err = cfg.Sources.SetActive(src.Handle, false); err != nil {
|
2020-08-06 20:58:47 +03:00
|
|
|
return err
|
|
|
|
}
|
2023-04-16 01:28:51 +03:00
|
|
|
|
|
|
|
// However, we do not set the active group to the src's group.
|
|
|
|
// In UX testing, it led to confused users.
|
2020-08-06 20:58:47 +03:00
|
|
|
}
|
|
|
|
|
2020-08-08 06:06:56 +03:00
|
|
|
drvr, err := rc.registry.DriverFor(src.Type)
|
2020-08-06 20:58:47 +03:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2022-12-25 07:04:18 +03:00
|
|
|
if !cmdFlagTrue(cmd, flagSkipVerify) {
|
|
|
|
// Typically we want to ping the source before adding it.
|
|
|
|
if err = drvr.Ping(cmd.Context(), src); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2020-08-06 20:58:47 +03:00
|
|
|
}
|
|
|
|
|
2023-04-16 01:28:51 +03:00
|
|
|
if err = rc.ConfigStore.Save(rc.Config); err != nil {
|
2020-08-06 20:58:47 +03:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-04-16 01:28:51 +03:00
|
|
|
return rc.writers.srcw.Source(rc.Config.Sources, src)
|
2020-08-06 20:58:47 +03:00
|
|
|
}
|
2022-12-25 07:04:18 +03:00
|
|
|
|
|
|
|
// readPassword reads a password from stdin pipe, or if nothing on stdin,
|
|
|
|
// it prints a prompt to stdout, and then accepts input (which must be
|
|
|
|
// followed by a return).
|
|
|
|
func readPassword(ctx context.Context, stdin *os.File, stdout io.Writer, fm *output.Formatting) ([]byte, error) {
|
2022-12-25 07:09:20 +03:00
|
|
|
resultCh := make(chan []byte)
|
|
|
|
errCh := make(chan error)
|
2022-12-25 07:04:18 +03:00
|
|
|
|
|
|
|
// Check if there is something to read on STDIN.
|
2023-04-16 01:28:51 +03:00
|
|
|
stat, err := stdin.Stat()
|
|
|
|
if err != nil {
|
|
|
|
// Shouldn't happen
|
|
|
|
return nil, errz.Err(err)
|
|
|
|
}
|
2022-12-25 07:04:18 +03:00
|
|
|
if (stat.Mode() & os.ModeCharDevice) == 0 {
|
|
|
|
b, err := io.ReadAll(stdin)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
b = bytes.TrimSuffix(b, []byte("\n"))
|
|
|
|
return b, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Run this is a goroutine so that we can handle ctrl-c.
|
|
|
|
go func() {
|
|
|
|
buf := &bytes.Buffer{}
|
|
|
|
fmt.Fprint(buf, "Password: ")
|
|
|
|
fm.Faint.Fprint(buf, "[ENTER]")
|
|
|
|
fmt.Fprint(buf, " ")
|
|
|
|
stdout.Write(buf.Bytes())
|
|
|
|
|
|
|
|
b, err := term.ReadPassword(int(stdin.Fd()))
|
|
|
|
// Regardless of whether there's an error, we print
|
|
|
|
// newline for presentation.
|
|
|
|
fmt.Fprintln(stdout)
|
|
|
|
if err != nil {
|
|
|
|
errCh <- errz.Err(err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
resultCh <- b
|
|
|
|
}()
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
// Print newline so that cancel msg is printed on its own line.
|
|
|
|
fmt.Fprintln(stdout)
|
|
|
|
return nil, errz.Err(ctx.Err())
|
|
|
|
case err := <-errCh:
|
|
|
|
return nil, err
|
|
|
|
case b := <-resultCh:
|
|
|
|
return b, nil
|
|
|
|
}
|
|
|
|
}
|