sq/libsq/source/location/location.go

402 lines
9.2 KiB
Go
Raw Normal View History

// Package location contains functionality related to source location.
package location
2020-08-06 20:58:47 +03:00
import (
"net/url"
"path"
"path/filepath"
"strconv"
"strings"
"github.com/xo/dburl"
"github.com/neilotoole/sq/libsq/core/errz"
"github.com/neilotoole/sq/libsq/source/drivertype"
2020-08-06 20:58:47 +03:00
)
// dbSchemes is a list of known SQL driver schemes.
2020-08-06 20:58:47 +03:00
var dbSchemes = []string{
"mysql",
"sqlserver",
"postgres",
"sqlite3",
}
// Filename returns the final component of the file/URL path.
func Filename(loc string) (string, error) {
if IsSQL(loc) {
return "", errz.Errorf("location is not a file: %s", loc)
2020-08-06 20:58:47 +03:00
}
fields, err := Parse(loc)
2020-08-06 20:58:47 +03:00
if err != nil {
return "", err
}
return fields.Name + fields.Ext, nil
2020-08-06 20:58:47 +03:00
}
// IsSQL returns true if source location loc seems to be
2020-08-06 20:58:47 +03:00
// a DSN for a SQL driver.
func IsSQL(loc string) bool {
2020-08-06 20:58:47 +03:00
for _, dbScheme := range dbSchemes {
if strings.HasPrefix(loc, dbScheme+"://") {
return true
}
}
return false
}
// WithPassword returns the location string with the password
// value set, overriding any existing password. If loc is not a URL
// (e.g. it's a file path), it is returned unmodified.
func WithPassword(loc, passw string) (string, error) {
if _, ok := isFpath(loc); ok {
return loc, nil
}
u, err := url.ParseRequestURI(loc)
if err != nil {
return "", errz.Err(err)
}
if passw == "" {
// This will effectively remove any existing password in loc
u.User = url.User(u.User.Username())
} else {
u.User = url.UserPassword(u.User.Username(), passw)
}
return u.String(), nil
}
// Short returns a short location string. For example, the
// base name (data.xlsx) for a file, or for a DSN, user@host[:port]/db.
func Short(loc string) string {
if !IsSQL(loc) {
2020-08-06 20:58:47 +03:00
// NOT a SQL location, must be a document (local filepath or URL).
// Let's check if it's http
u, ok := isHTTP(loc)
2020-08-06 20:58:47 +03:00
if ok {
name := path.Base(u.Path)
if name == "" || name == "/" || name == "." {
// Well, if we don't have a good name from u.Path, we'll
// fall back to the hostname.
name = u.Hostname()
}
return name
}
// It's not a http URL, so it must be a filepath
loc = filepath.Clean(loc)
return filepath.Base(loc)
}
// It's a SQL driver
u, err := dburl.Parse(loc)
if err != nil {
return loc
}
if u.Scheme == "sqlite3" {
// special handling for sqlite
return path.Base(u.DSN)
}
sb := strings.Builder{}
if u.User != nil && len(u.User.Username()) > 0 {
sb.WriteString(u.User.Username())
sb.WriteString("@")
}
sb.WriteString(u.Host)
if u.Path != "" {
sb.WriteString(u.Path)
// path contains the db name
return sb.String()
}
// Else path is empty, db name was prob part of params
u2, err := url.ParseRequestURI(loc)
if err != nil {
return loc
}
vals, err := url.ParseQuery(u2.RawQuery)
2020-08-06 20:58:47 +03:00
if err != nil {
return loc
}
db := vals.Get("database")
if db == "" {
return loc
}
sb.WriteRune('/')
sb.WriteString(db)
return sb.String()
}
// Fields is a parsed representation of a source location.
type Fields struct {
// Loc is the original unparsed location value.
Loc string
2020-08-06 20:58:47 +03:00
// DriverType is the associated source driver type, which may
2020-08-06 20:58:47 +03:00
// be empty until later determination.
DriverType drivertype.Type
2020-08-06 20:58:47 +03:00
// Scheme is the original location Scheme.
Scheme string
2020-08-06 20:58:47 +03:00
// User is the username, if applicable.
User string
2020-08-06 20:58:47 +03:00
// Pass is the password, if applicable.
Pass string
2020-08-06 20:58:47 +03:00
// Hostname is the Hostname, if applicable.
Hostname string
2020-08-06 20:58:47 +03:00
// Name is the "source Name", e.g. "sakila". Typically this
// is the database Name, but for a file location such
2020-08-06 20:58:47 +03:00
// as "/path/to/things.xlsx" it would be "things".
Name string
2020-08-06 20:58:47 +03:00
// Ext is the file extension, if applicable.
Ext string
2020-08-06 20:58:47 +03:00
// DSN is the connection "data source Name" that can be used in a
// call to sql.Open. Empty for non-SQL locations.
DSN string
// Port is the Port number or 0 if not applicable.
Port int
2020-08-06 20:58:47 +03:00
}
// Parse parses a location string, returning a Fields instance representing
// the decomposition of the location. On return the Fields.DriverType field
// may not be set: further processing may be required.
func Parse(loc string) (*Fields, error) {
fields := &Fields{Loc: loc}
2020-08-06 20:58:47 +03:00
if !strings.Contains(loc, "://") {
if strings.Contains(loc, ":/") {
// malformed location, such as "sqlite3:/path/to/file"
return nil, errz.Errorf("parse location: invalid scheme: %s", loc)
}
// no scheme: it's just a regular file path for a document such as an Excel file
2020-08-06 20:58:47 +03:00
name := filepath.Base(loc)
fields.Ext = filepath.Ext(name)
if fields.Ext != "" {
name = name[:len(name)-len(fields.Ext)]
2020-08-06 20:58:47 +03:00
}
fields.Name = name
return fields, nil
2020-08-06 20:58:47 +03:00
}
if u, ok := isHTTP(loc); ok {
2020-08-06 20:58:47 +03:00
// It's a http or https URL
fields.Scheme = u.Scheme
fields.Hostname = u.Hostname()
2020-08-06 20:58:47 +03:00
if u.Port() != "" {
var err error
fields.Port, err = strconv.Atoi(u.Port())
2020-08-06 20:58:47 +03:00
if err != nil {
return nil, errz.Wrapf(err, "parse location: invalid port {%s}: {%s}", u.Port(), loc)
2020-08-06 20:58:47 +03:00
}
}
name := path.Base(u.Path)
fields.Ext = path.Ext(name)
if fields.Ext != "" {
name = name[:len(name)-len(fields.Ext)]
2020-08-06 20:58:47 +03:00
}
fields.Name = name
return fields, nil
2020-08-06 20:58:47 +03:00
}
// sqlite3 is a special case, handle it now
const sqlitePrefix = "sqlite3://"
if strings.HasPrefix(loc, sqlitePrefix) {
fpath := strings.TrimPrefix(loc, sqlitePrefix)
fields.Scheme = "sqlite3"
fields.DriverType = drivertype.SQLite
fields.DSN = fpath
// fpath could include params, e.g. "sqlite3://C:\sakila.db?param=val"
if i := strings.IndexRune(fpath, '?'); i >= 0 {
// Snip off the params
fpath = fpath[:i]
}
name := filepath.Base(fpath)
fields.Ext = filepath.Ext(name)
if fields.Ext != "" {
name = name[:len(name)-len(fields.Ext)]
2020-08-06 20:58:47 +03:00
}
fields.Name = name
return fields, nil
2020-08-06 20:58:47 +03:00
}
u, err := dburl.Parse(loc)
if err != nil {
return nil, errz.Err(err)
}
fields.Scheme = u.OriginalScheme
fields.DSN = u.DSN
fields.User = u.User.Username()
fields.Pass, _ = u.User.Password()
fields.Hostname = u.Hostname()
2020-08-06 20:58:47 +03:00
if u.Port() != "" {
fields.Port, err = strconv.Atoi(u.Port())
2020-08-06 20:58:47 +03:00
if err != nil {
return nil, errz.Wrapf(err, "parse location: invalid port {%s}: %s", u.Port(), loc)
2020-08-06 20:58:47 +03:00
}
}
switch fields.Scheme {
2020-08-06 20:58:47 +03:00
default:
return nil, errz.Errorf("parse location: invalid scheme: %s", loc)
case "sqlserver":
fields.DriverType = drivertype.MSSQL
u2, err := url.ParseRequestURI(loc)
if err != nil {
return nil, errz.Wrapf(err, "parse location: %s", loc)
}
vals, err := url.ParseQuery(u2.RawQuery)
2020-08-06 20:58:47 +03:00
if err != nil {
return nil,
errz.Wrapf(err, "parse location: %s", loc)
2020-08-06 20:58:47 +03:00
}
fields.Name = vals.Get("database")
2020-08-06 20:58:47 +03:00
case "postgres":
fields.DriverType = drivertype.Pg
fields.Name = strings.TrimPrefix(u.Path, "/")
2020-08-06 20:58:47 +03:00
case "mysql":
fields.DriverType = drivertype.MySQL
fields.Name = strings.TrimPrefix(u.Path, "/")
2020-08-06 20:58:47 +03:00
}
return fields, nil
2020-08-06 20:58:47 +03:00
}
// Abs returns the absolute path of loc. That is, relative
// paths etc. are resolved. If loc is not a file path or
// it cannot be processed, loc is returned unmodified.
func Abs(loc string) string {
if fpath, ok := isFpath(loc); ok {
return fpath
}
return loc
}
// isFpath returns the absolute filepath and true if loc is a file path.
func isFpath(loc string) (fpath string, ok bool) {
// This is not exactly an industrial-strength algorithm...
if strings.Contains(loc, ":/") {
// Excludes "http:/" etc
return "", false
}
if strings.Contains(loc, "sqlite:") {
// Excludes "sqlite:my_file.db"
// Be wary of windows paths, e.g. "D:\a\b\c.file"
return "", false
}
fpath, err := filepath.Abs(loc)
if err != nil {
return "", false
}
return fpath, true
}
// Type is an enumeration of the various types of source location.
type Type string
const (
TypeStdin = "stdin"
TypeLocalFile = "local_file"
TypeSQL = "sql"
TypeRemoteFile = "remote_file"
TypeUnknown = "unknown"
)
// TypeOf returns the type of loc, or locTypeUnknown if it
// can't be determined.
func TypeOf(loc string) Type {
switch {
case loc == "@stdin":
// Convention: the "location" of stdin is always "@stdin"
return TypeStdin
case IsSQL(loc):
return TypeSQL
case strings.HasPrefix(loc, "http://"),
strings.HasPrefix(loc, "https://"):
return TypeRemoteFile
default:
}
if _, err := filepath.Abs(loc); err != nil {
return TypeUnknown
}
return TypeLocalFile
}
// isHTTP tests if s is a well-structured HTTP or HTTPS url, and
// if so, returns the url and true.
func isHTTP(s string) (u *url.URL, ok bool) {
var err error
u, err = url.Parse(s)
if err != nil || u.Host == "" || !(u.Scheme == "http" || u.Scheme == "https") {
return nil, false
}
return u, true
}
// Redact returns a redacted version of the source
// location loc, with the password component (if any) of
// the location masked.
func Redact(loc string) string {
switch {
case loc == "",
strings.HasPrefix(loc, "/"),
strings.HasPrefix(loc, "sqlite3://"):
// REVISIT: If it's a sqlite URI, could it have auth details in there?
// e.g. "?_auth_pass=foo"
return loc
case strings.HasPrefix(loc, "http://"), strings.HasPrefix(loc, "https://"):
u, err := url.ParseRequestURI(loc)
if err != nil {
// If we can't parse it, just return the original loc
return loc
}
return u.Redacted()
}
// At this point, we expect it's a DSN
dbu, err := dburl.Parse(loc)
if err != nil {
// Shouldn't happen, but if it does, simply return the
// unmodified loc.
return loc
}
return dbu.Redacted()
}