graphql-engine/server/src-lib/Hasura/Backends/BigQuery/Plan.hs

-- | Planning BigQuery SQL queries and subscriptions.

module Hasura.Backends.BigQuery.Plan
  ( planNoPlan
  , planToForest
  ) where

import           Hasura.Prelude

import qualified Data.Text.Lazy                           as LT

import           Control.Monad.Validate
import           Data.Aeson.Text
import           Data.Text.Extended
import           Data.Tree

import qualified Hasura.Backends.BigQuery.DataLoader.Plan as DataLoader
import qualified Hasura.Base.Error                        as E
import qualified Hasura.GraphQL.Parser                    as GraphQL
import qualified Hasura.RQL.Types.Column                  as RQL

import           Hasura.Backends.BigQuery.FromIr          as BigQuery
import           Hasura.Backends.BigQuery.Types           as BigQuery
import           Hasura.RQL.IR
import           Hasura.SQL.Backend
import           Hasura.SQL.Types
import           Hasura.Session


--------------------------------------------------------------------------------
-- Top-level planner

-- | Plan a BigQuery query as a forest of data-loader actions.
--
-- The query is first turned into a 'Select' by 'planNoPlan'. That select is
-- then run through the data-loader planner, and the planned actions it
-- yields are arranged into a 'Forest'. Any error raised by 'planNoPlan' is
-- propagated unchanged.
planToForest
  :: MonadError E.QErr m
  => UserInfo
  -> QueryDB 'BigQuery (GraphQL.UnpreparedValue 'BigQuery)
  -> m (Forest DataLoader.PlannedAction)
planToForest userInfo qrf = do
  select <- planNoPlan userInfo qrf
  -- Only the planned actions are used below; the head-and-tail component of
  -- the planner result is bound but otherwise ignored.
  let (!_headAndTail, !actions) =
        DataLoader.runPlan $
          DataLoader.planSelectHeadAndTail Nothing Nothing select
  -- Evaluate the forest to weak head normal form before returning it.
  pure $! DataLoader.actionsForest id actions

-- | Translate a query straight into a BigQuery 'Select', without any query
-- planning.
--
-- Every unprepared value in the query is resolved with 'prepareValueNoPlan'
-- against the user's session variables, and the resulting root field is then
-- translated from the IR. If that translation fails validation, the collected
-- errors are rendered with 'tshow' and thrown as a 400 'E.NotSupported' error.
planNoPlan
  :: MonadError E.QErr m
  => UserInfo
  -> QueryDB 'BigQuery (GraphQL.UnpreparedValue 'BigQuery)
  -> m Select
planNoPlan userInfo queryDB = do
  let resolveValue = prepareValueNoPlan (_uiSession userInfo)
  preparedRoot <- traverseQueryDB resolveValue queryDB
  let translation =
        runValidate . BigQuery.runFromIr $ BigQuery.fromRootField preparedRoot
  translation `onLeft` \errs ->
    E.throw400 E.NotSupported (tshow (errs :: NonEmpty Error))

--------------------------------------------------------------------------------
-- Resolving values

-- | Resolve an unprepared GraphQL value into a BigQuery expression with no
-- query planning involved: the value is embedded directly in the query that
-- gets executed.
--
-- Session variables are made available by embedding the JSON encoding of the
-- whole 'SessionVariables' as a string value. A single session variable is
-- looked up in that value by name through a 'JsonValueExpression' and cast to
-- the requested scalar type. Array-typed session variables are rejected with
-- an internal error.
prepareValueNoPlan
  :: MonadError E.QErr m
  => SessionVariables
  -> GraphQL.UnpreparedValue 'BigQuery
  -> m BigQuery.Expression
prepareValueNoPlan sessionVariables = \case
  GraphQL.UVLiteral literal -> pure literal
  GraphQL.UVSession -> pure sessionJson
  -- NOTE: it has not been confirmed that JSON_VALUE is really the operator
  -- needed for this lookup.
  GraphQL.UVSessionVar (CollectableTypeScalar scalarType) variableName ->
    let fieldLookup =
          JsonValueExpression
            sessionJson
            (FieldPath RootPath (toTxt variableName))
     in pure (CastExpression fieldLookup scalarType)
  GraphQL.UVSessionVar (CollectableTypeArray {}) _ ->
    throwError $ E.internalError "Cannot currently prepare array types in BigQuery."
  GraphQL.UVParameter _ RQL.ColumnValue {..} -> pure (ValueExpression cvValue)
  where
    -- All session variables, JSON-encoded and wrapped as a string literal.
    sessionJson =
      ValueExpression . StringValue . LT.toStrict $
        encodeToLazyText sessionVariables
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00			`-- \| Planning T-SQL queries and subscriptions.`

			`module Hasura.Backends.BigQuery.Plan`
			`( planNoPlan`
			`, planToForest`
			`) where`

server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`import Hasura.Prelude`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`import qualified Data.Text.Lazy as LT`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00
			`import Control.Monad.Validate`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`import Data.Aeson.Text`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00			`import Data.Text.Extended`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`import Data.Tree`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`import qualified Hasura.Backends.BigQuery.DataLoader.Plan as DataLoader`
			`import qualified Hasura.Base.Error as E`
			`import qualified Hasura.GraphQL.Parser as GraphQL`
			`import qualified Hasura.RQL.Types.Column as RQL`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`import Hasura.Backends.BigQuery.FromIr as BigQuery`
			`import Hasura.Backends.BigQuery.Types as BigQuery`
server: support remote relationships on SQL Server and BigQuery (#1497) Remote relationships are now supported on SQL Server and BigQuery. The major change though is the re-architecture of remote join execution logic. Prior to this PR, each backend is responsible for processing the remote relationships that are part of their AST. This is not ideal as there is nothing specific about a remote join's execution that ties it to a backend. The only backend specific part is whether or not the specification of the remote relationship is valid (i.e, we'll need to validate whether the scalars are compatible). The approach now changes to this: 1. Before delegating the AST to the backend, we traverse the AST, collect all the remote joins while modifying the AST to add necessary join fields where needed. 1. Once the remote joins are collected from the AST, the database call is made to fetch the response. The necessary data for the remote join(s) is collected from the database's response and one or more remote schema calls are constructed as necessary. 1. The remote schema calls are then executed and the data from the database and from the remote schemas is joined to produce the final response. ### Known issues 1. Ideally the traversal of the IR to collect remote joins should return an AST which does not include remote join fields. This operation can be type safe but isn't taken up as part of the PR. 1. There is a lot of code duplication between `Transport/HTTP.hs` and `Transport/Websocket.hs` which needs to be fixed ASAP. This too hasn't been taken up by this PR. 1. The type which represents the execution plan is only modified to handle our current remote joins and as such it will have to be changed to accommodate general remote joins. 1. Use of lenses would have reduced the boilerplate code to collect remote joins from the base AST. 1. The current remote join logic assumes that the join columns of a remote relationship appear with their names in the database response. 
This however is incorrect as they could be aliased. This can be taken up by anyone, I've left a comment in the code. ### Notes to the reviewers I think it is best reviewed commit by commit. 1. The first one is very straight forward. 1. The second one refactors the remote join execution logic but other than moving things around, it doesn't change the user facing functionality. This moves Postgres specific parts to `Backends/Postgres` module from `Execute`. Some IR related code to `Hasura.RQL.IR` module. Simplifies various type class function signatures as a backend doesn't have to handle remote joins anymore 1. The third one fixes partial case matches that for some weird reason weren't shown as warnings before this refactor 1. The fourth one generalizes the validation logic of remote relationships and implements `scalarTypeGraphQLName` function on SQL Server and BigQuery which is used by the validation logic. This enables remote relationships on BigQuery and SQL Server. https://github.com/hasura/graphql-engine-mono/pull/1497 GitOrigin-RevId: 77dd8eed326602b16e9a8496f52f46d22b795598 2021-06-11 06:26:50 +03:00			`import Hasura.RQL.IR`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00			`import Hasura.SQL.Backend`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`import Hasura.SQL.Types`
			`import Hasura.Session`

BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00
			`-- --------------------------------------------------------------------------------`
			`-- -- Top-level planner`

			`planToForest ::`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`MonadError E.QErr m`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00			`=> UserInfo`
			`-> QueryDB 'BigQuery (GraphQL.UnpreparedValue 'BigQuery)`
			`-> m (Forest DataLoader.PlannedAction)`
			`planToForest userInfo qrf = do`
			`select <- planNoPlan userInfo qrf`
			`let (!_headAndTail, !plannedActionsList) =`
			`DataLoader.runPlan`
			`(DataLoader.planSelectHeadAndTail Nothing Nothing select)`
			`!actionsForest = DataLoader.actionsForest id plannedActionsList`
			`pure actionsForest`

			`planNoPlan ::`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`MonadError E.QErr m`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00			`=> UserInfo`
			`-> QueryDB 'BigQuery (GraphQL.UnpreparedValue 'BigQuery)`
			`-> m Select`
			`planNoPlan userInfo queryDB = do`
			`rootField <- traverseQueryDB (prepareValueNoPlan (_uiSession userInfo)) queryDB`
Bigquery/cleanups A pull request for cleaning up small issues, bugs, redundancies and missing things in the BigQuery backend. Summary: 1. Remove duplicate projection fields - BigQuery rejects these. 2. Add order_by to the test suite cases, as it was returning inconsistent results. 3. Add lots of in FromIr about how the dataloader approach is given support. 4. Produce the correct output structure for aggregates: a. Should be a singleton object for a top-level aggregate query. b. Should have appropriate aggregate{} and nodes{} labels. c. Support for nodes (via array_agg). 5. Smooth over support of array aggregates by removing the fields used for joining with an explicit projection of each wanted field. https://github.com/hasura/graphql-engine-mono/pull/1317 Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: cd3899f4667770a27055f94988ef2a6d5808f1f5 2021-06-15 11:58:21 +03:00			`runValidate (BigQuery.runFromIr (BigQuery.fromRootField rootField))`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`onLeft` (E.throw400 E.NotSupported . (tshow :: NonEmpty Error -> Text))
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00
			`--------------------------------------------------------------------------------`
			`-- Resolving values`

			`-- \| Prepare a value without any query planning; we just execute the`
			`-- query with the values embedded.`
			`prepareValueNoPlan ::`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`(MonadError E.QErr m)`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00			`=> SessionVariables`
			`-> GraphQL.UnpreparedValue 'BigQuery`
			`-> m BigQuery.Expression`
			`prepareValueNoPlan sessionVariables =`
			`\case`
			`GraphQL.UVLiteral x -> pure x`
			`GraphQL.UVSession -> pure globalSessionExpression`
			`-- To be honest, I'm not sure if it's indeed the JSON_VALUE operator we need here...`
			`GraphQL.UVSessionVar typ text ->`
			`case typ of`
			`CollectableTypeScalar scalarType ->`
			`pure`
			`(CastExpression`
			`(JsonValueExpression`
			`globalSessionExpression`
			`(FieldPath RootPath (toTxt text)))`
			`scalarType)`
			`CollectableTypeArray {} ->`
server: introduce Hasura.Base (take 2) GitOrigin-RevId: 0dd10f1ccd338b1cf382ebff59b6ee7f209d39a1 2021-05-11 18:18:31 +03:00			`throwError $ E.internalError "Cannot currently prepare array types in BigQuery."`
BigQuery Feature Branch This will implement BigQuery support. Co-authored-by: Antoine Leblanc <1618949+nicuveo@users.noreply.github.com> Co-authored-by: Sibi Prabakaran <737477+psibi@users.noreply.github.com> Co-authored-by: Aniket Deshpande <922486+aniketd@users.noreply.github.com> Co-authored-by: Vamshi Surabhi <6562944+0x777@users.noreply.github.com> GitOrigin-RevId: 1a6ffaf34233e13e8125a5c908eaa7e32d65007b 2021-04-12 13:18:29 +03:00			`GraphQL.UVParameter _ RQL.ColumnValue {..} -> pure (ValueExpression cvValue)`
			`where`
			`globalSessionExpression =`
			`ValueExpression`
			`(StringValue (LT.toStrict (encodeToLazyText sessionVariables)))`