Skip to content

Commit 0f4a3fd

Browse files
Improved N-1 join query performance for DW SQL (#2631)
## Why make this change? - Back 1 year ago, as DW SQL does not support `JSON PATH` for converting the execution to json format. Hence we had to use `STRING_AGG` as the workaround. - Recently, we've noticed `JSON PATH` is now supported for outer query in DW, and we can use `JSON_OBJECT` + `JSON_PATH` to address the json conversion for N-to-1 relations, which can optimize the performance. - For N-N relations, we're still looking into any resolutions as `JSON_ARRAYAGG` does not provide much performance improvements. - - For other scenarios when joins are not needed for a simple SELECT, we will `JSON PATH` instead of `STRING_AGG` for better performance. ## What is this change? This PR covers 1. Introduced a feature flag to safeguard the changes, the feature flag is default as False when not provided to avoid any regressions. It will be removed once the changes are validated in production with scoped audiences. 2. For DW query builder, use `JSON_OBJECT` to generate the columns for sub-queries and applied `JSON PATH` to handle outer query, which fully replace the need of `STRING_AGG`. 3. Also, for non-join queries (in which we don't need to handle the relations), used `JSON PATH` to replace the need of `STRING_AGG` for better performance as well. This will have impact on aggregations, non-join queries and pagination. 4. Added some helper functions into the unit tests module, which aims to compare the results from GraphQL & DB engine easily for deeply nested queries. ## How was this tested? - [x] Unit Tests - As this change does not introduce new scenarios, so mostly added some new test cases to get more coverage when M-M / M-1 join queries are needed. - [x] Integration Tests ### Manual Testing - Join Scenarios #### Query 1-1 relation - As expected, optimization applied ![image](https://github.com/user-attachments/assets/514626e6-bcf5-4c37-a82e-0de13d947fd7) ![image](https://github.com/user-attachments/assets/a1921dfb-689b-496d-9f2e-520944c44ac8) #### Query N-1 relation - As expected, optimization applied ![image](https://github.com/user-attachments/assets/86b6e25d-6f1a-48de-8ac5-f0e0ea6dd555) ![image](https://github.com/user-attachments/assets/8f9d47ff-6d4a-4207-843f-fdcf7d45a3a3) #### Query 1-N Relation - As expected, optimization not applied ![image](https://github.com/user-attachments/assets/bea0d845-2e74-4a37-9410-9133f52fcdc5) ![image](https://github.com/user-attachments/assets/bd8d3a78-3d12-4909-abcc-4f6957e84564) #### Query N-N Relation - As expected, optimization not applied ![image](https://github.com/user-attachments/assets/8e5777c1-34ba-433e-a7b2-4c0a806533ea) ![image](https://github.com/user-attachments/assets/5660ec06-e63b-4db7-be4a-9dfbd828c95a) ### Other Scenarios We've applied the `JSON PATH` when there is no join in the query to replace the `STRING_AGG` for better performance. #### Aggregation ![image](https://github.com/user-attachments/assets/0adc0f75-92a6-418e-a756-22d349baec94) #### Non-Join Query ![image](https://github.com/user-attachments/assets/8b0f799a-a424-44cb-975d-d346eb1ae5b0) #### Pagination - N to 1, total items: 3 ![image](https://github.com/user-attachments/assets/b7ac611b-af4f-46de-b023-24d9f77acdae) ![image](https://github.com/user-attachments/assets/4b7a028d-255b-41da-b085-b7197bfef181) - N to N ![image](https://github.com/user-attachments/assets/ec611346-5fcf-47a4-894b-454547fc99a6) ![image](https://github.com/user-attachments/assets/9714bdac-6467-492b-b15f-02a2cb2939c4) ![image](https://github.com/user-attachments/assets/a193b95d-d37e-4879-b43b-6402d758e3bf)
1 parent a6eccb7 commit 0f4a3fd

11 files changed

+868
-93
lines changed

src/Cli.Tests/ModuleInitializer.cs

+4
Original file line numberDiff line numberDiff line change
@@ -79,6 +79,10 @@ public static void Init()
7979
VerifierSettings.IgnoreMember<RuntimeConfig>(options => options.EnableAggregation);
8080
// Ignore the EnableAggregation as that's unimportant from a test standpoint.
8181
VerifierSettings.IgnoreMember<GraphQLRuntimeOptions>(options => options.EnableAggregation);
82+
// Ignore the EnableDwNto1JoinOpt as that's unimportant from a test standpoint.
83+
VerifierSettings.IgnoreMember<RuntimeConfig>(options => options.EnableDwNto1JoinOpt);
84+
// Ignore the FeatureFlags as that's unimportant from a test standpoint.
85+
VerifierSettings.IgnoreMember<GraphQLRuntimeOptions>(options => options.FeatureFlags);
8286
// Ignore the JSON schema path as that's unimportant from a test standpoint.
8387
VerifierSettings.IgnoreMember<RuntimeConfig>(config => config.Schema);
8488
// Ignore the message as that's not serialized in our config file anyway.
+19
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,19 @@
1+
namespace Azure.DataApiBuilder.Config.ObjectModel
2+
{
3+
/// <summary>
4+
/// The class is used for ephemeral feature flags to turn on/off features in development
5+
/// </summary>
6+
public class FeatureFlags
7+
{
8+
/// <summary>
9+
/// By default EnableDwNto1JoinQueryOptimization is disabled
10+
/// We should change the default as True once got more confidence with the fix
11+
/// </summary>
12+
public bool EnableDwNto1JoinQueryOptimization { get; set; }
13+
14+
public FeatureFlags()
15+
{
16+
this.EnableDwNto1JoinQueryOptimization = false;
17+
}
18+
}
19+
}

src/Config/ObjectModel/GraphQLRuntimeOptions.cs

+8-1
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,8 @@ public record GraphQLRuntimeOptions(bool Enabled = true,
1111
bool AllowIntrospection = true,
1212
int? DepthLimit = null,
1313
MultipleMutationOptions? MultipleMutationOptions = null,
14-
bool EnableAggregation = true)
14+
bool EnableAggregation = true,
15+
FeatureFlags? FeatureFlags = null)
1516
{
1617
public const string DEFAULT_PATH = "/graphql";
1718

@@ -24,4 +25,10 @@ public record GraphQLRuntimeOptions(bool Enabled = true,
2425
[JsonIgnore(Condition = JsonIgnoreCondition.Always)]
2526
[MemberNotNullWhen(true, nameof(DepthLimit))]
2627
public bool UserProvidedDepthLimit { get; init; } = false;
28+
29+
/// <summary>
30+
/// Feature flag contains ephemeral flags passed in to init the runtime options
31+
/// </summary>
32+
[JsonIgnore(Condition = JsonIgnoreCondition.Always)]
33+
public FeatureFlags FeatureFlags { get; init; } = FeatureFlags ?? new FeatureFlags();
2734
}

src/Config/ObjectModel/RuntimeConfig.cs

+10
Original file line numberDiff line numberDiff line change
@@ -150,6 +150,16 @@ Runtime is not null &&
150150
Runtime.GraphQL is not null &&
151151
Runtime.GraphQL.EnableAggregation;
152152

153+
/// <summary>
154+
/// Retrieves the value of runtime.graphql.dwnto1joinopt.enabled property if present, default is false.
155+
/// </summary>
156+
[JsonIgnore]
157+
public bool EnableDwNto1JoinOpt =>
158+
Runtime is not null &&
159+
Runtime.GraphQL is not null &&
160+
Runtime.GraphQL.FeatureFlags is not null &&
161+
Runtime.GraphQL.FeatureFlags.EnableDwNto1JoinQueryOptimization;
162+
153163
private Dictionary<string, DataSource> _dataSourceNameToDataSource;
154164

155165
private Dictionary<string, string> _entityNameToDataSourceName = new();
+132
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,132 @@
1+
using Azure.DataApiBuilder.Config.ObjectModel;
2+
using Azure.DataApiBuilder.Core.Models;
3+
4+
namespace Azure.DataApiBuilder.Core.Resolvers
5+
{
6+
/// <summary>
7+
/// Base query builder class for T-SQL engine
8+
/// Can be used by dwsql and mssql
9+
/// </summary>
10+
public abstract class BaseTSqlQueryBuilder : BaseSqlQueryBuilder
11+
{
12+
protected const string FOR_JSON_SUFFIX = " FOR JSON PATH, INCLUDE_NULL_VALUES";
13+
protected const string WITHOUT_ARRAY_WRAPPER_SUFFIX = "WITHOUT_ARRAY_WRAPPER";
14+
15+
/// <summary>
16+
/// Build the Json Path query needed to append to the main query
17+
/// </summary>
18+
/// <param name="structure">Sql query structure to build query on</param>
19+
/// <returns>SQL query with JSON PATH format</returns>
20+
protected virtual string BuildJsonPath(SqlQueryStructure structure)
21+
{
22+
string query = string.Empty;
23+
query += FOR_JSON_SUFFIX;
24+
if (!structure.IsListQuery)
25+
{
26+
query += "," + WITHOUT_ARRAY_WRAPPER_SUFFIX;
27+
}
28+
29+
return query;
30+
}
31+
32+
/// <summary>
33+
/// Build the predicates query needed to append to the main query
34+
/// </summary>
35+
/// <param name="structure">Sql query structure to build query on</param>
36+
/// <returns>SQL query with predicates</returns>
37+
protected virtual string BuildPredicates(SqlQueryStructure structure)
38+
{
39+
return JoinPredicateStrings(
40+
structure.GetDbPolicyForOperation(EntityActionOperation.Read),
41+
structure.FilterPredicates,
42+
Build(structure.Predicates),
43+
Build(structure.PaginationMetadata.PaginationPredicate));
44+
}
45+
46+
/// <summary>
47+
/// Build the Group By Clause needed to append to the main query
48+
/// </summary>
49+
/// <param name="structure">Sql query structure to build query on</param>
50+
/// <returns>SQL query with group-by clause</returns>
51+
protected virtual string BuildGroupBy(SqlQueryStructure structure)
52+
{
53+
// Add GROUP BY clause if there are any group by columns
54+
if (structure.GroupByMetadata.Fields.Any())
55+
{
56+
return $" GROUP BY {string.Join(", ", structure.GroupByMetadata.Fields.Values.Select(c => Build(c)))}";
57+
}
58+
59+
return string.Empty;
60+
}
61+
62+
/// <summary>
63+
/// Build the Having clause needed to append to the main query
64+
/// </summary>
65+
/// <param name="structure">Sql query structure to build query on</param>
66+
/// <returns>SQL query with having clause</returns>
67+
protected virtual string BuildHaving(SqlQueryStructure structure)
68+
{
69+
if (structure.GroupByMetadata.Aggregations.Count > 0)
70+
{
71+
List<Predicate>? havingPredicates = structure.GroupByMetadata.Aggregations
72+
.SelectMany(aggregation => aggregation.HavingPredicates ?? new List<Predicate>())
73+
.ToList();
74+
75+
if (havingPredicates.Any())
76+
{
77+
return $" HAVING {Build(havingPredicates)}";
78+
}
79+
}
80+
81+
return string.Empty;
82+
}
83+
84+
/// <summary>
85+
/// Build the Order By clause needed to append to the main query
86+
/// </summary>
87+
/// <param name="structure">Sql query structure to build query on</param>
88+
/// <returns>SQL query with order-by clause</returns>
89+
protected virtual string BuildOrderBy(SqlQueryStructure structure)
90+
{
91+
if (structure.OrderByColumns.Any())
92+
{
93+
return $" ORDER BY {Build(structure.OrderByColumns)}";
94+
}
95+
96+
return string.Empty;
97+
}
98+
99+
/// <summary>
100+
/// Build the aggregation columns needed to append to the main query
101+
/// </summary>
102+
/// <param name="structure">Sql query structure to build query on</param>
103+
/// <returns>SQL query with aggregation columns</returns>
104+
protected virtual string BuildAggregationColumns(SqlQueryStructure structure)
105+
{
106+
string aggregations = string.Empty;
107+
if (structure.GroupByMetadata.Aggregations.Count > 0)
108+
{
109+
if (structure.Columns.Any())
110+
{
111+
aggregations = $",{BuildAggregationColumns(structure.GroupByMetadata)}";
112+
}
113+
else
114+
{
115+
aggregations = $"{BuildAggregationColumns(structure.GroupByMetadata)}";
116+
}
117+
}
118+
119+
return aggregations;
120+
}
121+
122+
/// <summary>
123+
/// Build the aggregation columns needed to append to the main query
124+
/// </summary>
125+
/// <param name="metadata">GroupByMetadata</param>
126+
/// <returns>SQL query with aggregation columns</returns>
127+
protected virtual string BuildAggregationColumns(GroupByMetadata metadata)
128+
{
129+
return string.Join(", ", metadata.Aggregations.Select(aggregation => Build(aggregation.Column, useAlias: true)));
130+
}
131+
}
132+
}

0 commit comments

Comments
 (0)