ALTER TABLE SWITCH语句失败:表X中分区1定义的范围不是表Y中分区2定义的范围的子集

时间:2019-02-14 21:30:48

标签: azure-sql-data-warehouse

我试图根据此处的文档(https://docs.microsoft.com/en-us/azure/sql-data-warehouse/sql-data-warehouse-develop-best-practices-transactions),在Azure SQL Data Warehouse中创建一个简单的分区交换例程。

我认为我要交换的分区已经对齐,但是出现了一个错误,似乎是在告诉我它们并没有对齐:"ALTER TABLE SWITCH语句失败。表'Distribution_55.dbo.Table_42b5ce68198a4fe1a2c5a597075b93d5_55'中分区1定义的范围不是表'Distribution_55.dbo.Table_62915da3af53441980fedba6da729c62_55'中分区2定义的范围的子集。"

这是我的完整复现(repro)脚本:

-- Helper view used later to look up partition numbers.
-- Returns one row per partition of each table's heap or clustered index,
-- paired with the partition-function boundary whose boundary_id equals the
-- partition number. BoundaryValue is NULL when no boundary has a matching id.
CREATE VIEW dbo.TablePartitions
AS
SELECT
    sch.name                         AS SchemaName,
    tbl.name                         AS TableName,
    CAST(prv.value AS nvarchar(128)) AS BoundaryValue,
    prt.partition_number             AS PartitionNumber
FROM sys.schemas AS sch
INNER JOIN sys.tables AS tbl
    ON tbl.[schema_id] = sch.[schema_id]
INNER JOIN sys.indexes AS idx
    ON idx.[object_id] = tbl.[object_id]
INNER JOIN sys.partitions AS prt
    ON prt.[object_id] = idx.[object_id]
    AND prt.[index_id] = idx.[index_id]
INNER JOIN sys.partition_schemes AS ps
    ON ps.[data_space_id] = idx.[data_space_id]
INNER JOIN sys.partition_functions AS pf
    ON pf.[function_id] = ps.[function_id]
LEFT JOIN sys.partition_range_values AS prv
    ON prv.[function_id] = pf.[function_id]
    AND prv.[boundary_id] = prt.[partition_number]
WHERE idx.[index_id] <= 1;  -- keep only index_id 0 or 1 (heap / clustered index)

-- Main partitioned table: hash-distributed on DistributionField, partitioned
-- on PartitionField with RANGE RIGHT, stored as a clustered columnstore index.
-- It is created with no boundaries; they are added by the SPLITs below.
CREATE TABLE dbo.PartitionedTable
(
    DistributionField nvarchar(30) NOT NULL,
    PartitionField    int          NOT NULL,
    [Value]           int          NOT NULL
)
WITH
(
    DISTRIBUTION = HASH (DistributionField),
    PARTITION (PartitionField RANGE RIGHT FOR VALUES ()),
    CLUSTERED COLUMNSTORE INDEX
);

-- Add boundaries 1, 2 and 3 to the main table, one SPLIT per boundary.
ALTER TABLE dbo.PartitionedTable SPLIT RANGE (1);
ALTER TABLE dbo.PartitionedTable SPLIT RANGE (2);
ALTER TABLE dbo.PartitionedTable SPLIT RANGE (3);

-- Staging table for the partition swap. Built with CTAS from the main table
-- so the columns match; the always-false predicate copies no rows.
-- Same distribution, partition column (RANGE RIGHT) and index type as the main table.
CREATE TABLE dbo.PartitionedTableStaging
WITH
(
    DISTRIBUTION = HASH (DistributionField),
    PARTITION (PartitionField RANGE RIGHT FOR VALUES ()),
    CLUSTERED COLUMNSTORE INDEX
)
AS
SELECT
    src.DistributionField,
    src.PartitionField,
    src.[Value]
FROM dbo.PartitionedTable AS src
WHERE 1 = 2;

-- Add boundaries 2 and 3 to the staging table; the intent is to line up the
-- partition that PartitionField = 2 falls into with the main table.
ALTER TABLE dbo.PartitionedTableStaging SPLIT RANGE (2);
ALTER TABLE dbo.PartitionedTableStaging SPLIT RANGE (3);

-- Seed the staging table with three rows, all with PartitionField = 2.
INSERT INTO dbo.PartitionedTableStaging (DistributionField, PartitionField, [Value])
VALUES ('X', 2, 1);

INSERT INTO dbo.PartitionedTableStaging (DistributionField, PartitionField, [Value])
VALUES ('Y', 2, 2);

INSERT INTO dbo.PartitionedTableStaging (DistributionField, PartitionField, [Value])
VALUES ('Z', 2, 3);

-- Look up the partition number that the view pairs with boundary value 2 on
-- each table. BoundaryValue is nvarchar(128) in the view, so it is compared
-- with a string literal: comparing it with the integer 2 would implicitly
-- convert BoundaryValue to int, which can fail on non-numeric boundary values
-- belonging to other partitioned tables.
SELECT
    SchemaName,
    TableName,
    BoundaryValue,
    PartitionNumber
FROM dbo.TablePartitions
WHERE SchemaName = 'dbo'
    AND TableName = 'PartitionedTable'
    AND BoundaryValue = N'2';

SELECT
    SchemaName,
    TableName,
    BoundaryValue,
    PartitionNumber
FROM dbo.TablePartitions
WHERE SchemaName = 'dbo'
    AND TableName = 'PartitionedTableStaging'
    AND BoundaryValue = N'2';

-- Swap the staged partition over to the main table.
-- This is the statement that raises the "ALTER TABLE SWITCH statement failed"
-- error quoted in the question.
ALTER TABLE dbo.PartitionedTableStaging SWITCH PARTITION 1 TO dbo.PartitionedTable PARTITION 2;

存放PartitionField = 2的分区,其边界难道不是对齐的吗?

1 个答案:

答案 0 :(得分:1)

事实证明,我误解了RANGE RIGHT和RANGE LEFT的工作方式。首先,RANGE RIGHT会把值2(即本复现所关注的值)放入分区3,而不是分区2。如果将复现脚本改为使用RANGE LEFT,并在暂存表上通过为值1创建边界来给分区2设定下限,那么暂存表和主表上的分区2就会对齐,交换也就能成功。这是更正后的示例:

-- Helper view used later to look up partition numbers.
-- Returns one row per partition of each table's heap or clustered index,
-- together with the boundary value that belongs to that partition:
--   * RANGE LEFT  (boundary_value_on_right = 0): boundary N is the upper bound
--     of partition N, so boundary_id = partition_number.
--   * RANGE RIGHT (boundary_value_on_right = 1): boundary N is the lower bound
--     of partition N + 1, so boundary_id = partition_number - 1.
-- BoundaryValue is NULL for the one partition that contains no boundary value
-- (the last partition for RANGE LEFT, the first for RANGE RIGHT).
CREATE VIEW dbo.TablePartitions
AS
SELECT
    sch.name                         AS SchemaName,
    tbl.name                         AS TableName,
    CAST(prv.value AS nvarchar(128)) AS BoundaryValue,
    prt.partition_number             AS PartitionNumber
FROM sys.schemas AS sch
INNER JOIN sys.tables AS tbl
    ON tbl.[schema_id] = sch.[schema_id]
INNER JOIN sys.indexes AS idx
    ON idx.[object_id] = tbl.[object_id]
INNER JOIN sys.partitions AS prt
    ON prt.[object_id] = idx.[object_id]
    AND prt.[index_id] = idx.[index_id]
INNER JOIN sys.partition_schemes AS ps
    ON ps.[data_space_id] = idx.[data_space_id]
INNER JOIN sys.partition_functions AS pf
    ON pf.[function_id] = ps.[function_id]
LEFT JOIN sys.partition_range_values AS prv
    ON prv.[function_id] = pf.[function_id]
    -- Shift by one for RANGE RIGHT so the boundary value is reported on the
    -- partition that actually contains it.
    AND prv.[boundary_id] = prt.[partition_number]
        - CASE WHEN pf.[boundary_value_on_right] = 1 THEN 1 ELSE 0 END
WHERE idx.[index_id] <= 1;  -- keep only index_id 0 or 1 (heap / clustered index)

-- Main partitioned table: hash-distributed on DistributionField, partitioned
-- on PartitionField with RANGE LEFT, stored as a clustered columnstore index.
-- It is created with no boundaries; they are added by the SPLITs below.
CREATE TABLE dbo.PartitionedTable
(
    DistributionField nvarchar(30) NOT NULL,
    PartitionField    int          NOT NULL,
    [Value]           int          NOT NULL
)
WITH
(
    DISTRIBUTION = HASH (DistributionField),
    PARTITION (PartitionField RANGE LEFT FOR VALUES ()),
    CLUSTERED COLUMNSTORE INDEX
);

-- Add boundaries 1, 2 and 3 to the main table, one SPLIT per boundary.
ALTER TABLE dbo.PartitionedTable SPLIT RANGE (1);
ALTER TABLE dbo.PartitionedTable SPLIT RANGE (2);
ALTER TABLE dbo.PartitionedTable SPLIT RANGE (3);

-- Staging table for the partition swap. Built with CTAS from the main table
-- so the columns match; the always-false predicate copies no rows.
-- Same distribution, partition column (RANGE LEFT) and index type as the main table.
CREATE TABLE dbo.PartitionedTableStaging
WITH
(
    DISTRIBUTION = HASH (DistributionField),
    PARTITION (PartitionField RANGE LEFT FOR VALUES ()),
    CLUSTERED COLUMNSTORE INDEX
)
AS
SELECT
    src.DistributionField,
    src.PartitionField,
    src.[Value]
FROM dbo.PartitionedTable AS src
WHERE 1 = 2;

-- Add boundaries 1 and 2 to the staging table so that the partition holding
-- PartitionField = 2 has the same lower and upper bound as on the main table.
ALTER TABLE dbo.PartitionedTableStaging SPLIT RANGE (1);
ALTER TABLE dbo.PartitionedTableStaging SPLIT RANGE (2);

-- Seed the staging table with three rows, all with PartitionField = 2.
INSERT INTO dbo.PartitionedTableStaging (DistributionField, PartitionField, [Value])
VALUES ('X', 2, 1);

INSERT INTO dbo.PartitionedTableStaging (DistributionField, PartitionField, [Value])
VALUES ('Y', 2, 2);

INSERT INTO dbo.PartitionedTableStaging (DistributionField, PartitionField, [Value])
VALUES ('Z', 2, 3);

-- Look up the partition number that the view pairs with boundary value 2 on
-- each table. BoundaryValue is nvarchar(128) in the view, so it is compared
-- with a string literal: comparing it with the integer 2 would implicitly
-- convert BoundaryValue to int, which can fail on non-numeric boundary values
-- belonging to other partitioned tables.
SELECT
    SchemaName,
    TableName,
    BoundaryValue,
    PartitionNumber
FROM dbo.TablePartitions
WHERE SchemaName = 'dbo'
    AND TableName = 'PartitionedTable'
    AND BoundaryValue = N'2';

SELECT
    SchemaName,
    TableName,
    BoundaryValue,
    PartitionNumber
FROM dbo.TablePartitions
WHERE SchemaName = 'dbo'
    AND TableName = 'PartitionedTableStaging'
    AND BoundaryValue = N'2';

-- Swap the staged partition over to the main table: partition 2 on both
-- tables, matching the partition numbers used for boundary value 2 here.
ALTER TABLE dbo.PartitionedTableStaging SWITCH PARTITION 2 TO dbo.PartitionedTable PARTITION 2;