提高SSIS包将数据从Excel转储到SQL Server表的性能

时间:2014-03-11 14:45:19

标签: sql sql-server excel ssis

我创建了一个SSIS包,用于将数据从Excel文件转储到SQL Server表。该软件包只有两个任务: 脚本组件任务& OLE DB目标

Package with 2 tasks to dump data from xlsx file to sql server table

请在下面找到我在脚本任务中添加的代码:

/* Microsoft SQL Server Integration Services Script Component
*  Write scripts using Microsoft Visual C# 2008.
*  ScriptMain is the entry point class of the script.*/

using System;
using System.Data;
using Microsoft.SqlServer.Dts.Pipeline.Wrapper;
using Microsoft.SqlServer.Dts.Runtime.Wrapper;
using System.IO;
using System.Data.OleDb;
using System.Xml;

[Microsoft.SqlServer.Dts.Pipeline.SSISScriptComponentEntryPointAttribute]


public class ScriptMain : UserComponent
{
    private OleDbDataReader excelReader;
    private OleDbConnection excelConnection;
    private OleDbCommand excelCommand;

    DataTable tablesInFile;
    string currentTable;

    public override void PreExecute()
    {
        base.PreExecute();
        GetDataFromExcelToReader(Variables.FilePath);

    }
    public override void PostExecute()
    {
        base.PostExecute();
        excelReader.Close();
        excelConnection.Close();
    }
    //private void GetDataFromExcelToReader(string p_strFileName, string p_strTabName)
    private void GetDataFromExcelToReader(string p_strFileName)
    {
        string l_strConnectionString;
        if (File.Exists(p_strFileName))
        {
            l_strConnectionString = "Provider=Microsoft.ACE.OLEDB.12.0;" +
            "Data Source=" + p_strFileName + ";Extended Properties=\"Excel 12.0;HDR=YES;IMEX=1\";";

            excelConnection = new OleDbConnection(l_strConnectionString);
            excelConnection.Open();
            tablesInFile = excelConnection.GetSchema("Tables");


            foreach (DataRow tableInFile in tablesInFile.Rows)
            {
                currentTable = tableInFile["TABLE_NAME"].ToString();
                break;
            }

            excelCommand = excelConnection.CreateCommand();
            //excelCommand.CommandText = "SELECT * FROM [" + p_strTabName + "A1:AX1048576]";
            excelCommand.CommandText = "SELECT * FROM [" + currentTable + "]";
            excelCommand.CommandType = CommandType.Text;
            excelReader = excelCommand.ExecuteReader();
        }
    }
    public override void CreateNewOutputRows()
    {
        int counter = 0;
        while (excelReader.Read())
        {
            Output0Buffer.AddRow();
            Output0Buffer.Source = Variables.Source.ToString();
            Output0Buffer.Column = excelReader.FieldCount > 0 ? excelReader[0].ToString() : null;
            Output0Buffer.Column1 = excelReader.FieldCount > 1 ? excelReader[1].ToString() : null;
            Output0Buffer.Column2 = excelReader.FieldCount > 2 ? excelReader[2].ToString() : null;
            Output0Buffer.Column3 = excelReader.FieldCount > 3 ? excelReader[3].ToString() : null;
            Output0Buffer.Column4 = excelReader.FieldCount > 4 ? excelReader[4].ToString() : null;
            Output0Buffer.Column5 = excelReader.FieldCount > 5 ? excelReader[5].ToString() : null;
            Output0Buffer.Column6 = excelReader.FieldCount > 6 ? excelReader[6].ToString() : null;
            Output0Buffer.Column7 = excelReader.FieldCount > 7 ? excelReader[7].ToString() : null;
            Output0Buffer.Column8 = excelReader.FieldCount > 8 ? excelReader[8].ToString() : null;
            Output0Buffer.Column9 = excelReader.FieldCount > 9 ? excelReader[9].ToString() : null;
            Output0Buffer.Column10 = excelReader.FieldCount > 10 ? excelReader[10].ToString() : null;
            Output0Buffer.Column11 = excelReader.FieldCount > 11 ? excelReader[11].ToString() : null;
            Output0Buffer.Column12 = excelReader.FieldCount > 12 ? excelReader[12].ToString() : null;
            Output0Buffer.Column13 = excelReader.FieldCount > 13 ? excelReader[13].ToString() : null;
            Output0Buffer.Column14 = excelReader.FieldCount > 14 ? excelReader[14].ToString() : null;
            Output0Buffer.Column15 = excelReader.FieldCount > 15 ? excelReader[15].ToString() : null;
            Output0Buffer.Column16 = excelReader.FieldCount > 16 ? excelReader[16].ToString() : null;
            Output0Buffer.Column17 = excelReader.FieldCount > 17 ? excelReader[17].ToString() : null;
            Output0Buffer.Column18 = excelReader.FieldCount > 18 ? excelReader[18].ToString() : null;
            Output0Buffer.Column19 = excelReader.FieldCount > 19 ? excelReader[19].ToString() : null;
            Output0Buffer.Column20 = excelReader.FieldCount > 20 ? excelReader[20].ToString() : null;
            Output0Buffer.Column21 = excelReader.FieldCount > 21 ? excelReader[21].ToString() : null;
            Output0Buffer.Column22 = excelReader.FieldCount > 22 ? excelReader[22].ToString() : null;
            Output0Buffer.Column23 = excelReader.FieldCount > 23 ? excelReader[23].ToString() : null;
            Output0Buffer.Column24 = excelReader.FieldCount > 24 ? excelReader[24].ToString() : null;
            Output0Buffer.Column25 = excelReader.FieldCount > 25 ? excelReader[25].ToString() : null;
            Output0Buffer.Column26 = excelReader.FieldCount > 26 ? excelReader[26].ToString() : null;
            Output0Buffer.Column27 = excelReader.FieldCount > 27 ? excelReader[27].ToString() : null;
            Output0Buffer.Column28 = excelReader.FieldCount > 28 ? excelReader[28].ToString() : null;
            Output0Buffer.Column29 = excelReader.FieldCount > 29 ? excelReader[29].ToString() : null;
            Output0Buffer.Column30 = excelReader.FieldCount > 30 ? excelReader[30].ToString() : null;
            Output0Buffer.Column31 = excelReader.FieldCount > 31 ? excelReader[31].ToString() : null;
            Output0Buffer.Column32 = excelReader.FieldCount > 32 ? excelReader[32].ToString() : null;
            Output0Buffer.Column33 = excelReader.FieldCount > 33 ? excelReader[33].ToString() : null;
            Output0Buffer.Column34 = excelReader.FieldCount > 34 ? excelReader[34].ToString() : null;
            Output0Buffer.Column35 = excelReader.FieldCount > 35 ? excelReader[35].ToString() : null;
            Output0Buffer.Column36 = excelReader.FieldCount > 36 ? excelReader[36].ToString() : null;
            Output0Buffer.Column37 = excelReader.FieldCount > 37 ? excelReader[37].ToString() : null;
            Output0Buffer.Column38 = excelReader.FieldCount > 38 ? excelReader[38].ToString() : null;
            Output0Buffer.Column39 = excelReader.FieldCount > 39 ? excelReader[39].ToString() : null;
            Output0Buffer.Column40 = excelReader.FieldCount > 40 ? excelReader[40].ToString() : null;
            Output0Buffer.Column41 = excelReader.FieldCount > 41 ? excelReader[41].ToString() : null;
            Output0Buffer.Column42 = excelReader.FieldCount > 42 ? excelReader[42].ToString() : null;
            Output0Buffer.Column43 = excelReader.FieldCount > 43 ? excelReader[43].ToString() : null;
            Output0Buffer.Column44 = excelReader.FieldCount > 44 ? excelReader[44].ToString() : null;
            Output0Buffer.Column45 = excelReader.FieldCount > 45 ? excelReader[45].ToString() : null;
            Output0Buffer.Column46 = excelReader.FieldCount > 46 ? excelReader[46].ToString() : null;
            Output0Buffer.Column47 = excelReader.FieldCount > 47 ? excelReader[47].ToString() : null;
            Output0Buffer.Column48 = excelReader.FieldCount > 48 ? excelReader[48].ToString() : null;
            Output0Buffer.Column49 = excelReader.FieldCount > 49 ? excelReader[49].ToString() : null;
        }
    }
}

请在下面找到OLE DB目标任务中完成的配置快照:

Configuration inside OLE DB Destination task

目前,如果我运行包含大约99000条记录的xlsx文件包,则需要4分钟才能将数据转储到相当大的数据库中。期望是在几秒钟内完成整个过程。 我怎样才能在这个包里面实现这个目标。我的Excel文件是动态的,可以包含最少1条记录,最多可记录1.5 - 2条记录。

请帮忙。在此先感谢!!

2 个答案:

答案 0 :(得分:1)

在OLE DB目标任务中进行更改符合我的目的,并且我能够显着提高性能。

我通过调整其几个属性来使用快速加载选项。现在,我能够在大约15秒内转储2laks记录。

答案 1 :(得分:0)

如果您正在寻找性能观点,那么我建议您使用以下内容:

1)在数据库中创建一个完全相同的临时表,在该过程完成后将被删除或截断。

2)将excel源中的记录插入TEMP TABLE。

3)下一步,从TEMP TABLE获取记录并插入目的地表。

注意:对于第一步,您可以拖动Execute SQL Task在存储过程中执行或只是简单查询