Remove any special characters from CSV file import

  • Hi,

    I'm trying to import a CSV file; however, it contains the OBJ (object replacement, U+FFFC) character:

    http://www.fileformat.info/info/unicode/char/fffc/index.htm

    I've created a script task to remove this but it doesn't seem to be working:

    using System;

    using System.Data;

    using System.Text.RegularExpressions;

    using Microsoft.SqlServer.Dts.Pipeline.Wrapper;

    using Microsoft.SqlServer.Dts.Runtime.Wrapper;

    /// <summary>
    /// Script component that strips the U+FFFC character from the
    /// <c>CSVFileRows</c> column of every row passing through Input0.
    /// </summary>
    [Microsoft.SqlServer.Dts.Pipeline.SSISScriptComponentEntryPointAttribute]
    public class ScriptMain : UserComponent
    {
        /// <summary>Regex pattern: a character class whose only member is U+FFFC.</summary>
        private const string toreplace = "[\uFFFC]";

        /// <summary>Replacement text; empty, so every match is simply deleted.</summary>
        private const string replacewith = "";

        // Built once and shared: the pattern never changes, so constructing a new
        // Regex for every row (as the per-row handler previously did) is wasted work.
        private static readonly Regex reg = new Regex(toreplace);

        /// <summary>Runs before row processing; only delegates to the base class.</summary>
        public override void PreExecute()
        {
            base.PreExecute();
        }

        /// <summary>Runs after row processing; only delegates to the base class.</summary>
        public override void PostExecute()
        {
            base.PostExecute();
        }

        /// <summary>
        /// Rewrites <c>Row.CSVFileRows</c> with every match of the pattern removed.
        /// </summary>
        /// <param name="Row">The current input row; its <c>CSVFileRows</c> column is overwritten in place.</param>
        public override void Input0_ProcessInputRow(Input0Buffer Row)
        {
            // NOTE(review): Regex.Replace throws on a null input string; if CSVFileRows
            // can be NULL, a guard is needed here - confirm against the generated buffer class.
            Row.CSVFileRows = reg.Replace(Row.CSVFileRows, replacewith);
        }
    }

    Is there any way to allow only standard ASCII characters and remove any non-printable ASCII characters?

  • Not sure whether it will work, but I think your regex may be incorrect.

    string toreplace = "[\uFFFC]";

    Can you try removing the square brackets?

    string toreplace = "\uFFFC";

    The absence of evidence is not evidence of absence.
    Martin Rees

    You can lead a horse to water, but a pencil must be lead.
    Stan Laurel

Viewing 2 posts - 1 through 2 (of 2 total)

You must be logged in to reply to this topic. Login to reply