将Unicode字符串写入txt文件

时间:2016-12-23 22:17:04

标签: c++ unicode wofstream

我制作了一个简单的txt扫描程序,将文本写入符合我选择范围的文件中。问题是写入文件而不是笔写,例如,洀洀。在图片上你可以看到例如:

enter image description here

#include <iostream>
#include <fstream>
#include <string>

using namespace std;

int main()
{
int offset;
wstring DBSearchLine, ScanLine;

wifstream ScanFile, DBSearchFile;
wofstream ResultFile;
ScanFile.open("ScanFile.txt", ios_base::binary);
ResultFile.open("ResultFile.txt", ios::out, ios_base::binary);

if (ScanFile.is_open())
{
    while (!ScanFile.eof())
    {
        DBSearchFile.open("DBSearchFile.txt", ios_base::binary);
        if (!DBSearchFile.is_open())
        {
            cout << "Error open DBSearchFile.txt" << "\n";
            break;
        }

        getline(ScanFile, ScanLine);
        wcout << "Scan line is - " << ScanLine << "\n";

        while (!DBSearchFile.eof())
        {
            getline(DBSearchFile, DBSearchLine);
            wcout << "DBSearchLine is -" << DBSearchLine << "\n";
            if ((offset = ScanLine.find(DBSearchLine, 0)) != string::npos)
            {
                ResultFile << ScanLine << L"\n";
            }
        }
        DBSearchFile.close();
    }
    ScanFile.close();
}
else
{
    cout << "Error open ScanFile.txt" << "\n";
}
system("PAUSE");
return 0;
}

1 个答案:

答案 0 :(得分:0)

#include <iostream>
#include <fstream>
#include <string>
#include <locale>
#include <codecvt>

using namespace std;

int main()
{
    /* via http://stackoverflow.com/a/5105192/4005233 
       changes the encoding of the console and all subsequently opened 
       files */
    std::locale::global(std::locale(""));

    wifstream ScanFile;
    ScanFile.open("ScanFile.txt", ios_base::binary);
    if (!ScanFile.is_open()) {
        cout << "Error open ScanFile.txt" << "\n";
        return 1;
    }

    wofstream ResultFile("ResultFile.txt", ios::out);

    while (!ScanFile.eof())
    {
        wifstream DBSearchFile;
        DBSearchFile.open("DBSearchFile.txt", ios_base::binary);
        if (!DBSearchFile.is_open())
        {
            cout << "Error open DBSearchFile.txt" << "\n";
            break;
        }

        wstring ScanLine;
        getline(ScanFile, ScanLine);
        wcout << "Scan line is - " << ScanLine << "\n";

        do
        {
            wstring DBSearchLine; 
            getline(DBSearchFile, DBSearchLine);
            // have all lines been read?
            if(!DBSearchLine.length())
                break;
            wcout << "DBSearchLine is -" << DBSearchLine << "\n";

            if (ScanLine.find(DBSearchLine, 0) != string::npos)
            {
                ResultFile << ScanLine << L"\n";
                break; // found a match, no need to search further
            }
        }while(1);
        DBSearchFile.close();
    }

    ScanFile.close();

    return 0;
}

使用包含和不包含BOM的文件对此进行了测试。

必须更改最里面的循环以处理末尾带换行符的文件;如果我没有这样做,它将匹配一个永远为真的空字符串。

(根据我的编码风格,我也改变了一些其他的东西,重要的变化是顶部的那个)